From cf3a204b89930e5148fe9e332d7e4ea5ba667b2d Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Wed, 29 Apr 2026 21:50:20 +0200
Subject: [PATCH 01/46] feat(appkit): agents() plugin, createAgent(def), and
 markdown-driven agents
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The main product layer. Turns an AppKit app into an AI-agent host with
markdown-driven agent discovery, code-defined agents, sub-agents, and
a standalone run-without-HTTP executor.

Agent runtime files land in core/agent/ from day one:

  core/agent/create-agent.ts    — createAgent() definition factory
  core/agent/run-agent.ts       — standalone adapter loop (no HTTP)
  core/agent/load-agents.ts     — markdown agent discovery
  core/agent/system-prompt.ts   — base system prompt + composition
  core/agent/types.ts           — updated with AgentDefinition,
                                   AgentsPluginConfig, RegisteredAgent, etc.

HTTP-facing concerns stay in plugins/agents/:
  agents.ts, thread-store.ts, tool-approval-gate.ts,
  event-channel.ts, event-translator.ts, schemas.ts,
  defaults.ts, manifest.json
---
 packages/appkit/src/beta.ts                   |   30 +-
 .../appkit/src/core/agent/create-agent.ts     |   53 +
 packages/appkit/src/core/agent/load-agents.ts |  370 +++++
 packages/appkit/src/core/agent/run-agent.ts   |  226 +++
 .../appkit/src/core/agent/system-prompt.ts    |   40 +
 .../src/core/agent/tests/create-agent.test.ts |   75 +
 .../src/core/agent/tests/load-agents.test.ts  |  302 ++++
 .../src/core/agent/tests/run-agent.test.ts    |  120 ++
 .../core/agent/tests/system-prompt.test.ts    |   45 +
 packages/appkit/src/core/agent/types.ts       |  177 ++-
 packages/appkit/src/plugins/agents/agents.ts  | 1268 +++++++++++++++++
 .../appkit/src/plugins/agents/defaults.ts     |   12 +
 .../src/plugins/agents/event-channel.ts       |   70 +
 .../src/plugins/agents/event-translator.ts    |  291 ++++
 packages/appkit/src/plugins/agents/index.ts   |   22 +
 .../appkit/src/plugins/agents/manifest.json   |   10 +
 packages/appkit/src/plugins/agents/schemas.ts |   69 +
 .../agents/tests/agents-plugin.test.ts        |  373 +++++
 .../agents/tests/approval-route.test.ts       |  292 ++++
 .../plugins/agents/tests/dos-limits.test.ts   |  299 ++++
 .../agents/tests/event-channel.test.ts        |   78 +
 .../agents/tests/event-translator.test.ts     |  332 +++++
 .../plugins/agents/tests/thread-store.test.ts |  138 ++
 .../agents/tests/tool-approval-gate.test.ts   |  156 ++
 .../appkit/src/plugins/agents/thread-store.ts |   66 +
 .../src/plugins/agents/tool-approval-gate.ts  |  122 ++
 packages/shared/src/agent.ts                  |   36 +-
 27 files changed, 5063 insertions(+), 9 deletions(-)
 create mode 100644 packages/appkit/src/core/agent/create-agent.ts
 create mode 100644 packages/appkit/src/core/agent/load-agents.ts
 create mode 100644 packages/appkit/src/core/agent/run-agent.ts
 create mode 100644 packages/appkit/src/core/agent/system-prompt.ts
 create mode 100644 packages/appkit/src/core/agent/tests/create-agent.test.ts
 create mode 100644 packages/appkit/src/core/agent/tests/load-agents.test.ts
 create mode 100644 packages/appkit/src/core/agent/tests/run-agent.test.ts
 create mode 100644 packages/appkit/src/core/agent/tests/system-prompt.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/agents.ts
 create mode 100644 packages/appkit/src/plugins/agents/defaults.ts
 create mode 100644 packages/appkit/src/plugins/agents/event-channel.ts
 create mode 100644 packages/appkit/src/plugins/agents/event-translator.ts
 create mode 100644 packages/appkit/src/plugins/agents/index.ts
 create mode 100644 packages/appkit/src/plugins/agents/manifest.json
 create mode 100644 packages/appkit/src/plugins/agents/schemas.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/approval-route.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/dos-limits.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/event-channel.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/event-translator.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/thread-store.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/tool-approval-gate.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/thread-store.ts
 create mode 100644 packages/appkit/src/plugins/agents/tool-approval-gate.ts

diff --git a/packages/appkit/src/beta.ts b/packages/appkit/src/beta.ts
index 801c33b1a..55c836c97 100644
--- a/packages/appkit/src/beta.ts
+++ b/packages/appkit/src/beta.ts
@@ -19,6 +19,14 @@ export type {
 } from "shared";
 export { DatabricksAdapter, parseTextToolCalls } from "./agents/databricks";
 
+// Agent runtime
+export { createAgent } from "./core/agent/create-agent";
+export {
+  type RunAgentInput,
+  type RunAgentResult,
+  runAgent,
+} from "./core/agent/run-agent";
+
 // Tool authoring primitives
 export {
   AppKitMcpClient,
@@ -37,11 +45,25 @@ export {
   tool,
   toolsFromRegistry,
 } from "./core/agent/tools";
+
+// Agent types
+export type {
+  AgentDefinition,
+  AgentsPluginConfig,
+  AgentTool,
+  AutoInheritToolsConfig,
+  BaseSystemPromptOption,
+  PromptContext,
+  RegisteredAgent,
+  ResolvedToolEntry,
+  ToolkitEntry,
+  ToolkitOptions,
+} from "./plugins/agents";
 export {
-  type AgentTool,
+  agentIdFromMarkdownPath,
   isToolkitEntry,
-  type ToolkitEntry,
-  type ToolkitOptions,
-} from "./core/agent/types";
+  loadAgentFromFile,
+  loadAgentsFromDir,
+} from "./plugins/agents";
 
 export * from "./plugins/beta-exports.generated";
diff --git a/packages/appkit/src/core/agent/create-agent.ts b/packages/appkit/src/core/agent/create-agent.ts
new file mode 100644
index 000000000..b4b119010
--- /dev/null
+++ b/packages/appkit/src/core/agent/create-agent.ts
@@ -0,0 +1,53 @@
+import { ConfigurationError } from "../../errors";
+import type { AgentDefinition } from "./types";
+
+/**
+ * Validating factory for agent definitions. Walks the sub-agent graph of
+ * `def` and, when it contains no cycle, returns that same object.
+ *
+ * No adapter is constructed and `def` is not modified. Register the result
+ * with `agents({ agents: { name: def } })` or run it standalone via
+ * `runAgent(def, input)`.
+ *
+ * @throws ConfigurationError when a definition is reachable from itself
+ * through nested `agents: { ... }` records.
+ *
+ * @example
+ * ```ts
+ * const support = createAgent({
+ *   instructions: "You help customers.",
+ *   model: "databricks-claude-sonnet-4-5",
+ *   tools: { get_weather: tool({ ... }) },
+ * });
+ * ```
+ */
+export function createAgent(def: AgentDefinition): AgentDefinition {
+  detectCycles(def);
+  return def;
+}
+
+/**
+ * Depth-first search over the nested `agents: { ... }` records reachable from
+ * `def`. A node is "open" while on the current DFS stack and "done" once fully
+ * explored; reaching an "open" node again throws a `ConfigurationError`.
+ */
+function detectCycles(def: AgentDefinition): void {
+  const state = new Map<AgentDefinition, "open" | "done">();
+
+  function visit(node: AgentDefinition, trail: string[]): void {
+    const mark = state.get(node);
+    if (mark === "done") return;
+    if (mark === "open") {
+      throw new ConfigurationError(
+        `Agent sub-agent cycle detected: ${trail.join(" -> ")}`,
+      );
+    }
+    state.set(node, "open");
+    for (const [key, sub] of Object.entries(node.agents ?? {})) {
+      visit(sub, [...trail, key]);
+    }
+    state.set(node, "done");
+  }
+
+  visit(def, [def.name ?? "(root)"]);
+}
diff --git a/packages/appkit/src/core/agent/load-agents.ts b/packages/appkit/src/core/agent/load-agents.ts
new file mode 100644
index 000000000..8f9fd1be7
--- /dev/null
+++ b/packages/appkit/src/core/agent/load-agents.ts
@@ -0,0 +1,370 @@
+import fs from "node:fs";
+import path from "node:path";
+import yaml from "js-yaml";
+import type { AgentAdapter } from "shared";
+import { createLogger } from "../../logging/logger";
+import type {
+  AgentDefinition,
+  AgentTool,
+  BaseSystemPromptOption,
+  ToolkitEntry,
+  ToolkitOptions,
+} from "../../core/agent/types";
+import { isToolkitEntry } from "../../core/agent/types";
+
+const logger = createLogger("agents:loader");
+
+/** Loader-side view of a plugin: only its `toolkit()` factory is used. */
+interface ToolkitProvider {
+  toolkit: (opts?: ToolkitOptions) => Record<string, unknown>;
+}
+
+export interface LoadContext {
+  /** Fallback model when frontmatter sets neither `model` nor `endpoint`. */
+  defaultModel?: AgentAdapter | Promise<AgentAdapter> | string;
+  /** Ambient tool library referenced by frontmatter `tools: [key1, key2]`. */
+  availableTools?: Record<string, AgentTool>;
+  /** Registered plugin toolkits referenced by frontmatter `toolkits: [...]`. */
+  plugins?: Map<string, ToolkitProvider>;
+  /**
+   * Code-defined agents from `agents({ agents: { ... } })`. `agents:`
+   * frontmatter references resolve against these and sibling markdown files;
+   * code-defined names win on collision (the plugin's top-level precedence).
+   */
+  codeAgents?: Record<string, AgentDefinition>;
+}
+
+export interface LoadResult {
+  /** Agent definitions keyed by file-stem name. */
+  defs: Record<string, AgentDefinition>;
+  /** First file (in sorted name order) with `default: true`, or `null`. */
+  defaultAgent: string | null;
+}
+
+interface Frontmatter {
+  /** Model endpoint name; consulted only when `model` is not set. */
+  endpoint?: string;
+  model?: string;
+  toolkits?: ToolkitSpec[];
+  tools?: string[];
+  /**
+   * Sibling file-stems to expose as sub-agents (`agent-<stem>` tools at
+   * runtime). Resolved in {@link loadAgentsFromDir}; the single-file
+   * {@link loadAgentFromFile} rejects non-empty values (no siblings).
+   */
+  agents?: string[];
+  maxSteps?: number;
+  maxTokens?: number;
+  default?: boolean;
+  baseSystemPrompt?: false | string;
+  ephemeral?: boolean;
+}
+
+/** A plugin name, or `{ plugin: options }` / `{ plugin: [toolNames] }`. */
+type ToolkitSpec = string | { [pluginName: string]: ToolkitOptions | string[] };
+
+/** Keys outside this set only produce a warning in `parseFrontmatter`. */
+const ALLOWED_KEYS = new Set([
+  "endpoint",
+  "model",
+  "toolkits",
+  "tools",
+  "agents",
+  "maxSteps",
+  "maxTokens",
+  "default",
+  "baseSystemPrompt",
+  "ephemeral",
+]);
+
+/**
+ * Loads one markdown agent file, resolving frontmatter against `ctx`. Any
+ * non-empty `agents:` list is rejected (no siblings to resolve against; use
+ * {@link loadAgentsFromDir}) and malformed `agents:` values throw as well.
+ */
+export async function loadAgentFromFile(
+  filePath: string,
+  ctx: LoadContext,
+): Promise<AgentDefinition> {
+  const raw = fs.readFileSync(filePath, "utf-8");
+  const name = path.basename(filePath, ".md");
+  // `!= null` keeps a bare `agents:` key (YAML null) acceptable, as before.
+  const listed: unknown = parseFrontmatter(raw, filePath).data?.agents;
+  const refs =
+    listed != null ? normalizeAgentsFrontmatter(listed, name, filePath) : [];
+  if (refs.length > 0) {
+    throw new Error(
+      `Agent '${name}' (${filePath}) declares 'agents:' in frontmatter, ` +
+        `which requires loadAgentsFromDir to resolve sibling references. ` +
+        `Use loadAgentsFromDir, or wire sub-agents in code via createAgent({ agents: { ... } }).`,
+    );
+  }
+  return buildDefinition(name, raw, filePath, ctx);
+}
+
+/**
+ * Scans `dir` for `*.md` files and returns an `AgentDefinition` record keyed
+ * by file-stem (empty when the directory does not exist). Throws on
+ * frontmatter errors and on unresolved or self-referencing `agents:` entries.
+ *
+ * Two passes make `agents: [...]` resolution independent of file order: build
+ * every definition first, then wire `def.agents` from the complete map.
+ * Mutual delegation is allowed; `limits.maxSubAgentDepth` bounds it at runtime.
+ */
+export async function loadAgentsFromDir(
+  dir: string,
+  ctx: LoadContext,
+): Promise<LoadResult> {
+  if (!fs.existsSync(dir)) {
+    return { defs: {}, defaultAgent: null };
+  }
+  // Sorted so `default: true` resolution is deterministic across platforms;
+  // `readdirSync` order is filesystem-dependent.
+  const files = fs
+    .readdirSync(dir)
+    .filter((f) => f.endsWith(".md"))
+    .sort();
+  const defs: Record<string, AgentDefinition> = {};
+  const subAgentRefs: Record<string, string[]> = {};
+  let defaultAgent: string | null = null;
+
+  // Pass 1: build every agent's definition; collect unresolved sibling refs.
+  for (const file of files) {
+    const fullPath = path.join(dir, file);
+    const raw = fs.readFileSync(fullPath, "utf-8");
+    const name = path.basename(file, ".md");
+    defs[name] = buildDefinition(name, raw, fullPath, ctx);
+    const { data } = parseFrontmatter(raw, fullPath);
+    if (data?.agents !== undefined) {
+      subAgentRefs[name] = normalizeAgentsFrontmatter(
+        data.agents,
+        name,
+        fullPath,
+      );
+    }
+    if (data?.default === true && !defaultAgent) defaultAgent = name;
+  }
+
+  // Own-property lookup: a ref such as "constructor" or "toString" must be
+  // reported as missing, not resolved to a member of Object.prototype.
+  const own = (
+    pool: Record<string, AgentDefinition> | undefined,
+    key: string,
+  ): AgentDefinition | undefined =>
+    pool && Object.prototype.hasOwnProperty.call(pool, key)
+      ? pool[key]
+      : undefined;
+
+  // Pass 2: resolve refs; code-defined agents win over same-named markdown.
+  for (const [name, refs] of Object.entries(subAgentRefs)) {
+    if (refs.length === 0) continue;
+    const children: Record<string, AgentDefinition> = {};
+    const missing: string[] = [];
+    for (const ref of refs) {
+      if (ref === name) {
+        throw new Error(
+          `Agent '${name}' (${path.join(dir, `${name}.md`)}) cannot reference itself in 'agents:'.`,
+        );
+      }
+      const sibling = own(ctx.codeAgents, ref) ?? own(defs, ref);
+      if (!sibling) {
+        missing.push(ref);
+        continue;
+      }
+      children[ref] = sibling;
+    }
+    if (missing.length > 0) {
+      const available =
+        [...Object.keys(ctx.codeAgents ?? {}), ...Object.keys(defs)]
+          .sort()
+          .join(", ") || "<none>";
+      throw new Error(
+        `Agent '${name}' references sub-agent(s) '${missing.join(", ")}' in 'agents:', ` +
+          `but no markdown or code agent(s) with those names exist. ` +
+          `Available: ${available}.`,
+      );
+    }
+    defs[name].agents = children;
+  }
+
+  return { defs, defaultAgent };
+}
+
+/**
+ * Checks the raw `agents:` frontmatter value and returns the referenced names
+ * in first-seen order with repeats dropped. Anything other than an array of
+ * non-blank strings raises an error naming the agent and its file, so that
+ * malformed input is never silently ignored.
+ */
+function normalizeAgentsFrontmatter(
+  value: unknown,
+  agentName: string,
+  filePath: string,
+): string[] {
+  if (!Array.isArray(value)) {
+    throw new Error(
+      `Agent '${agentName}' (${filePath}) has invalid 'agents:' frontmatter: ` +
+        `expected an array of sibling file-stems, got ${typeof value}.`,
+    );
+  }
+
+  // Validate front to back so the first offending entry is the one reported.
+  for (const entry of value as unknown[]) {
+    const usable = typeof entry === "string" && entry.trim() !== "";
+    if (usable) continue;
+    throw new Error(
+      `Agent '${agentName}' (${filePath}) has invalid 'agents:' entry: ` +
+        `expected non-empty string, got ${JSON.stringify(entry)}.`,
+    );
+  }
+
+  // A Set iterates in insertion order, so this de-duplicates stably.
+  return Array.from(new Set(value as string[]));
+}
+
+/**
+ * Exposed for tests. Parses `--- yaml ---\nbody` and warns on unknown keys. A
+ * leading BOM is skipped; an empty block (`---\n---`) yields `data: {}`.
+ */
+export function parseFrontmatter(
+  raw: string,
+  sourcePath?: string,
+): { data: Frontmatter | null; content: string } {
+  const src = sourcePath ? ` (${sourcePath})` : "";
+  // Skip a BOM (kept by readFileSync); `??` lets `---\n---` match as empty.
+  const text = raw.charCodeAt(0) === 0xfeff ? raw.slice(1) : raw;
+  const match = text.match(/^---\r?\n(?:([\s\S]*?)\r?\n)??---\r?\n?([\s\S]*)$/);
+  if (!match) return { data: null, content: text.trim() };
+  const body = match[2].trim();
+  let parsed: unknown;
+  try {
+    parsed = yaml.load(match[1] ?? "");
+  } catch (err) {
+    throw new Error(
+      `Invalid YAML frontmatter${src}: ${err instanceof Error ? err.message : String(err)}`,
+    );
+  }
+  if (parsed == null) return { data: {}, content: body };
+  if (typeof parsed !== "object" || Array.isArray(parsed)) {
+    throw new Error(`Frontmatter must be a YAML object${src}`);
+  }
+  const data = parsed as Record<string, unknown>;
+  for (const key of Object.keys(data)) {
+    if (ALLOWED_KEYS.has(key)) continue;
+    logger.warn(
+      "Ignoring unknown frontmatter key '%s' in %s",
+      key,
+      sourcePath ?? "<inline>",
+    );
+  }
+  return { data: data as Frontmatter, content: body };
+}
+
+/** Turns one markdown file (frontmatter + body) into an `AgentDefinition`. */
+function buildDefinition(
+  name: string,
+  raw: string,
+  filePath: string,
+  ctx: LoadContext,
+): AgentDefinition {
+  const parsed = parseFrontmatter(raw, filePath);
+  const fm: Frontmatter = parsed.data ?? {};
+  const resolvedTools = resolveFrontmatterTools(name, fm, filePath, ctx);
+  const hasTools = Object.keys(resolvedTools).length > 0;
+
+  // Only `false` or a string is honoured; anything else leaves it unset.
+  const prompt = fm.baseSystemPrompt;
+  const baseSystemPrompt: BaseSystemPromptOption | undefined =
+    prompt === false || typeof prompt === "string" ? prompt : undefined;
+
+  return {
+    name,
+    instructions: parsed.content,
+    model: fm.model ?? fm.endpoint ?? ctx.defaultModel,
+    tools: hasTools ? resolvedTools : undefined,
+    maxSteps: typeof fm.maxSteps === "number" ? fm.maxSteps : undefined,
+    maxTokens: typeof fm.maxTokens === "number" ? fm.maxTokens : undefined,
+    baseSystemPrompt,
+    ephemeral: typeof fm.ephemeral === "boolean" ? fm.ephemeral : undefined,
+  };
+}
+
+/** Resolves frontmatter `toolkits:` / `tools:` into one keyed tool record. */
+function resolveFrontmatterTools(
+  agentName: string,
+  fm: Frontmatter,
+  filePath: string,
+  ctx: LoadContext,
+): Record<string, AgentTool> {
+  const out: Record<string, AgentTool> = {};
+  const pluginIdx = ctx.plugins ?? new Map<string, ToolkitProvider>();
+  const library = new Map(Object.entries(ctx.availableTools ?? {})); // own keys
+  // A YAML scalar (`tools: foo`) would otherwise be walked char by char.
+  for (const field of ["toolkits", "tools"] as const) {
+    if (fm[field] == null || Array.isArray(fm[field])) continue;
+    throw new Error(
+      `Agent '${agentName}' (${filePath}) has invalid '${field}:' frontmatter: expected an array, got ${typeof fm[field]}.`,
+    );
+  }
+  for (const spec of fm.toolkits ?? []) {
+    const [pluginName, opts] = parseToolkitSpec(spec, filePath, agentName);
+    const provider = pluginIdx.get(pluginName);
+    if (!provider) {
+      const known = Array.from(pluginIdx.keys()).join(", ") || "<none>";
+      throw new Error(
+        `Agent '${agentName}' (${filePath}) references toolkit '${pluginName}', but plugin '${pluginName}' is not registered. Available: ${known}`,
+      );
+    }
+    for (const [key, entry] of Object.entries(provider.toolkit(opts))) {
+      if (!isToolkitEntry(entry)) {
+        throw new Error(
+          `Plugin '${pluginName}'.toolkit() returned a value at key '${key}' that is not a ToolkitEntry`,
+        );
+      }
+      out[key] = entry as ToolkitEntry;
+    }
+  }
+  for (const key of fm.tools ?? []) {
+    const tool = library.get(key);
+    if (!tool) {
+      const available = Array.from(library.keys()).join(", ") || "<none>";
+      throw new Error(
+        `Agent '${agentName}' (${filePath}) references tool '${key}', which is not in the agents() plugin's tools field. Available: ${available}`,
+      );
+    }
+    out[key] = tool;
+  }
+  return out;
+}
+
+/**
+ * Normalises one `toolkits:` entry into `[pluginName, options]`. In the
+ * object form a list of tool names is shorthand for `{ only: [...] }`.
+ */
+function parseToolkitSpec(
+  spec: ToolkitSpec,
+  filePath: string,
+  agentName: string,
+): [string, ToolkitOptions | undefined] {
+  if (typeof spec === "string") return [spec, undefined];
+  if (spec === null || typeof spec !== "object") {
+    throw new Error(
+      `Agent '${agentName}' (${filePath}) has invalid toolkit entry: ${JSON.stringify(spec)}`,
+    );
+  }
+  const pluginNames = Object.keys(spec);
+  if (pluginNames.length !== 1) {
+    throw new Error(
+      `Agent '${agentName}' (${filePath}) toolkit entry must have exactly one key, got: ${pluginNames.join(", ")}`,
+    );
+  }
+  const pluginName = pluginNames[0];
+  const options = spec[pluginName];
+  if (Array.isArray(options)) return [pluginName, { only: options }];
+  if (options === null || typeof options !== "object") {
+    throw new Error(
+      `Agent '${agentName}' (${filePath}) toolkit '${pluginName}' options must be an array of tool names or an options object`,
+    );
+  }
+  return [pluginName, options as ToolkitOptions];
+}
diff --git a/packages/appkit/src/core/agent/run-agent.ts b/packages/appkit/src/core/agent/run-agent.ts
new file mode 100644
index 000000000..5ef4109cf
--- /dev/null
+++ b/packages/appkit/src/core/agent/run-agent.ts
@@ -0,0 +1,226 @@
+import { randomUUID } from "node:crypto";
+import type {
+  AgentAdapter,
+  AgentEvent,
+  AgentToolDefinition,
+  Message,
+} from "shared";
+import {
+  type FunctionTool,
+  functionToolToDefinition,
+  isFunctionTool,
+} from "./tools/function-tool";
+import { isHostedTool } from "./tools/hosted-tools";
+import type {
+  AgentDefinition,
+  AgentTool,
+  ToolkitEntry,
+} from "./types";
+import { isToolkitEntry } from "./types";
+
+export interface RunAgentInput {
+  /** Seed messages: a single user string or a full message list. */
+  messages: string | Message[];
+  /** Abort signal; handed to the adapter and to nested sub-agent runs. */
+  signal?: AbortSignal;
+}
+
+export interface RunAgentResult {
+  /** Concatenated `message_delta` content; a `message` event replaces it. */
+  text: string;
+  /** Events collected from the adapter, in order (collection stops on abort). */
+  events: AgentEvent[];
+}
+
+/**
+ * Standalone agent execution without `createApp`. Resolves the adapter, builds
+ * the tool index, and drains the adapter's `run()` stream to completion.
+ *
+ * Limitations vs. running through the agents() plugin:
+ * - No OBO: there is no HTTP request, so plugin tools run as the service
+ *   principal (when they work at all).
+ * - Plugin tools (`ToolkitEntry`) and hosted tools are still advertised to
+ *   the adapter, but cannot be executed here: `executeTool` throws a clear
+ *   error when the model calls one (not when `runAgent` is invoked).
+ * - Sub-agents (`agents: { ... }` on the def) are executed as nested
+ *   `runAgent` calls with no shared thread state.
+ */
+export async function runAgent(
+  def: AgentDefinition,
+  input: RunAgentInput,
+): Promise<RunAgentResult> {
+  const adapter = await resolveAdapter(def);
+  const messages = normalizeMessages(input.messages, def.instructions);
+  const toolIndex = buildStandaloneToolIndex(def);
+  const tools = Array.from(toolIndex.values()).map((e) => e.def);
+
+  const signal = input.signal;
+
+  const executeTool = async (name: string, args: unknown): Promise<unknown> => {
+    const entry = toolIndex.get(name);
+    if (!entry) throw new Error(`Unknown tool: ${name}`);
+    if (entry.kind === "function") {
+      return entry.tool.execute(args as Record<string, unknown>);
+    }
+    if (entry.kind === "subagent") {
+      const subInput: RunAgentInput = {
+        messages:
+          typeof args === "object" &&
+          args !== null &&
+          typeof (args as { input?: unknown }).input === "string"
+            ? (args as { input: string }).input
+            : JSON.stringify(args),
+        signal,
+      };
+      const res = await runAgent(entry.agentDef, subInput);
+      return res.text;
+    }
+    throw new Error(
+      `runAgent: tool "${name}" is a ${entry.kind} tool. ` +
+        "Plugin toolkits and MCP tools are only usable via createApp({ plugins: [..., agents(...)] }).",
+    );
+  };
+
+  const events: AgentEvent[] = [];
+  let text = "";
+
+  const stream = adapter.run(
+    {
+      messages,
+      tools,
+      threadId: randomUUID(), // fresh id for every run
+      signal,
+    },
+    { executeTool, signal },
+  );
+
+  for await (const event of stream) {
+    if (signal?.aborted) break; // stop collecting once the caller aborts
+    events.push(event);
+    if (event.type === "message_delta") {
+      text += event.content;
+    } else if (event.type === "message") {
+      text = event.content; // a full message supersedes accumulated deltas
+    }
+  }
+
+  return { text, events };
+}
+
+/** Resolves `def.model`: an adapter, a promise of one, a name, or unset. */
+async function resolveAdapter(def: AgentDefinition): Promise<AgentAdapter> {
+  const { model } = def;
+  // Adapter instance (or a promise of one): hand it back as is.
+  if (model && typeof model !== "string") return await model;
+
+  // Endpoint name or nothing: go through Databricks model serving. The
+  // dynamic import is only reached on this path.
+  const { DatabricksAdapter } = await import("../../agents/databricks");
+  if (!model) return DatabricksAdapter.fromModelServing();
+  return DatabricksAdapter.fromModelServing(model);
+}
+
+/**
+ * Builds the adapter's message list: a system message carrying `instructions`
+ * followed by the caller's messages, or by one user message for a string.
+ */
+function normalizeMessages(
+  input: string | Message[],
+  instructions: string,
+): Message[] {
+  const head: Message = {
+    id: "system",
+    role: "system",
+    content: instructions,
+    createdAt: new Date(),
+  };
+  if (typeof input !== "string") return [head, ...input];
+  const userTurn: Message = {
+    id: randomUUID(),
+    role: "user",
+    content: input,
+    createdAt: new Date(),
+  };
+  return [head, userTurn];
+}
+
+/**
+ * One entry of the standalone tool index built by
+ * `buildStandaloneToolIndex`. Every variant carries the `def` advertised to
+ * the adapter; `kind` selects the variant-specific payload and how `runAgent`
+ * treats a call to it:
+ *
+ * - "function": inline tool, run through `tool.execute(args)`
+ * - "subagent": child definition, run as a nested `runAgent` call
+ * - "toolkit":  plugin `ToolkitEntry`, rejected with an error when called
+ * - "hosted":   hosted tool, rejected with an error when called
+ *
+ * Written as a shared `{ def }` intersected with the per-kind union so the
+ * common field is declared once.
+ */
+type StandaloneEntry = { def: AgentToolDefinition } & (
+  | { kind: "function"; tool: FunctionTool }
+  | { kind: "subagent"; agentDef: AgentDefinition }
+  | { kind: "toolkit"; entry: ToolkitEntry }
+  | { kind: "hosted" }
+);
+
+/**
+ * Indexes what the adapter may call in a standalone run: each `def.tools`
+ * entry under its own key, then an `agent-<key>` delegate per `def.agents`.
+ */
+function buildStandaloneToolIndex(
+  def: AgentDefinition,
+): Map<string, StandaloneEntry> {
+  const byName = new Map<string, StandaloneEntry>();
+  Object.entries(def.tools ?? {}).forEach(([key, tool]) => {
+    byName.set(key, classifyTool(key, tool));
+  });
+  Object.entries(def.agents ?? {}).forEach(([childKey, child]) => {
+    const toolName = `agent-${childKey}`;
+    const agentDef = { ...child, name: child.name ?? childKey };
+    const description =
+      child.instructions.slice(0, 120) ||
+      `Delegate to the ${childKey} sub-agent`;
+    const toolDef: AgentToolDefinition = {
+      name: toolName,
+      description,
+      parameters: {
+        type: "object",
+        properties: {
+          input: {
+            type: "string",
+            description: "Message to send to the sub-agent.",
+          },
+        },
+        required: ["input"],
+      },
+    };
+    byName.set(toolName, { kind: "subagent", agentDef, def: toolDef });
+  });
+  return byName;
+}
+
+/**
+ * Tags a `def.tools` value with its kind and a definition named after its
+ * record key. Guards run toolkit → function → hosted; no match throws.
+ */
+function classifyTool(key: string, tool: AgentTool): StandaloneEntry {
+  if (isToolkitEntry(tool)) {
+    const def = { ...tool.def, name: key };
+    return { kind: "toolkit", def, entry: tool };
+  }
+  if (isFunctionTool(tool)) {
+    const def = { ...functionToolToDefinition(tool), name: key };
+    return { kind: "function", tool, def };
+  }
+  if (!isHostedTool(tool)) {
+    throw new Error(`runAgent: unrecognized tool shape at key "${key}"`);
+  }
+  const def: AgentToolDefinition = {
+    name: key,
+    description: `Hosted tool: ${tool.type}`,
+    parameters: { type: "object", properties: {} },
+  };
+  return { kind: "hosted", def };
+}
diff --git a/packages/appkit/src/core/agent/system-prompt.ts b/packages/appkit/src/core/agent/system-prompt.ts
new file mode 100644
index 000000000..634f49c5f
--- /dev/null
+++ b/packages/appkit/src/core/agent/system-prompt.ts
@@ -0,0 +1,40 @@
+/**
+ * Assembles the AppKit base system prompt: an intro line, an optional
+ * "Active plugins" line listing `pluginNames`, and a fixed set of guidelines.
+ *
+ * Individual tool descriptions are NOT part of it; those reach the LLM via
+ * the structured `tools` API parameter.
+ */
+export function buildBaseSystemPrompt(pluginNames: string[]): string {
+  const pluginSection =
+    pluginNames.length > 0
+      ? ["", `Active plugins: ${pluginNames.join(", ")}`]
+      : [];
+
+  const guidelines = [
+    "- Use Databricks SQL syntax when writing queries",
+    "- When results are large, summarize key findings rather than dumping raw data",
+    "- If a tool call fails, explain the error clearly to the user",
+    "- When browsing files, verify the path exists before reading",
+  ];
+
+  return [
+    "You are an AI assistant running on Databricks AppKit.",
+    ...pluginSection,
+    "",
+    "Guidelines:",
+    ...guidelines,
+  ].join("\n");
+}
+
+/**
+ * Joins the base prompt and a per-agent prompt with a blank line between
+ * them. An absent or empty `agentPrompt` yields `basePrompt` unchanged.
+ */
+export function composeSystemPrompt(
+  basePrompt: string,
+  agentPrompt?: string,
+): string {
+  const parts = agentPrompt ? [basePrompt, agentPrompt] : [basePrompt];
+  return parts.join("\n\n");
+}
diff --git a/packages/appkit/src/core/agent/tests/create-agent.test.ts b/packages/appkit/src/core/agent/tests/create-agent.test.ts
new file mode 100644
index 000000000..30bcc98e9
--- /dev/null
+++ b/packages/appkit/src/core/agent/tests/create-agent.test.ts
@@ -0,0 +1,75 @@
+import { describe, expect, test } from "vitest";
+import { z } from "zod";
+import { createAgent } from "../create-agent";
+import { tool } from "../../../core/agent/tools/tool";
+import type { AgentDefinition } from "../../../core/agent/types";
+
+describe("createAgent", () => {
+  test("returns the definition unchanged for a simple agent", () => {
+    const def: AgentDefinition = {
+      name: "support",
+      instructions: "You help customers.",
+      model: "endpoint-x",
+    };
+    const result = createAgent(def);
+    expect(result).toBe(def);
+  });
+
+  test("accepts tools as a keyed record", () => {
+    const get_weather = tool({
+      name: "get_weather",
+      description: "Get the weather",
+      schema: z.object({ city: z.string() }),
+      execute: async ({ city }) => `Sunny in ${city}`,
+    });
+
+    const def = createAgent({
+      instructions: "...",
+      tools: { get_weather },
+    });
+
+    expect(def.tools?.get_weather).toBe(get_weather);
+  });
+
+  test("accepts sub-agents in a keyed record", () => {
+    const researcher = createAgent({ instructions: "Research." });
+    const supervisor = createAgent({
+      instructions: "Supervise.",
+      agents: { researcher },
+    });
+    expect(supervisor.agents?.researcher).toBe(researcher);
+  });
+
+  test("throws on a direct self-cycle", () => {
+    const a: AgentDefinition = { instructions: "a" };
+    // `agents` is directly assignable (see the indirect case), so no cast.
+    a.agents = { self: a };
+    expect(() => createAgent(a)).toThrow(/cycle/i);
+  });
+
+  test("throws on an indirect cycle", () => {
+    const a: AgentDefinition = { instructions: "a" };
+    const b: AgentDefinition = { instructions: "b" };
+    a.agents = { b };
+    b.agents = { a };
+    expect(() => createAgent(a)).toThrow(/cycle/i);
+  });
+
+  test("accepts a DAG of sub-agents without throwing", () => {
+    const leaf: AgentDefinition = { instructions: "leaf" };
+    const branchA: AgentDefinition = {
+      instructions: "a",
+      agents: { leaf },
+    };
+    const branchB: AgentDefinition = {
+      instructions: "b",
+      agents: { leaf },
+    };
+    const root = createAgent({
+      instructions: "root",
+      agents: { branchA, branchB },
+    });
+    expect(root.agents?.branchA.agents?.leaf).toBe(leaf);
+    expect(root.agents?.branchB.agents?.leaf).toBe(leaf);
+  });
+});
diff --git a/packages/appkit/src/core/agent/tests/load-agents.test.ts b/packages/appkit/src/core/agent/tests/load-agents.test.ts
new file mode 100644
index 000000000..23799148e
--- /dev/null
+++ b/packages/appkit/src/core/agent/tests/load-agents.test.ts
@@ -0,0 +1,302 @@
+import fs from "node:fs";
+import os from "node:os";
+import path from "node:path";
+import { afterEach, beforeEach, describe, expect, test } from "vitest";
+import { z } from "zod";
+import { buildToolkitEntries } from "../../../core/agent/build-toolkit";
+import {
+  loadAgentFromFile,
+  loadAgentsFromDir,
+  parseFrontmatter,
+} from "../load-agents";
+import { defineTool, type ToolRegistry } from "../../../core/agent/tools/define-tool";
+import { tool } from "../../../core/agent/tools/tool";
+import type { AgentDefinition } from "../../../core/agent/types";
+
+let workDir: string;
+
+beforeEach(() => {
+  workDir = fs.mkdtempSync(path.join(os.tmpdir(), "agents-test-"));
+});
+
+afterEach(() => {
+  fs.rmSync(workDir, { recursive: true, force: true });
+});
+
+function write(name: string, content: string) {
+  fs.writeFileSync(path.join(workDir, name), content, "utf-8");
+  return path.join(workDir, name);
+}
+
+describe("parseFrontmatter", () => {
+  test("parses a simple object", () => {
+    const { data, content } = parseFrontmatter(
+      "---\nendpoint: foo\ndefault: true\n---\nHello body",
+    );
+    expect(data).toEqual({ endpoint: "foo", default: true });
+    expect(content).toBe("Hello body");
+  });
+
+  test("parses nested arrays", () => {
+    const { data } = parseFrontmatter(
+      "---\ntoolkits:\n  - analytics\n  - files: [uploads.list]\n---\nbody",
+    );
+    expect(data?.toolkits).toEqual(["analytics", { files: ["uploads.list"] }]);
+  });
+
+  test("returns null data when no frontmatter", () => {
+    const { data, content } = parseFrontmatter("No frontmatter here");
+    expect(data).toBeNull();
+    expect(content).toBe("No frontmatter here");
+  });
+
+  test("throws on invalid YAML", () => {
+    expect(() => parseFrontmatter("---\nkey: : : bad\n---\n")).toThrow(/YAML/);
+  });
+});
+
+describe("loadAgentFromFile", () => {
+  test("returns AgentDefinition with body as instructions", async () => {
+    const p = write(
+      "assistant.md",
+      "---\nendpoint: e-1\n---\nYou are helpful.",
+    );
+    const def = await loadAgentFromFile(p, {});
+    expect(def.name).toBe("assistant");
+    expect(def.instructions).toBe("You are helpful.");
+    expect(def.model).toBe("e-1");
+  });
+});
+
+describe("loadAgentsFromDir", () => {
+  test("returns empty map when dir doesn't exist", async () => {
+    const res = await loadAgentsFromDir("/nonexistent-for-tests", {});
+    expect(res.defs).toEqual({});
+    expect(res.defaultAgent).toBeNull();
+  });
+
+  test("loads all .md files keyed by file-stem", async () => {
+    write("support.md", "---\nendpoint: e-1\n---\nSupport prompt.");
+    write("sales.md", "---\nendpoint: e-2\n---\nSales prompt.");
+    const res = await loadAgentsFromDir(workDir, {});
+    expect(Object.keys(res.defs).sort()).toEqual(["sales", "support"]);
+  });
+
+  test("picks up default: true from frontmatter", async () => {
+    write("one.md", "---\nendpoint: a\n---\nOne.");
+    write("two.md", "---\nendpoint: b\ndefault: true\n---\nTwo.");
+    const res = await loadAgentsFromDir(workDir, {});
+    expect(res.defaultAgent).toBe("two");
+  });
+
+  test("throws when frontmatter references an unregistered plugin", async () => {
+    write(
+      "broken.md",
+      "---\nendpoint: e\ntoolkits: [missing]\n---\nBroken agent.",
+    );
+    await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
+      /references toolkit 'missing'/,
+    );
+  });
+
+  test("throws when frontmatter references an unknown ambient tool", async () => {
+    write("broken.md", "---\nendpoint: e\ntools: [unknown_tool]\n---\nBroken.");
+    await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
+      /references tool 'unknown_tool'/,
+    );
+  });
+
+  test("resolves toolkits + ambient tools when provided", async () => {
+    const registry: ToolRegistry = {
+      query: defineTool({
+        description: "q",
+        schema: z.object({ sql: z.string() }),
+        handler: () => "ok",
+      }),
+    };
+    const plugins = new Map<
+      string,
+      { toolkit: (opts?: unknown) => Record<string, unknown> }
+    >([
+      [
+        "analytics",
+        {
+          toolkit: (opts) =>
+            buildToolkitEntries("analytics", registry, opts as never),
+        },
+      ],
+    ]);
+
+    const weather = tool({
+      name: "get_weather",
+      description: "Weather",
+      schema: z.object({ city: z.string() }),
+      execute: async () => "sunny",
+    });
+
+    write(
+      "analyst.md",
+      "---\nendpoint: e\ntoolkits:\n  - analytics\ntools:\n  - get_weather\n---\nBody.",
+    );
+    const res = await loadAgentsFromDir(workDir, {
+      plugins,
+      availableTools: { get_weather: weather },
+    });
+    expect(res.defs.analyst.tools).toBeDefined();
+    expect(Object.keys(res.defs.analyst.tools ?? {}).sort()).toEqual([
+      "analytics.query",
+      "get_weather",
+    ]);
+  });
+
+  describe("agents: sibling sub-agent references", () => {
+    test("resolves sibling references into def.agents regardless of file order", async () => {
+      // Names chosen so alphabetical iteration puts `dispatcher` *before*
+      // its siblings — pass-1 populates defs in any order, pass-2 resolves.
+      write(
+        "dispatcher.md",
+        "---\nendpoint: e\nagents:\n  - analyst\n  - writer\n---\nRoute work.",
+      );
+      write("analyst.md", "---\nendpoint: e\n---\nAnalyst.");
+      write("writer.md", "---\nendpoint: e\n---\nWriter.");
+
+      const res = await loadAgentsFromDir(workDir, {});
+      expect(Object.keys(res.defs.dispatcher.agents ?? {}).sort()).toEqual([
+        "analyst",
+        "writer",
+      ]);
+      expect(res.defs.dispatcher.agents?.analyst).toBe(res.defs.analyst);
+      expect(res.defs.dispatcher.agents?.writer).toBe(res.defs.writer);
+      // Leaves with no `agents:` retain undefined — only declared keys wire.
+      expect(res.defs.analyst.agents).toBeUndefined();
+      expect(res.defs.writer.agents).toBeUndefined();
+    });
+
+    test("mutual delegation is allowed (runtime depth cap handles cycles)", async () => {
+      write("a.md", "---\nendpoint: e\nagents:\n  - b\n---\nA.");
+      write("b.md", "---\nendpoint: e\nagents:\n  - a\n---\nB.");
+
+      const res = await loadAgentsFromDir(workDir, {});
+      expect(res.defs.a.agents?.b).toBe(res.defs.b);
+      expect(res.defs.b.agents?.a).toBe(res.defs.a);
+    });
+
+    test("throws with available list when a sibling is missing", async () => {
+      write("dispatcher.md", "---\nendpoint: e\nagents:\n  - ghost\n---\nD.");
+      write("analyst.md", "---\nendpoint: e\n---\nAnalyst.");
+      await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
+        /references sub-agent\(s\) 'ghost'.*Available: analyst, dispatcher/s,
+      );
+    });
+
+    test("reports every missing sibling in one error, not just the first", async () => {
+      write(
+        "dispatcher.md",
+        "---\nendpoint: e\nagents:\n  - ghost1\n  - ghost2\n---\nD.",
+      );
+      await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
+        /ghost1, ghost2/,
+      );
+    });
+
+    test("throws on self-reference", async () => {
+      write("solo.md", "---\nendpoint: e\nagents:\n  - solo\n---\nSolo.");
+      await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
+        /'solo'.*cannot reference itself/s,
+      );
+    });
+
+    test("throws on non-array 'agents:' value", async () => {
+      write("bad.md", "---\nendpoint: e\nagents: analyst\n---\nBad.");
+      write("analyst.md", "---\nendpoint: e\n---\nAnalyst.");
+      await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
+        /invalid 'agents:' frontmatter/,
+      );
+    });
+
+    test("throws on non-string entries in 'agents:'", async () => {
+      write("bad.md", "---\nendpoint: e\nagents:\n  - 42\n---\nBad.");
+      await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
+        /invalid 'agents:' entry/,
+      );
+    });
+
+    test("deduplicates repeated entries silently", async () => {
+      write(
+        "dispatcher.md",
+        "---\nendpoint: e\nagents:\n  - analyst\n  - analyst\n---\nD.",
+      );
+      write("analyst.md", "---\nendpoint: e\n---\nAnalyst.");
+      const res = await loadAgentsFromDir(workDir, {});
+      expect(Object.keys(res.defs.dispatcher.agents ?? {})).toEqual([
+        "analyst",
+      ]);
+    });
+
+    test("empty array yields no sub-agents (no-op)", async () => {
+      write("dispatcher.md", "---\nendpoint: e\nagents: []\n---\nD.");
+      const res = await loadAgentsFromDir(workDir, {});
+      expect(res.defs.dispatcher.agents).toBeUndefined();
+    });
+
+    test("resolves 'agents:' references against codeAgents when provided", async () => {
+      write("dispatcher.md", "---\nendpoint: e\nagents:\n  - support\n---\nD.");
+      const support: AgentDefinition = {
+        name: "support",
+        instructions: "Code-defined support.",
+      };
+      const res = await loadAgentsFromDir(workDir, {
+        codeAgents: { support },
+      });
+      expect(res.defs.dispatcher.agents?.support).toBe(support);
+    });
+
+    test("codeAgents takes precedence over markdown sibling with the same name", async () => {
+      write("dispatcher.md", "---\nendpoint: e\nagents:\n  - support\n---\nD.");
+      write("support.md", "---\nendpoint: e\n---\nMarkdown support.");
+      const codeSupport: AgentDefinition = {
+        name: "support",
+        instructions: "Code support.",
+      };
+      const res = await loadAgentsFromDir(workDir, {
+        codeAgents: { support: codeSupport },
+      });
+      // Reference binds to code version, matching the plugin's top-level
+      // `code wins` merge behaviour.
+      expect(res.defs.dispatcher.agents?.support).toBe(codeSupport);
+      expect(res.defs.dispatcher.agents?.support.instructions).toBe(
+        "Code support.",
+      );
+    });
+
+    test("missing-sibling error lists both markdown and code agent names", async () => {
+      write("dispatcher.md", "---\nendpoint: e\nagents:\n  - ghost\n---\nD.");
+      write("analyst.md", "---\nendpoint: e\n---\nAnalyst.");
+      const codeAgent: AgentDefinition = {
+        name: "writer",
+        instructions: "Writer.",
+      };
+      await expect(
+        loadAgentsFromDir(workDir, { codeAgents: { writer: codeAgent } }),
+      ).rejects.toThrow(/Available: analyst, dispatcher, writer/);
+    });
+  });
+});
+
+describe("loadAgentFromFile — sub-agent refs rejected", () => {
+  test("throws when 'agents:' is non-empty in a single-file load", async () => {
+    const p = write(
+      "lonely.md",
+      "---\nendpoint: e\nagents:\n  - ghost\n---\nLonely.",
+    );
+    await expect(loadAgentFromFile(p, {})).rejects.toThrow(
+      /requires loadAgentsFromDir/,
+    );
+  });
+
+  test("ignores empty 'agents:' array (treated as absent)", async () => {
+    const p = write("lonely.md", "---\nendpoint: e\nagents: []\n---\nLonely.");
+    const def = await loadAgentFromFile(p, {});
+    expect(def.agents).toBeUndefined();
+  });
+});
diff --git a/packages/appkit/src/core/agent/tests/run-agent.test.ts b/packages/appkit/src/core/agent/tests/run-agent.test.ts
new file mode 100644
index 000000000..55b3e7b39
--- /dev/null
+++ b/packages/appkit/src/core/agent/tests/run-agent.test.ts
@@ -0,0 +1,120 @@
+import type {
+  AgentAdapter,
+  AgentEvent,
+  AgentInput,
+  AgentRunContext,
+} from "shared";
+import { describe, expect, test, vi } from "vitest";
+import { z } from "zod";
+import { createAgent } from "../create-agent";
+import { runAgent } from "../run-agent";
+import { tool } from "../../../core/agent/tools/tool";
+import type { ToolkitEntry } from "../../../core/agent/types";
+
+/** Adapter stub that replays a fixed list of events, ignoring its inputs. */
+function scriptedAdapter(events: AgentEvent[]): AgentAdapter {
+  return {
+    async *run(_input: AgentInput, _context: AgentRunContext) {
+      // Delegate to the array's iterator: events are emitted in order.
+      yield* events;
+    },
+  };
+}
+
+describe("runAgent", () => {
+  test("drives the adapter and returns aggregated text", async () => {
+    const events: AgentEvent[] = [
+      { type: "message_delta", content: "Hello " },
+      { type: "message_delta", content: "world" },
+      { type: "status", status: "complete" },
+    ];
+    const def = createAgent({
+      instructions: "Say hello",
+      model: scriptedAdapter(events),
+    });
+
+    const result = await runAgent(def, { messages: "hi" });
+    expect(result.text).toBe("Hello world");
+    expect(result.events).toHaveLength(3);
+  });
+
+  test("prefers terminal 'message' event over deltas when present", async () => {
+    const events: AgentEvent[] = [
+      { type: "message_delta", content: "partial" },
+      { type: "message", content: "final answer" },
+    ];
+    const def = createAgent({
+      instructions: "x",
+      model: scriptedAdapter(events),
+    });
+    const result = await runAgent(def, { messages: "hi" });
+    expect(result.text).toBe("final answer");
+  });
+
+  test("invokes inline tools via executeTool callback", async () => {
+    const weatherFn = vi.fn(async () => "Sunny in NYC");
+    const weather = tool({
+      name: "get_weather",
+      description: "Weather",
+      schema: z.object({ city: z.string() }),
+      execute: weatherFn,
+    });
+
+    let capturedCtx: AgentRunContext | null = null;
+    const adapter: AgentAdapter = {
+      async *run(_input, context) {
+        capturedCtx = context;
+        yield { type: "message_delta", content: "" };
+      },
+    };
+
+    const def = createAgent({
+      instructions: "x",
+      model: adapter,
+      tools: { get_weather: weather },
+    });
+
+    await runAgent(def, { messages: "hi" });
+    expect(capturedCtx).not.toBeNull();
+    // biome-ignore lint/style/noNonNullAssertion: asserted above
+    const result = await capturedCtx!.executeTool("get_weather", {
+      city: "NYC",
+    });
+    expect(result).toBe("Sunny in NYC");
+    expect(weatherFn).toHaveBeenCalledWith({ city: "NYC" });
+  });
+
+  test("throws a clear error when a ToolkitEntry is invoked", async () => {
+    const toolkitEntry: ToolkitEntry = {
+      __toolkitRef: true,
+      pluginName: "analytics",
+      localName: "query",
+      def: {
+        name: "analytics.query",
+        description: "SQL",
+        parameters: { type: "object", properties: {} },
+      },
+    };
+
+    let capturedCtx: AgentRunContext | null = null;
+    const adapter: AgentAdapter = {
+      async *run(_input, context) {
+        capturedCtx = context;
+        yield { type: "message_delta", content: "" };
+      },
+    };
+
+    const def = createAgent({
+      instructions: "x",
+      model: adapter,
+      tools: { "analytics.query": toolkitEntry },
+    });
+
+    await runAgent(def, { messages: "hi" });
+    expect(capturedCtx).not.toBeNull();
+    await expect(
+      // biome-ignore lint/style/noNonNullAssertion: asserted above
+      capturedCtx!.executeTool("analytics.query", {}),
+    ).rejects.toThrow(/only usable via createApp/);
+  });
+});
diff --git a/packages/appkit/src/core/agent/tests/system-prompt.test.ts b/packages/appkit/src/core/agent/tests/system-prompt.test.ts
new file mode 100644
index 000000000..83bf8e192
--- /dev/null
+++ b/packages/appkit/src/core/agent/tests/system-prompt.test.ts
@@ -0,0 +1,45 @@
+import { describe, expect, test } from "vitest";
+import { buildBaseSystemPrompt, composeSystemPrompt } from "../system-prompt";
+
+describe("buildBaseSystemPrompt", () => {
+  test("includes plugin names", () => {
+    const prompt = buildBaseSystemPrompt(["analytics", "files", "genie"]);
+    expect(prompt).toContain("Active plugins: analytics, files, genie");
+  });
+
+  test("includes guidelines", () => {
+    const prompt = buildBaseSystemPrompt([]);
+    expect(prompt).toContain("Guidelines:");
+    expect(prompt).toContain("Databricks SQL");
+    expect(prompt).toContain("summarize key findings");
+  });
+
+  test("works with no plugins", () => {
+    const prompt = buildBaseSystemPrompt([]);
+    expect(prompt).toContain("AI assistant running on Databricks AppKit");
+    expect(prompt).not.toContain("Active plugins:");
+  });
+
+  test("does NOT include individual tool names", () => {
+    const prompt = buildBaseSystemPrompt(["analytics"]);
+    expect(prompt).not.toContain("analytics.query");
+    expect(prompt).not.toContain("Available tools:");
+  });
+});
+
+describe("composeSystemPrompt", () => {
+  test("concatenates base + agent prompt with double newline", () => {
+    const composed = composeSystemPrompt("Base prompt.", "Agent prompt.");
+    expect(composed).toBe("Base prompt.\n\nAgent prompt.");
+  });
+
+  test("returns base prompt alone when no agent prompt", () => {
+    const composed = composeSystemPrompt("Base prompt.");
+    expect(composed).toBe("Base prompt.");
+  });
+
+  test("returns base prompt when agent prompt is empty string", () => {
+    const composed = composeSystemPrompt("Base prompt.", "");
+    expect(composed).toBe("Base prompt.");
+  });
+});
diff --git a/packages/appkit/src/core/agent/types.ts b/packages/appkit/src/core/agent/types.ts
index 086a0426f..d752fa019 100644
--- a/packages/appkit/src/core/agent/types.ts
+++ b/packages/appkit/src/core/agent/types.ts
@@ -1,6 +1,13 @@
-import type { AgentToolDefinition, ToolAnnotations } from "shared";
+import type {
+  AgentAdapter,
+  AgentToolDefinition,
+  BasePluginConfig,
+  ThreadStore,
+  ToolAnnotations,
+} from "shared";
 import type { FunctionTool } from "./tools/function-tool";
 import type { HostedTool } from "./tools/hosted-tools";
+import type { McpHostPolicyConfig } from "../../plugins/agents/tools/mcp-host-policy";
 
 /**
  * A tool reference produced by a plugin's `.toolkit()` call. The agents plugin
@@ -42,8 +49,172 @@ export interface ToolkitOptions {
 }
 
 /**
- * Type guard for `ToolkitEntry` — used to differentiate toolkit references
- * from inline tools in a mixed `tools` record.
+ * Context passed to `baseSystemPrompt` callbacks.
+ */
+export interface PromptContext {
+  agentName: string;
+  pluginNames: string[];
+  toolNames: string[];
+}
+
+export type BaseSystemPromptOption =
+  | false
+  | string
+  | ((ctx: PromptContext) => string);
+
+export interface AgentDefinition {
+  /** Filled in from the enclosing key when used in `agents: { foo: def }`. */
+  name?: string;
+  /** System prompt body. For markdown-loaded agents this is the file body. */
+  instructions: string;
+  /**
+   * Model adapter (or endpoint-name string sugar for
+   * `DatabricksAdapter.fromServingEndpoint({ endpointName })`). Optional —
+   * falls back to the plugin's `defaultModel`.
+   */
+  model?: AgentAdapter | Promise<AgentAdapter> | string;
+  /** Per-agent tool record. Key is the LLM-visible tool-call name. */
+  tools?: Record<string, AgentTool>;
+  /** Sub-agents, exposed as `agent-<key>` tools on this agent. */
+  agents?: Record<string, AgentDefinition>;
+  /** Override the plugin's baseSystemPrompt for this agent only. */
+  baseSystemPrompt?: BaseSystemPromptOption;
+  maxSteps?: number;
+  maxTokens?: number;
+  /**
+   * When true, the thread used for a chat request against this agent is
+   * deleted from `ThreadStore` after the stream completes (success or
+   * failure). Use for stateless one-shot agents — e.g. autocomplete, where
+   * each request is independent and retaining history would both poison
+   * future calls and accumulate unbounded state in the default
+   * `InMemoryThreadStore`. Defaults to `false`.
+   */
+  ephemeral?: boolean;
+}
+
+/**
+ * Auto-inherit configuration. When enabled for a given agent origin, agents
+ * with no explicit `tools:` declaration receive every registered ToolProvider
+ * plugin tool whose author marked `autoInheritable: true`. Tools without that
+ * flag — destructive, state-mutating, or privilege-sensitive — never spread
+ * automatically and must be wired via `tools:`, `toolkits:`, or `fromPlugin`.
+ *
+ * Defaults are `false` for both origins (safe-by-default): developers must
+ * consciously opt an origin in to any auto-inherit behaviour.
+ */
+export interface AutoInheritToolsConfig {
+  /** Default for agents loaded from markdown files. Default: `false`. */
+  file?: boolean;
+  /** Default for code-defined agents (via `agents: { foo: createAgent(...) }`). Default: `false`. */
+  code?: boolean;
+}
+
+export interface AgentsPluginConfig extends BasePluginConfig {
+  /** Directory to scan for markdown agent files. Default `./config/agents`. Set to `false` to disable. */
+  dir?: string | false;
+  /** Code-defined agents, merged with file-loaded ones (code wins on key collision). */
+  agents?: Record<string, AgentDefinition>;
+  /** Agent used when clients don't specify one. Defaults to the file with `default: true` frontmatter, else the first-registered agent. */
+  defaultAgent?: string;
+  /** Default model for agents that don't specify their own (in code or frontmatter). */
+  defaultModel?: AgentAdapter | Promise<AgentAdapter> | string;
+  /** Ambient tool library. Keys may be referenced by markdown frontmatter via `tools: [key1, key2]`. */
+  tools?: Record<string, AgentTool>;
+  /** Whether agents with no explicit `tools:` auto-inherit plugin tools marked `autoInheritable: true`. Accepts a boolean shorthand. */
+  autoInheritTools?: boolean | AutoInheritToolsConfig;
+  /** Persistent thread store. Default: in-memory. */
+  threadStore?: ThreadStore;
+  /** Customize or disable the AppKit base system prompt. */
+  baseSystemPrompt?: BaseSystemPromptOption;
+  /**
+   * MCP server host policy. By default only same-origin Databricks workspace
+   * URLs may be used as MCP endpoints; custom hosts must be explicitly
+   * allowlisted here. Workspace credentials (SP / OBO) are never forwarded
+   * to non-workspace hosts.
+   */
+  mcp?: McpHostPolicyConfig;
+  /**
+   * Human-in-the-loop approval gate for destructive tool calls. When enabled
+   * (the default), the agents plugin emits an `appkit.approval_pending` SSE
+   * event before executing any tool annotated `destructive: true` and waits
+   * for a `POST /chat/approve` decision from the same user who initiated the
+   * stream. A missing decision after `timeoutMs` auto-denies the call.
+   */
+  approval?: {
+    /** Require human approval for tools annotated `destructive: true`. Default: `true`. */
+    requireForDestructive?: boolean;
+    /** Milliseconds to wait before auto-denying. Default: 60_000. */
+    timeoutMs?: number;
+  };
+  /**
+   * Runtime resource limits applied during agent execution. Defaults are
+   * tuned to protect a single-instance deployment from a misbehaving user or
+   * a runaway prompt injection; tighten or relax as appropriate for the
+   * deployment's scale and trust model. Request-body caps (chat message
+   * size, invocations input size / length) are enforced statically by the
+   * Zod schemas and are not configurable here.
+   */
+  limits?: {
+    /**
+     * Max concurrent chat streams a single user may have open. Subsequent
+     * `POST /chat` requests from that user while at-limit are rejected with
+     * HTTP 429. Default: `5`.
+     */
+    maxConcurrentStreamsPerUser?: number;
+    /**
+     * Max tool invocations per agent run (across the full tool-call graph,
+     * including sub-agent invocations). A run that exceeds the budget is
+     * aborted with a terminal error event. Default: `50`.
+     */
+    maxToolCalls?: number;
+    /**
+     * Max sub-agent recursion depth. Protects against a prompt-injected
+     * agent that delegates to a sub-agent which in turn delegates back to
+     * itself (directly or transitively). Default: `3`.
+     */
+    maxSubAgentDepth?: number;
+  };
+}
+
+/** Internal tool-index entry after a tool record has been resolved to a dispatchable form. */
+export type ResolvedToolEntry =
+  | {
+      source: "toolkit";
+      pluginName: string;
+      localName: string;
+      def: AgentToolDefinition;
+    }
+  | {
+      source: "function";
+      functionTool: FunctionTool;
+      def: AgentToolDefinition;
+    }
+  | {
+      source: "mcp";
+      mcpToolName: string;
+      def: AgentToolDefinition;
+    }
+  | {
+      source: "subagent";
+      agentName: string;
+      def: AgentToolDefinition;
+    };
+
+export interface RegisteredAgent {
+  name: string;
+  instructions: string;
+  adapter: AgentAdapter;
+  toolIndex: Map<string, ResolvedToolEntry>;
+  baseSystemPrompt?: BaseSystemPromptOption;
+  maxSteps?: number;
+  maxTokens?: number;
+  /** Mirrors `AgentDefinition.ephemeral` — skip thread persistence. */
+  ephemeral?: boolean;
+}
+
+/**
+ * Type guard for `ToolkitEntry` — used by the agents plugin to differentiate
+ * toolkit references from inline tools in a mixed `tools` record.
  */
 export function isToolkitEntry(value: unknown): value is ToolkitEntry {
   return (
diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
new file mode 100644
index 000000000..9c3076e6e
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -0,0 +1,1268 @@
+import { randomUUID } from "node:crypto";
+import path from "node:path";
+import type express from "express";
+import pc from "picocolors";
+import type {
+  AgentAdapter,
+  AgentEvent,
+  AgentRunContext,
+  AgentToolDefinition,
+  IAppRouter,
+  Message,
+  PluginPhase,
+  ResponseStreamEvent,
+  Thread,
+  ToolProvider,
+} from "shared";
+import { createLogger } from "../../logging/logger";
+import { Plugin, toPlugin } from "../../plugin";
+import type { PluginManifest } from "../../registry";
+import { agentStreamDefaults } from "./defaults";
+import { EventChannel } from "./event-channel";
+import { AgentEventTranslator } from "./event-translator";
+import { loadAgentsFromDir } from "../../core/agent/load-agents";
+import manifest from "./manifest.json";
+import {
+  approvalRequestSchema,
+  chatRequestSchema,
+  invocationsRequestSchema,
+} from "./schemas";
+import { buildBaseSystemPrompt, composeSystemPrompt } from "../../core/agent/system-prompt";
+import { InMemoryThreadStore } from "./thread-store";
+import { ToolApprovalGate } from "./tool-approval-gate";
+import {
+  functionToolToDefinition,
+  isFunctionTool,
+  isHostedTool,
+  resolveHostedTools,
+} from "../../core/agent/tools";
+import { buildMcpHostPolicy } from "./tools/mcp-host-policy";
+import type {
+  AgentDefinition,
+  AgentsPluginConfig,
+  BaseSystemPromptOption,
+  PromptContext,
+  RegisteredAgent,
+  ResolvedToolEntry,
+} from "../../core/agent/types";
+import { isToolkitEntry } from "../../core/agent/types";
+
+const logger = createLogger("agents");
+
+const DEFAULT_AGENTS_DIR = "./config/agents";
+
+/**
+ * Origin tag kept alongside each merged AgentDefinition: loaded from a
+ * markdown file ("file") or supplied via `config.agents` ("code"). Presumably
+ * picks the per-origin `autoInheritTools` setting (confirm in buildToolIndex).
+ */
+interface AgentSource {
+  origin: "file" | "code";
+}
+
+export class AgentsPlugin extends Plugin implements ToolProvider {
+  static manifest = manifest as PluginManifest;
+  static phase: PluginPhase = "deferred";
+
+  protected declare config: AgentsPluginConfig;
+
+  private agents = new Map<string, RegisteredAgent>();
+  private defaultAgentName: string | null = null;
+  private activeStreams = new Map<
+    string,
+    { controller: AbortController; userId: string }
+  >();
+  private mcpClient: AppKitMcpClient | null = null;
+  private threadStore;
+  private approvalGate = new ToolApprovalGate();
+
+  constructor(config: AgentsPluginConfig) {
+    super(config);
+    this.config = config;
+    if (config.threadStore) {
+      this.threadStore = config.threadStore;
+    } else {
+      this.threadStore = new InMemoryThreadStore();
+      if (process.env.NODE_ENV === "production") {
+        logger.warn(
+          "InMemoryThreadStore is in use in a production build (NODE_ENV=production). " +
+            "Thread history is unbounded and lost on restart. " +
+            "Pass agents({ threadStore: <persistent impl> }) for real deployments.",
+        );
+      } else {
+        logger.info(
+          "Using default InMemoryThreadStore (dev-only — threads are lost on restart and grow without bound).",
+        );
+      }
+    }
+  }
+
+  /** Effective approval policy with defaults applied. */
+  private get resolvedApprovalPolicy(): {
+    requireForDestructive: boolean;
+    timeoutMs: number;
+  } {
+    const cfg = this.config.approval ?? {};
+    return {
+      requireForDestructive: cfg.requireForDestructive ?? true,
+      timeoutMs: cfg.timeoutMs ?? 60_000,
+    };
+  }
+
+  /** Effective DoS limits with defaults applied. */
+  private get resolvedLimits(): {
+    maxConcurrentStreamsPerUser: number;
+    maxToolCalls: number;
+    maxSubAgentDepth: number;
+  } {
+    const cfg = this.config.limits ?? {};
+    return {
+      maxConcurrentStreamsPerUser: cfg.maxConcurrentStreamsPerUser ?? 5,
+      maxToolCalls: cfg.maxToolCalls ?? 50,
+      maxSubAgentDepth: cfg.maxSubAgentDepth ?? 3,
+    };
+  }
+
+  /** Number of currently tracked streams whose owner is `userId`. */
+  private countUserStreams(userId: string): number {
+    let owned = 0;
+    this.activeStreams.forEach((stream) => {
+      if (stream.userId === userId) owned += 1;
+    });
+    return owned;
+  }
+
+  async setup() {
+    await this.loadAgents();
+    this.mountInvocationsRoute();
+    this.printRegistry();
+  }
+
+  /**
+   * Clears the registry, closes any MCP client, then re-runs `loadAgents()`
+   * (files + code agents). Not atomic: the registry is empty in between.
+   */
+  async reload(): Promise<void> {
+    this.agents.clear();
+    this.defaultAgentName = null;
+    if (this.mcpClient) {
+      await this.mcpClient.close();
+      this.mcpClient = null;
+    }
+    await this.loadAgents();
+  }
+
+  private async loadAgents() {
+    const { defs: fileDefs, defaultAgent: fileDefault } =
+      await this.loadFileDefinitions();
+
+    const codeDefs = this.config.agents ?? {};
+
+    for (const name of Object.keys(fileDefs)) {
+      if (codeDefs[name]) {
+        logger.warn(
+          "Agent '%s' defined in both code and a markdown file. Code definition takes precedence.",
+          name,
+        );
+      }
+    }
+
+    const merged: Record<string, { def: AgentDefinition; src: AgentSource }> =
+      {};
+    for (const [name, def] of Object.entries(fileDefs)) {
+      merged[name] = { def, src: { origin: "file" } };
+    }
+    for (const [name, def] of Object.entries(codeDefs)) {
+      merged[name] = { def, src: { origin: "code" } };
+    }
+
+    if (Object.keys(merged).length === 0) {
+      logger.info(
+        "No agents registered (no files in %s, no code-defined agents)",
+        this.resolvedAgentsDir() ?? "<disabled>",
+      );
+      return;
+    }
+
+    for (const [name, { def, src }] of Object.entries(merged)) {
+      try {
+        const registered = await this.buildRegisteredAgent(name, def, src);
+        this.agents.set(name, registered);
+        if (!this.defaultAgentName) this.defaultAgentName = name;
+      } catch (err) {
+        throw new Error(
+          `Failed to register agent '${name}' (${src.origin}): ${
+            err instanceof Error ? err.message : String(err)
+          }`,
+          { cause: err instanceof Error ? err : undefined },
+        );
+      }
+    }
+
+    if (this.config.defaultAgent) {
+      if (!this.agents.has(this.config.defaultAgent)) {
+        throw new Error(
+          `defaultAgent '${this.config.defaultAgent}' is not registered. Available: ${Array.from(this.agents.keys()).join(", ")}`,
+        );
+      }
+      this.defaultAgentName = this.config.defaultAgent;
+    } else if (fileDefault && this.agents.has(fileDefault)) {
+      this.defaultAgentName = fileDefault;
+    }
+  }
+
+  /**
+   * Resolves the directory that is scanned for markdown agent definitions.
+   *
+   * @returns `null` when `config.dir` is `false`; otherwise the configured
+   * directory (falling back to `DEFAULT_AGENTS_DIR`) as an absolute path.
+   * Relative values are resolved against `process.cwd()`; absolute values
+   * are returned untouched.
+   */
+  private resolvedAgentsDir(): string | null {
+    const configured = this.config.dir;
+    if (configured === false) return null;
+
+    const target = configured ?? DEFAULT_AGENTS_DIR;
+    if (path.isAbsolute(target)) {
+      return target;
+    }
+    return path.resolve(process.cwd(), target);
+  }
+
+  /**
+   * Loads agent definitions from the resolved agents directory.
+   *
+   * When directory loading is disabled (no resolved directory) an empty
+   * result is returned without invoking the loader. Otherwise the loader is
+   * handed the plugin-level default model, the ambient `config.tools`, the
+   * plugin toolkit index and the code-defined agents.
+   *
+   * @returns Whatever `loadAgentsFromDir` resolves to: the definitions keyed
+   * by agent name plus the default agent name reported by the loader (or
+   * `null`).
+   */
+  private async loadFileDefinitions(): Promise<{
+    defs: Record<string, AgentDefinition>;
+    defaultAgent: string | null;
+  }> {
+    const agentsDir = this.resolvedAgentsDir();
+    if (!agentsDir) {
+      return { defs: {}, defaultAgent: null };
+    }
+
+    return loadAgentsFromDir(agentsDir, {
+      defaultModel: this.config.defaultModel,
+      availableTools: this.config.tools ?? {},
+      plugins: this.pluginProviderIndex(),
+      codeAgents: this.config.agents,
+    });
+  }
+
+  /**
+   * Indexes, by plugin name, the `toolkit()` factory of every registered tool
+   * provider that exposes one. The result is passed to the markdown loader as
+   * its `plugins` option.
+   *
+   * Providers without a `toolkit` function are left out, and the map is empty
+   * when no plugin context is attached. Each stored `toolkit` is bound to its
+   * provider so it can be called detached.
+   */
+  private pluginProviderIndex(): Map<
+    string,
+    { toolkit: (opts?: unknown) => Record<string, unknown> }
+  > {
+    const byPlugin = new Map();
+    if (!this.context) return byPlugin;
+
+    for (const registration of this.context.getToolProviders()) {
+      const candidate = registration.provider as ToolProvider & {
+        toolkit?: (opts?: unknown) => Record<string, unknown>;
+      };
+      if (typeof candidate.toolkit !== "function") continue;
+      byPlugin.set(registration.name, {
+        toolkit: candidate.toolkit.bind(candidate),
+      });
+    }
+    return byPlugin;
+  }
+
+  /**
+   * Turns an agent definition into its runtime registration.
+   *
+   * The adapter is resolved first and the tool index second; both steps are
+   * awaited in sequence, so an adapter failure surfaces before any tool is
+   * resolved.
+   *
+   * @param name Name the agent is registered under.
+   * @param def  The agent definition (from code or a markdown file).
+   * @param src  Where the definition came from; forwarded to `buildToolIndex`.
+   */
+  private async buildRegisteredAgent(
+    name: string,
+    def: AgentDefinition,
+    src: AgentSource,
+  ): Promise<RegisteredAgent> {
+    const adapter = await this.resolveAdapter(def, name);
+    const toolIndex = await this.buildToolIndex(name, def, src);
+
+    const { instructions, baseSystemPrompt, maxSteps, maxTokens, ephemeral } =
+      def;
+    const registered: RegisteredAgent = {
+      name,
+      instructions,
+      adapter,
+      toolIndex,
+      baseSystemPrompt,
+      maxSteps,
+      maxTokens,
+      ephemeral,
+    };
+    return registered;
+  }
+
+  /**
+   * Resolves the adapter an agent runs on.
+   *
+   * The model source is `def.model`, falling back to `config.defaultModel`:
+   * - a pre-built adapter (or a promise of one) is awaited and returned as
+   *   is; the per-agent `maxSteps` / `maxTokens` knobs are NOT applied to it;
+   * - a non-empty string is passed to `DatabricksAdapter.fromModelServing`
+   *   together with the per-agent knobs;
+   * - no source at all asks `DatabricksAdapter.fromModelServing` for its
+   *   default, and a failure there is rethrown with an agent-specific message
+   *   (the original error is kept as `cause`).
+   *
+   * @param def  Agent definition providing `model`, `maxSteps`, `maxTokens`.
+   * @param name Agent name, used only in the error message.
+   */
+  private async resolveAdapter(
+    def: AgentDefinition,
+    name: string,
+  ): Promise<AgentAdapter> {
+    const model = def.model ?? this.config.defaultModel;
+
+    // Users who hand over a ready-made adapter own its settings.
+    if (model && typeof model !== "string") {
+      return await model;
+    }
+
+    // Only forward knobs the definition actually sets.
+    const knobs: { maxSteps?: number; maxTokens?: number } = {};
+    if (def.maxSteps !== undefined) knobs.maxSteps = def.maxSteps;
+    if (def.maxTokens !== undefined) knobs.maxTokens = def.maxTokens;
+
+    const { DatabricksAdapter } = await import("../../agents/databricks");
+    if (model) {
+      return DatabricksAdapter.fromModelServing(model, knobs);
+    }
+
+    try {
+      return await DatabricksAdapter.fromModelServing(undefined, knobs);
+    } catch (err) {
+      throw new Error(
+        `Agent '${name}' has no model configured and no DATABRICKS_AGENT_ENDPOINT default available`,
+        { cause: err instanceof Error ? err : undefined },
+      );
+    }
+  }
+
+  /**
+   * Builds the per-agent dispatch index (tool name → resolved entry).
+   *
+   * Entries are written in this order, so later steps overwrite earlier ones
+   * on a name clash:
+   *   1. auto-inherited plugin tools — only when the definition declares no
+   *      tools and no sub-agents AND `autoInheritTools` is enabled for the
+   *      definition's origin;
+   *   2. one `agent-<key>` tool per declared sub-agent;
+   *   3. explicitly declared toolkit entries and function tools;
+   *   4. hosted tools, connected through the MCP client.
+   *
+   * @param agentName Agent being built (used for logging and error text).
+   * @param def       The agent definition.
+   * @param src       Origin of the definition; selects the auto-inherit flag.
+   * @throws Error when a declared tool matches none of the known shapes.
+   */
+  private async buildToolIndex(
+    agentName: string,
+    def: AgentDefinition,
+    src: AgentSource,
+  ): Promise<Map<string, ResolvedToolEntry>> {
+    const index = new Map<string, ResolvedToolEntry>();
+    const declaredTools = Object.entries(def.tools ?? {});
+    const declaredSubAgents = Object.entries(def.agents ?? {});
+
+    const inheritFlags = normalizeAutoInherit(this.config.autoInheritTools);
+    const inheritForOrigin =
+      src.origin === "file" ? inheritFlags.file : inheritFlags.code;
+    if (
+      declaredTools.length === 0 &&
+      declaredSubAgents.length === 0 &&
+      inheritForOrigin
+    ) {
+      await this.applyAutoInherit(agentName, index);
+    }
+
+    // Sub-agents are exposed to the parent as `agent-<key>` tools taking a
+    // single string `input`.
+    for (const [childKey, childDef] of declaredSubAgents) {
+      const toolName = `agent-${childKey}`;
+      const summary = childDef.instructions.slice(0, 120);
+      index.set(toolName, {
+        source: "subagent",
+        agentName: childDef.name ?? childKey,
+        def: {
+          name: toolName,
+          description: summary || `Delegate to the ${childKey} sub-agent`,
+          parameters: {
+            type: "object",
+            properties: {
+              input: {
+                type: "string",
+                description: "Message to send to the sub-agent.",
+              },
+            },
+            required: ["input"],
+          },
+        },
+      });
+    }
+
+    // Explicit tools. Hosted tools are only collected here; they are
+    // connected in one batch once the loop is done.
+    const hosted: import("../../core/agent/tools/hosted-tools").HostedTool[] =
+      [];
+    for (const [key, tool] of declaredTools) {
+      if (isToolkitEntry(tool)) {
+        index.set(key, {
+          source: "toolkit",
+          pluginName: tool.pluginName,
+          localName: tool.localName,
+          def: { ...tool.def, name: key },
+        });
+      } else if (isFunctionTool(tool)) {
+        index.set(key, {
+          source: "function",
+          functionTool: tool,
+          def: { ...functionToolToDefinition(tool), name: key },
+        });
+      } else if (isHostedTool(tool)) {
+        hosted.push(tool);
+      } else {
+        throw new Error(
+          `Agent '${agentName}' tool '${key}' has an unrecognized shape`,
+        );
+      }
+    }
+
+    if (hosted.length > 0) {
+      await this.connectHostedTools(hosted, index);
+    }
+
+    return index;
+  }
+
+  /**
+   * Copies auto-inheritable plugin tools into `index`.
+   *
+   * Every tool provider other than this plugin is visited. For providers
+   * with a `toolkit()` function, only entries flagged
+   * `autoInheritable: true` are added (keyed by their toolkit key); all other
+   * toolkit entries are recorded as skipped. Providers without `toolkit()`
+   * contribute nothing: each of their `getAgentTools()` tools is recorded as
+   * skipped. Two summary lines (inherited / skipped) are logged when
+   * non-empty. Does nothing when no plugin context is attached.
+   *
+   * @param agentName Agent the tools are inherited for (log output only).
+   * @param index     Tool index to mutate.
+   */
+  private async applyAutoInherit(
+    agentName: string,
+    index: Map<string, ResolvedToolEntry>,
+  ): Promise<void> {
+    const context = this.context;
+    if (!context) return;
+
+    const inheritedKeys: string[] = [];
+    const skipped = new Map<string, string[]>();
+    const noteSkipped = (pluginName: string, localName: string): void => {
+      const names = skipped.get(pluginName);
+      if (names) {
+        names.push(localName);
+      } else {
+        skipped.set(pluginName, [localName]);
+      }
+    };
+
+    for (const { name: pluginName, provider } of context.getToolProviders()) {
+      if (pluginName === this.name) continue;
+
+      const candidate = provider as ToolProvider & {
+        toolkit?: (opts?: unknown) => Record<string, unknown>;
+      };
+      if (typeof candidate.toolkit !== "function") {
+        // Providers without toolkit() cannot opt individual tools in, so all
+        // of their tools are skipped and must be wired explicitly.
+        for (const tool of provider.getAgentTools()) {
+          noteSkipped(pluginName, tool.name);
+        }
+        continue;
+      }
+
+      const entries = candidate.toolkit() as Record<string, unknown>;
+      for (const [key, entry] of Object.entries(entries)) {
+        if (!isToolkitEntry(entry)) continue;
+        if (entry.autoInheritable === true) {
+          index.set(key, {
+            source: "toolkit",
+            pluginName: entry.pluginName,
+            localName: entry.localName,
+            def: { ...entry.def, name: key },
+          });
+          inheritedKeys.push(key);
+        } else {
+          noteSkipped(entry.pluginName, entry.localName);
+        }
+      }
+    }
+
+    if (inheritedKeys.length > 0) {
+      logger.info(
+        "[agent %s] auto-inherited %d tool(s): %s",
+        agentName,
+        inheritedKeys.length,
+        inheritedKeys.join(", "),
+      );
+    }
+
+    if (skipped.size > 0) {
+      let skippedTotal = 0;
+      const perPlugin: string[] = [];
+      for (const [pluginName, names] of skipped) {
+        skippedTotal += names.length;
+        perPlugin.push(`${pluginName}(${names.length})`);
+      }
+      logger.info(
+        "[agent %s] auto-inherit skipped %d tool(s) not marked autoInheritable: %s. Wire them explicitly via `tools:` if needed.",
+        agentName,
+        skippedTotal,
+        perPlugin.join(", "),
+      );
+    }
+  }
+
+  /**
+   * Connects the given hosted tools through the MCP client and adds the
+   * resulting tool definitions to `index` as `source: "mcp"` entries.
+   *
+   * Host and auth headers come from the workspace client; if obtaining or
+   * resolving it throws, `DATABRICKS_HOST` / `DATABRICKS_TOKEN` are used
+   * instead. Without a host the hosted tools are skipped with a warning. The
+   * MCP client is created on first use and reused afterwards.
+   *
+   * NOTE(review): the definitions indexed here come from
+   * `getAllToolDefinitions()` on the shared client. If that returns tools
+   * for every endpoint the client has connected so far, an agent also
+   * receives hosted tools declared by previously built agents — confirm
+   * against `AppKitMcpClient`.
+   *
+   * @param hostedTools Hosted tool declarations to connect.
+   * @param index       Tool index to mutate.
+   */
+  private async connectHostedTools(
+    hostedTools: import("../../core/agent/tools/hosted-tools").HostedTool[],
+    index: Map<string, ResolvedToolEntry>,
+  ): Promise<void> {
+    let host: string | undefined;
+    let authenticate: () => Promise<Record<string, string>>;
+
+    try {
+      const { getWorkspaceClient } = await import("../../context");
+      const workspace = getWorkspaceClient();
+      await workspace.config.ensureResolved();
+      host = workspace.config.host;
+      authenticate = async () => {
+        const collected = new Headers();
+        await workspace.config.authenticate(collected);
+        return Object.fromEntries(collected.entries());
+      };
+    } catch {
+      // Best-effort fallback to plain environment credentials.
+      host = process.env.DATABRICKS_HOST;
+      authenticate = async (): Promise<Record<string, string>> => {
+        const envToken = process.env.DATABRICKS_TOKEN;
+        if (!envToken) return {};
+        return { Authorization: `Bearer ${envToken}` };
+      };
+    }
+
+    if (!host) {
+      logger.warn(
+        "No Databricks host available — skipping %d hosted tool(s)",
+        hostedTools.length,
+      );
+      return;
+    }
+
+    if (!this.mcpClient) {
+      this.mcpClient = new AppKitMcpClient(
+        host,
+        authenticate,
+        buildMcpHostPolicy(this.config.mcp, host),
+      );
+    }
+
+    await this.mcpClient.connectAll(resolveHostedTools(hostedTools));
+
+    for (const toolDef of this.mcpClient.getAllToolDefinitions()) {
+      const { name } = toolDef;
+      index.set(name, { source: "mcp", mcpToolName: name, def: toolDef });
+    }
+  }
+
+  // ----------------- ToolProvider (no tools of our own) --------------------
+
+  /** The agents plugin contributes no tools of its own: always empty. */
+  getAgentTools(): AgentToolDefinition[] {
+    const none: AgentToolDefinition[] = [];
+    return none;
+  }
+
+  /**
+   * Always rejects: this plugin exposes no tools, so there is nothing to
+   * execute through the `ToolProvider` entry point.
+   */
+  async executeAgentTool(): Promise<unknown> {
+    const reason = "AgentsPlugin does not expose executeAgentTool directly";
+    throw new Error(reason);
+  }
+
+  // ----------------- Route mounting and handlers ---------------------------
+
+  /**
+   * Registers `POST /invocations` on the plugin context. No-op when no
+   * context is attached.
+   *
+   * The route callback is synchronous while `_handleInvocations` is async, so
+   * its promise is explicitly terminated with a `catch`: a rejection (for
+   * example a failing thread store) is logged and answered instead of
+   * becoming an unhandled promise rejection with a hanging request.
+   */
+  private mountInvocationsRoute() {
+    if (!this.context) return;
+    this.context.addRoute(
+      "post",
+      "/invocations",
+      (req: express.Request, res: express.Response) => {
+        this._handleInvocations(req, res).catch((err: unknown) => {
+          logger.error("Agent invocations error: %O", err);
+          if (res.headersSent) {
+            // The response has already started; all that is left is to
+            // terminate it.
+            res.end();
+            return;
+          }
+          res.status(500).json({ error: "Internal server error" });
+        });
+      },
+    );
+  }
+
+  /**
+   * Registers the plugin's router-level endpoints, in this order: `chat`,
+   * `cancel`, `approve`, `threads`, `thread`, `deleteThread`, `info`.
+   *
+   * @param router Router the routes are attached to via `this.route`.
+   */
+  injectRoutes(router: IAppRouter) {
+    type Handler = (
+      req: express.Request,
+      res: express.Response,
+    ) => Promise<void>;
+    const endpoints: Array<{
+      name: string;
+      method: "get" | "post" | "delete";
+      path: string;
+      handler: Handler;
+    }> = [
+      {
+        name: "chat",
+        method: "post",
+        path: "/chat",
+        handler: async (req, res) => this._handleChat(req, res),
+      },
+      {
+        name: "cancel",
+        method: "post",
+        path: "/cancel",
+        handler: async (req, res) => this._handleCancel(req, res),
+      },
+      {
+        name: "approve",
+        method: "post",
+        path: "/approve",
+        handler: async (req, res) => this._handleApprove(req, res),
+      },
+      {
+        name: "threads",
+        method: "get",
+        path: "/threads",
+        handler: async (req, res) => this._handleListThreads(req, res),
+      },
+      {
+        name: "thread",
+        method: "get",
+        path: "/threads/:threadId",
+        handler: async (req, res) => this._handleGetThread(req, res),
+      },
+      {
+        name: "deleteThread",
+        method: "delete",
+        path: "/threads/:threadId",
+        handler: async (req, res) => this._handleDeleteThread(req, res),
+      },
+      {
+        name: "info",
+        method: "get",
+        path: "/info",
+        // Same payload as `clientConfig()`: agent names + current default.
+        handler: async (_req, res) => {
+          res.json({
+            agents: Array.from(this.agents.keys()),
+            defaultAgent: this.defaultAgentName,
+          });
+        },
+      },
+    ];
+
+    for (const endpoint of endpoints) {
+      this.route(router, endpoint);
+    }
+  }
+
+  /**
+   * Returns the registered agent names (in registration order) and the
+   * current default agent name.
+   */
+  clientConfig(): Record<string, unknown> {
+    const agentNames = [...this.agents.keys()];
+    return { agents: agentNames, defaultAgent: this.defaultAgentName };
+  }
+
+  /**
+   * Handles `POST /chat`.
+   *
+   * Steps, each of which can end the request early:
+   *   1. validate the body against `chatRequestSchema` (400);
+   *   2. resolve the requested (or default) agent (400);
+   *   3. enforce the per-user concurrent-stream limit (429 + `Retry-After`);
+   *   4. load the referenced thread (404 if it does not exist for this user)
+   *      or create a new one when no thread id was given;
+   *   5. append the user message and stream the agent's response.
+   */
+  private async _handleChat(req: express.Request, res: express.Response) {
+    const parsed = chatRequestSchema.safeParse(req.body);
+    if (!parsed.success) {
+      res.status(400).json({
+        error: "Invalid request",
+        details: parsed.error.flatten().fieldErrors,
+      });
+      return;
+    }
+    const { message, threadId, agent: requestedAgent } = parsed.data;
+
+    const registered = this.resolveAgent(requestedAgent);
+    if (!registered) {
+      const error = requestedAgent
+        ? `Agent "${requestedAgent}" not found`
+        : "No agent registered";
+      res.status(400).json({ error });
+      return;
+    }
+
+    const userId = this.resolveUserId(req);
+
+    // The limit is checked before any thread is allocated, so a client that
+    // is being throttled cannot churn thread rows.
+    const { maxConcurrentStreamsPerUser } = this.resolvedLimits;
+    if (this.countUserStreams(userId) >= maxConcurrentStreamsPerUser) {
+      res.setHeader("Retry-After", "5");
+      res.status(429).json({
+        error: `Too many concurrent streams for this user (limit ${maxConcurrentStreamsPerUser}). Wait for an existing stream to complete before starting another.`,
+      });
+      return;
+    }
+
+    const existing = threadId
+      ? await this.threadStore.get(threadId, userId)
+      : null;
+    if (threadId && !existing) {
+      res.status(404).json({ error: `Thread ${threadId} not found` });
+      return;
+    }
+    const thread = existing ? existing : await this.threadStore.create(userId);
+
+    await this.threadStore.addMessage(thread.id, userId, {
+      id: randomUUID(),
+      role: "user",
+      content: message,
+      createdAt: new Date(),
+    } satisfies Message);
+    return this._streamAgent(req, res, registered, thread, userId);
+  }
+
+  /**
+   * Handles `POST /invocations`.
+   *
+   * Validates the body against `invocationsRequestSchema`, resolves the
+   * default agent, creates a fresh thread for the caller, seeds it from
+   * `input` and streams the agent's response.
+   *
+   * `input` is either a single string (stored as one user message) or a list
+   * of items. For list items, `role` defaults to `"user"`, string content is
+   * stored as is, other content is stored as JSON, and items whose content
+   * is missing or empty are skipped.
+   *
+   * NOTE(review): unlike `_handleChat`, this handler does not check
+   * `maxConcurrentStreamsPerUser` before allocating a thread — confirm
+   * whether that is intentional.
+   */
+  private async _handleInvocations(
+    req: express.Request,
+    res: express.Response,
+  ) {
+    const parsed = invocationsRequestSchema.safeParse(req.body);
+    if (!parsed.success) {
+      res.status(400).json({
+        error: "Invalid request",
+        details: parsed.error.flatten().fieldErrors,
+      });
+      return;
+    }
+    const { input } = parsed.data;
+    const registered = this.resolveAgent();
+    if (!registered) {
+      res.status(400).json({ error: "No agent registered" });
+      return;
+    }
+    const userId = this.resolveUserId(req);
+    const thread = await this.threadStore.create(userId);
+
+    if (typeof input === "string") {
+      await this.threadStore.addMessage(thread.id, userId, {
+        id: randomUUID(),
+        role: "user",
+        content: input,
+        createdAt: new Date(),
+      });
+    } else {
+      for (const item of input) {
+        const role = (item.role ?? "user") as Message["role"];
+        // Missing content has to become the empty string so the skip below
+        // fires. Serializing a substituted "" would produce the
+        // two-character string `""`, which is truthy and would be stored as
+        // a bogus message.
+        let content: string;
+        if (typeof item.content === "string") {
+          content = item.content;
+        } else if (item.content == null) {
+          content = "";
+        } else {
+          content = JSON.stringify(item.content);
+        }
+        if (!content) continue;
+        await this.threadStore.addMessage(thread.id, userId, {
+          id: randomUUID(),
+          role,
+          content,
+          createdAt: new Date(),
+        });
+      }
+    }
+
+    return this._streamAgent(req, res, registered, thread, userId);
+  }
+
+  /**
+   * Runs `registered` against `thread` and streams the translated events to
+   * `res` via `executeStream`.
+   *
+   * A fresh stream id is generated and registered in `activeStreams` together
+   * with an `AbortController`, so the stream can be cancelled and approvals
+   * can be matched to it. The adapter is driven by a background task that
+   * pushes events into an `EventChannel`; the generator handed to
+   * `executeStream` drains that channel. Tool calls issued by the adapter go
+   * through `executeTool`, which enforces the tool-call budget and the
+   * approval policy before dispatching by tool source.
+   *
+   * The budget and the approval gate are also handed to `runSubAgent`, so
+   * tools called inside sub-agents are counted against the same budget and
+   * destructive ones require the same approval.
+   *
+   * @param req        Originating request (forwarded to plugin tools; also the
+   *                   source of the `x-forwarded-access-token` header for MCP).
+   * @param res        Response the event stream is written to.
+   * @param registered Agent to run.
+   * @param thread     Thread whose messages form the conversation.
+   * @param userId     Owner of the stream and thread.
+   */
+  private async _streamAgent(
+    req: express.Request,
+    res: express.Response,
+    registered: RegisteredAgent,
+    thread: Thread,
+    userId: string,
+  ): Promise<void> {
+    const abortController = new AbortController();
+    const signal = abortController.signal;
+    const requestId = randomUUID();
+    this.activeStreams.set(requestId, { controller: abortController, userId });
+
+    const tools = Array.from(registered.toolIndex.values()).map((e) => e.def);
+    const approvalPolicy = this.resolvedApprovalPolicy;
+    const limits = this.resolvedLimits;
+    const outboundEvents = new EventChannel<ResponseStreamEvent>();
+    const translator = new AgentEventTranslator();
+    // Per-run tool-call budget (shared across the top-level adapter and any
+    // sub-agents it delegates to). Counted pre-dispatch so a prompt-injected
+    // agent cannot drain the budget silently via denied calls.
+    let toolCallsUsed = 0;
+
+    // Charges one call against the budget. When the budget is exhausted the
+    // whole run is aborted and the call is rejected.
+    const consumeToolCall = (): void => {
+      if (toolCallsUsed >= limits.maxToolCalls) {
+        abortController.abort(
+          new Error(
+            `Tool-call budget exhausted (limit ${limits.maxToolCalls}).`,
+          ),
+        );
+        throw new Error(
+          `Tool-call budget exhausted (limit ${limits.maxToolCalls}). Raise agents({ limits: { maxToolCalls } }) or review the agent's tool-selection logic.`,
+        );
+      }
+      toolCallsUsed++;
+    };
+
+    // Asks the user to approve a destructive tool call when the policy
+    // requires it. Resolves to the denial text to hand back to the model, or
+    // `null` when the call may proceed.
+    const requestApproval = async (
+      name: string,
+      entry: ResolvedToolEntry,
+      args: unknown,
+    ): Promise<string | null> => {
+      if (
+        !approvalPolicy.requireForDestructive ||
+        entry.def.annotations?.destructive !== true
+      ) {
+        return null;
+      }
+      const approvalId = randomUUID();
+      for (const ev of translator.translate({
+        type: "approval_pending",
+        approvalId,
+        streamId: requestId,
+        toolName: name,
+        args,
+        annotations: entry.def.annotations,
+      })) {
+        outboundEvents.push(ev);
+      }
+      const decision = await this.approvalGate.wait({
+        approvalId,
+        streamId: requestId,
+        userId,
+        timeoutMs: approvalPolicy.timeoutMs,
+      });
+      return decision === "deny"
+        ? `Tool execution denied by user approval gate (tool: ${name}).`
+        : null;
+    };
+
+    // Bundle passed down to sub-agents so their tool calls are governed by
+    // the same budget and approval policy as top-level calls.
+    const toolGuard = { consume: consumeToolCall, approve: requestApproval };
+
+    const executeTool = async (
+      name: string,
+      args: unknown,
+    ): Promise<unknown> => {
+      // Budget first: unknown and denied calls are charged as well.
+      consumeToolCall();
+
+      const entry = registered.toolIndex.get(name);
+      if (!entry) throw new Error(`Unknown tool: ${name}`);
+
+      const denial = await requestApproval(name, entry, args);
+      if (denial !== null) return denial;
+
+      let result: unknown;
+      if (entry.source === "toolkit") {
+        if (!this.context) {
+          throw new Error(
+            "Plugin tool execution requires PluginContext; this should never happen through createApp",
+          );
+        }
+        result = await this.context.executeTool(
+          req,
+          entry.pluginName,
+          entry.localName,
+          args,
+          signal,
+        );
+      } else if (entry.source === "function") {
+        result = await entry.functionTool.execute(
+          args as Record<string, unknown>,
+        );
+      } else if (entry.source === "mcp") {
+        if (!this.mcpClient) throw new Error("MCP client not connected");
+        // Forward the caller's token, when present, as the MCP bearer token.
+        const oboToken = req.headers["x-forwarded-access-token"];
+        const mcpAuth =
+          typeof oboToken === "string"
+            ? { Authorization: `Bearer ${oboToken}` }
+            : undefined;
+        result = await this.mcpClient.callTool(
+          entry.mcpToolName,
+          args,
+          mcpAuth,
+        );
+      } else if (entry.source === "subagent") {
+        const childAgent = this.agents.get(entry.agentName);
+        if (!childAgent)
+          throw new Error(`Sub-agent not found: ${entry.agentName}`);
+        result = await this.runSubAgent(
+          req,
+          childAgent,
+          args,
+          signal,
+          1,
+          toolGuard,
+        );
+      }
+
+      // A `void` / `undefined` return is a legitimate tool outcome (e.g., a
+      // "send notification" side-effecting tool). Return an empty string so
+      // the LLM sees a successful-but-empty result rather than a bogus
+      // "execution failed" error.
+      if (result === undefined) {
+        return "";
+      }
+      const MAX = 50_000;
+      // JSON.stringify yields `undefined` for values such as functions or
+      // symbols; fall back to String() so the length check cannot throw.
+      const serialized =
+        typeof result === "string"
+          ? result
+          : ((JSON.stringify(result) as string | undefined) ?? String(result));
+      if (serialized.length > MAX) {
+        return `${serialized.slice(0, MAX)}\n\n[Result truncated: ${serialized.length} chars exceeds ${MAX} limit]`;
+      }
+      return result;
+    };
+
+    // Drive the adapter and the approval-event side-channel concurrently.
+    // Outbound events from both sources flow through `outboundEvents`; the
+    // generator below drains the channel in order. executeTool pushes
+    // approval-pending events into the same channel before awaiting the gate.
+    const driver = (async () => {
+      try {
+        for (const evt of translator.translate({
+          type: "metadata",
+          data: { threadId: thread.id },
+        })) {
+          outboundEvents.push(evt);
+        }
+
+        const pluginNames = this.context
+          ? this.context
+              .getPluginNames()
+              .filter((n) => n !== this.name && n !== "server")
+          : [];
+        const fullPrompt = composePromptForAgent(
+          registered,
+          this.config.baseSystemPrompt,
+          {
+            agentName: registered.name,
+            pluginNames,
+            toolNames: tools.map((t) => t.name),
+          },
+        );
+
+        // The system prompt is prepended per run; it is not stored in the
+        // thread.
+        const messagesWithSystem: Message[] = [
+          {
+            id: "system",
+            role: "system",
+            content: fullPrompt,
+            createdAt: new Date(),
+          },
+          ...thread.messages,
+        ];
+
+        const stream = registered.adapter.run(
+          {
+            messages: messagesWithSystem,
+            tools,
+            threadId: thread.id,
+            signal,
+          },
+          { executeTool, signal },
+        );
+
+        // Accumulate assistant output from BOTH streaming and non-streaming
+        // adapters. Delta-based adapters (Databricks, Vercel AI) emit
+        // `message_delta` chunks that we concatenate; adapters that yield a
+        // single final assistant message (e.g. LangChain's `on_chain_end`
+        // path) emit a `message` event whose content replaces whatever
+        // deltas already arrived. Without the `message` branch, multi-turn
+        // LangChain conversations silently dropped the assistant turn from
+        // thread history.
+        let fullContent = "";
+        for await (const event of stream) {
+          if (signal.aborted) break;
+          if (event.type === "message_delta") {
+            fullContent += event.content;
+          } else if (event.type === "message") {
+            fullContent = event.content;
+          }
+          for (const translated of translator.translate(event)) {
+            outboundEvents.push(translated);
+          }
+        }
+
+        if (fullContent) {
+          await this.threadStore.addMessage(thread.id, userId, {
+            id: randomUUID(),
+            role: "assistant",
+            content: fullContent,
+            createdAt: new Date(),
+          });
+        }
+
+        for (const evt of translator.finalize()) outboundEvents.push(evt);
+      } catch (error) {
+        // An error after an abort is treated as a consequence of the abort
+        // and ends the stream without surfacing an error to the consumer.
+        if (signal.aborted) {
+          outboundEvents.close();
+          return;
+        }
+        logger.error("Agent chat error: %O", error);
+        outboundEvents.close(error);
+        return;
+      } finally {
+        // Any pending approval gates for this stream are auto-denied so the
+        // adapter can unwind if it was still waiting.
+        this.approvalGate.abortStream(requestId);
+        this.activeStreams.delete(requestId);
+        // Stateless agents (e.g. autocomplete) don't persist history; drop
+        // the thread so `InMemoryThreadStore` doesn't accumulate one record
+        // per request. Swallow delete errors — the stream has already
+        // finished and the client has the response.
+        if (registered.ephemeral) {
+          try {
+            await this.threadStore.delete(thread.id, userId);
+          } catch (err) {
+            logger.warn(
+              "Failed to delete ephemeral thread %s: %O",
+              thread.id,
+              err,
+            );
+          }
+        }
+      }
+      outboundEvents.close();
+    })();
+
+    await this.executeStream<ResponseStreamEvent>(
+      res,
+      async function* () {
+        try {
+          for await (const ev of outboundEvents) {
+            yield ev;
+          }
+        } finally {
+          // Wait for the driver's cleanup before the generator completes.
+          await driver.catch(() => undefined);
+        }
+      },
+      {
+        ...agentStreamDefaults,
+        stream: { ...agentStreamDefaults.stream, streamId: requestId },
+      },
+    );
+  }
+
+  /**
+   * Runs a sub-agent in response to an `agent-<key>` tool call. Returns the
+   * concatenated text output to hand back to the parent adapter as the tool
+   * result.
+   *
+   * `depth` starts at 1 for a top-level sub-agent invocation (i.e. the
+   * outer `_streamAgent` calls `runSubAgent(..., 1)`) and increments on
+   * each nested `runSubAgent` call. Depths exceeding
+   * `limits.maxSubAgentDepth` are rejected before any adapter work.
+   *
+   * The sub-agent runs on a throwaway conversation: its own system prompt
+   * followed by one user message. That message is `args.input` when it is a
+   * string, otherwise the JSON serialization of `args`.
+   *
+   * @param req    Originating request, forwarded to plugin and MCP tools.
+   * @param child  The sub-agent to run.
+   * @param args   Arguments of the `agent-<key>` tool call.
+   * @param signal Abort signal of the enclosing run.
+   * @param depth  Current delegation depth (1-based).
+   * @param guard  Optional budget/approval hooks of the enclosing run. When
+   *               given, every tool call made by the sub-agent is charged via
+   *               `consume()` before lookup and must pass `approve()` before
+   *               dispatch; the guard is handed on to nested sub-agents. When
+   *               omitted, tool calls are dispatched unguarded.
+   * @throws Error when `depth` exceeds `limits.maxSubAgentDepth`.
+   */
+  private async runSubAgent(
+    req: express.Request,
+    child: RegisteredAgent,
+    args: unknown,
+    signal: AbortSignal,
+    depth: number,
+    guard?: {
+      consume: () => void;
+      approve: (
+        name: string,
+        entry: ResolvedToolEntry,
+        args: unknown,
+      ) => Promise<string | null>;
+    },
+  ): Promise<string> {
+    const limits = this.resolvedLimits;
+    if (depth > limits.maxSubAgentDepth) {
+      throw new Error(
+        `Sub-agent depth exceeded (limit ${limits.maxSubAgentDepth}). ` +
+          `Raise agents({ limits: { maxSubAgentDepth } }) or break the delegation cycle.`,
+      );
+    }
+
+    const input =
+      typeof args === "object" &&
+      args !== null &&
+      typeof (args as { input?: unknown }).input === "string"
+        ? (args as { input: string }).input
+        : JSON.stringify(args);
+    const childTools = Array.from(child.toolIndex.values()).map((e) => e.def);
+
+    const childExecute = async (
+      name: string,
+      childArgs: unknown,
+    ): Promise<unknown> => {
+      // Same ordering as the top-level executor: charge the budget, look the
+      // tool up, then ask for approval.
+      guard?.consume();
+      const entry = child.toolIndex.get(name);
+      if (!entry) throw new Error(`Unknown tool in sub-agent: ${name}`);
+      if (guard) {
+        const denial = await guard.approve(name, entry, childArgs);
+        if (denial !== null) return denial;
+      }
+      if (entry.source === "toolkit" && this.context) {
+        return this.context.executeTool(
+          req,
+          entry.pluginName,
+          entry.localName,
+          childArgs,
+          signal,
+        );
+      }
+      if (entry.source === "function") {
+        return entry.functionTool.execute(childArgs as Record<string, unknown>);
+      }
+      if (entry.source === "subagent") {
+        const grandchild = this.agents.get(entry.agentName);
+        if (!grandchild)
+          throw new Error(`Sub-agent not found: ${entry.agentName}`);
+        return this.runSubAgent(
+          req,
+          grandchild,
+          childArgs,
+          signal,
+          depth + 1,
+          guard,
+        );
+      }
+      if (entry.source === "mcp" && this.mcpClient) {
+        const oboToken = req.headers["x-forwarded-access-token"];
+        const mcpAuth =
+          typeof oboToken === "string"
+            ? { Authorization: `Bearer ${oboToken}` }
+            : undefined;
+        return this.mcpClient.callTool(entry.mcpToolName, childArgs, mcpAuth);
+      }
+      // Also reached for toolkit/mcp entries when the context or the MCP
+      // client is unavailable.
+      throw new Error(`Unsupported sub-agent tool source: ${entry.source}`);
+    };
+
+    const runContext: AgentRunContext = { executeTool: childExecute, signal };
+
+    const pluginNames = this.context
+      ? this.context
+          .getPluginNames()
+          .filter((n) => n !== this.name && n !== "server")
+      : [];
+    const systemPrompt = composePromptForAgent(
+      child,
+      this.config.baseSystemPrompt,
+      {
+        agentName: child.name,
+        pluginNames,
+        toolNames: childTools.map((t) => t.name),
+      },
+    );
+
+    const messages: Message[] = [
+      {
+        id: "system",
+        role: "system",
+        content: systemPrompt,
+        createdAt: new Date(),
+      },
+      {
+        id: randomUUID(),
+        role: "user",
+        content: input,
+        createdAt: new Date(),
+      },
+    ];
+
+    // Only the text output is needed, so events are folded into `output` as
+    // they arrive instead of being retained. Deltas are concatenated; a full
+    // `message` event replaces whatever has been collected so far.
+    let output = "";
+    const collect = (event: AgentEvent): void => {
+      if (event.type === "message_delta") output += event.content;
+      else if (event.type === "message") output = event.content;
+    };
+    for await (const event of child.adapter.run(
+      { messages, tools: childTools, threadId: randomUUID(), signal },
+      runContext,
+    )) {
+      collect(event);
+    }
+    return output;
+  }
+
+  /**
+   * Handles `POST /cancel`: aborts the caller's active stream.
+   *
+   * - 400 when the body carries no non-empty string `streamId`;
+   * - `{ cancelled: true }` when the stream is unknown or already finished
+   *   (idempotent no-op);
+   * - 403 when the stream belongs to a different user;
+   * - otherwise the stream's controller is aborted, the stream is removed
+   *   from `activeStreams`, its pending approvals are aborted, and
+   *   `{ cancelled: true }` is returned.
+   */
+  private async _handleCancel(req: express.Request, res: express.Response) {
+    // `req.body` can be undefined (no body parser ran, or an empty body) and
+    // its contents are untrusted, so read `streamId` defensively instead of
+    // destructuring, which would throw on a missing body.
+    const body: unknown = req.body;
+    const streamId =
+      typeof body === "object" && body !== null
+        ? (body as { streamId?: unknown }).streamId
+        : undefined;
+    if (typeof streamId !== "string" || streamId.length === 0) {
+      res.status(400).json({ error: "streamId is required" });
+      return;
+    }
+    const entry = this.activeStreams.get(streamId);
+    if (!entry) {
+      // Stream is unknown or already completed — idempotent no-op.
+      res.json({ cancelled: true });
+      return;
+    }
+    const userId = this.resolveUserId(req);
+    if (entry.userId !== userId) {
+      res.status(403).json({ error: "Forbidden" });
+      return;
+    }
+    entry.controller.abort("Cancelled by user");
+    this.activeStreams.delete(streamId);
+    this.approvalGate.abortStream(streamId);
+    res.json({ cancelled: true });
+  }
+
+  /**
+   * Handles `POST /approve`: records the caller's decision for a pending
+   * tool approval.
+   *
+   * Responses: 400 for a body that fails `approvalRequestSchema`; 404 when
+   * the stream is not active; 403 when the stream belongs to another user or
+   * the gate reports `forbidden`; 404 when the gate rejects the submission
+   * for any other reason; otherwise `{ decision }`.
+   */
+  private async _handleApprove(req: express.Request, res: express.Response) {
+    const parsed = approvalRequestSchema.safeParse(req.body);
+    if (!parsed.success) {
+      res.status(400).json({
+        error: "Invalid request",
+        details: parsed.error.flatten().fieldErrors,
+      });
+      return;
+    }
+    const { streamId, approvalId, decision } = parsed.data;
+
+    // A missing entry means the stream finished or never existed, so the
+    // approval token can no longer be valid.
+    const owner = this.activeStreams.get(streamId);
+    if (!owner) {
+      res.status(404).json({ error: "Stream not found or already completed" });
+      return;
+    }
+
+    const userId = this.resolveUserId(req);
+    if (owner.userId !== userId) {
+      res.status(403).json({ error: "Forbidden" });
+      return;
+    }
+
+    const outcome = this.approvalGate.submit({ approvalId, userId, decision });
+    if (outcome.ok) {
+      res.json({ decision });
+      return;
+    }
+
+    if (outcome.reason === "forbidden") {
+      res.status(403).json({ error: "Forbidden" });
+    } else {
+      res.status(404).json({ error: "Approval not found or already settled" });
+    }
+  }
+
+  /** Handles `GET /threads`: responds with the caller's threads. */
+  private async _handleListThreads(
+    req: express.Request,
+    res: express.Response,
+  ) {
+    const owner = this.resolveUserId(req);
+    res.json({ threads: await this.threadStore.list(owner) });
+  }
+
+  /**
+   * Handles `GET /threads/:threadId`: responds with the thread, or 404 when
+   * the store has no such thread for the caller.
+   */
+  private async _handleGetThread(req: express.Request, res: express.Response) {
+    const owner = this.resolveUserId(req);
+    const found = await this.threadStore.get(req.params.threadId, owner);
+    if (found) {
+      res.json(found);
+      return;
+    }
+    res.status(404).json({ error: "Thread not found" });
+  }
+
+  /**
+   * Handles `DELETE /threads/:threadId`: responds `{ deleted: true }` when
+   * the store reports a deletion, or 404 otherwise.
+   */
+  private async _handleDeleteThread(
+    req: express.Request,
+    res: express.Response,
+  ) {
+    const owner = this.resolveUserId(req);
+    const removed = await this.threadStore.delete(req.params.threadId, owner);
+    if (removed) {
+      res.json({ deleted: true });
+      return;
+    }
+    res.status(404).json({ error: "Thread not found" });
+  }
+
+  /**
+   * Looks up the agent to run.
+   *
+   * An explicit `name` wins; otherwise the default agent name is used. Either
+   * lookup returns `null` on a miss (no fallback). Only when neither name is
+   * set does the first registered agent get returned, or `null` if the
+   * registry is empty.
+   */
+  private resolveAgent(name?: string): RegisteredAgent | null {
+    const key = name || this.defaultAgentName;
+    if (key) {
+      return this.agents.get(key) ?? null;
+    }
+    for (const firstRegistered of this.agents.values()) {
+      return firstRegistered;
+    }
+    return null;
+  }
+
+  /**
+   * Prints a table of registered agents to stdout: one row per agent with
+   * its tool count, the default agent marked with a green dot. Prints
+   * nothing when no agent is registered.
+   */
+  private printRegistry(): void {
+    const total = this.agents.size;
+    if (total === 0) return;
+
+    const rule = `  ${pc.dim("─".repeat(60))}`;
+    console.log("");
+    console.log(`  ${pc.bold("Agents")} ${pc.dim(`(${total})`)}`);
+    console.log(rule);
+    this.agents.forEach((reg, name) => {
+      const tools = reg.toolIndex.size;
+      const marker = name === this.defaultAgentName ? pc.green("●") : " ";
+      console.log(
+        `  ${marker} ${pc.bold(name.padEnd(24))} ${pc.dim(`${tools} tools`)}`,
+      );
+    });
+    console.log(rule);
+    console.log("");
+  }
+
+  /**
+   * Aborts every pending approval, then closes and drops the MCP client if
+   * one was created.
+   */
+  async shutdown(): Promise<void> {
+    this.approvalGate.abortAll();
+
+    const client = this.mcpClient;
+    if (!client) return;
+    await client.close();
+    this.mcpClient = null;
+  }
+
+  /**
+   * Runtime API exposed by the plugin:
+   * - `register(name, def)` — build and register a code-defined agent;
+   * - `list()` — names of the registered agents;
+   * - `get(name)` — the registered agent, or `null`;
+   * - `reload()` — delegates to `this.reload()`;
+   * - `getDefault()` — current default agent name;
+   * - `getThreads(userId)` — threads of the given user.
+   */
+  exports() {
+    const register = (name: string, def: AgentDefinition) =>
+      this.registerCodeAgent(name, def);
+    const list = () => Array.from(this.agents.keys());
+    const get = (name: string) => this.agents.get(name) ?? null;
+    const reload = () => this.reload();
+    const getDefault = () => this.defaultAgentName;
+    const getThreads = (userId: string) => this.threadStore.list(userId);
+
+    return { register, list, get, reload, getDefault, getThreads };
+  }
+
+  /**
+   * Builds a code-origin agent and stores it under `name`, replacing any
+   * agent already registered with that name. It becomes the default agent
+   * when no default is set yet.
+   */
+  private async registerCodeAgent(
+    name: string,
+    def: AgentDefinition,
+  ): Promise<void> {
+    const origin: AgentSource = { origin: "code" };
+    const built = await this.buildRegisteredAgent(name, def, origin);
+    this.agents.set(name, built);
+    if (this.defaultAgentName) return;
+    this.defaultAgentName = name;
+  }
+}
+
+/**
+ * Expands the `autoInheritTools` option into explicit per-origin flags.
+ *
+ * Auto-inheritance is off unless switched on: an omitted option disables it
+ * for both origins, a boolean applies to both, and an object enables only
+ * the origins it sets (missing keys count as `false`). Even when enabled,
+ * `applyAutoInherit` only spreads tools marked `autoInheritable: true`.
+ */
+function normalizeAutoInherit(value: AgentsPluginConfig["autoInheritTools"]): {
+  file: boolean;
+  code: boolean;
+} {
+  switch (typeof value) {
+    case "undefined":
+      return { file: false, code: false };
+    case "boolean":
+      return { file: value, code: value };
+    default: {
+      const { file, code } = value;
+      return { file: file ?? false, code: code ?? false };
+    }
+  }
+}
+
+/**
+ * Composes the system prompt for one agent run.
+ *
+ * The base prompt option is the agent's own `baseSystemPrompt` when it is
+ * defined, otherwise the plugin-level one. `false` yields an empty base, a
+ * string is used verbatim, a function is called with `ctx`, and anything
+ * else falls back to `buildBaseSystemPrompt(ctx.pluginNames)`. The base is
+ * then combined with the agent's instructions by `composeSystemPrompt`.
+ */
+function composePromptForAgent(
+  registered: RegisteredAgent,
+  pluginLevel: BaseSystemPromptOption | undefined,
+  ctx: PromptContext,
+): string {
+  const option =
+    registered.baseSystemPrompt !== undefined
+      ? registered.baseSystemPrompt
+      : pluginLevel;
+
+  let base: string;
+  switch (typeof option) {
+    case "string":
+      base = option;
+      break;
+    case "function":
+      base = option(ctx);
+      break;
+    default:
+      base = option === false ? "" : buildBaseSystemPrompt(ctx.pluginNames);
+  }
+
+  return composeSystemPrompt(base, registered.instructions);
+}
+
+/**
+ * Plugin factory for the agents plugin. Reads `config/agents/*.md` by default,
+ * resolves toolkits/tools from registered plugins, exposes `appkit.agents.*`
+ * runtime API and mounts `/invocations`.
+ *
+ * The plugin's router additionally serves `/chat`, `/cancel`, `/approve`,
+ * `/threads`, `/threads/:threadId` and `/info` (see `injectRoutes`).
+ *
+ * NOTE(review): the patch that adds this plugin also touches `src/beta.ts`;
+ * confirm which package entry point actually re-exports `agents` before
+ * relying on the import path in the example below.
+ *
+ * @example
+ * ```ts
+ * import { agents, analytics, createApp, server } from "@databricks/appkit";
+ *
+ * await createApp({
+ *   plugins: [server(), analytics(), agents()],
+ * });
+ * ```
+ */
+export const agents = toPlugin(AgentsPlugin);
diff --git a/packages/appkit/src/plugins/agents/defaults.ts b/packages/appkit/src/plugins/agents/defaults.ts
new file mode 100644
index 000000000..4da11bef4
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/defaults.ts
@@ -0,0 +1,12 @@
+import type { StreamExecutionSettings } from "shared";
+
+export const agentStreamDefaults: StreamExecutionSettings = {
+  default: {
+    cache: { enabled: false }, // caching is switched off for agent streams
+    retry: { enabled: false }, // automatic retry is switched off as well
+    timeout: 300_000, // presumably milliseconds (5 min) — TODO confirm
+  },
+  stream: {
+    bufferSize: 200, // NOTE(review): unit (events vs. bytes) not visible here
+  },
+};
diff --git a/packages/appkit/src/plugins/agents/event-channel.ts b/packages/appkit/src/plugins/agents/event-channel.ts
new file mode 100644
index 000000000..c5b60463a
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/event-channel.ts
@@ -0,0 +1,70 @@
+/**
+ * Async queue used by the agents plugin to merge SSE events from two
+ * concurrent sources into a single stream: the adapter's `run()` generator,
+ * and out-of-band events emitted by `executeTool` (e.g. human-approval
+ * requests).
+ *
+ * The consumer drains the channel as an async iterable; producers push
+ * events synchronously, and the channel is closed once the source has
+ * completed or errored.
+ */
+interface Waiter<T> {
+  resolve: (value: IteratorResult<T>) => void; // settles a pending `next()` with a value or `done`
+  reject: (error: unknown) => void; // fails a pending `next()` when the channel closes with an error
+}
+
+export class EventChannel<T> {
+  private queue: T[] = [];
+  private waiters: Array<Waiter<T>> = [];
+  private closed = false;
+  private error: unknown = undefined;
+
+  /** Synchronously enqueue an event; a no-op once the channel is closed. */
+  push(value: T): void {
+    if (this.closed) return;
+    const waiter = this.waiters.shift();
+    if (waiter) {
+      waiter.resolve({ value, done: false });
+    } else {
+      this.queue.push(value);
+    }
+  }
+
+  /**
+   * Close the channel; only the first call has any effect. Pending `next()`
+   * calls resolve with `done: true`, or reject with `error` when one is
+   * supplied. Values already buffered are still delivered before later
+   * `next()` calls observe the close. "Supplied" means `!== undefined`, so a
+   * falsy error such as `0`, `""` or `null` is propagated, not swallowed.
+   */
+  close(error?: unknown): void {
+    if (this.closed) return;
+    this.closed = true;
+    this.error = error;
+    for (const waiter of this.waiters.splice(0)) {
+      if (error !== undefined) {
+        waiter.reject(error);
+      } else {
+        waiter.resolve({ value: undefined as never, done: true });
+      }
+    }
+  }
+
+  [Symbol.asyncIterator](): AsyncIterator<T> {
+    return {
+      next: (): Promise<IteratorResult<T>> => {
+        if (this.queue.length > 0) {
+          const value = this.queue.shift() as T;
+          return Promise.resolve({ value, done: false });
+        }
+        if (this.closed) {
+          if (this.error !== undefined) return Promise.reject(this.error);
+          return Promise.resolve({ value: undefined as never, done: true });
+        }
+        return new Promise((resolve, reject) => {
+          this.waiters.push({ resolve, reject });
+        });
+      },
+    };
+  }
+}
diff --git a/packages/appkit/src/plugins/agents/event-translator.ts b/packages/appkit/src/plugins/agents/event-translator.ts
new file mode 100644
index 000000000..54d749fb0
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/event-translator.ts
@@ -0,0 +1,291 @@
+import { randomUUID } from "node:crypto";
+import type {
+  AgentEvent,
+  ResponseFunctionCallOutput,
+  ResponseFunctionToolCall,
+  ResponseOutputMessage,
+  ResponseStreamEvent,
+} from "shared";
+
+/**
+ * Translates internal `AgentEvent` stream into Responses API SSE events.
+ *
+ * Stateful: one instance per streaming request. Tracks sequence numbers and
+ * allocates `output_index` strictly monotonically — each emitted output
+ * item (message, function call, function call output) claims the next
+ * available index and, once claimed, never reuses an earlier one. This is a
+ * Responses-API contract that OpenAI's own SDK parsers enforce.
+ *
+ * A message is opened lazily on the first `message_delta` or `message`
+ * event. If a `tool_call` or `tool_result` arrives while a message is open
+ * (common ReAct flow: partial text → tool call → more text), the open
+ * message is closed (`response.output_item.done`) BEFORE the tool item is
+ * added, so subsequent text resumes as a new message item at a strictly
+ * later index.
+ */
+export class AgentEventTranslator {
+  private seqNum = 0; // next `sequence_number` to stamp on an emitted event
+  private nextOutputIndex = 0; // next unclaimed `output_index`
+  private currentMessage: {
+    id: string;
+    text: string;
+    outputIndex: number;
+  } | null = null;
+  private finalized = false;
+  /** Map one internal event to zero or more Responses-API SSE events. */
+  translate(event: AgentEvent): ResponseStreamEvent[] {
+    switch (event.type) {
+      case "message_delta":
+        return this.handleMessageDelta(event.content);
+      case "message":
+        return this.handleFullMessage(event.content);
+      case "tool_call":
+        return this.handleToolCall(event.callId, event.name, event.args);
+      case "tool_result":
+        return this.handleToolResult(event.callId, event.result, event.error);
+      case "thinking":
+        return [
+          {
+            type: "appkit.thinking",
+            content: event.content,
+            sequence_number: this.seqNum++,
+          },
+        ];
+      case "metadata":
+        return [
+          {
+            type: "appkit.metadata",
+            data: event.data,
+            sequence_number: this.seqNum++,
+          },
+        ];
+      case "approval_pending":
+        return [
+          {
+            type: "appkit.approval_pending",
+            approval_id: event.approvalId,
+            stream_id: event.streamId,
+            tool_name: event.toolName,
+            args: event.args,
+            annotations: event.annotations,
+            sequence_number: this.seqNum++,
+          },
+        ];
+      case "status":
+        return this.handleStatus(event.status, event.error);
+    }
+  }
+  /** Close any open message and emit `response.completed`; runs at most once. */
+  finalize(): ResponseStreamEvent[] {
+    if (this.finalized) return [];
+    this.finalized = true;
+
+    const events: ResponseStreamEvent[] = [];
+    const closeEvent = this.closeCurrentMessage();
+    if (closeEvent) events.push(closeEvent);
+
+    events.push({
+      type: "response.completed",
+      sequence_number: this.seqNum++,
+      response: {},
+    });
+
+    return events;
+  }
+  /** Append streamed text, lazily opening a message item on the first delta. */
+  private handleMessageDelta(content: string): ResponseStreamEvent[] {
+    const events: ResponseStreamEvent[] = [];
+
+    if (!this.currentMessage) {
+      const id = `msg_${randomUUID()}`;
+      const outputIndex = this.nextOutputIndex++;
+      this.currentMessage = { id, text: content, outputIndex };
+      const item: ResponseOutputMessage = {
+        type: "message",
+        id,
+        status: "in_progress",
+        role: "assistant",
+        content: [],
+      };
+      events.push({
+        type: "response.output_item.added",
+        output_index: outputIndex,
+        item,
+        sequence_number: this.seqNum++,
+      });
+    } else {
+      this.currentMessage.text += content;
+    }
+
+    events.push({
+      type: "response.output_text.delta",
+      item_id: this.currentMessage.id,
+      output_index: this.currentMessage.outputIndex,
+      content_index: 0,
+      delta: content,
+      sequence_number: this.seqNum++,
+    });
+
+    return events;
+  }
+  /** Emit a complete message: opens an item if none is open, then closes it. */
+  private handleFullMessage(content: string): ResponseStreamEvent[] {
+    const events: ResponseStreamEvent[] = [];
+
+    if (!this.currentMessage) {
+      // No prior deltas — open and immediately close.
+      const id = `msg_${randomUUID()}`;
+      const outputIndex = this.nextOutputIndex++;
+      this.currentMessage = { id, text: content, outputIndex };
+      const addedItem: ResponseOutputMessage = {
+        type: "message",
+        id,
+        status: "in_progress",
+        role: "assistant",
+        content: [],
+      };
+      events.push({
+        type: "response.output_item.added",
+        output_index: outputIndex,
+        item: addedItem,
+        sequence_number: this.seqNum++,
+      });
+    } else {
+      // Deltas already opened the item; `message` overrides the accumulated
+      // text (per adapter contract) and closes it.
+      this.currentMessage.text = content;
+    }
+
+    const closeEvent = this.closeCurrentMessage();
+    if (closeEvent) events.push(closeEvent);
+    return events;
+  }
+  /** Close any open message, then emit a `function_call` item (added + done). */
+  private handleToolCall(
+    callId: string,
+    name: string,
+    args: unknown,
+  ): ResponseStreamEvent[] {
+    const events: ResponseStreamEvent[] = [];
+    const closeEvent = this.closeCurrentMessage();
+    if (closeEvent) events.push(closeEvent);
+    // Absent args stringify to `undefined`; send "{}" so the field is a string.
+    const outputIndex = this.nextOutputIndex++;
+    const item: ResponseFunctionToolCall = {
+      type: "function_call",
+      id: `fc_${randomUUID()}`,
+      call_id: callId,
+      name,
+      arguments: typeof args === "string" ? args : JSON.stringify(args) ?? "{}",
+    };
+
+    events.push(
+      {
+        type: "response.output_item.added",
+        output_index: outputIndex,
+        item,
+        sequence_number: this.seqNum++,
+      },
+      {
+        type: "response.output_item.done",
+        output_index: outputIndex,
+        item,
+        sequence_number: this.seqNum++,
+      },
+    );
+    return events;
+  }
+  /** Close any open message, then emit a `function_call_output` item. */
+  private handleToolResult(
+    callId: string,
+    result: unknown,
+    error?: string,
+  ): ResponseStreamEvent[] {
+    const events: ResponseStreamEvent[] = [];
+    const closeEvent = this.closeCurrentMessage();
+    if (closeEvent) events.push(closeEvent);
+
+    const outputIndex = this.nextOutputIndex++;
+    // An `error` takes precedence over any result. The wire shape must
+    // always be a string (the Responses API contract): non-string results
+    // are JSON-serialised, and values `JSON.stringify` cannot represent
+    // (`undefined`, functions, symbols) are coalesced to "".
+    let output: string;
+    if (error !== undefined) {
+      output = error;
+    } else if (typeof result === "string") {
+      output = result;
+    } else {
+      output = JSON.stringify(result) ?? "";
+    }
+    const item: ResponseFunctionCallOutput = {
+      type: "function_call_output",
+      id: `fc_output_${randomUUID()}`,
+      call_id: callId,
+      output,
+    };
+
+    events.push(
+      {
+        type: "response.output_item.added",
+        output_index: outputIndex,
+        item,
+        sequence_number: this.seqNum++,
+      },
+      {
+        type: "response.output_item.done",
+        output_index: outputIndex,
+        item,
+        sequence_number: this.seqNum++,
+      },
+    );
+    return events;
+  }
+
+  /**
+   * Emit a `response.output_item.done` for the currently-open message, if
+   * any, and clear the state. Returns the event to the caller so it can be
+   * pushed at the right moment in the sequence. Returns `null` when there
+   * is no open message.
+   */
+  private closeCurrentMessage(): ResponseStreamEvent | null {
+    if (!this.currentMessage) return null;
+    const { id, text, outputIndex } = this.currentMessage;
+    this.currentMessage = null;
+    const doneItem: ResponseOutputMessage = {
+      type: "message",
+      id,
+      status: "completed",
+      role: "assistant",
+      content: [{ type: "output_text", text }],
+    };
+    return {
+      type: "response.output_item.done",
+      output_index: outputIndex,
+      item: doneItem,
+      sequence_number: this.seqNum++,
+    };
+  }
+  /** Translate a status: "error" → error + failed, "complete" → finalize(). */
+  private handleStatus(status: string, error?: string): ResponseStreamEvent[] {
+    if (status === "error") {
+      return [
+        {
+          type: "error",
+          error: error ?? "Unknown error",
+          sequence_number: this.seqNum++,
+        },
+        {
+          type: "response.failed",
+          sequence_number: this.seqNum++,
+        },
+      ];
+    }
+    // NOTE(review): error leaves `finalized` false; finalize() can still run.
+    if (status === "complete") {
+      return this.finalize();
+    }
+    // Every other status value produces no SSE output.
+    return [];
+  }
+}
diff --git a/packages/appkit/src/plugins/agents/index.ts b/packages/appkit/src/plugins/agents/index.ts
new file mode 100644
index 000000000..8220a55e7
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/index.ts
@@ -0,0 +1,22 @@
+export { AgentsPlugin, agents } from "./agents";
+export { buildToolkitEntries } from "../../core/agent/build-toolkit";
+export {
+  type LoadContext,
+  type LoadResult,
+  loadAgentFromFile,
+  loadAgentsFromDir,
+  parseFrontmatter,
+} from "../../core/agent/load-agents";
+export {
+  type AgentDefinition,
+  type AgentsPluginConfig,
+  type AgentTool,
+  type AutoInheritToolsConfig,
+  type BaseSystemPromptOption,
+  isToolkitEntry,
+  type PromptContext,
+  type RegisteredAgent,
+  type ResolvedToolEntry,
+  type ToolkitEntry,
+  type ToolkitOptions,
+} from "../../core/agent/types";
diff --git a/packages/appkit/src/plugins/agents/manifest.json b/packages/appkit/src/plugins/agents/manifest.json
new file mode 100644
index 000000000..cb7a43f8b
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/manifest.json
@@ -0,0 +1,10 @@
+{
+  "$schema": "https://databricks.github.io/appkit/schemas/plugin-manifest.schema.json",
+  "name": "agents",
+  "displayName": "Agents Plugin",
+  "description": "AI agents driven by markdown configs or code, with auto-tool-discovery from registered plugins",
+  "resources": {
+    "required": [],
+    "optional": []
+  }
+}
diff --git a/packages/appkit/src/plugins/agents/schemas.ts b/packages/appkit/src/plugins/agents/schemas.ts
new file mode 100644
index 000000000..cea6c6d64
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/schemas.ts
@@ -0,0 +1,69 @@
+import { z } from "zod";
+
+/**
+ * Static length cap for the `message` field on `POST /chat`. 64 000
+ * characters is well above any legitimate chat turn (~16k tokens at
+ * 4 chars/token) and bounds the per-request cost of appending to
+ * `InMemoryThreadStore` without requiring per-deployment configuration.
+ */
+const MAX_MESSAGE_CHARS = 64_000;
+
+/** Length cap applied to `/invocations` when `input` is a raw string. */
+const MAX_INVOCATIONS_INPUT_CHARS = 64_000;
+
+/**
+ * Cap on the number of items accepted in an `/invocations` `input` array
+ * (one element per seeded message). Protects against a single request
+ * seeding hundreds of messages into the thread store.
+ */
+const MAX_INVOCATIONS_INPUT_ITEMS = 100;
+
+/** Cap on the length of a message's `content` when it is a string. */
+const MAX_INVOCATIONS_ITEM_CHARS = 64_000;
+
+/** Cap on the number of elements when a message's `content` is an array. */
+const MAX_INVOCATIONS_ITEM_ARRAY_ITEMS = 100;
+
+export const chatRequestSchema = z.object({
+  message: z
+    .string()
+    .min(1, "message must not be empty")
+    .max(
+      MAX_MESSAGE_CHARS,
+      `message exceeds the ${MAX_MESSAGE_CHARS}-character limit`,
+    ),
+  threadId: z.string().optional(), // NOTE(review): presumably continues an existing thread when set — confirm
+  agent: z.string().optional(), // NOTE(review): presumably falls back to the default agent when omitted — confirm
+});
+
+const messageItemSchema = z.object({
+  role: z.enum(["user", "assistant", "system"]).optional(),
+  content: z
+    .union([
+      z.string().max(MAX_INVOCATIONS_ITEM_CHARS), // string form: capped by length
+      z.array(z.any()).max(MAX_INVOCATIONS_ITEM_ARRAY_ITEMS), // array form: capped by element count, elements unvalidated
+    ])
+    .optional(),
+  type: z.string().optional(),
+});
+
+export const invocationsRequestSchema = z.object({
+  input: z.union([
+    z.string().min(1).max(MAX_INVOCATIONS_INPUT_CHARS), // raw-string form
+    z
+      .array(messageItemSchema) // message-list form: between 1 and the item cap
+      .min(1)
+      .max(
+        MAX_INVOCATIONS_INPUT_ITEMS,
+        `input array exceeds the ${MAX_INVOCATIONS_INPUT_ITEMS}-item limit`,
+      ),
+  ]),
+  stream: z.boolean().optional().default(true), // parses to `true` when omitted
+  model: z.string().optional(),
+});
+
+export const approvalRequestSchema = z.object({
+  streamId: z.string().min(1, "streamId is required"), // must be non-empty
+  approvalId: z.string().min(1, "approvalId is required"), // must be non-empty
+  decision: z.enum(["approve", "deny"]), // the only two accepted decisions
+});
diff --git a/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts b/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
new file mode 100644
index 000000000..43ad8c104
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
@@ -0,0 +1,373 @@
+import fs from "node:fs";
+import os from "node:os";
+import path from "node:path";
+import type {
+  AgentAdapter,
+  AgentInput,
+  AgentRunContext,
+  AgentToolDefinition,
+  ToolProvider,
+} from "shared";
+import { afterEach, beforeEach, describe, expect, test, vi } from "vitest";
+import { z } from "zod";
+import { CacheManager } from "../../../cache";
+// Import the class directly so we can construct it without a createApp
+import { AgentsPlugin } from "../agents";
+import { buildToolkitEntries } from "../../../core/agent/build-toolkit";
+import { defineTool, type ToolRegistry } from "../../../core/agent/tools/define-tool";
+import type { AgentsPluginConfig, ToolkitEntry } from "../../../core/agent/types";
+import { isToolkitEntry } from "../../../core/agent/types";
+
+interface FakeContext {
+  providers: Array<{ name: string; provider: ToolProvider }>; // the same array getToolProviders() returns
+  getToolProviders(): Array<{ name: string; provider: ToolProvider }>;
+  getPluginNames(): string[];
+  addRoute(): void; // stubbed with vi.fn() by fakeContext
+  executeTool: (
+    req: unknown,
+    pluginName: string,
+    localName: string,
+    args: unknown,
+  ) => Promise<unknown>;
+}
+
+function fakeContext(
+  providers: Array<{ name: string; provider: ToolProvider }>,
+): FakeContext {
+  // `executeTool` echoes its routing arguments so tests can assert on them.
+  const executeTool: FakeContext["executeTool"] = vi.fn(
+    async (_req, plugin, tool, args) => ({ plugin, tool, args }),
+  );
+  return {
+    providers,
+    getToolProviders: () => providers,
+    getPluginNames: () => providers.map(({ name }) => name),
+    addRoute: vi.fn(),
+    executeTool,
+  };
+}
+
+function stubAdapter(): AgentAdapter {
+  return {
+    async *run(_input: AgentInput, _ctx: AgentRunContext) {
+      yield { type: "message_delta", content: "" }; // a single empty delta, then the stream ends
+    },
+  };
+}
+
+function makeToolProvider(
+  pluginName: string,
+  registry: ToolRegistry,
+): ToolProvider & {
+  toolkit: (opts?: unknown) => Record<string, ToolkitEntry>;
+} {
+  const describeTools = (): AgentToolDefinition[] =>
+    Object.entries(registry).map(([toolName, tool]) => ({
+      name: toolName,
+      description: tool.description,
+      parameters: { type: "object", properties: {} },
+    }));
+  return {
+    getAgentTools: describeTools, // one stub-schema definition per registry entry
+    executeAgentTool: async (name, args) => {
+      return { callFrom: pluginName, name, args }; // echo the call for assertions
+    },
+    toolkit: (opts) => buildToolkitEntries(pluginName, registry, opts as never),
+  };
+}
+
+let tmpDir: string; // scratch directory created per test and removed in afterEach
+
+beforeEach(async () => {
+  tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), "agents-plugin-"));
+  const storage = {
+    get: vi.fn(),
+    set: vi.fn(),
+    delete: vi.fn(),
+    keys: vi.fn(),
+    healthCheck: vi.fn(async () => true), // always reports healthy
+    close: vi.fn(async () => {}),
+  };
+  // biome-ignore lint/suspicious/noExplicitAny: test-only CacheManager wiring
+  await CacheManager.getInstance({ storage: storage as any });
+});
+
+afterEach(() => {
+  fs.rmSync(tmpDir, { recursive: true, force: true }); // `force` tolerates an already-missing directory
+});
+
+function instantiate(config: AgentsPluginConfig, ctx?: FakeContext) {
+  const plugin = new AgentsPlugin({ ...config, name: "agent" }); // built directly, without createApp
+  plugin.attachContext({ context: ctx as unknown as object }); // `ctx` may be undefined for tests that need no providers
+  return plugin;
+}
+
+describe("AgentsPlugin", () => {
+  test("registers code-defined agents and exposes them via exports", async () => {
+    const plugin = instantiate({
+      dir: false,
+      agents: {
+        support: {
+          instructions: "You help customers.",
+          model: stubAdapter(),
+        },
+      },
+    });
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      list: () => string[];
+      getDefault: () => string | null;
+    };
+    expect(api.list()).toEqual(["support"]);
+    expect(api.getDefault()).toBe("support"); // the only registered agent is also the default
+  });
+
+  test("loads markdown agents from a directory", async () => {
+    fs.writeFileSync(
+      path.join(tmpDir, "assistant.md"),
+      "---\ndefault: true\n---\nYou are helpful.",
+      "utf-8",
+    );
+    const plugin = instantiate({
+      dir: tmpDir,
+      defaultModel: stubAdapter(),
+    });
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      list: () => string[];
+      getDefault: () => string | null;
+    };
+    expect(api.list()).toEqual(["assistant"]); // agent name comes from the file name
+    expect(api.getDefault()).toBe("assistant");
+  });
+
+  test("code definitions override markdown on key collision", async () => {
+    fs.writeFileSync(
+      path.join(tmpDir, "support.md"),
+      "---\n---\nFrom markdown.",
+      "utf-8",
+    );
+    const plugin = instantiate({
+      dir: tmpDir,
+      defaultModel: stubAdapter(),
+      agents: {
+        support: {
+          instructions: "From code",
+          model: stubAdapter(),
+        },
+      },
+    });
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      get: (name: string) => { instructions: string } | null;
+    };
+    expect(api.get("support")?.instructions).toBe("From code"); // the code definition wins
+  });
+
+  test("auto-inherit default is safe (both file and code get nothing without an explicit opt-in)", async () => {
+    const registry: ToolRegistry = {
+      query: defineTool({
+        description: "q",
+        schema: z.object({ sql: z.string() }),
+        autoInheritable: true, // even with autoInheritable, no spread without opt-in
+        handler: () => "ok",
+      }),
+    };
+    const provider = makeToolProvider("analytics", registry);
+    const ctx = fakeContext([{ name: "analytics", provider }]);
+
+    fs.writeFileSync(
+      path.join(tmpDir, "assistant.md"),
+      "---\n---\nYou are helpful.",
+      "utf-8",
+    );
+
+    const plugin = instantiate(
+      {
+        dir: tmpDir,
+        defaultModel: stubAdapter(),
+        agents: {
+          manual: {
+            instructions: "Manual agent",
+            model: stubAdapter(),
+          },
+        },
+      },
+      ctx,
+    );
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+    };
+    const fileAgent = api.get("assistant");
+    const codeAgent = api.get("manual");
+    // Neither origin picked up the autoInheritable tool.
+    expect(fileAgent?.toolIndex.size).toBe(0);
+    expect(codeAgent?.toolIndex.size).toBe(0);
+  });
+
+  test("opting in with autoInheritTools: { file: true } spreads only autoInheritable tools", async () => {
+    const registry: ToolRegistry = {
+      query: defineTool({
+        description: "read-only query",
+        schema: z.object({ sql: z.string() }),
+        autoInheritable: true,
+        handler: () => "ok",
+      }),
+      destructive: defineTool({
+        description: "mutation",
+        schema: z.object({}),
+        // autoInheritable left unset → skipped even when opted in
+        handler: () => "ok",
+      }),
+    };
+    const provider = makeToolProvider("analytics", registry);
+    const ctx = fakeContext([{ name: "analytics", provider }]);
+
+    fs.writeFileSync(
+      path.join(tmpDir, "assistant.md"),
+      "---\n---\nYou are helpful.",
+      "utf-8",
+    );
+
+    const plugin = instantiate(
+      {
+        dir: tmpDir,
+        defaultModel: stubAdapter(),
+        autoInheritTools: { file: true },
+      },
+      ctx,
+    );
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+    };
+    const fileAgent = api.get("assistant");
+    const keys = Array.from(fileAgent?.toolIndex.keys() ?? []);
+    expect(keys).toEqual(["analytics.query"]); // `destructive` is filtered out
+  });
+
+  test("autoInheritTools: true enables both origins but still filters by autoInheritable", async () => {
+    const registry: ToolRegistry = {
+      safe: defineTool({
+        description: "safe",
+        schema: z.object({}),
+        autoInheritable: true,
+        handler: () => "ok",
+      }),
+      unsafe: defineTool({
+        description: "unsafe",
+        schema: z.object({}),
+        handler: () => "ok",
+      }),
+    };
+    const provider = makeToolProvider("p", registry);
+    const ctx = fakeContext([{ name: "p", provider }]);
+
+    const plugin = instantiate(
+      {
+        dir: false,
+        defaultModel: stubAdapter(),
+        autoInheritTools: true,
+        agents: {
+          code1: {
+            instructions: "code agent",
+            model: stubAdapter(),
+          },
+        },
+      },
+      ctx,
+    );
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+    };
+    const codeAgent = api.get("code1");
+    const keys = Array.from(codeAgent?.toolIndex.keys() ?? []);
+    expect(keys).toEqual(["p.safe"]); // `unsafe` never set autoInheritable
+  });
+
+  test("file-loaded agent respects explicit toolkits (skips auto-inherit)", async () => {
+    const registry: ToolRegistry = {
+      query: defineTool({
+        description: "q",
+        schema: z.object({ sql: z.string() }),
+        handler: () => "ok",
+      }),
+    };
+    const registry2: ToolRegistry = {
+      list: defineTool({
+        description: "l",
+        schema: z.object({}),
+        handler: () => [],
+      }),
+    };
+    const ctx = fakeContext([
+      { name: "analytics", provider: makeToolProvider("analytics", registry) },
+      { name: "files", provider: makeToolProvider("files", registry2) },
+    ]);
+
+    fs.writeFileSync(
+      path.join(tmpDir, "analyst.md"),
+      "---\ntoolkits: [analytics]\n---\nAnalyst.",
+      "utf-8",
+    );
+
+    const plugin = instantiate(
+      { dir: tmpDir, defaultModel: stubAdapter() },
+      ctx,
+    );
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+    };
+    const agent = api.get("analyst");
+    const toolNames = Array.from(agent?.toolIndex.keys() ?? []);
+    expect(toolNames.some((n) => n.startsWith("analytics."))).toBe(true);
+    expect(toolNames.some((n) => n.startsWith("files."))).toBe(false); // `files` was not listed under `toolkits`
+  });
+
+  test("registers sub-agents as agent-<key> tools", async () => {
+    const plugin = instantiate({
+      dir: false,
+      agents: {
+        supervisor: {
+          instructions: "Supervise",
+          model: stubAdapter(),
+          agents: {
+            worker: {
+              instructions: "Work",
+              model: stubAdapter(),
+            },
+          },
+        },
+      },
+    });
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+    };
+    const sup = api.get("supervisor");
+    expect(sup?.toolIndex.has("agent-worker")).toBe(true); // sub-agent key "worker" surfaces as tool "agent-worker"
+  });
+
+  test("isToolkitEntry type guard recognizes toolkit entries", () => {
+    const entry: ToolkitEntry = {
+      __toolkitRef: true,
+      pluginName: "x",
+      localName: "y",
+      def: { name: "x.y", description: "", parameters: { type: "object" } },
+    };
+    expect(isToolkitEntry(entry)).toBe(true);
+    expect(isToolkitEntry({ foo: 1 })).toBe(false);
+    expect(isToolkitEntry(null)).toBe(false);
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/approval-route.test.ts b/packages/appkit/src/plugins/agents/tests/approval-route.test.ts
new file mode 100644
index 000000000..6e090bd2f
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/approval-route.test.ts
@@ -0,0 +1,292 @@
+import type express from "express";
+import { beforeEach, describe, expect, test, vi } from "vitest";
+import { CacheManager } from "../../../cache";
+import { AgentsPlugin } from "../agents";
+
+/**
+ * Focused tests for the `POST /approve` route and the associated
+ * ownership / error paths on `_handleApprove`. Covers:
+ *
+ *   - Schema validation of the request body.
+ *   - Ownership check: the user submitting the decision must be the same
+ *     user who initiated the underlying chat stream.
+ *   - 404 for unknown stream (already completed or never existed).
+ *   - 404 for unknown approvalId even when the stream is active.
+ *   - Happy-path resolution of a pending gate with `approve` and `deny`.
+ *   - Cancel of an active stream denies every pending gate on that stream.
+ */
+
+function mockReq(body: unknown, userId?: string): express.Request {
+  // The forwarded identity headers are only attached when a user id is
+  // given; without one the request carries no headers at all.
+  const headers: Record<string, string> = userId
+    ? {
+        "x-forwarded-user": userId,
+        "x-forwarded-access-token": "fake-token",
+      }
+    : {};
+  const header = (name: string) => headers[name.toLowerCase()];
+  return { body, headers, header } as unknown as express.Request;
+}
+
+function mockRes() {
+  let lastStatus = 200; // reported through the `statusCode` getter below
+  const json = vi.fn();
+  const end = vi.fn();
+  const status = vi.fn((code: number) => {
+    lastStatus = code;
+    return { json, end };
+  });
+  return {
+    res: { status, json, end } as unknown as express.Response,
+    get statusCode() {
+      return lastStatus;
+    },
+    json,
+  };
+}
+
+beforeEach(() => {
+  CacheManager.getInstanceSync = vi.fn(() => ({
+    get: vi.fn(),
+    set: vi.fn(),
+    delete: vi.fn(),
+    getOrExecute: vi.fn(async (_k: unknown[], fn: () => Promise<unknown>) =>
+      fn(), // no caching: always run the loader
+    ),
+    generateKey: vi.fn(() => "test-key"),
+  })) as any; // overwrites the static accessor with a stub cache
+  process.env.NODE_ENV = "development"; // NOTE(review): not restored afterwards — confirm this is intended
+});
+
+describe("POST /approve route handler", () => {
+  test("rejects invalid body shape with 400", async () => {
+    const plugin = new AgentsPlugin({ dir: false });
+    const { res, json } = mockRes();
+    await (plugin as any)._handleApprove(mockReq({}, "alice"), res);
+    expect(res.status).toHaveBeenCalledWith(400);
+    expect(json).toHaveBeenCalledWith(
+      expect.objectContaining({ error: "Invalid request" }),
+    );
+  });
+
+  test("returns 404 when the streamId is unknown", async () => {
+    const plugin = new AgentsPlugin({ dir: false });
+    const { res, json } = mockRes();
+    await (
+      plugin as unknown as {
+        _handleApprove: (
+          r: express.Request,
+          w: express.Response,
+        ) => Promise<void>;
+      }
+    )._handleApprove(
+      mockReq(
+        { streamId: "ghost", approvalId: "a1", decision: "approve" },
+        "alice",
+      ),
+      res,
+    );
+    expect(res.status).toHaveBeenCalledWith(404);
+    expect(json).toHaveBeenCalledWith(
+      expect.objectContaining({ error: expect.stringMatching(/not found/i) }),
+    );
+  });
+
+  test("returns 403 when submitter is different from stream owner", async () => {
+    const plugin = new AgentsPlugin({ dir: false });
+    (plugin as any).activeStreams.set("stream-x", {
+      controller: new AbortController(),
+      userId: "alice",
+    });
+    const gate = (plugin as any).approvalGate;
+    const waiter = gate.wait({
+      approvalId: "a1",
+      streamId: "stream-x",
+      userId: "alice",
+      timeoutMs: 60_000,
+    });
+
+    const { res, json } = mockRes();
+    await (
+      plugin as unknown as {
+        _handleApprove: (
+          r: express.Request,
+          w: express.Response,
+        ) => Promise<void>;
+      }
+    )._handleApprove(
+      mockReq(
+        { streamId: "stream-x", approvalId: "a1", decision: "approve" },
+        "bob",
+      ),
+      res,
+    );
+    expect(res.status).toHaveBeenCalledWith(403);
+    expect(json).toHaveBeenCalledWith(
+      expect.objectContaining({ error: "Forbidden" }),
+    );
+
+    // Settle the waiter to clean up.
+    gate.submit({ approvalId: "a1", userId: "alice", decision: "deny" });
+    await expect(waiter).resolves.toBe("deny");
+  });
+
+  test("returns 404 when approvalId is unknown on an active stream", async () => {
+    const plugin = new AgentsPlugin({ dir: false });
+    (plugin as any).activeStreams.set("stream-y", {
+      controller: new AbortController(),
+      userId: "alice",
+    });
+    const { res, json } = mockRes();
+    await (
+      plugin as unknown as {
+        _handleApprove: (
+          r: express.Request,
+          w: express.Response,
+        ) => Promise<void>;
+      }
+    )._handleApprove(
+      mockReq(
+        { streamId: "stream-y", approvalId: "unknown-a", decision: "approve" },
+        "alice",
+      ),
+      res,
+    );
+    expect(res.status).toHaveBeenCalledWith(404);
+    expect(json).toHaveBeenCalledWith(
+      expect.objectContaining({
+        error: expect.stringMatching(/not found|already settled/i),
+      }),
+    );
+  });
+
+  test("happy path: approve resolves pending gate with 'approve'", async () => {
+    const plugin = new AgentsPlugin({ dir: false });
+    (plugin as any).activeStreams.set("stream-z", {
+      controller: new AbortController(),
+      userId: "alice",
+    });
+    // Park an approval on the gate for alice's stream; the route call below
+    // is expected to settle it.
+    const pending = (plugin as any).approvalGate.wait({
+      approvalId: "a42",
+      streamId: "stream-z",
+      userId: "alice",
+      timeoutMs: 60_000,
+    });
+
+    const { res, json } = mockRes();
+    const route = plugin as unknown as {
+      _handleApprove: (
+        r: express.Request,
+        w: express.Response,
+      ) => Promise<void>;
+    };
+    const request = mockReq(
+      { streamId: "stream-z", approvalId: "a42", decision: "approve" },
+      "alice",
+    );
+    await route._handleApprove(request, res);
+
+    // status() untouched means the handler set no explicit status code.
+    expect(res.status).not.toHaveBeenCalled();
+    expect(json).toHaveBeenCalledWith({ decision: "approve" });
+    await expect(pending).resolves.toBe("approve");
+  });
+
+  test("happy path: deny resolves pending gate with 'deny'", async () => {
+    const plugin = new AgentsPlugin({ dir: false });
+    (plugin as any).activeStreams.set("stream-z", {
+      controller: new AbortController(),
+      userId: "alice",
+    });
+    // Park an approval for alice that the deny submission should settle.
+    const waiter = (plugin as any).approvalGate.wait({
+      approvalId: "a43",
+      streamId: "stream-z",
+      userId: "alice",
+      timeoutMs: 60_000,
+    });
+
+    const { res, json } = mockRes();
+    const route = plugin as unknown as {
+      _handleApprove: (
+        r: express.Request,
+        w: express.Response,
+      ) => Promise<void>;
+    };
+    const request = mockReq(
+      { streamId: "stream-z", approvalId: "a43", decision: "deny" },
+      "alice",
+    );
+    await route._handleApprove(request, res);
+
+    // Mirror the approve test: a deny must not set an explicit status code.
+    expect(res.status).not.toHaveBeenCalled();
+    expect(json).toHaveBeenCalledWith({ decision: "deny" });
+    await expect(waiter).resolves.toBe("deny");
+  });
+});
+
+describe("POST /cancel ownership + gate cleanup", () => {
+  // Structural view of the plugin used to invoke `_handleCancel` directly,
+  // without going through an HTTP router.
+  type CancelRoute = {
+    _handleCancel: (r: express.Request, w: express.Response) => Promise<void>;
+  };
+
+  test("cancelling a stream denies every pending approval on that stream", async () => {
+    const plugin = new AgentsPlugin({ dir: false });
+    const controller = new AbortController();
+    (plugin as any).activeStreams.set("stream-c", {
+      controller,
+      userId: "alice",
+    });
+    // Park two approvals on the same stream; a single cancel must settle
+    // both of them.
+    const gate = (plugin as any).approvalGate;
+    const first = gate.wait({
+      approvalId: "ca1",
+      streamId: "stream-c",
+      userId: "alice",
+      timeoutMs: 60_000,
+    });
+    const second = gate.wait({
+      approvalId: "ca2",
+      streamId: "stream-c",
+      userId: "alice",
+      timeoutMs: 60_000,
+    });
+
+    const { res, json } = mockRes();
+    const request = mockReq({ streamId: "stream-c" }, "alice");
+    await (plugin as unknown as CancelRoute)._handleCancel(request, res);
+
+    // The stream's controller is aborted and both waiters resolve as denied.
+    expect(controller.signal.aborted).toBe(true);
+    expect(json).toHaveBeenCalledWith({ cancelled: true });
+    await expect(first).resolves.toBe("deny");
+    await expect(second).resolves.toBe("deny");
+  });
+
+  test("cancel from a different user is refused with 403", async () => {
+    const plugin = new AgentsPlugin({ dir: false });
+    const controller = new AbortController();
+    (plugin as any).activeStreams.set("stream-d", {
+      controller,
+      userId: "alice",
+    });
+
+    // bob is not the owner recorded on the stream entry above, so the cancel
+    // must be refused and the controller left untouched.
+    const { res, json } = mockRes();
+    const request = mockReq({ streamId: "stream-d" }, "bob");
+    await (plugin as unknown as CancelRoute)._handleCancel(request, res);
+
+    const forbidden = expect.objectContaining({ error: "Forbidden" });
+    expect(res.status).toHaveBeenCalledWith(403);
+    expect(controller.signal.aborted).toBe(false);
+    expect(json).toHaveBeenCalledWith(forbidden);
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/dos-limits.test.ts b/packages/appkit/src/plugins/agents/tests/dos-limits.test.ts
new file mode 100644
index 000000000..935fa2403
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/dos-limits.test.ts
@@ -0,0 +1,299 @@
+import type express from "express";
+import { beforeEach, describe, expect, test, vi } from "vitest";
+import { CacheManager } from "../../../cache";
+import { AgentsPlugin } from "../agents";
+import { chatRequestSchema, invocationsRequestSchema } from "../schemas";
+
+/**
+ * Exercises the four DoS caps landed for MVP:
+ *
+ *   - `chatRequestSchema.message.max(64_000)` — body cap on `POST /chat`.
+ *   - Per-user `maxConcurrentStreamsPerUser` — 429 with Retry-After.
+ *   - Per-run `maxToolCalls` — aborts stream and throws in `executeTool`.
+ *   - Per-delegation `maxSubAgentDepth` — rejects in `runSubAgent`.
+ *
+ * Route-level tests exercise the schemas + `_handleChat` directly via the
+ * mocked req/res pattern already used by approval-route.test.ts.
+ */
+
+/**
+ * Builds a minimal `express.Request` stand-in carrying `body`. When `userId`
+ * is truthy, the `x-forwarded-user` and `x-forwarded-access-token` headers
+ * are populated; `header()` lower-cases the requested name before lookup.
+ */
+function mockReq(body: unknown, userId?: string): express.Request {
+  const headers: Record<string, string> = userId
+    ? { "x-forwarded-user": userId, "x-forwarded-access-token": "fake-token" }
+    : {};
+  const header = (name: string) => headers[name.toLowerCase()];
+  return { body, headers, header } as unknown as express.Request;
+}
+
+function mockRes() {
+  let lastStatus = 200; // what `statusCode` reports until res.status() runs
+  const setHeader = vi.fn();
+  const json = vi.fn();
+  const status = vi.fn((code: number) => {
+    lastStatus = code; // remember the most recent code for the getter below
+    return { json }; // lets callers chain res.status(code).json(body)
+  });
+  return {
+    res: { status, json, setHeader } as unknown as express.Response,
+    get statusCode() {
+      return lastStatus;
+    },
+    json,
+    setHeader,
+  };
+}
+
+beforeEach(() => {
+  process.env.NODE_ENV = "development"; // process-wide; this file never resets it
+  CacheManager.getInstanceSync = vi.fn(() => ({
+    generateKey: vi.fn(() => "test-key"),
+    getOrExecute: vi.fn(async (_key: unknown[], run: () => Promise<unknown>) =>
+      run(),
+    ),
+    get: vi.fn(),
+    set: vi.fn(),
+    delete: vi.fn(),
+    // biome-ignore lint/suspicious/noExplicitAny: test mock
+  })) as any;
+});
+
+describe("chatRequestSchema — body cap", () => {
+  // Parses a body whose `message` is "a" repeated `length` times.
+  const parseMessageOfLength = (length: number) =>
+    chatRequestSchema.safeParse({ message: "a".repeat(length) });
+
+  test("accepts messages up to 64_000 characters", () => {
+    expect(parseMessageOfLength(64_000).success).toBe(true);
+  });
+
+  test("rejects messages over 64_000 characters", () => {
+    const result = parseMessageOfLength(64_001);
+    expect(result.success).toBe(false);
+    if (!result.success) {
+      const flattened = JSON.stringify(result.error.flatten());
+      expect(flattened).toMatch(/64000/);
+    }
+  });
+
+  test("rejects empty message (existing contract)", () => {
+    expect(parseMessageOfLength(0).success).toBe(false);
+  });
+});
+
+describe("invocationsRequestSchema — input caps", () => {
+  // True when the schema accepts a request whose `input` is the given value.
+  const accepts = (input: unknown): boolean =>
+    invocationsRequestSchema.safeParse({ input }).success;
+
+  // Builds `count` user messages with short distinct contents: "m0", "m1", …
+  const userMessages = (count: number) =>
+    Array.from({ length: count }, (_, i) => ({
+      role: "user" as const,
+      content: `m${i}`,
+    }));
+
+  test("accepts string input up to 64_000 characters", () => {
+    // Boundary value: exactly 64_000 characters.
+    const atCap = "a".repeat(64_000);
+    expect(accepts(atCap)).toBe(true);
+  });
+
+  test("rejects string input over 64_000 characters", () => {
+    // One character past the cap.
+    const overCap = "a".repeat(64_001);
+    expect(accepts(overCap)).toBe(false);
+  });
+
+  test("accepts array input up to 100 items", () => {
+    // Boundary value: exactly 100 items.
+    const atCap = userMessages(100);
+    expect(accepts(atCap)).toBe(true);
+  });
+
+  test("rejects array input over 100 items", () => {
+    const overCap = userMessages(101);
+    expect(accepts(overCap)).toBe(false);
+  });
+
+  test("rejects per-item content over 64_000 characters", () => {
+    // One item only, so the 100-item array cap is not what rejects it.
+    const oversizedItem = { role: "user", content: "a".repeat(64_001) };
+    expect(accepts([oversizedItem])).toBe(false);
+  });
+});
+
+describe("POST /chat — per-user concurrent-stream limit", () => {
+  // Structural view of the plugin used to invoke `_handleChat` directly,
+  // without going through an HTTP router.
+  type ChatRoute = {
+    _handleChat: (r: express.Request, w: express.Response) => Promise<void>;
+  };
+
+  // Builds a plugin that has a hand-registered default agent named "hello".
+  function seedPlugin(
+    overrides: ConstructorParameters<typeof AgentsPlugin>[0] = { dir: false },
+  ): AgentsPlugin {
+    const plugin = new AgentsPlugin(overrides);
+    // Seed the agents map and the default agent name by hand so that
+    // _handleChat can resolve "hello" without running setup() (which would
+    // require a live model).
+    // biome-ignore lint/suspicious/noExplicitAny: seeding private state
+    const internals = plugin as any;
+    internals.agents.set("hello", {
+      name: "hello",
+      instructions: "hi",
+      adapter: { async *run() {} },
+      toolIndex: new Map(),
+    });
+    internals.defaultAgentName = "hello";
+    return plugin;
+  }
+
+  // Marks `count` streams ("s0", "s1", …) as active and owned by `userId`,
+  // each with its own AbortController.
+  function occupyStreams(plugin: AgentsPlugin, count: number, userId: string) {
+    for (let i = 0; i < count; i++) {
+      // biome-ignore lint/suspicious/noExplicitAny: seeding
+      (plugin as any).activeStreams.set(`s${i}`, {
+        controller: new AbortController(),
+        userId,
+      });
+    }
+  }
+
+  test("rejects with 429 + Retry-After when user is at-limit (default 5)", async () => {
+    // alice already holds five active streams, the default cap named in
+    // this test's title.
+    const plugin = seedPlugin();
+    occupyStreams(plugin, 5, "alice");
+
+    const { res, setHeader, json } = mockRes();
+    const request = mockReq({ message: "hi" }, "alice");
+    const route = plugin as unknown as ChatRoute;
+    await route._handleChat(request, res);
+
+    const tooManyStreams = expect.objectContaining({
+      error: expect.stringMatching(/Too many concurrent streams/),
+    });
+    expect(res.status).toHaveBeenCalledWith(429);
+    expect(setHeader).toHaveBeenCalledWith("Retry-After", "5");
+    expect(json).toHaveBeenCalledWith(tooManyStreams);
+  });
+
+  test("does not reject when another user is at-limit (per-user, not global)", async () => {
+    // Fill alice's quota only; carol has no active streams of her own.
+    const plugin = seedPlugin();
+    occupyStreams(plugin, 5, "alice");
+
+    // Carol's request must not see a 429 even though alice is at-limit.
+    // Don't bother running the full stream — we assert only that 429 is
+    // not the response status.
+    const { res } = mockRes();
+    // biome-ignore lint/suspicious/noExplicitAny: stub _streamAgent to avoid needing a real adapter
+    (plugin as any)._streamAgent = vi.fn(async () => undefined);
+
+    const request = mockReq({ message: "hi" }, "carol");
+    const route = plugin as unknown as ChatRoute;
+    await route._handleChat(request, res);
+
+    expect(res.status).not.toHaveBeenCalledWith(429);
+  });
+
+  test("honours agents({ limits: { maxConcurrentStreamsPerUser } })", async () => {
+    // The cap is lowered to 2 through config, so two active streams already
+    // put alice at the limit.
+    const plugin = seedPlugin({
+      dir: false,
+      limits: { maxConcurrentStreamsPerUser: 2 },
+    });
+    occupyStreams(plugin, 2, "alice");
+
+    const { res } = mockRes();
+    const request = mockReq({ message: "hi" }, "alice");
+    const route = plugin as unknown as ChatRoute;
+    await route._handleChat(request, res);
+
+    expect(res.status).toHaveBeenCalledWith(429);
+  });
+});
+
+describe("resolvedLimits — default values", () => {
+  // Constructs a plugin from `config` and reads back its `resolvedLimits`.
+  function limitsFor(config: ConstructorParameters<typeof AgentsPlugin>[0]) {
+    // biome-ignore lint/suspicious/noExplicitAny: read private getter
+    return (new AgentsPlugin(config) as any).resolvedLimits;
+  }
+
+  test("exposes the documented MVP defaults when unconfigured", () => {
+    expect(limitsFor({ dir: false })).toEqual({
+      maxConcurrentStreamsPerUser: 5,
+      maxToolCalls: 50,
+      maxSubAgentDepth: 3,
+    });
+  });
+
+  test("lets callers override any subset", () => {
+    const limits = limitsFor({ dir: false, limits: { maxToolCalls: 100 } });
+
+    // Only maxToolCalls was overridden; the other two keep their defaults.
+    expect(limits.maxToolCalls).toBe(100);
+    expect(limits.maxConcurrentStreamsPerUser).toBe(5);
+    expect(limits.maxSubAgentDepth).toBe(3);
+  });
+});
+
+describe("runSubAgent — depth guard", () => {
+  test("rejects when depth exceeds the configured maximum", async () => {
+    const plugin = new AgentsPlugin({
+      dir: false,
+      limits: { maxSubAgentDepth: 2 },
+    });
+    // biome-ignore lint/suspicious/noExplicitAny: call private method directly
+    const internals = plugin as any;
+    const attempt = internals.runSubAgent(
+      mockReq({}, "alice"),
+      { name: "child", toolIndex: new Map() },
+      {},
+      new AbortController().signal,
+      3, // exceeds limit 2
+    );
+    const depthExceeded = /Sub-agent depth exceeded \(limit 2\)/;
+    await expect(attempt).rejects.toThrow(depthExceeded);
+  });
+
+  test("accepts at the boundary (depth === limit)", async () => {
+    const plugin = new AgentsPlugin({
+      dir: false,
+      limits: { maxSubAgentDepth: 3 },
+      agents: {},
+    });
+
+    // Stub child agent whose adapter yields a single message, so no real
+    // model is needed.
+    const child = {
+      name: "child",
+      instructions: "test",
+      adapter: {
+        // biome-ignore lint/suspicious/noExplicitAny: adapter shape not under test
+        async *run(): any {
+          yield { type: "message", content: "hello from depth-3" };
+        },
+      },
+      toolIndex: new Map(),
+    };
+
+    // biome-ignore lint/suspicious/noExplicitAny: call private
+    const result = await (plugin as any).runSubAgent(
+      mockReq({}, "alice"),
+      child,
+      { input: "test" },
+      new AbortController().signal,
+      3, // at the limit, not over
+    );
+    expect(result).toBe("hello from depth-3");
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/event-channel.test.ts b/packages/appkit/src/plugins/agents/tests/event-channel.test.ts
new file mode 100644
index 000000000..d80d788de
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/event-channel.test.ts
@@ -0,0 +1,78 @@
+import { describe, expect, test } from "vitest";
+import { EventChannel } from "../event-channel";
+
+async function collect<T>(ch: EventChannel<T>): Promise<T[]> {
+  const drained: T[] = []; // everything `ch` yields, in arrival order
+  for await (const value of ch) drained.push(value);
+  return drained;
+}
+
+describe("EventChannel", () => {
+  // Resolves after `ms` milliseconds, letting a pending reader run meanwhile.
+  const pause = (ms: number) => new Promise((r) => setTimeout(r, ms));
+
+  test("yields pushed values in order", async () => {
+    const ch = new EventChannel<number>();
+    const drained = collect(ch);
+    for (const n of [1, 2, 3]) ch.push(n);
+    ch.close();
+    await expect(drained).resolves.toEqual([1, 2, 3]);
+  });
+
+  test("pushes before iteration start are buffered", async () => {
+    const ch = new EventChannel<string>();
+    for (const s of ["a", "b"]) ch.push(s);
+    ch.close();
+    await expect(collect(ch)).resolves.toEqual(["a", "b"]);
+  });
+
+  test("waiting iterator is unblocked by subsequent push", async () => {
+    const ch = new EventChannel<number>();
+    const drained = collect(ch);
+    await pause(5);
+    ch.push(42);
+    ch.close();
+    await expect(drained).resolves.toEqual([42]);
+  });
+
+  test("close with no pending values terminates iteration", async () => {
+    const ch = new EventChannel<number>();
+    const drained = collect(ch);
+    ch.close();
+    await expect(drained).resolves.toEqual([]);
+  });
+
+  test("push after close is a no-op (channel is closed)", async () => {
+    const ch = new EventChannel<number>();
+    ch.close();
+    ch.push(1);
+    await expect(collect(ch)).resolves.toEqual([]);
+  });
+
+  test("close with error rejects the waiting iterator", async () => {
+    const ch = new EventChannel<number>();
+    const drained = collect(ch);
+    await pause(5);
+    ch.close(new Error("boom"));
+    await expect(drained).rejects.toThrow(/boom/);
+  });
+
+  test("interleaved pushes and reads stream through", async () => {
+    const ch = new EventChannel<number>();
+    const received: number[] = [];
+    const reader = (async () => {
+      for await (const v of ch) {
+        received.push(v);
+        if (received.length === 3) break;
+      }
+    })();
+    ch.push(1);
+    await pause(0);
+    ch.push(2);
+    await pause(0);
+    ch.push(3);
+    await reader;
+    expect(received).toEqual([1, 2, 3]);
+    ch.close();
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/event-translator.test.ts b/packages/appkit/src/plugins/agents/tests/event-translator.test.ts
new file mode 100644
index 000000000..050af001a
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/event-translator.test.ts
@@ -0,0 +1,332 @@
+import type { ResponseStreamEvent } from "shared";
+import { describe, expect, test } from "vitest";
+import { AgentEventTranslator } from "../event-translator";
+
+describe("AgentEventTranslator", () => {
+  test("translates message_delta to output_item.added + output_text.delta on first delta", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "message_delta",
+      content: "Hello",
+    });
+
+    expect(events).toHaveLength(2);
+    expect(events[0].type).toBe("response.output_item.added");
+    expect(events[1].type).toBe("response.output_text.delta");
+
+    if (events[1].type === "response.output_text.delta") {
+      expect(events[1].delta).toBe("Hello");
+    }
+  });
+
+  test("subsequent message_delta only produces output_text.delta", () => {
+    const translator = new AgentEventTranslator();
+    translator.translate({ type: "message_delta", content: "Hello" });
+    const events = translator.translate({
+      type: "message_delta",
+      content: " world",
+    });
+
+    expect(events).toHaveLength(1);
+    expect(events[0].type).toBe("response.output_text.delta");
+  });
+
+  test("sequence_number is monotonically increasing", () => {
+    const translator = new AgentEventTranslator();
+    const e1 = translator.translate({ type: "message_delta", content: "a" });
+    const e2 = translator.translate({ type: "message_delta", content: "b" });
+    const e3 = translator.finalize();
+
+    const allSeqs = [...e1, ...e2, ...e3].map((e) =>
+      "sequence_number" in e ? e.sequence_number : -1,
+    );
+
+    for (let i = 1; i < allSeqs.length; i++) {
+      expect(allSeqs[i]).toBeGreaterThan(allSeqs[i - 1]);
+    }
+  });
+
+  test("translates tool_call to paired output_item.added + output_item.done", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "tool_call",
+      callId: "call_1",
+      name: "analytics.query",
+      args: { sql: "SELECT 1" },
+    });
+
+    expect(events).toHaveLength(2);
+    expect(events[0].type).toBe("response.output_item.added");
+    expect(events[1].type).toBe("response.output_item.done");
+
+    if (events[0].type === "response.output_item.added") {
+      expect(events[0].item.type).toBe("function_call");
+      if (events[0].item.type === "function_call") {
+        expect(events[0].item.name).toBe("analytics.query");
+        expect(events[0].item.call_id).toBe("call_1");
+      }
+    }
+  });
+
+  test("translates tool_result to paired output_item events", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "tool_result",
+      callId: "call_1",
+      result: { rows: 42 },
+    });
+
+    expect(events).toHaveLength(2);
+    expect(events[0].type).toBe("response.output_item.added");
+
+    if (events[0].type === "response.output_item.added") {
+      expect(events[0].item.type).toBe("function_call_output");
+    }
+  });
+
+  test("translates tool_result error", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "tool_result",
+      callId: "call_1",
+      result: null,
+      error: "Query failed",
+    });
+
+    // Asserted unconditionally: narrowing with `if` would let the test pass
+    // without checking anything if the event shape ever changed.
+    expect(events[0]).toMatchObject({
+      type: "response.output_item.added",
+      item: { type: "function_call_output", output: "Query failed" },
+    });
+  });
+
+  test("translates thinking to appkit.thinking extension event", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "thinking",
+      content: "Let me think about this...",
+    });
+
+    expect(events).toHaveLength(1);
+    expect(events[0].type).toBe("appkit.thinking");
+    if (events[0].type === "appkit.thinking") {
+      expect(events[0].content).toBe("Let me think about this...");
+    }
+  });
+
+  test("translates metadata to appkit.metadata extension event", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "metadata",
+      data: { threadId: "t-123" },
+    });
+
+    expect(events).toHaveLength(1);
+    expect(events[0].type).toBe("appkit.metadata");
+    if (events[0].type === "appkit.metadata") {
+      expect(events[0].data.threadId).toBe("t-123");
+    }
+  });
+
+  test("status:complete triggers finalize with response.completed", () => {
+    const translator = new AgentEventTranslator();
+    translator.translate({ type: "message_delta", content: "Hi" });
+    const events = translator.translate({ type: "status", status: "complete" });
+
+    const types = events.map((e) => e.type);
+    expect(types).toContain("response.output_item.done");
+    expect(types).toContain("response.completed");
+  });
+
+  test("status:error emits error + response.failed", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "status",
+      status: "error",
+      error: "Something broke",
+    });
+
+    expect(events).toHaveLength(2);
+    expect(events[0].type).toBe("error");
+    expect(events[1].type).toBe("response.failed");
+
+    if (events[0].type === "error") {
+      expect(events[0].error).toBe("Something broke");
+    }
+  });
+
+  test("finalize produces response.completed", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.finalize();
+
+    expect(events.some((e) => e.type === "response.completed")).toBe(true);
+  });
+
+  test("finalize with accumulated message text produces output_item.done", () => {
+    const translator = new AgentEventTranslator();
+    translator.translate({ type: "message_delta", content: "Hello " });
+    translator.translate({ type: "message_delta", content: "world" });
+    const events = translator.finalize();
+    const doneEvent = events.find(
+      (e) => e.type === "response.output_item.done",
+    );
+    // Pin the item kind first so the text check below cannot be skipped.
+    expect(doneEvent).toMatchObject({ item: { type: "message" } });
+    if (
+      doneEvent?.type === "response.output_item.done" &&
+      doneEvent.item.type === "message"
+    ) {
+      expect(doneEvent.item.content[0].text).toBe("Hello world");
+    }
+  });
+
+  test("output_index increments for tool calls", () => {
+    const translator = new AgentEventTranslator();
+    const e1 = translator.translate({
+      type: "tool_call",
+      callId: "c1",
+      name: "tool1",
+      args: {},
+    });
+    const e2 = translator.translate({
+      type: "tool_result",
+      callId: "c1",
+      result: "ok",
+    });
+
+    // Assert the event kinds first so the comparison can never be skipped.
+    expect(e1[0].type).toBe("response.output_item.added");
+    expect(e2[0].type).toBe("response.output_item.added");
+    const indexOf = (e: ResponseStreamEvent) =>
+      "output_index" in e ? e.output_index : Number.NaN;
+    expect(indexOf(e2[0])).toBeGreaterThan(indexOf(e1[0]));
+  });
+});
+
+describe("AgentEventTranslator — monotonic output_index", () => {
+  /**
+   * Helper: every emitted `response.output_item.added`/`output_item.done`
+   * event's `output_index` must be >= every prior add/done `output_index`.
+   * This is the strict contract Responses-API clients (OpenAI's own SDK
+   * parser) enforce.
+   */
+  function assertMonotonic(events: ResponseStreamEvent[]) {
+    let last = -1;
+    for (const ev of events) {
+      if (
+        ev.type === "response.output_item.added" ||
+        ev.type === "response.output_item.done"
+      ) {
+        expect(ev.output_index).toBeGreaterThanOrEqual(last);
+        last = ev.output_index;
+      }
+    }
+  }
+
+  test("tool_call followed by message_delta emits monotonic indices (regression)", () => {
+    // Before the fix this produced: tool_call at index 1, then
+    // message_delta.added at 0 — monotonicity violated.
+    const t = new AgentEventTranslator();
+    const all: ResponseStreamEvent[] = [];
+    all.push(
+      ...t.translate({
+        type: "tool_call",
+        callId: "c1",
+        name: "lookup",
+        args: { q: "x" },
+      }),
+    );
+    all.push(
+      ...t.translate({ type: "tool_result", callId: "c1", result: "ok" }),
+    );
+    all.push(...t.translate({ type: "message_delta", content: "Result: " }));
+    all.push(...t.translate({ type: "message_delta", content: "ok." }));
+    all.push(...t.finalize());
+
+    assertMonotonic(all);
+
+    const added = all.filter((e) => e.type === "response.output_item.added");
+    // Three items: tool_call, tool_result, message. Indices 0/1/2.
+    expect(added.map((e) => e.output_index)).toEqual([0, 1, 2]);
+  });
+
+  test("message interrupted by tool_call is closed before the tool_call opens", () => {
+    const t = new AgentEventTranslator();
+    const all: ResponseStreamEvent[] = [];
+    all.push(...t.translate({ type: "message_delta", content: "thinking..." }));
+    all.push(
+      ...t.translate({
+        type: "tool_call",
+        callId: "c1",
+        name: "lookup",
+        args: {},
+      }),
+    );
+    all.push(
+      ...t.translate({ type: "tool_result", callId: "c1", result: "ok" }),
+    );
+    all.push(...t.translate({ type: "message_delta", content: "final" }));
+    all.push(...t.finalize());
+
+    assertMonotonic(all);
+
+    // Structure: msg0.added, msg0.delta, msg0.done (closed before tool),
+    // tool_call.added/done, tool_result.added/done, msg1.added, msg1.delta,
+    // msg1.done (from finalize), response.completed.
+    const addedDone = all.filter(
+      (e) =>
+        e.type === "response.output_item.added" ||
+        e.type === "response.output_item.done",
+    );
+    expect(addedDone.map((e) => `${e.type}@${e.output_index}`)).toEqual([
+      "response.output_item.added@0",
+      "response.output_item.done@0",
+      "response.output_item.added@1",
+      "response.output_item.done@1",
+      "response.output_item.added@2",
+      "response.output_item.done@2",
+      "response.output_item.added@3",
+      "response.output_item.done@3",
+    ]);
+  });
+
+  test("full `message` event after deltas does not double-emit output_item.added", () => {
+    const t = new AgentEventTranslator();
+    const all: ResponseStreamEvent[] = [];
+    all.push(...t.translate({ type: "message_delta", content: "partial" }));
+    all.push(
+      ...t.translate({ type: "message", content: "full final content" }),
+    );
+    all.push(...t.finalize());
+
+    const added = all.filter((e) => e.type === "response.output_item.added");
+    const done = all.filter((e) => e.type === "response.output_item.done");
+    // Exactly one added (from the first delta) and one done (from the full
+    // message). finalize() must not emit a second done for the same item.
+    expect(added).toHaveLength(1);
+    expect(done).toHaveLength(1);
+    // Pin the item kind so the text check below cannot be skipped silently.
+    expect(done[0]).toMatchObject({ item: { type: "message" } });
+    const item = "item" in done[0] ? done[0].item : undefined;
+    if (item?.type === "message") {
+      expect(item.content[0].text).toBe("full final content");
+    }
+  });
+
+  test("tool_result coerces undefined result to empty-string output", () => {
+    const t = new AgentEventTranslator();
+    const events = t.translate({
+      type: "tool_result",
+      callId: "c1",
+      result: undefined,
+    });
+    const done = events.find((e) => e.type === "response.output_item.done");
+    // Matched unconditionally: a missing done event or a different item kind
+    // now fails the test instead of skipping the assertion.
+    expect(done).toMatchObject({
+      type: "response.output_item.done",
+      item: { type: "function_call_output", output: "" },
+    });
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/thread-store.test.ts b/packages/appkit/src/plugins/agents/tests/thread-store.test.ts
new file mode 100644
index 000000000..ed4f70bab
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/thread-store.test.ts
@@ -0,0 +1,138 @@
+import { describe, expect, test } from "vitest";
+import { InMemoryThreadStore } from "../thread-store";
+
+describe("InMemoryThreadStore", () => {
+  test("create() returns a new thread with the given userId", async () => {
+    const store = new InMemoryThreadStore();
+    const thread = await store.create("user-1");
+
+    expect(thread.id).toBeDefined();
+    expect(thread.userId).toBe("user-1");
+    expect(thread.messages).toEqual([]);
+    expect(thread.createdAt).toBeInstanceOf(Date);
+    expect(thread.updatedAt).toBeInstanceOf(Date);
+  });
+
+  test("get() returns the thread for the correct user", async () => {
+    const store = new InMemoryThreadStore();
+    const thread = await store.create("user-1");
+
+    const retrieved = await store.get(thread.id, "user-1");
+    expect(retrieved).toEqual(thread);
+  });
+
+  test("get() returns null for wrong user", async () => {
+    const store = new InMemoryThreadStore();
+    const thread = await store.create("user-1");
+
+    const retrieved = await store.get(thread.id, "user-2");
+    expect(retrieved).toBeNull();
+  });
+
+  test("get() returns null for non-existent thread", async () => {
+    const store = new InMemoryThreadStore();
+    const retrieved = await store.get("non-existent", "user-1");
+    expect(retrieved).toBeNull();
+  });
+
+  test("list() returns threads sorted by updatedAt desc", async () => {
+    const store = new InMemoryThreadStore();
+    const t1 = await store.create("user-1");
+    const t2 = await store.create("user-1");
+
+    // Make t1 more recently updated
+    await store.addMessage(t1.id, "user-1", {
+      id: "msg-1",
+      role: "user",
+      content: "hello",
+      createdAt: new Date(),
+    });
+
+    const threads = await store.list("user-1");
+    expect(threads).toHaveLength(2);
+    expect(threads[0].id).toBe(t1.id);
+    expect(threads[1].id).toBe(t2.id);
+  });
+
+  test("list() returns empty for unknown user", async () => {
+    const store = new InMemoryThreadStore();
+    await store.create("user-1");
+
+    const threads = await store.list("user-2");
+    expect(threads).toEqual([]);
+  });
+
+  test("addMessage() appends to thread and updates timestamp", async () => {
+    const store = new InMemoryThreadStore();
+    const thread = await store.create("user-1");
+    const originalUpdatedAt = thread.updatedAt;
+
+    // Small delay so the strict `>` check below sees a later timestamp
+    await new Promise((r) => setTimeout(r, 5));
+
+    await store.addMessage(thread.id, "user-1", {
+      id: "msg-1",
+      role: "user",
+      content: "hello",
+      createdAt: new Date(),
+    });
+
+    const updated = await store.get(thread.id, "user-1");
+    expect(updated?.messages).toHaveLength(1);
+    expect(updated?.messages[0].content).toBe("hello");
+    expect(updated?.updatedAt.getTime()).toBeGreaterThan(
+      originalUpdatedAt.getTime(),
+    );
+  });
+
+  test("addMessage() throws for non-existent thread", async () => {
+    const store = new InMemoryThreadStore();
+
+    await expect(
+      store.addMessage("non-existent", "user-1", {
+        id: "msg-1",
+        role: "user",
+        content: "hello",
+        createdAt: new Date(),
+      }),
+    ).rejects.toThrow("Thread non-existent not found");
+  });
+
+  test("delete() removes a thread and returns true", async () => {
+    const store = new InMemoryThreadStore();
+    const thread = await store.create("user-1");
+
+    const deleted = await store.delete(thread.id, "user-1");
+    expect(deleted).toBe(true);
+
+    const retrieved = await store.get(thread.id, "user-1");
+    expect(retrieved).toBeNull();
+  });
+
+  test("delete() returns false for non-existent thread", async () => {
+    const store = new InMemoryThreadStore();
+    const deleted = await store.delete("non-existent", "user-1");
+    expect(deleted).toBe(false);
+  });
+
+  test("delete() returns false for wrong user", async () => {
+    const store = new InMemoryThreadStore();
+    const thread = await store.create("user-1");
+
+    const deleted = await store.delete(thread.id, "user-2");
+    expect(deleted).toBe(false);
+  });
+
+  test("threads are isolated per user", async () => {
+    const store = new InMemoryThreadStore();
+    await store.create("user-1");
+    await store.create("user-1");
+    await store.create("user-2");
+
+    const user1Threads = await store.list("user-1");
+    const user2Threads = await store.list("user-2");
+
+    expect(user1Threads).toHaveLength(2);
+    expect(user2Threads).toHaveLength(1);
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/tool-approval-gate.test.ts b/packages/appkit/src/plugins/agents/tests/tool-approval-gate.test.ts
new file mode 100644
index 000000000..1e17ddf63
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/tool-approval-gate.test.ts
@@ -0,0 +1,156 @@
+import { afterEach, beforeEach, describe, expect, test, vi } from "vitest";
+import { ToolApprovalGate } from "../tool-approval-gate";
+
+describe("ToolApprovalGate", () => {
+  let gate: ToolApprovalGate;
+
+  beforeEach(() => {
+    vi.useFakeTimers();
+    gate = new ToolApprovalGate();
+  });
+
+  afterEach(() => {
+    vi.useRealTimers();
+  });
+
+  test("resolves with 'approve' when a matching submit arrives", async () => {
+    const waiter = gate.wait({
+      approvalId: "a1",
+      streamId: "s1",
+      userId: "alice",
+      timeoutMs: 60_000,
+    });
+    expect(gate.size).toBe(1);
+
+    const result = gate.submit({
+      approvalId: "a1",
+      userId: "alice",
+      decision: "approve",
+    });
+
+    expect(result).toEqual({ ok: true });
+    await expect(waiter).resolves.toBe("approve");
+    expect(gate.size).toBe(0);
+  });
+
+  test("resolves with 'deny' on explicit deny", async () => {
+    const waiter = gate.wait({
+      approvalId: "a2",
+      streamId: "s1",
+      userId: "alice",
+      timeoutMs: 60_000,
+    });
+    gate.submit({
+      approvalId: "a2",
+      userId: "alice",
+      decision: "deny",
+    });
+    await expect(waiter).resolves.toBe("deny");
+  });
+
+  test("auto-denies after timeoutMs with no submit", async () => {
+    const waiter = gate.wait({
+      approvalId: "a3",
+      streamId: "s1",
+      userId: "alice",
+      timeoutMs: 1000,
+    });
+    vi.advanceTimersByTime(1000);
+    await expect(waiter).resolves.toBe("deny");
+    expect(gate.size).toBe(0);
+  });
+
+  test("refuses a submit from a different user (ownership check)", async () => {
+    const waiter = gate.wait({
+      approvalId: "a4",
+      streamId: "s1",
+      userId: "alice",
+      timeoutMs: 60_000,
+    });
+    const result = gate.submit({
+      approvalId: "a4",
+      userId: "bob",
+      decision: "approve",
+    });
+    expect(result).toEqual({ ok: false, reason: "forbidden" });
+    expect(gate.size).toBe(1);
+    // Waiter is still pending; cleanup to let fake timers drain.
+    gate.submit({
+      approvalId: "a4",
+      userId: "alice",
+      decision: "deny",
+    });
+    await expect(waiter).resolves.toBe("deny");
+  });
+
+  test("returns 'unknown' reason when approvalId is not registered", () => {
+    expect(
+      gate.submit({ approvalId: "nope", userId: "x", decision: "approve" }),
+    ).toEqual({ ok: false, reason: "unknown" });
+  });
+
+  test("abortStream denies every pending gate for that stream", async () => {
+    const a = gate.wait({
+      approvalId: "a5",
+      streamId: "s1",
+      userId: "alice",
+      timeoutMs: 60_000,
+    });
+    const b = gate.wait({
+      approvalId: "a6",
+      streamId: "s1",
+      userId: "alice",
+      timeoutMs: 60_000,
+    });
+    const c = gate.wait({
+      approvalId: "a7",
+      streamId: "s2",
+      userId: "alice",
+      timeoutMs: 60_000,
+    });
+    gate.abortStream("s1");
+    await expect(a).resolves.toBe("deny");
+    await expect(b).resolves.toBe("deny");
+    expect(gate.size).toBe(1);
+    // s2's waiter is still pending; settle it to clean up timers.
+    gate.submit({ approvalId: "a7", userId: "alice", decision: "deny" });
+    await expect(c).resolves.toBe("deny");
+  });
+
+  test("abortAll denies every pending gate", async () => {
+    const a = gate.wait({
+      approvalId: "a8",
+      streamId: "s1",
+      userId: "alice",
+      timeoutMs: 60_000,
+    });
+    const b = gate.wait({
+      approvalId: "a9",
+      streamId: "s2",
+      userId: "bob",
+      timeoutMs: 60_000,
+    });
+    gate.abortAll();
+    await expect(a).resolves.toBe("deny");
+    await expect(b).resolves.toBe("deny");
+    expect(gate.size).toBe(0);
+  });
+
+  test("a timed-out approval cannot be resolved by a late submit", async () => {
+    const waiter = gate.wait({
+      approvalId: "a10",
+      streamId: "s1",
+      userId: "alice",
+      timeoutMs: 500,
+    });
+    vi.advanceTimersByTime(500);
+    await expect(waiter).resolves.toBe("deny");
+
+    const late = gate.submit({
+      approvalId: "a10",
+      userId: "alice",
+      decision: "approve",
+    });
+    expect(late).toEqual({ ok: false, reason: "unknown" });
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/thread-store.ts b/packages/appkit/src/plugins/agents/thread-store.ts
new file mode 100644
index 000000000..7c4622cd3
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/thread-store.ts
@@ -0,0 +1,85 @@
+import { randomUUID } from "node:crypto";
+import type { Message, Thread, ThreadStore } from "shared";
+
+/**
+ * In-memory thread store backed by a nested Map.
+ *
+ * Outer key: userId, inner key: threadId. Thread history is retained for the
+ * lifetime of the process with no eviction, caps, or TTL — a chatty user will
+ * grow the in-memory footprint monotonically, and the server loses every
+ * thread on restart. **This implementation is intended for local development
+ * and single-process demos only.**
+ *
+ * Only `create()` allocates a per-user bucket. Lookups, listings and deletes
+ * for a user with no threads never insert anything, and a bucket is dropped
+ * once its last thread is deleted, so probing with arbitrary user ids cannot
+ * grow the outer map.
+ *
+ * For any real deployment, pass a persistent `ThreadStore` to `agents({ ... })`
+ * (e.g. a Lakebase- or Postgres-backed implementation). A bounded
+ * `InMemoryThreadStore` with eviction policies is tracked as a follow-up.
+ */
+export class InMemoryThreadStore implements ThreadStore {
+  private readonly store = new Map<string, Map<string, Thread>>();
+
+  /** Creates an empty thread owned by `userId` and returns it. */
+  async create(userId: string): Promise<Thread> {
+    const now = new Date();
+    const thread: Thread = {
+      id: randomUUID(),
+      userId,
+      messages: [],
+      createdAt: now,
+      updatedAt: now,
+    };
+    let threads = this.store.get(userId);
+    if (!threads) {
+      threads = new Map();
+      this.store.set(userId, threads);
+    }
+    threads.set(thread.id, thread);
+    return thread;
+  }
+
+  /** Returns the thread, or `null` when it does not exist for this user. */
+  async get(threadId: string, userId: string): Promise<Thread | null> {
+    return this.store.get(userId)?.get(threadId) ?? null;
+  }
+
+  /** Lists the user's threads, most recently updated first. */
+  async list(userId: string): Promise<Thread[]> {
+    const threads = this.store.get(userId);
+    if (!threads) return [];
+    return Array.from(threads.values()).sort(
+      (a, b) => b.updatedAt.getTime() - a.updatedAt.getTime(),
+    );
+  }
+
+  /**
+   * Appends `message` to the thread and bumps its `updatedAt`.
+   *
+   * @throws Error when the thread does not exist for this user.
+   */
+  async addMessage(
+    threadId: string,
+    userId: string,
+    message: Message,
+  ): Promise<void> {
+    const thread = this.store.get(userId)?.get(threadId);
+    if (!thread) throw new Error(`Thread ${threadId} not found`);
+    thread.messages.push(message);
+    thread.updatedAt = new Date();
+  }
+
+  /**
+   * Deletes the thread. Returns `true` when a thread was removed, `false`
+   * when it did not exist for this user.
+   */
+  async delete(threadId: string, userId: string): Promise<boolean> {
+    const threads = this.store.get(userId);
+    if (!threads || !threads.delete(threadId)) return false;
+    // Drop the now-empty bucket so the outer map does not accumulate users.
+    if (threads.size === 0) this.store.delete(userId);
+    return true;
+  }
+}
diff --git a/packages/appkit/src/plugins/agents/tool-approval-gate.ts b/packages/appkit/src/plugins/agents/tool-approval-gate.ts
new file mode 100644
index 000000000..669f30a96
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tool-approval-gate.ts
@@ -0,0 +1,136 @@
+/**
+ * Server-side state for the human-in-the-loop approval gate on
+ * `destructive: true` agent tool calls.
+ *
+ * Lifecycle:
+ *
+ * 1. `wait(...)` is called from inside `executeTool` when a destructive tool
+ *    is about to execute. A `Pending` record is registered and a timer is
+ *    scheduled for auto-deny. The returned promise is what blocks the
+ *    adapter until the decision arrives.
+ * 2. The client receives an `appkit.approval_pending` SSE event carrying the
+ *    `approvalId` + `streamId` and posts a decision to `POST /chat/approve`.
+ *    The route calls {@link ToolApprovalGate.submit} which resolves the
+ *    pending promise and clears the timer.
+ * 3. If no submit arrives within `timeoutMs`, the timer fires and the
+ *    promise resolves with `"deny"`.
+ *
+ * Security invariants:
+ *
+ * - `submit` verifies that the decider's user id matches the user who
+ *   initiated the stream (set by `wait`). Mismatches are rejected without
+ *   resolving the pending promise — this prevents a second user from
+ *   approving (or denying) another user's destructive action.
+ * - `abortStream(streamId)` cancels every pending gate for a stream and
+ *   denies each one; `abortAll()` does the same across all streams. Used
+ *   when the enclosing stream is cancelled or the plugin is shutting down.
+ * - Every settlement that is not an explicit user decision (timeout, abort,
+ *   a re-registered `approvalId`) resolves with `"deny"`.
+ */
+type ApprovalDecision = "approve" | "deny";
+
+interface Pending {
+  resolve: (decision: ApprovalDecision) => void;
+  userId: string;
+  streamId: string;
+  timeout: ReturnType<typeof setTimeout>;
+}
+
+type ApprovalSubmitResult =
+  | { ok: true }
+  | { ok: false; reason: "unknown" | "forbidden" };
+
+export class ToolApprovalGate {
+  private readonly pending = new Map<string, Pending>();
+
+  /**
+   * Register a pending approval and return a promise that resolves with the
+   * user's decision or with `"deny"` when the timeout elapses. The returned
+   * promise never rejects.
+   *
+   * If `approvalId` is already pending, the earlier waiter is settled with
+   * `"deny"` and its timer cleared before the new record is registered.
+   * Without this, the overwritten record's timer would later delete the
+   * newer record and leave its promise unresolved forever.
+   */
+  wait(args: {
+    approvalId: string;
+    streamId: string;
+    userId: string;
+    timeoutMs: number;
+  }): Promise<ApprovalDecision> {
+    const { approvalId, streamId, userId, timeoutMs } = args;
+    const previous = this.pending.get(approvalId);
+    if (previous) this.settle(approvalId, previous, "deny");
+    return new Promise<ApprovalDecision>((resolve) => {
+      const entry: Pending = {
+        resolve,
+        userId,
+        streamId,
+        timeout: setTimeout(() => {
+          // Auto-deny only while this exact record is still registered.
+          if (this.pending.get(approvalId) === entry) {
+            this.settle(approvalId, entry, "deny");
+          }
+        }, timeoutMs),
+      };
+      this.pending.set(approvalId, entry);
+    });
+  }
+
+  /**
+   * Settle an approval with a user decision. Returns:
+   * - `{ ok: true }` if the pending record existed, the userId matched, and
+   *   the promise was resolved.
+   * - `{ ok: false, reason: "unknown" }` if no pending record matches the id.
+   * - `{ ok: false, reason: "forbidden" }` if the userId does not match the
+   *   user who initiated the stream.
+   */
+  submit(args: {
+    approvalId: string;
+    userId: string;
+    decision: ApprovalDecision;
+  }): ApprovalSubmitResult {
+    const { approvalId, userId, decision } = args;
+    const p = this.pending.get(approvalId);
+    if (!p) return { ok: false, reason: "unknown" };
+    if (p.userId !== userId) return { ok: false, reason: "forbidden" };
+    this.settle(approvalId, p, decision);
+    return { ok: true };
+  }
+
+  /**
+   * Cancel all pending gates for a specific stream (e.g., when the user
+   * cancels the stream). Each gate resolves with `"deny"` so the adapter
+   * unwinds cleanly.
+   */
+  abortStream(streamId: string): void {
+    // Deleting the current entry while iterating a Map is well-defined.
+    for (const [id, p] of this.pending) {
+      if (p.streamId === streamId) this.settle(id, p, "deny");
+    }
+  }
+
+  /** Cancel every pending gate. Used at plugin shutdown. */
+  abortAll(): void {
+    for (const [id, p] of this.pending) {
+      this.settle(id, p, "deny");
+    }
+  }
+
+  /** Number of pending approvals (test/diagnostic helper). */
+  get size(): number {
+    return this.pending.size;
+  }
+
+  /** Stop the record's timer, unregister it, then resolve its waiter. */
+  private settle(
+    approvalId: string,
+    p: Pending,
+    decision: ApprovalDecision,
+  ): void {
+    clearTimeout(p.timeout);
+    this.pending.delete(approvalId);
+    p.resolve(decision);
+  }
+}
diff --git a/packages/shared/src/agent.ts b/packages/shared/src/agent.ts
index ef532c7c7..2594b3e6d 100644
--- a/packages/shared/src/agent.ts
+++ b/packages/shared/src/agent.ts
@@ -86,7 +86,21 @@ export type AgentEvent =
       status: "running" | "waiting" | "complete" | "error";
       error?: string;
     }
-  | { type: "metadata"; data: Record<string, unknown> };
+  | { type: "metadata"; data: Record<string, unknown> }
+  | {
+      /**
+       * Emitted by the agents plugin (not adapters) when a tool call annotated
+       * `destructive: true` is awaiting human approval. Clients should render
+       * an approval prompt and POST to `/chat/approve` with the matching
+       * `approvalId` and a `decision` of `approve` or `deny`.
+       */
+      type: "approval_pending";
+      approvalId: string;
+      streamId: string;
+      toolName: string;
+      args: unknown;
+      annotations?: ToolAnnotations;
+    };
 
 // ---------------------------------------------------------------------------
 // Responses API types (OpenAI-compatible wire format for HTTP boundary)
@@ -178,6 +192,23 @@ export interface AppKitMetadataEvent {
   sequence_number: number;
 }
 
+/**
+ * Emitted when a destructive tool call is awaiting human approval. The client
+ * should render an approval UI and POST the decision to `/chat/approve` with
+ * `{ streamId, approvalId, decision: "approve" | "deny" }`. If no decision
+ * arrives before the server-side timeout, the call is auto-denied and the
+ * agent receives a denial string as the tool output.
+ */
+export interface AppKitApprovalPendingEvent {
+  type: "appkit.approval_pending";
+  approval_id: string;
+  stream_id: string;
+  tool_name: string;
+  args: unknown;
+  annotations?: ToolAnnotations;
+  sequence_number: number;
+}
+
 export type ResponseStreamEvent =
   | ResponseOutputItemAddedEvent
   | ResponseOutputItemDoneEvent
@@ -186,7 +217,8 @@ export type ResponseStreamEvent =
   | ResponseErrorEvent
   | ResponseFailedEvent
   | AppKitThinkingEvent
-  | AppKitMetadataEvent;
+  | AppKitMetadataEvent
+  | AppKitApprovalPendingEvent;
 
 // ---------------------------------------------------------------------------
 // Adapter contract

From 3107741e326fdcfaca03854b6e90a70240b93d30 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Thu, 23 Apr 2026 17:59:39 +0200
Subject: [PATCH 02/46] refactor(appkit): generalize default base system prompt

Tool-agnostic guidelines instead of SQL/files-specific defaults; accept full
PromptContext in buildBaseSystemPrompt for parity with custom callbacks.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 .../appkit/src/core/agent/system-prompt.ts    | 32 +++++++++++++------
 .../core/agent/tests/system-prompt.test.ts    | 30 ++++++++++++-----
 packages/appkit/src/plugins/agents/agents.ts  |  8 +++--
 3 files changed, 50 insertions(+), 20 deletions(-)

diff --git a/packages/appkit/src/core/agent/system-prompt.ts b/packages/appkit/src/core/agent/system-prompt.ts
index 634f49c5f..01f3fe9b0 100644
--- a/packages/appkit/src/core/agent/system-prompt.ts
+++ b/packages/appkit/src/core/agent/system-prompt.ts
@@ -1,28 +1,40 @@
+import type { PromptContext } from "./types";
+
 /**
- * Builds the AppKit base system prompt from active plugin names.
+ * Default base system prompt: product identity, active AppKit plugins, and
+ * tool-agnostic behavior hints.
  *
- * The base prompt provides guidelines and app context. It does NOT
- * include individual tool descriptions — those are sent via the
- * structured `tools` API parameter to the LLM.
+ * Individual tool definitions and JSON Schemas are still sent through the
+ * model's `tools` / function-calling channel — this string is not a second
+ * copy of that list. `ctx.toolNames` is available for custom
+ * `baseSystemPrompt` callbacks; the default text stays short and does not
+ * enumerate tools to avoid drift and token bloat.
  */
-export function buildBaseSystemPrompt(pluginNames: string[]): string {
+export function buildBaseSystemPrompt(ctx: PromptContext): string {
+  const { pluginNames } = ctx;
   const lines: string[] = [
     "You are an AI assistant running on Databricks AppKit.",
   ];
 
   if (pluginNames.length > 0) {
     lines.push("");
-    lines.push(`Active plugins: ${pluginNames.join(", ")}`);
+    lines.push(`Active AppKit plugins: ${pluginNames.join(", ")}`);
   }
 
   lines.push("");
   lines.push("Guidelines:");
-  lines.push("- Use Databricks SQL syntax when writing queries");
   lines.push(
-    "- When results are large, summarize key findings rather than dumping raw data",
+    "- Be concise: for large or noisy tool output, summarize what matters and how to go deeper instead of pasting everything.",
+  );
+  lines.push(
+    "- Use each tool as defined: pass required arguments and use the syntax, dialect, or path rules the target system expects (see each tool’s description and schema).",
+  );
+  lines.push(
+    "- If a tool call fails, explain the error in plain language and suggest a fix or next step.",
+  );
+  lines.push(
+    "- Respect tool metadata and app policy: read-only vs destructive tools, user/identity context, and any approval or safety flows the app provides.",
   );
-  lines.push("- If a tool call fails, explain the error clearly to the user");
-  lines.push("- When browsing files, verify the path exists before reading");
 
   return lines.join("\n");
 }
diff --git a/packages/appkit/src/core/agent/tests/system-prompt.test.ts b/packages/appkit/src/core/agent/tests/system-prompt.test.ts
index 83bf8e192..25724259e 100644
--- a/packages/appkit/src/core/agent/tests/system-prompt.test.ts
+++ b/packages/appkit/src/core/agent/tests/system-prompt.test.ts
@@ -1,27 +1,41 @@
 import { describe, expect, test } from "vitest";
 import { buildBaseSystemPrompt, composeSystemPrompt } from "../system-prompt";
 
+const emptyCtx = {
+  agentName: "a",
+  pluginNames: [] as string[],
+  toolNames: [] as string[],
+};
+
 describe("buildBaseSystemPrompt", () => {
   test("includes plugin names", () => {
-    const prompt = buildBaseSystemPrompt(["analytics", "files", "genie"]);
-    expect(prompt).toContain("Active plugins: analytics, files, genie");
+    const prompt = buildBaseSystemPrompt({
+      agentName: "assistant",
+      pluginNames: ["analytics", "files", "genie"],
+      toolNames: [],
+    });
+    expect(prompt).toContain("Active AppKit plugins: analytics, files, genie");
   });
 
   test("includes guidelines", () => {
-    const prompt = buildBaseSystemPrompt([]);
+    const prompt = buildBaseSystemPrompt(emptyCtx);
     expect(prompt).toContain("Guidelines:");
-    expect(prompt).toContain("Databricks SQL");
-    expect(prompt).toContain("summarize key findings");
+    expect(prompt).toContain("syntax, dialect, or path rules");
+    expect(prompt).toContain("summarize what matters");
   });
 
   test("works with no plugins", () => {
-    const prompt = buildBaseSystemPrompt([]);
+    const prompt = buildBaseSystemPrompt(emptyCtx);
     expect(prompt).toContain("AI assistant running on Databricks AppKit");
-    expect(prompt).not.toContain("Active plugins:");
+    expect(prompt).not.toContain("Active AppKit plugins:");
   });
 
   test("does NOT include individual tool names", () => {
-    const prompt = buildBaseSystemPrompt(["analytics"]);
+    const prompt = buildBaseSystemPrompt({
+      agentName: "a",
+      pluginNames: ["analytics"],
+      toolNames: ["analytics.query"],
+    });
     expect(prompt).not.toContain("analytics.query");
     expect(prompt).not.toContain("Available tools:");
   });
diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index 9c3076e6e..7b4006bc8 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -27,7 +27,11 @@ import {
   chatRequestSchema,
   invocationsRequestSchema,
 } from "./schemas";
-import { buildBaseSystemPrompt, composeSystemPrompt } from "../../core/agent/system-prompt";
+import {
+  buildBaseSystemPrompt,
+  composeSystemPrompt,
+} from "../../core/agent/system-prompt";
+import { AppKitMcpClient } from "../../connectors/mcp";
 import { InMemoryThreadStore } from "./thread-store";
 import { ToolApprovalGate } from "./tool-approval-gate";
 import {
@@ -1245,7 +1249,7 @@ function composePromptForAgent(
   } else if (typeof resolved === "function") {
     base = resolved(ctx);
   } else {
-    base = buildBaseSystemPrompt(ctx.pluginNames);
+    base = buildBaseSystemPrompt(ctx);
   }
 
   return composeSystemPrompt(base, registered.instructions);

From 2ba1577c157b2ec27274eda39ee11363a9362eb6 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Thu, 23 Apr 2026 18:01:42 +0200
Subject: [PATCH 03/46] feat(appkit): optional serving_endpoint on agents
 plugin manifest

Register DATABRICKS_SERVING_ENDPOINT_NAME as optional CAN_QUERY so apps using
Databricks-hosted agent models get resource wiring; optional when agents use
only external adapters. Sync template/appkit.plugins.json.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 .../appkit/src/plugins/agents/manifest.json   | 16 ++++++++++++-
 template/appkit.plugins.json                  | 24 +++++++++++++++++++
 2 files changed, 39 insertions(+), 1 deletion(-)

diff --git a/packages/appkit/src/plugins/agents/manifest.json b/packages/appkit/src/plugins/agents/manifest.json
index cb7a43f8b..f2766b808 100644
--- a/packages/appkit/src/plugins/agents/manifest.json
+++ b/packages/appkit/src/plugins/agents/manifest.json
@@ -5,6 +5,20 @@
   "description": "AI agents driven by markdown configs or code, with auto-tool-discovery from registered plugins",
   "resources": {
     "required": [],
-    "optional": []
+    "optional": [
+      {
+        "type": "serving_endpoint",
+        "alias": "Model Serving (agents)",
+        "resourceKey": "agents-serving-endpoint",
+        "description": "Databricks Model Serving endpoint for agent runs that use workspace-hosted models (DatabricksAdapter, optional default serving endpoint env, or markdown configs that resolve to serving). Omit when agents rely only on external/custom model adapters.",
+        "permission": "CAN_QUERY",
+        "fields": {
+          "name": {
+            "env": "DATABRICKS_SERVING_ENDPOINT_NAME",
+            "description": "Serving endpoint name used for agent LLM inference when configured for Databricks Model Serving"
+          }
+        }
+      }
+    ]
   }
 }
diff --git a/template/appkit.plugins.json b/template/appkit.plugins.json
index d3c8702f9..918ad83f0 100644
--- a/template/appkit.plugins.json
+++ b/template/appkit.plugins.json
@@ -2,6 +2,30 @@
   "$schema": "https://databricks.github.io/appkit/schemas/template-plugins.schema.json",
   "version": "1.1",
   "plugins": {
+    "agents": {
+      "name": "agents",
+      "displayName": "Agents Plugin",
+      "description": "AI agents driven by markdown configs or code, with auto-tool-discovery from registered plugins",
+      "package": "@databricks/appkit",
+      "resources": {
+        "required": [],
+        "optional": [
+          {
+            "type": "serving_endpoint",
+            "alias": "Model Serving (agents)",
+            "resourceKey": "agents-serving-endpoint",
+            "description": "Databricks Model Serving endpoint for agent runs that use workspace-hosted models (DatabricksAdapter, optional default serving endpoint env, or markdown configs that resolve to serving). Omit when agents rely only on external/custom model adapters.",
+            "permission": "CAN_QUERY",
+            "fields": {
+              "name": {
+                "env": "DATABRICKS_SERVING_ENDPOINT_NAME",
+                "description": "Serving endpoint name used for agent LLM inference when configured for Databricks Model Serving"
+              }
+            }
+          }
+        ]
+      }
+    },
     "analytics": {
       "name": "analytics",
       "displayName": "Analytics Plugin",

From 1c4f8d2e529acb829be84ae6a4a8ea5f1ee9d1ba Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Thu, 23 Apr 2026 18:03:21 +0200
Subject: [PATCH 04/46] fix(appkit): agents manifest uses
 DATABRICKS_AGENT_ENDPOINT
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Align optional serving resource with `DatabricksAdapter.fromModelServing()`, which
reads `DATABRICKS_AGENT_ENDPOINT` — not `DATABRICKS_SERVING_ENDPOINT_NAME`
(serving plugin). Sync template.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 packages/appkit/src/plugins/agents/manifest.json | 6 +++---
 template/appkit.plugins.json                     | 6 +++---
 2 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/packages/appkit/src/plugins/agents/manifest.json b/packages/appkit/src/plugins/agents/manifest.json
index f2766b808..f3986c837 100644
--- a/packages/appkit/src/plugins/agents/manifest.json
+++ b/packages/appkit/src/plugins/agents/manifest.json
@@ -10,12 +10,12 @@
         "type": "serving_endpoint",
         "alias": "Model Serving (agents)",
         "resourceKey": "agents-serving-endpoint",
-        "description": "Databricks Model Serving endpoint for agent runs that use workspace-hosted models (DatabricksAdapter, optional default serving endpoint env, or markdown configs that resolve to serving). Omit when agents rely only on external/custom model adapters.",
+        "description": "Databricks Model Serving endpoint for agents using workspace-hosted models (`DatabricksAdapter.fromModelServing`). Wire the same endpoint name AppKit reads from `DATABRICKS_AGENT_ENDPOINT` when no per-agent model is configured. Omit when agents use only external adapters.",
         "permission": "CAN_QUERY",
         "fields": {
           "name": {
-            "env": "DATABRICKS_SERVING_ENDPOINT_NAME",
-            "description": "Serving endpoint name used for agent LLM inference when configured for Databricks Model Serving"
+            "env": "DATABRICKS_AGENT_ENDPOINT",
+            "description": "Endpoint name passed to Model Serving when agents default to `DatabricksAdapter.fromModelServing()`"
           }
         }
       }
diff --git a/template/appkit.plugins.json b/template/appkit.plugins.json
index 918ad83f0..2f22a50c1 100644
--- a/template/appkit.plugins.json
+++ b/template/appkit.plugins.json
@@ -14,12 +14,12 @@
             "type": "serving_endpoint",
             "alias": "Model Serving (agents)",
             "resourceKey": "agents-serving-endpoint",
-            "description": "Databricks Model Serving endpoint for agent runs that use workspace-hosted models (DatabricksAdapter, optional default serving endpoint env, or markdown configs that resolve to serving). Omit when agents rely only on external/custom model adapters.",
+            "description": "Databricks Model Serving endpoint for agents using workspace-hosted models (`DatabricksAdapter.fromModelServing`). Wire the same endpoint name AppKit reads from `DATABRICKS_AGENT_ENDPOINT` when no per-agent model is configured. Omit when agents use only external adapters.",
             "permission": "CAN_QUERY",
             "fields": {
               "name": {
-                "env": "DATABRICKS_SERVING_ENDPOINT_NAME",
-                "description": "Serving endpoint name used for agent LLM inference when configured for Databricks Model Serving"
+                "env": "DATABRICKS_AGENT_ENDPOINT",
+                "description": "Endpoint name passed to Model Serving when agents default to `DatabricksAdapter.fromModelServing()`"
               }
             }
           }

From 68dcd9c1e6eddef885922d8eb369c03f52830ed7 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Thu, 23 Apr 2026 18:20:05 +0200
Subject: [PATCH 05/46] feat(agents): folder-based markdown discovery
 (<id>/agent.md)

BREAKING CHANGE: top-level config/agents/*.md is no longer loaded. Use
<agentId>/agent.md. The skills directory name is reserved and skipped.
Orphan top-level .md files error at load; subdirs without agent.md error.

Export agentIdFromMarkdownPath for path-based id resolution.
---
 packages/appkit/src/core/agent/load-agents.ts | 109 ++++++++-----
 .../src/core/agent/tests/load-agents.test.ts  | 146 ++++++++++++------
 packages/appkit/src/core/agent/types.ts       |   2 +-
 packages/appkit/src/plugins/agents/index.ts   |   1 +
 .../agents/tests/agents-plugin.test.ts        |  36 ++---
 5 files changed, 192 insertions(+), 102 deletions(-)

diff --git a/packages/appkit/src/core/agent/load-agents.ts b/packages/appkit/src/core/agent/load-agents.ts
index 8f9fd1be7..e557a1ebb 100644
--- a/packages/appkit/src/core/agent/load-agents.ts
+++ b/packages/appkit/src/core/agent/load-agents.ts
@@ -36,9 +36,9 @@ export interface LoadContext {
 }
 
 export interface LoadResult {
-  /** Agent definitions keyed by file-stem name. */
+  /** Agent definitions keyed by agent id (directory name under `dir`). */
   defs: Record<string, AgentDefinition>;
-  /** First file with `default: true` frontmatter, or `null`. */
+  /** First agent with `default: true` frontmatter (sorted id order), or `null`. */
   defaultAgent: string | null;
 }
 
@@ -48,11 +48,10 @@ interface Frontmatter {
   toolkits?: ToolkitSpec[];
   tools?: string[];
   /**
-   * Sibling file-stems to expose as sub-agents. Each becomes an
-   * `agent-<stem>` tool on this agent at runtime. Resolution happens at
-   * directory-load time in {@link loadAgentsFromDir}; the single-file
-   * {@link loadAgentFromFile} path rejects non-empty values since there
-   * are no siblings to resolve against.
+   * Other agent ids to expose as sub-agents. Each becomes an `agent-<id>`
+   * tool at runtime. Resolution happens at directory-load time in
+   * {@link loadAgentsFromDir}; the single-file {@link loadAgentFromFile} path
+   * rejects non-empty values since there are no siblings to resolve against.
    */
   agents?: string[];
   maxSteps?: number;
@@ -64,6 +63,21 @@ interface Frontmatter {
 
 type ToolkitSpec = string | { [pluginName: string]: ToolkitOptions | string[] };
 
+/**
+ * Derives the logical agent id from a markdown path. When the file is named
+ * `agent.md`, the id is the parent directory name (folder-based layout);
+ * otherwise the id is the file stem (e.g. legacy single-file paths).
+ */
+export function agentIdFromMarkdownPath(filePath: string): string {
+  const normalized = path.normalize(filePath);
+  const base = path.basename(normalized);
+  const parent = path.basename(path.dirname(normalized));
+  if (base === "agent.md" && parent && parent !== "." && parent !== "..") {
+    return parent;
+  }
+  return path.basename(normalized, ".md");
+}
+
 const ALLOWED_KEYS = new Set([
   "endpoint",
   "model",
@@ -90,7 +104,7 @@ export async function loadAgentFromFile(
   ctx: LoadContext,
 ): Promise<AgentDefinition> {
   const raw = fs.readFileSync(filePath, "utf-8");
-  const name = path.basename(filePath, ".md");
+  const name = agentIdFromMarkdownPath(filePath);
   const { data } = parseFrontmatter(raw, filePath);
   if (Array.isArray(data?.agents) && data.agents.length > 0) {
     throw new Error(
@@ -103,15 +117,19 @@ export async function loadAgentFromFile(
 }
 
 /**
- * Scans a directory for `*.md` files and produces an `AgentDefinition` record
- * keyed by file-stem. Throws on frontmatter errors or unresolved references.
- * Returns an empty map if the directory does not exist.
+ * Scans a directory for one subdirectory per agent, each containing
+ * `agent.md` (frontmatter + body). Produces an `AgentDefinition` record keyed
+ * by agent id (folder name). Throws on frontmatter errors or unresolved
+ * references. Returns an empty map if the directory does not exist.
+ *
+ * Legacy top-level `*.md` files are rejected with an error — migrate each to
+ * `<id>/agent.md` under a sibling folder named for the agent id.
  *
  * Runs in two passes so sub-agent references in frontmatter (`agents: [...]`)
- * can be resolved regardless of file-system iteration order:
+ * can be resolved regardless of directory iteration order:
  *
- * 1. Build every agent's definition from its own file.
- * 2. Walk `agents:` references and wire `def.agents = { sibling: siblingDef }`
+ * 1. Build every agent's definition from its own `agent.md`.
+ * 2. Walk `agents:` references and wire `def.agents = { child: childDef }`
  *    by looking them up in the complete map. Dangling names and
  *    self-references fail loudly; mutual delegation is allowed and bounded
  *    at runtime by `limits.maxSubAgentDepth`.
@@ -123,37 +141,56 @@ export async function loadAgentsFromDir(
   if (!fs.existsSync(dir)) {
     return { defs: {}, defaultAgent: null };
   }
-  // Sort so `default: true` resolution is deterministic across platforms —
-  // `readdirSync` order is filesystem-dependent (macOS alphabetical, ext4
-  // inode order, etc.).
-  const files = fs
-    .readdirSync(dir)
-    .filter((f) => f.endsWith(".md"))
+
+  const entries = fs.readdirSync(dir, { withFileTypes: true });
+  const orphanMd = entries
+    .filter((e) => e.isFile() && e.name.endsWith(".md"))
+    .map((e) => e.name)
     .sort();
+
+  if (orphanMd.length > 0) {
+    const hint = orphanMd
+      .map((f) => `${path.basename(f, ".md")}/agent.md`)
+      .join(", ");
+    throw new Error(
+      `Agents directory contains unsupported top-level markdown file(s): ${orphanMd.join(", ")}. ` +
+        `Use one folder per agent with a fixed entry file, e.g. ${hint}.`,
+    );
+  }
+
+  /** Reserved folder name until per-agent skills land; not an agent package. */
+  const RESERVED_DIRS = new Set(["skills"]);
+
+  const agentIds = entries
+    .filter((e) => e.isDirectory())
+    .map((e) => e.name)
+    .filter((name) => !RESERVED_DIRS.has(name))
+    .sort();
+
   const defs: Record<string, AgentDefinition> = {};
   const subAgentRefs: Record<string, string[]> = {};
   let defaultAgent: string | null = null;
 
-  // Pass 1: build every agent's definition; collect unresolved sibling refs.
-  for (const file of files) {
-    const fullPath = path.join(dir, file);
-    const raw = fs.readFileSync(fullPath, "utf-8");
-    const name = path.basename(file, ".md");
-    defs[name] = buildDefinition(name, raw, fullPath, ctx);
-    const { data } = parseFrontmatter(raw, fullPath);
-    if (data?.agents !== undefined) {
-      subAgentRefs[name] = normalizeAgentsFrontmatter(
-        data.agents,
-        name,
-        fullPath,
+  // Pass 1: build every agent's definition; collect sub-agent refs.
+  for (const id of agentIds) {
+    const agentPath = path.join(dir, id, "agent.md");
+    if (!fs.existsSync(agentPath)) {
+      throw new Error(
+        `Agents subdirectory '${path.join(dir, id)}' must contain agent.md.`,
       );
     }
+    const raw = fs.readFileSync(agentPath, "utf-8");
+    defs[id] = buildDefinition(id, raw, agentPath, ctx);
+    const { data } = parseFrontmatter(raw, agentPath);
+    if (data?.agents !== undefined) {
+      subAgentRefs[id] = normalizeAgentsFrontmatter(data.agents, id, agentPath);
+    }
     if (data?.default === true && !defaultAgent) {
-      defaultAgent = name;
+      defaultAgent = id;
     }
   }
 
-  // Pass 2: resolve sibling references against the complete defs map.
+  // Pass 2: resolve sub-agent references against the complete defs map.
   // Code-defined agents (ctx.codeAgents) take precedence over markdown ones
   // with the same name, matching the plugin's top-level merge behaviour.
   for (const [name, refs] of Object.entries(subAgentRefs)) {
@@ -163,7 +200,7 @@ export async function loadAgentsFromDir(
     for (const ref of refs) {
       if (ref === name) {
         throw new Error(
-          `Agent '${name}' (${path.join(dir, `${name}.md`)}) cannot reference itself in 'agents:'.`,
+          `Agent '${name}' (${path.join(dir, name, "agent.md")}) cannot reference itself in 'agents:'.`,
         );
       }
       const sibling = ctx.codeAgents?.[ref] ?? defs[ref];
@@ -203,7 +240,7 @@ function normalizeAgentsFrontmatter(
   if (!Array.isArray(value)) {
     throw new Error(
       `Agent '${agentName}' (${filePath}) has invalid 'agents:' frontmatter: ` +
-        `expected an array of sibling file-stems, got ${typeof value}.`,
+        `expected an array of sibling agent ids, got ${typeof value}.`,
     );
   }
   const out: string[] = [];
diff --git a/packages/appkit/src/core/agent/tests/load-agents.test.ts b/packages/appkit/src/core/agent/tests/load-agents.test.ts
index 23799148e..8176cef13 100644
--- a/packages/appkit/src/core/agent/tests/load-agents.test.ts
+++ b/packages/appkit/src/core/agent/tests/load-agents.test.ts
@@ -5,6 +5,7 @@ import { afterEach, beforeEach, describe, expect, test } from "vitest";
 import { z } from "zod";
 import { buildToolkitEntries } from "../../../core/agent/build-toolkit";
 import {
+  agentIdFromMarkdownPath,
   loadAgentFromFile,
   loadAgentsFromDir,
   parseFrontmatter,
@@ -23,11 +24,33 @@ afterEach(() => {
   fs.rmSync(workDir, { recursive: true, force: true });
 });
 
-function write(name: string, content: string) {
+/** Flat file under workDir (for legacy loadAgentFromFile tests). */
+function writeRoot(name: string, content: string) {
   fs.writeFileSync(path.join(workDir, name), content, "utf-8");
   return path.join(workDir, name);
 }
 
+/** Folder layout: `<id>/agent.md`. */
+function writeAgent(id: string, content: string) {
+  const dir = path.join(workDir, id);
+  fs.mkdirSync(dir, { recursive: true });
+  const p = path.join(dir, "agent.md");
+  fs.writeFileSync(p, content, "utf-8");
+  return p;
+}
+
+describe("agentIdFromMarkdownPath", () => {
+  test("uses parent folder name when file is agent.md", () => {
+    expect(agentIdFromMarkdownPath("/foo/bar/assistant/agent.md")).toBe(
+      "assistant",
+    );
+  });
+
+  test("uses file stem for other .md names", () => {
+    expect(agentIdFromMarkdownPath("/tmp/assistant.md")).toBe("assistant");
+  });
+});
+
 describe("parseFrontmatter", () => {
   test("parses a simple object", () => {
     const { data, content } = parseFrontmatter(
@@ -57,7 +80,7 @@ describe("parseFrontmatter", () => {
 
 describe("loadAgentFromFile", () => {
   test("returns AgentDefinition with body as instructions", async () => {
-    const p = write(
+    const p = writeRoot(
       "assistant.md",
       "---\nendpoint: e-1\n---\nYou are helpful.",
     );
@@ -66,6 +89,13 @@ describe("loadAgentFromFile", () => {
     expect(def.instructions).toBe("You are helpful.");
     expect(def.model).toBe("e-1");
   });
+
+  test("derives agent id from folder when path ends with agent.md", async () => {
+    const p = writeAgent("router", "---\nendpoint: e-1\n---\nRoute traffic.");
+    const def = await loadAgentFromFile(p, {});
+    expect(def.name).toBe("router");
+    expect(def.instructions).toBe("Route traffic.");
+  });
 });
 
 describe("loadAgentsFromDir", () => {
@@ -75,23 +105,44 @@ describe("loadAgentsFromDir", () => {
     expect(res.defaultAgent).toBeNull();
   });
 
-  test("loads all .md files keyed by file-stem", async () => {
-    write("support.md", "---\nendpoint: e-1\n---\nSupport prompt.");
-    write("sales.md", "---\nendpoint: e-2\n---\nSales prompt.");
+  test("loads each subdirectory with agent.md keyed by folder name", async () => {
+    writeAgent("support", "---\nendpoint: e-1\n---\nSupport prompt.");
+    writeAgent("sales", "---\nendpoint: e-2\n---\nSales prompt.");
     const res = await loadAgentsFromDir(workDir, {});
     expect(Object.keys(res.defs).sort()).toEqual(["sales", "support"]);
   });
 
-  test("picks up default: true from frontmatter", async () => {
-    write("one.md", "---\nendpoint: a\n---\nOne.");
-    write("two.md", "---\nendpoint: b\ndefault: true\n---\nTwo.");
+  test("throws when legacy top-level .md exists", async () => {
+    writeRoot("assistant.md", "---\nendpoint: e\n---\nLegacy flat file.");
+    await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
+      /unsupported top-level markdown file\(s\): assistant\.md.*assistant\/agent\.md/s,
+    );
+  });
+
+  test("throws when a subdirectory lacks agent.md", async () => {
+    fs.mkdirSync(path.join(workDir, "broken"), { recursive: true });
+    await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
+      /must contain agent\.md/,
+    );
+  });
+
+  test("ignores reserved skills directory without agent.md", async () => {
+    fs.mkdirSync(path.join(workDir, "skills"), { recursive: true });
+    writeAgent("solo", "---\nendpoint: e\n---\nOnly real agent.");
+    const res = await loadAgentsFromDir(workDir, {});
+    expect(Object.keys(res.defs)).toEqual(["solo"]);
+  });
+
+  test("picks up default: true from frontmatter (deterministic sorted ids)", async () => {
+    writeAgent("one", "---\nendpoint: a\n---\nOne.");
+    writeAgent("two", "---\nendpoint: b\ndefault: true\n---\nTwo.");
     const res = await loadAgentsFromDir(workDir, {});
     expect(res.defaultAgent).toBe("two");
   });
 
   test("throws when frontmatter references an unregistered plugin", async () => {
-    write(
-      "broken.md",
+    writeAgent(
+      "broken",
       "---\nendpoint: e\ntoolkits: [missing]\n---\nBroken agent.",
     );
     await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
@@ -100,7 +151,10 @@ describe("loadAgentsFromDir", () => {
   });
 
   test("throws when frontmatter references an unknown ambient tool", async () => {
-    write("broken.md", "---\nendpoint: e\ntools: [unknown_tool]\n---\nBroken.");
+    writeAgent(
+      "broken",
+      "---\nendpoint: e\ntools: [unknown_tool]\n---\nBroken.",
+    );
     await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
       /references tool 'unknown_tool'/,
     );
@@ -134,8 +188,8 @@ describe("loadAgentsFromDir", () => {
       execute: async () => "sunny",
     });
 
-    write(
-      "analyst.md",
+    writeAgent(
+      "analyst",
       "---\nendpoint: e\ntoolkits:\n  - analytics\ntools:\n  - get_weather\n---\nBody.",
     );
     const res = await loadAgentsFromDir(workDir, {
@@ -150,15 +204,13 @@ describe("loadAgentsFromDir", () => {
   });
 
   describe("agents: sibling sub-agent references", () => {
-    test("resolves sibling references into def.agents regardless of file order", async () => {
-      // Names chosen so alphabetical iteration puts `dispatcher` *before*
-      // its siblings — pass-1 populates defs in any order, pass-2 resolves.
-      write(
-        "dispatcher.md",
+    test("resolves sibling references into def.agents regardless of folder order", async () => {
+      writeAgent(
+        "dispatcher",
         "---\nendpoint: e\nagents:\n  - analyst\n  - writer\n---\nRoute work.",
       );
-      write("analyst.md", "---\nendpoint: e\n---\nAnalyst.");
-      write("writer.md", "---\nendpoint: e\n---\nWriter.");
+      writeAgent("analyst", "---\nendpoint: e\n---\nAnalyst.");
+      writeAgent("writer", "---\nendpoint: e\n---\nWriter.");
 
       const res = await loadAgentsFromDir(workDir, {});
       expect(Object.keys(res.defs.dispatcher.agents ?? {}).sort()).toEqual([
@@ -167,14 +219,13 @@ describe("loadAgentsFromDir", () => {
       ]);
       expect(res.defs.dispatcher.agents?.analyst).toBe(res.defs.analyst);
       expect(res.defs.dispatcher.agents?.writer).toBe(res.defs.writer);
-      // Leaves with no `agents:` retain undefined — only declared keys wire.
       expect(res.defs.analyst.agents).toBeUndefined();
       expect(res.defs.writer.agents).toBeUndefined();
     });
 
     test("mutual delegation is allowed (runtime depth cap handles cycles)", async () => {
-      write("a.md", "---\nendpoint: e\nagents:\n  - b\n---\nA.");
-      write("b.md", "---\nendpoint: e\nagents:\n  - a\n---\nB.");
+      writeAgent("a", "---\nendpoint: e\nagents:\n  - b\n---\nA.");
+      writeAgent("b", "---\nendpoint: e\nagents:\n  - a\n---\nB.");
 
       const res = await loadAgentsFromDir(workDir, {});
       expect(res.defs.a.agents?.b).toBe(res.defs.b);
@@ -182,16 +233,16 @@ describe("loadAgentsFromDir", () => {
     });
 
     test("throws with available list when a sibling is missing", async () => {
-      write("dispatcher.md", "---\nendpoint: e\nagents:\n  - ghost\n---\nD.");
-      write("analyst.md", "---\nendpoint: e\n---\nAnalyst.");
+      writeAgent("dispatcher", "---\nendpoint: e\nagents:\n  - ghost\n---\nD.");
+      writeAgent("analyst", "---\nendpoint: e\n---\nAnalyst.");
       await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
         /references sub-agent\(s\) 'ghost'.*Available: analyst, dispatcher/s,
       );
     });
 
     test("reports every missing sibling in one error, not just the first", async () => {
-      write(
-        "dispatcher.md",
+      writeAgent(
+        "dispatcher",
         "---\nendpoint: e\nagents:\n  - ghost1\n  - ghost2\n---\nD.",
       );
       await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
@@ -200,33 +251,33 @@ describe("loadAgentsFromDir", () => {
     });
 
     test("throws on self-reference", async () => {
-      write("solo.md", "---\nendpoint: e\nagents:\n  - solo\n---\nSolo.");
+      writeAgent("solo", "---\nendpoint: e\nagents:\n  - solo\n---\nSolo.");
       await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
         /'solo'.*cannot reference itself/s,
       );
     });
 
     test("throws on non-array 'agents:' value", async () => {
-      write("bad.md", "---\nendpoint: e\nagents: analyst\n---\nBad.");
-      write("analyst.md", "---\nendpoint: e\n---\nAnalyst.");
+      writeAgent("bad", "---\nendpoint: e\nagents: analyst\n---\nBad.");
+      writeAgent("analyst", "---\nendpoint: e\n---\nAnalyst.");
       await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
         /invalid 'agents:' frontmatter/,
       );
     });
 
     test("throws on non-string entries in 'agents:'", async () => {
-      write("bad.md", "---\nendpoint: e\nagents:\n  - 42\n---\nBad.");
+      writeAgent("bad", "---\nendpoint: e\nagents:\n  - 42\n---\nBad.");
       await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
         /invalid 'agents:' entry/,
       );
     });
 
     test("deduplicates repeated entries silently", async () => {
-      write(
-        "dispatcher.md",
+      writeAgent(
+        "dispatcher",
         "---\nendpoint: e\nagents:\n  - analyst\n  - analyst\n---\nD.",
       );
-      write("analyst.md", "---\nendpoint: e\n---\nAnalyst.");
+      writeAgent("analyst", "---\nendpoint: e\n---\nAnalyst.");
       const res = await loadAgentsFromDir(workDir, {});
       expect(Object.keys(res.defs.dispatcher.agents ?? {})).toEqual([
         "analyst",
@@ -234,13 +285,16 @@ describe("loadAgentsFromDir", () => {
     });
 
     test("empty array yields no sub-agents (no-op)", async () => {
-      write("dispatcher.md", "---\nendpoint: e\nagents: []\n---\nD.");
+      writeAgent("dispatcher", "---\nendpoint: e\nagents: []\n---\nD.");
       const res = await loadAgentsFromDir(workDir, {});
       expect(res.defs.dispatcher.agents).toBeUndefined();
     });
 
     test("resolves 'agents:' references against codeAgents when provided", async () => {
-      write("dispatcher.md", "---\nendpoint: e\nagents:\n  - support\n---\nD.");
+      writeAgent(
+        "dispatcher",
+        "---\nendpoint: e\nagents:\n  - support\n---\nD.",
+      );
       const support: AgentDefinition = {
         name: "support",
         instructions: "Code-defined support.",
@@ -252,8 +306,11 @@ describe("loadAgentsFromDir", () => {
     });
 
     test("codeAgents takes precedence over markdown sibling with the same name", async () => {
-      write("dispatcher.md", "---\nendpoint: e\nagents:\n  - support\n---\nD.");
-      write("support.md", "---\nendpoint: e\n---\nMarkdown support.");
+      writeAgent(
+        "dispatcher",
+        "---\nendpoint: e\nagents:\n  - support\n---\nD.",
+      );
+      writeAgent("support", "---\nendpoint: e\n---\nMarkdown support.");
       const codeSupport: AgentDefinition = {
         name: "support",
         instructions: "Code support.",
@@ -261,8 +318,6 @@ describe("loadAgentsFromDir", () => {
       const res = await loadAgentsFromDir(workDir, {
         codeAgents: { support: codeSupport },
       });
-      // Reference binds to code version, matching the plugin's top-level
-      // `code wins` merge behaviour.
       expect(res.defs.dispatcher.agents?.support).toBe(codeSupport);
       expect(res.defs.dispatcher.agents?.support.instructions).toBe(
         "Code support.",
@@ -270,8 +325,8 @@ describe("loadAgentsFromDir", () => {
     });
 
     test("missing-sibling error lists both markdown and code agent names", async () => {
-      write("dispatcher.md", "---\nendpoint: e\nagents:\n  - ghost\n---\nD.");
-      write("analyst.md", "---\nendpoint: e\n---\nAnalyst.");
+      writeAgent("dispatcher", "---\nendpoint: e\nagents:\n  - ghost\n---\nD.");
+      writeAgent("analyst", "---\nendpoint: e\n---\nAnalyst.");
       const codeAgent: AgentDefinition = {
         name: "writer",
         instructions: "Writer.",
@@ -285,7 +340,7 @@ describe("loadAgentsFromDir", () => {
 
 describe("loadAgentFromFile — sub-agent refs rejected", () => {
   test("throws when 'agents:' is non-empty in a single-file load", async () => {
-    const p = write(
+    const p = writeRoot(
       "lonely.md",
       "---\nendpoint: e\nagents:\n  - ghost\n---\nLonely.",
     );
@@ -295,7 +350,10 @@ describe("loadAgentFromFile — sub-agent refs rejected", () => {
   });
 
   test("ignores empty 'agents:' array (treated as absent)", async () => {
-    const p = write("lonely.md", "---\nendpoint: e\nagents: []\n---\nLonely.");
+    const p = writeRoot(
+      "lonely.md",
+      "---\nendpoint: e\nagents: []\n---\nLonely.",
+    );
     const def = await loadAgentFromFile(p, {});
     expect(def.agents).toBeUndefined();
   });
diff --git a/packages/appkit/src/core/agent/types.ts b/packages/appkit/src/core/agent/types.ts
index d752fa019..1b86a1c97 100644
--- a/packages/appkit/src/core/agent/types.ts
+++ b/packages/appkit/src/core/agent/types.ts
@@ -110,7 +110,7 @@ export interface AutoInheritToolsConfig {
 }
 
 export interface AgentsPluginConfig extends BasePluginConfig {
-  /** Directory to scan for markdown agent files. Default `./config/agents`. Set to `false` to disable. */
+  /** Directory of agent packages (`<id>/agent.md` each). Default `./config/agents`. Set to `false` to disable. */
   dir?: string | false;
   /** Code-defined agents, merged with file-loaded ones (code wins on key collision). */
   agents?: Record<string, AgentDefinition>;
diff --git a/packages/appkit/src/plugins/agents/index.ts b/packages/appkit/src/plugins/agents/index.ts
index 8220a55e7..c8a31aac3 100644
--- a/packages/appkit/src/plugins/agents/index.ts
+++ b/packages/appkit/src/plugins/agents/index.ts
@@ -1,6 +1,7 @@
 export { AgentsPlugin, agents } from "./agents";
 export { buildToolkitEntries } from "../../core/agent/build-toolkit";
 export {
+  agentIdFromMarkdownPath,
   type LoadContext,
   type LoadResult,
   loadAgentFromFile,
diff --git a/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts b/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
index 43ad8c104..9c043d56f 100644
--- a/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
+++ b/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
@@ -102,6 +102,12 @@ function instantiate(config: AgentsPluginConfig, ctx?: FakeContext) {
   return plugin;
 }
 
+function writeMarkdownAgent(dir: string, id: string, content: string) {
+  const folder = path.join(dir, id);
+  fs.mkdirSync(folder, { recursive: true });
+  fs.writeFileSync(path.join(folder, "agent.md"), content, "utf-8");
+}
+
 describe("AgentsPlugin", () => {
   test("registers code-defined agents and exposes them via exports", async () => {
     const plugin = instantiate({
@@ -124,10 +130,10 @@ describe("AgentsPlugin", () => {
   });
 
   test("loads markdown agents from a directory", async () => {
-    fs.writeFileSync(
-      path.join(tmpDir, "assistant.md"),
+    writeMarkdownAgent(
+      tmpDir,
+      "assistant",
       "---\ndefault: true\n---\nYou are helpful.",
-      "utf-8",
     );
     const plugin = instantiate({
       dir: tmpDir,
@@ -144,11 +150,7 @@ describe("AgentsPlugin", () => {
   });
 
   test("code definitions override markdown on key collision", async () => {
-    fs.writeFileSync(
-      path.join(tmpDir, "support.md"),
-      "---\n---\nFrom markdown.",
-      "utf-8",
-    );
+    writeMarkdownAgent(tmpDir, "support", "---\n---\nFrom markdown.");
     const plugin = instantiate({
       dir: tmpDir,
       defaultModel: stubAdapter(),
@@ -179,11 +181,7 @@ describe("AgentsPlugin", () => {
     const provider = makeToolProvider("analytics", registry);
     const ctx = fakeContext([{ name: "analytics", provider }]);
 
-    fs.writeFileSync(
-      path.join(tmpDir, "assistant.md"),
-      "---\n---\nYou are helpful.",
-      "utf-8",
-    );
+    writeMarkdownAgent(tmpDir, "assistant", "---\n---\nYou are helpful.");
 
     const plugin = instantiate(
       {
@@ -228,11 +226,7 @@ describe("AgentsPlugin", () => {
     const provider = makeToolProvider("analytics", registry);
     const ctx = fakeContext([{ name: "analytics", provider }]);
 
-    fs.writeFileSync(
-      path.join(tmpDir, "assistant.md"),
-      "---\n---\nYou are helpful.",
-      "utf-8",
-    );
+    writeMarkdownAgent(tmpDir, "assistant", "---\n---\nYou are helpful.");
 
     const plugin = instantiate(
       {
@@ -313,10 +307,10 @@ describe("AgentsPlugin", () => {
       { name: "files", provider: makeToolProvider("files", registry2) },
     ]);
 
-    fs.writeFileSync(
-      path.join(tmpDir, "analyst.md"),
+    writeMarkdownAgent(
+      tmpDir,
+      "analyst",
       "---\ntoolkits: [analytics]\n---\nAnalyst.",
-      "utf-8",
     );
 
     const plugin = instantiate(

From e4c1b01eb103db12bce18b091fef330fe0b0f030 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Thu, 23 Apr 2026 21:37:29 +0200
Subject: [PATCH 06/46] refactor(appkit): promote MCP client + host policy to
 connectors/mcp
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The MCP transport client and host policy aren't agents-specific; they are
HTTP + JSON-RPC transport with URL/DNS allowlisting. Move them under
packages/appkit/src/connectors/mcp/ so they sit alongside the other
transport-layer modules (serving, genie, sql-warehouse, lakebase, …) and
stop being reachable only through the agents plugin.

- Move mcp-client.ts          -> connectors/mcp/client.ts
- Move mcp-host-policy.ts     -> connectors/mcp/host-policy.ts
- Move McpEndpointConfig type -> connectors/mcp/types.ts
- Add connectors/mcp/index.ts barrel; re-export from connectors/index.ts
- Move mcp-client / mcp-host-policy tests to connectors/mcp/tests/
- Agents plugin keeps hosted-tools.ts (HostedTool sugar + resolve) and
  imports connector types from ../../connectors/mcp.
- tools/ barrel now re-exports AppKitMcpClient from connectors/mcp/client
  instead of the old plugins/agents path (the re-export was never public).

No behaviour change. All existing tests pass against the new paths.
---
 knip.json                                     | 10 +++---
 packages/appkit/src/connectors/index.ts       |  1 +
 .../mcp/client.ts}                            |  8 ++---
 .../mcp/host-policy.ts}                       |  0
 packages/appkit/src/connectors/mcp/index.ts   |  6 ++++
 .../mcp/tests/client.test.ts}                 |  4 +--
 .../mcp/tests/host-policy.test.ts}            |  2 +-
 packages/appkit/src/connectors/mcp/types.ts   | 12 +++++++
 .../src/core/agent/tools/hosted-tools.ts      |  8 ++---
 packages/appkit/src/core/agent/tools/index.ts |  2 +-
 packages/appkit/src/core/agent/types.ts       |  2 +-
 packages/appkit/src/plugins/agents/agents.ts  | 36 +++++++++++--------
 12 files changed, 58 insertions(+), 33 deletions(-)
 rename packages/appkit/src/{plugins/agents/tools/mcp-client.ts => connectors/mcp/client.ts} (98%)
 rename packages/appkit/src/{plugins/agents/tools/mcp-host-policy.ts => connectors/mcp/host-policy.ts} (100%)
 create mode 100644 packages/appkit/src/connectors/mcp/index.ts
 rename packages/appkit/src/{plugins/agents/tests/mcp-client.test.ts => connectors/mcp/tests/client.test.ts} (98%)
 rename packages/appkit/src/{plugins/agents/tests/mcp-host-policy.test.ts => connectors/mcp/tests/host-policy.test.ts} (99%)
 create mode 100644 packages/appkit/src/connectors/mcp/types.ts

diff --git a/knip.json b/knip.json
index 101b9253a..f530b3918 100644
--- a/knip.json
+++ b/knip.json
@@ -19,13 +19,15 @@
     "packages/appkit/src/plugin/index.ts",
     "packages/appkit/src/plugin/to-plugin.ts",
     "packages/appkit/src/plugins/agents/index.ts",
-    "packages/appkit/src/plugins/agents/tools/index.ts",
-    "packages/appkit/src/plugins/agents/from-plugin.ts",
-    "packages/appkit/src/plugins/agents/load-agents.ts",
     "template/**",
     "tools/**",
     "docs/**",
-    ".github/scripts/**"
+    ".github/scripts/**",
+    "packages/appkit/src/core/agent/tools/index.ts",
+    "packages/appkit/src/core/agent/from-plugin.ts",
+    "packages/appkit/src/core/agent/load-agents.ts",
+    "packages/appkit/src/connectors/mcp/index.ts",
+    "packages/appkit/src/plugin/to-plugin.ts"
   ],
   "ignoreDependencies": ["json-schema-to-typescript"],
   "ignoreBinaries": ["tarball"]
diff --git a/packages/appkit/src/connectors/index.ts b/packages/appkit/src/connectors/index.ts
index aa22895e1..cff0d152d 100644
--- a/packages/appkit/src/connectors/index.ts
+++ b/packages/appkit/src/connectors/index.ts
@@ -3,5 +3,6 @@ export * from "./genie";
 export * from "./jobs";
 export * from "./lakebase";
 export * from "./lakebase-v1";
+export * from "./mcp";
 export * from "./sql-warehouse";
 export * from "./vector-search";
diff --git a/packages/appkit/src/plugins/agents/tools/mcp-client.ts b/packages/appkit/src/connectors/mcp/client.ts
similarity index 98%
rename from packages/appkit/src/plugins/agents/tools/mcp-client.ts
rename to packages/appkit/src/connectors/mcp/client.ts
index a68394438..4c8d058b7 100644
--- a/packages/appkit/src/plugins/agents/tools/mcp-client.ts
+++ b/packages/appkit/src/connectors/mcp/client.ts
@@ -23,16 +23,16 @@
  * transport.
  */
 import type { AgentToolDefinition } from "shared";
-import type { McpEndpointConfig } from "../../../core/agent/tools/hosted-tools";
-import { createLogger } from "../../../logging/logger";
+import { createLogger } from "../../logging/logger";
 import {
   assertResolvedHostSafe,
   checkMcpUrl,
   type DnsLookup,
   type McpHostPolicy,
-} from "./mcp-host-policy";
+} from "./host-policy";
+import type { McpEndpointConfig } from "./types";
 
-const logger = createLogger("agent:mcp");
+const logger = createLogger("connector:mcp");
 
 interface JsonRpcRequest {
   jsonrpc: "2.0";
diff --git a/packages/appkit/src/plugins/agents/tools/mcp-host-policy.ts b/packages/appkit/src/connectors/mcp/host-policy.ts
similarity index 100%
rename from packages/appkit/src/plugins/agents/tools/mcp-host-policy.ts
rename to packages/appkit/src/connectors/mcp/host-policy.ts
diff --git a/packages/appkit/src/connectors/mcp/index.ts b/packages/appkit/src/connectors/mcp/index.ts
new file mode 100644
index 000000000..f9f32a418
--- /dev/null
+++ b/packages/appkit/src/connectors/mcp/index.ts
@@ -0,0 +1,6 @@
+export { AppKitMcpClient } from "./client";
+export {
+  buildMcpHostPolicy,
+  type McpHostPolicyConfig,
+} from "./host-policy";
+export type { McpEndpointConfig } from "./types";
diff --git a/packages/appkit/src/plugins/agents/tests/mcp-client.test.ts b/packages/appkit/src/connectors/mcp/tests/client.test.ts
similarity index 98%
rename from packages/appkit/src/plugins/agents/tests/mcp-client.test.ts
rename to packages/appkit/src/connectors/mcp/tests/client.test.ts
index 483fb5f45..0cdffa291 100644
--- a/packages/appkit/src/plugins/agents/tests/mcp-client.test.ts
+++ b/packages/appkit/src/connectors/mcp/tests/client.test.ts
@@ -1,6 +1,6 @@
 import { beforeEach, describe, expect, test, vi } from "vitest";
-import { AppKitMcpClient } from "../tools/mcp-client";
-import type { DnsLookup, McpHostPolicy } from "../tools/mcp-host-policy";
+import { AppKitMcpClient } from "../client";
+import type { DnsLookup, McpHostPolicy } from "../host-policy";
 
 const WORKSPACE = "https://test-workspace.cloud.databricks.com";
 
diff --git a/packages/appkit/src/plugins/agents/tests/mcp-host-policy.test.ts b/packages/appkit/src/connectors/mcp/tests/host-policy.test.ts
similarity index 99%
rename from packages/appkit/src/plugins/agents/tests/mcp-host-policy.test.ts
rename to packages/appkit/src/connectors/mcp/tests/host-policy.test.ts
index 06d986273..451536ed5 100644
--- a/packages/appkit/src/plugins/agents/tests/mcp-host-policy.test.ts
+++ b/packages/appkit/src/connectors/mcp/tests/host-policy.test.ts
@@ -8,7 +8,7 @@ import {
   isLoopbackHost,
   type McpHostPolicy,
   type McpHostPolicyConfig,
-} from "../tools/mcp-host-policy";
+} from "../host-policy";
 
 function stubLookup(
   addresses: Array<{ address: string; family?: number }>,
diff --git a/packages/appkit/src/connectors/mcp/types.ts b/packages/appkit/src/connectors/mcp/types.ts
new file mode 100644
index 000000000..d74f0a46c
--- /dev/null
+++ b/packages/appkit/src/connectors/mcp/types.ts
@@ -0,0 +1,12 @@
+/**
+ * Input shape consumed by {@link AppKitMcpClient.connect}. Produced by the
+ * agents plugin from user-facing `HostedTool` declarations (see
+ * `core/agent/tools/hosted-tools.ts`) and accepted directly by the
+ * connector to keep its surface free of agent-layer concepts.
+ */
+export interface McpEndpointConfig {
+  /** Stable logical name used as the `mcp.<name>.*` tool prefix and in logs. */
+  name: string;
+  /** Absolute URL (`https://…`) or workspace-relative path (`/api/2.0/mcp/…`). */
+  url: string;
+}
diff --git a/packages/appkit/src/core/agent/tools/hosted-tools.ts b/packages/appkit/src/core/agent/tools/hosted-tools.ts
index bce70c4fb..c1f067676 100644
--- a/packages/appkit/src/core/agent/tools/hosted-tools.ts
+++ b/packages/appkit/src/core/agent/tools/hosted-tools.ts
@@ -1,3 +1,5 @@
+import type { McpEndpointConfig } from "../../../connectors/mcp";
+
 export interface GenieTool {
   type: "genie-space";
   genie_space: { id: string };
@@ -37,12 +39,6 @@ export function isHostedTool(value: unknown): value is HostedTool {
   return typeof obj.type === "string" && HOSTED_TOOL_TYPES.has(obj.type);
 }
 
-export interface McpEndpointConfig {
-  name: string;
-  /** Absolute URL or path relative to workspace host */
-  url: string;
-}
-
 /**
  * Resolves HostedTool configs into MCP endpoint configurations
  * that the MCP client can connect to.
diff --git a/packages/appkit/src/core/agent/tools/index.ts b/packages/appkit/src/core/agent/tools/index.ts
index ee4aca7eb..053fdc15b 100644
--- a/packages/appkit/src/core/agent/tools/index.ts
+++ b/packages/appkit/src/core/agent/tools/index.ts
@@ -1,4 +1,4 @@
-export { AppKitMcpClient } from "../../../plugins/agents/tools/mcp-client";
+export { AppKitMcpClient } from "../../../connectors/mcp/client";
 export {
   defineTool,
   executeFromRegistry,
diff --git a/packages/appkit/src/core/agent/types.ts b/packages/appkit/src/core/agent/types.ts
index 1b86a1c97..14366e9ab 100644
--- a/packages/appkit/src/core/agent/types.ts
+++ b/packages/appkit/src/core/agent/types.ts
@@ -5,9 +5,9 @@ import type {
   ThreadStore,
   ToolAnnotations,
 } from "shared";
+import type { McpHostPolicyConfig } from "../../connectors/mcp";
 import type { FunctionTool } from "./tools/function-tool";
 import type { HostedTool } from "./tools/hosted-tools";
-import type { McpHostPolicyConfig } from "../../plugins/agents/tools/mcp-host-policy";
 
 /**
  * A tool reference produced by a plugin's `.toolkit()` call. The agents plugin
diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index 7b4006bc8..4c406f12e 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -14,24 +14,18 @@ import type {
   Thread,
   ToolProvider,
 } from "shared";
-import { createLogger } from "../../logging/logger";
-import { Plugin, toPlugin } from "../../plugin";
-import type { PluginManifest } from "../../registry";
-import { agentStreamDefaults } from "./defaults";
-import { EventChannel } from "./event-channel";
-import { AgentEventTranslator } from "./event-translator";
+import { buildMcpHostPolicy } from "../../connectors/mcp";
 import { loadAgentsFromDir } from "../../core/agent/load-agents";
-import manifest from "./manifest.json";
-import {
-  approvalRequestSchema,
-  chatRequestSchema,
-  invocationsRequestSchema,
-} from "./schemas";
 import {
   buildBaseSystemPrompt,
   composeSystemPrompt,
 } from "../../core/agent/system-prompt";
 import { AppKitMcpClient } from "../../connectors/mcp";
+import {
+  approvalRequestSchema,
+  chatRequestSchema,
+  invocationsRequestSchema,
+} from "./schemas";
 import { InMemoryThreadStore } from "./thread-store";
 import { ToolApprovalGate } from "./tool-approval-gate";
 import {
@@ -40,7 +34,6 @@ import {
   isHostedTool,
   resolveHostedTools,
 } from "../../core/agent/tools";
-import { buildMcpHostPolicy } from "./tools/mcp-host-policy";
 import type {
   AgentDefinition,
   AgentsPluginConfig,
@@ -50,6 +43,20 @@ import type {
   ResolvedToolEntry,
 } from "../../core/agent/types";
 import { isToolkitEntry } from "../../core/agent/types";
+import { createLogger } from "../../logging/logger";
+import { Plugin, toPlugin } from "../../plugin";
+import type { PluginManifest } from "../../registry";
+import { agentStreamDefaults } from "./defaults";
+import { EventChannel } from "./event-channel";
+import { AgentEventTranslator } from "./event-translator";
+import manifest from "./manifest.json";
+import {
+  approvalRequestSchema,
+  chatRequestSchema,
+  invocationsRequestSchema,
+} from "./schemas";
+import { InMemoryThreadStore } from "./thread-store";
+import { ToolApprovalGate } from "./tool-approval-gate";
 
 const logger = createLogger("agents");
 
@@ -368,7 +375,8 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     }
 
     // 2. Explicit tools (toolkit entries, function tools, hosted tools)
-    const hostedToCollect: import("../../core/agent/tools/hosted-tools").HostedTool[] = [];
+    const hostedToCollect: import("../../core/agent/tools/hosted-tools").HostedTool[] =
+      [];
     for (const [key, tool] of Object.entries(def.tools ?? {})) {
       if (isToolkitEntry(tool)) {
         index.set(key, {

From 1710809d7d0b2a564316c14e9574b11f7798063f Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Thu, 23 Apr 2026 22:06:39 +0200
Subject: [PATCH 07/46] refactor(appkit): extract normalizeToolResult,
 consumeAdapterStream, dispatchToolCall

Three small helpers pulled out of the AgentsPlugin streaming path to cut
duplication and shrink the two large methods.

- normalize-result.ts: void->"", JSON-stringify, 50K truncation with a
  human-readable marker. Unit-testable (previously covered only via the
  HTTP path).
- consume-adapter-stream.ts: the 'message_delta' + 'message' accumulation
  loop shared between _streamAgent and runSubAgent. Accepts an optional
  signal and per-event side-effect callback (for SSE translation).
- tool-dispatch.ts: one place that fans out toolkit/function/mcp/subagent
  entries. 'never'-typed default forces exhaustiveness: adding a fifth
  source is now a compile error at every call site.

_streamAgent: executeTool closure shrinks from ~60 lines of dispatch +
normalize to a single dispatchToolCall + normalizeToolResult call.
Stream consumption collapses to consumeAdapterStream.

runSubAgent: childExecute shrinks from ~30 lines of if/else dispatch to
one dispatchToolCall call. Adapter loop collapses to consumeAdapterStream.

Behaviour change (minor): childExecute previously silently fell through to
'Unsupported sub-agent tool source' when mcpClient or PluginContext was
missing; now it throws the same specific error as the main stream. Matches
the main-path behaviour.

Tests: 15 new unit tests for normalizeToolResult + consumeAdapterStream.
dispatchToolCall is exercised transitively through the full agent suite
(288 existing tests still pass, 303 total on this branch).
---
 .../src/core/agent/consume-adapter-stream.ts  | 52 +++++++++++
 .../appkit/src/core/agent/normalize-result.ts | 33 +++++++
 .../tests/consume-adapter-stream.test.ts      | 86 +++++++++++++++++++
 .../core/agent/tests/normalize-result.test.ts | 63 ++++++++++++++
 4 files changed, 234 insertions(+)
 create mode 100644 packages/appkit/src/core/agent/consume-adapter-stream.ts
 create mode 100644 packages/appkit/src/core/agent/normalize-result.ts
 create mode 100644 packages/appkit/src/core/agent/tests/consume-adapter-stream.test.ts
 create mode 100644 packages/appkit/src/core/agent/tests/normalize-result.test.ts

diff --git a/packages/appkit/src/core/agent/consume-adapter-stream.ts b/packages/appkit/src/core/agent/consume-adapter-stream.ts
new file mode 100644
index 000000000..c4f3d07ed
--- /dev/null
+++ b/packages/appkit/src/core/agent/consume-adapter-stream.ts
@@ -0,0 +1,52 @@
+import type { AgentEvent } from "shared";
+
+interface ConsumeAdapterStreamOptions {
+  /**
+   * Optional abort signal, checked each time the stream yields. Once aborted,
+   * the pending event is dropped and consumption stops; the caller should
+   * also pass the signal to `adapter.run` so upstream work stops too.
+   * `undefined` is valid — standalone `runAgent` runs without a signal.
+   */
+  signal?: AbortSignal;
+  /**
+   * Side-effect callback invoked once per consumed event, after the content
+   * accumulator has been updated; not called for an event dropped by abort.
+   * Use it to feed SSE translators, record events in tests, or emit telemetry.
+   */
+  onEvent?: (event: AgentEvent) => void;
+}
+
+/**
+ * Drain an adapter event stream and return the assistant text it produced.
+ *
+ * The text is built with one rule, used by every agent-execution path
+ * (HTTP streaming, sub-agents, standalone `runAgent`):
+ *
+ * - each `message_delta` appends its `content` to the text so far;
+ * - each `message` discards the text so far and becomes the new text.
+ *
+ * Both shapes are handled because adapters differ: streaming adapters
+ * (Databricks, Vercel AI) send deltas chunk-by-chunk, whereas LangChain's
+ * `on_chain_end` path sends one final `message`. Dropping the replace rule
+ * would silently lose LangChain assistant turns from thread history.
+ *
+ * Every other event type leaves the text untouched. The function performs
+ * no I/O itself; its only outward effect is calling `opts.onEvent`, and the
+ * only early exit is an aborted `opts.signal`.
+ */
+export async function consumeAdapterStream(
+  stream: AsyncIterable<AgentEvent>,
+  opts: ConsumeAdapterStreamOptions = {},
+): Promise<string> {
+  let assembled = "";
+  for await (const incoming of stream) {
+    // Re-checked per event; the event that arrives after an abort is dropped.
+    if (opts.signal?.aborted) break;
+    // A whole `message` overrides prior text, a delta extends it.
+    if (incoming.type === "message") assembled = incoming.content;
+    else if (incoming.type === "message_delta") assembled += incoming.content;
+    // Observers run only once the accumulator reflects this event.
+    opts.onEvent?.(incoming);
+  }
+  return assembled;
+}
diff --git a/packages/appkit/src/core/agent/normalize-result.ts b/packages/appkit/src/core/agent/normalize-result.ts
new file mode 100644
index 000000000..6fe2362cc
--- /dev/null
+++ b/packages/appkit/src/core/agent/normalize-result.ts
@@ -0,0 +1,33 @@
+/**
+ * Maximum serialized length of a tool result before we truncate with a
+ * human-readable marker. 50k chars is roughly 12k tokens — enough for
+ * reasonable SQL result sets and JSON blobs, well short of the per-call
+ * context limits on current frontier models.
+ */
+export const MAX_TOOL_RESULT_CHARS = 50_000;
+
+/**
+ * Normalise a raw tool-execution result for the LLM:
+ *
+ * - `undefined`, or a value `JSON.stringify` yields nothing for (function,
+ *   symbol) → empty string. A `void` return is legitimate for side-effecting
+ *   tools; handing `undefined` to the adapter reads as "execution failed".
+ * - results whose string / JSON form fits in `maxChars` are returned as-is
+ *   (non-strings are NOT stringified here; the caller serialises them).
+ * - longer results become a truncated string annotated with the original
+ *   length, so the model sees the cut rather than silent data loss.
+ *
+ * @throws TypeError from `JSON.stringify` on circular structures or BigInt.
+ */
+export function normalizeToolResult(
+  result: unknown,
+  maxChars: number = MAX_TOOL_RESULT_CHARS,
+): unknown {
+  // `JSON.stringify` is typed `string` but yields undefined for fn/symbol.
+  const serialized: string | undefined =
+    typeof result === "string" ? result : JSON.stringify(result);
+  if (serialized === undefined) return "";
+  return serialized.length > maxChars
+    ? `${serialized.slice(0, maxChars)}\n\n[Result truncated: ${serialized.length} chars exceeds ${maxChars} limit]`
+    : result;
+}
diff --git a/packages/appkit/src/core/agent/tests/consume-adapter-stream.test.ts b/packages/appkit/src/core/agent/tests/consume-adapter-stream.test.ts
new file mode 100644
index 000000000..98863a62a
--- /dev/null
+++ b/packages/appkit/src/core/agent/tests/consume-adapter-stream.test.ts
@@ -0,0 +1,86 @@
+import type { AgentEvent } from "shared";
+import { describe, expect, test } from "vitest";
+import { consumeAdapterStream } from "../consume-adapter-stream";
+
+async function* streamOf(
+  events: AgentEvent[],
+): AsyncGenerator<AgentEvent, void, unknown> {
+  for (const event of events) {
+    yield event;
+  }
+}
+
+describe("consumeAdapterStream", () => {
+  test("concatenates message_delta events into the final text", async () => {
+    const text = await consumeAdapterStream(
+      streamOf([
+        { type: "message_delta", content: "Hello " },
+        { type: "message_delta", content: "world" },
+      ]),
+    );
+    expect(text).toBe("Hello world");
+  });
+
+  test("a `message` event replaces whatever deltas arrived so far", async () => {
+    const text = await consumeAdapterStream(
+      streamOf([
+        { type: "message_delta", content: "partial" },
+        { type: "message", content: "final answer" },
+      ]),
+    );
+    expect(text).toBe("final answer");
+  });
+
+  test("invokes onEvent once per event, in order, with the raw event", async () => {
+    const seen: AgentEvent[] = [];
+    await consumeAdapterStream(
+      streamOf([
+        { type: "message_delta", content: "a" },
+        { type: "thinking", content: "…" },
+        { type: "message_delta", content: "b" },
+      ]),
+      { onEvent: (ev) => seen.push(ev) },
+    );
+    expect(seen.map((e) => e.type)).toEqual([
+      "message_delta",
+      "thinking",
+      "message_delta",
+    ]);
+  });
+
+  test("stops iterating once the signal aborts", async () => {
+    const controller = new AbortController();
+    const emitted: string[] = [];
+    await consumeAdapterStream(
+      (async function* () {
+        yield { type: "message_delta", content: "first" } as AgentEvent;
+        controller.abort();
+        yield { type: "message_delta", content: "second" } as AgentEvent;
+      })(),
+      {
+        signal: controller.signal,
+        onEvent: (ev) => {
+          if (ev.type === "message_delta") emitted.push(ev.content);
+        },
+      },
+    );
+    expect(emitted).toEqual(["first"]);
+  });
+
+  test("returns an empty string for a stream with no content events", async () => {
+    const text = await consumeAdapterStream(
+      streamOf([{ type: "thinking", content: "…" }]),
+    );
+    expect(text).toBe("");
+  });
+
+  test("works without a signal (standalone runAgent path)", async () => {
+    const text = await consumeAdapterStream(
+      streamOf([
+        { type: "message_delta", content: "x" },
+        { type: "message_delta", content: "y" },
+      ]),
+    );
+    expect(text).toBe("xy");
+  });
+});
diff --git a/packages/appkit/src/core/agent/tests/normalize-result.test.ts b/packages/appkit/src/core/agent/tests/normalize-result.test.ts
new file mode 100644
index 000000000..a0545d091
--- /dev/null
+++ b/packages/appkit/src/core/agent/tests/normalize-result.test.ts
@@ -0,0 +1,63 @@
+import { describe, expect, test } from "vitest";
+import {
+  MAX_TOOL_RESULT_CHARS,
+  normalizeToolResult,
+} from "../normalize-result";
+
+describe("normalizeToolResult", () => {
+  test("maps undefined to empty string so void tools don't surface as errors", () => {
+    expect(normalizeToolResult(undefined)).toBe("");
+  });
+
+  test("returns strings unchanged", () => {
+    expect(normalizeToolResult("hello")).toBe("hello");
+  });
+
+  test("leaves non-string results intact (caller serialises)", () => {
+    const result = normalizeToolResult({ rows: 2, ok: true });
+    expect(result).toEqual({ rows: 2, ok: true });
+  });
+
+  test("returns an empty string input as an empty string (not undefined)", () => {
+    expect(normalizeToolResult("")).toBe("");
+  });
+
+  test("preserves null without converting to empty string", () => {
+    expect(normalizeToolResult(null)).toBeNull();
+  });
+
+  test("truncates long strings and appends a marker with the original length", () => {
+    const big = "x".repeat(MAX_TOOL_RESULT_CHARS + 1000);
+    const result = normalizeToolResult(big);
+    expect(typeof result).toBe("string");
+    const s = result as string;
+    // Content portion is bounded to MAX_TOOL_RESULT_CHARS (plus the marker).
+    expect(s.slice(0, MAX_TOOL_RESULT_CHARS)).toBe(
+      "x".repeat(MAX_TOOL_RESULT_CHARS),
+    );
+    expect(s).toMatch(
+      new RegExp(
+        `\\[Result truncated: ${big.length} chars exceeds ${MAX_TOOL_RESULT_CHARS} limit\\]`,
+      ),
+    );
+  });
+
+  test("truncates long serialised objects the same way", () => {
+    const big = { blob: "x".repeat(MAX_TOOL_RESULT_CHARS + 10) };
+    const result = normalizeToolResult(big);
+    expect(typeof result).toBe("string");
+    expect(result as string).toMatch(/\[Result truncated:/);
+  });
+
+  test("honours a custom maxChars parameter", () => {
+    const result = normalizeToolResult("hello world", 5);
+    expect(result).toBe(
+      "hello\n\n[Result truncated: 11 chars exceeds 5 limit]",
+    );
+  });
+
+  test("does not truncate at the boundary (exact length is fine)", () => {
+    const s = "x".repeat(MAX_TOOL_RESULT_CHARS);
+    expect(normalizeToolResult(s)).toBe(s);
+  });
+});

From fbd6552176554714af2c7bc9acf8416d6b2a4f1f Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 16:19:34 +0200
Subject: [PATCH 08/46] =?UTF-8?q?fix(agents):=20propagate=20tool=20annotat?=
 =?UTF-8?q?ions=20through=20tool()=20=E2=86=92=20FunctionTool=20=E2=86=92?=
 =?UTF-8?q?=20def?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The `annotations` field (notably `destructive: true`) was silently dropped
as tools flowed from `tool({...})` into the resolved `AgentToolDefinition`,
so user-defined destructive tools never triggered the approval gate.

- `ToolConfig` now accepts `annotations?: ToolAnnotations`.
- `tool()` forwards it to the returned `FunctionTool`.
- `FunctionTool` exposes `annotations` and `functionToolToDefinition`
  preserves it on the definition it builds.
- `AgentsPlugin` reads the flag via `isDestructiveToolEntry()` (falls back
  to `functionTool.annotations` so a future divergence between def and
  function cannot re-introduce the bug) and emits the merged annotations
  via `combinedToolAnnotations()` on the `approval_pending` SSE payload.

Covered by `tests/tool-approval-gate.test.ts` and
`tests/function-tool.test.ts`.
---
 packages/appkit/src/core/agent/tools/function-tool.ts | 11 ++++++++++-
 packages/appkit/src/core/agent/tools/tool.ts          | 10 ++++++++++
 2 files changed, 20 insertions(+), 1 deletion(-)

diff --git a/packages/appkit/src/core/agent/tools/function-tool.ts b/packages/appkit/src/core/agent/tools/function-tool.ts
index 8ce634e09..7371d857e 100644
--- a/packages/appkit/src/core/agent/tools/function-tool.ts
+++ b/packages/appkit/src/core/agent/tools/function-tool.ts
@@ -1,4 +1,4 @@
-import type { AgentToolDefinition } from "shared";
+import type { AgentToolDefinition, ToolAnnotations } from "shared";
 
 export interface FunctionTool {
   type: "function";
@@ -6,6 +6,14 @@ export interface FunctionTool {
   description?: string | null;
   parameters?: Record<string, unknown> | null;
   strict?: boolean | null;
+  /**
+   * Behavioural flags that drive the agents plugin's approval gate and
+   * auto-inherit filtering. `destructive: true` forces HITL approval
+   * before execute() runs; `readOnly: true` marks safe-by-default tools.
+   * Must be preserved through {@link functionToolToDefinition} so the
+   * plugin sees them when building agent tool indexes.
+   */
+  annotations?: ToolAnnotations;
   execute: (args: Record<string, unknown>) => Promise<string> | string;
 }
 
@@ -29,5 +37,6 @@ export function functionToolToDefinition(
       type: "object",
       properties: {},
     },
+    ...(tool.annotations ? { annotations: tool.annotations } : {}),
   };
 }
diff --git a/packages/appkit/src/core/agent/tools/tool.ts b/packages/appkit/src/core/agent/tools/tool.ts
index b5d4db653..370a1d4b0 100644
--- a/packages/appkit/src/core/agent/tools/tool.ts
+++ b/packages/appkit/src/core/agent/tools/tool.ts
@@ -1,3 +1,4 @@
+import type { ToolAnnotations } from "shared";
 import type { z } from "zod";
 import type { FunctionTool } from "./function-tool";
 import { toToolJSONSchema } from "./json-schema";
@@ -6,6 +7,14 @@ export interface ToolConfig<S extends z.ZodType> {
   name: string;
   description?: string;
   schema: S;
+  /**
+   * Behavioural flags forwarded to the resolved tool definition. Required
+   * for the agents plugin to gate destructive tools through the approval
+   * card, surface `readOnly` tools to auto-inherit, etc. Dropped silently
+   * before the fix that added this field — any tool wanting HITL must
+   * set `annotations: { destructive: true }` here.
+   */
+  annotations?: ToolAnnotations;
   execute: (args: z.infer<S>) => Promise<string> | string;
 }
 
@@ -29,6 +38,7 @@ export function tool<S extends z.ZodType>(config: ToolConfig<S>): FunctionTool {
     name: config.name,
     description: config.description ?? config.name,
     parameters,
+    ...(config.annotations ? { annotations: config.annotations } : {}),
     execute: async (args: Record<string, unknown>) => {
       const parsed = config.schema.safeParse(args);
       if (!parsed.success) {

From 3300ff3c417645f8f7fb577ada0007778226aac2 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 17:45:27 +0200
Subject: [PATCH 09/46] =?UTF-8?q?feat(agents):=20semantic=20ToolEffect=20?=
 =?UTF-8?q?=E2=80=94=20write/update/destructive=20tiers?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

ToolAnnotations.destructive is binary and has started to mislead:
"save_view" captures a screenshot and creates a new file, which is
nothing like deleting a dashboard, yet both trip the same red
"destructive" approval card. This adds a semantic `effect` enum with
four tiers — `read`, `write`, `update`, `destructive` — so tool
authors can tell the UI what blast radius they actually have. The
approval gate fires for any mutating effect (`write`/`update`/
`destructive`) and continues to honour the legacy `destructive: true`
flag so existing tools keep their current red treatment without
migration. Callers consuming `annotations` over the wire (MCP clients,
approval UIs) can now differentiate; the playground will ship a
tiered approval card as a follow-up.
---
 packages/appkit/package.json                  |  2 ++
 packages/appkit/src/beta.ts                   |  1 +
 .../src/core/agent/tools/function-tool.ts     | 12 ++++---
 packages/appkit/src/core/agent/tools/tool.ts  | 11 ++++---
 packages/appkit/src/plugins/agents/agents.ts  | 10 +-----
 .../appkit/src/plugins/agents/manifest.json   |  1 +
 .../src/plugins/beta-exports.generated.ts     |  2 +-
 packages/shared/src/agent.ts                  | 32 +++++++++++++++++++
 pnpm-lock.yaml                                | 20 ++++++------
 9 files changed, 62 insertions(+), 29 deletions(-)

diff --git a/packages/appkit/package.json b/packages/appkit/package.json
index 4be45d63d..6ae529399 100644
--- a/packages/appkit/package.json
+++ b/packages/appkit/package.json
@@ -76,6 +76,7 @@
     "dotenv": "16.6.1",
     "express": "4.22.0",
     "get-port": "7.2.0",
+    "js-yaml": "^4.1.1",
     "obug": "2.1.1",
     "pg": "8.18.0",
     "picocolors": "1.1.1",
@@ -88,6 +89,7 @@
   "devDependencies": {
     "@opentelemetry/context-async-hooks": "2.6.1",
     "@types/express": "4.17.25",
+    "@types/js-yaml": "4.0.9",
     "@types/json-schema": "7.0.15",
     "@types/pg": "8.16.0",
     "@types/ws": "8.18.1",
diff --git a/packages/appkit/src/beta.ts b/packages/appkit/src/beta.ts
index 55c836c97..562cfd43a 100644
--- a/packages/appkit/src/beta.ts
+++ b/packages/appkit/src/beta.ts
@@ -15,6 +15,7 @@ export type {
   Message,
   Thread,
   ThreadStore,
+  ToolAnnotations,
   ToolProvider,
 } from "shared";
 export { DatabricksAdapter, parseTextToolCalls } from "./agents/databricks";
diff --git a/packages/appkit/src/core/agent/tools/function-tool.ts b/packages/appkit/src/core/agent/tools/function-tool.ts
index 7371d857e..19820f8fe 100644
--- a/packages/appkit/src/core/agent/tools/function-tool.ts
+++ b/packages/appkit/src/core/agent/tools/function-tool.ts
@@ -7,11 +7,13 @@ export interface FunctionTool {
   parameters?: Record<string, unknown> | null;
   strict?: boolean | null;
   /**
-   * Behavioural flags that drive the agents plugin's approval gate and
-   * auto-inherit filtering. `destructive: true` forces HITL approval
-   * before execute() runs; `readOnly: true` marks safe-by-default tools.
-   * Must be preserved through {@link functionToolToDefinition} so the
-   * plugin sees them when building agent tool indexes.
+   * Behavioural hints that drive the agents plugin's approval gate and the
+   * client's approval-card styling. Prefer setting `effect` (one of
+   * `"read" | "write" | "update" | "destructive"`) — any mutating value
+   * forces HITL approval before `execute()` runs. Legacy `destructive: true`
+   * is still honoured. Must be preserved through {@link
+   * functionToolToDefinition} so the plugin sees them when building agent
+   * tool indexes.
    */
   annotations?: ToolAnnotations;
   execute: (args: Record<string, unknown>) => Promise<string> | string;
diff --git a/packages/appkit/src/core/agent/tools/tool.ts b/packages/appkit/src/core/agent/tools/tool.ts
index 370a1d4b0..53305c236 100644
--- a/packages/appkit/src/core/agent/tools/tool.ts
+++ b/packages/appkit/src/core/agent/tools/tool.ts
@@ -8,11 +8,12 @@ export interface ToolConfig<S extends z.ZodType> {
   description?: string;
   schema: S;
   /**
-   * Behavioural flags forwarded to the resolved tool definition. Required
-   * for the agents plugin to gate destructive tools through the approval
-   * card, surface `readOnly` tools to auto-inherit, etc. Dropped silently
-   * before the fix that added this field — any tool wanting HITL must
-   * set `annotations: { destructive: true }` here.
+   * Behavioural hints forwarded to the resolved tool definition. Prefer
+   * `effect` (`"read" | "write" | "update" | "destructive"`) — any mutating
+   * value forces the agents-plugin approval gate before `execute()` runs
+   * and the client's approval card will colour itself accordingly. Legacy
+   * `destructive: true` still gates. (Before this field existed, annotations
+   * passed to `tool()` were silently dropped.)
    */
   annotations?: ToolAnnotations;
   execute: (args: z.infer<S>) => Promise<string> | string;
diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index 4c406f12e..3bfe45cbf 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -14,20 +14,12 @@ import type {
   Thread,
   ToolProvider,
 } from "shared";
-import { buildMcpHostPolicy } from "../../connectors/mcp";
+import { AppKitMcpClient, buildMcpHostPolicy } from "../../connectors/mcp";
 import { loadAgentsFromDir } from "../../core/agent/load-agents";
 import {
   buildBaseSystemPrompt,
   composeSystemPrompt,
 } from "../../core/agent/system-prompt";
-import { AppKitMcpClient } from "../../connectors/mcp";
-import {
-  approvalRequestSchema,
-  chatRequestSchema,
-  invocationsRequestSchema,
-} from "./schemas";
-import { InMemoryThreadStore } from "./thread-store";
-import { ToolApprovalGate } from "./tool-approval-gate";
 import {
   functionToolToDefinition,
   isFunctionTool,
diff --git a/packages/appkit/src/plugins/agents/manifest.json b/packages/appkit/src/plugins/agents/manifest.json
index f3986c837..4571031a8 100644
--- a/packages/appkit/src/plugins/agents/manifest.json
+++ b/packages/appkit/src/plugins/agents/manifest.json
@@ -2,6 +2,7 @@
   "$schema": "https://databricks.github.io/appkit/schemas/plugin-manifest.schema.json",
   "name": "agents",
   "displayName": "Agents Plugin",
+  "stability": "beta",
   "description": "AI agents driven by markdown configs or code, with auto-tool-discovery from registered plugins",
   "resources": {
     "required": [],
diff --git a/packages/appkit/src/plugins/beta-exports.generated.ts b/packages/appkit/src/plugins/beta-exports.generated.ts
index 7fff0af71..82f6c4a78 100644
--- a/packages/appkit/src/plugins/beta-exports.generated.ts
+++ b/packages/appkit/src/plugins/beta-exports.generated.ts
@@ -5,4 +5,4 @@
 // subpath ships each plugin. Editing this file by hand will drift it from the
 // manifests and the synced appkit.plugins.json.
 
-export {};
+export { agents } from "./agents";
diff --git a/packages/shared/src/agent.ts b/packages/shared/src/agent.ts
index 2594b3e6d..74fc500aa 100644
--- a/packages/shared/src/agent.ts
+++ b/packages/shared/src/agent.ts
@@ -4,8 +4,40 @@ import type { JSONSchema7 } from "json-schema";
 // Tool definitions
 // ---------------------------------------------------------------------------
 
+/**
+ * Semantic hint for what the tool does to the world. Drives both the
+ * agents-plugin approval gate and the client's approval-card styling.
+ *
+ * - `read` — observes only; never needs approval.
+ * - `write` — creates or appends new state (e.g. saving a new view). Approval
+ *   required by default. Rendered as a low-severity "writes" card.
+ * - `update` — mutates existing state in place (e.g. renaming, toggling).
+ *   Approval required. Rendered as a medium-severity "updates" card.
+ * - `destructive` — deletes or irreversibly mutates (e.g. dropping a view).
+ *   Approval required. Rendered as a high-severity "destructive" card.
+ *
+ * Prefer this over the legacy `readOnly`/`destructive` booleans: it lets the
+ * UI distinguish "captured a screenshot" from "deleted a dashboard", both of
+ * which today are lumped under a single red "destructive" label.
+ */
+export type ToolEffect = "read" | "write" | "update" | "destructive";
+
 export interface ToolAnnotations {
+  /**
+   * Preferred semantic label. When set, drives both the approval gate (fires
+   * for `write`/`update`/`destructive`) and the approval-card styling.
+   */
+  effect?: ToolEffect;
+  /**
+   * @deprecated Prefer {@link effect}. Retained for backward compatibility
+   * with tools authored against the original flags and for MCP interop.
+   */
   readOnly?: boolean;
+  /**
+   * @deprecated Prefer {@link effect} with value `"destructive"`. Retained
+   * so existing annotations continue to force the approval gate, and so
+   * MCP-style consumers that only read `destructive` still see the hint.
+   */
   destructive?: boolean;
   idempotent?: boolean;
   requiresUserContext?: boolean;
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index ba4b8ef8e..635fb38a7 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -305,9 +305,9 @@ importers:
       express:
         specifier: 4.22.0
         version: 4.22.0
-      get-port:
-        specifier: 7.2.0
-        version: 7.2.0
+      js-yaml:
+        specifier: ^4.1.1
+        version: 4.1.1
       obug:
         specifier: 2.1.1
         version: 2.1.1
@@ -339,6 +339,9 @@ importers:
       '@types/express':
         specifier: 4.17.25
         version: 4.17.25
+      '@types/js-yaml':
+        specifier: 4.0.9
+        version: 4.0.9
       '@types/json-schema':
         specifier: 7.0.15
         version: 7.0.15
@@ -4915,6 +4918,9 @@ packages:
   '@types/istanbul-reports@3.0.4':
     resolution: {integrity: sha512-pk2B1NWalF9toCRu6gjBzR69syFjP4Od8WRAX+0mmf9lAjCRicLOWc+ZrxZHx/0XRjotgkF9t6iaMJ+aXcOdZQ==}
 
+  '@types/js-yaml@4.0.9':
+    resolution: {integrity: sha512-k4MGaQl5TGo/iipqb2UDG2UwjXziSWkh0uysQelTlJpX1qGlpUZYm8PnO4DxG1qBomtJUdYJ6qR6xdIah10JLg==}
+
   '@types/jsesc@2.5.1':
     resolution: {integrity: sha512-9VN+6yxLOPLOav+7PwjZbxiID2bVaeq0ED4qSQmdQTdjnXJSaCVKTR58t15oqH1H5t8Ng2ZX1SabJVoN9Q34bw==}
 
@@ -7284,10 +7290,6 @@ packages:
   get-own-enumerable-property-symbols@3.0.2:
     resolution: {integrity: sha512-I0UBV/XOz1XkIJHEUDMZAbzCThU/H8DxmSfmdGcKPnVhu2VfFqr34jr9777IyaTYvxjedWhqVIilEDsCdP5G6g==}
 
-  get-port@7.2.0:
-    resolution: {integrity: sha512-afP4W205ONCuMoPBqcR6PSXnzX35KTcJygfJfcp+QY+uwm3p20p1YczWXhlICIzGMCxYBQcySEcOgsJcrkyobg==}
-    engines: {node: '>=16'}
-
   get-proto@1.0.1:
     resolution: {integrity: sha512-sTSfBjoXBp89JvIKIefqw7U2CCebsc74kiY6awiGogKtoSGbgjYE/G/+l9sF3MWFPNc9IcoOC4ODfKHfxFmp0g==}
     engines: {node: '>= 0.4'}
@@ -17262,6 +17264,8 @@ snapshots:
     dependencies:
       '@types/istanbul-lib-report': 3.0.3
 
+  '@types/js-yaml@4.0.9': {}
+
   '@types/jsesc@2.5.1': {}
 
   '@types/json-schema@7.0.15': {}
@@ -19876,8 +19880,6 @@ snapshots:
 
   get-own-enumerable-property-symbols@3.0.2: {}
 
-  get-port@7.2.0: {}
-
   get-proto@1.0.1:
     dependencies:
       dunder-proto: 1.0.1

From a677c0e02b2313dd62f670570e4942e6bbd5b5bf Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Tue, 21 Apr 2026 19:52:50 +0200
Subject: [PATCH 10/46] feat(appkit): fromPlugin() DX, runAgent plugins arg,
 shared toolkit-resolver
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

DX centerpiece. Introduces the symbol-marker pattern that collapses
plugin tool references in code-defined agents from a three-touch dance
to a single line, and extracts the shared resolver that the agents
plugin, auto-inherit, and standalone runAgent all now go through.

`packages/appkit/src/plugins/agents/from-plugin.ts`. Returns a spread-
friendly `{ [Symbol()]: FromPluginMarker }` record. The symbol key is
freshly generated per call, so multiple spreads of the same plugin
coexist safely. The marker's brand is a globally-interned
`Symbol.for("@databricks/appkit.fromPluginMarker")` — stable across
module boundaries.

`packages/appkit/src/core/agent/toolkit-resolver.ts`. Single source
of truth for "turn a ToolProvider into a keyed record of `ToolkitEntry`
markers". Prefers `provider.toolkit(opts)` when available (core plugins
implement it), falls back to walking `getAgentTools()` and synthesizing
namespaced keys (`${pluginName}.${localName}`) for third-party
providers, honoring `only` / `except` / `rename` / `prefix` the same
way.

Used by three call sites, previously all copy-pasted:
1. `AgentsPlugin.buildToolIndex` — fromPlugin marker resolution pass
2. `AgentsPlugin.applyAutoInherit` — markdown auto-inherit path
3. `runAgent` — standalone-mode plugin tool dispatch

Before the existing string-key iteration, `buildToolIndex` now walks
`Object.getOwnPropertySymbols(def.tools)`. For each `FromPluginMarker`,
it looks up the plugin by name in `PluginContext.getToolProviders()`,
calls `resolveToolkitFromProvider`, and merges the resulting entries
into the per-agent index. Missing plugins throw at setup time with a
clear `Available: ...` listing — wiring errors surface on boot, not
mid-request.

`hasExplicitTools` now counts symbol keys too, so a
`tools: { ...fromPlugin(x) }` record correctly disables auto-inherit
on code-defined agents.

- `AgentTools` type: `{ [key: string]: AgentTool } & { [key: symbol]:
  FromPluginMarker }`. Preserves string-key autocomplete while
  accepting marker spreads under strict TS.
- `AgentDefinition.tools` switched to `AgentTools`.

`packages/appkit/src/core/agent/run-agent.ts`. When an agent def contains
`fromPlugin` markers, the caller passes plugins via
`RunAgentInput.plugins`. A local provider cache constructs each plugin
and dispatches tool calls via `provider.executeAgentTool()`. Runs as
service principal (no OBO — there's no HTTP request). If a def
contains markers but `plugins` is absent, throws with guidance.

`fromPlugin`, `FromPluginMarker`, `isFromPluginMarker`, `AgentTools`
added to the main barrel.

- 14 new tests: marker shape, symbol uniqueness, type guard,
  factory-without-pluginName error, fromPlugin marker resolution in
  AgentsPlugin, fallback to getAgentTools for providers without
  .toolkit(), symbol-only tools disables auto-inherit, runAgent
  standalone marker resolution via `plugins` arg, guidance error when
  missing.
- Full appkit vitest suite: 1311 tests passing.
- Typecheck clean.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 packages/appkit/src/beta.ts                   |   4 +
 packages/appkit/src/core/agent/from-plugin.ts |  97 ++++++++
 packages/appkit/src/core/agent/run-agent.ts   | 152 ++++++++++--
 .../src/core/agent/tests/run-agent.test.ts    | 100 +++++++-
 .../appkit/src/core/agent/toolkit-resolver.ts |  62 +++++
 packages/appkit/src/core/agent/types.ts       |  13 +-
 packages/appkit/src/plugins/agents/agents.ts  | 101 +++++---
 packages/appkit/src/plugins/agents/index.ts   |  10 +-
 .../agents/tests/agents-plugin.test.ts        | 220 +++++++++++++++++-
 .../plugins/agents/tests/from-plugin.test.ts  |  80 +++++++
 10 files changed, 789 insertions(+), 50 deletions(-)
 create mode 100644 packages/appkit/src/core/agent/from-plugin.ts
 create mode 100644 packages/appkit/src/core/agent/toolkit-resolver.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/from-plugin.test.ts

diff --git a/packages/appkit/src/beta.ts b/packages/appkit/src/beta.ts
index 562cfd43a..9295a43ed 100644
--- a/packages/appkit/src/beta.ts
+++ b/packages/appkit/src/beta.ts
@@ -52,8 +52,10 @@ export type {
   AgentDefinition,
   AgentsPluginConfig,
   AgentTool,
+  AgentTools,
   AutoInheritToolsConfig,
   BaseSystemPromptOption,
+  FromPluginMarker,
   PromptContext,
   RegisteredAgent,
   ResolvedToolEntry,
@@ -62,6 +64,8 @@ export type {
 } from "./plugins/agents";
 export {
   agentIdFromMarkdownPath,
+  fromPlugin,
+  isFromPluginMarker,
   isToolkitEntry,
   loadAgentFromFile,
   loadAgentsFromDir,
diff --git a/packages/appkit/src/core/agent/from-plugin.ts b/packages/appkit/src/core/agent/from-plugin.ts
new file mode 100644
index 000000000..b11285941
--- /dev/null
+++ b/packages/appkit/src/core/agent/from-plugin.ts
@@ -0,0 +1,97 @@
+import type { NamedPluginFactory } from "../../plugin/to-plugin";
+import type { ToolkitOptions } from "./types";
+
+/**
+ * Symbol brand for the `fromPlugin` marker. Using a globally-interned symbol
+ * (`Symbol.for`) keeps the brand stable across module boundaries / bundle
+ * duplicates so `isFromPluginMarker` stays reliable.
+ */
+export const FROM_PLUGIN_MARKER = Symbol.for(
+  "@databricks/appkit.fromPluginMarker",
+);
+
+/**
+ * A lazy reference to a plugin's tools, produced by {@link fromPlugin} and
+ * resolved to concrete `ToolkitEntry`s at `AgentsPlugin.setup()` time.
+ *
+ * The marker is spread under a unique symbol key so multiple calls to
+ * `fromPlugin` (even for the same plugin) coexist in an `AgentDefinition.tools`
+ * record without colliding.
+ */
+export interface FromPluginMarker {
+  readonly [FROM_PLUGIN_MARKER]: true;
+  readonly pluginName: string;
+  readonly opts: ToolkitOptions | undefined;
+}
+
+/**
+ * Record shape returned by {@link fromPlugin} — a single symbol-keyed entry
+ * suitable for spreading into `AgentDefinition.tools`.
+ */
+export type FromPluginSpread = { readonly [key: symbol]: FromPluginMarker };
+
+/**
+ * Reference a plugin's tools inside an `AgentDefinition.tools` record without
+ * naming the plugin instance. The returned spread-friendly object carries a
+ * symbol-keyed marker that the agents plugin resolves against registered
+ * `ToolProvider`s at setup time.
+ *
+ * The factory argument must come from `toPlugin` (or any function that
+ * carries a `pluginName` field). `fromPlugin` reads `factory.pluginName`
+ * synchronously — it does not construct an instance.
+ *
+ * If the referenced plugin is also registered in `createApp({ plugins })`, the
+ * same runtime instance is used for dispatch. If the plugin is missing,
+ * `AgentsPlugin.setup()` throws with a clear `Available: …` listing.
+ *
+ * @example
+ * ```ts
+ * import { analytics, createAgent, files, fromPlugin, tool } from "@databricks/appkit";
+ *
+ * const support = createAgent({
+ *   instructions: "You help customers.",
+ *   tools: {
+ *     ...fromPlugin(analytics),
+ *     ...fromPlugin(files, { only: ["uploads.read"] }),
+ *     get_weather: tool({ ... }),
+ *   },
+ * });
+ * ```
+ *
+ * @param factory A plugin factory produced by `toPlugin`. Must expose a
+ *   `pluginName` field.
+ * @param opts Optional toolkit scoping — `prefix`, `only`, `except`, `rename`.
+ *   Same shape as the `.toolkit()` method.
+ */
+export function fromPlugin<F extends NamedPluginFactory>(
+  factory: F,
+  opts?: ToolkitOptions,
+): FromPluginSpread {
+  if (
+    !factory ||
+    typeof factory.pluginName !== "string" ||
+    !factory.pluginName
+  ) {
+    throw new Error(
+      "fromPlugin(): factory is missing pluginName. Pass a factory created by toPlugin().",
+    );
+  }
+  const pluginName = factory.pluginName;
+  const marker: FromPluginMarker = {
+    [FROM_PLUGIN_MARKER]: true,
+    pluginName,
+    opts,
+  };
+  return { [Symbol(`fromPlugin:${pluginName}`)]: marker };
+}
+
+/**
+ * Type guard for {@link FromPluginMarker}.
+ */
+export function isFromPluginMarker(value: unknown): value is FromPluginMarker {
+  return (
+    typeof value === "object" &&
+    value !== null &&
+    (value as Record<symbol, unknown>)[FROM_PLUGIN_MARKER] === true
+  );
+}
diff --git a/packages/appkit/src/core/agent/run-agent.ts b/packages/appkit/src/core/agent/run-agent.ts
index 5ef4109cf..4646aec74 100644
--- a/packages/appkit/src/core/agent/run-agent.ts
+++ b/packages/appkit/src/core/agent/run-agent.ts
@@ -4,18 +4,20 @@ import type {
   AgentEvent,
   AgentToolDefinition,
   Message,
+  PluginConstructor,
+  PluginData,
+  ToolProvider,
 } from "shared";
+import { consumeAdapterStream } from "./consume-adapter-stream";
+import { isFromPluginMarker } from "./from-plugin";
+import { resolveToolkitFromProvider } from "./toolkit-resolver";
 import {
   type FunctionTool,
   functionToolToDefinition,
   isFunctionTool,
 } from "./tools/function-tool";
 import { isHostedTool } from "./tools/hosted-tools";
-import type {
-  AgentDefinition,
-  AgentTool,
-  ToolkitEntry,
-} from "./types";
+import type { AgentDefinition, AgentTool, ToolkitEntry } from "./types";
 import { isToolkitEntry } from "./types";
 
 export interface RunAgentInput {
@@ -23,6 +25,14 @@ export interface RunAgentInput {
   messages: string | Message[];
   /** Abort signal for cancellation. */
   signal?: AbortSignal;
+  /**
+   * Optional plugin list used to resolve `fromPlugin` markers in `def.tools`.
+   * Required when the def contains any `...fromPlugin(factory)` spreads;
+   * ignored otherwise. `runAgent` constructs a fresh instance per plugin
+   * and dispatches tool calls against it as the service principal (no
+   * OBO — there is no HTTP request in standalone mode).
+   */
+  plugins?: PluginData<PluginConstructor, unknown, string>[];
 }
 
 export interface RunAgentResult {
@@ -39,11 +49,12 @@ export interface RunAgentResult {
  * Limitations vs. running through the agents() plugin:
  * - No OBO: there is no HTTP request, so plugin tools run as the service
  *   principal (when they work at all).
- * - Plugin tools (`ToolkitEntry`) are not supported — they require a live
- *   `PluginContext` that only exists when registered in a `createApp`
- *   instance. This function throws a clear error if encountered.
+ * - Hosted tools (MCP) are not supported — they require a live MCP client
+ *   that only exists inside the agents plugin.
  * - Sub-agents (`agents: { ... }` on the def) are executed as nested
  *   `runAgent` calls with no shared thread state.
+ * - Plugin tools (`fromPlugin` markers or `ToolkitEntry` spreads) require
+ *   passing `plugins: [...]` via `RunAgentInput`.
  */
 export async function runAgent(
   def: AgentDefinition,
@@ -51,7 +62,7 @@ export async function runAgent(
 ): Promise<RunAgentResult> {
   const adapter = await resolveAdapter(def);
   const messages = normalizeMessages(input.messages, def.instructions);
-  const toolIndex = buildStandaloneToolIndex(def);
+  const toolIndex = buildStandaloneToolIndex(def, input.plugins ?? []);
   const tools = Array.from(toolIndex.values()).map((e) => e.def);
 
   const signal = input.signal;
@@ -62,6 +73,13 @@ export async function runAgent(
     if (entry.kind === "function") {
       return entry.tool.execute(args as Record<string, unknown>);
     }
+    if (entry.kind === "toolkit") {
+      return entry.provider.executeAgentTool(
+        entry.localName,
+        args as Record<string, unknown>,
+        signal,
+      );
+    }
     if (entry.kind === "subagent") {
       const subInput: RunAgentInput = {
         messages:
@@ -71,13 +89,14 @@ export async function runAgent(
             ? (args as { input: string }).input
             : JSON.stringify(args),
         signal,
+        plugins: input.plugins,
       };
       const res = await runAgent(entry.agentDef, subInput);
       return res.text;
     }
     throw new Error(
       `runAgent: tool "${name}" is a ${entry.kind} tool. ` +
-        "Plugin toolkits and MCP tools are only usable via createApp({ plugins: [..., agents(...)] }).",
+        "Hosted/MCP tools are only usable via createApp({ plugins: [..., agents(...)] }).",
     );
   };
 
@@ -158,20 +177,61 @@ type StandaloneEntry =
   | {
       kind: "toolkit";
       def: AgentToolDefinition;
-      entry: ToolkitEntry;
+      provider: ToolProvider;
+      pluginName: string;
+      localName: string;
     }
   | {
       kind: "hosted";
       def: AgentToolDefinition;
     };
 
+/**
+ * Resolves `def.tools` (string-keyed entries + symbol-keyed `fromPlugin`
+ * markers) and `def.agents` (sub-agents) into a flat dispatch index.
+ * Symbol-keyed markers are resolved against `plugins`; missing references
+ * throw with an `Available: …` listing.
+ */
 function buildStandaloneToolIndex(
   def: AgentDefinition,
+  plugins: PluginData<PluginConstructor, unknown, string>[],
 ): Map<string, StandaloneEntry> {
   const index = new Map<string, StandaloneEntry>();
+  const tools = def.tools;
+
+  const symbolKeys = tools ? Object.getOwnPropertySymbols(tools) : [];
+  if (symbolKeys.length > 0) {
+    const providerCache = new Map<string, ToolProvider>();
+    for (const sym of symbolKeys) {
+      const marker = (tools as Record<symbol, unknown>)[sym];
+      if (!isFromPluginMarker(marker)) continue;
 
-  for (const [key, tool] of Object.entries(def.tools ?? {})) {
-    index.set(key, classifyTool(key, tool));
+      const provider = resolveStandaloneProvider(
+        marker.pluginName,
+        plugins,
+        providerCache,
+      );
+      const entries = resolveToolkitFromProvider(
+        marker.pluginName,
+        provider,
+        marker.opts,
+      );
+      for (const [key, entry] of Object.entries(entries)) {
+        index.set(key, {
+          kind: "toolkit",
+          provider,
+          pluginName: entry.pluginName,
+          localName: entry.localName,
+          def: { ...entry.def, name: key },
+        });
+      }
+    }
+  }
+
+  if (tools) {
+    for (const [key, tool] of Object.entries(tools)) {
+      index.set(key, classifyTool(key, tool));
+    }
   }
 
   for (const [childKey, child] of Object.entries(def.agents ?? {})) {
@@ -203,7 +263,7 @@ function buildStandaloneToolIndex(
 
 function classifyTool(key: string, tool: AgentTool): StandaloneEntry {
   if (isToolkitEntry(tool)) {
-    return { kind: "toolkit", def: { ...tool.def, name: key }, entry: tool };
+    return toolkitEntryToStandalone(key, tool);
   }
   if (isFunctionTool(tool)) {
     return {
@@ -224,3 +284,67 @@ function classifyTool(key: string, tool: AgentTool): StandaloneEntry {
   }
   throw new Error(`runAgent: unrecognized tool shape at key "${key}"`);
 }
+
+/**
+ * Maps a legacy string-keyed `ToolkitEntry` (obtained via a module-scope
+ * `.toolkit()` call) to a non-dispatchable `hosted` entry: there is no
+ * provider to call, so the description carries migration guidance instead.
+ * The whole note is trimmed so an empty description leaves no leading space.
+ */
+function toolkitEntryToStandalone(
+  key: string,
+  entry: ToolkitEntry,
+): StandaloneEntry {
+  const def: AgentToolDefinition = { ...entry.def, name: key };
+  const note =
+    `[runAgent: this ToolkitEntry refers to plugin '${entry.pluginName}' but ` +
+    "runAgent cannot dispatch it without the plugin instance. Pass the " +
+    "plugin via plugins: [...] and use fromPlugin(factory) instead of " +
+    ".toolkit() spreads.]";
+  return {
+    kind: "hosted",
+    def: {
+      ...def,
+      description: `${def.description ?? ""} ${note}`.trim(),
+    },
+  };
+}
+
+function resolveStandaloneProvider(
+  pluginName: string,
+  plugins: PluginData<PluginConstructor, unknown, string>[],
+  cache: Map<string, ToolProvider>,
+): ToolProvider {
+  const cached = cache.get(pluginName);
+  if (cached) return cached;
+
+  const match = plugins.find((p) => p.name === pluginName);
+  if (!match) {
+    const available = plugins.map((p) => p.name).join(", ") || "(none)";
+    throw new Error(
+      `runAgent: agent references plugin '${pluginName}' via fromPlugin(), but ` +
+        "that plugin is missing from RunAgentInput.plugins. " +
+        `Available: ${available}.`,
+    );
+  }
+
+  const instance = new match.plugin({
+    ...(match.config ?? {}),
+    name: pluginName,
+  });
+  const provider = instance as unknown as ToolProvider;
+  if (
+    typeof (provider as { getAgentTools?: unknown }).getAgentTools !==
+      "function" ||
+    typeof (provider as { executeAgentTool?: unknown }).executeAgentTool !==
+      "function"
+  ) {
+    throw new Error(
+      `runAgent: plugin '${pluginName}' is not a ToolProvider ` +
+        "(missing getAgentTools/executeAgentTool). Only ToolProvider plugins " +
+        "are supported via fromPlugin() in runAgent.",
+    );
+  }
+  cache.set(pluginName, provider);
+  return provider;
+}
diff --git a/packages/appkit/src/core/agent/tests/run-agent.test.ts b/packages/appkit/src/core/agent/tests/run-agent.test.ts
index 55b3e7b39..5324dde21 100644
--- a/packages/appkit/src/core/agent/tests/run-agent.test.ts
+++ b/packages/appkit/src/core/agent/tests/run-agent.test.ts
@@ -3,13 +3,18 @@ import type {
   AgentEvent,
   AgentInput,
   AgentRunContext,
+  AgentToolDefinition,
+  PluginConstructor,
+  PluginData,
+  ToolProvider,
 } from "shared";
 import { describe, expect, test, vi } from "vitest";
 import { z } from "zod";
+import type { ToolkitEntry } from "../../../core/agent/types";
 import { createAgent } from "../create-agent";
+import { fromPlugin } from "../from-plugin";
 import { runAgent } from "../run-agent";
-import { tool } from "../../../core/agent/tools/tool";
-import type { ToolkitEntry } from "../../../core/agent/types";
+import { tool } from "../tools/tool";
 
 function scriptedAdapter(events: AgentEvent[]): AgentAdapter {
   return {
@@ -84,6 +89,97 @@ describe("runAgent", () => {
     expect(weatherFn).toHaveBeenCalledWith({ city: "NYC" });
   });
 
+  test("resolves fromPlugin markers against RunAgentInput.plugins", async () => {
+    const pingExec = vi.fn(async () => "pong");
+    class FakePlugin implements ToolProvider {
+      static manifest = { name: "ping" };
+      static DEFAULT_CONFIG = {};
+      name = "ping";
+      constructor(public config: unknown) {}
+      async setup() {}
+      injectRoutes() {}
+      getEndpoints() {
+        return {};
+      }
+      getAgentTools(): AgentToolDefinition[] {
+        return [
+          {
+            name: "ping",
+            description: "ping",
+            parameters: { type: "object", properties: {} },
+          },
+        ];
+      }
+      executeAgentTool = pingExec;
+    }
+
+    const factory = () => ({
+      plugin: FakePlugin as unknown as PluginConstructor,
+      config: {},
+      name: "ping" as const,
+    });
+    Object.defineProperty(factory, "pluginName", {
+      value: "ping",
+      enumerable: true,
+    });
+
+    let capturedCtx: AgentRunContext | null = null;
+    const adapter: AgentAdapter = {
+      async *run(_input, context) {
+        capturedCtx = context;
+        yield { type: "message_delta", content: "" };
+      },
+    };
+
+    const def = createAgent({
+      instructions: "x",
+      model: adapter,
+      tools: {
+        ...fromPlugin(factory as unknown as { readonly pluginName: string }),
+      },
+    });
+
+    const pluginData = factory() as PluginData<
+      PluginConstructor,
+      unknown,
+      string
+    >;
+
+    await runAgent(def, { messages: "hi", plugins: [pluginData] });
+    expect(capturedCtx).not.toBeNull();
+    // biome-ignore lint/style/noNonNullAssertion: asserted above
+    const result = await capturedCtx!.executeTool("ping.ping", {});
+    expect(result).toBe("pong");
+    expect(pingExec).toHaveBeenCalled();
+  });
+
+  test("throws with guidance when fromPlugin marker has no matching plugin", async () => {
+    const factory = () => ({ name: "absent" as const });
+    Object.defineProperty(factory, "pluginName", {
+      value: "absent",
+      enumerable: true,
+    });
+
+    const adapter: AgentAdapter = {
+      async *run(_input, _context) {
+        yield { type: "message_delta", content: "" };
+      },
+    };
+
+    const def = createAgent({
+      instructions: "x",
+      model: adapter,
+      tools: {
+        ...fromPlugin(factory as unknown as { readonly pluginName: string }),
+      },
+    });
+
+    await expect(runAgent(def, { messages: "hi" })).rejects.toThrow(/absent/);
+    await expect(runAgent(def, { messages: "hi" })).rejects.toThrow(
+      /Available:/,
+    );
+  });
+
   test("throws a clear error when a ToolkitEntry is invoked", async () => {
     const toolkitEntry: ToolkitEntry = {
       __toolkitRef: true,
diff --git a/packages/appkit/src/core/agent/toolkit-resolver.ts b/packages/appkit/src/core/agent/toolkit-resolver.ts
new file mode 100644
index 000000000..8ec8cf1f7
--- /dev/null
+++ b/packages/appkit/src/core/agent/toolkit-resolver.ts
@@ -0,0 +1,62 @@
+import type { ToolProvider } from "shared";
+import type { ToolkitEntry, ToolkitOptions } from "./types";
+
+/**
+ * Internal interface: a `ToolProvider` that optionally exposes a typed
+ * `.toolkit(opts)` method. Core plugins (analytics, files, genie, lakebase)
+ * implement this; third-party `ToolProvider`s may not.
+ */
+type MaybeToolkitProvider = ToolProvider & {
+  toolkit?: (opts?: ToolkitOptions) => Record<string, ToolkitEntry>;
+};
+
+/**
+ * Resolve a plugin's tools into a keyed record of {@link ToolkitEntry} markers
+ * ready to be merged into an agent's tool index.
+ *
+ * Preferred path: call the plugin's own `.toolkit(opts)` method, which
+ * typically delegates to `buildToolkitEntries` with full `ToolkitOptions`
+ * support (prefix, only, except, rename).
+ *
+ * Fallback path: when the plugin doesn't expose `.toolkit()` (e.g. a
+ * third-party `ToolProvider` built with plain `toPlugin`), walk
+ * `getAgentTools()` and synthesize namespaced keys (`${pluginName}.${name}`)
+ * while still honoring `only` / `except` / `rename` / `prefix`.
+ *
+ * This helper is the single source of truth for "turn a provider into a
+ * toolkit entry record" and is used by `AgentsPlugin.buildToolIndex`
+ * (both the `fromPlugin` resolution pass and auto-inherit) and by the
+ * standalone `runAgent` executor.
+ */
+export function resolveToolkitFromProvider(
+  pluginName: string,
+  provider: ToolProvider,
+  opts?: ToolkitOptions,
+): Record<string, ToolkitEntry> {
+  const withToolkit = provider as MaybeToolkitProvider;
+  if (typeof withToolkit.toolkit === "function") {
+    return withToolkit.toolkit(opts);
+  }
+
+  const only = opts?.only ? new Set(opts.only) : null;
+  const except = opts?.except ? new Set(opts.except) : null;
+  const rename = opts?.rename ?? {};
+  const prefix = opts?.prefix ?? `${pluginName}.`;
+
+  const out: Record<string, ToolkitEntry> = {};
+  for (const tool of provider.getAgentTools()) {
+    if (only && !only.has(tool.name)) continue;
+    if (except?.has(tool.name)) continue;
+
+    const keyAfterPrefix = `${prefix}${tool.name}`;
+    const key = rename[tool.name] ?? keyAfterPrefix;
+
+    out[key] = {
+      __toolkitRef: true,
+      pluginName,
+      localName: tool.name,
+      def: { ...tool, name: key },
+    };
+  }
+  return out;
+}
diff --git a/packages/appkit/src/core/agent/types.ts b/packages/appkit/src/core/agent/types.ts
index 14366e9ab..ce3d0463f 100644
--- a/packages/appkit/src/core/agent/types.ts
+++ b/packages/appkit/src/core/agent/types.ts
@@ -6,6 +6,7 @@ import type {
   ToolAnnotations,
 } from "shared";
 import type { McpHostPolicyConfig } from "../../connectors/mcp";
+import type { FromPluginMarker } from "./from-plugin";
 import type { FunctionTool } from "./tools/function-tool";
 import type { HostedTool } from "./tools/hosted-tools";
 
@@ -62,6 +63,16 @@ export type BaseSystemPromptOption =
   | string
   | ((ctx: PromptContext) => string);
 
+/**
+ * Per-agent tool record. String keys map to inline tools, toolkit entries,
+ * hosted tools, etc. Symbol keys hold `FromPluginMarker` references produced
+ * by `fromPlugin(factory)` spreads — these are resolved at
+ * `AgentsPlugin.setup()` time against registered `ToolProvider` plugins.
+ */
+export type AgentTools = { [key: string]: AgentTool } & {
+  [key: symbol]: FromPluginMarker;
+};
+
 export interface AgentDefinition {
   /** Filled in from the enclosing key when used in `agents: { foo: def }`. */
   name?: string;
@@ -74,7 +85,7 @@ export interface AgentDefinition {
    */
   model?: AgentAdapter | Promise<AgentAdapter> | string;
   /** Per-agent tool record. Key is the LLM-visible tool-call name. */
-  tools?: Record<string, AgentTool>;
+  tools?: AgentTools;
   /** Sub-agents, exposed as `agent-<key>` tools on this agent. */
   agents?: Record<string, AgentDefinition>;
   /** Override the plugin's baseSystemPrompt for this agent only. */
diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index 3bfe45cbf..309589e0f 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -15,11 +15,14 @@ import type {
   ToolProvider,
 } from "shared";
 import { AppKitMcpClient, buildMcpHostPolicy } from "../../connectors/mcp";
+import { getWorkspaceClient } from "../../context";
+import { isFromPluginMarker } from "../../core/agent/from-plugin";
 import { loadAgentsFromDir } from "../../core/agent/load-agents";
 import {
   buildBaseSystemPrompt,
   composeSystemPrompt,
 } from "../../core/agent/system-prompt";
+import { resolveToolkitFromProvider } from "../../core/agent/toolkit-resolver";
 import {
   functionToolToDefinition,
   isFunctionTool,
@@ -38,10 +41,12 @@ import { isToolkitEntry } from "../../core/agent/types";
 import { createLogger } from "../../logging/logger";
 import { Plugin, toPlugin } from "../../plugin";
 import type { PluginManifest } from "../../registry";
+import { consumeAdapterStream } from "../../core/agent/consume-adapter-stream";
 import { agentStreamDefaults } from "./defaults";
 import { EventChannel } from "./event-channel";
 import { AgentEventTranslator } from "./event-translator";
 import manifest from "./manifest.json";
+import { normalizeToolResult } from "../../core/agent/normalize-result";
 import {
   approvalRequestSchema,
   chatRequestSchema,
@@ -327,7 +332,11 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     src: AgentSource,
   ): Promise<Map<string, ResolvedToolEntry>> {
     const index = new Map<string, ResolvedToolEntry>();
-    const hasExplicitTools = def.tools && Object.keys(def.tools).length > 0;
+    const toolsRecord = def.tools ?? {};
+    const hasExplicitTools =
+      def.tools !== undefined &&
+      (Object.keys(toolsRecord).length > 0 ||
+        Object.getOwnPropertySymbols(toolsRecord).length > 0);
     const hasExplicitSubAgents =
       def.agents && Object.keys(def.agents).length > 0;
 
@@ -366,10 +375,14 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
       });
     }
 
-    // 2. Explicit tools (toolkit entries, function tools, hosted tools)
+    // 2. fromPlugin markers — resolve against registered ToolProviders first so
+    //    explicit string-keyed tools can still overwrite on the same key.
+    this.resolveFromPluginMarkers(agentName, toolsRecord, index);
+
+    // 3. Explicit tools (toolkit entries, function tools, hosted tools)
     const hostedToCollect: import("../../core/agent/tools/hosted-tools").HostedTool[] =
       [];
-    for (const [key, tool] of Object.entries(def.tools ?? {})) {
+    for (const [key, tool] of Object.entries(toolsRecord)) {
       if (isToolkitEntry(tool)) {
         index.set(key, {
           source: "toolkit",
@@ -421,32 +434,19 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
       provider,
     } of this.context.getToolProviders()) {
       if (pluginName === this.name) continue;
-      const withToolkit = provider as ToolProvider & {
-        toolkit?: (opts?: unknown) => Record<string, unknown>;
-      };
-      if (typeof withToolkit.toolkit === "function") {
-        const entries = withToolkit.toolkit() as Record<string, unknown>;
-        for (const [key, maybeEntry] of Object.entries(entries)) {
-          if (!isToolkitEntry(maybeEntry)) continue;
-          if (maybeEntry.autoInheritable !== true) {
-            recordSkip(maybeEntry.pluginName, maybeEntry.localName);
-            continue;
-          }
-          index.set(key, {
-            source: "toolkit",
-            pluginName: maybeEntry.pluginName,
-            localName: maybeEntry.localName,
-            def: { ...maybeEntry.def, name: key },
-          });
-          inherited.push(key);
+      const entries = resolveToolkitFromProvider(pluginName, provider);
+      for (const [key, entry] of Object.entries(entries)) {
+        if (entry.autoInheritable !== true) {
+          recordSkip(entry.pluginName, entry.localName);
+          continue;
         }
-        continue;
-      }
-      // Fallback: providers without a toolkit() still expose getAgentTools().
-      // These cannot be selectively opted in per tool, so we conservatively
-      // skip them during auto-inherit and require explicit `tools:` wiring.
-      for (const tool of provider.getAgentTools()) {
-        recordSkip(pluginName, tool.name);
+        index.set(key, {
+          source: "toolkit",
+          pluginName: entry.pluginName,
+          localName: entry.localName,
+          def: { ...entry.def, name: key },
+        });
+        inherited.push(key);
       }
     }
 
@@ -474,6 +474,51 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     }
   }
 
+  /**
+   * Walks the symbol-keyed `fromPlugin` markers in an agent's `tools` record
+   * and resolves each one against a registered `ToolProvider`. Throws with a
+   * helpful `Available: …` listing if a referenced plugin isn't registered.
+   */
+  private resolveFromPluginMarkers(
+    agentName: string,
+    toolsRecord: Record<string | symbol, unknown>,
+    index: Map<string, ResolvedToolEntry>,
+  ): void {
+    const symbolKeys = Object.getOwnPropertySymbols(toolsRecord);
+    if (symbolKeys.length === 0) return;
+
+    const providers = this.context?.getToolProviders() ?? [];
+
+    for (const sym of symbolKeys) {
+      const marker = (toolsRecord as Record<symbol, unknown>)[sym];
+      if (!isFromPluginMarker(marker)) continue;
+
+      const providerEntry = providers.find((p) => p.name === marker.pluginName);
+      if (!providerEntry) {
+        const available = providers.map((p) => p.name).join(", ") || "(none)";
+        throw new Error(
+          `Agent '${agentName}' references plugin '${marker.pluginName}' via ` +
+            `fromPlugin(), but that plugin is not registered in createApp. ` +
+            `Available: ${available}.`,
+        );
+      }
+
+      const entries = resolveToolkitFromProvider(
+        marker.pluginName,
+        providerEntry.provider,
+        marker.opts,
+      );
+      for (const [key, entry] of Object.entries(entries)) {
+        index.set(key, {
+          source: "toolkit",
+          pluginName: entry.pluginName,
+          localName: entry.localName,
+          def: { ...entry.def, name: key },
+        });
+      }
+    }
+  }
+
   private async connectHostedTools(
     hostedTools: import("../../core/agent/tools/hosted-tools").HostedTool[],
     index: Map<string, ResolvedToolEntry>,
diff --git a/packages/appkit/src/plugins/agents/index.ts b/packages/appkit/src/plugins/agents/index.ts
index c8a31aac3..404da2432 100644
--- a/packages/appkit/src/plugins/agents/index.ts
+++ b/packages/appkit/src/plugins/agents/index.ts
@@ -1,5 +1,11 @@
-export { AgentsPlugin, agents } from "./agents";
 export { buildToolkitEntries } from "../../core/agent/build-toolkit";
+export {
+  FROM_PLUGIN_MARKER,
+  type FromPluginMarker,
+  type FromPluginSpread,
+  fromPlugin,
+  isFromPluginMarker,
+} from "../../core/agent/from-plugin";
 export {
   agentIdFromMarkdownPath,
   type LoadContext,
@@ -12,6 +18,7 @@ export {
   type AgentDefinition,
   type AgentsPluginConfig,
   type AgentTool,
+  type AgentTools,
   type AutoInheritToolsConfig,
   type BaseSystemPromptOption,
   isToolkitEntry,
@@ -21,3 +28,4 @@ export {
   type ToolkitEntry,
   type ToolkitOptions,
 } from "../../core/agent/types";
+export { AgentsPlugin, agents } from "./agents";
diff --git a/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts b/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
index 9c043d56f..42cb6b127 100644
--- a/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
+++ b/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
@@ -11,12 +11,26 @@ import type {
 import { afterEach, beforeEach, describe, expect, test, vi } from "vitest";
 import { z } from "zod";
 import { CacheManager } from "../../../cache";
-// Import the class directly so we can construct it without a createApp
-import { AgentsPlugin } from "../agents";
 import { buildToolkitEntries } from "../../../core/agent/build-toolkit";
-import { defineTool, type ToolRegistry } from "../../../core/agent/tools/define-tool";
-import type { AgentsPluginConfig, ToolkitEntry } from "../../../core/agent/types";
+import { fromPlugin } from "../../../core/agent/from-plugin";
+import {
+  defineTool,
+  type ToolRegistry,
+} from "../../../core/agent/tools/define-tool";
+import { tool } from "../../../core/agent/tools/tool";
+import type {
+  AgentsPluginConfig,
+  ToolkitEntry,
+} from "../../../core/agent/types";
 import { isToolkitEntry } from "../../../core/agent/types";
+// Import the class directly so we can construct it without a createApp
+import { AgentsPlugin } from "../agents";
+
+function namedFactory(name: string) {
+  const f = () => ({ name });
+  Object.defineProperty(f, "pluginName", { value: name, enumerable: true });
+  return f as typeof f & { readonly pluginName: string };
+}
 
 interface FakeContext {
   providers: Array<{ name: string; provider: ToolProvider }>;
@@ -364,4 +378,202 @@ describe("AgentsPlugin", () => {
     expect(isToolkitEntry({ foo: 1 })).toBe(false);
     expect(isToolkitEntry(null)).toBe(false);
   });
+
+  describe("fromPlugin markers", () => {
+    test("spreading fromPlugin registers all tools from the referenced plugin", async () => {
+      const registry: ToolRegistry = {
+        query: defineTool({
+          description: "q",
+          schema: z.object({ sql: z.string() }),
+          handler: () => "ok",
+        }),
+      };
+      const ctx = fakeContext([
+        {
+          name: "analytics",
+          provider: makeToolProvider("analytics", registry),
+        },
+      ]);
+
+      const plugin = instantiate(
+        {
+          dir: false,
+          agents: {
+            support: {
+              instructions: "...",
+              model: stubAdapter(),
+              tools: { ...fromPlugin(namedFactory("analytics")) },
+            },
+          },
+        },
+        ctx,
+      );
+      await plugin.setup();
+
+      const api = plugin.exports() as {
+        get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+      };
+      const agent = api.get("support");
+      expect(agent?.toolIndex.has("analytics.query")).toBe(true);
+    });
+
+    test("mixed inline + fromPlugin tools coexist", async () => {
+      const registry: ToolRegistry = {
+        query: defineTool({
+          description: "q",
+          schema: z.object({ sql: z.string() }),
+          handler: () => "ok",
+        }),
+      };
+      const ctx = fakeContext([
+        {
+          name: "analytics",
+          provider: makeToolProvider("analytics", registry),
+        },
+      ]);
+
+      const plugin = instantiate(
+        {
+          dir: false,
+          agents: {
+            support: {
+              instructions: "...",
+              model: stubAdapter(),
+              tools: {
+                ...fromPlugin(namedFactory("analytics")),
+                get_weather: tool({
+                  name: "get_weather",
+                  description: "Weather",
+                  schema: z.object({ city: z.string() }),
+                  execute: async ({ city }) => `Sunny in ${city}`,
+                }),
+              },
+            },
+          },
+        },
+        ctx,
+      );
+      await plugin.setup();
+
+      const api = plugin.exports() as {
+        get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+      };
+      const agent = api.get("support");
+      expect(agent?.toolIndex.has("analytics.query")).toBe(true);
+      expect(agent?.toolIndex.has("get_weather")).toBe(true);
+    });
+
+    test("missing plugin throws at setup with Available: listing", async () => {
+      const ctx = fakeContext([
+        {
+          name: "files",
+          provider: makeToolProvider("files", {}),
+        },
+      ]);
+
+      const plugin = instantiate(
+        {
+          dir: false,
+          agents: {
+            support: {
+              instructions: "...",
+              model: stubAdapter(),
+              tools: { ...fromPlugin(namedFactory("analytics")) },
+            },
+          },
+        },
+        ctx,
+      );
+      const failure = plugin.setup(); // one call; reused by every assertion
+      await expect(failure).rejects.toThrow(/analytics/);
+      await expect(failure).rejects.toThrow(/Available:[\s\S]*files/);
+    });
+
+    test("symbol-only tools record disables auto-inherit", async () => {
+      const analyticsReg: ToolRegistry = {
+        query: defineTool({
+          description: "q",
+          schema: z.object({ sql: z.string() }),
+          handler: () => "ok",
+        }),
+      };
+      const filesReg: ToolRegistry = {
+        list: defineTool({
+          description: "l",
+          schema: z.object({}),
+          handler: () => [],
+        }),
+      };
+      const ctx = fakeContext([
+        {
+          name: "analytics",
+          provider: makeToolProvider("analytics", analyticsReg),
+        },
+        {
+          name: "files",
+          provider: makeToolProvider("files", filesReg),
+        },
+      ]);
+
+      const plugin = instantiate(
+        {
+          dir: false,
+          autoInheritTools: { code: true },
+          agents: {
+            support: {
+              instructions: "...",
+              model: stubAdapter(),
+              tools: { ...fromPlugin(namedFactory("analytics")) },
+            },
+          },
+        },
+        ctx,
+      );
+      await plugin.setup();
+
+      const api = plugin.exports() as {
+        get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+      };
+      const agent = api.get("support");
+      const toolNames = Array.from(agent?.toolIndex.keys() ?? []);
+      expect(toolNames.some((n) => n.startsWith("analytics."))).toBe(true);
+      expect(toolNames.some((n) => n.startsWith("files."))).toBe(false);
+    });
+
+    test("falls back to getAgentTools() for providers without toolkit()", async () => {
+      // Provider lacks .toolkit() — only getAgentTools/executeAgentTool.
+      const bareProvider: ToolProvider = {
+        getAgentTools: () => [
+          {
+            name: "ping",
+            description: "ping",
+            parameters: { type: "object", properties: {} },
+          },
+        ],
+        executeAgentTool: vi.fn(async () => "pong"),
+      };
+      const ctx = fakeContext([{ name: "bare", provider: bareProvider }]);
+
+      const plugin = instantiate(
+        {
+          dir: false,
+          agents: {
+            support: {
+              instructions: "...",
+              model: stubAdapter(),
+              tools: { ...fromPlugin(namedFactory("bare")) },
+            },
+          },
+        },
+        ctx,
+      );
+      await plugin.setup();
+
+      const api = plugin.exports() as {
+        get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+      };
+      const agent = api.get("support");
+      expect(agent?.toolIndex.has("bare.ping")).toBe(true);
+    });
+  });
 });
diff --git a/packages/appkit/src/plugins/agents/tests/from-plugin.test.ts b/packages/appkit/src/plugins/agents/tests/from-plugin.test.ts
new file mode 100644
index 000000000..eb31d0f7d
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/from-plugin.test.ts
@@ -0,0 +1,80 @@
+import { describe, expect, test } from "vitest";
+import {
+  FROM_PLUGIN_MARKER,
+  fromPlugin,
+  isFromPluginMarker,
+} from "../../../core/agent/from-plugin";
+
+function fakeFactory(name: string) {
+  const f = () => ({ name });
+  Object.defineProperty(f, "pluginName", { value: name, enumerable: true });
+  return f as typeof f & { readonly pluginName: string };
+}
+
+describe("fromPlugin", () => {
+  test("returns a spread-friendly object with a single symbol-keyed marker", () => {
+    const spread = fromPlugin(fakeFactory("analytics"));
+
+    expect(Object.keys(spread)).toHaveLength(0);
+    const syms = Object.getOwnPropertySymbols(spread);
+    expect(syms).toHaveLength(1);
+
+    const marker = (spread as Record<symbol, unknown>)[syms[0]!];
+    expect(isFromPluginMarker(marker)).toBe(true);
+    expect((marker as { pluginName: string }).pluginName).toBe("analytics");
+  });
+
+  test("multiple calls produce distinct symbol keys (spreads coexist)", () => {
+    const spread = {
+      ...fromPlugin(fakeFactory("analytics")),
+      ...fromPlugin(fakeFactory("analytics")),
+      ...fromPlugin(fakeFactory("files")),
+    };
+
+    const syms = Object.getOwnPropertySymbols(spread);
+    expect(syms).toHaveLength(3);
+  });
+
+  test("passes opts through to the marker", () => {
+    const spread = fromPlugin(fakeFactory("analytics"), {
+      only: ["query"],
+      prefix: "q_",
+    });
+    const sym = Object.getOwnPropertySymbols(spread)[0]!;
+    const marker = (spread as Record<symbol, unknown>)[sym] as {
+      opts: { only: string[]; prefix: string };
+    };
+    expect(marker.opts.only).toEqual(["query"]);
+    expect(marker.opts.prefix).toBe("q_");
+  });
+
+  test("throws when factory has no pluginName", () => {
+    const missing = () => ({ name: "nope" });
+    expect(() =>
+      fromPlugin(missing as unknown as { readonly pluginName: string }),
+    ).toThrow(/missing pluginName/);
+  });
+
+  test("FROM_PLUGIN_MARKER is a globally-interned symbol", () => {
+    expect(FROM_PLUGIN_MARKER).toBe(
+      Symbol.for("@databricks/appkit.fromPluginMarker"),
+    );
+  });
+});
+
+describe("isFromPluginMarker", () => {
+  test("returns true for real markers", () => {
+    const spread = fromPlugin(fakeFactory("analytics"));
+    const sym = Object.getOwnPropertySymbols(spread)[0]!;
+    expect(isFromPluginMarker((spread as Record<symbol, unknown>)[sym])).toBe(
+      true,
+    );
+  });
+
+  test("returns false for objects without the brand", () => {
+    expect(isFromPluginMarker({ pluginName: "x" })).toBe(false);
+    expect(isFromPluginMarker(null)).toBe(false);
+    expect(isFromPluginMarker(undefined)).toBe(false);
+    expect(isFromPluginMarker("string")).toBe(false);
+  });
+});

From f45ac9243ac18ed0dc376c643230187cbbda9a17 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Thu, 23 Apr 2026 22:07:53 +0200
Subject: [PATCH 11/46] refactor(appkit): use consumeAdapterStream in
 core/run-agent

runAgent()'s adapter-consumption loop is replaced by the consumeAdapterStream
helper introduced in the agents-plugin layer. One loop now covers all three
execution paths: HTTP streaming (_streamAgent), sub-agents (runSubAgent),
and standalone runAgent. The message_delta + message accumulation rule
(with its LangChain on_chain_end quirk) lives in exactly one place.

Also adds core/agent/tool-dispatch.ts: dispatchToolCall() routes a resolved
tool entry to its toolkit, function, MCP, or sub-agent executor.
---
 packages/appkit/src/core/agent/run-agent.ts   | 28 +++---
 .../appkit/src/core/agent/tool-dispatch.ts    | 97 +++++++++++++++++++
 2 files changed, 108 insertions(+), 17 deletions(-)
 create mode 100644 packages/appkit/src/core/agent/tool-dispatch.ts

diff --git a/packages/appkit/src/core/agent/run-agent.ts b/packages/appkit/src/core/agent/run-agent.ts
index 4646aec74..9c7c655fd 100644
--- a/packages/appkit/src/core/agent/run-agent.ts
+++ b/packages/appkit/src/core/agent/run-agent.ts
@@ -101,28 +101,22 @@ export async function runAgent(
   };
 
   const events: AgentEvent[] = [];
-  let text = "";
-
-  const stream = adapter.run(
+  const text = await consumeAdapterStream(
+    adapter.run(
+      {
+        messages,
+        tools,
+        threadId: randomUUID(),
+        signal,
+      },
+      { executeTool, signal },
+    ),
     {
-      messages,
-      tools,
-      threadId: randomUUID(),
       signal,
+      onEvent: (event) => events.push(event),
     },
-    { executeTool, signal },
   );
 
-  for await (const event of stream) {
-    if (signal?.aborted) break;
-    events.push(event);
-    if (event.type === "message_delta") {
-      text += event.content;
-    } else if (event.type === "message") {
-      text = event.content;
-    }
-  }
-
   return { text, events };
 }
 
diff --git a/packages/appkit/src/core/agent/tool-dispatch.ts b/packages/appkit/src/core/agent/tool-dispatch.ts
new file mode 100644
index 000000000..a3e220bbd
--- /dev/null
+++ b/packages/appkit/src/core/agent/tool-dispatch.ts
@@ -0,0 +1,97 @@
+import type express from "express";
+import type { AppKitMcpClient } from "../../connectors/mcp";
+import type { PluginContext } from "../../core/plugin-context";
+import type { ResolvedToolEntry } from "./types";
+
+interface ToolDispatchContext {
+  /**
+   * The originating HTTP request. Used by `toolkit` entries to scope execution
+   * to the caller's user context (`asUser(req)`) and by `mcp` entries to pick
+   * up the OBO bearer token from `x-forwarded-access-token`.
+   */
+  req: express.Request;
+  /** Cancellation signal, forwarded to the tool implementation. */
+  signal: AbortSignal;
+  /**
+   * PluginContext mediator — required to dispatch `toolkit` entries. Absent in
+   * unit tests that construct `AgentsPlugin` directly; callers may pass
+   * `null` / `undefined`, in which case toolkit calls throw a clear error.
+   */
+  pluginContext?: PluginContext | null;
+  /** Live MCP client. Required for `mcp` entries. */
+  mcpClient?: AppKitMcpClient | null;
+  /**
+   * Delegates a sub-agent invocation. The closure owns the recursion depth so
+   * the dispatcher itself remains depth-agnostic — the top-level caller
+   * passes `depth = 1`, and a sub-agent's inner dispatcher passes `depth + 1`.
+   */
+  runSubAgent: (agentName: string, args: unknown) => Promise<unknown>;
+}
+
+/**
+ * Routes a resolved tool entry to the executor matching its `source`. A new
+ * `source` variant is added here, in one place: the `never`-typed default
+ * stops the build until this switch handles it.
+ *
+ * This only handles dispatch — result normalisation (`normalizeToolResult`),
+ * budget counting, and approval gating remain at the call site, where each
+ * stream has different policies.
+ */
+export async function dispatchToolCall(
+  entry: ResolvedToolEntry,
+  args: unknown,
+  ctx: ToolDispatchContext,
+): Promise<unknown> {
+  switch (entry.source) {
+    case "toolkit": {
+      if (!ctx.pluginContext) {
+        throw new Error(
+          "Plugin tool execution requires PluginContext; " +
+            "this should never happen through createApp.",
+        );
+      }
+      return ctx.pluginContext.executeTool(
+        ctx.req,
+        entry.pluginName,
+        entry.localName,
+        args,
+        ctx.signal,
+      );
+    }
+    case "function":
+      return entry.functionTool.execute(args as Record<string, unknown>);
+    case "mcp": {
+      if (!ctx.mcpClient) throw new Error("MCP client not connected");
+      return ctx.mcpClient.callTool(
+        entry.mcpToolName,
+        args,
+        extractOboMcpAuth(ctx.req),
+      );
+    }
+    case "subagent":
+      return ctx.runSubAgent(entry.agentName, args);
+    default: {
+      // Exhaustiveness guard: a `source` added to ResolvedToolEntry but not
+      // handled by a case above makes this `never` assignment a type error.
+      const _exhaustive: never = entry;
+      throw new Error(
+        `Unsupported tool source: ${(_exhaustive as ResolvedToolEntry).source}`,
+      );
+    }
+  }
+}
+
+/**
+ * Builds MCP auth headers from the caller's OBO bearer token, taken from the
+ * Databricks Apps `x-forwarded-access-token` header; `undefined` if it is not
+ * a string. Destinations `forwardWorkspaceAuth` admits as same-origin receive
+ * it; non-workspace ones drop it in {@link AppKitMcpClient.callTool}.
+ */
+function extractOboMcpAuth(
+  req: express.Request,
+): Record<string, string> | undefined {
+  const oboToken = req.headers["x-forwarded-access-token"];
+  return typeof oboToken === "string"
+    ? { Authorization: `Bearer ${oboToken}` }
+    : undefined;
+}

From 3e23d0c9f7bada1a076de6835884f48342c91972 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Mon, 4 May 2026 14:59:08 +0200
Subject: [PATCH 12/46] fix(agents): update agents.ts imports to core/agent/
 paths after Option A rewrite

normalize-result, consume-adapter-stream, and tool-dispatch live in
core/agent/. Sort the consume-adapter-stream and normalize-result imports
into the core/agent/ import group in agents.ts, and add the dispatchToolCall
import from core/agent/tool-dispatch.
---
 packages/appkit/src/plugins/agents/agents.ts | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index 309589e0f..d7218eec7 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -16,12 +16,15 @@ import type {
 } from "shared";
 import { AppKitMcpClient, buildMcpHostPolicy } from "../../connectors/mcp";
 import { getWorkspaceClient } from "../../context";
+import { consumeAdapterStream } from "../../core/agent/consume-adapter-stream";
 import { isFromPluginMarker } from "../../core/agent/from-plugin";
 import { loadAgentsFromDir } from "../../core/agent/load-agents";
+import { normalizeToolResult } from "../../core/agent/normalize-result";
 import {
   buildBaseSystemPrompt,
   composeSystemPrompt,
 } from "../../core/agent/system-prompt";
+import { dispatchToolCall } from "../../core/agent/tool-dispatch";
 import { resolveToolkitFromProvider } from "../../core/agent/toolkit-resolver";
 import {
   functionToolToDefinition,
@@ -41,12 +44,10 @@ import { isToolkitEntry } from "../../core/agent/types";
 import { createLogger } from "../../logging/logger";
 import { Plugin, toPlugin } from "../../plugin";
 import type { PluginManifest } from "../../registry";
-import { consumeAdapterStream } from "../../core/agent/consume-adapter-stream";
 import { agentStreamDefaults } from "./defaults";
 import { EventChannel } from "./event-channel";
 import { AgentEventTranslator } from "./event-translator";
 import manifest from "./manifest.json";
-import { normalizeToolResult } from "../../core/agent/normalize-result";
 import {
   approvalRequestSchema,
   chatRequestSchema,

From e22db6239fd28e0d5f3a44c2737721e019c5dddd Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Mon, 4 May 2026 19:49:58 +0200
Subject: [PATCH 13/46] feat(appkit): sub-agent approval gate and
 HttpToolExecutor path (SDK)

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 packages/appkit/src/plugins/agents/agents.ts | 373 ++++++++++---------
 1 file changed, 206 insertions(+), 167 deletions(-)

diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index d7218eec7..684315229 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -12,49 +12,47 @@ import type {
   PluginPhase,
   ResponseStreamEvent,
   Thread,
+  ToolAnnotations,
   ToolProvider,
 } from "shared";
 import { AppKitMcpClient, buildMcpHostPolicy } from "../../connectors/mcp";
 import { getWorkspaceClient } from "../../context";
-import { consumeAdapterStream } from "../../core/agent/consume-adapter-stream";
-import { isFromPluginMarker } from "../../core/agent/from-plugin";
-import { loadAgentsFromDir } from "../../core/agent/load-agents";
-import { normalizeToolResult } from "../../core/agent/normalize-result";
-import {
-  buildBaseSystemPrompt,
-  composeSystemPrompt,
-} from "../../core/agent/system-prompt";
-import { dispatchToolCall } from "../../core/agent/tool-dispatch";
-import { resolveToolkitFromProvider } from "../../core/agent/toolkit-resolver";
-import {
-  functionToolToDefinition,
-  isFunctionTool,
-  isHostedTool,
-  resolveHostedTools,
-} from "../../core/agent/tools";
-import type {
-  AgentDefinition,
-  AgentsPluginConfig,
-  BaseSystemPromptOption,
-  PromptContext,
-  RegisteredAgent,
-  ResolvedToolEntry,
-} from "../../core/agent/types";
-import { isToolkitEntry } from "../../core/agent/types";
 import { createLogger } from "../../logging/logger";
 import { Plugin, toPlugin } from "../../plugin";
 import type { PluginManifest } from "../../registry";
+import { consumeAdapterStream } from "./consume-adapter-stream";
 import { agentStreamDefaults } from "./defaults";
 import { EventChannel } from "./event-channel";
 import { AgentEventTranslator } from "./event-translator";
+import { isFromPluginMarker } from "./from-plugin";
+import { loadAgentsFromDir } from "./load-agents";
 import manifest from "./manifest.json";
+import { normalizeToolResult } from "./normalize-result";
 import {
   approvalRequestSchema,
   chatRequestSchema,
   invocationsRequestSchema,
 } from "./schemas";
+import { buildBaseSystemPrompt, composeSystemPrompt } from "./system-prompt";
 import { InMemoryThreadStore } from "./thread-store";
 import { ToolApprovalGate } from "./tool-approval-gate";
+import { dispatchToolCall } from "./tool-dispatch";
+import { resolveToolkitFromProvider } from "./toolkit-resolver";
+import {
+  functionToolToDefinition,
+  isFunctionTool,
+  isHostedTool,
+  resolveHostedTools,
+} from "./tools";
+import type {
+  AgentDefinition,
+  AgentsPluginConfig,
+  BaseSystemPromptOption,
+  PromptContext,
+  RegisteredAgent,
+  ResolvedToolEntry,
+} from "./types";
+import { isToolkitEntry } from "./types";
 
 const logger = createLogger("agents");
 
@@ -381,8 +379,7 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     this.resolveFromPluginMarkers(agentName, toolsRecord, index);
 
     // 3. Explicit tools (toolkit entries, function tools, hosted tools)
-    const hostedToCollect: import("../../core/agent/tools/hosted-tools").HostedTool[] =
-      [];
+    const hostedToCollect: import("./tools/hosted-tools").HostedTool[] = [];
     for (const [key, tool] of Object.entries(toolsRecord)) {
       if (isToolkitEntry(tool)) {
         index.set(key, {
@@ -521,38 +518,28 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
   }
 
   private async connectHostedTools(
-    hostedTools: import("../../core/agent/tools/hosted-tools").HostedTool[],
+    hostedTools: import("./tools/hosted-tools").HostedTool[],
     index: Map<string, ResolvedToolEntry>,
   ): Promise<void> {
-    let host: string | undefined;
-    let authenticate: () => Promise<Record<string, string>>;
-
-    try {
-      const { getWorkspaceClient } = await import("../../context");
-      const wsClient = getWorkspaceClient();
-      await wsClient.config.ensureResolved();
-      host = wsClient.config.host;
-      authenticate = async () => {
-        const headers = new Headers();
-        await wsClient.config.authenticate(headers);
-        return Object.fromEntries(headers.entries());
-      };
-    } catch {
-      host = process.env.DATABRICKS_HOST;
-      authenticate = async (): Promise<Record<string, string>> => {
-        const token = process.env.DATABRICKS_TOKEN;
-        return token ? { Authorization: `Bearer ${token}` } : {};
-      };
-    }
+    const wsClient = await this.resolveWorkspaceClient();
+    await wsClient.config.ensureResolved();
+    const host = wsClient.config.host;
 
     if (!host) {
       logger.warn(
-        "No Databricks host available — skipping %d hosted tool(s)",
+        "No Databricks host available — skipping %d hosted tool(s). " +
+          "Set DATABRICKS_HOST or configure a profile in ~/.databrickscfg.",
         hostedTools.length,
       );
       return;
     }
 
+    const authenticate = async (): Promise<Record<string, string>> => {
+      const headers = new Headers();
+      await wsClient.config.authenticate(headers);
+      return Object.fromEntries(headers.entries());
+    };
+
     if (!this.mcpClient) {
       const policy = buildMcpHostPolicy(this.config.mcp, host);
       this.mcpClient = new AppKitMcpClient(host, authenticate, policy);
@@ -570,6 +557,23 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     }
   }
 
+  /**
+   * Return the ambient workspace client from {@link getWorkspaceClient} when
+   * `ServiceContext` is initialized (the normal `createApp` path). Fall back
+   * to a fresh `WorkspaceClient()` that walks the SDK's credential chain —
+   * `DATABRICKS_HOST` / `DATABRICKS_TOKEN`, `~/.databrickscfg` profiles,
+   * DAB auth, OAuth, metadata service — for test rigs and manual embeds
+   * that never ran through `createApp`.
+   */
+  private async resolveWorkspaceClient() {
+    try {
+      return getWorkspaceClient();
+    } catch {
+      const { WorkspaceClient } = await import("@databricks/sdk-experimental");
+      return new WorkspaceClient({});
+    }
+  }
+
   // ----------------- ToolProvider (no tools of our own) --------------------
 
   getAgentTools(): AgentToolDefinition[] {
@@ -793,83 +797,76 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
       const entry = registered.toolIndex.get(name);
       if (!entry) throw new Error(`Unknown tool: ${name}`);
 
-      if (
-        approvalPolicy.requireForDestructive &&
-        entry.def.annotations?.destructive === true
-      ) {
+      // Approval flow used by BOTH the parent stream and any sub-agents
+      // delegated to from it. Sub-agents were previously running destructive
+      // tools without ever surfacing the gate; this closure lifts the check
+      // so `runSubAgent.childExecute` can reuse the exact same semantics
+      // (event emission + gate.wait + deny string).
+      const checkApproval = async (
+        toolEntry: ResolvedToolEntry,
+        toolArgs: unknown,
+      ): Promise<"approve" | "deny" | null> => {
+        if (!approvalPolicy.requireForDestructive) return null;
+        if (!isDestructiveToolEntry(toolEntry)) return null;
         const approvalId = randomUUID();
         for (const ev of translator.translate({
           type: "approval_pending",
           approvalId,
           streamId: requestId,
-          toolName: name,
-          args,
-          annotations: entry.def.annotations,
+          toolName: toolEntry.def.name,
+          args: toolArgs,
+          annotations: combinedToolAnnotations(toolEntry),
         })) {
           outboundEvents.push(ev);
         }
-        const decision = await this.approvalGate.wait({
+        return this.approvalGate.wait({
           approvalId,
           streamId: requestId,
           userId,
           timeoutMs: approvalPolicy.timeoutMs,
         });
-        if (decision === "deny") {
-          return `Tool execution denied by user approval gate (tool: ${name}).`;
-        }
+      };
+
+      const decision = await checkApproval(entry, args);
+      if (decision === "deny") {
+        return `Tool execution denied by user approval gate (tool: ${name}).`;
       }
 
-      let result: unknown;
-      if (entry.source === "toolkit") {
-        if (!this.context) {
-          throw new Error(
-            "Plugin tool execution requires PluginContext; this should never happen through createApp",
-          );
+      // Forward tool-call / tool-result events from nested sub-agents into
+      // the parent's outbound SSE stream. Without this the client only sees
+      // the outer `agent-<name>` function call and never the inner tool
+      // invocations the sub-agent makes — so UI-action tools (apply_filter,
+      // highlight_period, etc.) that rely on SSE-based dispatch are
+      // invisible to the browser. Message deltas and metadata are
+      // deliberately NOT forwarded: that would bleed the sub-agent's
+      // assistant text into the parent's chat and double-emit threadIds.
+      const forwardSubAgentToolEvent = (ev: AgentEvent): void => {
+        if (ev.type !== "tool_call" && ev.type !== "tool_result") return;
+        for (const translated of translator.translate(ev)) {
+          outboundEvents.push(translated);
         }
-        result = await this.context.executeTool(
-          req,
-          entry.pluginName,
-          entry.localName,
-          args,
-          signal,
-        );
-      } else if (entry.source === "function") {
-        result = await entry.functionTool.execute(
-          args as Record<string, unknown>,
-        );
-      } else if (entry.source === "mcp") {
-        if (!this.mcpClient) throw new Error("MCP client not connected");
-        const oboToken = req.headers["x-forwarded-access-token"];
-        const mcpAuth =
-          typeof oboToken === "string"
-            ? { Authorization: `Bearer ${oboToken}` }
-            : undefined;
-        result = await this.mcpClient.callTool(
-          entry.mcpToolName,
-          args,
-          mcpAuth,
-        );
-      } else if (entry.source === "subagent") {
-        const childAgent = this.agents.get(entry.agentName);
-        if (!childAgent)
-          throw new Error(`Sub-agent not found: ${entry.agentName}`);
-        result = await this.runSubAgent(req, childAgent, args, signal, 1);
-      }
+      };
 
-      // A `void` / `undefined` return is a legitimate tool outcome (e.g., a
-      // "send notification" side-effecting tool). Return an empty string so
-      // the LLM sees a successful-but-empty result rather than a bogus
-      // "execution failed" error.
-      if (result === undefined) {
-        return "";
-      }
-      const MAX = 50_000;
-      const serialized =
-        typeof result === "string" ? result : JSON.stringify(result);
-      if (serialized.length > MAX) {
-        return `${serialized.slice(0, MAX)}\n\n[Result truncated: ${serialized.length} chars exceeds ${MAX} limit]`;
-      }
-      return result;
+      const raw = await dispatchToolCall(entry, args, {
+        req,
+        signal,
+        pluginContext: this.context,
+        mcpClient: this.mcpClient,
+        runSubAgent: (agentName, subArgs) => {
+          const childAgent = this.agents.get(agentName);
+          if (!childAgent) throw new Error(`Sub-agent not found: ${agentName}`);
+          return this.runSubAgent(
+            req,
+            childAgent,
+            subArgs,
+            signal,
+            1,
+            forwardSubAgentToolEvent,
+            checkApproval,
+          );
+        },
+      });
+      return normalizeToolResult(raw);
     };
 
     // Drive the adapter and the approval-event side-channel concurrently.
@@ -920,26 +917,14 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
           { executeTool, signal },
         );
 
-        // Accumulate assistant output from BOTH streaming and non-streaming
-        // adapters. Delta-based adapters (Databricks, Vercel AI) emit
-        // `message_delta` chunks that we concatenate; adapters that yield a
-        // single final assistant message (e.g. LangChain's `on_chain_end`
-        // path) emit a `message` event whose content replaces whatever
-        // deltas already arrived. Without the `message` branch, multi-turn
-        // LangChain conversations silently dropped the assistant turn from
-        // thread history.
-        let fullContent = "";
-        for await (const event of stream) {
-          if (signal.aborted) break;
-          if (event.type === "message_delta") {
-            fullContent += event.content;
-          } else if (event.type === "message") {
-            fullContent = event.content;
-          }
-          for (const translated of translator.translate(event)) {
-            outboundEvents.push(translated);
-          }
-        }
+        const fullContent = await consumeAdapterStream(stream, {
+          signal,
+          onEvent: (event) => {
+            for (const translated of translator.translate(event)) {
+              outboundEvents.push(translated);
+            }
+          },
+        });
 
         if (fullContent) {
           await this.threadStore.addMessage(thread.id, userId, {
@@ -1017,6 +1002,26 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     args: unknown,
     signal: AbortSignal,
     depth: number,
+    /**
+     * Optional per-event sink installed by the parent `_streamAgent`. When
+     * supplied, each adapter event the child yields is passed through —
+     * the parent's closure filters it to `tool_call` / `tool_result` so
+     * inner tool invocations surface to the client's SSE stream without
+     * also bleeding the sub-agent's assistant text.
+     */
+    onEvent?: (event: AgentEvent) => void,
+    /**
+     * Optional approval gate injected by the parent `_streamAgent`. When
+     * present, sub-agent tool calls annotated `destructive: true` fire
+     * `appkit.approval_pending` through the parent's outbound channel and
+     * await the user's decision, exactly like the parent's own executeTool.
+     * Absent (or returning `null`) means no gate — non-destructive tools
+     * or approval disabled policy-wide.
+     */
+    checkApproval?: (
+      entry: ResolvedToolEntry,
+      toolArgs: unknown,
+    ) => Promise<"approve" | "deny" | null>,
   ): Promise<string> {
     const limits = this.resolvedLimits;
     if (depth > limits.maxSubAgentDepth) {
@@ -1040,33 +1045,33 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     ): Promise<unknown> => {
       const entry = child.toolIndex.get(name);
       if (!entry) throw new Error(`Unknown tool in sub-agent: ${name}`);
-      if (entry.source === "toolkit" && this.context) {
-        return this.context.executeTool(
-          req,
-          entry.pluginName,
-          entry.localName,
-          childArgs,
-          signal,
-        );
-      }
-      if (entry.source === "function") {
-        return entry.functionTool.execute(childArgs as Record<string, unknown>);
-      }
-      if (entry.source === "subagent") {
-        const grandchild = this.agents.get(entry.agentName);
-        if (!grandchild)
-          throw new Error(`Sub-agent not found: ${entry.agentName}`);
-        return this.runSubAgent(req, grandchild, childArgs, signal, depth + 1);
-      }
-      if (entry.source === "mcp" && this.mcpClient) {
-        const oboToken = req.headers["x-forwarded-access-token"];
-        const mcpAuth =
-          typeof oboToken === "string"
-            ? { Authorization: `Bearer ${oboToken}` }
-            : undefined;
-        return this.mcpClient.callTool(entry.mcpToolName, childArgs, mcpAuth);
+
+      if (checkApproval) {
+        const decision = await checkApproval(entry, childArgs);
+        if (decision === "deny") {
+          return `Tool execution denied by user approval gate (tool: ${name}).`;
+        }
       }
-      throw new Error(`Unsupported sub-agent tool source: ${entry.source}`);
+
+      return dispatchToolCall(entry, childArgs, {
+        req,
+        signal,
+        pluginContext: this.context,
+        mcpClient: this.mcpClient,
+        runSubAgent: (agentName, args) => {
+          const grandchild = this.agents.get(agentName);
+          if (!grandchild) throw new Error(`Sub-agent not found: ${agentName}`);
+          return this.runSubAgent(
+            req,
+            grandchild,
+            args,
+            signal,
+            depth + 1,
+            onEvent,
+            checkApproval,
+          );
+        },
+      });
     };
 
     const runContext: AgentRunContext = { executeTool: childExecute, signal };
@@ -1101,17 +1106,13 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
       },
     ];
 
-    let output = "";
-    const events: AgentEvent[] = [];
-    for await (const event of child.adapter.run(
-      { messages, tools: childTools, threadId: randomUUID(), signal },
-      runContext,
-    )) {
-      events.push(event);
-      if (event.type === "message_delta") output += event.content;
-      else if (event.type === "message") output = event.content;
-    }
-    return output;
+    return consumeAdapterStream(
+      child.adapter.run(
+        { messages, tools: childTools, threadId: randomUUID(), signal },
+        runContext,
+      ),
+      { signal, onEvent },
+    );
   }
 
   private async _handleCancel(req: express.Request, res: express.Response) {
@@ -1265,6 +1266,44 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
   }
 }
 
+/**
+ * True when the tool should go through the approval gate. Historically
+ * scoped to `destructive: true` — hence the name — but now also fires for
+ * the semantic `effect` enum on {@link ToolAnnotations}. Any effect that
+ * mutates the world (`write` | `update` | `destructive`) gates; `read` and
+ * unannotated tools do not. `def.annotations` is the normal path; for
+ * `function` tools we also read `functionTool.annotations` so a mismatch
+ * between the spread def and the original {@link FunctionTool} cannot drop
+ * the hint.
+ */
+function isDestructiveToolEntry(entry: ResolvedToolEntry): boolean {
+  const defAnn = entry.def.annotations;
+  const fnAnn =
+    entry.source === "function" ? entry.functionTool.annotations : undefined;
+
+  const effect = defAnn?.effect ?? fnAnn?.effect;
+  if (effect === "write" || effect === "update" || effect === "destructive") {
+    return true;
+  }
+  if (defAnn?.destructive === true) return true;
+  if (fnAnn?.destructive === true) return true;
+  return false;
+}
+
+/** Merged annotations for the approval SSE payload (client UI + debugging). */
+function combinedToolAnnotations(
+  entry: ResolvedToolEntry,
+): ToolAnnotations | undefined {
+  if (entry.source === "function") {
+    const merged: ToolAnnotations = {
+      ...entry.functionTool.annotations,
+      ...entry.def.annotations,
+    };
+    return Object.keys(merged).length > 0 ? merged : undefined;
+  }
+  return entry.def.annotations;
+}
+
 function normalizeAutoInherit(value: AgentsPluginConfig["autoInheritTools"]): {
   file: boolean;
   code: boolean;
@@ -1302,7 +1341,7 @@ function composePromptForAgent(
 }
 
 /**
- * Plugin factory for the agents plugin. Reads `config/agents/*.md` by default,
+ * Plugin factory for the agents plugin. Reads `config/agents/<id>/agent.md` by default,
  * resolves toolkits/tools from registered plugins, exposes `appkit.agents.*`
  * runtime API and mounts `/invocations`.
  *

From 62dc7f3e1e9788e7d709ff9aba92a2e6f6a73ba7 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Mon, 4 May 2026 19:50:02 +0200
Subject: [PATCH 14/46] fix(appkit): forward all sub-agent events except
 metadata (SDK)

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 packages/appkit/src/plugins/agents/agents.ts | 33 +++++++++++---------
 1 file changed, 19 insertions(+), 14 deletions(-)

diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index 684315229..ab264b295 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -832,16 +832,21 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
         return `Tool execution denied by user approval gate (tool: ${name}).`;
       }
 
-      // Forward tool-call / tool-result events from nested sub-agents into
-      // the parent's outbound SSE stream. Without this the client only sees
-      // the outer `agent-<name>` function call and never the inner tool
-      // invocations the sub-agent makes — so UI-action tools (apply_filter,
-      // highlight_period, etc.) that rely on SSE-based dispatch are
-      // invisible to the browser. Message deltas and metadata are
-      // deliberately NOT forwarded: that would bleed the sub-agent's
-      // assistant text into the parent's chat and double-emit threadIds.
-      const forwardSubAgentToolEvent = (ev: AgentEvent): void => {
-        if (ev.type !== "tool_call" && ev.type !== "tool_result") return;
+      // Forward events from nested sub-agents into the parent's outbound
+      // SSE stream so the client sees inner tool calls AND the sub-agent's
+      // streaming text as it's generated. Without this the user stares at
+      // "thinking…" for the full duration of the sub-agent run.
+      //
+      // The one exception is `metadata`: sub-agents have their own
+      // threadId, and forwarding it would overwrite the parent's thread
+      // state on the client and break multi-turn continuity.
+      //
+      // `approval_pending` is not emitted by adapters directly — it comes
+      // through `checkApproval()` which already pushes to the parent's
+      // outboundEvents — so sub-agent destructive approvals surface
+      // independently of this forwarder.
+      const forwardSubAgentEvent = (ev: AgentEvent): void => {
+        if (ev.type === "metadata") return;
         for (const translated of translator.translate(ev)) {
           outboundEvents.push(translated);
         }
@@ -861,7 +866,7 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
             subArgs,
             signal,
             1,
-            forwardSubAgentToolEvent,
+            forwardSubAgentEvent,
             checkApproval,
           );
         },
@@ -1005,9 +1010,9 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     /**
      * Optional per-event sink installed by the parent `_streamAgent`. When
      * supplied, each adapter event the child yields is passed through —
-     * the parent's closure filters it to `tool_call` / `tool_result` so
-     * inner tool invocations surface to the client's SSE stream without
-     * also bleeding the sub-agent's assistant text.
+     * the parent's closure forwards everything except `metadata` so the
+     * sub-agent's streaming text, tool invocations, and thinking blocks
+     * all surface to the client's SSE stream in real time.
      */
     onEvent?: (event: AgentEvent) => void,
     /**

From 732498d3951aa80d4c967404fd93201a9dec049c Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Wed, 29 Apr 2026 18:19:25 +0200
Subject: [PATCH 15/46] refactor(appkit): move agent runtime to core/agent/

Flips the layering: agent types, helpers, and the standalone runner now
live in core/agent/ instead of plugins/agents/. The HTTP-facing agents()
plugin still owns its routes/streaming/threads but no longer owns the
framework primitives that peer plugins depend on.

Moved (with git mv to preserve history):
- plugins/agents/{types,from-plugin,build-toolkit,toolkit-resolver,
  consume-adapter-stream,normalize-result,tool-dispatch,system-prompt,
  load-agents}.ts -> core/agent/
- plugins/agents/tools/{tool,define-tool,function-tool,hosted-tools,
  sql-policy,json-schema,index}.ts -> core/agent/tools/
- core/{run-agent,create-agent-def}.ts -> core/agent/{run-agent,create-agent}.ts
- 14 corresponding test files -> core/agent/tests/

Stayed in plugins/agents/ (HTTP/route concerns):
- agents.ts, event-channel.ts, event-translator.ts, tool-approval-gate.ts,
  thread-store.ts, schemas.ts, defaults.ts, manifest.json, index.ts

Updated imports across analytics, files, genie, lakebase to source from
core/agent/ directly. plugins/agents/index.ts stays as a back-compat
barrel that re-exports the moved primitives, so the public package
surface (@databricks/appkit) is byte-identical.

Verified: tsc --noEmit clean, 1581/1581 appkit tests pass.
---
 knip.json                                     | 10 +--
 packages/appkit/src/connectors/mcp/types.ts   |  2 +-
 packages/appkit/src/core/agent/index.ts       | 64 +++++++++++++++++++
 .../src/core/agent/tests/create-agent.test.ts |  4 +-
 .../agent}/tests/from-plugin.test.ts          |  0
 .../agent}/tests/mcp-server-helper.test.ts    |  0
 .../src/core/agent/tests/run-agent.test.ts    |  2 +-
 .../appkit/src/core/agent/tool-dispatch.ts    |  2 +-
 packages/appkit/src/plugins/agents/agents.ts  | 52 ++++++++-------
 packages/appkit/src/plugins/agents/index.ts   |  3 +
 10 files changed, 105 insertions(+), 34 deletions(-)
 create mode 100644 packages/appkit/src/core/agent/index.ts
 rename packages/appkit/src/{plugins/agents => core/agent}/tests/from-plugin.test.ts (100%)
 rename packages/appkit/src/{plugins/agents => core/agent}/tests/mcp-server-helper.test.ts (100%)

diff --git a/knip.json b/knip.json
index f530b3918..0a2351b79 100644
--- a/knip.json
+++ b/knip.json
@@ -19,15 +19,15 @@
     "packages/appkit/src/plugin/index.ts",
     "packages/appkit/src/plugin/to-plugin.ts",
     "packages/appkit/src/plugins/agents/index.ts",
-    "template/**",
-    "tools/**",
-    "docs/**",
-    ".github/scripts/**",
+    "packages/appkit/src/core/agent/index.ts",
     "packages/appkit/src/core/agent/tools/index.ts",
     "packages/appkit/src/core/agent/from-plugin.ts",
     "packages/appkit/src/core/agent/load-agents.ts",
     "packages/appkit/src/connectors/mcp/index.ts",
-    "packages/appkit/src/plugin/to-plugin.ts"
+    "template/**",
+    "tools/**",
+    "docs/**",
+    ".github/scripts/**"
   ],
   "ignoreDependencies": ["json-schema-to-typescript"],
   "ignoreBinaries": ["tarball"]
diff --git a/packages/appkit/src/connectors/mcp/types.ts b/packages/appkit/src/connectors/mcp/types.ts
index d74f0a46c..aeb61788e 100644
--- a/packages/appkit/src/connectors/mcp/types.ts
+++ b/packages/appkit/src/connectors/mcp/types.ts
@@ -1,7 +1,7 @@
 /**
  * Input shape consumed by {@link AppKitMcpClient.connect}. Produced by the
  * agents plugin from user-facing `HostedTool` declarations (see
- * `plugins/agents/tools/hosted-tools.ts`) and accepted directly by the
+ * `core/agent/tools/hosted-tools.ts`) and accepted directly by the
  * connector to keep its surface free of agent-layer concepts.
  */
 export interface McpEndpointConfig {
diff --git a/packages/appkit/src/core/agent/index.ts b/packages/appkit/src/core/agent/index.ts
new file mode 100644
index 000000000..c11c48282
--- /dev/null
+++ b/packages/appkit/src/core/agent/index.ts
@@ -0,0 +1,64 @@
+/**
+ * Agent runtime primitives. All framework-level agent types, tool helpers,
+ * and the standalone runner live here. The HTTP-facing `agents()` plugin in
+ * `plugins/agents/` consumes these but does not own them — peer plugins
+ * (analytics, files, genie, lakebase) can depend on this module without
+ * reaching across the sibling boundary.
+ */
+export { buildToolkitEntries } from "./build-toolkit";
+export { consumeAdapterStream } from "./consume-adapter-stream";
+export { createAgent } from "./create-agent";
+export {
+  FROM_PLUGIN_MARKER,
+  type FromPluginMarker,
+  type FromPluginSpread,
+  fromPlugin,
+  isFromPluginMarker,
+} from "./from-plugin";
+export {
+  agentIdFromMarkdownPath,
+  type LoadContext,
+  type LoadResult,
+  loadAgentFromFile,
+  loadAgentsFromDir,
+  parseFrontmatter,
+} from "./load-agents";
+export { normalizeToolResult } from "./normalize-result";
+export {
+  type RunAgentInput,
+  type RunAgentResult,
+  runAgent,
+} from "./run-agent";
+export { buildBaseSystemPrompt, composeSystemPrompt } from "./system-prompt";
+export { dispatchToolCall } from "./tool-dispatch";
+export { resolveToolkitFromProvider } from "./toolkit-resolver";
+export {
+  defineTool,
+  executeFromRegistry,
+  type FunctionTool,
+  functionToolToDefinition,
+  type HostedTool,
+  isFunctionTool,
+  isHostedTool,
+  mcpServer,
+  resolveHostedTools,
+  type ToolConfig,
+  type ToolEntry,
+  type ToolRegistry,
+  tool,
+  toolsFromRegistry,
+} from "./tools";
+export {
+  type AgentDefinition,
+  type AgentsPluginConfig,
+  type AgentTool,
+  type AgentTools,
+  type AutoInheritToolsConfig,
+  type BaseSystemPromptOption,
+  isToolkitEntry,
+  type PromptContext,
+  type RegisteredAgent,
+  type ResolvedToolEntry,
+  type ToolkitEntry,
+  type ToolkitOptions,
+} from "./types";
diff --git a/packages/appkit/src/core/agent/tests/create-agent.test.ts b/packages/appkit/src/core/agent/tests/create-agent.test.ts
index 30bcc98e9..df920369e 100644
--- a/packages/appkit/src/core/agent/tests/create-agent.test.ts
+++ b/packages/appkit/src/core/agent/tests/create-agent.test.ts
@@ -1,8 +1,8 @@
 import { describe, expect, test } from "vitest";
 import { z } from "zod";
 import { createAgent } from "../create-agent";
-import { tool } from "../../../core/agent/tools/tool";
-import type { AgentDefinition } from "../../../core/agent/types";
+import { tool } from "../tools/tool";
+import type { AgentDefinition } from "../types";
 
 describe("createAgent", () => {
   test("returns the definition unchanged for a simple agent", () => {
diff --git a/packages/appkit/src/plugins/agents/tests/from-plugin.test.ts b/packages/appkit/src/core/agent/tests/from-plugin.test.ts
similarity index 100%
rename from packages/appkit/src/plugins/agents/tests/from-plugin.test.ts
rename to packages/appkit/src/core/agent/tests/from-plugin.test.ts
diff --git a/packages/appkit/src/plugins/agents/tests/mcp-server-helper.test.ts b/packages/appkit/src/core/agent/tests/mcp-server-helper.test.ts
similarity index 100%
rename from packages/appkit/src/plugins/agents/tests/mcp-server-helper.test.ts
rename to packages/appkit/src/core/agent/tests/mcp-server-helper.test.ts
diff --git a/packages/appkit/src/core/agent/tests/run-agent.test.ts b/packages/appkit/src/core/agent/tests/run-agent.test.ts
index 5324dde21..9ead2c177 100644
--- a/packages/appkit/src/core/agent/tests/run-agent.test.ts
+++ b/packages/appkit/src/core/agent/tests/run-agent.test.ts
@@ -10,11 +10,11 @@ import type {
 } from "shared";
 import { describe, expect, test, vi } from "vitest";
 import { z } from "zod";
-import type { ToolkitEntry } from "../../../core/agent/types";
 import { createAgent } from "../create-agent";
 import { fromPlugin } from "../from-plugin";
 import { runAgent } from "../run-agent";
 import { tool } from "../tools/tool";
+import type { ToolkitEntry } from "../types";
 
 function scriptedAdapter(events: AgentEvent[]): AgentAdapter {
   return {
diff --git a/packages/appkit/src/core/agent/tool-dispatch.ts b/packages/appkit/src/core/agent/tool-dispatch.ts
index a3e220bbd..728f57990 100644
--- a/packages/appkit/src/core/agent/tool-dispatch.ts
+++ b/packages/appkit/src/core/agent/tool-dispatch.ts
@@ -1,6 +1,6 @@
 import type express from "express";
 import type { AppKitMcpClient } from "../../connectors/mcp";
-import type { PluginContext } from "../../core/plugin-context";
+import type { PluginContext } from "../plugin-context";
 import type { ResolvedToolEntry } from "./types";
 
 interface ToolDispatchContext {
diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index ab264b295..a3af8a78a 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -17,42 +17,45 @@ import type {
 } from "shared";
 import { AppKitMcpClient, buildMcpHostPolicy } from "../../connectors/mcp";
 import { getWorkspaceClient } from "../../context";
+import { consumeAdapterStream } from "../../core/agent/consume-adapter-stream";
+import { isFromPluginMarker } from "../../core/agent/from-plugin";
+import { loadAgentsFromDir } from "../../core/agent/load-agents";
+import { normalizeToolResult } from "../../core/agent/normalize-result";
+import {
+  buildBaseSystemPrompt,
+  composeSystemPrompt,
+} from "../../core/agent/system-prompt";
+import { dispatchToolCall } from "../../core/agent/tool-dispatch";
+import { resolveToolkitFromProvider } from "../../core/agent/toolkit-resolver";
+import {
+  functionToolToDefinition,
+  isFunctionTool,
+  isHostedTool,
+  resolveHostedTools,
+} from "../../core/agent/tools";
+import type {
+  AgentDefinition,
+  AgentsPluginConfig,
+  BaseSystemPromptOption,
+  PromptContext,
+  RegisteredAgent,
+  ResolvedToolEntry,
+} from "../../core/agent/types";
+import { isToolkitEntry } from "../../core/agent/types";
 import { createLogger } from "../../logging/logger";
 import { Plugin, toPlugin } from "../../plugin";
 import type { PluginManifest } from "../../registry";
-import { consumeAdapterStream } from "./consume-adapter-stream";
 import { agentStreamDefaults } from "./defaults";
 import { EventChannel } from "./event-channel";
 import { AgentEventTranslator } from "./event-translator";
-import { isFromPluginMarker } from "./from-plugin";
-import { loadAgentsFromDir } from "./load-agents";
 import manifest from "./manifest.json";
-import { normalizeToolResult } from "./normalize-result";
 import {
   approvalRequestSchema,
   chatRequestSchema,
   invocationsRequestSchema,
 } from "./schemas";
-import { buildBaseSystemPrompt, composeSystemPrompt } from "./system-prompt";
 import { InMemoryThreadStore } from "./thread-store";
 import { ToolApprovalGate } from "./tool-approval-gate";
-import { dispatchToolCall } from "./tool-dispatch";
-import { resolveToolkitFromProvider } from "./toolkit-resolver";
-import {
-  functionToolToDefinition,
-  isFunctionTool,
-  isHostedTool,
-  resolveHostedTools,
-} from "./tools";
-import type {
-  AgentDefinition,
-  AgentsPluginConfig,
-  BaseSystemPromptOption,
-  PromptContext,
-  RegisteredAgent,
-  ResolvedToolEntry,
-} from "./types";
-import { isToolkitEntry } from "./types";
 
 const logger = createLogger("agents");
 
@@ -379,7 +382,8 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     this.resolveFromPluginMarkers(agentName, toolsRecord, index);
 
     // 3. Explicit tools (toolkit entries, function tools, hosted tools)
-    const hostedToCollect: import("./tools/hosted-tools").HostedTool[] = [];
+    const hostedToCollect: import("../../core/agent/tools/hosted-tools").HostedTool[] =
+      [];
     for (const [key, tool] of Object.entries(toolsRecord)) {
       if (isToolkitEntry(tool)) {
         index.set(key, {
@@ -518,7 +522,7 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
   }
 
   private async connectHostedTools(
-    hostedTools: import("./tools/hosted-tools").HostedTool[],
+    hostedTools: import("../../core/agent/tools/hosted-tools").HostedTool[],
     index: Map<string, ResolvedToolEntry>,
   ): Promise<void> {
     const wsClient = await this.resolveWorkspaceClient();
diff --git a/packages/appkit/src/plugins/agents/index.ts b/packages/appkit/src/plugins/agents/index.ts
index 404da2432..f630cc681 100644
--- a/packages/appkit/src/plugins/agents/index.ts
+++ b/packages/appkit/src/plugins/agents/index.ts
@@ -1,3 +1,6 @@
+// Re-exports of agent primitives that now live in core/agent/. Kept here so
+// the public package barrel (`@databricks/appkit`) and any callers that
+// already imported via `./plugins/agents` continue to resolve unchanged.
 export { buildToolkitEntries } from "../../core/agent/build-toolkit";
 export {
   FROM_PLUGIN_MARKER,

From 3e4eaca326a781ebb562459b728e2b3dd26ffb4e Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Wed, 29 Apr 2026 18:35:43 +0200
Subject: [PATCH 16/46] refactor(appkit): extract AgentRunner + ToolExecutor
 strategy
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Collapses the two parallel agent loops (`_streamAgent` in the plugin and
`runAgent` in core) onto a single AgentRunner that drives the adapter to
completion and surfaces events. Tool dispatch policy moves behind a
ToolExecutor strategy injected by the caller.

New:
- core/agent/runner.ts (AgentRunner + ToolExecutor interface, ~65 lines)
- core/agent/standalone-tool-executor.ts (in-process dispatch, ~78 lines)
- plugins/agents/http-tool-executor.ts (HTTP-path executor: budget +
  approval gate + OBO dispatch + sub-agent recursion, ~243 lines)
- plugins/agents/tests/http-tool-executor.test.ts (8 focused tests
  including sub-agent approval forwarding — was effectively untestable
  pre-refactor because the logic lived inside a private nested closure)

Refactored:
- core/agent/run-agent.ts: 348 -> 296 lines; the ~30-line executeTool
  closure is now a StandaloneToolExecutor + AgentRunner instantiation
  (~25 lines).
- plugins/agents/agents.ts: 1362 -> 1262 lines; `_streamAgent`
  shrinks from 233 lines (with a 95-line nested executeTool closure)
  to ~150 lines that build an HttpToolExecutor + AgentRunner.

Behaviour preserved:
- Top-level budget enforcement (sub-agents pass budget=null, mirroring
  the original closure that only counted at the outer executeTool)
- Approval gate fires on `effect: write|update|destructive` and the
  legacy `destructive: true` flag
- Sub-agents reuse the parent's checkApproval + outboundEvents +
  translator + abortController so destructive sub-agent tools surface
  approval_pending on the parent's SSE stream
- Sub-agent event forwarding skips `metadata` to avoid clobbering the
  parent thread state, matching the prior closure exactly

Verified: tsc --noEmit clean, knip clean, 1589/1589 appkit tests pass.
---
 packages/appkit/src/core/agent/run-agent.ts   |  97 ++---
 packages/appkit/src/core/agent/runner.ts      |  65 ++++
 .../core/agent/standalone-tool-executor.ts    |  78 ++++
 packages/appkit/src/plugins/agents/agents.ts  | 210 +++--------
 .../src/plugins/agents/http-tool-executor.ts  | 243 ++++++++++++
 .../agents/tests/http-tool-executor.test.ts   | 357 ++++++++++++++++++
 6 files changed, 822 insertions(+), 228 deletions(-)
 create mode 100644 packages/appkit/src/core/agent/runner.ts
 create mode 100644 packages/appkit/src/core/agent/standalone-tool-executor.ts
 create mode 100644 packages/appkit/src/plugins/agents/http-tool-executor.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/http-tool-executor.test.ts

diff --git a/packages/appkit/src/core/agent/run-agent.ts b/packages/appkit/src/core/agent/run-agent.ts
index 9c7c655fd..2c7e60f07 100644
--- a/packages/appkit/src/core/agent/run-agent.ts
+++ b/packages/appkit/src/core/agent/run-agent.ts
@@ -8,11 +8,14 @@ import type {
   PluginData,
   ToolProvider,
 } from "shared";
-import { consumeAdapterStream } from "./consume-adapter-stream";
 import { isFromPluginMarker } from "./from-plugin";
+import { AgentRunner } from "./runner";
+import {
+  type StandaloneEntry,
+  StandaloneToolExecutor,
+} from "./standalone-tool-executor";
 import { resolveToolkitFromProvider } from "./toolkit-resolver";
 import {
-  type FunctionTool,
   functionToolToDefinition,
   isFunctionTool,
 } from "./tools/function-tool";
@@ -65,58 +68,33 @@ export async function runAgent(
   const toolIndex = buildStandaloneToolIndex(def, input.plugins ?? []);
   const tools = Array.from(toolIndex.values()).map((e) => e.def);
 
-  const signal = input.signal;
+  // `runAgent` historically allowed callers to omit a signal. Synthesize one
+  // so AgentRunner / ToolExecutor can rely on always having a real signal.
+  const signal = input.signal ?? new AbortController().signal;
 
-  const executeTool = async (name: string, args: unknown): Promise<unknown> => {
-    const entry = toolIndex.get(name);
-    if (!entry) throw new Error(`Unknown tool: ${name}`);
-    if (entry.kind === "function") {
-      return entry.tool.execute(args as Record<string, unknown>);
-    }
-    if (entry.kind === "toolkit") {
-      return entry.provider.executeAgentTool(
-        entry.localName,
-        args as Record<string, unknown>,
-        signal,
-      );
-    }
-    if (entry.kind === "subagent") {
-      const subInput: RunAgentInput = {
-        messages:
-          typeof args === "object" &&
-          args !== null &&
-          typeof (args as { input?: unknown }).input === "string"
-            ? (args as { input: string }).input
-            : JSON.stringify(args),
-        signal,
+  const events: AgentEvent[] = [];
+
+  const executor = new StandaloneToolExecutor(
+    toolIndex,
+    async (subDef, subInput, subSignal) => {
+      const res = await runAgent(subDef, {
+        messages: subInput,
+        signal: subSignal,
         plugins: input.plugins,
-      };
-      const res = await runAgent(entry.agentDef, subInput);
+      });
       return res.text;
-    }
-    throw new Error(
-      `runAgent: tool "${name}" is a ${entry.kind} tool. ` +
-        "Hosted/MCP tools are only usable via createApp({ plugins: [..., agents(...)] }).",
-    );
-  };
-
-  const events: AgentEvent[] = [];
-  const text = await consumeAdapterStream(
-    adapter.run(
-      {
-        messages,
-        tools,
-        threadId: randomUUID(),
-        signal,
-      },
-      { executeTool, signal },
-    ),
-    {
-      signal,
-      onEvent: (event) => events.push(event),
     },
   );
 
+  const runner = new AgentRunner({
+    adapter,
+    tools,
+    executeTool: executor,
+    signal,
+    onEvent: (event) => events.push(event),
+  });
+
+  const text = await runner.run({ messages, threadId: randomUUID() });
   return { text, events };
 }
 
@@ -157,29 +135,6 @@ function normalizeMessages(
   return [systemMessage, ...input];
 }
 
-type StandaloneEntry =
-  | {
-      kind: "function";
-      def: AgentToolDefinition;
-      tool: FunctionTool;
-    }
-  | {
-      kind: "subagent";
-      def: AgentToolDefinition;
-      agentDef: AgentDefinition;
-    }
-  | {
-      kind: "toolkit";
-      def: AgentToolDefinition;
-      provider: ToolProvider;
-      pluginName: string;
-      localName: string;
-    }
-  | {
-      kind: "hosted";
-      def: AgentToolDefinition;
-    };
-
 /**
  * Resolves `def.tools` (string-keyed entries + symbol-keyed `fromPlugin`
  * markers) and `def.agents` (sub-agents) into a flat dispatch index.
diff --git a/packages/appkit/src/core/agent/runner.ts b/packages/appkit/src/core/agent/runner.ts
new file mode 100644
index 000000000..ac6f2ed3f
--- /dev/null
+++ b/packages/appkit/src/core/agent/runner.ts
@@ -0,0 +1,65 @@
+import type {
+  AgentAdapter,
+  AgentEvent,
+  AgentToolDefinition,
+  Message,
+} from "shared";
+import { consumeAdapterStream } from "./consume-adapter-stream";
+
+/**
+ * Execution strategy for a tool call. Lives behind {@link AgentRunner} so
+ * the runner doesn't care whether the tool ends up dispatched via HTTP
+ * plumbing (approval gate, OBO, MCP client) or by direct in-process call.
+ *
+ * The runner injects the adapter's per-invocation {@link AbortSignal} so
+ * implementations can wire it through to long-running work.
+ */
+export interface ToolExecutor {
+  execute(name: string, args: unknown, signal: AbortSignal): Promise<unknown>;
+}
+
+interface AgentRunnerInput {
+  messages: Message[];
+  threadId: string;
+}
+
+interface AgentRunnerDeps {
+  adapter: AgentAdapter;
+  tools: AgentToolDefinition[];
+  executeTool: ToolExecutor;
+  signal: AbortSignal;
+  /** Called for every event the adapter emits, in order. */
+  onEvent?: (event: AgentEvent) => void;
+}
+
+/**
+ * Single execution loop for an AgentDefinition. Intentionally thin — its
+ * only job is to drive the adapter to completion and surface events.
+ *
+ * Tool-dispatch policy (approval gating, per-user budget, OBO, MCP)
+ * is owned by the injected {@link ToolExecutor}. The plugin layer wires an
+ * `HttpToolExecutor` for the streaming chat path; `runAgent()` wires a
+ * `StandaloneToolExecutor` for in-process scripts.
+ */
+export class AgentRunner {
+  constructor(private deps: AgentRunnerDeps) {}
+
+  async run(input: AgentRunnerInput): Promise<string> {
+    const { adapter, tools, executeTool, signal, onEvent } = this.deps;
+    return consumeAdapterStream(
+      adapter.run(
+        {
+          messages: input.messages,
+          tools,
+          threadId: input.threadId,
+          signal,
+        },
+        {
+          executeTool: (name, args) => executeTool.execute(name, args, signal),
+          signal,
+        },
+      ),
+      { signal, onEvent },
+    );
+  }
+}
diff --git a/packages/appkit/src/core/agent/standalone-tool-executor.ts b/packages/appkit/src/core/agent/standalone-tool-executor.ts
new file mode 100644
index 000000000..d78e0e6bc
--- /dev/null
+++ b/packages/appkit/src/core/agent/standalone-tool-executor.ts
@@ -0,0 +1,78 @@
+import type { AgentToolDefinition, ToolProvider } from "shared";
+import type { ToolExecutor } from "./runner";
+import type { FunctionTool } from "./tools/function-tool";
+import type { AgentDefinition } from "./types";
+
+/**
+ * `kind`-tagged tool entry used by `runAgent`'s in-process dispatcher.
+ * Unlike {@link import("./types").ResolvedToolEntry}, it holds live
+ * `tool`/`provider`/`agentDef` references captured at index-build time (no
+ * PluginContext at dispatch time); `hosted` carries only its definition.
+ */
+export type StandaloneEntry =
+  | { kind: "function"; def: AgentToolDefinition; tool: FunctionTool }
+  | { kind: "subagent"; def: AgentToolDefinition; agentDef: AgentDefinition }
+  | {
+      kind: "toolkit";
+      def: AgentToolDefinition;
+      provider: ToolProvider;
+      pluginName: string;
+      localName: string;
+    }
+  | { kind: "hosted"; def: AgentToolDefinition };
+
+/**
+ * In-process tool executor for {@link import("./run-agent").runAgent}.
+ *
+ * No approval gate, no per-user budget, no OBO — there is no HTTP
+ * request in standalone mode. Unknown tool names throw, and so do
+ * hosted/MCP tools, which require a live MCP client owned by the
+ * `agents()` plugin. Function tools are invoked without the abort signal.
+ *
+ * Sub-agent recursion delegates to the injected `subAgentRunner` (`runAgent`
+ * itself, which avoids a circular import). Its input is `args.input` when
+ * that is a string, else `JSON.stringify(args)`, or `""` if that is undefined.
+ */
+export class StandaloneToolExecutor implements ToolExecutor {
+  constructor(
+    private readonly toolIndex: Map<string, StandaloneEntry>,
+    private readonly subAgentRunner: (
+      def: AgentDefinition,
+      input: string,
+      signal: AbortSignal,
+    ) => Promise<string>,
+  ) {}
+
+  async execute(
+    name: string,
+    args: unknown,
+    signal: AbortSignal,
+  ): Promise<unknown> {
+    const entry = this.toolIndex.get(name);
+    if (!entry) throw new Error(`Unknown tool: ${name}`);
+
+    if (entry.kind === "function") {
+      return entry.tool.execute(args as Record<string, unknown>);
+    }
+    if (entry.kind === "toolkit") {
+      return entry.provider.executeAgentTool(
+        entry.localName,
+        args as Record<string, unknown>,
+        signal,
+      );
+    }
+    if (entry.kind === "subagent") {
+      const sub =
+        typeof args === "object" &&
+        args !== null &&
+        typeof (args as { input?: unknown }).input === "string"
+          ? (args as { input: string }).input
+          : JSON.stringify(args) ?? "";
+      return this.subAgentRunner(entry.agentDef, sub, signal);
+    }
+    throw new Error(
+      `runAgent: tool "${name}" is a ${entry.kind} tool. ` +
+        "Hosted/MCP tools are only usable via createApp({ plugins: [..., agents(...)] }).",
+    );
+  }
+}
diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index a3af8a78a..5b56c48d5 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -12,7 +12,6 @@ import type {
   PluginPhase,
   ResponseStreamEvent,
   Thread,
-  ToolAnnotations,
   ToolProvider,
 } from "shared";
 import { AppKitMcpClient, buildMcpHostPolicy } from "../../connectors/mcp";
@@ -20,7 +19,7 @@ import { getWorkspaceClient } from "../../context";
 import { consumeAdapterStream } from "../../core/agent/consume-adapter-stream";
 import { isFromPluginMarker } from "../../core/agent/from-plugin";
 import { loadAgentsFromDir } from "../../core/agent/load-agents";
-import { normalizeToolResult } from "../../core/agent/normalize-result";
+import { AgentRunner } from "../../core/agent/runner";
 import {
   buildBaseSystemPrompt,
   composeSystemPrompt,
@@ -48,6 +47,11 @@ import type { PluginManifest } from "../../registry";
 import { agentStreamDefaults } from "./defaults";
 import { EventChannel } from "./event-channel";
 import { AgentEventTranslator } from "./event-translator";
+import {
+  type ApprovalCheck,
+  HttpToolExecutor,
+  type ToolBudget,
+} from "./http-tool-executor";
 import manifest from "./manifest.json";
 import {
   approvalRequestSchema,
@@ -773,110 +777,53 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     this.activeStreams.set(requestId, { controller: abortController, userId });
 
     const tools = Array.from(registered.toolIndex.values()).map((e) => e.def);
-    const approvalPolicy = this.resolvedApprovalPolicy;
     const limits = this.resolvedLimits;
     const outboundEvents = new EventChannel<ResponseStreamEvent>();
     const translator = new AgentEventTranslator();
-    // Per-run tool-call budget (shared across the top-level adapter and any
-    // sub-agents it delegates to). Counted pre-dispatch so a prompt-injected
+    // Per-run tool-call budget enforced by the top-level executor (sub-agent
+    // dispatch skips it). Counted pre-dispatch so a prompt-injected
     // agent cannot drain the budget silently via denied calls.
-    let toolCallsUsed = 0;
-
-    const executeTool = async (
-      name: string,
-      args: unknown,
-    ): Promise<unknown> => {
-      if (toolCallsUsed >= limits.maxToolCalls) {
-        abortController.abort(
-          new Error(
-            `Tool-call budget exhausted (limit ${limits.maxToolCalls}).`,
-          ),
-        );
-        throw new Error(
-          `Tool-call budget exhausted (limit ${limits.maxToolCalls}). Raise agents({ limits: { maxToolCalls } }) or review the agent's tool-selection logic.`,
+    const budget: ToolBudget = { used: 0, limit: limits.maxToolCalls };
+
+    const executor = new HttpToolExecutor({
+      toolIndex: registered.toolIndex,
+      approvalPolicy: this.resolvedApprovalPolicy,
+      approvalGate: this.approvalGate,
+      translator,
+      outboundEvents,
+      abortController,
+      budget,
+      req,
+      streamId: requestId,
+      userId,
+      pluginContext: this.context,
+      mcpClient: this.mcpClient,
+      runSubAgent: (agentName, subArgs, subSignal, forwardEvent, check) => {
+        const childAgent = this.agents.get(agentName);
+        if (!childAgent) throw new Error(`Sub-agent not found: ${agentName}`);
+        return this.runSubAgent(
+          req,
+          childAgent,
+          subArgs,
+          subSignal,
+          1,
+          forwardEvent,
+          check,
         );
-      }
-      toolCallsUsed++;
-
-      const entry = registered.toolIndex.get(name);
-      if (!entry) throw new Error(`Unknown tool: ${name}`);
-
-      // Approval flow used by BOTH the parent stream and any sub-agents
-      // delegated to from it. Sub-agents were previously running destructive
-      // tools without ever surfacing the gate; this closure lifts the check
-      // so `runSubAgent.childExecute` can reuse the exact same semantics
-      // (event emission + gate.wait + deny string).
-      const checkApproval = async (
-        toolEntry: ResolvedToolEntry,
-        toolArgs: unknown,
-      ): Promise<"approve" | "deny" | null> => {
-        if (!approvalPolicy.requireForDestructive) return null;
-        if (!isDestructiveToolEntry(toolEntry)) return null;
-        const approvalId = randomUUID();
-        for (const ev of translator.translate({
-          type: "approval_pending",
-          approvalId,
-          streamId: requestId,
-          toolName: toolEntry.def.name,
-          args: toolArgs,
-          annotations: combinedToolAnnotations(toolEntry),
-        })) {
-          outboundEvents.push(ev);
-        }
-        return this.approvalGate.wait({
-          approvalId,
-          streamId: requestId,
-          userId,
-          timeoutMs: approvalPolicy.timeoutMs,
-        });
-      };
-
-      const decision = await checkApproval(entry, args);
-      if (decision === "deny") {
-        return `Tool execution denied by user approval gate (tool: ${name}).`;
-      }
+      },
+    });
 
-      // Forward events from nested sub-agents into the parent's outbound
-      // SSE stream so the client sees inner tool calls AND the sub-agent's
-      // streaming text as it's generated. Without this the user stares at
-      // "thinking…" for the full duration of the sub-agent run.
-      //
-      // The one exception is `metadata`: sub-agents have their own
-      // threadId, and forwarding it would overwrite the parent's thread
-      // state on the client and break multi-turn continuity.
-      //
-      // `approval_pending` is not emitted by adapters directly — it comes
-      // through `checkApproval()` which already pushes to the parent's
-      // outboundEvents — so sub-agent destructive approvals surface
-      // independently of this forwarder.
-      const forwardSubAgentEvent = (ev: AgentEvent): void => {
-        if (ev.type === "metadata") return;
-        for (const translated of translator.translate(ev)) {
+    const runner = new AgentRunner({
+      adapter: registered.adapter,
+      tools,
+      executeTool: executor,
+      signal,
+      onEvent: (event) => {
+        for (const translated of translator.translate(event)) {
           outboundEvents.push(translated);
         }
-      };
-
-      const raw = await dispatchToolCall(entry, args, {
-        req,
-        signal,
-        pluginContext: this.context,
-        mcpClient: this.mcpClient,
-        runSubAgent: (agentName, subArgs) => {
-          const childAgent = this.agents.get(agentName);
-          if (!childAgent) throw new Error(`Sub-agent not found: ${agentName}`);
-          return this.runSubAgent(
-            req,
-            childAgent,
-            subArgs,
-            signal,
-            1,
-            forwardSubAgentEvent,
-            checkApproval,
-          );
-        },
-      });
-      return normalizeToolResult(raw);
-    };
+      },
+    });
 
     // Drive the adapter and the approval-event side-channel concurrently.
     // Outbound events from both sources flow through `outboundEvents`; the
@@ -916,23 +863,9 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
           ...thread.messages,
         ];
 
-        const stream = registered.adapter.run(
-          {
-            messages: messagesWithSystem,
-            tools,
-            threadId: thread.id,
-            signal,
-          },
-          { executeTool, signal },
-        );
-
-        const fullContent = await consumeAdapterStream(stream, {
-          signal,
-          onEvent: (event) => {
-            for (const translated of translator.translate(event)) {
-              outboundEvents.push(translated);
-            }
-          },
+        const fullContent = await runner.run({
+          messages: messagesWithSystem,
+          threadId: thread.id,
         });
 
         if (fullContent) {
@@ -1027,10 +960,7 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
      * Absent (or returning `null`) means no gate — non-destructive tools
      * or approval disabled policy-wide.
      */
-    checkApproval?: (
-      entry: ResolvedToolEntry,
-      toolArgs: unknown,
-    ) => Promise<"approve" | "deny" | null>,
+    checkApproval?: ApprovalCheck,
   ): Promise<string> {
     const limits = this.resolvedLimits;
     if (depth > limits.maxSubAgentDepth) {
@@ -1048,6 +978,10 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
         : JSON.stringify(args);
     const childTools = Array.from(child.toolIndex.values()).map((e) => e.def);
 
+    // Sub-agent dispatch reuses the parent's approval check so a destructive
+    // tool fires `approval_pending` on the parent's SSE stream. Sub-agents
+    // do not enforce their own budget — the parent already counted the
+    // `agent-<key>` invocation.
     const childExecute = async (
       name: string,
       childArgs: unknown,
@@ -1275,44 +1209,6 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
   }
 }
 
-/**
- * True when the tool should go through the approval gate. Historically
- * scoped to `destructive: true` — hence the name — but now also fires for
- * the semantic `effect` enum on {@link ToolAnnotations}. Any effect that
- * mutates the world (`write` | `update` | `destructive`) gates; `read` and
- * unannotated tools do not. `def.annotations` is the normal path; for
- * `function` tools we also read `functionTool.annotations` so a mismatch
- * between the spread def and the original {@link FunctionTool} cannot drop
- * the hint.
- */
-function isDestructiveToolEntry(entry: ResolvedToolEntry): boolean {
-  const defAnn = entry.def.annotations;
-  const fnAnn =
-    entry.source === "function" ? entry.functionTool.annotations : undefined;
-
-  const effect = defAnn?.effect ?? fnAnn?.effect;
-  if (effect === "write" || effect === "update" || effect === "destructive") {
-    return true;
-  }
-  if (defAnn?.destructive === true) return true;
-  if (fnAnn?.destructive === true) return true;
-  return false;
-}
-
-/** Merged annotations for the approval SSE payload (client UI + debugging). */
-function combinedToolAnnotations(
-  entry: ResolvedToolEntry,
-): ToolAnnotations | undefined {
-  if (entry.source === "function") {
-    const merged: ToolAnnotations = {
-      ...entry.functionTool.annotations,
-      ...entry.def.annotations,
-    };
-    return Object.keys(merged).length > 0 ? merged : undefined;
-  }
-  return entry.def.annotations;
-}
-
 function normalizeAutoInherit(value: AgentsPluginConfig["autoInheritTools"]): {
   file: boolean;
   code: boolean;
diff --git a/packages/appkit/src/plugins/agents/http-tool-executor.ts b/packages/appkit/src/plugins/agents/http-tool-executor.ts
new file mode 100644
index 000000000..5217ab414
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/http-tool-executor.ts
@@ -0,0 +1,243 @@
+import { randomUUID } from "node:crypto";
+import type express from "express";
+import type { AgentEvent, ResponseStreamEvent, ToolAnnotations } from "shared";
+import type { AppKitMcpClient } from "../../connectors/mcp";
+import { normalizeToolResult } from "../../core/agent/normalize-result";
+import type { ToolExecutor } from "../../core/agent/runner";
+import { dispatchToolCall } from "../../core/agent/tool-dispatch";
+import type { ResolvedToolEntry } from "../../core/agent/types";
+import type { PluginContext } from "../../core/plugin-context";
+import type { EventChannel } from "./event-channel";
+import type { AgentEventTranslator } from "./event-translator";
+import type { ToolApprovalGate } from "./tool-approval-gate";
+
+/**
+ * Decision returned by the approval check. `null` means "no gate fires"
+ * (tool isn't gated, or policy disabled gating), so dispatch proceeds.
+ * `"approve"` / `"deny"` mirror the user's submission via `POST /approve`.
+ */
+export type ApprovalDecision = "approve" | "deny" | null;
+
+/**
+ * Approval-check signature: takes a resolved tool entry plus the call's raw
+ * arguments and resolves to an {@link ApprovalDecision}. Lifted to a type so
+ * the parent's check can be handed to sub-agent runs (see RunSubAgentFn).
+ */
+export type ApprovalCheck = (
+  entry: ResolvedToolEntry,
+  args: unknown,
+) => Promise<ApprovalDecision>;
+
+/**
+ * Sub-agent runner injected by the plugin. Gets the sub-agent's name and raw
+ * args, the abort signal, an event forwarder and the parent's approval check;
+ * resolves to the text handed back to the parent adapter as the tool result.
+ * A callback so the executor doesn't need to import the plugin class (cycle).
+ */
+type RunSubAgentFn = (
+  agentName: string,
+  args: unknown,
+  signal: AbortSignal,
+  forwardEvent: (e: AgentEvent) => void,
+  checkApproval: ApprovalCheck,
+) => Promise<string>;
+
+/**
+ * Mutable per-run tool-call budget. Held by reference: an executor given
+ * this object bumps `used` on every call and refuses once `used` reaches
+ * `limit`; an executor given `null` instead never counts.
+ */
+export interface ToolBudget {
+  used: number;
+  limit: number;
+}
+
+interface HttpToolExecutorDeps {
+  toolIndex: Map<string, ResolvedToolEntry>;
+  /** Approval policy as resolved from `agents({ approval: ... })`. */
+  approvalPolicy: { requireForDestructive: boolean; timeoutMs: number };
+  approvalGate: ToolApprovalGate;
+  /** Translator used to emit `approval_pending` to the SSE stream. */
+  translator: AgentEventTranslator;
+  /** Channel the SSE stream drains. Approval events are pushed here. */
+  outboundEvents: EventChannel<ResponseStreamEvent>;
+  /** Aborted on budget exhaustion to unwind the adapter promptly. */
+  abortController: AbortController;
+  /**
+   * Tool-call budget. An executor holding the object counts every
+   * `execute()` call against it; executors sharing one object share one
+   * cap. Pass `null` to skip counting entirely — e.g. for a sub-agent
+   * executor when only the parent should enforce the limit.
+   */
+  budget: ToolBudget | null;
+  /** OBO source: forwarded to dispatchToolCall for plugin-tool dispatch. */
+  req: express.Request;
+  /** SSE stream id (used for approval gate scoping + telemetry). */
+  streamId: string;
+  /** Authenticated user id, scoped per-stream by `_handleApprove`. */
+  userId: string;
+  /** PluginContext for OBO tool dispatch. May be undefined in tests. */
+  pluginContext: PluginContext | undefined;
+  /** MCP client for hosted-tool dispatch. May be null pre-connect. */
+  mcpClient: AppKitMcpClient | null;
+  /** Plugin-supplied factory that runs a sub-agent. */
+  runSubAgent: RunSubAgentFn;
+}
+
+/**
+ * HTTP-path tool executor for the streaming chat surface.
+ *
+ * Wraps the same logic that used to live as a closure inside
+ * `_streamAgent`: per-run budget, the approval gate, OBO dispatch via
+ * {@link dispatchToolCall}, sub-agent recursion, and event forwarding.
+ *
+ * Sub-agent calls go through `deps.runSubAgent`, which receives this
+ * executor's `checkApproval` and an event forwarder — so a sub-agent's
+ * gated tool surfaces `approval_pending` on the parent's SSE stream and
+ * the forwarder relays its events (minus `metadata`) to the same channel.
+ * With a non-null `budget`, every `execute()` call is counted before
+ * dispatch and hitting the limit aborts `abortController` and throws;
+ * with `budget: null` nothing is counted.
+ */
+export class HttpToolExecutor implements ToolExecutor {
+  constructor(private deps: HttpToolExecutorDeps) {}
+
+  async execute(
+    name: string,
+    args: unknown,
+    signal: AbortSignal,
+  ): Promise<unknown> {
+    const { budget, abortController } = this.deps;
+
+    if (budget) {
+      if (budget.used >= budget.limit) {
+        abortController.abort(
+          new Error(`Tool-call budget exhausted (limit ${budget.limit}).`),
+        );
+        throw new Error(
+          `Tool-call budget exhausted (limit ${budget.limit}). ` +
+            "Raise agents({ limits: { maxToolCalls } }) or review the agent's tool-selection logic.",
+        );
+      }
+      budget.used++;
+    }
+
+    const entry = this.deps.toolIndex.get(name);
+    if (!entry) throw new Error(`Unknown tool: ${name}`);
+
+    const decision = await this.checkApproval(entry, args);
+    if (decision === "deny") {
+      return `Tool execution denied by user approval gate (tool: ${name}).`;
+    }
+
+    // Forward events from nested sub-agents into the parent's outbound SSE
+    // stream so the client sees inner tool calls AND the sub-agent's
+    // streaming text as it's generated. Without this the user stares at
+    // "thinking…" for the full duration of the sub-agent run.
+    //
+    // The one exception is `metadata`: sub-agents have their own threadId,
+    // and forwarding it would overwrite the parent's thread state on the
+    // client and break multi-turn continuity.
+    //
+    // `approval_pending` is not emitted by adapters directly — it comes
+    // through `checkApproval()` which already pushes to the parent's
+    // outboundEvents — so sub-agent destructive approvals surface
+    // independently of this forwarder.
+    const forwardSubAgentEvent = (ev: AgentEvent): void => {
+      if (ev.type === "metadata") return;
+      for (const translated of this.deps.translator.translate(ev)) {
+        this.deps.outboundEvents.push(translated);
+      }
+    };
+
+    const raw = await dispatchToolCall(entry, args, {
+      req: this.deps.req,
+      signal,
+      pluginContext: this.deps.pluginContext,
+      mcpClient: this.deps.mcpClient,
+      runSubAgent: (agentName, subArgs) =>
+        this.deps.runSubAgent(
+          agentName,
+          subArgs,
+          signal,
+          forwardSubAgentEvent,
+          this.checkApproval,
+        ),
+    });
+    return normalizeToolResult(raw);
+  }
+
+  /**
+   * Approval gate hook. Bound as an arrow so sub-agent executors can pass
+   * it through to {@link RunSubAgentFn} and the gate fires using the
+   * parent's translator + outboundEvents + approvalGate. Public so tests
+   * can drive it directly.
+   */
+  readonly checkApproval: ApprovalCheck = async (entry, args) => {
+    const {
+      approvalPolicy,
+      approvalGate,
+      translator,
+      outboundEvents,
+      streamId,
+      userId,
+    } = this.deps;
+    if (!approvalPolicy.requireForDestructive) return null;
+    if (!isDestructiveToolEntry(entry)) return null;
+    const approvalId = randomUUID();
+    for (const ev of translator.translate({
+      type: "approval_pending",
+      approvalId,
+      streamId,
+      toolName: entry.def.name,
+      args,
+      annotations: combinedToolAnnotations(entry),
+    })) {
+      outboundEvents.push(ev);
+    }
+    return approvalGate.wait({
+      approvalId,
+      streamId,
+      userId,
+      timeoutMs: approvalPolicy.timeoutMs,
+    });
+  };
+}
+
+/**
+ * True when the tool should go through the approval gate. Historically
+ * scoped to `destructive: true` — hence the name — but now also fires for
+ * the semantic `effect` enum on {@link ToolAnnotations}: `write`, `update`
+ * and `destructive` gate; `read` and unannotated tools do not. For
+ * `function` tools `functionTool.annotations` is consulted as well:
+ * `def.annotations.effect` wins when both set `effect` (the function tool's
+ * value is only the fallback), while `destructive: true` on either side
+ * always gates.
+ */
+function isDestructiveToolEntry(entry: ResolvedToolEntry): boolean {
+  const defAnn = entry.def.annotations;
+  const fnAnn =
+    entry.source === "function" ? entry.functionTool.annotations : undefined;
+
+  const effect = defAnn?.effect ?? fnAnn?.effect;
+  if (effect === "write" || effect === "update" || effect === "destructive") {
+    return true;
+  }
+  if (defAnn?.destructive === true) return true;
+  if (fnAnn?.destructive === true) return true;
+  return false;
+}
+
+/** Approval-payload annotations; for function tools `def` keys win over `functionTool` keys. */
+function combinedToolAnnotations(
+  entry: ResolvedToolEntry,
+): ToolAnnotations | undefined {
+  if (entry.source === "function") {
+    const merged: ToolAnnotations = {
+      ...entry.functionTool.annotations,
+      ...entry.def.annotations,
+    };
+    return Object.keys(merged).length > 0 ? merged : undefined;
+  }
+  return entry.def.annotations;
+}
diff --git a/packages/appkit/src/plugins/agents/tests/http-tool-executor.test.ts b/packages/appkit/src/plugins/agents/tests/http-tool-executor.test.ts
new file mode 100644
index 000000000..90b6d0ff4
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/http-tool-executor.test.ts
@@ -0,0 +1,357 @@
+import type express from "express";
+import type { ResponseStreamEvent } from "shared";
+import { describe, expect, test, vi } from "vitest";
+import type { ResolvedToolEntry } from "../../../core/agent/types";
+import { EventChannel } from "../event-channel";
+import { AgentEventTranslator } from "../event-translator";
+import { HttpToolExecutor, type ToolBudget } from "../http-tool-executor";
+import { ToolApprovalGate } from "../tool-approval-gate";
+
+/**
+ * Focused tests for HttpToolExecutor — particularly the sub-agent approval
+ * forwarding path. The runner-level abstraction makes it tractable to drive
+ * the executor without spinning up a full HTTP stream:
+ *
+ *   - Per-run budget gating (top-level enforces, sub-agents skip)
+ *   - approval_pending emission to the parent's outbound channel
+ *   - approve / deny decision flow
+ *   - Sub-agent dispatch reuses the parent's checkApproval (the bit that
+ *     used to be a private nested closure inside `_streamAgent` and was
+ *     hard to test pre-refactor)
+ */
+
+function functionEntry(
+  name: string,
+  opts?: { effect?: "write" | "destructive" },
+) {
+  const ann = opts?.effect ? { effect: opts.effect } : undefined;
+  return {
+    source: "function",
+    def: {
+      name,
+      description: `${name} tool`,
+      parameters: { type: "object", properties: {} },
+      annotations: ann,
+    },
+    functionTool: {
+      name,
+      description: `${name} tool`,
+      schema: { type: "object", properties: {} },
+      annotations: ann,
+      execute: vi.fn(async () => `${name}-result`),
+    },
+  } as unknown as ResolvedToolEntry;
+}
+
+function subAgentEntry(name: string) {
+  return {
+    source: "subagent",
+    agentName: name,
+    def: {
+      name: `agent-${name}`,
+      description: `Delegate to ${name}`,
+      parameters: { type: "object", properties: {} },
+    },
+  } as unknown as ResolvedToolEntry;
+}
+
+function mockReq(): express.Request {
+  return {
+    headers: { "x-forwarded-user": "alice" },
+    header: () => "alice",
+  } as unknown as express.Request;
+}
+
+function fixture(opts?: {
+  budget?: ToolBudget | null;
+  requireForDestructive?: boolean;
+  toolIndex?: Map<string, ResolvedToolEntry>;
+  runSubAgent?: HttpToolExecutorDepsRunSubAgent;
+}) {
+  const outboundEvents = new EventChannel<ResponseStreamEvent>();
+  const translator = new AgentEventTranslator();
+  const approvalGate = new ToolApprovalGate();
+  const abortController = new AbortController();
+  const toolIndex =
+    opts?.toolIndex ??
+    new Map<string, ResolvedToolEntry>([
+      ["safe", functionEntry("safe")],
+      ["risky", functionEntry("risky", { effect: "write" })],
+    ]);
+
+  const executor = new HttpToolExecutor({
+    toolIndex,
+    approvalPolicy: {
+      requireForDestructive: opts?.requireForDestructive ?? true,
+      timeoutMs: 5_000,
+    },
+    approvalGate,
+    translator,
+    outboundEvents,
+    abortController,
+    budget: opts?.budget === undefined ? { used: 0, limit: 50 } : opts.budget,
+    req: mockReq(),
+    streamId: "stream-1",
+    userId: "alice",
+    pluginContext: undefined,
+    mcpClient: null,
+    runSubAgent:
+      opts?.runSubAgent ??
+      ((_n, _a, _s, _f, _c) => Promise.resolve("(no sub-agent)")),
+  });
+
+  return {
+    executor,
+    outboundEvents,
+    approvalGate,
+    abortController,
+    toolIndex,
+    drainEvents: async () => {
+      const events: ResponseStreamEvent[] = [];
+      // Bounded drain: at most 100 reads, each raced against a 10 ms timer.
+      for (let i = 0; i < 100; i++) {
+        const next = await Promise.race([
+          (async () => {
+            for await (const ev of outboundEvents) return ev;
+            return null;
+          })(),
+          new Promise<null>((r) => setTimeout(() => r(null), 10)),
+        ]);
+        if (!next) break;
+        events.push(next);
+      }
+      return events;
+    },
+  };
+}
+
+type HttpToolExecutorDepsRunSubAgent = ConstructorParameters<
+  typeof HttpToolExecutor
+>[0]["runSubAgent"];
+
+describe("HttpToolExecutor", () => {
+  describe("budget", () => {
+    test("rejects + aborts when top-level budget is exhausted", async () => {
+      const { executor, abortController } = fixture({
+        budget: { used: 50, limit: 50 },
+      });
+
+      await expect(
+        executor.execute("safe", {}, abortController.signal),
+      ).rejects.toThrow(/Tool-call budget exhausted/);
+
+      expect(abortController.signal.aborted).toBe(true);
+    });
+
+    test("budget=null skips counting (sub-agent semantics)", async () => {
+      const { executor, abortController } = fixture({ budget: null });
+
+      const r1 = await executor.execute("safe", {}, abortController.signal);
+      const r2 = await executor.execute("safe", {}, abortController.signal);
+      expect(r1).toBe("safe-result");
+      expect(r2).toBe("safe-result");
+      expect(abortController.signal.aborted).toBe(false);
+    });
+  });
+
+  describe("approval gate", () => {
+    test("non-destructive tools bypass the gate", async () => {
+      const { executor, abortController, outboundEvents } = fixture();
+
+      const result = await executor.execute("safe", {}, abortController.signal);
+
+      expect(result).toBe("safe-result");
+      // Drain — there should be no approval_pending event in the channel.
+      outboundEvents.close();
+      const events: ResponseStreamEvent[] = [];
+      for await (const ev of outboundEvents) events.push(ev);
+      const approvals = events.filter(
+        (e) => e.type === "appkit.approval_pending",
+      );
+      expect(approvals).toEqual([]);
+    });
+
+    test("write-effect tool emits approval_pending and waits for decision", async () => {
+      const { executor, abortController, approvalGate, outboundEvents } =
+        fixture();
+
+      const promise = executor.execute("risky", {}, abortController.signal);
+
+      // The executor pushes approval_pending synchronously and then awaits
+      // the gate. Settle the gate by reading the approvalId from the SSE
+      // payload — this mirrors what `POST /approve` does in production.
+      const approvalId = await readApprovalId(outboundEvents);
+      expect(approvalId).toBeDefined();
+
+      approvalGate.submit({
+        approvalId,
+        userId: "alice",
+        decision: "approve",
+      });
+
+      const result = await promise;
+      expect(result).toBe("risky-result");
+    });
+
+    test("denied destructive tool returns a deny string instead of dispatching", async () => {
+      const { executor, abortController, approvalGate, outboundEvents } =
+        fixture();
+
+      const promise = executor.execute("risky", {}, abortController.signal);
+
+      const approvalId = await readApprovalId(outboundEvents);
+
+      approvalGate.submit({
+        approvalId,
+        userId: "alice",
+        decision: "deny",
+      });
+
+      const result = await promise;
+      expect(result).toMatch(/denied by user approval gate/);
+    });
+
+    test("requireForDestructive=false short-circuits the gate even on write tools", async () => {
+      const { executor, abortController, outboundEvents } = fixture({
+        requireForDestructive: false,
+      });
+
+      const result = await executor.execute(
+        "risky",
+        {},
+        abortController.signal,
+      );
+      expect(result).toBe("risky-result");
+
+      outboundEvents.close();
+      const seen: ResponseStreamEvent[] = [];
+      for await (const ev of outboundEvents) seen.push(ev);
+      expect(seen.some((e) => e.type === "appkit.approval_pending")).toBe(
+        false,
+      );
+    });
+  });
+
+  describe("sub-agent approval forwarding", () => {
+    test("destructive tool inside a sub-agent surfaces approval_pending on the parent's stream", async () => {
+      // This is the bit that used to be a private nested closure inside
+      // `_streamAgent` and was effectively untestable pre-refactor: the
+      // parent's `checkApproval` is passed *into* the sub-agent's runner
+      // so the SSE payload lands on the parent's outbound channel.
+      const childIndex = new Map<string, ResolvedToolEntry>([
+        ["destroy", functionEntry("destroy", { effect: "destructive" })],
+      ]);
+
+      const parentIndex = new Map<string, ResolvedToolEntry>([
+        ["agent-worker", subAgentEntry("worker")],
+      ]);
+
+      // Spy on what the runSubAgent factory receives.
+      const runSubAgentSpy = vi.fn<HttpToolExecutorDepsRunSubAgent>(
+        async (_name, _args, signal, _forwardEvent, checkApproval) => {
+          // Sub-agent invokes its destructive tool through the parent's
+          // approval check, exactly as `runSubAgent.childExecute` does.
+          const childEntry = childIndex.get("destroy");
+          if (!childEntry) throw new Error("destroy missing from child index");
+          const decision = await checkApproval(childEntry, { x: 1 });
+          if (decision === "deny") return "denied";
+          if (signal.aborted) throw new Error("aborted");
+          return "destroyed";
+        },
+      );
+
+      const { executor, approvalGate, outboundEvents, abortController } =
+        fixture({
+          toolIndex: parentIndex,
+          runSubAgent: runSubAgentSpy,
+        });
+
+      const promise = executor.execute(
+        "agent-worker",
+        { input: "do it" },
+        abortController.signal,
+      );
+
+      const { approvalId, toolName } =
+        await readApprovalDetails(outboundEvents);
+
+      expect(toolName, "approval_pending must surface on parent stream").toBe(
+        "destroy",
+      );
+
+      approvalGate.submit({
+        approvalId,
+        userId: "alice",
+        decision: "approve",
+      });
+
+      await expect(promise).resolves.toBe("destroyed");
+      expect(runSubAgentSpy).toHaveBeenCalledTimes(1);
+    });
+
+    test("denied sub-agent tool yields a deny string handled inside the sub-agent", async () => {
+      const childIndex = new Map<string, ResolvedToolEntry>([
+        ["destroy", functionEntry("destroy", { effect: "destructive" })],
+      ]);
+      const parentIndex = new Map<string, ResolvedToolEntry>([
+        ["agent-worker", subAgentEntry("worker")],
+      ]);
+
+      const runSubAgentSpy = vi.fn<HttpToolExecutorDepsRunSubAgent>(
+        async (_name, _args, _signal, _forward, checkApproval) => {
+          const childEntry = childIndex.get("destroy");
+          if (!childEntry) throw new Error("destroy missing from child index");
+          const decision = await checkApproval(childEntry, {});
+          if (decision === "deny") return "child-saw-deny";
+          return "should-not-happen";
+        },
+      );
+
+      const { executor, approvalGate, outboundEvents, abortController } =
+        fixture({
+          toolIndex: parentIndex,
+          runSubAgent: runSubAgentSpy,
+        });
+
+      const promise = executor.execute(
+        "agent-worker",
+        { input: "x" },
+        abortController.signal,
+      );
+
+      const approvalId = await readApprovalId(outboundEvents);
+
+      approvalGate.submit({
+        approvalId,
+        userId: "alice",
+        decision: "deny",
+      });
+
+      await expect(promise).resolves.toBe("child-saw-deny");
+    });
+  });
+});
+
+interface ApprovalEvent {
+  type: "appkit.approval_pending";
+  approval_id: string;
+  tool_name: string;
+}
+
+async function readApprovalDetails(
+  channel: EventChannel<ResponseStreamEvent>,
+): Promise<{ approvalId: string; toolName: string }> {
+  for await (const ev of channel) {
+    if (ev.type === "appkit.approval_pending") {
+      const a = ev as unknown as ApprovalEvent;
+      return { approvalId: a.approval_id, toolName: a.tool_name };
+    }
+  }
+  throw new Error("Channel closed before approval_pending arrived");
+}
+
+async function readApprovalId(
+  channel: EventChannel<ResponseStreamEvent>,
+): Promise<string> {
+  return (await readApprovalDetails(channel)).approvalId;
+}

From 8993db241ab2c99b782ca3ca4c733003e5ff151f Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Wed, 29 Apr 2026 18:41:56 +0200
Subject: [PATCH 17/46] refactor(appkit): split agents.ts helpers into separate
 modules
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Extracts `composePromptForAgent` + `normalizeAutoInherit` into
plugins/agents/prompt.ts and `printRegistry` into
plugins/agents/registry-printer.ts. These were free-function helpers at
the bottom of agents.ts with no dependency on plugin state — pure
candidates for extraction.

Also opens the door for the bigger split (route handlers and
`_streamAgent`/`runSubAgent` extracted into routes/*.ts and
tool-execution.ts) by dropping the `private` modifier from the plugin
members those modules will need (`agents`, `defaultAgentName`,
`activeStreams`, `mcpClient`, `threadStore`, `approvalGate`,
`resolvedApprovalPolicy`, `resolvedLimits`, `countUserStreams`). All
are marked `@internal` so the documented public surface stays
unchanged.

Note: the full split into `routes/` and `tool-execution.ts` proposed
in plans/agent-architecture-followup.md is deferred. Route handlers
and `_streamAgent`/`runSubAgent` remain as methods on AgentsPlugin
because they have heavy plugin-state coupling and cross-call patterns
(`runSubAgent` recurses, `_handleChat` calls `_streamAgent`,
etc.) that don't translate cleanly to free functions without a larger
refactor. Tracked as a follow-up.

agents.ts: 1262 -> 1212 lines (-50). The plan's aspirational target
of <=280 isn't met because the per-route extraction pass is deferred,
but the helper extraction + access-modifier relaxation lays the
groundwork.

Verified: tsc --noEmit clean, 1589/1589 appkit tests pass.
---
 packages/appkit/src/plugins/agents/agents.ts  | 92 +++++--------------
 packages/appkit/src/plugins/agents/prompt.ts  | 57 ++++++++++++
 .../src/plugins/agents/registry-printer.ts    | 25 +++++
 3 files changed, 103 insertions(+), 71 deletions(-)
 create mode 100644 packages/appkit/src/plugins/agents/prompt.ts
 create mode 100644 packages/appkit/src/plugins/agents/registry-printer.ts

diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index 5b56c48d5..d2a113f4c 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -20,10 +20,6 @@ import { consumeAdapterStream } from "../../core/agent/consume-adapter-stream";
 import { isFromPluginMarker } from "../../core/agent/from-plugin";
 import { loadAgentsFromDir } from "../../core/agent/load-agents";
 import { AgentRunner } from "../../core/agent/runner";
-import {
-  buildBaseSystemPrompt,
-  composeSystemPrompt,
-} from "../../core/agent/system-prompt";
 import { dispatchToolCall } from "../../core/agent/tool-dispatch";
 import { resolveToolkitFromProvider } from "../../core/agent/toolkit-resolver";
 import {
@@ -35,8 +31,6 @@ import {
 import type {
   AgentDefinition,
   AgentsPluginConfig,
-  BaseSystemPromptOption,
-  PromptContext,
   RegisteredAgent,
   ResolvedToolEntry,
 } from "../../core/agent/types";
@@ -53,6 +47,8 @@ import {
   type ToolBudget,
 } from "./http-tool-executor";
 import manifest from "./manifest.json";
+import { composePromptForAgent, normalizeAutoInherit } from "./prompt";
+import { printRegistry } from "./registry-printer";
 import {
   approvalRequestSchema,
   chatRequestSchema,
@@ -80,15 +76,21 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
 
   protected declare config: AgentsPluginConfig;
 
-  private agents = new Map<string, RegisteredAgent>();
-  private defaultAgentName: string | null = null;
-  private activeStreams = new Map<
+  /** @internal - Mutated by route handlers and tool-execution helpers. */
+  agents = new Map<string, RegisteredAgent>();
+  /** @internal */
+  defaultAgentName: string | null = null;
+  /** @internal */
+  activeStreams = new Map<
     string,
     { controller: AbortController; userId: string }
   >();
-  private mcpClient: AppKitMcpClient | null = null;
-  private threadStore;
-  private approvalGate = new ToolApprovalGate();
+  /** @internal */
+  mcpClient: AppKitMcpClient | null = null;
+  /** @internal */
+  threadStore;
+  /** @internal */
+  approvalGate = new ToolApprovalGate();
 
   constructor(config: AgentsPluginConfig) {
     super(config);
@@ -111,8 +113,8 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     }
   }
 
-  /** Effective approval policy with defaults applied. */
-  private get resolvedApprovalPolicy(): {
+  /** Effective approval policy with defaults applied. @internal */
+  get resolvedApprovalPolicy(): {
     requireForDestructive: boolean;
     timeoutMs: number;
   } {
@@ -123,8 +125,8 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     };
   }
 
-  /** Effective DoS limits with defaults applied. */
-  private get resolvedLimits(): {
+  /** Effective DoS limits with defaults applied. @internal */
+  get resolvedLimits(): {
     maxConcurrentStreamsPerUser: number;
     maxToolCalls: number;
     maxSubAgentDepth: number;
@@ -137,8 +139,8 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     };
   }
 
-  /** Count active streams owned by a given user. */
-  private countUserStreams(userId: string): number {
+  /** Count active streams owned by a given user. @internal */
+  countUserStreams(userId: string): number {
     let n = 0;
     for (const entry of this.activeStreams.values()) {
       if (entry.userId === userId) n++;
@@ -149,7 +151,7 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
   async setup() {
     await this.loadAgents();
     this.mountInvocationsRoute();
-    this.printRegistry();
+    printRegistry(this.agents, this.defaultAgentName);
   }
 
   /**
@@ -1161,22 +1163,6 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     return first.done ? null : first.value;
   }
 
-  private printRegistry(): void {
-    if (this.agents.size === 0) return;
-    console.log("");
-    console.log(`  ${pc.bold("Agents")} ${pc.dim(`(${this.agents.size})`)}`);
-    console.log(`  ${pc.dim("─".repeat(60))}`);
-    for (const [name, reg] of this.agents) {
-      const tools = reg.toolIndex.size;
-      const marker = name === this.defaultAgentName ? pc.green("●") : " ";
-      console.log(
-        `  ${marker} ${pc.bold(name.padEnd(24))} ${pc.dim(`${tools} tools`)}`,
-      );
-    }
-    console.log(`  ${pc.dim("─".repeat(60))}`);
-    console.log("");
-  }
-
   async shutdown(): Promise<void> {
     this.approvalGate.abortAll();
     if (this.mcpClient) {
@@ -1209,42 +1195,6 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
   }
 }
 
-function normalizeAutoInherit(value: AgentsPluginConfig["autoInheritTools"]): {
-  file: boolean;
-  code: boolean;
-} {
-  // Default is opt-out for both origins. A markdown agent or code-defined
-  // agent with no declared `tools:` gets an empty tool index unless the
-  // developer explicitly flips `autoInheritTools` on. Even then, only tools
-  // whose plugin author marked `autoInheritable: true` are spread — see
-  // `applyAutoInherit` for the filter.
-  if (value === undefined) return { file: false, code: false };
-  if (typeof value === "boolean") return { file: value, code: value };
-  return { file: value.file ?? false, code: value.code ?? false };
-}
-
-function composePromptForAgent(
-  registered: RegisteredAgent,
-  pluginLevel: BaseSystemPromptOption | undefined,
-  ctx: PromptContext,
-): string {
-  const perAgent = registered.baseSystemPrompt;
-  const resolved = perAgent !== undefined ? perAgent : pluginLevel;
-
-  let base = "";
-  if (resolved === false) {
-    base = "";
-  } else if (typeof resolved === "string") {
-    base = resolved;
-  } else if (typeof resolved === "function") {
-    base = resolved(ctx);
-  } else {
-    base = buildBaseSystemPrompt(ctx);
-  }
-
-  return composeSystemPrompt(base, registered.instructions);
-}
-
 /**
  * Plugin factory for the agents plugin. Reads `config/agents/<id>/agent.md` by default,
  * resolves toolkits/tools from registered plugins, exposes `appkit.agents.*`
diff --git a/packages/appkit/src/plugins/agents/prompt.ts b/packages/appkit/src/plugins/agents/prompt.ts
new file mode 100644
index 000000000..d38c6e645
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/prompt.ts
@@ -0,0 +1,57 @@
+import {
+  buildBaseSystemPrompt,
+  composeSystemPrompt,
+} from "../../core/agent/system-prompt";
+import type {
+  AgentsPluginConfig,
+  BaseSystemPromptOption,
+  PromptContext,
+  RegisteredAgent,
+} from "../../core/agent/types";
+
+/**
+ * Resolves the per-agent and plugin-level base prompt options into the
+ * final system prompt sent to the adapter. Per-agent setting wins over
+ * plugin-level; `false` opts out entirely; functions receive the same
+ * `PromptContext` that the default builder uses.
+ */
+export function composePromptForAgent(
+  registered: RegisteredAgent,
+  pluginLevel: BaseSystemPromptOption | undefined,
+  ctx: PromptContext,
+): string {
+  const perAgent = registered.baseSystemPrompt;
+  const resolved = perAgent !== undefined ? perAgent : pluginLevel;
+
+  let base = "";
+  if (resolved === false) {
+    base = "";
+  } else if (typeof resolved === "string") {
+    base = resolved;
+  } else if (typeof resolved === "function") {
+    base = resolved(ctx);
+  } else {
+    base = buildBaseSystemPrompt(ctx);
+  }
+
+  return composeSystemPrompt(base, registered.instructions);
+}
+
+/**
+ * Resolves the plugin-level `autoInheritTools` config into a per-origin
+ * decision. Default is opt-out for both origins. A markdown agent or
+ * code-defined agent with no declared `tools:` gets an empty tool index
+ * unless the developer explicitly flips `autoInheritTools` on. Even then,
+ * only tools whose plugin author marked `autoInheritable: true` are
+ * spread — see `applyAutoInherit` for the filter.
+ */
+export function normalizeAutoInherit(
+  value: AgentsPluginConfig["autoInheritTools"],
+): {
+  file: boolean;
+  code: boolean;
+} {
+  if (value === undefined) return { file: false, code: false };
+  if (typeof value === "boolean") return { file: value, code: value };
+  return { file: value.file ?? false, code: value.code ?? false };
+}
diff --git a/packages/appkit/src/plugins/agents/registry-printer.ts b/packages/appkit/src/plugins/agents/registry-printer.ts
new file mode 100644
index 000000000..9231ee077
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/registry-printer.ts
@@ -0,0 +1,25 @@
+import pc from "picocolors";
+import type { RegisteredAgent } from "../../core/agent/types";
+
+/**
+ * Pretty-prints the registered agent set during plugin setup. Decorative —
+ * no behaviour change if it's skipped (e.g., from tests).
+ */
+export function printRegistry(
+  agents: Map<string, RegisteredAgent>,
+  defaultAgentName: string | null,
+): void {
+  if (agents.size === 0) return;
+  console.log("");
+  console.log(`  ${pc.bold("Agents")} ${pc.dim(`(${agents.size})`)}`);
+  console.log(`  ${pc.dim("─".repeat(60))}`);
+  for (const [name, reg] of agents) {
+    const tools = reg.toolIndex.size;
+    const marker = name === defaultAgentName ? pc.green("●") : " ";
+    console.log(
+      `  ${marker} ${pc.bold(name.padEnd(24))} ${pc.dim(`${tools} tools`)}`,
+    );
+  }
+  console.log(`  ${pc.dim("─".repeat(60))}`);
+  console.log("");
+}

From b739024308b2c05fd2d24396701c971cd12302f6 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Mon, 4 May 2026 19:50:25 +0200
Subject: [PATCH 18/46] feat(appkit): unify on DATABRICKS_SERVING_ENDPOINT_NAME
 (SDK + template manifest)

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 packages/appkit/src/plugins/agents/agents.ts     | 2 +-
 packages/appkit/src/plugins/agents/manifest.json | 6 +++---
 template/appkit.plugins.json                     | 6 +++---
 3 files changed, 7 insertions(+), 7 deletions(-)

diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index d2a113f4c..80cda55e4 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -317,7 +317,7 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
         );
       } catch (err) {
         throw new Error(
-          `Agent '${name}' has no model configured and no DATABRICKS_AGENT_ENDPOINT default available`,
+          `Agent '${name}' has no model configured and no DATABRICKS_SERVING_ENDPOINT_NAME default available`,
           { cause: err instanceof Error ? err : undefined },
         );
       }
diff --git a/packages/appkit/src/plugins/agents/manifest.json b/packages/appkit/src/plugins/agents/manifest.json
index 4571031a8..01e843a85 100644
--- a/packages/appkit/src/plugins/agents/manifest.json
+++ b/packages/appkit/src/plugins/agents/manifest.json
@@ -11,12 +11,12 @@
         "type": "serving_endpoint",
         "alias": "Model Serving (agents)",
         "resourceKey": "agents-serving-endpoint",
-        "description": "Databricks Model Serving endpoint for agents using workspace-hosted models (`DatabricksAdapter.fromModelServing`). Wire the same endpoint name AppKit reads from `DATABRICKS_AGENT_ENDPOINT` when no per-agent model is configured. Omit when agents use only external adapters.",
+        "description": "Databricks Model Serving endpoint for agents using workspace-hosted models (`DatabricksAdapter.fromModelServing`). Wire the same endpoint name AppKit reads from `DATABRICKS_SERVING_ENDPOINT_NAME` when no per-agent model is configured. The same env var the `serving` plugin reads — one value covers both. Omit when agents use only external adapters.",
         "permission": "CAN_QUERY",
         "fields": {
           "name": {
-            "env": "DATABRICKS_AGENT_ENDPOINT",
-            "description": "Endpoint name passed to Model Serving when agents default to `DatabricksAdapter.fromModelServing()`"
+            "env": "DATABRICKS_SERVING_ENDPOINT_NAME",
+            "description": "Endpoint name passed to Model Serving when agents default to `DatabricksAdapter.fromModelServing()`. Shared with the `serving` plugin."
           }
         }
       }
diff --git a/template/appkit.plugins.json b/template/appkit.plugins.json
index 2f22a50c1..87e4304ac 100644
--- a/template/appkit.plugins.json
+++ b/template/appkit.plugins.json
@@ -14,12 +14,12 @@
             "type": "serving_endpoint",
             "alias": "Model Serving (agents)",
             "resourceKey": "agents-serving-endpoint",
-            "description": "Databricks Model Serving endpoint for agents using workspace-hosted models (`DatabricksAdapter.fromModelServing`). Wire the same endpoint name AppKit reads from `DATABRICKS_AGENT_ENDPOINT` when no per-agent model is configured. Omit when agents use only external adapters.",
+            "description": "Databricks Model Serving endpoint for agents using workspace-hosted models (`DatabricksAdapter.fromModelServing`). Wire the same endpoint name AppKit reads from `DATABRICKS_SERVING_ENDPOINT_NAME` when no per-agent model is configured. The same env var the `serving` plugin reads — one value covers both. Omit when agents use only external adapters.",
             "permission": "CAN_QUERY",
             "fields": {
               "name": {
-                "env": "DATABRICKS_AGENT_ENDPOINT",
-                "description": "Endpoint name passed to Model Serving when agents default to `DatabricksAdapter.fromModelServing()`"
+                "env": "DATABRICKS_SERVING_ENDPOINT_NAME",
+                "description": "Endpoint name passed to Model Serving when agents default to `DatabricksAdapter.fromModelServing()`. Shared with the `serving` plugin."
               }
             }
           }

From e460364e3bb2accb2804051979a4d1fbfe2a62ae Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Tue, 21 Apr 2026 19:58:04 +0200
Subject: [PATCH 19/46] feat(appkit): reference agent-app, dev-playground chat
 UI, docs, and template
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Final layer of the agents feature stack. Everything needed to
exercise, demonstrate, and learn the feature.

`apps/agent-app/` — a standalone app purpose-built around the agents
feature. Ships with:

- `server.ts` — full example of code-defined agents via `fromPlugin`:
  ```ts
  const support = createAgent({
    instructions: "…",
    tools: {
      ...fromPlugin(analytics),
      ...fromPlugin(files),
      get_weather,
      "mcp.vector-search": mcpServer("vector-search", "https://…"),
    },
  });

  await createApp({
    plugins: [server({ port }), analytics(), files(), agents({ agents: { support } })],
  });
  ```
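- `config/agents/assistant.md` — markdown-driven agent alongside the
  code-defined one. (Auto-inherit is no longer asymmetric by default:
  both origins default to off, and the reference config opts in with
  `autoInheritTools: { file: true }` — see the auto-inherit note
  further down.)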
- Vite + React 19 + TailwindCSS frontend with a chat UI.
- Databricks deployment config (`databricks.yml`, `app.yaml`) and
  deploy scripts.

`apps/dev-playground/client/src/routes/agent.route.tsx` — chat UI with
inline autocomplete (hits the `autocomplete` markdown agent) and a
full threaded conversation panel (hits the default agent).

`apps/dev-playground/server/index.ts` — adds a code-defined `helper`
agent using `fromPlugin(analytics)` alongside the markdown-driven
`autocomplete` agent in `config/agents/`. Exercises the mixed-style
setup (markdown + code) against the same plugin list.

`apps/dev-playground/config/agents/*.md` — both agents defined with
valid YAML frontmatter.

`docs/docs/plugins/agents.md` — progressive five-level guide:

1. Drop a markdown file → it just works.
2. Scope tools via `toolkits:` / `tools:` frontmatter.
3. Code-defined agents with `fromPlugin()`.
4. Sub-agents.
5. Standalone `runAgent()` (no `createApp` or HTTP).

Plus a configuration reference, runtime API reference, and frontmatter
schema table.

`docs/docs/api/appkit/` — regenerated typedoc for the new public
surface (fromPlugin, runAgent, AgentDefinition, AgentsPluginConfig,
ToolkitEntry, ToolkitOptions, all adapter types, and the agents
plugin factory).

`template/appkit.plugins.json` — carries the `agent` plugin entry so
`npx @databricks/appkit init --features agent` scaffolds the plugin
correctly. (The entry predates this commit; this commit's diff does
not touch the file.)

Verification:

- Full appkit vitest suite: 1311 tests passing
- Typecheck clean across all 8 workspace projects
- `pnpm docs:build` clean (no broken links)
- `pnpm --filter=@databricks/appkit build:package` clean, publint
  clean

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>

Documents the new `mcp` configuration block and the rules it enforces:
same-origin-only by default, explicit `trustedHosts` for external MCP
servers, plaintext `http://` refused outside localhost-in-dev, and
DNS-level blocking of private / link-local IP ranges (covers cloud
metadata services). See PR #302 for the policy implementation and
PR #304 for the `AgentsPluginConfig.mcp` wiring.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>

- `docs/docs/plugins/agents.md`: new "SQL agent tools" subsection
  covering `analytics.query` readOnly enforcement, `lakebase.query`
  opt-in via `exposeAsAgentTool`, and the approval flow. New
  "Human-in-the-loop approval for destructive tools" subsection
  documents the config, SSE event shape, and `POST /chat/approve`
  contract.

- `apps/agent-app`: approval-card component rendered inline in the
  chat stream whenever an `appkit.approval_pending` event arrives.
  Destructive badge + Approve/Deny buttons POST to
  `/api/agent/approve` with the carried `streamId`/`approvalId`.

- `apps/dev-playground/client`: matching approval-card on the agent
  route, using the existing appkit-ui `Button` component and
  Tailwind utility classes.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>

Updates `docs/docs/plugins/agents.md` to document the new
two-key auto-inherit model introduced in PR #302 (per-tool
`autoInheritable` flag) and PR #304 (safe-by-default
`autoInheritTools: { file: false, code: false }`). Adds an
"Auto-inherit posture" subsection explaining that the developer
must opt into `autoInheritTools` AND the plugin author must mark
each tool `autoInheritable: true` for a tool to spread without
explicit wiring.

Includes a table documenting the `autoInheritable` marking on each
core plugin tool, plus an example of the setup-time audit log so
operators can see exactly what's inherited vs. skipped.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>

- **Reference app no longer ships hardcoded dogfood URLs.** The three
  `https://e2-dogfood.staging.cloud.databricks.com/...` and
  `https://mario-mcp-hello-*.staging.aws.databricksapps.com/...` MCP
  URLs in `apps/agent-app/server.ts` are replaced with optional
  env-driven `VECTOR_SEARCH_MCP_URL` / `CUSTOM_MCP_URL` config. When
  set, their hostnames are auto-added to
  `agents({ mcp: { trustedHosts } })`. `.env.example` uses placeholder
  values the reader can replace instead of pointing at another team's
  workspace.

- **`appkit.agent` → `appkit.agents` in the reference app.** The
  prior `appkit.agent as { list, getDefault }` cast papered over the
  plugin-name mismatch fixed in PR #304. The runtime key now matches
  the docs, the manifest, and the factory name; the cast is gone.

- **Auto-inherit opt-in added to the reference config.** Since the
  defaults flipped to `{ file: false, code: false }` (PR #304, S-3),
  the reference now explicitly enables
  `autoInheritTools: { file: true }` so the markdown agents that ship
  alongside the code-defined one still pick up the analytics / files
  read-only tools. This is the pattern a real deployment should
  follow — opt in deliberately.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>

- `apps/dev-playground/config/agents/autocomplete.md` sets
  `ephemeral: true`. Each debounced autocomplete keystroke no longer
  leaves an orphan thread in `InMemoryThreadStore` — the server now
  deletes the thread in the stream's `finally` (PR #304). Closes R1
  from the MVP re-review.
- `docs/docs/plugins/agents.md` documents the new `ephemeral`
  frontmatter key alongside the other AgentDefinition knobs.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>

Documents the MVP resource caps landed in PR #304: the static
request-body caps (enforced by the Zod schemas) and the three
configurable runtime limits (`maxConcurrentStreamsPerUser`,
`maxToolCalls`, `maxSubAgentDepth`). Includes the config-block
shape in the main reference and a new "Resource limits" subsection
under the Configuration section explaining the intent and per-user
semantics of each cap.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 apps/agent-app/.env.example                   |  16 +
 apps/agent-app/.gitignore                     |   3 +
 apps/agent-app/app.yaml                       |   8 +
 apps/agent-app/config/agents/assistant.md     |  23 +
 apps/agent-app/config/agents/support.md       |  17 +
 apps/agent-app/databricks.yml                 |  50 ++
 apps/agent-app/index.html                     |  12 +
 apps/agent-app/package.json                   |  40 ++
 apps/agent-app/postcss.config.js              |   6 +
 apps/agent-app/server.ts                      | 100 +++
 apps/agent-app/src/App.css                    | 440 ++++++++++++++
 apps/agent-app/src/App.tsx                    | 405 +++++++++++++
 .../src/components/theme-selector.tsx         | 135 +++++
 apps/agent-app/src/index.css                  |   1 +
 apps/agent-app/src/main.tsx                   |  15 +
 apps/agent-app/tailwind.config.ts             |  11 +
 apps/agent-app/tsconfig.app.json              |  24 +
 apps/agent-app/tsconfig.json                  |   7 +
 apps/agent-app/tsconfig.node.json             |  22 +
 apps/agent-app/vite.config.ts                 |  31 +
 .../client/src/routeTree.gen.ts               |  21 +
 .../client/src/routes/__root.tsx              |   8 +
 .../client/src/routes/agent.route.tsx         | 567 ++++++++++++++++++
 .../client/src/routes/index.tsx               |  29 +-
 .../dev-playground/config/agents/assistant.md |   6 +
 .../config/agents/autocomplete.md             |   7 +
 apps/dev-playground/server/index.ts           |  25 +-
 docs/docs/api/appkit/Function.createAgent.md  |  35 ++
 docs/docs/api/appkit/Function.fromPlugin.md   |  50 ++
 .../api/appkit/Function.isFromPluginMarker.md |  17 +
 .../api/appkit/Function.isFunctionTool.md     |  15 +
 docs/docs/api/appkit/Function.isHostedTool.md |  15 +
 .../api/appkit/Function.isToolkitEntry.md     |  18 +
 .../api/appkit/Function.loadAgentFromFile.md  |  23 +
 .../api/appkit/Function.loadAgentsFromDir.md  |  29 +
 docs/docs/api/appkit/Function.mcpServer.md    |  26 +
 docs/docs/api/appkit/Function.runAgent.md     |  29 +
 docs/docs/api/appkit/Function.tool.md         |  29 +
 .../docs/api/appkit/Interface.AgentAdapter.md |  20 +
 .../api/appkit/Interface.AgentDefinition.md   |  97 +++
 docs/docs/api/appkit/Interface.AgentInput.md  |  33 +
 .../api/appkit/Interface.AgentRunContext.md   |  28 +
 .../appkit/Interface.AgentToolDefinition.md   |  33 +
 .../appkit/Interface.AgentsPluginConfig.md    | 227 +++++++
 .../api/appkit/Interface.BasePluginConfig.md  |   1 +
 .../api/appkit/Interface.FromPluginMarker.md  |  32 +
 .../docs/api/appkit/Interface.FunctionTool.md |  59 ++
 docs/docs/api/appkit/Interface.Message.md     |  49 ++
 .../api/appkit/Interface.PromptContext.md     |  27 +
 .../api/appkit/Interface.RunAgentInput.md     |  35 ++
 .../api/appkit/Interface.RunAgentResult.md    |  21 +
 docs/docs/api/appkit/Interface.Thread.md      |  41 ++
 docs/docs/api/appkit/Interface.ThreadStore.md |  98 +++
 docs/docs/api/appkit/Interface.ToolConfig.md  |  49 ++
 .../docs/api/appkit/Interface.ToolProvider.md |  36 ++
 .../docs/api/appkit/Interface.ToolkitEntry.md |  59 ++
 .../api/appkit/Interface.ToolkitOptions.md    |  41 ++
 docs/docs/api/appkit/TypeAlias.AgentEvent.md  | 268 +++++++++
 docs/docs/api/appkit/TypeAlias.AgentTool.md   |  12 +
 docs/docs/api/appkit/TypeAlias.AgentTools.md  |  14 +
 .../TypeAlias.BaseSystemPromptOption.md       |   8 +
 docs/docs/api/appkit/TypeAlias.HostedTool.md  |   9 +
 docs/docs/api/appkit/Variable.agents.md       |  19 +
 docs/docs/api/appkit/index.md                 |  35 ++
 docs/docs/api/appkit/typedoc-sidebar.ts       | 175 ++++++
 docs/docs/plugins/agents.md                   | 398 ++++++++++++
 pnpm-lock.yaml                                | 336 ++++++++++-
 67 files changed, 4521 insertions(+), 54 deletions(-)
 create mode 100644 apps/agent-app/.env.example
 create mode 100644 apps/agent-app/.gitignore
 create mode 100644 apps/agent-app/app.yaml
 create mode 100644 apps/agent-app/config/agents/assistant.md
 create mode 100644 apps/agent-app/config/agents/support.md
 create mode 100644 apps/agent-app/databricks.yml
 create mode 100644 apps/agent-app/index.html
 create mode 100644 apps/agent-app/package.json
 create mode 100644 apps/agent-app/postcss.config.js
 create mode 100644 apps/agent-app/server.ts
 create mode 100644 apps/agent-app/src/App.css
 create mode 100644 apps/agent-app/src/App.tsx
 create mode 100644 apps/agent-app/src/components/theme-selector.tsx
 create mode 100644 apps/agent-app/src/index.css
 create mode 100644 apps/agent-app/src/main.tsx
 create mode 100644 apps/agent-app/tailwind.config.ts
 create mode 100644 apps/agent-app/tsconfig.app.json
 create mode 100644 apps/agent-app/tsconfig.json
 create mode 100644 apps/agent-app/tsconfig.node.json
 create mode 100644 apps/agent-app/vite.config.ts
 create mode 100644 apps/dev-playground/client/src/routes/agent.route.tsx
 create mode 100644 apps/dev-playground/config/agents/assistant.md
 create mode 100644 apps/dev-playground/config/agents/autocomplete.md
 create mode 100644 docs/docs/api/appkit/Function.createAgent.md
 create mode 100644 docs/docs/api/appkit/Function.fromPlugin.md
 create mode 100644 docs/docs/api/appkit/Function.isFromPluginMarker.md
 create mode 100644 docs/docs/api/appkit/Function.isFunctionTool.md
 create mode 100644 docs/docs/api/appkit/Function.isHostedTool.md
 create mode 100644 docs/docs/api/appkit/Function.isToolkitEntry.md
 create mode 100644 docs/docs/api/appkit/Function.loadAgentFromFile.md
 create mode 100644 docs/docs/api/appkit/Function.loadAgentsFromDir.md
 create mode 100644 docs/docs/api/appkit/Function.mcpServer.md
 create mode 100644 docs/docs/api/appkit/Function.runAgent.md
 create mode 100644 docs/docs/api/appkit/Function.tool.md
 create mode 100644 docs/docs/api/appkit/Interface.AgentAdapter.md
 create mode 100644 docs/docs/api/appkit/Interface.AgentDefinition.md
 create mode 100644 docs/docs/api/appkit/Interface.AgentInput.md
 create mode 100644 docs/docs/api/appkit/Interface.AgentRunContext.md
 create mode 100644 docs/docs/api/appkit/Interface.AgentToolDefinition.md
 create mode 100644 docs/docs/api/appkit/Interface.AgentsPluginConfig.md
 create mode 100644 docs/docs/api/appkit/Interface.FromPluginMarker.md
 create mode 100644 docs/docs/api/appkit/Interface.FunctionTool.md
 create mode 100644 docs/docs/api/appkit/Interface.Message.md
 create mode 100644 docs/docs/api/appkit/Interface.PromptContext.md
 create mode 100644 docs/docs/api/appkit/Interface.RunAgentInput.md
 create mode 100644 docs/docs/api/appkit/Interface.RunAgentResult.md
 create mode 100644 docs/docs/api/appkit/Interface.Thread.md
 create mode 100644 docs/docs/api/appkit/Interface.ThreadStore.md
 create mode 100644 docs/docs/api/appkit/Interface.ToolConfig.md
 create mode 100644 docs/docs/api/appkit/Interface.ToolProvider.md
 create mode 100644 docs/docs/api/appkit/Interface.ToolkitEntry.md
 create mode 100644 docs/docs/api/appkit/Interface.ToolkitOptions.md
 create mode 100644 docs/docs/api/appkit/TypeAlias.AgentEvent.md
 create mode 100644 docs/docs/api/appkit/TypeAlias.AgentTool.md
 create mode 100644 docs/docs/api/appkit/TypeAlias.AgentTools.md
 create mode 100644 docs/docs/api/appkit/TypeAlias.BaseSystemPromptOption.md
 create mode 100644 docs/docs/api/appkit/TypeAlias.HostedTool.md
 create mode 100644 docs/docs/api/appkit/Variable.agents.md
 create mode 100644 docs/docs/plugins/agents.md

diff --git a/apps/agent-app/.env.example b/apps/agent-app/.env.example
new file mode 100644
index 000000000..055bb94c1
--- /dev/null
+++ b/apps/agent-app/.env.example
@@ -0,0 +1,16 @@
+# Databricks workspace (auto-injected by platform on deploy)
+DATABRICKS_HOST=https://your-workspace.cloud.databricks.com
+
+# Agent LLM endpoint (Model Serving endpoint name)
+DATABRICKS_AGENT_ENDPOINT=databricks-claude-sonnet-4-5
+
+# Analytics plugin — SQL warehouse ID
+DATABRICKS_WAREHOUSE_ID=your-warehouse-id
+
+# Files plugin — Volume path (/Volumes/<catalog>/<schema>/<volume>)
+DATABRICKS_VOLUME_FILES=/Volumes/your-catalog/your-schema/your-volume
+
+# Optional: Custom MCP servers the agent can call. When set, the hostname
+# is automatically added to agents({ mcp: { trustedHosts } }).
+# VECTOR_SEARCH_MCP_URL=https://<workspace>/api/2.0/mcp/vector-search/<catalog>/<schema>/<index>
+# CUSTOM_MCP_URL=https://<your-mcp-server>/mcp
diff --git a/apps/agent-app/.gitignore b/apps/agent-app/.gitignore
new file mode 100644
index 000000000..9c97bbd46
--- /dev/null
+++ b/apps/agent-app/.gitignore
@@ -0,0 +1,3 @@
+node_modules
+dist
+.env
diff --git a/apps/agent-app/app.yaml b/apps/agent-app/app.yaml
new file mode 100644
index 000000000..215b89ec3
--- /dev/null
+++ b/apps/agent-app/app.yaml
@@ -0,0 +1,8 @@
+command: ['node', '--import', 'tsx', 'server.ts']
+env:
+  - name: DATABRICKS_WAREHOUSE_ID
+    valueFrom: sql-warehouse
+  - name: DATABRICKS_AGENT_ENDPOINT
+    valueFrom: serving-endpoint
+  - name: DATABRICKS_VOLUME_FILES
+    valueFrom: volume
diff --git a/apps/agent-app/config/agents/assistant.md b/apps/agent-app/config/agents/assistant.md
new file mode 100644
index 000000000..1eb5a84fc
--- /dev/null
+++ b/apps/agent-app/config/agents/assistant.md
@@ -0,0 +1,23 @@
+---
+endpoint: databricks-claude-sonnet-4-5
+default: true
+toolkits:
+  - files: [files.list, files.upload, files.delete]
+agents:
+  - support
+  - researcher
+---
+
+You are a front-desk dispatcher running on Databricks.
+
+Delegate requests to the right specialist:
+
+- `agent-support` — data analysis (SQL via analytics), file browsing, and general questions.
+- `agent-researcher` — research and knowledge lookups that benefit from MCP-hosted tools (vector search, custom endpoints).
+
+Only use your own tools (`files.upload`, `files.delete`, `files.list`) for
+file-management actions the user explicitly asks for. Destructive ones
+(`upload`, `delete`) will prompt the user for approval before running.
+
+Keep your own responses short — mostly routing decisions plus a brief summary
+of what the specialist returned.
diff --git a/apps/agent-app/config/agents/support.md b/apps/agent-app/config/agents/support.md
new file mode 100644
index 000000000..68d7e964d
--- /dev/null
+++ b/apps/agent-app/config/agents/support.md
@@ -0,0 +1,17 @@
+---
+endpoint: databricks-claude-sonnet-4-5
+toolkits:
+  - analytics
+  - files
+tools:
+  - get_weather
+  # Optional MCP servers — uncomment the ones whose env vars are set in
+  # .env (VECTOR_SEARCH_MCP_URL, CUSTOM_MCP_URL). `server.ts` only
+  # registers each as ambient when its URL is configured, so leaving a
+  # reference here while the env var is unset will fail at startup.
+  # - mcp.vector-search
+  # - mcp.custom
+---
+
+You help customers with data analysis, file browsing, and general questions.
+Use the available tools as needed and summarize results concisely.
diff --git a/apps/agent-app/databricks.yml b/apps/agent-app/databricks.yml
new file mode 100644
index 000000000..3ed6e50ad
--- /dev/null
+++ b/apps/agent-app/databricks.yml
@@ -0,0 +1,50 @@
+bundle:
+  name: appkit-agent-app
+
+variables:
+  sql_warehouse_id:
+    description: SQL Warehouse ID for analytics queries
+  serving_endpoint_name:
+    description: Model Serving endpoint name for the agent LLM
+  volume_full_name:
+    description: "UC Volume full name (e.g. catalog.schema.volume_name)"
+
+resources:
+  apps:
+    agent_app:
+      name: "appkit-agent-app"
+      description: "AppKit agent with auto-discovered tools from analytics, files, and genie plugins"
+      source_code_path: ./
+
+      user_api_scopes:
+        - sql
+        - files.files
+        - dashboards.genie
+
+      resources:
+        - name: sql-warehouse
+          sql_warehouse:
+            id: ${var.sql_warehouse_id}
+            permission: CAN_USE
+
+        - name: serving-endpoint
+          serving_endpoint:
+            name: ${var.serving_endpoint_name}
+            permission: CAN_QUERY
+
+        - name: volume
+          uc_securable:
+            securable_type: VOLUME
+            securable_full_name: ${var.volume_full_name}
+            permission: WRITE_VOLUME
+
+targets:
+  dogfood:
+    default: true
+    workspace:
+      host: https://e2-dogfood.staging.cloud.databricks.com
+
+    variables:
+      sql_warehouse_id: dd43ee29fedd958d
+      serving_endpoint_name: databricks-claude-sonnet-4-5
+      volume_full_name: main.mario.mario-vol
diff --git a/apps/agent-app/index.html b/apps/agent-app/index.html
new file mode 100644
index 000000000..80e54faf6
--- /dev/null
+++ b/apps/agent-app/index.html
@@ -0,0 +1,12 @@
+<!doctype html>
+<html lang="en">
+  <head>
+    <meta charset="UTF-8" />
+    <meta name="viewport" content="width=device-width, initial-scale=1.0" />
+    <title>AppKit Agent</title>
+  </head>
+  <body>
+    <div id="root"></div>
+    <script type="module" src="/src/main.tsx"></script>
+  </body>
+</html>
diff --git a/apps/agent-app/package.json b/apps/agent-app/package.json
new file mode 100644
index 000000000..ed159ca8d
--- /dev/null
+++ b/apps/agent-app/package.json
@@ -0,0 +1,40 @@
+{
+  "name": "agent-app",
+  "private": true,
+  "version": "0.0.0",
+  "type": "module",
+  "scripts": {
+    "dev": "NODE_ENV=development tsx watch server.ts",
+    "build": "tsc -b && vite build",
+    "preview": "vite preview"
+  },
+  "dependencies": {
+    "@databricks/appkit": "workspace:*",
+    "@databricks/appkit-ui": "workspace:*",
+    "@databricks/sdk-experimental": "^0.16.0",
+    "dotenv": "^16.6.1",
+    "lucide-react": "^0.511.0",
+    "react": "19.2.0",
+    "react-dom": "19.2.0",
+    "marked": "^15.0.0",
+    "zod": "^4.0.0"
+  },
+  "devDependencies": {
+    "@tailwindcss/postcss": "4.1.17",
+    "@types/node": "24.10.1",
+    "@types/react": "19.2.7",
+    "@types/react-dom": "19.2.3",
+    "@vitejs/plugin-react": "5.1.1",
+    "autoprefixer": "10.4.21",
+    "postcss": "8.5.6",
+    "tailwindcss": "4.1.17",
+    "tailwindcss-animate": "1.0.7",
+    "tw-animate-css": "1.4.0",
+    "tsx": "4.20.6",
+    "typescript": "5.9.3",
+    "vite": "npm:rolldown-vite@7.1.14"
+  },
+  "overrides": {
+    "vite": "npm:rolldown-vite@7.1.14"
+  }
+}
diff --git a/apps/agent-app/postcss.config.js b/apps/agent-app/postcss.config.js
new file mode 100644
index 000000000..f69c5d411
--- /dev/null
+++ b/apps/agent-app/postcss.config.js
@@ -0,0 +1,6 @@
+export default {
+  plugins: {
+    "@tailwindcss/postcss": {},
+    autoprefixer: {},
+  },
+};
diff --git a/apps/agent-app/server.ts b/apps/agent-app/server.ts
new file mode 100644
index 000000000..8ea63c224
--- /dev/null
+++ b/apps/agent-app/server.ts
@@ -0,0 +1,100 @@
+import {
+  agents,
+  analytics,
+  createAgent,
+  createApp,
+  files,
+  mcpServer,
+  server,
+  tool,
+} from "@databricks/appkit";
+import { z } from "zod";
+
+const port = Number(process.env.DATABRICKS_APP_PORT) || 8003;
+
+// Ambient function tool. Referenced from `config/agents/support.md` under
+// `tools: [get_weather]`. Markdown frontmatter looks up this name against
+// the `tools:` record passed to `agents({ tools: { get_weather } })` below.
+const get_weather = tool({
+  name: "get_weather",
+  description: "Get the current weather for a city",
+  schema: z.object({
+    city: z.string().describe("City name"),
+  }),
+  execute: async ({ city }) => `The weather in ${city} is sunny, 22°C`,
+});
+
+// MCP servers are conditional on runtime env vars — something markdown
+// frontmatter can't express. This is the motivating case for defining
+// the `researcher` agent in code below: it wires whatever MCP tools are
+// configured at boot, and is always callable (with a graceful fallback
+// when nothing is wired).
+//
+// Any MCP URL configured here must also be allowlisted via
+// `agents({ mcp: { trustedHosts: [...] } })` before outbound calls will
+// be allowed by the zero-trust host policy.
+const customMcpServers: Record<string, ReturnType<typeof mcpServer>> = {};
+if (process.env.VECTOR_SEARCH_MCP_URL) {
+  customMcpServers["mcp.vector-search"] = mcpServer(
+    "vector-search",
+    process.env.VECTOR_SEARCH_MCP_URL,
+  );
+}
+if (process.env.CUSTOM_MCP_URL) {
+  customMcpServers["mcp.custom"] = mcpServer(
+    "custom",
+    process.env.CUSTOM_MCP_URL,
+  );
+}
+
+// Code-defined research specialist. `assistant.md` references this by name
+// under `agents: [researcher]`; the agents plugin resolves that reference
+// against both markdown siblings and code-defined agents, with code winning
+// on collision. Defined in code so its MCP toolset can flex on env vars.
+const researcher = createAgent({
+  instructions:
+    "You are a research specialist. When MCP tools are available " +
+    "(vector search, custom endpoints), prefer them for knowledge lookups. " +
+    "If no MCP tools are configured, say so briefly and answer from general " +
+    "knowledge. Always include your source or note when you're answering " +
+    "without search.",
+  tools: {
+    get_weather,
+    ...customMcpServers,
+  },
+});
+
+const trustedMcpHosts = [
+  process.env.VECTOR_SEARCH_MCP_URL,
+  process.env.CUSTOM_MCP_URL,
+]
+  .filter((u): u is string => typeof u === "string" && u.length > 0)
+  .map((u) => new URL(u).hostname);
+
+const appkit = await createApp({
+  plugins: [
+    server({ port }),
+    analytics(),
+    files(),
+    agents({
+      // Code-defined agents merged with markdown agents; code wins on name
+      // collision. Markdown `agents: [...]` frontmatter can reference either.
+      agents: { researcher },
+      // Ambient tool library for markdown agents referencing names under
+      // their `tools:` frontmatter.
+      tools: { get_weather, ...customMcpServers },
+      // Enables auto-inherit of read-only plugin tools (analytics/files) into
+      // markdown agents that declare no explicit `toolkits:` / `tools:`. Both
+      // assistant.md and support.md are explicit, so this is a no-op today,
+      // but kept as a knob markdown authors can rely on.
+      autoInheritTools: { file: true },
+      mcp: { trustedHosts: trustedMcpHosts },
+    }),
+  ],
+});
+
+console.log(
+  `Agent app running on port ${port}. ` +
+    `Agents: ${appkit.agents.list().join(", ") || "(none)"}. ` +
+    `Default: ${appkit.agents.getDefault() ?? "(none)"}.`,
+);
diff --git a/apps/agent-app/src/App.css b/apps/agent-app/src/App.css
new file mode 100644
index 000000000..545b438cd
--- /dev/null
+++ b/apps/agent-app/src/App.css
@@ -0,0 +1,440 @@
+:root {
+  --bg: #fafafa;
+  --card: #ffffff;
+  --border: #e5e5e5;
+  --text: #171717;
+  --text-muted: #737373;
+  --text-faint: #a3a3a3;
+  --primary: #2563eb;
+  --primary-fg: #ffffff;
+  --muted: #f5f5f5;
+  --ring: #93c5fd;
+  --radius: 10px;
+  --font: system-ui, -apple-system, sans-serif;
+  --mono: "SF Mono", "Cascadia Code", "Fira Code", monospace;
+}
+
+:root.dark {
+  --bg: #0a0a0a;
+  --card: #171717;
+  --border: #262626;
+  --text: #fafafa;
+  --text-muted: #a3a3a3;
+  --text-faint: #525252;
+  --primary: #3b82f6;
+  --primary-fg: #ffffff;
+  --muted: #262626;
+  --ring: #1d4ed8;
+}
+
+* {
+  margin: 0;
+  padding: 0;
+  box-sizing: border-box;
+}
+
+body {
+  font-family: var(--font);
+  background: var(--bg);
+  color: var(--text);
+  -webkit-font-smoothing: antialiased;
+}
+
+.app {
+  min-height: 100vh;
+}
+
+.container {
+  max-width: 1100px;
+  margin: 0 auto;
+  padding: 2.5rem 1.5rem;
+}
+
+.header {
+  margin-bottom: 1.5rem;
+  display: flex;
+  align-items: flex-start;
+  justify-content: space-between;
+}
+
+.header h1 {
+  font-size: 1.75rem;
+  font-weight: 700;
+  letter-spacing: -0.025em;
+}
+
+.subtitle {
+  color: var(--text-muted);
+  font-size: 0.875rem;
+  margin-top: 0.25rem;
+}
+
+.thread-id {
+  font-family: var(--mono);
+  font-size: 0.75rem;
+  opacity: 0.6;
+}
+
+.main-layout {
+  display: flex;
+  gap: 1.25rem;
+  height: 700px;
+}
+
+.chat-panel {
+  flex: 1;
+  display: flex;
+  flex-direction: column;
+  border: 1px solid var(--border);
+  border-radius: var(--radius);
+  background: var(--card);
+  min-width: 0;
+  overflow: hidden;
+}
+
+.messages {
+  flex: 1;
+  overflow-y: auto;
+  padding: 1.25rem;
+  display: flex;
+  flex-direction: column;
+  gap: 1rem;
+}
+
+.empty-state {
+  text-align: center;
+  padding: 5rem 1rem;
+  color: var(--text-muted);
+}
+
+.empty-title {
+  font-size: 1.1rem;
+  font-weight: 500;
+}
+
+.empty-sub {
+  font-size: 0.85rem;
+  margin-top: 0.5rem;
+  color: var(--text-faint);
+}
+
+.message-row {
+  display: flex;
+}
+
+.message-row.user {
+  justify-content: flex-end;
+}
+
+.message-row.assistant {
+  justify-content: flex-start;
+}
+
+.bubble {
+  max-width: 80%;
+  padding: 0.625rem 0.875rem;
+  border-radius: var(--radius);
+  font-size: 0.875rem;
+  line-height: 1.5;
+  word-break: break-word;
+}
+
+.bubble.user {
+  white-space: pre-wrap;
+  background: var(--primary);
+  color: var(--primary-fg);
+  border-bottom-right-radius: 3px;
+}
+
+.bubble.assistant {
+  background: var(--muted);
+  color: var(--text);
+  border-bottom-left-radius: 3px;
+}
+
+.bubble.thinking {
+  color: var(--text-muted);
+  animation: pulse 1.5s ease-in-out infinite;
+}
+
+.bubble.approval-card {
+  border: 1px solid #d96b3a;
+  background: color-mix(in srgb, #d96b3a 10%, var(--muted));
+}
+
+.approval-header {
+  display: flex;
+  align-items: center;
+  gap: 8px;
+  margin-bottom: 8px;
+}
+
+.approval-badge {
+  display: inline-block;
+  padding: 2px 8px;
+  font-size: 0.75rem;
+  font-weight: 600;
+  letter-spacing: 0.02em;
+  text-transform: uppercase;
+  color: #fff;
+  background: #d96b3a;
+  border-radius: 3px;
+}
+
+.approval-body {
+  font-size: 0.9rem;
+}
+
+.approval-args {
+  margin: 6px 0 0;
+  padding: 8px;
+  font-size: 0.8rem;
+  max-height: 220px;
+  overflow: auto;
+  background: var(--bg);
+  border-radius: 4px;
+  white-space: pre-wrap;
+  word-break: break-word;
+}
+
+.approval-actions {
+  display: flex;
+  gap: 8px;
+  margin-top: 10px;
+  justify-content: flex-end;
+}
+
+.approval-actions button {
+  padding: 6px 14px;
+  font-size: 0.85rem;
+  font-weight: 500;
+  border-radius: 4px;
+  border: 1px solid transparent;
+  cursor: pointer;
+  transition:
+    background 0.15s,
+    border-color 0.15s;
+}
+
+.approval-deny {
+  background: transparent;
+  color: var(--text);
+  border-color: var(--border);
+}
+
+.approval-deny:hover {
+  background: var(--muted);
+}
+
+.approval-approve {
+  background: #d96b3a;
+  color: #fff;
+}
+
+.approval-approve:hover {
+  background: #c35a2b;
+}
+
+.bubble.assistant > * + * {
+  margin-top: 0.5em;
+}
+
+.bubble.assistant p {
+  margin: 0;
+}
+
+.bubble.assistant p + p {
+  margin-top: 0.4em;
+}
+
+.bubble.assistant code {
+  font-family: var(--mono);
+  font-size: 0.8em;
+  background: color-mix(in srgb, var(--text) 8%, transparent);
+  padding: 0.15em 0.35em;
+  border-radius: 4px;
+}
+
+.bubble.assistant pre {
+  margin: 0.5em 0;
+  padding: 0.75em;
+  border-radius: 6px;
+  background: color-mix(in srgb, var(--text) 6%, transparent);
+  overflow-x: auto;
+}
+
+.bubble.assistant pre code {
+  background: none;
+  padding: 0;
+  font-size: 0.8em;
+}
+
+.bubble.assistant ul,
+.bubble.assistant ol {
+  margin: 0.4em 0;
+  padding-left: 1.5em;
+}
+
+.bubble.assistant li {
+  margin: 0.15em 0;
+}
+
+.bubble.assistant h1,
+.bubble.assistant h2,
+.bubble.assistant h3 {
+  font-weight: 600;
+}
+
+.bubble.assistant h1 {
+  font-size: 1.1em;
+}
+.bubble.assistant h2 {
+  font-size: 1em;
+}
+.bubble.assistant h3 {
+  font-size: 0.95em;
+}
+
+.bubble.assistant blockquote {
+  margin: 0.4em 0;
+  padding-left: 0.75em;
+  border-left: 3px solid var(--border);
+  color: var(--text-muted);
+}
+
+.bubble.assistant table {
+  border-collapse: collapse;
+  margin: 0.5em 0;
+  font-size: 0.85em;
+}
+
+.bubble.assistant th,
+.bubble.assistant td {
+  border: 1px solid var(--border);
+  padding: 0.35em 0.6em;
+}
+
+.bubble.assistant th {
+  background: color-mix(in srgb, var(--text) 4%, transparent);
+  font-weight: 600;
+}
+
+@keyframes pulse {
+  0%,
+  100% {
+    opacity: 1;
+  }
+  50% {
+    opacity: 0.5;
+  }
+}
+
+.input-bar {
+  display: flex;
+  gap: 0.5rem;
+  padding: 0.875rem 1rem;
+  border-top: 1px solid var(--border);
+}
+
+.input-bar textarea {
+  flex: 1;
+  padding: 0.5rem 0.75rem;
+  border: 1px solid var(--border);
+  border-radius: 8px;
+  background: var(--bg);
+  color: var(--text);
+  font-family: var(--font);
+  font-size: 0.875rem;
+  resize: none;
+  outline: none;
+  transition: border-color 0.15s;
+}
+
+.input-bar textarea:focus {
+  border-color: var(--ring);
+  box-shadow: 0 0 0 2px color-mix(in srgb, var(--ring) 25%, transparent);
+}
+
+.input-bar textarea:disabled {
+  opacity: 0.5;
+}
+
+.input-bar button {
+  padding: 0.5rem 1rem;
+  border: none;
+  border-radius: 8px;
+  background: var(--primary);
+  color: var(--primary-fg);
+  font-family: var(--font);
+  font-size: 0.875rem;
+  font-weight: 500;
+  cursor: pointer;
+  transition: opacity 0.15s;
+  align-self: flex-end;
+}
+
+.input-bar button:hover:not(:disabled) {
+  opacity: 0.9;
+}
+
+.input-bar button:disabled {
+  opacity: 0.4;
+  cursor: not-allowed;
+}
+
+.event-panel {
+  width: 300px;
+  flex-shrink: 0;
+  display: flex;
+  flex-direction: column;
+  border: 1px solid var(--border);
+  border-radius: var(--radius);
+  background: var(--card);
+  overflow: hidden;
+}
+
+.event-header {
+  padding: 0.625rem 0.875rem;
+  border-bottom: 1px solid var(--border);
+  font-size: 0.8rem;
+  font-weight: 600;
+  color: var(--text-muted);
+  text-transform: uppercase;
+  letter-spacing: 0.05em;
+}
+
+.event-list {
+  flex: 1;
+  overflow-y: auto;
+  padding: 0.75rem;
+  display: flex;
+  flex-direction: column;
+  gap: 0.25rem;
+}
+
+.event-empty {
+  text-align: center;
+  padding: 2.5rem 0;
+  font-size: 0.75rem;
+  color: var(--text-faint);
+}
+
+.event-row {
+  font-family: var(--mono);
+  font-size: 0.7rem;
+  line-height: 1.4;
+  display: flex;
+  gap: 0.5rem;
+}
+
+.event-type {
+  flex-shrink: 0;
+  width: 90px;
+  text-align: right;
+  color: var(--text-faint);
+}
+
+.event-detail {
+  color: var(--text-muted);
+  word-break: break-all;
+}
diff --git a/apps/agent-app/src/App.tsx b/apps/agent-app/src/App.tsx
new file mode 100644
index 000000000..1de373c94
--- /dev/null
+++ b/apps/agent-app/src/App.tsx
@@ -0,0 +1,405 @@
+import { TooltipProvider } from "@databricks/appkit-ui/react";
+import { useCallback, useEffect, useRef, useState } from "react";
+import "./App.css";
+import { ThemeSelector } from "./components/theme-selector";
+
+interface SSEEvent {
+  type: string;
+  delta?: string;
+  item_id?: string;
+  item?: {
+    type?: string;
+    id?: string;
+    call_id?: string;
+    name?: string;
+    arguments?: string;
+    output?: string;
+    status?: string;
+  };
+  content?: string;
+  data?: Record<string, unknown>;
+  error?: string;
+  sequence_number?: number;
+  output_index?: number;
+  approval_id?: string;
+  stream_id?: string;
+  tool_name?: string;
+  args?: unknown;
+  annotations?: {
+    readOnly?: boolean;
+    destructive?: boolean;
+    idempotent?: boolean;
+  };
+}
+
+interface ChatMessage {
+  id: number;
+  role: "user" | "assistant";
+  content: string;
+}
+
+/**
+ * A tool call awaiting the user's approve/deny decision, captured from an
+ * `appkit.approval_pending` SSE event.
+ */
+interface PendingApproval {
+  approvalId: string;
+  streamId: string;
+  toolName: string;
+  args: unknown;
+  annotations?: SSEEvent["annotations"];
+}
+
+export default function App() {
+  const [messages, setMessages] = useState<ChatMessage[]>([]);
+  const [events, setEvents] = useState<SSEEvent[]>([]);
+  const [input, setInput] = useState("");
+  const [isLoading, setIsLoading] = useState(false);
+  const [threadId, setThreadId] = useState<string | null>(null);
+  const [pendingApprovals, setPendingApprovals] = useState<PendingApproval[]>(
+    [],
+  );
+  const currentStreamIdRef = useRef<string | null>(null);
+  const messagesEndRef = useRef<HTMLDivElement>(null);
+  const idRef = useRef(0);
+
+  const [toolCount, setToolCount] = useState(0);
+
+  const decideApproval = useCallback(
+    async (approvalId: string, decision: "approve" | "deny") => {
+      const approval = pendingApprovals.find(
+        (a) => a.approvalId === approvalId,
+      );
+      if (!approval) return;
+      try {
+        await fetch("/api/agent/approve", {
+          method: "POST",
+          headers: { "Content-Type": "application/json" },
+          body: JSON.stringify({
+            streamId: approval.streamId,
+            approvalId,
+            decision,
+          }),
+        });
+      } finally {
+        setPendingApprovals((prev) =>
+          prev.filter((a) => a.approvalId !== approvalId),
+        );
+      }
+    },
+    [pendingApprovals],
+  );
+
+  useEffect(() => {
+    const timer = setTimeout(() => {
+      fetch("/api/agent/info")
+        .then((r) => r.json())
+        .then((data) => setToolCount(data.toolCount ?? 0))
+        .catch(() => {});
+    }, 500);
+    return () => clearTimeout(timer);
+  }, []);
+
+  // biome-ignore lint/correctness/useExhaustiveDependencies: scroll on new messages
+  useEffect(() => {
+    messagesEndRef.current?.scrollIntoView({ behavior: "smooth" });
+  }, [messages]);
+
+  const sendMessage = useCallback(async () => {
+    if (!input.trim() || isLoading) return;
+
+    const text = input.trim();
+    setInput("");
+    setMessages((prev) => [
+      ...prev,
+      { id: ++idRef.current, role: "user", content: text },
+    ]);
+    setEvents([]);
+    setIsLoading(true);
+
+    try {
+      const res = await fetch("/api/agent/chat", {
+        method: "POST",
+        headers: { "Content-Type": "application/json" },
+        body: JSON.stringify({
+          message: text,
+          ...(threadId && { threadId }),
+        }),
+      });
+
+      if (!res.ok) {
+        const err = await res.json();
+        setMessages((prev) => [
+          ...prev,
+          {
+            id: ++idRef.current,
+            role: "assistant",
+            content: `Error: ${err.error}`,
+          },
+        ]);
+        return;
+      }
+
+      const reader = res.body?.getReader();
+      if (!reader) return;
+
+      const decoder = new TextDecoder();
+      let content = "";
+      let buffer = "";
+
+      while (true) {
+        const { done, value } = await reader.read();
+        if (done) break;
+        buffer += decoder.decode(value, { stream: true });
+        const lines = buffer.split("\n");
+        buffer = lines.pop() ?? "";
+
+        for (const line of lines) {
+          if (!line.startsWith("data: ")) continue;
+          const data = line.slice(6).trim();
+          if (!data || data === "[DONE]") continue;
+          try {
+            const event: SSEEvent = JSON.parse(data);
+            if (!event.type) continue;
+            setEvents((prev) => [...prev, event]);
+
+            if (event.type === "appkit.metadata" && event.data?.threadId) {
+              setThreadId(event.data.threadId as string);
+              if (typeof event.data.streamId === "string") {
+                currentStreamIdRef.current = event.data.streamId;
+              }
+            }
+            if (
+              event.type === "appkit.approval_pending" &&
+              event.approval_id &&
+              event.stream_id &&
+              event.tool_name
+            ) {
+              currentStreamIdRef.current = event.stream_id;
+              setPendingApprovals((prev) => [
+                ...prev,
+                {
+                  approvalId: event.approval_id as string,
+                  streamId: event.stream_id as string,
+                  toolName: event.tool_name as string,
+                  args: event.args,
+                  annotations: event.annotations,
+                },
+              ]);
+            }
+            if (event.type === "response.output_text.delta" && event.delta) {
+              content += event.delta;
+              setMessages((prev) => {
+                const updated = [...prev];
+                const last = updated[updated.length - 1];
+                if (last?.role === "assistant") {
+                  updated[updated.length - 1] = { ...last, content };
+                } else {
+                  updated.push({
+                    id: ++idRef.current,
+                    role: "assistant",
+                    content,
+                  });
+                }
+                return updated;
+              });
+            }
+          } catch {
+            /* skip */
+          }
+        }
+      }
+    } catch (err) {
+      setMessages((prev) => [
+        ...prev,
+        {
+          id: ++idRef.current,
+          role: "assistant",
+          content: `Error: ${err instanceof Error ? err.message : "Unknown error"}`,
+        },
+      ]);
+    } finally {
+      setIsLoading(false);
+    }
+  }, [input, isLoading, threadId]);
+
+  return (
+    <TooltipProvider>
+      <div className="app">
+        <div className="container">
+          <header className="header">
+            <div>
+              <h1>Agent Chat</h1>
+              <p className="subtitle">
+                AI agent with {toolCount} auto-discovered tools
+                {threadId && (
+                  <span className="thread-id">
+                    {" "}
+                    · Thread {threadId.slice(0, 8)}
+                  </span>
+                )}
+              </p>
+            </div>
+            <ThemeSelector />
+          </header>
+
+          <div className="main-layout">
+            <div className="chat-panel">
+              <div className="messages">
+                {messages.length === 0 && (
+                  <div className="empty-state">
+                    <p className="empty-title">
+                      Send a message to start a conversation
+                    </p>
+                    <p className="empty-sub">
+                      The agent can query data, browse files, and more
+                    </p>
+                  </div>
+                )}
+
+                {messages.map((msg) => (
+                  <div
+                    key={msg.id}
+                    className={`message-row ${msg.role === "user" ? "user" : "assistant"}`}
+                  >
+                    <div className={`bubble ${msg.role}`}>
+                      <p className="whitespace-pre-wrap">{msg.content}</p>
+                    </div>
+                  </div>
+                ))}
+
+                {pendingApprovals.map((approval) => (
+                  <div
+                    key={approval.approvalId}
+                    className="message-row assistant"
+                  >
+                    <div className="bubble assistant approval-card">
+                      <div className="approval-header">
+                        <span className="approval-badge">
+                          Destructive tool — approval required
+                        </span>
+                      </div>
+                      <div className="approval-body">
+                        <strong>{approval.toolName}</strong>
+                        <pre className="approval-args">
+                          {JSON.stringify(approval.args, null, 2)}
+                        </pre>
+                      </div>
+                      <div className="approval-actions">
+                        <button
+                          type="button"
+                          className="approval-deny"
+                          onClick={() =>
+                            decideApproval(approval.approvalId, "deny")
+                          }
+                        >
+                          Deny
+                        </button>
+                        <button
+                          type="button"
+                          className="approval-approve"
+                          onClick={() =>
+                            decideApproval(approval.approvalId, "approve")
+                          }
+                        >
+                          Approve
+                        </button>
+                      </div>
+                    </div>
+                  </div>
+                ))}
+
+                {isLoading &&
+                  pendingApprovals.length === 0 &&
+                  messages[messages.length - 1]?.role === "user" && (
+                    <div className="message-row assistant">
+                      <div className="bubble assistant thinking">
+                        Thinking...
+                      </div>
+                    </div>
+                  )}
+
+                <div ref={messagesEndRef} />
+              </div>
+
+              <form
+                className="input-bar"
+                onSubmit={(e) => {
+                  e.preventDefault();
+                  sendMessage();
+                }}
+              >
+                <textarea
+                  value={input}
+                  onChange={(e) => setInput(e.target.value)}
+                  onKeyDown={(e) => {
+                    if (e.key === "Enter" && !e.shiftKey) {
+                      e.preventDefault();
+                      sendMessage();
+                    }
+                  }}
+                  placeholder="Ask a question..."
+                  disabled={isLoading}
+                  rows={1}
+                />
+                <button type="submit" disabled={isLoading || !input.trim()}>
+                  Send
+                </button>
+              </form>
+            </div>
+
+            <div className="event-panel">
+              <div className="event-header">Event Stream</div>
+              <div className="event-list">
+                {events.length === 0 && (
+                  <p className="event-empty">Events will appear here</p>
+                )}
+                {events.map((event, i) => {
+                  let detail: string;
+                  switch (event.type) {
+                    case "response.output_text.delta":
+                      detail = event.delta?.slice(0, 60) ?? "";
+                      break;
+                    case "response.output_item.added":
+                    case "response.output_item.done":
+                      detail =
+                        event.item?.type === "function_call"
+                          ? `${event.item.name}(${(event.item.arguments ?? "").slice(0, 40)})`
+                          : event.item?.type === "function_call_output"
+                            ? (event.item.output?.slice(0, 60) ?? "")
+                            : (event.item?.status ?? event.item?.type ?? "");
+                      break;
+                    case "response.completed":
+                      detail = "done";
+                      break;
+                    case "error":
+                      detail = event.error ?? "unknown";
+                      break;
+                    case "appkit.metadata":
+                      detail = JSON.stringify(event.data).slice(0, 60);
+                      break;
+                    case "appkit.thinking":
+                      detail = event.content?.slice(0, 60) ?? "";
+                      break;
+                    default:
+                      detail = JSON.stringify(event).slice(0, 60);
+                  }
+                  return (
+                    <div key={`${event.type}-${i}`} className="event-row">
+                      <span className="event-type">
+                        {event.type
+                          .replace("response.", "")
+                          .replace("appkit.", "")}
+                      </span>
+                      <span className="event-detail">{detail}</span>
+                    </div>
+                  );
+                })}
+              </div>
+            </div>
+          </div>
+        </div>
+      </div>
+    </TooltipProvider>
+  );
+}
diff --git a/apps/agent-app/src/components/theme-selector.tsx b/apps/agent-app/src/components/theme-selector.tsx
new file mode 100644
index 000000000..18bb4f142
--- /dev/null
+++ b/apps/agent-app/src/components/theme-selector.tsx
@@ -0,0 +1,135 @@
+import {
+  Button,
+  DropdownMenu,
+  DropdownMenuContent,
+  DropdownMenuItem,
+  DropdownMenuTrigger,
+} from "@databricks/appkit-ui/react";
+import { MonitorIcon, MoonIcon, SunIcon } from "lucide-react";
+import { useEffect, useState } from "react";
+
+type Theme = "light" | "dark" | "system";
+
+const THEME_STORAGE_KEY = "agent-app-theme";
+
+/** Current OS colour scheme; reports "light" when there is no `window`. */
+function getSystemTheme(): "light" | "dark" {
+  if (typeof window === "undefined") return "light";
+  const darkQuery = window.matchMedia("(prefers-color-scheme: dark)");
+  return darkQuery.matches ? "dark" : "light";
+}
+
+/** Saved preference; anything other than "light"/"dark" yields "system". */
+function getStoredTheme(): Theme {
+  const saved = globalThis.localStorage?.getItem(THEME_STORAGE_KEY);
+  return saved === "light" || saved === "dark" ? saved : "system";
+}
+
+/**
+ * Reflects `theme` on the `<html>` element by swapping its "light"/"dark"
+ * class. "system" is resolved through `getSystemTheme()` first. Does nothing
+ * when `window` is undefined.
+ */
+function applyTheme(theme: Theme) {
+  if (typeof window === "undefined") return;
+
+  const resolved = theme === "system" ? getSystemTheme() : theme;
+  const { classList } = document.documentElement;
+  classList.remove("light", "dark");
+  classList.add(resolved);
+}
+
+/** Menu entries in display order, with the icon shown next to each label. */
+const THEME_CHOICES = [
+  { value: "light", label: "Light", Icon: SunIcon },
+  { value: "dark", label: "Dark", Icon: MoonIcon },
+  { value: "system", label: "System", Icon: MonitorIcon },
+] as const;
+
+/**
+ * Dropdown button for choosing the light, dark or system theme.
+ *
+ * The choice lives in component state, is written to localStorage under
+ * `THEME_STORAGE_KEY`, and is applied through `applyTheme`. The OS colour
+ * scheme is followed via `matchMedia` so "system" resolves to a concrete
+ * theme. Until the first effect has run, a plain icon button is rendered.
+ */
+export function ThemeSelector() {
+  const [theme, setTheme] = useState<Theme>(getStoredTheme);
+  const [mounted, setMounted] = useState(false);
+  const [systemTheme, setSystemTheme] = useState(getSystemTheme);
+
+  // Flag the component as mounted and apply the selected theme.
+  useEffect(() => {
+    setMounted(true);
+    applyTheme(theme);
+  }, [theme]);
+
+  // Mirror the OS colour scheme; re-apply only while "system" is selected.
+  useEffect(() => {
+    const query = window.matchMedia("(prefers-color-scheme: dark)");
+    const sync = (source: MediaQueryListEvent | MediaQueryList) => {
+      setSystemTheme(source.matches ? "dark" : "light");
+      if (theme === "system") applyTheme("system");
+    };
+
+    // Pick up the current value before subscribing to changes.
+    sync(query);
+
+    // Fall back to addListener when addEventListener is not available.
+    if (!query.addEventListener) {
+      query.addListener(sync);
+      return () => query.removeListener(sync);
+    }
+    query.addEventListener("change", sync);
+    return () => query.removeEventListener("change", sync);
+  }, [theme]);
+
+  // Store the choice and apply it right away.
+  const handleThemeChange = (next: Theme) => {
+    setTheme(next);
+    localStorage.setItem(THEME_STORAGE_KEY, next);
+    applyTheme(next);
+  };
+
+  // Only the placeholder button is shown until the mount effect has run.
+  if (!mounted) {
+    return (
+      <Button variant="ghost" size="icon" className="h-9 w-9">
+        <SunIcon className="h-4 w-4" />
+      </Button>
+    );
+  }
+
+  // The trigger icon reflects the resolved theme, not the raw selection.
+  const effectiveTheme = theme === "system" ? systemTheme : theme;
+  const TriggerIcon = effectiveTheme === "dark" ? MoonIcon : SunIcon;
+
+  return (
+    <DropdownMenu>
+      <DropdownMenuTrigger asChild>
+        <Button
+          variant="ghost"
+          size="icon"
+          className="h-9 w-9 text-foreground hover:text-secondary-foreground"
+          aria-label="Toggle theme"
+        >
+          <TriggerIcon className="h-4 w-4" />
+        </Button>
+      </DropdownMenuTrigger>
+      <DropdownMenuContent align="end">
+        {THEME_CHOICES.map(({ value, label, Icon }) => (
+          <DropdownMenuItem
+            key={value}
+            onClick={() => handleThemeChange(value)}
+            className="cursor-pointer"
+          >
+            <Icon className="mr-2 h-4 w-4" />
+            <span>{label}</span>
+            {theme === value && <span className="ml-auto text-xs">✓</span>}
+          </DropdownMenuItem>
+        ))}
+      </DropdownMenuContent>
+    </DropdownMenu>
+  );
+}
diff --git a/apps/agent-app/src/index.css b/apps/agent-app/src/index.css
new file mode 100644
index 000000000..5dcc4cf86
--- /dev/null
+++ b/apps/agent-app/src/index.css
@@ -0,0 +1 @@
+@import "@databricks/appkit-ui/styles.css";
diff --git a/apps/agent-app/src/main.tsx b/apps/agent-app/src/main.tsx
new file mode 100644
index 000000000..98b62364b
--- /dev/null
+++ b/apps/agent-app/src/main.tsx
@@ -0,0 +1,15 @@
+import { StrictMode } from "react";
+import { createRoot } from "react-dom/client";
+import App from "./App.tsx";
+import "./index.css";
+
+// Mount <App /> into #root; fail loudly when the page lacks that element.
+const rootElement = document.getElementById("root");
+if (rootElement === null) throw new Error("Root element not found");
+
+const appRoot = createRoot(rootElement);
+appRoot.render(
+  <StrictMode>
+    <App />
+  </StrictMode>,
+);
diff --git a/apps/agent-app/tailwind.config.ts b/apps/agent-app/tailwind.config.ts
new file mode 100644
index 000000000..fad89bf65
--- /dev/null
+++ b/apps/agent-app/tailwind.config.ts
@@ -0,0 +1,11 @@
+import path from "node:path";
+import type { Config } from "tailwindcss";
+
+export default {
+  darkMode: ["class", "media"], // NOTE(review): in Tailwind v3 the 2nd tuple entry is a custom selector, not the media strategy — confirm intent
+  content: [
+    path.resolve(__dirname, "./index.html"),
+    path.resolve(__dirname, "./src/**/*.{js,ts,jsx,tsx}"),
+  ],
+  plugins: [require("tailwindcss-animate")],
+} satisfies Config;
diff --git a/apps/agent-app/tsconfig.app.json b/apps/agent-app/tsconfig.app.json
new file mode 100644
index 000000000..2877c2180
--- /dev/null
+++ b/apps/agent-app/tsconfig.app.json
@@ -0,0 +1,24 @@
+{
+  "compilerOptions": {
+    "tsBuildInfoFile": "./node_modules/.tmp/tsconfig.app.tsbuildinfo",
+    "target": "ES2022",
+    "useDefineForClassFields": true,
+    "lib": ["ES2022", "DOM", "DOM.Iterable"],
+    "module": "ESNext",
+    "types": ["vite/client"],
+    "skipLibCheck": true,
+    "moduleResolution": "bundler",
+    "allowImportingTsExtensions": true,
+    "verbatimModuleSyntax": true,
+    "moduleDetection": "force",
+    "noEmit": true,
+    "jsx": "react-jsx",
+    "strict": true,
+    "noUnusedLocals": true,
+    "noUnusedParameters": true,
+    "erasableSyntaxOnly": true,
+    "noFallthroughCasesInSwitch": true,
+    "noUncheckedSideEffectImports": true
+  },
+  "include": ["src"]
+}
diff --git a/apps/agent-app/tsconfig.json b/apps/agent-app/tsconfig.json
new file mode 100644
index 000000000..1ffef600d
--- /dev/null
+++ b/apps/agent-app/tsconfig.json
@@ -0,0 +1,7 @@
+{
+  "files": [],
+  "references": [
+    { "path": "./tsconfig.app.json" },
+    { "path": "./tsconfig.node.json" }
+  ]
+}
diff --git a/apps/agent-app/tsconfig.node.json b/apps/agent-app/tsconfig.node.json
new file mode 100644
index 000000000..35bcd1182
--- /dev/null
+++ b/apps/agent-app/tsconfig.node.json
@@ -0,0 +1,22 @@
+{
+  "compilerOptions": {
+    "tsBuildInfoFile": "./node_modules/.tmp/tsconfig.node.tsbuildinfo",
+    "target": "ES2023",
+    "lib": ["ES2023"],
+    "module": "ESNext",
+    "types": ["node"],
+    "skipLibCheck": true,
+    "moduleResolution": "bundler",
+    "allowImportingTsExtensions": true,
+    "verbatimModuleSyntax": true,
+    "moduleDetection": "force",
+    "noEmit": true,
+    "strict": true,
+    "noUnusedLocals": true,
+    "noUnusedParameters": true,
+    "erasableSyntaxOnly": true,
+    "noFallthroughCasesInSwitch": true,
+    "noUncheckedSideEffectImports": true
+  },
+  "include": ["vite.config.ts"]
+}
diff --git a/apps/agent-app/vite.config.ts b/apps/agent-app/vite.config.ts
new file mode 100644
index 000000000..bd1cea62c
--- /dev/null
+++ b/apps/agent-app/vite.config.ts
@@ -0,0 +1,31 @@
+import path from "node:path";
+import react from "@vitejs/plugin-react";
+import { defineConfig } from "vite";
+
+export default defineConfig({
+  plugins: [react()],
+  optimizeDeps: {
+    include: [
+      "react",
+      "react-dom",
+      "react/jsx-dev-runtime",
+      "react/jsx-runtime",
+    ],
+    exclude: ["@databricks/appkit-ui", "@databricks/appkit"], // not pre-bundled
+  },
+  server: {
+    hmr: {
+      port: 24679, // fixed port for the HMR websocket
+    },
+  },
+  resolve: {
+    dedupe: ["react", "react-dom"], // resolve a single copy of React
+    preserveSymlinks: true,
+    alias: {
+      "@databricks/appkit-ui": path.resolve( // point at the local build output
+        __dirname,
+        "../../packages/appkit-ui/dist",
+      ),
+    },
+  },
+});
diff --git a/apps/dev-playground/client/src/routeTree.gen.ts b/apps/dev-playground/client/src/routeTree.gen.ts
index 45e280700..378a77ea6 100644
--- a/apps/dev-playground/client/src/routeTree.gen.ts
+++ b/apps/dev-playground/client/src/routeTree.gen.ts
@@ -24,6 +24,7 @@ import { Route as DataVisualizationRouteRouteImport } from './routes/data-visual
 import { Route as ChartInferenceRouteRouteImport } from './routes/chart-inference.route'
 import { Route as ArrowAnalyticsRouteRouteImport } from './routes/arrow-analytics.route'
 import { Route as AnalyticsRouteRouteImport } from './routes/analytics.route'
+import { Route as AgentRouteRouteImport } from './routes/agent.route'
 import { Route as IndexRouteImport } from './routes/index'
 
 const VectorSearchRouteRoute = VectorSearchRouteRouteImport.update({
@@ -101,6 +102,11 @@ const AnalyticsRouteRoute = AnalyticsRouteRouteImport.update({
   path: '/analytics',
   getParentRoute: () => rootRouteImport,
 } as any)
+const AgentRouteRoute = AgentRouteRouteImport.update({
+  id: '/agent',
+  path: '/agent',
+  getParentRoute: () => rootRouteImport,
+} as any)
 const IndexRoute = IndexRouteImport.update({
   id: '/',
   path: '/',
@@ -109,6 +115,7 @@ const IndexRoute = IndexRouteImport.update({
 
 export interface FileRoutesByFullPath {
   '/': typeof IndexRoute
+  '/agent': typeof AgentRouteRoute
   '/analytics': typeof AnalyticsRouteRoute
   '/arrow-analytics': typeof ArrowAnalyticsRouteRoute
   '/chart-inference': typeof ChartInferenceRouteRoute
@@ -127,6 +134,7 @@ export interface FileRoutesByFullPath {
 }
 export interface FileRoutesByTo {
   '/': typeof IndexRoute
+  '/agent': typeof AgentRouteRoute
   '/analytics': typeof AnalyticsRouteRoute
   '/arrow-analytics': typeof ArrowAnalyticsRouteRoute
   '/chart-inference': typeof ChartInferenceRouteRoute
@@ -146,6 +154,7 @@ export interface FileRoutesByTo {
 export interface FileRoutesById {
   __root__: typeof rootRouteImport
   '/': typeof IndexRoute
+  '/agent': typeof AgentRouteRoute
   '/analytics': typeof AnalyticsRouteRoute
   '/arrow-analytics': typeof ArrowAnalyticsRouteRoute
   '/chart-inference': typeof ChartInferenceRouteRoute
@@ -166,6 +175,7 @@ export interface FileRouteTypes {
   fileRoutesByFullPath: FileRoutesByFullPath
   fullPaths:
     | '/'
+    | '/agent'
     | '/analytics'
     | '/arrow-analytics'
     | '/chart-inference'
@@ -184,6 +194,7 @@ export interface FileRouteTypes {
   fileRoutesByTo: FileRoutesByTo
   to:
     | '/'
+    | '/agent'
     | '/analytics'
     | '/arrow-analytics'
     | '/chart-inference'
@@ -202,6 +213,7 @@ export interface FileRouteTypes {
   id:
     | '__root__'
     | '/'
+    | '/agent'
     | '/analytics'
     | '/arrow-analytics'
     | '/chart-inference'
@@ -221,6 +233,7 @@ export interface FileRouteTypes {
 }
 export interface RootRouteChildren {
   IndexRoute: typeof IndexRoute
+  AgentRouteRoute: typeof AgentRouteRoute
   AnalyticsRouteRoute: typeof AnalyticsRouteRoute
   ArrowAnalyticsRouteRoute: typeof ArrowAnalyticsRouteRoute
   ChartInferenceRouteRoute: typeof ChartInferenceRouteRoute
@@ -345,6 +358,13 @@ declare module '@tanstack/react-router' {
       preLoaderRoute: typeof AnalyticsRouteRouteImport
       parentRoute: typeof rootRouteImport
     }
+    '/agent': {
+      id: '/agent'
+      path: '/agent'
+      fullPath: '/agent'
+      preLoaderRoute: typeof AgentRouteRouteImport
+      parentRoute: typeof rootRouteImport
+    }
     '/': {
       id: '/'
       path: '/'
@@ -357,6 +377,7 @@ declare module '@tanstack/react-router' {
 
 const rootRouteChildren: RootRouteChildren = {
   IndexRoute: IndexRoute,
+  AgentRouteRoute: AgentRouteRoute,
   AnalyticsRouteRoute: AnalyticsRouteRoute,
   ArrowAnalyticsRouteRoute: ArrowAnalyticsRouteRoute,
   ChartInferenceRouteRoute: ChartInferenceRouteRoute,
diff --git a/apps/dev-playground/client/src/routes/__root.tsx b/apps/dev-playground/client/src/routes/__root.tsx
index db42fdafb..6ce0c0756 100644
--- a/apps/dev-playground/client/src/routes/__root.tsx
+++ b/apps/dev-playground/client/src/routes/__root.tsx
@@ -136,6 +136,14 @@ function RootComponent() {
                     Vector Search
                   </Button>
                 </Link>
+                <Link to="/agent" className="no-underline">
+                  <Button
+                    variant="ghost"
+                    className="text-foreground hover:text-secondary-foreground"
+                  >
+                    Agent
+                  </Button>
+                </Link>
                 <ThemeSelector />
               </div>
             </nav>
diff --git a/apps/dev-playground/client/src/routes/agent.route.tsx b/apps/dev-playground/client/src/routes/agent.route.tsx
new file mode 100644
index 000000000..d1d1d1008
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/agent.route.tsx
@@ -0,0 +1,567 @@
+import { getPluginClientConfig } from "@databricks/appkit-ui/js";
+import { Button } from "@databricks/appkit-ui/react";
+import { createFileRoute } from "@tanstack/react-router";
+import { useCallback, useEffect, useRef, useState } from "react";
+
+export const Route = createFileRoute("/agent")({
+  component: AgentRoute,
+});
+
+interface SSEEvent { // one parsed "data:" payload from the /api/agent/chat stream
+  type: string; // event name, e.g. "response.output_text.delta"
+  delta?: string; // text fragment read from "response.output_text.delta" events
+  item_id?: string;
+  item?: {
+    type?: string; // "function_call" / "function_call_output" get a custom summary
+    id?: string;
+    call_id?: string;
+    name?: string;
+    arguments?: string;
+    output?: string;
+    status?: string;
+  };
+  content?: string; // shown for "appkit.thinking" events
+  data?: Record<string, unknown>; // "appkit.metadata" payload; may hold threadId
+  error?: string; // shown for "error" events
+  sequence_number?: number;
+  output_index?: number;
+  approval_id?: string; // read from "appkit.approval_pending" events
+  stream_id?: string; // posted back together with the approval decision
+  tool_name?: string;
+  args?: unknown;
+  annotations?: {
+    readOnly?: boolean;
+    destructive?: boolean;
+    idempotent?: boolean;
+  };
+}
+
+interface ChatMessage { // one rendered chat bubble
+  id: number; // taken from msgIdCounter; used as the React key
+  role: "user" | "assistant";
+  content: string;
+}
+
+interface PendingApproval { // built from an "appkit.approval_pending" event
+  approvalId: string;
+  streamId: string; // sent back to /api/agent/approve with the decision
+  toolName: string;
+  args: unknown; // rendered as pretty-printed JSON in the approval card
+}
+
+/**
+ * Debounced inline-completion hook backed by the "autocomplete" agent.
+ *
+ * `requestSuggestion(text)` resets the suggestion and cancels any pending
+ * timer or in-flight request. If `enabled` and `text` has 3+ characters (not
+ * all whitespace), it POSTs to /api/agent/chat after 500 ms and streams text
+ * deltas into `suggestion`. `clear()` only resets and cancels.
+ */
+function useAutocomplete(enabled: boolean) {
+  const [suggestion, setSuggestion] = useState("");
+  const [isLoading, setIsLoading] = useState(false);
+  const abortRef = useRef<AbortController | null>(null);
+  const timerRef = useRef<ReturnType<typeof setTimeout> | null>(null);
+
+  const requestSuggestion = useCallback(
+    (text: string) => {
+      setSuggestion("");
+      if (timerRef.current) clearTimeout(timerRef.current);
+      abortRef.current?.abort();
+      if (!enabled || text.length < 3 || !text.trim()) return;
+
+      // Debounce: the request only starts after 500 ms without another call.
+      timerRef.current = setTimeout(async () => {
+        const controller = new AbortController();
+        abortRef.current = controller;
+        setIsLoading(true);
+
+        try {
+          const response = await fetch("/api/agent/chat", {
+            method: "POST",
+            headers: { "Content-Type": "application/json" },
+            body: JSON.stringify({ message: text, agent: "autocomplete" }),
+            signal: controller.signal,
+          });
+          if (!response.ok || !response.body) return;
+
+          const reader = response.body.getReader();
+          const decoder = new TextDecoder();
+          let accumulated = "";
+          let pending = "";
+
+          for (;;) {
+            const chunk = await reader.read();
+            if (chunk.done) break;
+
+            // Keep the trailing partial line buffered for the next chunk.
+            pending += decoder.decode(chunk.value, { stream: true });
+            const lines = pending.split("\n");
+            pending = lines.pop() ?? "";
+
+            for (const line of lines) {
+              if (!line.startsWith("data: ")) continue;
+              const payload = line.slice(6).trim();
+              if (!payload || payload === "[DONE]") continue;
+              try {
+                const event = JSON.parse(payload);
+                const isDelta = event.type === "response.output_text.delta";
+                if (isDelta && event.delta) {
+                  accumulated += event.delta;
+                  setSuggestion(accumulated);
+                }
+              } catch {
+                /* skip */
+              }
+            }
+          }
+        } catch {
+          /* aborted or failed */
+        } finally {
+          setIsLoading(false);
+        }
+      }, 500);
+    },
+    [enabled],
+  );
+
+  const clear = useCallback(() => {
+    setSuggestion("");
+    if (timerRef.current) clearTimeout(timerRef.current);
+    abortRef.current?.abort();
+  }, []);
+
+  // Report loading only until the first delta has produced a suggestion.
+  const stillWaiting = isLoading && !suggestion;
+  return { suggestion, isLoading: stillWaiting, requestSuggestion, clear };
+}
+
+function AgentRoute() {
+  const [messages, setMessages] = useState<ChatMessage[]>([]);
+  const [events, setEvents] = useState<SSEEvent[]>([]); // event-panel log
+  const [input, setInput] = useState("");
+  const [isLoading, setIsLoading] = useState(false); // a chat request is open
+  const [threadId, setThreadId] = useState<string | null>(null);
+  const [pendingApprovals, setPendingApprovals] = useState<PendingApproval[]>(
+    [],
+  );
+
+  /**
+   * POSTs the user's decision for a pending tool call to /api/agent/approve.
+   * The approval card is removed once the request settles, whether or not it
+   * succeeded; unknown approval ids are ignored.
+   */
+  const decideApproval = useCallback(
+    async (approvalId: string, decision: "approve" | "deny") => {
+      const target = pendingApprovals.find((a) => a.approvalId === approvalId);
+      if (!target) return;
+      const payload = { streamId: target.streamId, approvalId, decision };
+      try {
+        await fetch("/api/agent/approve", {
+          method: "POST",
+          headers: { "Content-Type": "application/json" },
+          body: JSON.stringify(payload),
+        });
+      } finally {
+        setPendingApprovals((prev) =>
+          prev.filter((a) => a.approvalId !== approvalId),
+        );
+      }
+    },
+    [pendingApprovals],
+  );
+  const messagesEndRef = useRef<HTMLDivElement>(null);
+  const inputRef = useRef<HTMLTextAreaElement>(null);
+  const msgIdCounter = useRef(0);
+
+  const agentConfig = getPluginClientConfig<{
+    agents?: string[];
+    defaultAgent?: string;
+  }>("agent");
+  const hasAutocomplete = (agentConfig.agents ?? []).includes("autocomplete");
+
+  const {
+    suggestion,
+    isLoading: isAutocompleting,
+    requestSuggestion,
+    clear: clearSuggestion,
+  } = useAutocomplete(hasAutocomplete);
+
+  // biome-ignore lint/correctness/useExhaustiveDependencies: scroll on new messages
+  useEffect(() => {
+    messagesEndRef.current?.scrollIntoView({ behavior: "smooth" });
+  }, [messages]);
+
+  /**
+   * Sends the current input to /api/agent/chat and consumes the SSE reply.
+   *
+   * Every parsed event is appended to `events`. Text deltas grow this turn's
+   * assistant message, `appkit.metadata` may carry the thread id, and
+   * `appkit.approval_pending` queues an approval card. Failures are rendered
+   * as an assistant message prefixed with "Error: ".
+   */
+  const sendMessage = useCallback(async () => {
+    const userMessage = input.trim();
+    if (!userMessage || isLoading) return;
+
+    // Ids are allocated outside the state updaters so the updaters stay pure
+    // (React may invoke them twice in StrictMode).
+    const pushMessage = (role: ChatMessage["role"], content: string) => {
+      const id = ++msgIdCounter.current;
+      setMessages((prev) => [...prev, { id, role, content }]);
+    };
+
+    clearSuggestion();
+    setInput("");
+    pushMessage("user", userMessage);
+    setEvents([]);
+    setIsLoading(true);
+
+    try {
+      const response = await fetch("/api/agent/chat", {
+        method: "POST",
+        headers: { "Content-Type": "application/json" },
+        body: JSON.stringify({
+          message: userMessage,
+          ...(threadId && { threadId }),
+        }),
+      });
+
+      if (!response.ok) {
+        // Error bodies are not guaranteed to be JSON; fall back to the status.
+        const body = await response.json().catch(() => null);
+        const reason = body?.error ?? `HTTP ${response.status}`;
+        pushMessage("assistant", `Error: ${reason}`);
+        return;
+      }
+
+      const reader = response.body?.getReader();
+      if (!reader) return;
+
+      const decoder = new TextDecoder();
+      let assistantId: number | null = null;
+      let assistantContent = "";
+      let buffer = "";
+
+      while (true) {
+        const { done, value } = await reader.read();
+        if (done) break;
+
+        // Hold back the trailing partial line until the next chunk arrives.
+        buffer += decoder.decode(value, { stream: true });
+        const lines = buffer.split("\n");
+        buffer = lines.pop() ?? "";
+
+        for (const line of lines) {
+          if (!line.startsWith("data: ")) continue;
+          const data = line.slice(6).trim();
+          if (!data || data === "[DONE]") continue;
+
+          let event: SSEEvent;
+          try {
+            event = JSON.parse(data);
+          } catch {
+            continue; // skip malformed events
+          }
+          if (!event?.type) continue;
+          setEvents((prev) => [...prev, event]);
+
+          const { approval_id, stream_id, tool_name } = event;
+          if (
+            event.type === "appkit.approval_pending" &&
+            approval_id &&
+            stream_id &&
+            tool_name
+          ) {
+            const approval: PendingApproval = {
+              approvalId: approval_id,
+              streamId: stream_id,
+              toolName: tool_name,
+              args: event.args,
+            };
+            setPendingApprovals((prev) => [...prev, approval]);
+          }
+
+          const nextThreadId = event.data?.threadId;
+          if (
+            event.type === "appkit.metadata" &&
+            typeof nextThreadId === "string" &&
+            nextThreadId
+          ) {
+            setThreadId(nextThreadId);
+          }
+
+          // First delta creates this turn's assistant message; later ones update it.
+          if (event.type === "response.output_text.delta" && event.delta) {
+            assistantContent += event.delta;
+            const id = (assistantId ??= ++msgIdCounter.current);
+            const content = assistantContent;
+            setMessages((prev) =>
+              prev.some((m) => m.id === id)
+                ? prev.map((m) => (m.id === id ? { ...m, content } : m))
+                : [...prev, { id, role: "assistant", content }],
+            );
+          }
+        }
+      }
+    } catch (err) {
+      const reason = err instanceof Error ? err.message : "Unknown error";
+      pushMessage("assistant", `Error: ${reason}`);
+    } finally {
+      setIsLoading(false);
+    }
+  }, [input, isLoading, threadId, clearSuggestion]);
+
+  const handleInputChange = (value: string) => {
+    setInput(value);
+    requestSuggestion(value);
+  };
+
+  const acceptSuggestion = () => {
+    if (!suggestion) return;
+    const newValue = input + suggestion;
+    setInput(newValue);
+    clearSuggestion();
+    inputRef.current?.focus();
+  };
+
+  return (
+    <div className="min-h-screen bg-background">
+      <div className="max-w-7xl mx-auto px-6 py-12">
+        <div className="mb-8 flex items-end justify-between">
+          <div>
+            <h1 className="text-3xl font-bold mb-2">Agent Chat</h1>
+            <p className="text-base text-muted-foreground">
+              AI agent with auto-discovered tools from all AppKit plugins.
+              {threadId && (
+                <span className="ml-2 text-xs font-mono opacity-60">
+                  Thread: {threadId.slice(0, 8)}...
+                </span>
+              )}
+            </p>
+          </div>
+          {hasAutocomplete && (
+            <span className="text-xs text-muted-foreground bg-muted px-2 py-1 rounded">
+              Autocomplete enabled
+            </span>
+          )}
+        </div>
+
+        <div className="flex gap-6 h-[700px]">
+          <div className="flex-1 flex flex-col border rounded-lg bg-card min-w-0">
+            <div className="flex-1 overflow-y-auto p-4 space-y-4">
+              {messages.length === 0 && (
+                <div className="text-center text-muted-foreground py-20">
+                  <p className="text-lg">
+                    Send a message to start a conversation
+                  </p>
+                  <p className="text-sm mt-2">
+                    The agent can use analytics, files, genie, and lakebase
+                    tools.
+                    {hasAutocomplete && " Start typing for inline suggestions."}
+                  </p>
+                </div>
+              )}
+
+              {messages.map((msg) => (
+                <div
+                  key={msg.id}
+                  className={`flex ${msg.role === "user" ? "justify-end" : "justify-start"}`}
+                >
+                  <div
+                    className={`max-w-[85%] rounded-lg px-4 py-2 ${
+                      msg.role === "user"
+                        ? "bg-primary text-primary-foreground"
+                        : "bg-muted"
+                    }`}
+                  >
+                    <p className="whitespace-pre-wrap text-sm">{msg.content}</p>
+                  </div>
+                </div>
+              ))}
+
+              {pendingApprovals.map((approval) => (
+                <div key={approval.approvalId} className="flex justify-start">
+                  <div className="max-w-[80%] rounded-lg border border-orange-500/60 bg-orange-500/10 px-4 py-3">
+                    <div className="mb-2 flex items-center gap-2">
+                      <span className="rounded bg-orange-600 px-2 py-0.5 text-xs font-semibold uppercase tracking-wide text-white">
+                        Destructive tool — approval required
+                      </span>
+                    </div>
+                    <div className="text-sm">
+                      <strong>{approval.toolName}</strong>
+                      <pre className="mt-1 max-h-52 overflow-auto whitespace-pre-wrap break-words rounded bg-background p-2 text-xs">
+                        {JSON.stringify(approval.args, null, 2)}
+                      </pre>
+                    </div>
+                    <div className="mt-3 flex justify-end gap-2">
+                      <Button
+                        type="button"
+                        variant="outline"
+                        size="sm"
+                        onClick={() =>
+                          decideApproval(approval.approvalId, "deny")
+                        }
+                      >
+                        Deny
+                      </Button>
+                      <Button
+                        type="button"
+                        size="sm"
+                        onClick={() =>
+                          decideApproval(approval.approvalId, "approve")
+                        }
+                      >
+                        Approve
+                      </Button>
+                    </div>
+                  </div>
+                </div>
+              ))}
+
+              {isLoading &&
+                pendingApprovals.length === 0 &&
+                messages[messages.length - 1]?.role === "user" && (
+                  <div className="flex justify-start">
+                    <div className="bg-muted rounded-lg px-4 py-2">
+                      <p className="text-sm text-muted-foreground animate-pulse">
+                        Thinking...
+                      </p>
+                    </div>
+                  </div>
+                )}
+
+              <div ref={messagesEndRef} />
+            </div>
+
+            <div className="border-t p-4">
+              {hasAutocomplete && (suggestion || isAutocompleting) && (
+                <div className="flex items-center gap-2 mb-2 text-xs text-muted-foreground">
+                  {isAutocompleting && (
+                    <span className="animate-pulse">Thinking...</span>
+                  )}
+                  {suggestion && (
+                    <span>
+                      Press{" "}
+                      <kbd className="px-1.5 py-0.5 rounded bg-muted border text-[10px] font-mono">
+                        Tab
+                      </kbd>{" "}
+                      to accept suggestion
+                    </span>
+                  )}
+                </div>
+              )}
+              <form
+                onSubmit={(e) => {
+                  e.preventDefault();
+                  sendMessage();
+                }}
+                className="flex gap-2"
+              >
+                <div className="flex-1 relative">
+                  <div
+                    aria-hidden
+                    className="absolute inset-0 px-3 py-2 text-sm pointer-events-none whitespace-pre-wrap break-words overflow-hidden"
+                  >
+                    <span className="invisible">{input}</span>
+                    <span className="text-muted-foreground/40">
+                      {suggestion}
+                    </span>
+                  </div>
+                  <textarea
+                    ref={inputRef}
+                    value={input}
+                    onChange={(e) => handleInputChange(e.target.value)}
+                    onKeyDown={(e) => {
+                      if (e.key === "Tab" && suggestion) {
+                        e.preventDefault();
+                        acceptSuggestion();
+                      }
+                      if (e.key === "Escape" && suggestion) {
+                        clearSuggestion();
+                      }
+                      if (e.key === "Enter" && !e.shiftKey && !suggestion) {
+                        e.preventDefault();
+                        sendMessage();
+                      }
+                    }}
+                    placeholder="Ask a question..."
+                    disabled={isLoading}
+                    rows={1}
+                    className="w-full rounded-md border border-input bg-transparent px-3 py-2 text-sm ring-offset-background placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring disabled:opacity-50 resize-none"
+                  />
+                </div>
+                <Button
+                  type="submit"
+                  disabled={isLoading || !input.trim()}
+                  className="self-end"
+                >
+                  Send
+                </Button>
+              </form>
+            </div>
+          </div>
+
+          <div className="w-80 shrink-0 flex flex-col border rounded-lg bg-card">
+            <div className="px-3 py-2 border-b">
+              <h3 className="text-sm font-semibold text-muted-foreground">
+                Event Stream
+              </h3>
+            </div>
+            <div className="flex-1 overflow-y-auto p-3 space-y-1">
+              {events.length === 0 && (
+                <p className="text-xs text-muted-foreground/50 text-center py-8">
+                  Events will appear here
+                </p>
+              )}
+              {events.map((event, i) => {
+                // Short, truncated description shown next to the event type.
+                const summarize = (): string => {
+                  switch (event.type) {
+                    case "response.output_text.delta":
+                      return event.delta?.slice(0, 60) ?? "";
+                    case "response.output_item.added":
+                    case "response.output_item.done": {
+                      const item = event.item;
+                      if (item?.type === "function_call") {
+                        return `${item.name}(${(item.arguments ?? "").slice(0, 40)})`;
+                      }
+                      if (item?.type === "function_call_output") {
+                        return item.output?.slice(0, 60) ?? "";
+                      }
+                      return item?.status ?? item?.type ?? "";
+                    }
+                    case "response.completed":
+                      return "done";
+                    case "error":
+                      return event.error ?? "unknown";
+                    case "appkit.metadata":
+                      // JSON.stringify(undefined) is undefined; guard it.
+                      return (JSON.stringify(event.data) ?? "").slice(0, 60);
+                    case "appkit.thinking":
+                      return event.content?.slice(0, 60) ?? "";
+                    default:
+                      return JSON.stringify(event).slice(0, 60);
+                  }
+                };
+                return (
+                  <div
+                    key={`${event.type}-${i}`}
+                    className="font-mono text-xs text-muted-foreground"
+                  >
+                    <span className="inline-block w-24 text-right mr-2 opacity-50">
+                      {event.type
+                        .replace("response.", "")
+                        .replace("appkit.", "")}
+                    </span>
+                    <span className="opacity-80 break-all">{summarize()}</span>
+                  </div>
+                );
+              })}
+            </div>
+          </div>
+        </div>
+      </div>
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/index.tsx b/apps/dev-playground/client/src/routes/index.tsx
index ec2d9a50a..896a6e9d8 100644
--- a/apps/dev-playground/client/src/routes/index.tsx
+++ b/apps/dev-playground/client/src/routes/index.tsx
@@ -222,35 +222,18 @@ function IndexRoute() {
           <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
             <div className="flex flex-col h-full">
               <h3 className="text-2xl font-semibold text-foreground mb-3">
-                Lakeflow Jobs
+                Custom Agent
               </h3>
               <p className="text-muted-foreground mb-6 flex-grow">
-                Trigger and monitor Databricks Lakeflow Jobs. View run history,
-                stream live status updates, and cancel in-flight runs.
+                AI agent powered by Databricks Model Serving with
+                auto-discovered tools from all AppKit plugins. Chat with your
+                data using natural language.
               </p>
               <Button
-                onClick={() => navigate({ to: "/jobs" })}
+                onClick={() => navigate({ to: "/agent" })}
                 className="w-full"
               >
-                Manage Jobs
-              </Button>
-            </div>
-          </Card>
-
-          <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
-            <div className="flex flex-col h-full">
-              <h3 className="text-2xl font-semibold text-foreground mb-3">
-                Model Serving
-              </h3>
-              <p className="text-muted-foreground mb-6 flex-grow">
-                Chat with a Databricks Model Serving endpoint using streaming
-                completions with real-time SSE responses.
-              </p>
-              <Button
-                onClick={() => navigate({ to: "/serving" })}
-                className="w-full"
-              >
-                Try Model Serving
+                Chat with Agent
               </Button>
             </div>
           </Card>
diff --git a/apps/dev-playground/config/agents/assistant.md b/apps/dev-playground/config/agents/assistant.md
new file mode 100644
index 000000000..ea99d47bb
--- /dev/null
+++ b/apps/dev-playground/config/agents/assistant.md
@@ -0,0 +1,6 @@
+---
+endpoint: databricks-claude-sonnet-4-5
+default: true
+---
+
+You are a helpful data assistant. Use the available tools to query data and help users with their analysis.
diff --git a/apps/dev-playground/config/agents/autocomplete.md b/apps/dev-playground/config/agents/autocomplete.md
new file mode 100644
index 000000000..0b8270f07
--- /dev/null
+++ b/apps/dev-playground/config/agents/autocomplete.md
@@ -0,0 +1,7 @@
+---
+endpoint: databricks-gemini-3-1-flash-lite
+maxSteps: 1
+ephemeral: true
+---
+
+You are an autocomplete engine. The user will give you the beginning of a sentence or paragraph. Continue the text naturally, as if you are the same author. Do NOT repeat the input. Only output the continuation. Do NOT use tools. Do NOT explain. Just write the next words.
diff --git a/apps/dev-playground/server/index.ts b/apps/dev-playground/server/index.ts
index 91179dacd..cfd6c9eae 100644
--- a/apps/dev-playground/server/index.ts
+++ b/apps/dev-playground/server/index.ts
@@ -1,19 +1,22 @@
 import "reflect-metadata";
 import {
+  agents,
   analytics,
+  createAgent,
   createApp,
   type FilePolicy,
   files,
+  fromPlugin,
   genie,
   jobs,
   PolicyDeniedError,
   server,
   serving,
+  tool,
   WRITE_ACTIONS,
 } from "@databricks/appkit";
 import { WorkspaceClient } from "@databricks/sdk-experimental";
-// TODO: re-enable once vector-search is exported from @databricks/appkit
-// import { vectorSearch } from "@databricks/appkit";
+import { z } from "zod";
 import { lakebaseExamples } from "./lakebase-examples-plugin";
 import { reconnect } from "./reconnect-plugin";
 import { telemetryExamples } from "./telemetry-example-plugin";
@@ -49,6 +52,23 @@ const adminOnly: FilePolicy = (action, _resource, user) => {
   return true;
 };
 
+// Code-defined demo agent (complements the markdown agents in config/agents/):
+// analytics plugin tools via fromPlugin() plus a canned inline get_weather tool.
+const helper = createAgent({
+  instructions:
+    "You are a demo helper. Use analytics tools to answer data questions, " +
+    "or get_weather for light small-talk.",
+  tools: {
+    ...fromPlugin(analytics),
+    get_weather: tool({
+      name: "get_weather",
+      description: "Get the current weather for a city",
+      schema: z.object({ city: z.string().describe("City name") }),
+      execute: async ({ city }) => `The weather in ${city} is sunny, 22°C`,
+    }),
+  },
+});
+
 createApp({
   plugins: [
     server(),
@@ -84,6 +104,7 @@ createApp({
     }),
     jobs(),
     serving(),
+    agents({ agents: { helper } }),
     // TODO: re-enable once vector-search is exported from @databricks/appkit
     // vectorSearch({
     //   indexes: {
diff --git a/docs/docs/api/appkit/Function.createAgent.md b/docs/docs/api/appkit/Function.createAgent.md
new file mode 100644
index 000000000..61064e512
--- /dev/null
+++ b/docs/docs/api/appkit/Function.createAgent.md
@@ -0,0 +1,35 @@
+# Function: createAgent()
+
+```ts
+function createAgent(def: AgentDefinition): AgentDefinition;
+```
+
+Pure factory for agent definitions. Returns the passed-in definition after
+cycle-detecting the sub-agent graph. Accepts the full `AgentDefinition` shape
+and is safe to call at module top-level.
+
+The returned value is a plain `AgentDefinition` — no adapter construction,
+no side effects. Register it with `agents({ agents: { name: def } })` or run
+it standalone via `runAgent(def, input)`.
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `def` | [`AgentDefinition`](Interface.AgentDefinition.md) |
+
+## Returns
+
+[`AgentDefinition`](Interface.AgentDefinition.md)
+
+## Example
+
+```ts
+const support = createAgent({
+  instructions: "You help customers.",
+  model: "databricks-claude-sonnet-4-5",
+  tools: {
+    get_weather: tool({ ... }),
+  },
+});
+```
diff --git a/docs/docs/api/appkit/Function.fromPlugin.md b/docs/docs/api/appkit/Function.fromPlugin.md
new file mode 100644
index 000000000..5262ef541
--- /dev/null
+++ b/docs/docs/api/appkit/Function.fromPlugin.md
@@ -0,0 +1,50 @@
+# Function: fromPlugin()
+
+```ts
+function fromPlugin<F>(factory: F, opts?: ToolkitOptions): FromPluginSpread;
+```
+
+Reference a plugin's tools inside an `AgentDefinition.tools` record without
+naming the plugin instance. The returned spread-friendly object carries a
+symbol-keyed marker that the agents plugin resolves against registered
+`ToolProvider`s at setup time.
+
+The factory argument must come from `toPlugin` (or any function that
+carries a `pluginName` field). `fromPlugin` reads `factory.pluginName`
+synchronously — it does not construct an instance.
+
+If the referenced plugin is also registered in `createApp({ plugins })`, the
+same runtime instance is used for dispatch. If the plugin is missing,
+`AgentsPlugin.setup()` throws with a clear `Available: …` listing.
+
+## Type Parameters
+
+| Type Parameter |
+| ------ |
+| `F` *extends* `NamedPluginFactory` |
+
+## Parameters
+
+| Parameter | Type | Description |
+| ------ | ------ | ------ |
+| `factory` | `F` | A plugin factory produced by `toPlugin`. Must expose a `pluginName` field. |
+| `opts?` | [`ToolkitOptions`](Interface.ToolkitOptions.md) | Optional toolkit scoping — `prefix`, `only`, `except`, `rename`. Same shape as the `.toolkit()` method. |
+
+## Returns
+
+`FromPluginSpread`
+
+## Example
+
+```ts
+import { analytics, createAgent, files, fromPlugin, tool } from "@databricks/appkit";
+
+const support = createAgent({
+  instructions: "You help customers.",
+  tools: {
+    ...fromPlugin(analytics),
+    ...fromPlugin(files, { only: ["uploads.read"] }),
+    get_weather: tool({ ... }),
+  },
+});
+```
diff --git a/docs/docs/api/appkit/Function.isFromPluginMarker.md b/docs/docs/api/appkit/Function.isFromPluginMarker.md
new file mode 100644
index 000000000..2ba9c752f
--- /dev/null
+++ b/docs/docs/api/appkit/Function.isFromPluginMarker.md
@@ -0,0 +1,17 @@
+# Function: isFromPluginMarker()
+
+```ts
+function isFromPluginMarker(value: unknown): value is FromPluginMarker;
+```
+
+Type guard for [FromPluginMarker](Interface.FromPluginMarker.md).
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `value` | `unknown` |
+
+## Returns
+
+`value is FromPluginMarker`
diff --git a/docs/docs/api/appkit/Function.isFunctionTool.md b/docs/docs/api/appkit/Function.isFunctionTool.md
new file mode 100644
index 000000000..ebd84ee4f
--- /dev/null
+++ b/docs/docs/api/appkit/Function.isFunctionTool.md
@@ -0,0 +1,15 @@
+# Function: isFunctionTool()
+
+```ts
+function isFunctionTool(value: unknown): value is FunctionTool;
+```
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `value` | `unknown` |
+
+## Returns
+
+`value is FunctionTool`
diff --git a/docs/docs/api/appkit/Function.isHostedTool.md b/docs/docs/api/appkit/Function.isHostedTool.md
new file mode 100644
index 000000000..73be7e16b
--- /dev/null
+++ b/docs/docs/api/appkit/Function.isHostedTool.md
@@ -0,0 +1,15 @@
+# Function: isHostedTool()
+
+```ts
+function isHostedTool(value: unknown): value is HostedTool;
+```
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `value` | `unknown` |
+
+## Returns
+
+`value is HostedTool`
diff --git a/docs/docs/api/appkit/Function.isToolkitEntry.md b/docs/docs/api/appkit/Function.isToolkitEntry.md
new file mode 100644
index 000000000..892907a41
--- /dev/null
+++ b/docs/docs/api/appkit/Function.isToolkitEntry.md
@@ -0,0 +1,18 @@
+# Function: isToolkitEntry()
+
+```ts
+function isToolkitEntry(value: unknown): value is ToolkitEntry;
+```
+
+Type guard for `ToolkitEntry` — used by the agents plugin to differentiate
+toolkit references from inline tools in a mixed `tools` record.
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `value` | `unknown` |
+
+## Returns
+
+`value is ToolkitEntry`
diff --git a/docs/docs/api/appkit/Function.loadAgentFromFile.md b/docs/docs/api/appkit/Function.loadAgentFromFile.md
new file mode 100644
index 000000000..55c2cd342
--- /dev/null
+++ b/docs/docs/api/appkit/Function.loadAgentFromFile.md
@@ -0,0 +1,23 @@
+# Function: loadAgentFromFile()
+
+```ts
+function loadAgentFromFile(filePath: string, ctx: LoadContext): Promise<AgentDefinition>;
+```
+
+Loads a single markdown agent file and resolves its frontmatter against
+registered plugin toolkits + ambient tool library.
+
+Rejects non-empty `agents:` frontmatter because single-file loads have
+no siblings to resolve sub-agent references against — callers must use
+[loadAgentsFromDir](Function.loadAgentsFromDir.md) when markdown agents delegate to one another.
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `filePath` | `string` |
+| `ctx` | `LoadContext` |
+
+## Returns
+
+`Promise`\<[`AgentDefinition`](Interface.AgentDefinition.md)\>
diff --git a/docs/docs/api/appkit/Function.loadAgentsFromDir.md b/docs/docs/api/appkit/Function.loadAgentsFromDir.md
new file mode 100644
index 000000000..9745286e4
--- /dev/null
+++ b/docs/docs/api/appkit/Function.loadAgentsFromDir.md
@@ -0,0 +1,29 @@
+# Function: loadAgentsFromDir()
+
+```ts
+function loadAgentsFromDir(dir: string, ctx: LoadContext): Promise<LoadResult>;
+```
+
+Scans a directory for `*.md` files and produces an `AgentDefinition` record
+keyed by file-stem. Throws on frontmatter errors or unresolved references.
+Returns an empty map if the directory does not exist.
+
+Runs in two passes so sub-agent references in frontmatter (`agents: [...]`)
+can be resolved regardless of file-system iteration order:
+
+1. Build every agent's definition from its own file.
+2. Walk `agents:` references and wire `def.agents = { sibling: siblingDef }`
+   by looking them up in the complete map. Dangling names and
+   self-references fail loudly; mutual delegation is allowed and bounded
+   at runtime by `limits.maxSubAgentDepth`.
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `dir` | `string` |
+| `ctx` | `LoadContext` |
+
+## Returns
+
+`Promise`\<`LoadResult`\>
diff --git a/docs/docs/api/appkit/Function.mcpServer.md b/docs/docs/api/appkit/Function.mcpServer.md
new file mode 100644
index 000000000..cafd46572
--- /dev/null
+++ b/docs/docs/api/appkit/Function.mcpServer.md
@@ -0,0 +1,26 @@
+# Function: mcpServer()
+
+```ts
+function mcpServer(name: string, url: string): CustomMcpServerTool;
+```
+
+Factory for declaring a custom MCP server tool.
+
+Replaces the verbose `{ type: "custom_mcp_server", custom_mcp_server: { app_name, app_url } }`
+wrapper with a concise positional call.
+
+Example:
+```ts
+mcpServer("my-app", "https://my-app.databricksapps.com/mcp")
+```
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `name` | `string` |
+| `url` | `string` |
+
+## Returns
+
+`CustomMcpServerTool`
diff --git a/docs/docs/api/appkit/Function.runAgent.md b/docs/docs/api/appkit/Function.runAgent.md
new file mode 100644
index 000000000..4e1f86087
--- /dev/null
+++ b/docs/docs/api/appkit/Function.runAgent.md
@@ -0,0 +1,29 @@
+# Function: runAgent()
+
+```ts
+function runAgent(def: AgentDefinition, input: RunAgentInput): Promise<RunAgentResult>;
+```
+
+Standalone agent execution without `createApp`. Resolves the adapter, binds
+inline tools, and drives the adapter's `run()` loop to completion.
+
+Limitations vs. running through the agents() plugin:
+- No OBO (on-behalf-of-user execution): there is no HTTP request, so plugin
+  tools run as the service principal (when they work at all).
+- Hosted tools (MCP) are not supported — they require a live MCP client
+  that only exists inside the agents plugin.
+- Sub-agents (`agents: { ... }` on the def) are executed as nested
+  `runAgent` calls with no shared thread state.
+- Plugin tools (`fromPlugin` markers or `ToolkitEntry` spreads) require
+  passing `plugins: [...]` via `RunAgentInput`.
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `def` | [`AgentDefinition`](Interface.AgentDefinition.md) |
+| `input` | [`RunAgentInput`](Interface.RunAgentInput.md) |
+
+## Returns
+
+`Promise`\<[`RunAgentResult`](Interface.RunAgentResult.md)\>
diff --git a/docs/docs/api/appkit/Function.tool.md b/docs/docs/api/appkit/Function.tool.md
new file mode 100644
index 000000000..d6799cfd1
--- /dev/null
+++ b/docs/docs/api/appkit/Function.tool.md
@@ -0,0 +1,29 @@
+# Function: tool()
+
+```ts
+function tool<S>(config: ToolConfig<S>): FunctionTool;
+```
+
+Factory for defining function tools with Zod schemas.
+
+- Generates JSON Schema (for the LLM) from the Zod schema via `z.toJSONSchema()`.
+- Infers the `execute` argument type from the schema.
+- Validates tool call arguments at runtime. On validation failure, returns
+  a formatted error string to the LLM instead of throwing, so the model
+  can self-correct on its next turn.
+
+## Type Parameters
+
+| Type Parameter |
+| ------ |
+| `S` *extends* `ZodType`\<`unknown`, `unknown`, `$ZodTypeInternals`\<`unknown`, `unknown`\>\> |
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `config` | [`ToolConfig`](Interface.ToolConfig.md)\<`S`\> |
+
+## Returns
+
+[`FunctionTool`](Interface.FunctionTool.md)
diff --git a/docs/docs/api/appkit/Interface.AgentAdapter.md b/docs/docs/api/appkit/Interface.AgentAdapter.md
new file mode 100644
index 000000000..52083157e
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.AgentAdapter.md
@@ -0,0 +1,20 @@
+# Interface: AgentAdapter
+
+## Methods
+
+### run()
+
+```ts
+run(input: AgentInput, context: AgentRunContext): AsyncGenerator<AgentEvent, void, unknown>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `input` | [`AgentInput`](Interface.AgentInput.md) |
+| `context` | [`AgentRunContext`](Interface.AgentRunContext.md) |
+
+#### Returns
+
+`AsyncGenerator`\<[`AgentEvent`](TypeAlias.AgentEvent.md), `void`, `unknown`\>
diff --git a/docs/docs/api/appkit/Interface.AgentDefinition.md b/docs/docs/api/appkit/Interface.AgentDefinition.md
new file mode 100644
index 000000000..87db651d0
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.AgentDefinition.md
@@ -0,0 +1,97 @@
+# Interface: AgentDefinition
+
+## Properties
+
+### agents?
+
+```ts
+optional agents: Record<string, AgentDefinition>;
+```
+
+Sub-agents, exposed as `agent-<key>` tools on this agent.
+
+***
+
+### baseSystemPrompt?
+
+```ts
+optional baseSystemPrompt: BaseSystemPromptOption;
+```
+
+Override the plugin's baseSystemPrompt for this agent only.
+
+***
+
+### ephemeral?
+
+```ts
+optional ephemeral: boolean;
+```
+
+When true, the thread used for a chat request against this agent is
+deleted from `ThreadStore` after the stream completes (success or
+failure). Use for stateless one-shot agents — e.g. autocomplete, where
+each request is independent and retaining history would both poison
+future calls and accumulate unbounded state in the default
+`InMemoryThreadStore`. Defaults to `false`.
+
+***
+
+### instructions
+
+```ts
+instructions: string;
+```
+
+System prompt body. For markdown-loaded agents this is the file body.
+
+***
+
+### maxSteps?
+
+```ts
+optional maxSteps: number;
+```
+
+***
+
+### maxTokens?
+
+```ts
+optional maxTokens: number;
+```
+
+***
+
+### model?
+
+```ts
+optional model: 
+  | string
+  | AgentAdapter
+| Promise<AgentAdapter>;
+```
+
+Model adapter (or endpoint-name string sugar for
+`DatabricksAdapter.fromServingEndpoint({ endpointName })`). Optional —
+falls back to the plugin's `defaultModel`.
+
+***
+
+### name?
+
+```ts
+optional name: string;
+```
+
+Filled in from the enclosing key when used in `agents: { foo: def }`.
+
+***
+
+### tools?
+
+```ts
+optional tools: AgentTools;
+```
+
+Per-agent tool record. Key is the LLM-visible tool-call name.
diff --git a/docs/docs/api/appkit/Interface.AgentInput.md b/docs/docs/api/appkit/Interface.AgentInput.md
new file mode 100644
index 000000000..6d2eff8b0
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.AgentInput.md
@@ -0,0 +1,33 @@
+# Interface: AgentInput
+
+## Properties
+
+### messages
+
+```ts
+messages: Message[];
+```
+
+***
+
+### signal?
+
+```ts
+optional signal: AbortSignal;
+```
+
+***
+
+### threadId
+
+```ts
+threadId: string;
+```
+
+***
+
+### tools
+
+```ts
+tools: AgentToolDefinition[];
+```
diff --git a/docs/docs/api/appkit/Interface.AgentRunContext.md b/docs/docs/api/appkit/Interface.AgentRunContext.md
new file mode 100644
index 000000000..c9bfcb79f
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.AgentRunContext.md
@@ -0,0 +1,28 @@
+# Interface: AgentRunContext
+
+## Properties
+
+### executeTool()
+
+```ts
+executeTool: (name: string, args: unknown) => Promise<unknown>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `name` | `string` |
+| `args` | `unknown` |
+
+#### Returns
+
+`Promise`\<`unknown`\>
+
+***
+
+### signal?
+
+```ts
+optional signal: AbortSignal;
+```
diff --git a/docs/docs/api/appkit/Interface.AgentToolDefinition.md b/docs/docs/api/appkit/Interface.AgentToolDefinition.md
new file mode 100644
index 000000000..51c375955
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.AgentToolDefinition.md
@@ -0,0 +1,33 @@
+# Interface: AgentToolDefinition
+
+## Properties
+
+### annotations?
+
+```ts
+optional annotations: ToolAnnotations;
+```
+
+***
+
+### description
+
+```ts
+description: string;
+```
+
+***
+
+### name
+
+```ts
+name: string;
+```
+
+***
+
+### parameters
+
+```ts
+parameters: JSONSchema7;
+```
diff --git a/docs/docs/api/appkit/Interface.AgentsPluginConfig.md b/docs/docs/api/appkit/Interface.AgentsPluginConfig.md
new file mode 100644
index 000000000..dcf7573ce
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.AgentsPluginConfig.md
@@ -0,0 +1,227 @@
+# Interface: AgentsPluginConfig
+
+Configuration for the `agents()` plugin. Extends the base configuration interface for AppKit plugins.
+
+## Extends
+
+- [`BasePluginConfig`](Interface.BasePluginConfig.md)
+
+## Indexable
+
+```ts
+[key: string]: unknown
+```
+
+## Properties
+
+### agents?
+
+```ts
+optional agents: Record<string, AgentDefinition>;
+```
+
+Code-defined agents, merged with file-loaded ones (code wins on key collision).
+
+***
+
+### approval?
+
+```ts
+optional approval: {
+  requireForDestructive?: boolean;
+  timeoutMs?: number;
+};
+```
+
+Human-in-the-loop approval gate for destructive tool calls. When enabled
+(the default), the agents plugin emits an `appkit.approval_pending` SSE
+event before executing any tool annotated `destructive: true` and waits
+for a `POST /chat/approve` decision from the same user who initiated the
+stream. A missing decision after `timeoutMs` auto-denies the call.
+
+#### requireForDestructive?
+
+```ts
+optional requireForDestructive: boolean;
+```
+
+Require human approval for tools annotated `destructive: true`. Default: `true`.
+
+#### timeoutMs?
+
+```ts
+optional timeoutMs: number;
+```
+
+Milliseconds to wait before auto-denying. Default: `60_000`.
+
+***
+
+### autoInheritTools?
+
+```ts
+optional autoInheritTools: boolean | AutoInheritToolsConfig;
+```
+
+Whether to auto-inherit every ToolProvider plugin's toolkit. Accepts a boolean shorthand or an `AutoInheritToolsConfig` object.
+
+***
+
+### baseSystemPrompt?
+
+```ts
+optional baseSystemPrompt: BaseSystemPromptOption;
+```
+
+Customize or disable the AppKit base system prompt.
+
+***
+
+### defaultAgent?
+
+```ts
+optional defaultAgent: string;
+```
+
+Agent used when clients don't specify one. Defaults to the first-registered agent or the file with `default: true` frontmatter.
+
+***
+
+### defaultModel?
+
+```ts
+optional defaultModel: 
+  | string
+  | AgentAdapter
+| Promise<AgentAdapter>;
+```
+
+Default model for agents that don't specify their own (in code or frontmatter).
+
+***
+
+### dir?
+
+```ts
+optional dir: string | false;
+```
+
+Directory to scan for markdown agent files. Default `./config/agents`. Set to `false` to disable.
+
+***
+
+### host?
+
+```ts
+optional host: string;
+```
+
+#### Inherited from
+
+[`BasePluginConfig`](Interface.BasePluginConfig.md).[`host`](Interface.BasePluginConfig.md#host)
+
+***
+
+### limits?
+
+```ts
+optional limits: {
+  maxConcurrentStreamsPerUser?: number;
+  maxSubAgentDepth?: number;
+  maxToolCalls?: number;
+};
+```
+
+Runtime resource limits applied during agent execution. Defaults are
+tuned to protect a single-instance deployment from a misbehaving user or
+a runaway prompt injection; tighten or relax as appropriate for the
+deployment's scale and trust model. Request-body caps (chat message
+size, invocations input size / length) are enforced statically by the
+Zod schemas and are not configurable here.
+
+#### maxConcurrentStreamsPerUser?
+
+```ts
+optional maxConcurrentStreamsPerUser: number;
+```
+
+Max concurrent chat streams a single user may have open. Subsequent
+`POST /chat` requests from that user while at-limit are rejected with
+HTTP 429. Default: `5`.
+
+#### maxSubAgentDepth?
+
+```ts
+optional maxSubAgentDepth: number;
+```
+
+Max sub-agent recursion depth. Protects against a prompt-injected
+agent that delegates to a sub-agent which in turn delegates back to
+itself (directly or transitively). Default: `3`.
+
+#### maxToolCalls?
+
+```ts
+optional maxToolCalls: number;
+```
+
+Max tool invocations per agent run (across the full tool-call graph,
+including sub-agent invocations). A run that exceeds the budget is
+aborted with a terminal error event. Default: `50`.
+
+***
+
+### mcp?
+
+```ts
+optional mcp: McpHostPolicyConfig;
+```
+
+MCP server host policy. By default only same-origin Databricks workspace
+URLs may be used as MCP endpoints; custom hosts must be explicitly
+allowlisted here. Workspace credentials (SP / OBO) are never forwarded
+to non-workspace hosts.
+
+***
+
+### name?
+
+```ts
+optional name: string;
+```
+
+#### Inherited from
+
+[`BasePluginConfig`](Interface.BasePluginConfig.md).[`name`](Interface.BasePluginConfig.md#name)
+
+***
+
+### telemetry?
+
+```ts
+optional telemetry: TelemetryOptions;
+```
+
+#### Inherited from
+
+[`BasePluginConfig`](Interface.BasePluginConfig.md).[`telemetry`](Interface.BasePluginConfig.md#telemetry)
+
+***
+
+### threadStore?
+
+```ts
+optional threadStore: ThreadStore;
+```
+
+Persistent thread store. Default: in-memory.
+
+***
+
+### tools?
+
+```ts
+optional tools: Record<string, AgentTool>;
+```
+
+Ambient tool library. Keys may be referenced by markdown frontmatter via `tools: [key1, key2]`.
diff --git a/docs/docs/api/appkit/Interface.BasePluginConfig.md b/docs/docs/api/appkit/Interface.BasePluginConfig.md
index 3483c136e..653df68ce 100644
--- a/docs/docs/api/appkit/Interface.BasePluginConfig.md
+++ b/docs/docs/api/appkit/Interface.BasePluginConfig.md
@@ -4,6 +4,7 @@ Base configuration interface for AppKit plugins
 
 ## Extended by
 
+- [`AgentsPluginConfig`](Interface.AgentsPluginConfig.md)
 - [`IJobsConfig`](Interface.IJobsConfig.md)
 
 ## Indexable
diff --git a/docs/docs/api/appkit/Interface.FromPluginMarker.md b/docs/docs/api/appkit/Interface.FromPluginMarker.md
new file mode 100644
index 000000000..1a1fedd3c
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.FromPluginMarker.md
@@ -0,0 +1,32 @@
+# Interface: FromPluginMarker
+
+A lazy reference to a plugin's tools, produced by [fromPlugin](Function.fromPlugin.md) and
+resolved to concrete `ToolkitEntry`s at `AgentsPlugin.setup()` time.
+
+The marker is spread under a unique symbol key so multiple calls to
+`fromPlugin` (even for the same plugin) coexist in an `AgentDefinition.tools`
+record without colliding.
+
+## Properties
+
+### \[FROM\_PLUGIN\_MARKER\]
+
+```ts
+readonly [FROM_PLUGIN_MARKER]: true;
+```
+
+***
+
+### opts
+
+```ts
+readonly opts: ToolkitOptions | undefined;
+```
+
+***
+
+### pluginName
+
+```ts
+readonly pluginName: string;
+```
diff --git a/docs/docs/api/appkit/Interface.FunctionTool.md b/docs/docs/api/appkit/Interface.FunctionTool.md
new file mode 100644
index 000000000..c096dacac
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.FunctionTool.md
@@ -0,0 +1,59 @@
+# Interface: FunctionTool
+
+## Properties
+
+### description?
+
+```ts
+optional description: string | null;
+```
+
+***
+
+### execute()
+
+```ts
+execute: (args: Record<string, unknown>) => string | Promise<string>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `args` | `Record`\<`string`, `unknown`\> |
+
+#### Returns
+
+`string` \| `Promise`\<`string`\>
+
+***
+
+### name
+
+```ts
+name: string;
+```
+
+***
+
+### parameters?
+
+```ts
+optional parameters: Record<string, unknown> | null;
+```
+
+***
+
+### strict?
+
+```ts
+optional strict: boolean | null;
+```
+
+***
+
+### type
+
+```ts
+type: "function";
+```
diff --git a/docs/docs/api/appkit/Interface.Message.md b/docs/docs/api/appkit/Interface.Message.md
new file mode 100644
index 000000000..ed818408d
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.Message.md
@@ -0,0 +1,49 @@
+# Interface: Message
+
+## Properties
+
+### content
+
+```ts
+content: string;
+```
+
+***
+
+### createdAt
+
+```ts
+createdAt: Date;
+```
+
+***
+
+### id
+
+```ts
+id: string;
+```
+
+***
+
+### role
+
+```ts
+role: "user" | "assistant" | "system" | "tool";
+```
+
+***
+
+### toolCallId?
+
+```ts
+optional toolCallId: string;
+```
+
+***
+
+### toolCalls?
+
+```ts
+optional toolCalls: ToolCall[];
+```
diff --git a/docs/docs/api/appkit/Interface.PromptContext.md b/docs/docs/api/appkit/Interface.PromptContext.md
new file mode 100644
index 000000000..e26ea167d
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.PromptContext.md
@@ -0,0 +1,27 @@
+# Interface: PromptContext
+
+Context passed to `baseSystemPrompt` callbacks.
+
+## Properties
+
+### agentName
+
+```ts
+agentName: string;
+```
+
+***
+
+### pluginNames
+
+```ts
+pluginNames: string[];
+```
+
+***
+
+### toolNames
+
+```ts
+toolNames: string[];
+```
diff --git a/docs/docs/api/appkit/Interface.RunAgentInput.md b/docs/docs/api/appkit/Interface.RunAgentInput.md
new file mode 100644
index 000000000..c7fa4b02e
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.RunAgentInput.md
@@ -0,0 +1,35 @@
+# Interface: RunAgentInput
+
+## Properties
+
+### messages
+
+```ts
+messages: string | Message[];
+```
+
+Seed messages for the run. Either a single user string or a full message list.
+
+***
+
+### plugins?
+
+```ts
+optional plugins: PluginData<PluginConstructor, unknown, string>[];
+```
+
+Optional plugin list used to resolve `fromPlugin` markers in `def.tools`.
+Required when the def contains any `...fromPlugin(factory)` spreads;
+ignored otherwise. `runAgent` constructs a fresh instance per plugin
+and dispatches tool calls against it as the service principal (no
+OBO — there is no HTTP request in standalone mode).
+
+***
+
+### signal?
+
+```ts
+optional signal: AbortSignal;
+```
+
+Abort signal for cancellation.
diff --git a/docs/docs/api/appkit/Interface.RunAgentResult.md b/docs/docs/api/appkit/Interface.RunAgentResult.md
new file mode 100644
index 000000000..a9ba258dd
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.RunAgentResult.md
@@ -0,0 +1,21 @@
+# Interface: RunAgentResult
+
+## Properties
+
+### events
+
+```ts
+events: AgentEvent[];
+```
+
+Every event the adapter yielded, in order. Useful for inspection/tests.
+
+***
+
+### text
+
+```ts
+text: string;
+```
+
+Aggregated text output from all `message_delta` events.
diff --git a/docs/docs/api/appkit/Interface.Thread.md b/docs/docs/api/appkit/Interface.Thread.md
new file mode 100644
index 000000000..e9f15fee0
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.Thread.md
@@ -0,0 +1,41 @@
+# Interface: Thread
+
+## Properties
+
+### createdAt
+
+```ts
+createdAt: Date;
+```
+
+***
+
+### id
+
+```ts
+id: string;
+```
+
+***
+
+### messages
+
+```ts
+messages: Message[];
+```
+
+***
+
+### updatedAt
+
+```ts
+updatedAt: Date;
+```
+
+***
+
+### userId
+
+```ts
+userId: string;
+```
diff --git a/docs/docs/api/appkit/Interface.ThreadStore.md b/docs/docs/api/appkit/Interface.ThreadStore.md
new file mode 100644
index 000000000..215b76a2c
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.ThreadStore.md
@@ -0,0 +1,98 @@
+# Interface: ThreadStore
+
+## Methods
+
+### addMessage()
+
+```ts
+addMessage(
+   threadId: string, 
+   userId: string, 
+message: Message): Promise<void>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `threadId` | `string` |
+| `userId` | `string` |
+| `message` | [`Message`](Interface.Message.md) |
+
+#### Returns
+
+`Promise`\<`void`\>
+
+***
+
+### create()
+
+```ts
+create(userId: string): Promise<Thread>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `userId` | `string` |
+
+#### Returns
+
+`Promise`\<[`Thread`](Interface.Thread.md)\>
+
+***
+
+### delete()
+
+```ts
+delete(threadId: string, userId: string): Promise<boolean>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `threadId` | `string` |
+| `userId` | `string` |
+
+#### Returns
+
+`Promise`\<`boolean`\>
+
+***
+
+### get()
+
+```ts
+get(threadId: string, userId: string): Promise<Thread | null>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `threadId` | `string` |
+| `userId` | `string` |
+
+#### Returns
+
+`Promise`\<[`Thread`](Interface.Thread.md) \| `null`\>
+
+***
+
+### list()
+
+```ts
+list(userId: string): Promise<Thread[]>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `userId` | `string` |
+
+#### Returns
+
+`Promise`\<[`Thread`](Interface.Thread.md)[]\>
diff --git a/docs/docs/api/appkit/Interface.ToolConfig.md b/docs/docs/api/appkit/Interface.ToolConfig.md
new file mode 100644
index 000000000..48828a387
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.ToolConfig.md
@@ -0,0 +1,49 @@
+# Interface: ToolConfig\<S\>
+
+## Type Parameters
+
+| Type Parameter |
+| ------ |
+| `S` *extends* `z.ZodType` |
+
+## Properties
+
+### description?
+
+```ts
+optional description: string;
+```
+
+***
+
+### execute()
+
+```ts
+execute: (args: output<S>) => string | Promise<string>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `args` | `output`\<`S`\> |
+
+#### Returns
+
+`string` \| `Promise`\<`string`\>
+
+***
+
+### name
+
+```ts
+name: string;
+```
+
+***
+
+### schema
+
+```ts
+schema: S;
+```
diff --git a/docs/docs/api/appkit/Interface.ToolProvider.md b/docs/docs/api/appkit/Interface.ToolProvider.md
new file mode 100644
index 000000000..9c8851a06
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.ToolProvider.md
@@ -0,0 +1,36 @@
+# Interface: ToolProvider
+
+## Methods
+
+### executeAgentTool()
+
+```ts
+executeAgentTool(
+   name: string, 
+   args: unknown, 
+signal?: AbortSignal): Promise<unknown>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `name` | `string` |
+| `args` | `unknown` |
+| `signal?` | `AbortSignal` |
+
+#### Returns
+
+`Promise`\<`unknown`\>
+
+***
+
+### getAgentTools()
+
+```ts
+getAgentTools(): AgentToolDefinition[];
+```
+
+#### Returns
+
+[`AgentToolDefinition`](Interface.AgentToolDefinition.md)[]
diff --git a/docs/docs/api/appkit/Interface.ToolkitEntry.md b/docs/docs/api/appkit/Interface.ToolkitEntry.md
new file mode 100644
index 000000000..626cc8981
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.ToolkitEntry.md
@@ -0,0 +1,59 @@
+# Interface: ToolkitEntry
+
+A tool reference produced by a plugin's `.toolkit()` call. The agents plugin
+recognizes the `__toolkitRef` brand and dispatches tool invocations through
+`PluginContext.executeTool(req, pluginName, localName, ...)`, preserving
+OBO (asUser) and telemetry spans.
+
+## Properties
+
+### \_\_toolkitRef
+
+```ts
+readonly __toolkitRef: true;
+```
+
+***
+
+### annotations?
+
+```ts
+optional annotations: ToolAnnotations;
+```
+
+***
+
+### autoInheritable?
+
+```ts
+optional autoInheritable: boolean;
+```
+
+Whether this tool is eligible for `autoInheritTools` spreading. Mirrors
+`ToolEntry.autoInheritable` from the source registry so the agents
+plugin can filter auto-inherited tools without re-walking the provider's
+internal registry.
+
+***
+
+### def
+
+```ts
+def: AgentToolDefinition;
+```
+
+***
+
+### localName
+
+```ts
+localName: string;
+```
+
+***
+
+### pluginName
+
+```ts
+pluginName: string;
+```
diff --git a/docs/docs/api/appkit/Interface.ToolkitOptions.md b/docs/docs/api/appkit/Interface.ToolkitOptions.md
new file mode 100644
index 000000000..1beb22b0f
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.ToolkitOptions.md
@@ -0,0 +1,41 @@
+# Interface: ToolkitOptions
+
+## Properties
+
+### except?
+
+```ts
+optional except: string[];
+```
+
+Exclude tools whose local name matches one of these.
+
+***
+
+### only?
+
+```ts
+optional only: string[];
+```
+
+Only include tools whose local name matches one of these.
+
+***
+
+### prefix?
+
+```ts
+optional prefix: string;
+```
+
+Key prefix to prepend to each tool's local name. Defaults to `${pluginName}.`.
+
+***
+
+### rename?
+
+```ts
+optional rename: Record<string, string>;
+```
+
+Remap specific local names to different keys (applied after prefix).
diff --git a/docs/docs/api/appkit/TypeAlias.AgentEvent.md b/docs/docs/api/appkit/TypeAlias.AgentEvent.md
new file mode 100644
index 000000000..a854a8049
--- /dev/null
+++ b/docs/docs/api/appkit/TypeAlias.AgentEvent.md
@@ -0,0 +1,268 @@
+# Type Alias: AgentEvent
+
+```ts
+type AgentEvent = 
+  | {
+  content: string;
+  type: "message_delta";
+}
+  | {
+  content: string;
+  type: "message";
+}
+  | {
+  args: unknown;
+  callId: string;
+  name: string;
+  type: "tool_call";
+}
+  | {
+  callId: string;
+  error?: string;
+  result: unknown;
+  type: "tool_result";
+}
+  | {
+  content: string;
+  type: "thinking";
+}
+  | {
+  error?: string;
+  status: "running" | "waiting" | "complete" | "error";
+  type: "status";
+}
+  | {
+  data: Record<string, unknown>;
+  type: "metadata";
+}
+  | {
+  annotations?: ToolAnnotations;
+  approvalId: string;
+  args: unknown;
+  streamId: string;
+  toolName: string;
+  type: "approval_pending";
+};
+```
+
+## Type Declaration
+
+```ts
+{
+  content: string;
+  type: "message_delta";
+}
+```
+
+### content
+
+```ts
+content: string;
+```
+
+### type
+
+```ts
+type: "message_delta";
+```
+
+```ts
+{
+  content: string;
+  type: "message";
+}
+```
+
+### content
+
+```ts
+content: string;
+```
+
+### type
+
+```ts
+type: "message";
+```
+
+```ts
+{
+  args: unknown;
+  callId: string;
+  name: string;
+  type: "tool_call";
+}
+```
+
+### args
+
+```ts
+args: unknown;
+```
+
+### callId
+
+```ts
+callId: string;
+```
+
+### name
+
+```ts
+name: string;
+```
+
+### type
+
+```ts
+type: "tool_call";
+```
+
+```ts
+{
+  callId: string;
+  error?: string;
+  result: unknown;
+  type: "tool_result";
+}
+```
+
+### callId
+
+```ts
+callId: string;
+```
+
+### error?
+
+```ts
+optional error: string;
+```
+
+### result
+
+```ts
+result: unknown;
+```
+
+### type
+
+```ts
+type: "tool_result";
+```
+
+```ts
+{
+  content: string;
+  type: "thinking";
+}
+```
+
+### content
+
+```ts
+content: string;
+```
+
+### type
+
+```ts
+type: "thinking";
+```
+
+```ts
+{
+  error?: string;
+  status: "running" | "waiting" | "complete" | "error";
+  type: "status";
+}
+```
+
+### error?
+
+```ts
+optional error: string;
+```
+
+### status
+
+```ts
+status: "running" | "waiting" | "complete" | "error";
+```
+
+### type
+
+```ts
+type: "status";
+```
+
+```ts
+{
+  data: Record<string, unknown>;
+  type: "metadata";
+}
+```
+
+### data
+
+```ts
+data: Record<string, unknown>;
+```
+
+### type
+
+```ts
+type: "metadata";
+```
+
+```ts
+{
+  annotations?: ToolAnnotations;
+  approvalId: string;
+  args: unknown;
+  streamId: string;
+  toolName: string;
+  type: "approval_pending";
+}
+```
+
+### annotations?
+
+```ts
+optional annotations: ToolAnnotations;
+```
+
+### approvalId
+
+```ts
+approvalId: string;
+```
+
+### args
+
+```ts
+args: unknown;
+```
+
+### streamId
+
+```ts
+streamId: string;
+```
+
+### toolName
+
+```ts
+toolName: string;
+```
+
+### type
+
+```ts
+type: "approval_pending";
+```
+
+An `approval_pending` event is emitted by the agents plugin (not adapters) when a tool call annotated
+`destructive: true` is awaiting human approval. Clients should render
+an approval prompt and POST to `/chat/approve` with the matching
+`approvalId` and a `decision` of `approve` or `deny`.
diff --git a/docs/docs/api/appkit/TypeAlias.AgentTool.md b/docs/docs/api/appkit/TypeAlias.AgentTool.md
new file mode 100644
index 000000000..e165cec66
--- /dev/null
+++ b/docs/docs/api/appkit/TypeAlias.AgentTool.md
@@ -0,0 +1,12 @@
+# Type Alias: AgentTool
+
+```ts
+type AgentTool = 
+  | FunctionTool
+  | HostedTool
+  | ToolkitEntry;
+```
+
+Any tool an agent can invoke: inline function tools (`tool()`), hosted MCP
+tools (`mcpServer()` / raw hosted), or toolkit references from plugins
+(`analytics().toolkit()`).
diff --git a/docs/docs/api/appkit/TypeAlias.AgentTools.md b/docs/docs/api/appkit/TypeAlias.AgentTools.md
new file mode 100644
index 000000000..05b9ce619
--- /dev/null
+++ b/docs/docs/api/appkit/TypeAlias.AgentTools.md
@@ -0,0 +1,14 @@
+# Type Alias: AgentTools
+
+```ts
+type AgentTools = {
+[key: string]: AgentTool;
+} & {
+[key: symbol]: FromPluginMarker;
+};
+```
+
+Per-agent tool record. String keys map to inline tools, toolkit entries,
+hosted tools, etc. Symbol keys hold `FromPluginMarker` references produced
+by `fromPlugin(factory)` spreads — these are resolved at
+`AgentsPlugin.setup()` time against registered `ToolProvider` plugins.
diff --git a/docs/docs/api/appkit/TypeAlias.BaseSystemPromptOption.md b/docs/docs/api/appkit/TypeAlias.BaseSystemPromptOption.md
new file mode 100644
index 000000000..c59226619
--- /dev/null
+++ b/docs/docs/api/appkit/TypeAlias.BaseSystemPromptOption.md
@@ -0,0 +1,8 @@
+# Type Alias: BaseSystemPromptOption
+
+```ts
+type BaseSystemPromptOption = 
+  | false
+  | string
+  | ((ctx: PromptContext) => string);
+```
diff --git a/docs/docs/api/appkit/TypeAlias.HostedTool.md b/docs/docs/api/appkit/TypeAlias.HostedTool.md
new file mode 100644
index 000000000..433c0ac8a
--- /dev/null
+++ b/docs/docs/api/appkit/TypeAlias.HostedTool.md
@@ -0,0 +1,9 @@
+# Type Alias: HostedTool
+
+```ts
+type HostedTool = 
+  | GenieTool
+  | VectorSearchIndexTool
+  | CustomMcpServerTool
+  | ExternalMcpServerTool;
+```
diff --git a/docs/docs/api/appkit/Variable.agents.md b/docs/docs/api/appkit/Variable.agents.md
new file mode 100644
index 000000000..d5bc7a093
--- /dev/null
+++ b/docs/docs/api/appkit/Variable.agents.md
@@ -0,0 +1,19 @@
+# Variable: agents
+
+```ts
+const agents: ToPlugin<typeof AgentsPlugin, AgentsPluginConfig, string> & NamedPluginFactory<string>;
+```
+
+Plugin factory for the agents plugin. Reads `config/agents/*.md` by default,
+resolves toolkits/tools from registered plugins, exposes `appkit.agents.*`
+runtime API and mounts `/invocations`.
+
+## Example
+
+```ts
+import { agents, analytics, createApp, server } from "@databricks/appkit";
+
+await createApp({
+  plugins: [server(), analytics(), agents()],
+});
+```
diff --git a/docs/docs/api/appkit/index.md b/docs/docs/api/appkit/index.md
index 5a21e935f..ec44cd683 100644
--- a/docs/docs/api/appkit/index.md
+++ b/docs/docs/api/appkit/index.md
@@ -31,12 +31,20 @@ plugin architecture, and React integration.
 
 | Interface | Description |
 | ------ | ------ |
+| [AgentAdapter](Interface.AgentAdapter.md) | - |
+| [AgentDefinition](Interface.AgentDefinition.md) | - |
+| [AgentInput](Interface.AgentInput.md) | - |
+| [AgentRunContext](Interface.AgentRunContext.md) | - |
+| [AgentsPluginConfig](Interface.AgentsPluginConfig.md) | Base configuration interface for AppKit plugins |
+| [AgentToolDefinition](Interface.AgentToolDefinition.md) | - |
 | [BasePluginConfig](Interface.BasePluginConfig.md) | Base configuration interface for AppKit plugins |
 | [CacheConfig](Interface.CacheConfig.md) | Configuration for the CacheInterceptor. Controls TTL, size limits, storage backend, and probabilistic cleanup. |
 | [DatabaseCredential](Interface.DatabaseCredential.md) | Database credentials with OAuth token for Postgres connection |
 | [EndpointConfig](Interface.EndpointConfig.md) | - |
 | [FilePolicyUser](Interface.FilePolicyUser.md) | Minimal user identity passed to the policy function. |
 | [FileResource](Interface.FileResource.md) | Describes the file or directory being acted upon. |
+| [FromPluginMarker](Interface.FromPluginMarker.md) | A lazy reference to a plugin's tools, produced by [fromPlugin](Function.fromPlugin.md) and resolved to concrete `ToolkitEntry`s at `AgentsPlugin.setup()` time. |
+| [FunctionTool](Interface.FunctionTool.md) | - |
 | [GenerateDatabaseCredentialRequest](Interface.GenerateDatabaseCredentialRequest.md) | Request parameters for generating database OAuth credentials |
 | [IJobsConfig](Interface.IJobsConfig.md) | Configuration for the Jobs plugin. |
 | [ITelemetry](Interface.ITelemetry.md) | Plugin-facing interface for OpenTelemetry instrumentation. Provides a thin abstraction over OpenTelemetry APIs for plugins. |
@@ -44,26 +52,41 @@ plugin architecture, and React integration.
 | [JobConfig](Interface.JobConfig.md) | Per-job configuration options. |
 | [JobsConnectorConfig](Interface.JobsConnectorConfig.md) | - |
 | [LakebasePoolConfig](Interface.LakebasePoolConfig.md) | Configuration for creating a Lakebase connection pool |
+| [Message](Interface.Message.md) | - |
 | [PluginManifest](Interface.PluginManifest.md) | Plugin manifest that declares metadata and resource requirements. Attached to plugin classes as a static property. Extends the shared PluginManifest with strict resource types. |
+| [PromptContext](Interface.PromptContext.md) | Context passed to `baseSystemPrompt` callbacks. |
 | [RequestedClaims](Interface.RequestedClaims.md) | Optional claims for fine-grained Unity Catalog table permissions When specified, the returned token will be scoped to only the requested tables |
 | [RequestedResource](Interface.RequestedResource.md) | Resource to request permissions for in Unity Catalog |
 | [ResourceEntry](Interface.ResourceEntry.md) | Internal representation of a resource in the registry. Extends ResourceRequirement with resolution state and plugin ownership. |
 | [ResourceFieldEntry](Interface.ResourceFieldEntry.md) | Defines a single field for a resource. Each field has its own environment variable and optional description. Single-value types use one key (e.g. id); multi-value types (database, secret) use multiple (e.g. instance_name, database_name or scope, key). |
 | [ResourceRequirement](Interface.ResourceRequirement.md) | Declares a resource requirement for a plugin. Can be defined statically in a manifest or dynamically via getResourceRequirements(). Narrows the generated base: type → ResourceType enum, permission → ResourcePermission union. |
+| [RunAgentInput](Interface.RunAgentInput.md) | - |
+| [RunAgentResult](Interface.RunAgentResult.md) | - |
 | [ServingEndpointEntry](Interface.ServingEndpointEntry.md) | Shape of a single registry entry. |
 | [ServingEndpointRegistry](Interface.ServingEndpointRegistry.md) | Registry interface for serving endpoint type generation. Empty by default — augmented by the Vite type generator's `.d.ts` output via module augmentation. When populated, provides autocomplete for alias names and typed request/response/chunk per endpoint. |
 | [StreamExecutionSettings](Interface.StreamExecutionSettings.md) | Execution settings for streaming endpoints. Extends PluginExecutionSettings with SSE stream configuration. |
 | [TelemetryConfig](Interface.TelemetryConfig.md) | OpenTelemetry configuration for AppKit applications |
+| [Thread](Interface.Thread.md) | - |
+| [ThreadStore](Interface.ThreadStore.md) | - |
+| [ToolConfig](Interface.ToolConfig.md) | - |
+| [ToolkitEntry](Interface.ToolkitEntry.md) | A tool reference produced by a plugin's `.toolkit()` call. The agents plugin recognizes the `__toolkitRef` brand and dispatches tool invocations through `PluginContext.executeTool(req, pluginName, localName, ...)`, preserving OBO (asUser) and telemetry spans. |
+| [ToolkitOptions](Interface.ToolkitOptions.md) | - |
+| [ToolProvider](Interface.ToolProvider.md) | - |
 | [ValidationResult](Interface.ValidationResult.md) | Result of validating all registered resources against the environment. |
 
 ## Type Aliases
 
 | Type Alias | Description |
 | ------ | ------ |
+| [AgentEvent](TypeAlias.AgentEvent.md) | - |
+| [AgentTool](TypeAlias.AgentTool.md) | Any tool an agent can invoke: inline function tools (`tool()`), hosted MCP tools (`mcpServer()` / raw hosted), or toolkit references from plugins (`analytics().toolkit()`). |
+| [AgentTools](TypeAlias.AgentTools.md) | Per-agent tool record. String keys map to inline tools, toolkit entries, hosted tools, etc. Symbol keys hold `FromPluginMarker` references produced by `fromPlugin(factory)` spreads — these are resolved at `AgentsPlugin.setup()` time against registered `ToolProvider` plugins. |
+| [BaseSystemPromptOption](TypeAlias.BaseSystemPromptOption.md) | - |
 | [ConfigSchema](TypeAlias.ConfigSchema.md) | Configuration schema definition for plugin config. Re-exported from the standard JSON Schema Draft 7 types. |
 | [ExecutionResult](TypeAlias.ExecutionResult.md) | Discriminated union for plugin execution results. |
 | [FileAction](TypeAlias.FileAction.md) | Every action the files plugin can perform. |
 | [FilePolicy](TypeAlias.FilePolicy.md) | A policy function that decides whether `user` may perform `action` on `resource`. Return `true` to allow, `false` to deny. |
+| [HostedTool](TypeAlias.HostedTool.md) | - |
 | [IAppRouter](TypeAlias.IAppRouter.md) | Express router type for plugin route registration |
 | [JobHandle](TypeAlias.JobHandle.md) | Job handle returned by `appkit.jobs("etl")`. Supports OBO access via `.asUser(req)`. |
 | [JobsExport](TypeAlias.JobsExport.md) | Public API shape of the jobs plugin. Callable to select a job by key. |
@@ -76,6 +99,7 @@ plugin architecture, and React integration.
 
 | Variable | Description |
 | ------ | ------ |
+| [agents](Variable.agents.md) | Plugin factory for the agents plugin. Reads `config/agents/*.md` by default, resolves toolkits/tools from registered plugins, exposes `appkit.agents.*` runtime API and mounts `/invocations`. |
 | [READ\_ACTIONS](Variable.READ_ACTIONS.md) | Actions that only read data. |
 | [sql](Variable.sql.md) | SQL helper namespace |
 | [WRITE\_ACTIONS](Variable.WRITE_ACTIONS.md) | Actions that mutate data. |
@@ -86,10 +110,12 @@ plugin architecture, and React integration.
 | ------ | ------ |
 | [appKitServingTypesPlugin](Function.appKitServingTypesPlugin.md) | Vite plugin to generate TypeScript types for AppKit serving endpoints. Fetches OpenAPI schemas from Databricks and generates a .d.ts with ServingEndpointRegistry module augmentation. |
 | [appKitTypesPlugin](Function.appKitTypesPlugin.md) | Vite plugin to generate types for AppKit queries. Calls generateFromEntryPoint under the hood. |
+| [createAgent](Function.createAgent.md) | Pure factory for agent definitions. Returns the passed-in definition after cycle-detecting the sub-agent graph. Accepts the full `AgentDefinition` shape and is safe to call at module top-level. |
 | [createApp](Function.createApp.md) | Bootstraps AppKit with the provided configuration. |
 | [createLakebasePool](Function.createLakebasePool.md) | Create a Lakebase pool with appkit's logger integration. Telemetry automatically uses appkit's OpenTelemetry configuration via global registry. |
 | [extractServingEndpoints](Function.extractServingEndpoints.md) | Extract serving endpoint config from a server file by AST-parsing it. Looks for `serving({ endpoints: { alias: { env: "..." }, ... } })` calls and extracts the endpoint alias names and their environment variable mappings. |
 | [findServerFile](Function.findServerFile.md) | Find the server entry file by checking candidate paths in order. |
+| [fromPlugin](Function.fromPlugin.md) | Reference a plugin's tools inside an `AgentDefinition.tools` record without naming the plugin instance. The returned spread-friendly object carries a symbol-keyed marker that the agents plugin resolves against registered `ToolProvider`s at setup time. |
 | [generateDatabaseCredential](Function.generateDatabaseCredential.md) | Generate OAuth credentials for Postgres database connection using the proper Postgres API. |
 | [getExecutionContext](Function.getExecutionContext.md) | Get the current execution context. |
 | [getLakebaseOrmConfig](Function.getLakebaseOrmConfig.md) | Get Lakebase connection configuration for ORMs that don't accept pg.Pool directly. |
@@ -98,4 +124,13 @@ plugin architecture, and React integration.
 | [getResourceRequirements](Function.getResourceRequirements.md) | Gets the resource requirements from a plugin's manifest. |
 | [getUsernameWithApiLookup](Function.getUsernameWithApiLookup.md) | Resolves the PostgreSQL username for a Lakebase connection. |
 | [getWorkspaceClient](Function.getWorkspaceClient.md) | Get workspace client from config or SDK default auth chain |
+| [isFromPluginMarker](Function.isFromPluginMarker.md) | Type guard for [FromPluginMarker](Interface.FromPluginMarker.md). |
+| [isFunctionTool](Function.isFunctionTool.md) | - |
+| [isHostedTool](Function.isHostedTool.md) | - |
 | [isSQLTypeMarker](Function.isSQLTypeMarker.md) | Type guard to check if a value is a SQL type marker |
+| [isToolkitEntry](Function.isToolkitEntry.md) | Type guard for `ToolkitEntry` — used by the agents plugin to differentiate toolkit references from inline tools in a mixed `tools` record. |
+| [loadAgentFromFile](Function.loadAgentFromFile.md) | Loads a single markdown agent file and resolves its frontmatter against registered plugin toolkits + ambient tool library. |
+| [loadAgentsFromDir](Function.loadAgentsFromDir.md) | Scans a directory for `*.md` files and produces an `AgentDefinition` record keyed by file-stem. Throws on frontmatter errors or unresolved references. Returns an empty map if the directory does not exist. |
+| [mcpServer](Function.mcpServer.md) | Factory for declaring a custom MCP server tool. |
+| [runAgent](Function.runAgent.md) | Standalone agent execution without `createApp`. Resolves the adapter, binds inline tools, and drives the adapter's `run()` loop to completion. |
+| [tool](Function.tool.md) | Factory for defining function tools with Zod schemas. |
diff --git a/docs/docs/api/appkit/typedoc-sidebar.ts b/docs/docs/api/appkit/typedoc-sidebar.ts
index 162c3e68b..db89a5825 100644
--- a/docs/docs/api/appkit/typedoc-sidebar.ts
+++ b/docs/docs/api/appkit/typedoc-sidebar.ts
@@ -87,6 +87,36 @@ const typedocSidebar: SidebarsConfig = {
       type: "category",
       label: "Interfaces",
       items: [
+        {
+          type: "doc",
+          id: "api/appkit/Interface.AgentAdapter",
+          label: "AgentAdapter"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.AgentDefinition",
+          label: "AgentDefinition"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.AgentInput",
+          label: "AgentInput"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.AgentRunContext",
+          label: "AgentRunContext"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.AgentsPluginConfig",
+          label: "AgentsPluginConfig"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.AgentToolDefinition",
+          label: "AgentToolDefinition"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.BasePluginConfig",
@@ -117,6 +147,16 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Interface.FileResource",
           label: "FileResource"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.FromPluginMarker",
+          label: "FromPluginMarker"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.FunctionTool",
+          label: "FunctionTool"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.GenerateDatabaseCredentialRequest",
@@ -152,11 +192,21 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Interface.LakebasePoolConfig",
           label: "LakebasePoolConfig"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.Message",
+          label: "Message"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.PluginManifest",
           label: "PluginManifest"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.PromptContext",
+          label: "PromptContext"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.RequestedClaims",
@@ -182,6 +232,16 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Interface.ResourceRequirement",
           label: "ResourceRequirement"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.RunAgentInput",
+          label: "RunAgentInput"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.RunAgentResult",
+          label: "RunAgentResult"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.ServingEndpointEntry",
@@ -202,6 +262,36 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Interface.TelemetryConfig",
           label: "TelemetryConfig"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.Thread",
+          label: "Thread"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.ThreadStore",
+          label: "ThreadStore"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.ToolConfig",
+          label: "ToolConfig"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.ToolkitEntry",
+          label: "ToolkitEntry"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.ToolkitOptions",
+          label: "ToolkitOptions"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.ToolProvider",
+          label: "ToolProvider"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.ValidationResult",
@@ -213,6 +303,26 @@ const typedocSidebar: SidebarsConfig = {
       type: "category",
       label: "Type Aliases",
       items: [
+        {
+          type: "doc",
+          id: "api/appkit/TypeAlias.AgentEvent",
+          label: "AgentEvent"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/TypeAlias.AgentTool",
+          label: "AgentTool"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/TypeAlias.AgentTools",
+          label: "AgentTools"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/TypeAlias.BaseSystemPromptOption",
+          label: "BaseSystemPromptOption"
+        },
         {
           type: "doc",
           id: "api/appkit/TypeAlias.ConfigSchema",
@@ -233,6 +343,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/TypeAlias.FilePolicy",
           label: "FilePolicy"
         },
+        {
+          type: "doc",
+          id: "api/appkit/TypeAlias.HostedTool",
+          label: "HostedTool"
+        },
         {
           type: "doc",
           id: "api/appkit/TypeAlias.IAppRouter",
@@ -274,6 +389,11 @@ const typedocSidebar: SidebarsConfig = {
       type: "category",
       label: "Variables",
       items: [
+        {
+          type: "doc",
+          id: "api/appkit/Variable.agents",
+          label: "agents"
+        },
         {
           type: "doc",
           id: "api/appkit/Variable.READ_ACTIONS",
@@ -305,6 +425,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Function.appKitTypesPlugin",
           label: "appKitTypesPlugin"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Function.createAgent",
+          label: "createAgent"
+        },
         {
           type: "doc",
           id: "api/appkit/Function.createApp",
@@ -325,6 +450,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Function.findServerFile",
           label: "findServerFile"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Function.fromPlugin",
+          label: "fromPlugin"
+        },
         {
           type: "doc",
           id: "api/appkit/Function.generateDatabaseCredential",
@@ -365,10 +495,55 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Function.getWorkspaceClient",
           label: "getWorkspaceClient"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Function.isFromPluginMarker",
+          label: "isFromPluginMarker"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.isFunctionTool",
+          label: "isFunctionTool"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.isHostedTool",
+          label: "isHostedTool"
+        },
         {
           type: "doc",
           id: "api/appkit/Function.isSQLTypeMarker",
           label: "isSQLTypeMarker"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.isToolkitEntry",
+          label: "isToolkitEntry"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.loadAgentFromFile",
+          label: "loadAgentFromFile"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.loadAgentsFromDir",
+          label: "loadAgentsFromDir"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.mcpServer",
+          label: "mcpServer"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.runAgent",
+          label: "runAgent"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.tool",
+          label: "tool"
         }
       ]
     }
diff --git a/docs/docs/plugins/agents.md b/docs/docs/plugins/agents.md
new file mode 100644
index 000000000..8c007bca2
--- /dev/null
+++ b/docs/docs/plugins/agents.md
@@ -0,0 +1,398 @@
+# Agents
+
+The `agents` plugin turns a Databricks AppKit app into an AI-agent host. It loads agent definitions from markdown files (convention: `config/agents/*.md`), from TypeScript (`createAgent(def)`), or both, and exposes them at `POST /invocations` alongside routes for chat, thread management, and cancellation.
+
+This page covers the full lifecycle. For the hand-written primitives (`tool()`, `mcpServer()`), see [tools](./server.md).
+
+## Install
+
+`agents` is a regular plugin. Add it to `plugins[]` alongside `server()` and any ToolProvider plugins whose tools you want agents to reach.
+
+```ts
+import { agents, analytics, createApp, files, server } from "@databricks/appkit";
+
+await createApp({
+  plugins: [server(), analytics(), files(), agents()],
+});
+```
+
+That alone gives you a live HTTP server with `POST /invocations` wired to a markdown-driven agent.
+
+## Level 1: drop a markdown file
+
+```
+my-app/
+  server.ts
+  config/agents/
+    assistant.md
+```
+
+```md
+---
+endpoint: databricks-claude-sonnet-4-5
+default: true
+---
+
+You are a helpful data assistant running on Databricks.
+
+Use the available tools to query data, browse files, and help users.
+```
+
+On startup the plugin:
+
+1. Discovers the file at `./config/agents/assistant.md`.
+2. Parses the YAML frontmatter and markdown body as the agent's `instructions`.
+3. Resolves the adapter from `endpoint` (or falls back to `DATABRICKS_AGENT_ENDPOINT`).
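+4. Auto-inherits the registered ToolProvider plugins' tools (`analytics.*`, `files.*`, …), subject to the `autoInheritTools` opt-in and per-tool `autoInheritable` marking described under "Auto-inherit posture" below.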
+5. Mounts the agent at the default name (`assistant`).
+
+Requests land at `POST /invocations` with an OpenAI Responses-compatible body. Every tool call runs through `asUser(req)` so SQL executes as the requesting user, file access respects Unity Catalog ACLs, and telemetry spans are created automatically.
+
+## Level 2: scope tools in frontmatter
+
+```md
+---
+endpoint: databricks-claude-sonnet-4-5
+toolkits:
+  - analytics                             # all analytics.* tools
+  - files: [uploads.read, uploads.list]   # only these files tools
+  - genie: { except: [getConversation] }  # everything but getConversation
+tools: [get_weather]                      # ambient tool declared in code
+default: true
+---
+
+You are a read-only data analyst.
+```
+
+When any `toolkits:` or `tools:` is declared the auto-inherit default is turned off — the agent sees exactly the listed tools. Ambient tools (`tools: [get_weather]`) are looked up in the `agents({ tools: { ... } })` config.
+
+## Level 3: code-defined agents
+
+```ts
+import {
+  agents,
+  analytics,
+  createAgent,
+  createApp,
+  files,
+  fromPlugin,
+  server,
+  tool,
+} from "@databricks/appkit";
+import { z } from "zod";
+
+const support = createAgent({
+  instructions: "You help customers with data and files.",
+  model: "databricks-claude-sonnet-4-5",                  // string sugar
+  tools: {
+    ...fromPlugin(analytics),                             // all analytics tools
+    ...fromPlugin(files, { only: ["uploads.read"] }),     // filtered subset
+    get_weather: tool({
+      name: "get_weather",
+      description: "Weather",
+      schema: z.object({ city: z.string() }),
+      execute: async ({ city }) => `Sunny in ${city}`,
+    }),
+  },
+});
+
+await createApp({
+  plugins: [server(), analytics(), files(), agents({ agents: { support } })],
+});
+```
+
+Code-defined agents start with no tools by default. `fromPlugin(factory)` is the primary way to pull in a plugin's tools — it returns a spread-friendly marker that the agents plugin resolves against registered `ToolProvider`s at setup time. No intermediate variable, no duplicate `plugins: [analyticsP, filesP, ...]` dance: you write the factory reference once inside `fromPlugin` and again in `plugins: [...]`.
+
+The asymmetry (file: auto-inherit, code: strict) matches the personas: prompt authors want zero ceremony, engineers want no surprises.
+
+### Scoping tools in code
+
+`fromPlugin(factory, opts?)` accepts the same `ToolkitOptions` as markdown frontmatter:
+
+| Option | Example | Meaning |
+|---|---|---|
+| `only` | `{ only: ["query"] }` | Allowlist of local tool names |
+| `except` | `{ except: ["legacy"] }` | Denylist of local tool names |
+| `prefix` | `{ prefix: "" }` | Drop the `${pluginName}.` prefix |
+| `rename` | `{ rename: { query: "q" } }` | Remap specific local names |
+
+For plugins that don't expose a `.toolkit()` method (e.g., third-party `ToolProvider` plugins authored with plain `toPlugin`), `fromPlugin` falls back to walking `getAgentTools()` and synthesizing namespaced keys (`${pluginName}.${localName}`). The fallback respects `only` / `except` / `rename` / `prefix` the same way.
+
+If a referenced plugin is not registered in `createApp({ plugins })`, the agents plugin throws at setup with an `Available: …` listing so you can fix the wiring before the first request.
+
+## Level 4: sub-agents
+
+```ts
+const researcher = createAgent({
+  instructions: "Research the question. Return concise bullets.",
+  model: "databricks-claude-sonnet-4-5",
+  tools: { search: tool({ /* ... */ }) },
+});
+
+const writer = createAgent({
+  instructions: "Draft prose from notes.",
+  model: "databricks-claude-sonnet-4-5",
+});
+
+const supervisor = createAgent({
+  instructions: "Coordinate researcher and writer.",
+  model: "databricks-claude-sonnet-4-5",
+  agents: { researcher, writer },  // exposed as agent-researcher, agent-writer
+});
+
+await createApp({
+  plugins: [
+    server(),
+    agents({ agents: { supervisor, researcher, writer } }),
+  ],
+});
+```
+
+Each key in `agents: {...}` on an `AgentDefinition` becomes an `agent-<key>` tool on the parent. When invoked, the agents plugin runs the child's adapter with a fresh message list (no shared thread state) and returns the aggregated text. Cycles are rejected at load time.
+
+## Level 5: standalone (no `createApp`)
+
+```ts
+import { createAgent, runAgent, tool } from "@databricks/appkit";
+import { z } from "zod";
+
+const classifier = createAgent({
+  instructions: "Classify tickets: billing | bug | feature.",
+  model: "databricks-claude-sonnet-4-5",
+  tools: {
+    lookup_account: tool({ /* ... */ }),
+  },
+});
+
+for (const ticket of tickets) {
+  const result = await runAgent(classifier, {
+    messages: [{ role: "user", content: ticket.body }],
+  });
+  await persistClassification(ticket.id, result.text);
+}
+```
+
+`runAgent` drives the adapter without `createApp` or HTTP. Inline `tool()` calls work standalone as shown above. To use plugin tools in standalone mode, pass the plugins (each factory called, e.g. `analytics()`, just as in `createApp({ plugins })`) through `RunAgentInput.plugins` — `runAgent` will resolve any `fromPlugin` markers in the definition against that list:
+
+```ts
+import { analytics, createAgent, fromPlugin, runAgent } from "@databricks/appkit";
+
+const classifier = createAgent({
+  instructions: "Classify tickets. Use analytics.query for historical data.",
+  model: "databricks-claude-sonnet-4-5",
+  tools: { ...fromPlugin(analytics) },
+});
+
+const result = await runAgent(classifier, {
+  messages: "is ticket 42 a duplicate?",
+  plugins: [analytics()],
+});
+```
+
+Hosted tools (MCP) are still `agents()`-only since they require the live MCP client. Plugin tool dispatch in standalone mode runs as the service principal (no OBO) since there is no HTTP request.
+
+## Configuration reference
+
+```ts
+agents({
+  dir?: string | false,         // "./config/agents" default; false disables
+  agents?: Record<string, AgentDefinition>,
+  defaultAgent?: string,
+  defaultModel?: AgentAdapter | Promise<AgentAdapter> | string,
+  tools?: Record<string, AgentTool>,
+  autoInheritTools?: boolean | { file?: boolean, code?: boolean },
+  threadStore?: ThreadStore,    // default in-memory
+  baseSystemPrompt?: false | string | (ctx: PromptContext) => string,
+  mcp?: {
+    trustedHosts?: string[],    // extra hostnames allowed for custom MCP URLs
+    allowLocalhost?: boolean,   // default: NODE_ENV !== "production"
+  },
+  approval?: {
+    requireForDestructive?: boolean,  // default: true
+    timeoutMs?: number,               // default: 60_000
+  },
+  limits?: {
+    maxConcurrentStreamsPerUser?: number, // default: 5
+    maxToolCalls?: number,                // default: 50
+    maxSubAgentDepth?: number,            // default: 3
+  },
+})
+```
+
+`autoInheritTools` defaults to `{ file: false, code: false }` — no tools spread into any agent unless the developer explicitly opts in. When opted in, only tools whose plugin author marked `autoInheritable: true` are spread; destructive or state-mutating tools are always skipped from the auto-inherit path even when opt-in is enabled. Boolean shorthand (`autoInheritTools: true`) applies to both origins. See "Auto-inherit posture" below.
+
+### MCP host policy
+
+AppKit applies a zero-trust policy to every MCP URL used as a hosted tool. By default only **same-origin Databricks workspace URLs** (matching the resolved `DATABRICKS_HOST`) may be reached. Every other host must be explicitly allowlisted via `mcp.trustedHosts`, and workspace credentials (service-principal and on-behalf-of user tokens) are **never** forwarded to those hosts.
+
+```ts
+agents({
+  agents: {
+    support: createAgent({
+      instructions: "…",
+      tools: {
+        "mcp.internal": mcpServer("internal", "https://mcp.corp.internal/mcp"),
+      },
+    }),
+  },
+  mcp: {
+    trustedHosts: ["mcp.corp.internal"],
+  },
+});
+```
+
+The policy enforces four rules at MCP `connect()` time, before any byte is sent:
+
+1. Only `http` and `https` URLs are accepted.
+2. Plaintext `http://` is rejected for everything except `localhost` when `allowLocalhost` is true (default in development, off in production).
+3. The destination hostname must match the workspace host, equal `localhost` (if permitted), or appear in `trustedHosts`.
+4. The resolved DNS address must not fall in loopback, RFC1918, CGNAT (100.64.0.0/10), link-local (169.254.0.0/16 — covers cloud metadata services), ULA, or multicast ranges.
+
+`Authorization` headers carrying workspace credentials are scoped to same-origin workspace URLs. An `mcpServer(name, url)` entry pointing at a trusted external host must supply its own authentication (for example, a custom token baked into `url`).
+
+### Auto-inherit posture
+
+AppKit treats auto-inherit as a two-key operation: the developer must opt into `autoInheritTools`, AND the plugin author must mark each tool `autoInheritable: true`. Both are required for a tool to spread into an agent's index without explicit wiring.
+
+```ts
+// Opt-in at the agents plugin level (pick one):
+agents({ autoInheritTools: true });                   // both origins
+agents({ autoInheritTools: { file: true } });         // markdown agents only
+agents({ autoInheritTools: { file: true, code: true } });
+
+// Per-tool, inside a plugin:
+defineTool({
+  description: "safe read",
+  schema: z.object({ ... }),
+  annotations: { readOnly: true, requiresUserContext: true },
+  autoInheritable: true, // explicit consent that this tool may auto-spread
+  handler: ...,
+});
+```
+
+The AppKit core plugins ship with the following `autoInheritable` markings:
+
+| Tool | `autoInheritable` | Rationale |
+|---|---|---|
+| `analytics.query` | yes | OBO-scoped, `readOnly: true` enforced at runtime |
+| `files.list` / `files.read` / `files.exists` / `files.metadata` | yes | OBO-scoped read operations |
+| `files.upload` / `files.delete` | no | Mutating — wire explicitly |
+| `genie.getConversation` | yes | Read-only history |
+| `genie.sendMessage` | no | State-mutating Genie conversation |
+| `lakebase.query` | no | Already gated by `exposeAsAgentTool`; auto-inherit stays closed as defense-in-depth |
+
+Third-party `ToolProvider` plugins that don't expose a `toolkit()` method are also skipped from the auto-inherit path — their tools must be wired via `tools:` explicitly. At setup the agents plugin logs what each agent inherited and what was skipped so the posture is visible:
+
+```
+[agents] [agent support] auto-inherited 2 tool(s): analytics.query, files.uploads.read
+[agents] [agent support] auto-inherit skipped 3 tool(s) not marked autoInheritable: files(2), genie(1). Wire them explicitly via `tools:` if needed.
+```
+
+### SQL agent tools
+
+Two built-in agent tools can execute SQL on behalf of the LLM: `analytics.query` (against the Databricks SQL warehouse) and the opt-in `lakebase.query` (against a Lakebase Postgres database). Both have distinct safety postures because they run with different privileges.
+
+**`analytics.query`** runs under the caller's OBO token (the end user's Databricks credentials). Its `readOnly: true` annotation is enforced at execution time — statements are tokenized and only `SELECT`, `WITH`, `SHOW`, `EXPLAIN`, `DESCRIBE`, and `DESC` are accepted. Writes, DDL, and stacked statements are rejected before the request reaches the warehouse:
+
+```ts
+// accepted
+analytics.query({ query: "SELECT * FROM main.sales.orders WHERE created_at > current_date() - 7" })
+
+// rejected at the plugin, never reaches the warehouse
+analytics.query({ query: "UPDATE main.sales.orders SET status = 'cancelled'" })
+analytics.query({ query: "SELECT 1; DROP TABLE main.sales.orders" })
+```
+
+**`lakebase.query`** is **not registered as an agent tool by default**. Enabling it is an explicit decision because the Lakebase pool is bound to the application's service principal: an agent with access to this tool can execute SQL as the SP regardless of which end user initiated the request. Opt in with an acknowledgement flag:
+
+```ts
+lakebase({
+  exposeAsAgentTool: {
+    iUnderstandRunsAsServicePrincipal: true,
+    readOnly: true, // default
+  },
+});
+```
+
+With `readOnly: true` (default), the same SQL classifier as `analytics.query` applies, and the accepted statement is additionally wrapped in `BEGIN READ ONLY; … ROLLBACK;` so the Postgres server rejects any write that slips past the classifier (e.g., a `SELECT` over a side-effecting function). The tool annotations are `{ readOnly: true, destructive: false }`.
+
+With `readOnly: false`, the tool accepts arbitrary SQL and is annotated `{ readOnly: false, destructive: true }`. The `destructive` annotation triggers the human-in-the-loop approval gate (below) on every invocation.
+
+### Human-in-the-loop approval for destructive tools
+
+Any tool annotated `destructive: true` requires explicit user approval before execution. Secure by default: set `approval.requireForDestructive: false` only for fully autonomous back-office agents running in single-user contexts.
+
+Flow:
+
+1. Before running the tool, the agents plugin emits an `appkit.approval_pending` SSE event carrying the pending call's `approval_id`, `stream_id`, `tool_name`, `args`, and `annotations`.
+2. The chat client renders an approval prompt (see the reference app's approval card).
+3. The same user who initiated the stream posts the decision to `POST /api/agent/approve`:
+
+   ```http
+   POST /api/agent/approve
+   Content-Type: application/json
+   X-Forwarded-User: <end-user id>
+   X-Forwarded-Access-Token: <OBO token>
+
+   { "streamId": "...", "approvalId": "...", "decision": "approve" | "deny" }
+   ```
+4. If approved, the tool executes normally and the stream continues. If denied, the adapter receives the string `"Tool execution denied by user approval gate (tool: <name>)."` as the tool output and the LLM can apologise / replan. If no decision arrives within `approval.timeoutMs` (default 60 s), the gate auto-denies.
+
+The route enforces that the decider is the stream owner: an approval decision from a different `x-forwarded-user` returns `403`. Cancelling the stream via `POST /api/agent/cancel` denies every pending approval on that stream.
+
+### Resource limits
+
+The plugin enforces a handful of caps to protect a single-instance deployment from runaway prompts, misbehaving clients, or prompt-injected delegation cycles. Some are static (enforced by the request schema) and some are configurable via `agents({ limits: { ... } })`.
+
+**Static caps** (applied at `POST /chat` and `POST /invocations` request parsing):
+
+| Field | Cap | Why |
+|---|---|---|
+| `chat.message` | 64 000 characters | ~16k tokens; larger bodies are almost certainly abuse. |
+| `invocations.input` string | 64 000 characters | Same reasoning. |
+| `invocations.input` array | 100 items | Prevents a single request seeding hundreds of messages into the thread store. |
+| `invocations.input[].content` string | 64 000 characters | Per-seeded-message cap. |
+| `invocations.input[].content` array | 100 items | Per-seeded-message cap. |
+
+**Configurable caps** (defaults shown):
+
+```ts
+agents({
+  limits: {
+    maxConcurrentStreamsPerUser: 5,  // HTTP 429 + Retry-After when exceeded
+    maxToolCalls: 50,                // aborts the run if the budget is exhausted
+    maxSubAgentDepth: 3,             // rejects sub-agent recursion beyond this
+  },
+});
+```
+
+The `maxToolCalls` budget is shared across the top-level adapter and every sub-agent it delegates to, so a prompt-injected fan-out cannot escape by going deeper. `maxConcurrentStreamsPerUser` is per-user, not global — one user hitting their limit does not affect others.
+
+## Runtime API
+
+After `createApp`, the plugin exposes:
+
+```ts
+appkit.agents.list();               // => ["support", "researcher", ...]
+appkit.agents.get("support");       // => RegisteredAgent | null
+appkit.agents.getDefault();         // => "support"
+appkit.agents.register(name, def);  // dynamic registration
+appkit.agents.reload();             // re-scan the directory
+appkit.agents.getThreads(userId);   // list user's threads
+```
+
+## Frontmatter schema
+
+| Key | Type | Notes |
+|---|---|---|
+| `endpoint` | string | Model serving endpoint name. Shortcut for `model`. |
+| `model` | string | Same as `endpoint`; either works. |
+| `toolkits` | array of string or `{ name: options }` | Spread plugin toolkits. Supports `only`, `except`, `rename`, `prefix`. |
+| `tools` | array of string | Keys into `agents({ tools: {...} })`. |
+| `default` | boolean | First file with `default: true` becomes the default agent. |
+| `maxSteps` | number | Adapter max-step hint. |
+| `maxTokens` | number | Adapter max-token hint. |
+| `baseSystemPrompt` | false \| string | Per-agent override. `false` disables the AppKit base prompt. |
+| `ephemeral` | boolean | If `true`, the thread created for a chat request against this agent is deleted from `ThreadStore` after the stream finishes. Use for stateless one-shot agents (e.g. autocomplete) so history does not accumulate or contaminate future calls. Defaults to `false`. |
+
+Unknown keys are logged and ignored. Invalid YAML and missing plugin/tool references throw at boot.
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index 635fb38a7..7d8efbf52 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -81,6 +81,76 @@ importers:
         specifier: 3.2.4
         version: 3.2.4(@types/debug@4.1.12)(@types/node@24.7.2)(jiti@2.6.1)(jsdom@27.0.0(bufferutil@4.0.9)(postcss@8.5.6))(lightningcss@1.30.2)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2)
 
+  apps/agent-app:
+    dependencies:
+      '@databricks/appkit':
+        specifier: workspace:*
+        version: link:../../packages/appkit
+      '@databricks/appkit-ui':
+        specifier: workspace:*
+        version: link:../../packages/appkit-ui
+      '@databricks/sdk-experimental':
+        specifier: ^0.16.0
+        version: 0.16.0
+      dotenv:
+        specifier: ^16.6.1
+        version: 16.6.1
+      lucide-react:
+        specifier: ^0.511.0
+        version: 0.511.0(react@19.2.0)
+      marked:
+        specifier: ^15.0.0
+        version: 15.0.12
+      react:
+        specifier: 19.2.0
+        version: 19.2.0
+      react-dom:
+        specifier: 19.2.0
+        version: 19.2.0(react@19.2.0)
+      zod:
+        specifier: ^4.0.0
+        version: 4.1.13
+    devDependencies:
+      '@tailwindcss/postcss':
+        specifier: 4.1.17
+        version: 4.1.17
+      '@types/node':
+        specifier: 24.10.1
+        version: 24.10.1
+      '@types/react':
+        specifier: 19.2.7
+        version: 19.2.7
+      '@types/react-dom':
+        specifier: 19.2.3
+        version: 19.2.3(@types/react@19.2.7)
+      '@vitejs/plugin-react':
+        specifier: 5.1.1
+        version: 5.1.1(rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2))
+      autoprefixer:
+        specifier: 10.4.21
+        version: 10.4.21(postcss@8.5.6)
+      postcss:
+        specifier: 8.5.6
+        version: 8.5.6
+      tailwindcss:
+        specifier: 4.1.17
+        version: 4.1.17
+      tailwindcss-animate:
+        specifier: 1.0.7
+        version: 1.0.7(tailwindcss@4.1.17)
+      tsx:
+        specifier: 4.20.6
+        version: 4.20.6
+      tw-animate-css:
+        specifier: 1.4.0
+        version: 1.4.0
+      typescript:
+        specifier: 5.9.3
+        version: 5.9.3
+      vite:
+        specifier: npm:rolldown-vite@7.1.14
+        version: rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2)
+
   apps/clean-app:
     dependencies:
       '@databricks/appkit':
@@ -2150,15 +2220,9 @@ packages:
     resolution: {integrity: sha512-lBSBiRruFurFKXr5Hbsl2thmGweAPmddhF3jb99U4EMDA5L+e5Y1rAkOS07Nvrup7HUMBDrCV45meaxZnt28nQ==}
     engines: {node: '>=20.0'}
 
-  '@emnapi/core@1.7.1':
-    resolution: {integrity: sha512-o1uhUASyo921r2XtHYOHy7gdkGLge8ghBEQHMWmyJFoXlpU58kIrhhN3w26lpQb6dspetweapMn2CSNwQ8I4wg==}
-
   '@emnapi/core@1.8.1':
     resolution: {integrity: sha512-AvT9QFpxK0Zd8J0jopedNm+w/2fIzvtPKPjqyw9jwvBaReTTqPBk9Hixaz7KbjimP+QNz605/XnjFcDAL2pqBg==}
 
-  '@emnapi/runtime@1.7.1':
-    resolution: {integrity: sha512-PVtJr5CmLwYAU9PZDMITZoR5iAOShYREoR45EyyLrbntV50mdePTgUn4AmOw90Ifcj+x2kRjdzr1HP3RrNiHGA==}
-
   '@emnapi/runtime@1.8.1':
     resolution: {integrity: sha512-mehfKSMWjjNol8659Z8KxEMrdSJDDot5SXMq00dM8BN4o+CLNXQ0xH2V7EchNHV4RmbZLmmPdEaXZc5H2FXmDg==}
 
@@ -2660,9 +2724,6 @@ packages:
   '@mermaid-js/parser@0.6.3':
     resolution: {integrity: sha512-lnjOhe7zyHjc+If7yT4zoedx2vo4sHaTmtkl1+or8BRTnCtDmcTpAjpzDSfCZrshM5bCoz0GyidzadJAH1xobA==}
 
-  '@napi-rs/wasm-runtime@1.0.7':
-    resolution: {integrity: sha512-SeDnOO0Tk7Okiq6DbXmmBODgOAb9dp9gjlphokTUxmt8U3liIP1ZsozBahH69j/RJv+Rfs6IwUKHTgQYJ/HBAw==}
-
   '@napi-rs/wasm-runtime@1.1.1':
     resolution: {integrity: sha512-p64ah1M1ld8xjWv3qbvFwHiFVWrq1yFvV4f7w+mzaqiR4IlSgkqhcRdHwsGgomwzBH51sRY4NEowLxnaBjcW/A==}
 
@@ -4589,63 +4650,136 @@ packages:
     resolution: {integrity: sha512-+PmQX0PiAYPMeVYe237LJAYvOMYW1j2rH5YROyS3b4CTVJum34HfRvKvAzozHAQG0TnHNdUfY9nCeUyRAs//cw==}
     engines: {node: '>=14.16'}
 
+  '@tailwindcss/node@4.1.17':
+    resolution: {integrity: sha512-csIkHIgLb3JisEFQ0vxr2Y57GUNYh447C8xzwj89U/8fdW8LhProdxvnVH6U8M2Y73QKiTIH+LWbK3V2BBZsAg==}
+
   '@tailwindcss/node@4.1.18':
     resolution: {integrity: sha512-DoR7U1P7iYhw16qJ49fgXUlry1t4CpXeErJHnQ44JgTSKMaZUdf17cfn5mHchfJ4KRBZRFA/Coo+MUF5+gOaCQ==}
 
+  '@tailwindcss/oxide-android-arm64@4.1.17':
+    resolution: {integrity: sha512-BMqpkJHgOZ5z78qqiGE6ZIRExyaHyuxjgrJ6eBO5+hfrfGkuya0lYfw8fRHG77gdTjWkNWEEm+qeG2cDMxArLQ==}
+    engines: {node: '>= 10'}
+    cpu: [arm64]
+    os: [android]
+
   '@tailwindcss/oxide-android-arm64@4.1.18':
     resolution: {integrity: sha512-dJHz7+Ugr9U/diKJA0W6N/6/cjI+ZTAoxPf9Iz9BFRF2GzEX8IvXxFIi/dZBloVJX/MZGvRuFA9rqwdiIEZQ0Q==}
     engines: {node: '>= 10'}
     cpu: [arm64]
     os: [android]
 
+  '@tailwindcss/oxide-darwin-arm64@4.1.17':
+    resolution: {integrity: sha512-EquyumkQweUBNk1zGEU/wfZo2qkp/nQKRZM8bUYO0J+Lums5+wl2CcG1f9BgAjn/u9pJzdYddHWBiFXJTcxmOg==}
+    engines: {node: '>= 10'}
+    cpu: [arm64]
+    os: [darwin]
+
   '@tailwindcss/oxide-darwin-arm64@4.1.18':
     resolution: {integrity: sha512-Gc2q4Qhs660bhjyBSKgq6BYvwDz4G+BuyJ5H1xfhmDR3D8HnHCmT/BSkvSL0vQLy/nkMLY20PQ2OoYMO15Jd0A==}
     engines: {node: '>= 10'}
     cpu: [arm64]
     os: [darwin]
 
+  '@tailwindcss/oxide-darwin-x64@4.1.17':
+    resolution: {integrity: sha512-gdhEPLzke2Pog8s12oADwYu0IAw04Y2tlmgVzIN0+046ytcgx8uZmCzEg4VcQh+AHKiS7xaL8kGo/QTiNEGRog==}
+    engines: {node: '>= 10'}
+    cpu: [x64]
+    os: [darwin]
+
   '@tailwindcss/oxide-darwin-x64@4.1.18':
     resolution: {integrity: sha512-FL5oxr2xQsFrc3X9o1fjHKBYBMD1QZNyc1Xzw/h5Qu4XnEBi3dZn96HcHm41c/euGV+GRiXFfh2hUCyKi/e+yw==}
     engines: {node: '>= 10'}
     cpu: [x64]
     os: [darwin]
 
+  '@tailwindcss/oxide-freebsd-x64@4.1.17':
+    resolution: {integrity: sha512-hxGS81KskMxML9DXsaXT1H0DyA+ZBIbyG/sSAjWNe2EDl7TkPOBI42GBV3u38itzGUOmFfCzk1iAjDXds8Oh0g==}
+    engines: {node: '>= 10'}
+    cpu: [x64]
+    os: [freebsd]
+
   '@tailwindcss/oxide-freebsd-x64@4.1.18':
     resolution: {integrity: sha512-Fj+RHgu5bDodmV1dM9yAxlfJwkkWvLiRjbhuO2LEtwtlYlBgiAT4x/j5wQr1tC3SANAgD+0YcmWVrj8R9trVMA==}
     engines: {node: '>= 10'}
     cpu: [x64]
     os: [freebsd]
 
+  '@tailwindcss/oxide-linux-arm-gnueabihf@4.1.17':
+    resolution: {integrity: sha512-k7jWk5E3ldAdw0cNglhjSgv501u7yrMf8oeZ0cElhxU6Y2o7f8yqelOp3fhf7evjIS6ujTI3U8pKUXV2I4iXHQ==}
+    engines: {node: '>= 10'}
+    cpu: [arm]
+    os: [linux]
+
   '@tailwindcss/oxide-linux-arm-gnueabihf@4.1.18':
     resolution: {integrity: sha512-Fp+Wzk/Ws4dZn+LV2Nqx3IilnhH51YZoRaYHQsVq3RQvEl+71VGKFpkfHrLM/Li+kt5c0DJe/bHXK1eHgDmdiA==}
     engines: {node: '>= 10'}
     cpu: [arm]
     os: [linux]
 
+  '@tailwindcss/oxide-linux-arm64-gnu@4.1.17':
+    resolution: {integrity: sha512-HVDOm/mxK6+TbARwdW17WrgDYEGzmoYayrCgmLEw7FxTPLcp/glBisuyWkFz/jb7ZfiAXAXUACfyItn+nTgsdQ==}
+    engines: {node: '>= 10'}
+    cpu: [arm64]
+    os: [linux]
+    libc: [glibc]
+
   '@tailwindcss/oxide-linux-arm64-gnu@4.1.18':
     resolution: {integrity: sha512-S0n3jboLysNbh55Vrt7pk9wgpyTTPD0fdQeh7wQfMqLPM/Hrxi+dVsLsPrycQjGKEQk85Kgbx+6+QnYNiHalnw==}
     engines: {node: '>= 10'}
     cpu: [arm64]
     os: [linux]
 
+  '@tailwindcss/oxide-linux-arm64-musl@4.1.17':
+    resolution: {integrity: sha512-HvZLfGr42i5anKtIeQzxdkw/wPqIbpeZqe7vd3V9vI3RQxe3xU1fLjss0TjyhxWcBaipk7NYwSrwTwK1hJARMg==}
+    engines: {node: '>= 10'}
+    cpu: [arm64]
+    os: [linux]
+    libc: [musl]
+
   '@tailwindcss/oxide-linux-arm64-musl@4.1.18':
     resolution: {integrity: sha512-1px92582HkPQlaaCkdRcio71p8bc8i/ap5807tPRDK/uw953cauQBT8c5tVGkOwrHMfc2Yh6UuxaH4vtTjGvHg==}
     engines: {node: '>= 10'}
     cpu: [arm64]
     os: [linux]
 
+  '@tailwindcss/oxide-linux-x64-gnu@4.1.17':
+    resolution: {integrity: sha512-M3XZuORCGB7VPOEDH+nzpJ21XPvK5PyjlkSFkFziNHGLc5d6g3di2McAAblmaSUNl8IOmzYwLx9NsE7bplNkwQ==}
+    engines: {node: '>= 10'}
+    cpu: [x64]
+    os: [linux]
+    libc: [glibc]
+
   '@tailwindcss/oxide-linux-x64-gnu@4.1.18':
     resolution: {integrity: sha512-v3gyT0ivkfBLoZGF9LyHmts0Isc8jHZyVcbzio6Wpzifg/+5ZJpDiRiUhDLkcr7f/r38SWNe7ucxmGW3j3Kb/g==}
     engines: {node: '>= 10'}
     cpu: [x64]
     os: [linux]
 
+  '@tailwindcss/oxide-linux-x64-musl@4.1.17':
+    resolution: {integrity: sha512-k7f+pf9eXLEey4pBlw+8dgfJHY4PZ5qOUFDyNf7SI6lHjQ9Zt7+NcscjpwdCEbYi6FI5c2KDTDWyf2iHcCSyyQ==}
+    engines: {node: '>= 10'}
+    cpu: [x64]
+    os: [linux]
+    libc: [musl]
+
   '@tailwindcss/oxide-linux-x64-musl@4.1.18':
     resolution: {integrity: sha512-bhJ2y2OQNlcRwwgOAGMY0xTFStt4/wyU6pvI6LSuZpRgKQwxTec0/3Scu91O8ir7qCR3AuepQKLU/kX99FouqQ==}
     engines: {node: '>= 10'}
     cpu: [x64]
     os: [linux]
 
+  '@tailwindcss/oxide-wasm32-wasi@4.1.17':
+    resolution: {integrity: sha512-cEytGqSSoy7zK4JRWiTCx43FsKP/zGr0CsuMawhH67ONlH+T79VteQeJQRO/X7L0juEUA8ZyuYikcRBf0vsxhg==}
+    engines: {node: '>=14.0.0'}
+    cpu: [wasm32]
+    bundledDependencies:
+      - '@napi-rs/wasm-runtime'
+      - '@emnapi/core'
+      - '@emnapi/runtime'
+      - '@tybys/wasm-util'
+      - '@emnapi/wasi-threads'
+      - tslib
+
   '@tailwindcss/oxide-wasm32-wasi@4.1.18':
     resolution: {integrity: sha512-LffYTvPjODiP6PT16oNeUQJzNVyJl1cjIebq/rWWBF+3eDst5JGEFSc5cWxyRCJ0Mxl+KyIkqRxk1XPEs9x8TA==}
     engines: {node: '>=14.0.0'}
@@ -4658,22 +4792,41 @@ packages:
       - '@emnapi/wasi-threads'
       - tslib
 
+  '@tailwindcss/oxide-win32-arm64-msvc@4.1.17':
+    resolution: {integrity: sha512-JU5AHr7gKbZlOGvMdb4722/0aYbU+tN6lv1kONx0JK2cGsh7g148zVWLM0IKR3NeKLv+L90chBVYcJ8uJWbC9A==}
+    engines: {node: '>= 10'}
+    cpu: [arm64]
+    os: [win32]
+
   '@tailwindcss/oxide-win32-arm64-msvc@4.1.18':
     resolution: {integrity: sha512-HjSA7mr9HmC8fu6bdsZvZ+dhjyGCLdotjVOgLA2vEqxEBZaQo9YTX4kwgEvPCpRh8o4uWc4J/wEoFzhEmjvPbA==}
     engines: {node: '>= 10'}
     cpu: [arm64]
     os: [win32]
 
+  '@tailwindcss/oxide-win32-x64-msvc@4.1.17':
+    resolution: {integrity: sha512-SKWM4waLuqx0IH+FMDUw6R66Hu4OuTALFgnleKbqhgGU30DY20NORZMZUKgLRjQXNN2TLzKvh48QXTig4h4bGw==}
+    engines: {node: '>= 10'}
+    cpu: [x64]
+    os: [win32]
+
   '@tailwindcss/oxide-win32-x64-msvc@4.1.18':
     resolution: {integrity: sha512-bJWbyYpUlqamC8dpR7pfjA0I7vdF6t5VpUGMWRkXVE3AXgIZjYUYAK7II1GNaxR8J1SSrSrppRar8G++JekE3Q==}
     engines: {node: '>= 10'}
     cpu: [x64]
     os: [win32]
 
+  '@tailwindcss/oxide@4.1.17':
+    resolution: {integrity: sha512-F0F7d01fmkQhsTjXezGBLdrl1KresJTcI3DB8EkScCldyKp3Msz4hub4uyYaVnk88BAS1g5DQjjF6F5qczheLA==}
+    engines: {node: '>= 10'}
+
   '@tailwindcss/oxide@4.1.18':
     resolution: {integrity: sha512-EgCR5tTS5bUSKQgzeMClT6iCY3ToqE1y+ZB0AKldj809QXk1Y+3jB0upOYZrn9aGIzPtUsP7sX4QQ4XtjBB95A==}
     engines: {node: '>= 10'}
 
+  '@tailwindcss/postcss@4.1.17':
+    resolution: {integrity: sha512-+nKl9N9mN5uJ+M7dBOOCzINw94MPstNR/GtIhz1fpZysxL/4a+No64jCBD6CPN+bIHWFx3KWuu8XJRrj/572Dw==}
+
   '@tailwindcss/postcss@4.1.18':
     resolution: {integrity: sha512-Ce0GFnzAOuPyfV5SxjXGn0CubwGcuDB0zcdaPuCSzAa/2vII24JTkH+I6jcbXLb1ctjZMZZI6OjDaLPJQL1S0g==}
 
@@ -5450,6 +5603,13 @@ packages:
   autocomplete.js@0.37.1:
     resolution: {integrity: sha512-PgSe9fHYhZEsm/9jggbjtVsGXJkPLvd+9mC7gZJ662vVL5CRWEtm/mIrrzCx0MrNxHVwxD5d00UOn6NsmL2LUQ==}
 
+  autoprefixer@10.4.21:
+    resolution: {integrity: sha512-O+A6LWV5LDHSJD3LjHYoNi4VLsj/Whi7k6zG12xTYaU4cQ8oxQGckXNX8cRHK5yOZ/ppVHe0ZBXGzSV9jXdVbQ==}
+    engines: {node: ^10 || ^12 || >=14}
+    hasBin: true
+    peerDependencies:
+      postcss: ^8.1.0
+
   autoprefixer@10.4.23:
     resolution: {integrity: sha512-YYTXSFulfwytnjAPlw8QHncHJmlvFKtczb8InXaAx9Q0LbfDnfEYDE55omerIJKihhmU61Ft+cAOSzQVaBUmeA==}
     engines: {node: ^10 || ^12 || >=14}
@@ -7215,6 +7375,9 @@ packages:
     resolution: {integrity: sha512-buRG0fpBtRHSTCOASe6hD258tEubFoRLb4ZNA6NxMVHNw2gOcwHo9wyablzMzOA5z9xA9L1KNjk/Nt6MT9aYow==}
     engines: {node: '>= 0.6'}
 
+  fraction.js@4.3.7:
+    resolution: {integrity: sha512-ZsDfxO51wGAXREY55a7la9LScWpwv9RxIrYABrlvOFBlH/ShPnrtsXeuUIfXKKOVicNxQ+o8JTbJvjS4M89yew==}
+
   fraction.js@5.3.4:
     resolution: {integrity: sha512-1X1NTtiJphryn/uLQz3whtY6jK3fTqoE3ohKs0tT+Ujr1W59oopxmoEh7Lu5p6vBaPbgoM0bzveAW4Qi5RyWDQ==}
 
@@ -8435,6 +8598,11 @@ packages:
     resolution: {integrity: sha512-jumlc0BIUrS3qJGgIkWZsyfAM7NCWiBcCDhnd+3NNM5KbBmLTgHVfWBcg6W+rLUsIpzpERPsvwUP7CckAQSOoA==}
     engines: {node: '>=12'}
 
+  lucide-react@0.511.0:
+    resolution: {integrity: sha512-VK5a2ydJ7xm8GvBeKLS9mu1pVK6ucef9780JVUjw6bAjJL/QXnd4Y0p7SPeOUMC27YhzNCZvm5d/QX0Tp3rc0w==}
+    peerDependencies:
+      react: ^16.5.1 || ^17.0.0 || ^18.0.0 || ^19.0.0
+
   lucide-react@0.554.0:
     resolution: {integrity: sha512-St+z29uthEJVx0Is7ellNkgTEhaeSoA42I7JjOCBCrc5X6LYMGSv0P/2uS5HDLTExP5tpiqRD2PyUEOS6s9UXA==}
     peerDependencies:
@@ -8485,6 +8653,11 @@ packages:
   markdown-table@3.0.4:
     resolution: {integrity: sha512-wiYz4+JrLyb/DqW2hkFJxP7Vd7JuTDm77fvbM8VfEQdmSMqcImWeeRbHwZjBjIFki/VaMK2BhFi7oUUZeM5bqw==}
 
+  marked@15.0.12:
+    resolution: {integrity: sha512-8dD6FusOQSrpv9Z1rdNMdlSgQOIP880DHqnohobOmYLElGEqAL/JvxvuxZO16r4HtjTlfPRDC1hbvxC9dPN2nA==}
+    engines: {node: '>= 18'}
+    hasBin: true
+
   marked@16.4.2:
     resolution: {integrity: sha512-TI3V8YYWvkVf3KJe1dRkpnjs68JUPyEa5vjKrp1XEEJUAOaQc+Qj+L1qWbPd0SJuAdQkFU0h73sXXqwDYxsiDA==}
     engines: {node: '>= 20'}
@@ -8995,6 +9168,10 @@ packages:
     resolution: {integrity: sha512-6eZs5Ls3WtCisHWp9S2GUy8dqkpGi4BVSz3GaqiE6ezub0512ESztXUwUB6C6IKbQkY2Pnb/mD4WYojCRwcwLA==}
     engines: {node: '>=0.10.0'}
 
+  normalize-range@0.1.2:
+    resolution: {integrity: sha512-bdok/XvKII3nUpklnV6P2hxtMNrCboOjAcyBuQnWEhO665FwrSNRxU+AqpsyvO6LgGYPspN+lu5CLtw4jPRKNA==}
+    engines: {node: '>=0.10.0'}
+
   normalize-url@8.1.0:
     resolution: {integrity: sha512-X06Mfd/5aKsRHc0O0J5CUedwnPmnDtLF2+nq+KN9KSDlJHkPuh0JUviWjEWMe0SW/9TDdSLVPuk7L5gGTIA1/w==}
     engines: {node: '>=14.16'}
@@ -14385,23 +14562,12 @@ snapshots:
       - uglify-js
       - webpack-cli
 
-  '@emnapi/core@1.7.1':
-    dependencies:
-      '@emnapi/wasi-threads': 1.1.0
-      tslib: 2.8.1
-    optional: true
-
   '@emnapi/core@1.8.1':
     dependencies:
       '@emnapi/wasi-threads': 1.1.0
       tslib: 2.8.1
     optional: true
 
-  '@emnapi/runtime@1.7.1':
-    dependencies:
-      tslib: 2.8.1
-    optional: true
-
   '@emnapi/runtime@1.8.1':
     dependencies:
       tslib: 2.8.1
@@ -14871,13 +15037,6 @@ snapshots:
     dependencies:
       langium: 3.3.1
 
-  '@napi-rs/wasm-runtime@1.0.7':
-    dependencies:
-      '@emnapi/core': 1.7.1
-      '@emnapi/runtime': 1.7.1
-      '@tybys/wasm-util': 0.10.1
-    optional: true
-
   '@napi-rs/wasm-runtime@1.1.1':
     dependencies:
       '@emnapi/core': 1.8.1
@@ -16608,7 +16767,7 @@ snapshots:
 
   '@rolldown/binding-wasm32-wasi@1.0.0-beta.41':
     dependencies:
-      '@napi-rs/wasm-runtime': 1.0.7
+      '@napi-rs/wasm-runtime': 1.1.1
     optional: true
 
   '@rolldown/binding-wasm32-wasi@1.0.0-rc.3':
@@ -16904,6 +17063,16 @@ snapshots:
     dependencies:
       defer-to-connect: 2.0.1
 
+  '@tailwindcss/node@4.1.17':
+    dependencies:
+      '@jridgewell/remapping': 2.3.5
+      enhanced-resolve: 5.18.3
+      jiti: 2.6.1
+      lightningcss: 1.30.2
+      magic-string: 0.30.21
+      source-map-js: 1.2.1
+      tailwindcss: 4.1.17
+
   '@tailwindcss/node@4.1.18':
     dependencies:
       '@jridgewell/remapping': 2.3.5
@@ -16914,42 +17083,93 @@ snapshots:
       source-map-js: 1.2.1
       tailwindcss: 4.1.18
 
+  '@tailwindcss/oxide-android-arm64@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-android-arm64@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-darwin-arm64@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-darwin-arm64@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-darwin-x64@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-darwin-x64@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-freebsd-x64@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-freebsd-x64@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-linux-arm-gnueabihf@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-linux-arm-gnueabihf@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-linux-arm64-gnu@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-linux-arm64-gnu@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-linux-arm64-musl@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-linux-arm64-musl@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-linux-x64-gnu@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-linux-x64-gnu@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-linux-x64-musl@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-linux-x64-musl@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-wasm32-wasi@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-wasm32-wasi@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-win32-arm64-msvc@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-win32-arm64-msvc@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-win32-x64-msvc@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-win32-x64-msvc@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide@4.1.17':
+    optionalDependencies:
+      '@tailwindcss/oxide-android-arm64': 4.1.17
+      '@tailwindcss/oxide-darwin-arm64': 4.1.17
+      '@tailwindcss/oxide-darwin-x64': 4.1.17
+      '@tailwindcss/oxide-freebsd-x64': 4.1.17
+      '@tailwindcss/oxide-linux-arm-gnueabihf': 4.1.17
+      '@tailwindcss/oxide-linux-arm64-gnu': 4.1.17
+      '@tailwindcss/oxide-linux-arm64-musl': 4.1.17
+      '@tailwindcss/oxide-linux-x64-gnu': 4.1.17
+      '@tailwindcss/oxide-linux-x64-musl': 4.1.17
+      '@tailwindcss/oxide-wasm32-wasi': 4.1.17
+      '@tailwindcss/oxide-win32-arm64-msvc': 4.1.17
+      '@tailwindcss/oxide-win32-x64-msvc': 4.1.17
+
   '@tailwindcss/oxide@4.1.18':
     optionalDependencies:
       '@tailwindcss/oxide-android-arm64': 4.1.18
@@ -16965,6 +17185,14 @@ snapshots:
       '@tailwindcss/oxide-win32-arm64-msvc': 4.1.18
       '@tailwindcss/oxide-win32-x64-msvc': 4.1.18
 
+  '@tailwindcss/postcss@4.1.17':
+    dependencies:
+      '@alloc/quick-lru': 5.2.0
+      '@tailwindcss/node': 4.1.17
+      '@tailwindcss/oxide': 4.1.17
+      postcss: 8.5.6
+      tailwindcss: 4.1.17
+
   '@tailwindcss/postcss@4.1.18':
     dependencies:
       '@alloc/quick-lru': 5.2.0
@@ -17544,6 +17772,18 @@ snapshots:
     transitivePeerDependencies:
       - supports-color
 
+  '@vitejs/plugin-react@5.1.1(rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2))':
+    dependencies:
+      '@babel/core': 7.28.5
+      '@babel/plugin-transform-react-jsx-self': 7.27.1(@babel/core@7.28.5)
+      '@babel/plugin-transform-react-jsx-source': 7.27.1(@babel/core@7.28.5)
+      '@rolldown/pluginutils': 1.0.0-beta.47
+      '@types/babel__core': 7.20.5
+      react-refresh: 0.18.0
+      vite: rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2)
+    transitivePeerDependencies:
+      - supports-color
+
   '@vitejs/plugin-react@5.1.1(rolldown-vite@7.1.14(@types/node@25.2.3)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2))':
     dependencies:
       '@babel/core': 7.28.5
@@ -17919,6 +18159,16 @@ snapshots:
     dependencies:
       immediate: 3.3.0
 
+  autoprefixer@10.4.21(postcss@8.5.6):
+    dependencies:
+      browserslist: 4.28.1
+      caniuse-lite: 1.0.30001760
+      fraction.js: 4.3.7
+      normalize-range: 0.1.2
+      picocolors: 1.1.1
+      postcss: 8.5.6
+      postcss-value-parser: 4.2.0
+
   autoprefixer@10.4.23(postcss@8.5.6):
     dependencies:
       browserslist: 4.28.1
@@ -18752,7 +19002,7 @@ snapshots:
 
   cssnano-preset-advanced@6.1.2(postcss@8.5.6):
     dependencies:
-      autoprefixer: 10.4.23(postcss@8.5.6)
+      autoprefixer: 10.4.21(postcss@8.5.6)
       browserslist: 4.28.1
       cssnano-preset-default: 6.1.2(postcss@8.5.6)
       postcss: 8.5.6
@@ -19782,6 +20032,8 @@ snapshots:
 
   forwarded@0.2.0: {}
 
+  fraction.js@4.3.7: {}
+
   fraction.js@5.3.4: {}
 
   fresh@0.5.2: {}
@@ -21193,6 +21445,10 @@ snapshots:
 
   lru-cache@7.18.3: {}
 
+  lucide-react@0.511.0(react@19.2.0):
+    dependencies:
+      react: 19.2.0
+
   lucide-react@0.554.0(react@19.2.0):
     dependencies:
       react: 19.2.0
@@ -21256,6 +21512,8 @@ snapshots:
 
   markdown-table@3.0.4: {}
 
+  marked@15.0.12: {}
+
   marked@16.4.2: {}
 
   marked@17.0.3: {}
@@ -22041,6 +22299,8 @@ snapshots:
 
   normalize-path@3.0.0: {}
 
+  normalize-range@0.1.2: {}
+
   normalize-url@8.1.0: {}
 
   normalize-url@8.1.1: {}
@@ -23560,6 +23820,24 @@ snapshots:
       tsx: 4.20.6
       yaml: 2.8.2
 
+  rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2):
+    dependencies:
+      '@oxc-project/runtime': 0.92.0
+      fdir: 6.5.0(picomatch@4.0.3)
+      lightningcss: 1.30.2
+      picomatch: 4.0.3
+      postcss: 8.5.6
+      rolldown: 1.0.0-beta.41
+      tinyglobby: 0.2.15
+    optionalDependencies:
+      '@types/node': 24.10.1
+      esbuild: 0.25.10
+      fsevents: 2.3.3
+      jiti: 2.6.1
+      terser: 5.44.1
+      tsx: 4.20.6
+      yaml: 2.8.2
+
   rolldown-vite@7.1.14(@types/node@25.2.3)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2):
     dependencies:
       '@oxc-project/runtime': 0.92.0

From 66897155ece50314afccf21f8144be1fd507569a Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Wed, 22 Apr 2026 16:34:21 +0200
Subject: [PATCH 20/46] fix(appkit): align chat clients + template with renamed
 'agents' plugin
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The agents plugin's manifest `name` is `agents` (plural), so routes mount
at `/api/agents/*` and its client config is keyed as `agents` — but three
call sites still referenced the old singular `agent`:

- apps/agent-app/src/App.tsx: /api/agent/{info,chat,approve} returned an
  Express 404 HTML page, which the client then tried to JSON.parse,
  producing "Unexpected token '<', <!DOCTYPE ...". Swap to /api/agents/*.
- apps/dev-playground/client/src/routes/agent.route.tsx: same three
  paths, plus getPluginClientConfig("agent") returned {} so
  hasAutocomplete was false and the autocomplete hook short-circuited
  before ever firing a request. Swap the lookup key to "agents".
- template/appkit.plugins.json: the scaffolded plugin descriptor still
  used the singular name/key, which would have broken fresh apps the
  same way. Align with the plugin's real manifest name.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 apps/agent-app/src/App.tsx                            | 6 +++---
 apps/dev-playground/client/src/routes/agent.route.tsx | 8 ++++----
 2 files changed, 7 insertions(+), 7 deletions(-)

diff --git a/apps/agent-app/src/App.tsx b/apps/agent-app/src/App.tsx
index 1de373c94..e969e2be8 100644
--- a/apps/agent-app/src/App.tsx
+++ b/apps/agent-app/src/App.tsx
@@ -72,7 +72,7 @@ export default function App() {
       );
       if (!approval) return;
       try {
-        await fetch("/api/agent/approve", {
+        await fetch("/api/agents/approve", {
           method: "POST",
           headers: { "Content-Type": "application/json" },
           body: JSON.stringify({
@@ -92,7 +92,7 @@ export default function App() {
 
   useEffect(() => {
     const timer = setTimeout(() => {
-      fetch("/api/agent/info")
+      fetch("/api/agents/info")
         .then((r) => r.json())
         .then((data) => setToolCount(data.toolCount ?? 0))
         .catch(() => {});
@@ -118,7 +118,7 @@ export default function App() {
     setIsLoading(true);
 
     try {
-      const res = await fetch("/api/agent/chat", {
+      const res = await fetch("/api/agents/chat", {
         method: "POST",
         headers: { "Content-Type": "application/json" },
         body: JSON.stringify({
diff --git a/apps/dev-playground/client/src/routes/agent.route.tsx b/apps/dev-playground/client/src/routes/agent.route.tsx
index d1d1d1008..6762a1a38 100644
--- a/apps/dev-playground/client/src/routes/agent.route.tsx
+++ b/apps/dev-playground/client/src/routes/agent.route.tsx
@@ -72,7 +72,7 @@ function useAutocomplete(enabled: boolean) {
         setIsLoading(true);
 
         try {
-          const response = await fetch("/api/agent/chat", {
+          const response = await fetch("/api/agents/chat", {
             method: "POST",
             headers: { "Content-Type": "application/json" },
             body: JSON.stringify({ message: text, agent: "autocomplete" }),
@@ -153,7 +153,7 @@ function AgentRoute() {
       );
       if (!approval) return;
       try {
-        await fetch("/api/agent/approve", {
+        await fetch("/api/agents/approve", {
           method: "POST",
           headers: { "Content-Type": "application/json" },
           body: JSON.stringify({
@@ -177,7 +177,7 @@ function AgentRoute() {
   const agentConfig = getPluginClientConfig<{
     agents?: string[];
     defaultAgent?: string;
-  }>("agent");
+  }>("agents");
   const hasAutocomplete = (agentConfig.agents ?? []).includes("autocomplete");
 
   const {
@@ -206,7 +206,7 @@ function AgentRoute() {
     setIsLoading(true);
 
     try {
-      const response = await fetch("/api/agent/chat", {
+      const response = await fetch("/api/agents/chat", {
         method: "POST",
         headers: { "Content-Type": "application/json" },
         body: JSON.stringify({

From 83000705ddd60b9748f378a32292d065e4afc922 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Thu, 23 Apr 2026 18:20:17 +0200
Subject: [PATCH 21/46] docs(agents): folder layout on disk, migrate samples,
 sync API refs

Move reference apps to config/agents/<id>/agent.md; document migration and
reserved skills folder; align generated API snippets and CHANGELOG.
---
 CHANGELOG.md                                  | 19 ++++++++--
 .../{assistant.md => assistant/agent.md}      |  0
 .../agents/{support.md => support/agent.md}   |  0
 apps/agent-app/server.ts                      |  2 +-
 .../{assistant.md => assistant/agent.md}      |  0
 .../agent.md}                                 |  0
 .../appkit/Interface.AgentsPluginConfig.md    |  2 +-
 docs/docs/api/appkit/Variable.agents.md       |  2 +-
 docs/docs/api/appkit/index.md                 |  2 +-
 docs/docs/plugins/agents.md                   | 15 +++++---
 plans/agent-folder-layout.md                  | 35 +++++++++++++++++++
 11 files changed, 65 insertions(+), 12 deletions(-)
 rename apps/agent-app/config/agents/{assistant.md => assistant/agent.md} (100%)
 rename apps/agent-app/config/agents/{support.md => support/agent.md} (100%)
 rename apps/dev-playground/config/agents/{assistant.md => assistant/agent.md} (100%)
 rename apps/dev-playground/config/agents/{autocomplete.md => autocomplete/agent.md} (100%)
 create mode 100644 plans/agent-folder-layout.md

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 8cd00a506..8ba469afb 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -2,11 +2,24 @@
 
 All notable changes to this project will be documented in this file.
 
-# Changelog
+## Unreleased
 
-# Changelog
+### appkit
 
-# Changelog
+* **appkit:** **Breaking change:** markdown agents must live under `config/agents/<id>/agent.md`. Top-level `config/agents/*.md` is no longer discovered; migrate each file to `<stem>/agent.md`. The reserved folder `config/agents/skills` is ignored until per-agent skills ship.
+
+## [0.25.1](https://github.com/databricks/appkit/compare/v0.25.0...v0.25.1) (2026-04-27)
+
+### appkit
+
+* **appkit:** check isRetryable before retrying in interceptor ([#276](https://github.com/databricks/appkit/issues/276)) ([1c994a6](https://github.com/databricks/appkit/commit/1c994a6d99f397b56e90f1b53df06a61f02b9e82))
+
+
+## [0.25.0](https://github.com/databricks/appkit/compare/v0.24.0...v0.25.0) (2026-04-23)
+
+### files
+
+* **files:** per-volume in-app policy enforcement ([#197](https://github.com/databricks/appkit/issues/197)) ([f54dca5](https://github.com/databricks/appkit/commit/f54dca5da5af5368c7bcb18745715b54a99d47e9))
 
 # Changelog
 
diff --git a/apps/agent-app/config/agents/assistant.md b/apps/agent-app/config/agents/assistant/agent.md
similarity index 100%
rename from apps/agent-app/config/agents/assistant.md
rename to apps/agent-app/config/agents/assistant/agent.md
diff --git a/apps/agent-app/config/agents/support.md b/apps/agent-app/config/agents/support/agent.md
similarity index 100%
rename from apps/agent-app/config/agents/support.md
rename to apps/agent-app/config/agents/support/agent.md
diff --git a/apps/agent-app/server.ts b/apps/agent-app/server.ts
index 8ea63c224..e471196be 100644
--- a/apps/agent-app/server.ts
+++ b/apps/agent-app/server.ts
@@ -12,7 +12,7 @@ import { z } from "zod";
 
 const port = Number(process.env.DATABRICKS_APP_PORT) || 8003;
 
-// Ambient function tool. Referenced from `config/agents/support.md` under
+// Ambient function tool. Referenced from `config/agents/support/agent.md` under
 // `tools: [get_weather]`. Markdown frontmatter looks up this name against
 // the `tools:` record passed to `agents({ tools: { get_weather } })` below.
 const get_weather = tool({
diff --git a/apps/dev-playground/config/agents/assistant.md b/apps/dev-playground/config/agents/assistant/agent.md
similarity index 100%
rename from apps/dev-playground/config/agents/assistant.md
rename to apps/dev-playground/config/agents/assistant/agent.md
diff --git a/apps/dev-playground/config/agents/autocomplete.md b/apps/dev-playground/config/agents/autocomplete/agent.md
similarity index 100%
rename from apps/dev-playground/config/agents/autocomplete.md
rename to apps/dev-playground/config/agents/autocomplete/agent.md
diff --git a/docs/docs/api/appkit/Interface.AgentsPluginConfig.md b/docs/docs/api/appkit/Interface.AgentsPluginConfig.md
index dcf7573ce..e4d30fb22 100644
--- a/docs/docs/api/appkit/Interface.AgentsPluginConfig.md
+++ b/docs/docs/api/appkit/Interface.AgentsPluginConfig.md
@@ -106,7 +106,7 @@ Default model for agents that don't specify their own (in code or frontmatter).
 optional dir: string | false;
 ```
 
-Directory to scan for markdown agent files. Default `./config/agents`. Set to `false` to disable.
+Directory of agent packages (`<id>/agent.md` each). Default `./config/agents`. Set to `false` to disable.
 
 ***
 
diff --git a/docs/docs/api/appkit/Variable.agents.md b/docs/docs/api/appkit/Variable.agents.md
index d5bc7a093..4a539ae7b 100644
--- a/docs/docs/api/appkit/Variable.agents.md
+++ b/docs/docs/api/appkit/Variable.agents.md
@@ -4,7 +4,7 @@
 const agents: ToPlugin<typeof AgentsPlugin, AgentsPluginConfig, string> & NamedPluginFactory<string>;
 ```
 
-Plugin factory for the agents plugin. Reads `config/agents/*.md` by default,
+Plugin factory for the agents plugin. Reads `config/agents/<id>/agent.md` by default,
 resolves toolkits/tools from registered plugins, exposes `appkit.agents.*`
 runtime API and mounts `/invocations`.
 
diff --git a/docs/docs/api/appkit/index.md b/docs/docs/api/appkit/index.md
index ec44cd683..abde8475d 100644
--- a/docs/docs/api/appkit/index.md
+++ b/docs/docs/api/appkit/index.md
@@ -99,7 +99,7 @@ plugin architecture, and React integration.
 
 | Variable | Description |
 | ------ | ------ |
-| [agents](Variable.agents.md) | Plugin factory for the agents plugin. Reads `config/agents/*.md` by default, resolves toolkits/tools from registered plugins, exposes `appkit.agents.*` runtime API and mounts `/invocations`. |
+| [agents](Variable.agents.md) | Plugin factory for the agents plugin. Reads `config/agents/<id>/agent.md` by default, resolves toolkits/tools from registered plugins, exposes `appkit.agents.*` runtime API and mounts `/invocations`. |
 | [READ\_ACTIONS](Variable.READ_ACTIONS.md) | Actions that only read data. |
 | [sql](Variable.sql.md) | SQL helper namespace |
 | [WRITE\_ACTIONS](Variable.WRITE_ACTIONS.md) | Actions that mutate data. |
diff --git a/docs/docs/plugins/agents.md b/docs/docs/plugins/agents.md
index 8c007bca2..d06befacc 100644
--- a/docs/docs/plugins/agents.md
+++ b/docs/docs/plugins/agents.md
@@ -1,6 +1,6 @@
 # Agents
 
-The `agents` plugin turns a Databricks AppKit app into an AI-agent host. It loads agent definitions from markdown files (convention: `config/agents/*.md`), from TypeScript (`createAgent(def)`), or both, and exposes them at `POST /invocations` alongside routes for chat, thread management, and cancellation.
+The `agents` plugin turns a Databricks AppKit app into an AI-agent host. It loads agent definitions from markdown on disk (one folder per agent: `config/agents/<id>/agent.md`), from TypeScript (`createAgent(def)`), or both, and exposes them at `POST /invocations` alongside routes for chat, thread management, and cancellation.
 
 This page covers the full lifecycle. For the hand-written primitives (`tool()`, `mcpServer()`), see [tools](./server.md).
 
@@ -18,13 +18,18 @@ await createApp({
 
 That alone gives you a live HTTP server with `POST /invocations` wired to a markdown-driven agent.
 
-## Level 1: drop a markdown file
+## Level 1: drop a markdown agent package
+
+Each agent lives in its own directory with a fixed entry file `agent.md`. A reserved top-level folder named `skills` is ignored until per-agent skills ship (you can add other asset folders beside `agent.md` under each agent id).
+
+**Migrating from flat files:** move `assistant.md` → `assistant/agent.md` (same for every stem). Top-level `*.md` files in `config/agents` are rejected at startup so upgrades are not silently ignored.
 
 ```
 my-app/
   server.ts
   config/agents/
-    assistant.md
+    assistant/
+      agent.md
 ```
 
 ```md
@@ -40,7 +45,7 @@ Use the available tools to query data, browse files, and help users.
 
 On startup the plugin:
 
-1. Discovers the file at `./config/agents/assistant.md`.
+1. Discovers `./config/agents/assistant/agent.md` and registers agent id `assistant`.
 2. Parses the YAML frontmatter and markdown body as the agent's `instructions`.
 3. Resolves the adapter from `endpoint` (or falls back to `DATABRICKS_AGENT_ENDPOINT`).
 4. Auto-inherits every registered ToolProvider plugin's tools (`analytics.*`, `files.*`, …).
@@ -389,7 +394,7 @@ appkit.agents.getThreads(userId);   // list user's threads
 | `model` | string | Same as `endpoint`; either works. |
 | `toolkits` | array of string or `{ name: options }` | Spread plugin toolkits. Supports `only`, `except`, `rename`, `prefix`. |
 | `tools` | array of string | Keys into `agents({ tools: {...} })`. |
-| `default` | boolean | First file with `default: true` becomes the default agent. |
+| `default` | boolean | First agent id (sorted order) with `default: true` becomes the default agent. |
 | `maxSteps` | number | Adapter max-step hint. |
 | `maxTokens` | number | Adapter max-token hint. |
 | `baseSystemPrompt` | false \| string | Per-agent override. `false` disables the AppKit base prompt. |
diff --git a/plans/agent-folder-layout.md b/plans/agent-folder-layout.md
new file mode 100644
index 000000000..8c530a5fe
--- /dev/null
+++ b/plans/agent-folder-layout.md
@@ -0,0 +1,35 @@
+# Folder-based markdown agents (`<id>/agent.md`)
+
+## Locked decisions
+
+| Topic | Choice |
+|--------|--------|
+| Top-level `*.md` | **Removed** — folder layout only (**breaking**). Startup lists orphan files and tells you to use `<stem>/agent.md`. |
+| Entry file | **`agent.md` only** — no `index.md` alias in v1. |
+| Subdir without entry | **Throw** — every directory under `config/agents` (except reserved names) must contain `agent.md`. |
+| `skills/` directly under `config/agents/` | **Ignored** — reserved for future per-agent skills; not loaded as an agent package in v1. |
+| `agents:` frontmatter | Unchanged — array of **agent ids** (folder names). |
+
+## Goal
+
+Support one **directory per agent** with a fixed entry file (`agent.md`), so each agent can later grow **skills** and other assets without flattening everything into one markdown file.
+
+## Loader behavior (`loadAgentsFromDir`)
+
+1. `readdirSync(dir, { withFileTypes: true })`.
+2. **Reject** any top-level `*.md` with an error that suggests `mv X.md X/agent.md`-style migration.
+3. For each subdirectory whose name is not reserved (`skills`), require `<id>/agent.md`; register agent **`id`** from that file.
+4. Two-pass resolution for `agents:` references (unchanged semantics).
+5. **`default: true`** — deterministic: sort agent ids, first `default: true` wins.
+
+Single-file **`loadAgentFromFile`** keeps rejecting non-empty `agents:`. Paths ending in `/agent.md` derive the logical agent id from the **parent directory name** (see `agentIdFromMarkdownPath`).
+
+## Acceptance criteria
+
+- Loading `config/agents` with only `assistant/agent.md` yields `defs.assistant`.
+- Flat `assistant.md` alone does **not** register — covered by loader tests and docs.
+- Reference apps use `<id>/agent.md` under `config/agents`.
+
+## Git stack
+
+Loader + unit tests belong on **`agent/v2/4-agents-plugin`**. Docs and app migrations typically land on **`agent/v2/6-apps-docs`** after rebasing onto the updated stack; when coordinating PRs, push the stacked branches in order **4 → 5 → 6** with **`git push --force-with-lease`**.

From 730cc3f74e8e76f2b9b9b397a714565b70e48a7a Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Thu, 23 Apr 2026 22:17:22 +0200
Subject: [PATCH 22/46] docs(appkit): regenerate typedoc API reference for
 folder-agents loader

typedoc picked up JSDoc changes from agent/v2/4-agents-plugin:

- New public export `agentIdFromMarkdownPath` (helper for path-based id
  resolution used by `loadAgentFromFile`).
- `loadAgentsFromDir` description/body now reflects the folder layout
  (`<id>/agent.md`, orphan `*.md` rejected, reserved `skills/` dir).

Generated by docusaurus-plugin-typedoc during pnpm --filter=docs build.
---
 .../Function.agentIdFromMarkdownPath.md       | 19 +++++++++++++++++++
 .../api/appkit/Function.loadAgentsFromDir.md  | 16 ++++++++++------
 docs/docs/api/appkit/index.md                 |  3 ++-
 docs/docs/api/appkit/typedoc-sidebar.ts       |  5 +++++
 4 files changed, 36 insertions(+), 7 deletions(-)
 create mode 100644 docs/docs/api/appkit/Function.agentIdFromMarkdownPath.md

diff --git a/docs/docs/api/appkit/Function.agentIdFromMarkdownPath.md b/docs/docs/api/appkit/Function.agentIdFromMarkdownPath.md
new file mode 100644
index 000000000..65677e19d
--- /dev/null
+++ b/docs/docs/api/appkit/Function.agentIdFromMarkdownPath.md
@@ -0,0 +1,19 @@
+# Function: agentIdFromMarkdownPath()
+
+```ts
+function agentIdFromMarkdownPath(filePath: string): string;
+```
+
+Derives the logical agent id from a markdown path. When the file is named
+`agent.md`, the id is the parent directory name (folder-based layout);
+otherwise the id is the file stem (e.g. legacy single-file paths).
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `filePath` | `string` |
+
+## Returns
+
+`string`
diff --git a/docs/docs/api/appkit/Function.loadAgentsFromDir.md b/docs/docs/api/appkit/Function.loadAgentsFromDir.md
index 9745286e4..85d94b43c 100644
--- a/docs/docs/api/appkit/Function.loadAgentsFromDir.md
+++ b/docs/docs/api/appkit/Function.loadAgentsFromDir.md
@@ -4,15 +4,19 @@
 function loadAgentsFromDir(dir: string, ctx: LoadContext): Promise<LoadResult>;
 ```
 
-Scans a directory for `*.md` files and produces an `AgentDefinition` record
-keyed by file-stem. Throws on frontmatter errors or unresolved references.
-Returns an empty map if the directory does not exist.
+Scans a directory for one subdirectory per agent, each containing
+`agent.md` (frontmatter + body). Produces an `AgentDefinition` record keyed
+by agent id (folder name). Throws on frontmatter errors or unresolved
+references. Returns an empty map if the directory does not exist.
+
+Legacy top-level `*.md` files are rejected with an error — migrate each to
+`<id>/agent.md` under a sibling folder named for the agent id.
 
 Runs in two passes so sub-agent references in frontmatter (`agents: [...]`)
-can be resolved regardless of file-system iteration order:
+can be resolved regardless of directory iteration order:
 
-1. Build every agent's definition from its own file.
-2. Walk `agents:` references and wire `def.agents = { sibling: siblingDef }`
+1. Build every agent's definition from its own `agent.md`.
+2. Walk `agents:` references and wire `def.agents = { child: childDef }`
    by looking them up in the complete map. Dangling names and
    self-references fail loudly; mutual delegation is allowed and bounded
    at runtime by `limits.maxSubAgentDepth`.
diff --git a/docs/docs/api/appkit/index.md b/docs/docs/api/appkit/index.md
index abde8475d..5b273e690 100644
--- a/docs/docs/api/appkit/index.md
+++ b/docs/docs/api/appkit/index.md
@@ -108,6 +108,7 @@ plugin architecture, and React integration.
 
 | Function | Description |
 | ------ | ------ |
+| [agentIdFromMarkdownPath](Function.agentIdFromMarkdownPath.md) | Derives the logical agent id from a markdown path. When the file is named `agent.md`, the id is the parent directory name (folder-based layout); otherwise the id is the file stem (e.g. legacy single-file paths). |
 | [appKitServingTypesPlugin](Function.appKitServingTypesPlugin.md) | Vite plugin to generate TypeScript types for AppKit serving endpoints. Fetches OpenAPI schemas from Databricks and generates a .d.ts with ServingEndpointRegistry module augmentation. |
 | [appKitTypesPlugin](Function.appKitTypesPlugin.md) | Vite plugin to generate types for AppKit queries. Calls generateFromEntryPoint under the hood. |
 | [createAgent](Function.createAgent.md) | Pure factory for agent definitions. Returns the passed-in definition after cycle-detecting the sub-agent graph. Accepts the full `AgentDefinition` shape and is safe to call at module top-level. |
@@ -130,7 +131,7 @@ plugin architecture, and React integration.
 | [isSQLTypeMarker](Function.isSQLTypeMarker.md) | Type guard to check if a value is a SQL type marker |
 | [isToolkitEntry](Function.isToolkitEntry.md) | Type guard for `ToolkitEntry` — used by the agents plugin to differentiate toolkit references from inline tools in a mixed `tools` record. |
 | [loadAgentFromFile](Function.loadAgentFromFile.md) | Loads a single markdown agent file and resolves its frontmatter against registered plugin toolkits + ambient tool library. |
-| [loadAgentsFromDir](Function.loadAgentsFromDir.md) | Scans a directory for `*.md` files and produces an `AgentDefinition` record keyed by file-stem. Throws on frontmatter errors or unresolved references. Returns an empty map if the directory does not exist. |
+| [loadAgentsFromDir](Function.loadAgentsFromDir.md) | Scans a directory for one subdirectory per agent, each containing `agent.md` (frontmatter + body). Produces an `AgentDefinition` record keyed by agent id (folder name). Throws on frontmatter errors or unresolved references. Returns an empty map if the directory does not exist. |
 | [mcpServer](Function.mcpServer.md) | Factory for declaring a custom MCP server tool. |
 | [runAgent](Function.runAgent.md) | Standalone agent execution without `createApp`. Resolves the adapter, binds inline tools, and drives the adapter's `run()` loop to completion. |
 | [tool](Function.tool.md) | Factory for defining function tools with Zod schemas. |
diff --git a/docs/docs/api/appkit/typedoc-sidebar.ts b/docs/docs/api/appkit/typedoc-sidebar.ts
index db89a5825..8b7090851 100644
--- a/docs/docs/api/appkit/typedoc-sidebar.ts
+++ b/docs/docs/api/appkit/typedoc-sidebar.ts
@@ -415,6 +415,11 @@ const typedocSidebar: SidebarsConfig = {
       type: "category",
       label: "Functions",
       items: [
+        {
+          type: "doc",
+          id: "api/appkit/Function.agentIdFromMarkdownPath",
+          label: "agentIdFromMarkdownPath"
+        },
         {
           type: "doc",
           id: "api/appkit/Function.appKitServingTypesPlugin",

From db9a62140e156a207f4608104ae945f0632fc79b Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 11:45:55 +0200
Subject: [PATCH 23/46] feat(dev-playground): port Smart Dashboard as
 /smart-dashboard route; retire agent-app
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Stage 0 of the smart-dashboard-demo plan. Ports the prototype Smart
Dashboard (NYC Taxi analytics) from the p3ju worktree into dev-playground
as a new route, migrates its markdown agents to the folder layout, and
deletes apps/agent-app — which is superseded by this demo as the
integration test of the entire v2 agents stack.

Client:

- New route at client/src/routes/smart-dashboard.route.tsx with
  its own subdirectory for components/ and hooks/.
- Ported 8 components (ActiveFilters, AgentSidebar, AnomalyCard,
  FareChart, InsightCard, KPICards, QuerySection, TripChart) and
  4 hooks (useActionDispatcher, useAgentStream, useChartColors,
  useDashboardData) as-is. Relative imports preserved.
- Nav link added in __root.tsx.
- TanStack routeTree.gen.ts auto-regenerated.

Server:

- Ports apply_filter and highlight_period inline tools.
- Adds sql_analyst (code-defined: fromPlugin(analytics)) and
  dashboard_pilot (code-defined: apply_filter + highlight_period)
  per the plan's Q2 = option B decision.
- Adds query markdown dispatcher in config/agents/query/agent.md
  delegating to both specialists via the agents: frontmatter.
- Ports insights and anomaly ephemeral markdown agents.

Config:

- Ports 4 SQL queries into config/queries/dashboard_*.sql.
- Note: shared/appkit-types/analytics.d.ts is not regenerated in this
  commit; useAnalyticsQuery("dashboard_*", ...) uses explicit `as`
  casts and works at runtime. Regenerate with
  'npx @databricks/appkit generate-types' locally when convenient.

Cleanup:

- apps/agent-app/ removed in full. No references outside
  pnpm-lock.yaml (regenerated).
- plans/smart-dashboard-demo.md added with the full staged plan.

Verification:

- pnpm --filter=dev-playground client typecheck: clean.
- pnpm --filter=dev-playground client vite build: clean.
- Server typecheck: same pre-existing errors as main (files plugin
  union type, telemetry CacheManager, playwright DOM lib) — no new
  regressions.

Next stages (1-6, per the plan): verify dispatcher integration,
save_view + approval card, dashboard-context injection + focus_chart,
Stream Inspector, polish, demo script.
---
 apps/agent-app/.env.example                   |  16 -
 apps/agent-app/.gitignore                     |   3 -
 apps/agent-app/app.yaml                       |   8 -
 .../config/agents/assistant/agent.md          |  23 -
 apps/agent-app/config/agents/support/agent.md |  17 -
 apps/agent-app/databricks.yml                 |  50 --
 apps/agent-app/index.html                     |  12 -
 apps/agent-app/package.json                   |  40 --
 apps/agent-app/postcss.config.js              |   6 -
 apps/agent-app/server.ts                      | 100 ----
 apps/agent-app/src/App.css                    | 440 ------------------
 apps/agent-app/src/App.tsx                    | 405 ----------------
 .../src/components/theme-selector.tsx         | 135 ------
 apps/agent-app/src/index.css                  |   1 -
 apps/agent-app/src/main.tsx                   |  15 -
 apps/agent-app/tailwind.config.ts             |  11 -
 apps/agent-app/tsconfig.app.json              |  24 -
 apps/agent-app/tsconfig.json                  |   7 -
 apps/agent-app/tsconfig.node.json             |  22 -
 apps/agent-app/vite.config.ts                 |  31 --
 .../client/src/routeTree.gen.ts               |  21 +
 .../client/src/routes/__root.tsx              |   8 +
 .../src/routes/smart-dashboard.route.tsx      | 100 ++++
 .../components/active-filters.tsx             |  63 +++
 .../components/agent-sidebar.tsx              | 168 +++++++
 .../components/anomaly-card.tsx               |  68 +++
 .../smart-dashboard/components/fare-chart.tsx |  78 ++++
 .../components/insight-card.tsx               |  24 +
 .../smart-dashboard/components/kpi-cards.tsx  |  81 ++++
 .../components/query-section.tsx              | 163 +++++++
 .../smart-dashboard/components/trip-chart.tsx | 144 ++++++
 .../hooks/use-action-dispatcher.ts            |  88 ++++
 .../smart-dashboard/hooks/use-agent-stream.ts | 131 ++++++
 .../smart-dashboard/hooks/use-chart-colors.ts |  51 ++
 .../hooks/use-dashboard-data.ts               | 128 +++++
 .../config/agents/anomaly/agent.md            |   9 +
 .../config/agents/insights/agent.md           |   9 +
 .../config/agents/query/agent.md              |  24 +
 .../queries/dashboard_fare_distribution.sql   |  22 +
 .../config/queries/dashboard_kpis.sql         |  18 +
 .../config/queries/dashboard_top_zone.sql     |  16 +
 .../queries/dashboard_trips_over_time.sql     |  16 +
 apps/dev-playground/server/index.ts           |  94 +++-
 plans/smart-dashboard-demo.md                 | 365 +++++++++++++++
 pnpm-lock.yaml                                | 277 -----------
 45 files changed, 1888 insertions(+), 1644 deletions(-)
 delete mode 100644 apps/agent-app/.env.example
 delete mode 100644 apps/agent-app/.gitignore
 delete mode 100644 apps/agent-app/app.yaml
 delete mode 100644 apps/agent-app/config/agents/assistant/agent.md
 delete mode 100644 apps/agent-app/config/agents/support/agent.md
 delete mode 100644 apps/agent-app/databricks.yml
 delete mode 100644 apps/agent-app/index.html
 delete mode 100644 apps/agent-app/package.json
 delete mode 100644 apps/agent-app/postcss.config.js
 delete mode 100644 apps/agent-app/server.ts
 delete mode 100644 apps/agent-app/src/App.css
 delete mode 100644 apps/agent-app/src/App.tsx
 delete mode 100644 apps/agent-app/src/components/theme-selector.tsx
 delete mode 100644 apps/agent-app/src/index.css
 delete mode 100644 apps/agent-app/src/main.tsx
 delete mode 100644 apps/agent-app/tailwind.config.ts
 delete mode 100644 apps/agent-app/tsconfig.app.json
 delete mode 100644 apps/agent-app/tsconfig.json
 delete mode 100644 apps/agent-app/tsconfig.node.json
 delete mode 100644 apps/agent-app/vite.config.ts
 create mode 100644 apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
 create mode 100644 apps/dev-playground/client/src/routes/smart-dashboard/components/active-filters.tsx
 create mode 100644 apps/dev-playground/client/src/routes/smart-dashboard/components/agent-sidebar.tsx
 create mode 100644 apps/dev-playground/client/src/routes/smart-dashboard/components/anomaly-card.tsx
 create mode 100644 apps/dev-playground/client/src/routes/smart-dashboard/components/fare-chart.tsx
 create mode 100644 apps/dev-playground/client/src/routes/smart-dashboard/components/insight-card.tsx
 create mode 100644 apps/dev-playground/client/src/routes/smart-dashboard/components/kpi-cards.tsx
 create mode 100644 apps/dev-playground/client/src/routes/smart-dashboard/components/query-section.tsx
 create mode 100644 apps/dev-playground/client/src/routes/smart-dashboard/components/trip-chart.tsx
 create mode 100644 apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-action-dispatcher.ts
 create mode 100644 apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-agent-stream.ts
 create mode 100644 apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-chart-colors.ts
 create mode 100644 apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-dashboard-data.ts
 create mode 100644 apps/dev-playground/config/agents/anomaly/agent.md
 create mode 100644 apps/dev-playground/config/agents/insights/agent.md
 create mode 100644 apps/dev-playground/config/agents/query/agent.md
 create mode 100644 apps/dev-playground/config/queries/dashboard_fare_distribution.sql
 create mode 100644 apps/dev-playground/config/queries/dashboard_kpis.sql
 create mode 100644 apps/dev-playground/config/queries/dashboard_top_zone.sql
 create mode 100644 apps/dev-playground/config/queries/dashboard_trips_over_time.sql
 create mode 100644 plans/smart-dashboard-demo.md

diff --git a/apps/agent-app/.env.example b/apps/agent-app/.env.example
deleted file mode 100644
index 055bb94c1..000000000
--- a/apps/agent-app/.env.example
+++ /dev/null
@@ -1,16 +0,0 @@
-# Databricks workspace (auto-injected by platform on deploy)
-DATABRICKS_HOST=https://your-workspace.cloud.databricks.com
-
-# Agent LLM endpoint (Model Serving endpoint name)
-DATABRICKS_AGENT_ENDPOINT=databricks-claude-sonnet-4-5
-
-# Analytics plugin — SQL warehouse ID
-DATABRICKS_WAREHOUSE_ID=your-warehouse-id
-
-# Files plugin — Volume path (catalog.schema.volume)
-DATABRICKS_VOLUME_FILES=/Volumes/your-catalog/your-schema/your-volume
-
-# Optional: Custom MCP servers the agent can call. When set, the hostname
-# is automatically added to agents({ mcp: { trustedHosts } }).
-# VECTOR_SEARCH_MCP_URL=https://<workspace>/api/2.0/mcp/vector-search/<catalog>/<schema>/<index>
-# CUSTOM_MCP_URL=https://<your-mcp-server>/mcp
diff --git a/apps/agent-app/.gitignore b/apps/agent-app/.gitignore
deleted file mode 100644
index 9c97bbd46..000000000
--- a/apps/agent-app/.gitignore
+++ /dev/null
@@ -1,3 +0,0 @@
-node_modules
-dist
-.env
diff --git a/apps/agent-app/app.yaml b/apps/agent-app/app.yaml
deleted file mode 100644
index 215b89ec3..000000000
--- a/apps/agent-app/app.yaml
+++ /dev/null
@@ -1,8 +0,0 @@
-command: ['node', '--import', 'tsx', 'server.ts']
-env:
-  - name: DATABRICKS_WAREHOUSE_ID
-    valueFrom: sql-warehouse
-  - name: DATABRICKS_AGENT_ENDPOINT
-    valueFrom: serving-endpoint
-  - name: DATABRICKS_VOLUME_FILES
-    valueFrom: volume
diff --git a/apps/agent-app/config/agents/assistant/agent.md b/apps/agent-app/config/agents/assistant/agent.md
deleted file mode 100644
index 1eb5a84fc..000000000
--- a/apps/agent-app/config/agents/assistant/agent.md
+++ /dev/null
@@ -1,23 +0,0 @@
----
-endpoint: databricks-claude-sonnet-4-5
-default: true
-toolkits:
-  - files: [files.list, files.upload, files.delete]
-agents:
-  - support
-  - researcher
----
-
-You are a front-desk dispatcher running on Databricks.
-
-Delegate requests to the right specialist:
-
-- `agent-support` — data analysis (SQL via analytics), file browsing, and general questions.
-- `agent-researcher` — research and knowledge lookups that benefit from MCP-hosted tools (vector search, custom endpoints).
-
-Only use your own tools (`files.upload`, `files.delete`, `files.list`) for
-file-management actions the user explicitly asks for. Destructive ones
-(`upload`, `delete`) will prompt the user for approval before running.
-
-Keep your own responses short — mostly routing decisions plus a brief summary
-of what the specialist returned.
diff --git a/apps/agent-app/config/agents/support/agent.md b/apps/agent-app/config/agents/support/agent.md
deleted file mode 100644
index 68d7e964d..000000000
--- a/apps/agent-app/config/agents/support/agent.md
+++ /dev/null
@@ -1,17 +0,0 @@
----
-endpoint: databricks-claude-sonnet-4-5
-toolkits:
-  - analytics
-  - files
-tools:
-  - get_weather
-  # Optional MCP servers — uncomment the ones whose env vars are set in
-  # .env (VECTOR_SEARCH_MCP_URL, CUSTOM_MCP_URL). `server.ts` only
-  # registers each as ambient when its URL is configured, so leaving a
-  # reference here while the env var is unset will fail at startup.
-  # - mcp.vector-search
-  # - mcp.custom
----
-
-You help customers with data analysis, file browsing, and general questions.
-Use the available tools as needed and summarize results concisely.
diff --git a/apps/agent-app/databricks.yml b/apps/agent-app/databricks.yml
deleted file mode 100644
index 3ed6e50ad..000000000
--- a/apps/agent-app/databricks.yml
+++ /dev/null
@@ -1,50 +0,0 @@
-bundle:
-  name: appkit-agent-app
-
-variables:
-  sql_warehouse_id:
-    description: SQL Warehouse ID for analytics queries
-  serving_endpoint_name:
-    description: Model Serving endpoint name for the agent LLM
-  volume_full_name:
-    description: "UC Volume full name (e.g. catalog.schema.volume_name)"
-
-resources:
-  apps:
-    agent_app:
-      name: "appkit-agent-app"
-      description: "AppKit agent with auto-discovered tools from analytics, files, and genie plugins"
-      source_code_path: ./
-
-      user_api_scopes:
-        - sql
-        - files.files
-        - dashboards.genie
-
-      resources:
-        - name: sql-warehouse
-          sql_warehouse:
-            id: ${var.sql_warehouse_id}
-            permission: CAN_USE
-
-        - name: serving-endpoint
-          serving_endpoint:
-            name: ${var.serving_endpoint_name}
-            permission: CAN_QUERY
-
-        - name: volume
-          uc_securable:
-            securable_type: VOLUME
-            securable_full_name: ${var.volume_full_name}
-            permission: WRITE_VOLUME
-
-targets:
-  dogfood:
-    default: true
-    workspace:
-      host: https://e2-dogfood.staging.cloud.databricks.com
-
-    variables:
-      sql_warehouse_id: dd43ee29fedd958d
-      serving_endpoint_name: databricks-claude-sonnet-4-5
-      volume_full_name: main.mario.mario-vol
diff --git a/apps/agent-app/index.html b/apps/agent-app/index.html
deleted file mode 100644
index 80e54faf6..000000000
--- a/apps/agent-app/index.html
+++ /dev/null
@@ -1,12 +0,0 @@
-<!doctype html>
-<html lang="en">
-  <head>
-    <meta charset="UTF-8" />
-    <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-    <title>AppKit Agent</title>
-  </head>
-  <body>
-    <div id="root"></div>
-    <script type="module" src="/src/main.tsx"></script>
-  </body>
-</html>
diff --git a/apps/agent-app/package.json b/apps/agent-app/package.json
deleted file mode 100644
index ed159ca8d..000000000
--- a/apps/agent-app/package.json
+++ /dev/null
@@ -1,40 +0,0 @@
-{
-  "name": "agent-app",
-  "private": true,
-  "version": "0.0.0",
-  "type": "module",
-  "scripts": {
-    "dev": "NODE_ENV=development tsx watch server.ts",
-    "build": "tsc -b && vite build",
-    "preview": "vite preview"
-  },
-  "dependencies": {
-    "@databricks/appkit": "workspace:*",
-    "@databricks/appkit-ui": "workspace:*",
-    "@databricks/sdk-experimental": "^0.16.0",
-    "dotenv": "^16.6.1",
-    "lucide-react": "^0.511.0",
-    "react": "19.2.0",
-    "react-dom": "19.2.0",
-    "marked": "^15.0.0",
-    "zod": "^4.0.0"
-  },
-  "devDependencies": {
-    "@tailwindcss/postcss": "4.1.17",
-    "@types/node": "24.10.1",
-    "@types/react": "19.2.7",
-    "@types/react-dom": "19.2.3",
-    "@vitejs/plugin-react": "5.1.1",
-    "autoprefixer": "10.4.21",
-    "postcss": "8.5.6",
-    "tailwindcss": "4.1.17",
-    "tailwindcss-animate": "1.0.7",
-    "tw-animate-css": "1.4.0",
-    "tsx": "4.20.6",
-    "typescript": "5.9.3",
-    "vite": "npm:rolldown-vite@7.1.14"
-  },
-  "overrides": {
-    "vite": "npm:rolldown-vite@7.1.14"
-  }
-}
diff --git a/apps/agent-app/postcss.config.js b/apps/agent-app/postcss.config.js
deleted file mode 100644
index f69c5d411..000000000
--- a/apps/agent-app/postcss.config.js
+++ /dev/null
@@ -1,6 +0,0 @@
-export default {
-  plugins: {
-    "@tailwindcss/postcss": {},
-    autoprefixer: {},
-  },
-};
diff --git a/apps/agent-app/server.ts b/apps/agent-app/server.ts
deleted file mode 100644
index e471196be..000000000
--- a/apps/agent-app/server.ts
+++ /dev/null
@@ -1,100 +0,0 @@
-import {
-  agents,
-  analytics,
-  createAgent,
-  createApp,
-  files,
-  mcpServer,
-  server,
-  tool,
-} from "@databricks/appkit";
-import { z } from "zod";
-
-const port = Number(process.env.DATABRICKS_APP_PORT) || 8003;
-
-// Ambient function tool. Referenced from `config/agents/support/agent.md` under
-// `tools: [get_weather]`. Markdown frontmatter looks up this name against
-// the `tools:` record passed to `agents({ tools: { get_weather } })` below.
-const get_weather = tool({
-  name: "get_weather",
-  description: "Get the current weather for a city",
-  schema: z.object({
-    city: z.string().describe("City name"),
-  }),
-  execute: async ({ city }) => `The weather in ${city} is sunny, 22°C`,
-});
-
-// MCP servers are conditional on runtime env vars — something markdown
-// frontmatter can't express. This is the motivating case for defining
-// the `researcher` agent in code below: it wires whatever MCP tools are
-// configured at boot, and is always callable (with a graceful fallback
-// when nothing is wired).
-//
-// Any MCP URL configured here must also be allowlisted via
-// `agents({ mcp: { trustedHosts: [...] } })` before outbound calls will
-// be allowed by the zero-trust host policy.
-const customMcpServers: Record<string, ReturnType<typeof mcpServer>> = {};
-if (process.env.VECTOR_SEARCH_MCP_URL) {
-  customMcpServers["mcp.vector-search"] = mcpServer(
-    "vector-search",
-    process.env.VECTOR_SEARCH_MCP_URL,
-  );
-}
-if (process.env.CUSTOM_MCP_URL) {
-  customMcpServers["mcp.custom"] = mcpServer(
-    "custom",
-    process.env.CUSTOM_MCP_URL,
-  );
-}
-
-// Code-defined research specialist. `assistant.md` references this by name
-// under `agents: [researcher]`; the agents plugin resolves that reference
-// against both markdown siblings and code-defined agents, with code winning
-// on collision. Defined in code so its MCP toolset can flex on env vars.
-const researcher = createAgent({
-  instructions:
-    "You are a research specialist. When MCP tools are available " +
-    "(vector search, custom endpoints), prefer them for knowledge lookups. " +
-    "If no MCP tools are configured, say so briefly and answer from general " +
-    "knowledge. Always include your source or note when you're answering " +
-    "without search.",
-  tools: {
-    get_weather,
-    ...customMcpServers,
-  },
-});
-
-const trustedMcpHosts = [
-  process.env.VECTOR_SEARCH_MCP_URL,
-  process.env.CUSTOM_MCP_URL,
-]
-  .filter((u): u is string => typeof u === "string" && u.length > 0)
-  .map((u) => new URL(u).hostname);
-
-const appkit = await createApp({
-  plugins: [
-    server({ port }),
-    analytics(),
-    files(),
-    agents({
-      // Code-defined agents merged with markdown agents; code wins on name
-      // collision. Markdown `agents: [...]` frontmatter can reference either.
-      agents: { researcher },
-      // Ambient tool library for markdown agents referencing names under
-      // their `tools:` frontmatter.
-      tools: { get_weather, ...customMcpServers },
-      // Enables auto-inherit of read-only plugin tools (analytics/files) into
-      // markdown agents that declare no explicit `toolkits:` / `tools:`. Both
-      // assistant.md and support.md are explicit, so this is a no-op today,
-      // but kept as a knob markdown authors can rely on.
-      autoInheritTools: { file: true },
-      mcp: { trustedHosts: trustedMcpHosts },
-    }),
-  ],
-});
-
-console.log(
-  `Agent app running on port ${port}. ` +
-    `Agents: ${appkit.agents.list().join(", ") || "(none)"}. ` +
-    `Default: ${appkit.agents.getDefault() ?? "(none)"}.`,
-);
diff --git a/apps/agent-app/src/App.css b/apps/agent-app/src/App.css
deleted file mode 100644
index 545b438cd..000000000
--- a/apps/agent-app/src/App.css
+++ /dev/null
@@ -1,440 +0,0 @@
-:root {
-  --bg: #fafafa;
-  --card: #ffffff;
-  --border: #e5e5e5;
-  --text: #171717;
-  --text-muted: #737373;
-  --text-faint: #a3a3a3;
-  --primary: #2563eb;
-  --primary-fg: #ffffff;
-  --muted: #f5f5f5;
-  --ring: #93c5fd;
-  --radius: 10px;
-  --font: system-ui, -apple-system, sans-serif;
-  --mono: "SF Mono", "Cascadia Code", "Fira Code", monospace;
-}
-
-:root.dark {
-  --bg: #0a0a0a;
-  --card: #171717;
-  --border: #262626;
-  --text: #fafafa;
-  --text-muted: #a3a3a3;
-  --text-faint: #525252;
-  --primary: #3b82f6;
-  --primary-fg: #ffffff;
-  --muted: #262626;
-  --ring: #1d4ed8;
-}
-
-* {
-  margin: 0;
-  padding: 0;
-  box-sizing: border-box;
-}
-
-body {
-  font-family: var(--font);
-  background: var(--bg);
-  color: var(--text);
-  -webkit-font-smoothing: antialiased;
-}
-
-.app {
-  min-height: 100vh;
-}
-
-.container {
-  max-width: 1100px;
-  margin: 0 auto;
-  padding: 2.5rem 1.5rem;
-}
-
-.header {
-  margin-bottom: 1.5rem;
-  display: flex;
-  align-items: flex-start;
-  justify-content: space-between;
-}
-
-.header h1 {
-  font-size: 1.75rem;
-  font-weight: 700;
-  letter-spacing: -0.025em;
-}
-
-.subtitle {
-  color: var(--text-muted);
-  font-size: 0.875rem;
-  margin-top: 0.25rem;
-}
-
-.thread-id {
-  font-family: var(--mono);
-  font-size: 0.75rem;
-  opacity: 0.6;
-}
-
-.main-layout {
-  display: flex;
-  gap: 1.25rem;
-  height: 700px;
-}
-
-.chat-panel {
-  flex: 1;
-  display: flex;
-  flex-direction: column;
-  border: 1px solid var(--border);
-  border-radius: var(--radius);
-  background: var(--card);
-  min-width: 0;
-  overflow: hidden;
-}
-
-.messages {
-  flex: 1;
-  overflow-y: auto;
-  padding: 1.25rem;
-  display: flex;
-  flex-direction: column;
-  gap: 1rem;
-}
-
-.empty-state {
-  text-align: center;
-  padding: 5rem 1rem;
-  color: var(--text-muted);
-}
-
-.empty-title {
-  font-size: 1.1rem;
-  font-weight: 500;
-}
-
-.empty-sub {
-  font-size: 0.85rem;
-  margin-top: 0.5rem;
-  color: var(--text-faint);
-}
-
-.message-row {
-  display: flex;
-}
-
-.message-row.user {
-  justify-content: flex-end;
-}
-
-.message-row.assistant {
-  justify-content: flex-start;
-}
-
-.bubble {
-  max-width: 80%;
-  padding: 0.625rem 0.875rem;
-  border-radius: var(--radius);
-  font-size: 0.875rem;
-  line-height: 1.5;
-  word-break: break-word;
-}
-
-.bubble.user {
-  white-space: pre-wrap;
-  background: var(--primary);
-  color: var(--primary-fg);
-  border-bottom-right-radius: 3px;
-}
-
-.bubble.assistant {
-  background: var(--muted);
-  color: var(--text);
-  border-bottom-left-radius: 3px;
-}
-
-.bubble.thinking {
-  color: var(--text-muted);
-  animation: pulse 1.5s ease-in-out infinite;
-}
-
-.bubble.approval-card {
-  border: 1px solid #d96b3a;
-  background: color-mix(in srgb, #d96b3a 10%, var(--muted));
-}
-
-.approval-header {
-  display: flex;
-  align-items: center;
-  gap: 8px;
-  margin-bottom: 8px;
-}
-
-.approval-badge {
-  display: inline-block;
-  padding: 2px 8px;
-  font-size: 0.75rem;
-  font-weight: 600;
-  letter-spacing: 0.02em;
-  text-transform: uppercase;
-  color: #fff;
-  background: #d96b3a;
-  border-radius: 3px;
-}
-
-.approval-body {
-  font-size: 0.9rem;
-}
-
-.approval-args {
-  margin: 6px 0 0;
-  padding: 8px;
-  font-size: 0.8rem;
-  max-height: 220px;
-  overflow: auto;
-  background: var(--bg);
-  border-radius: 4px;
-  white-space: pre-wrap;
-  word-break: break-word;
-}
-
-.approval-actions {
-  display: flex;
-  gap: 8px;
-  margin-top: 10px;
-  justify-content: flex-end;
-}
-
-.approval-actions button {
-  padding: 6px 14px;
-  font-size: 0.85rem;
-  font-weight: 500;
-  border-radius: 4px;
-  border: 1px solid transparent;
-  cursor: pointer;
-  transition:
-    background 0.15s,
-    border-color 0.15s;
-}
-
-.approval-deny {
-  background: transparent;
-  color: var(--text);
-  border-color: var(--border);
-}
-
-.approval-deny:hover {
-  background: var(--muted);
-}
-
-.approval-approve {
-  background: #d96b3a;
-  color: #fff;
-}
-
-.approval-approve:hover {
-  background: #c35a2b;
-}
-
-.bubble.assistant > * + * {
-  margin-top: 0.5em;
-}
-
-.bubble.assistant p {
-  margin: 0;
-}
-
-.bubble.assistant p + p {
-  margin-top: 0.4em;
-}
-
-.bubble.assistant code {
-  font-family: var(--mono);
-  font-size: 0.8em;
-  background: color-mix(in srgb, var(--text) 8%, transparent);
-  padding: 0.15em 0.35em;
-  border-radius: 4px;
-}
-
-.bubble.assistant pre {
-  margin: 0.5em 0;
-  padding: 0.75em;
-  border-radius: 6px;
-  background: color-mix(in srgb, var(--text) 6%, transparent);
-  overflow-x: auto;
-}
-
-.bubble.assistant pre code {
-  background: none;
-  padding: 0;
-  font-size: 0.8em;
-}
-
-.bubble.assistant ul,
-.bubble.assistant ol {
-  margin: 0.4em 0;
-  padding-left: 1.5em;
-}
-
-.bubble.assistant li {
-  margin: 0.15em 0;
-}
-
-.bubble.assistant h1,
-.bubble.assistant h2,
-.bubble.assistant h3 {
-  font-weight: 600;
-}
-
-.bubble.assistant h1 {
-  font-size: 1.1em;
-}
-.bubble.assistant h2 {
-  font-size: 1em;
-}
-.bubble.assistant h3 {
-  font-size: 0.95em;
-}
-
-.bubble.assistant blockquote {
-  margin: 0.4em 0;
-  padding-left: 0.75em;
-  border-left: 3px solid var(--border);
-  color: var(--text-muted);
-}
-
-.bubble.assistant table {
-  border-collapse: collapse;
-  margin: 0.5em 0;
-  font-size: 0.85em;
-}
-
-.bubble.assistant th,
-.bubble.assistant td {
-  border: 1px solid var(--border);
-  padding: 0.35em 0.6em;
-}
-
-.bubble.assistant th {
-  background: color-mix(in srgb, var(--text) 4%, transparent);
-  font-weight: 600;
-}
-
-@keyframes pulse {
-  0%,
-  100% {
-    opacity: 1;
-  }
-  50% {
-    opacity: 0.5;
-  }
-}
-
-.input-bar {
-  display: flex;
-  gap: 0.5rem;
-  padding: 0.875rem 1rem;
-  border-top: 1px solid var(--border);
-}
-
-.input-bar textarea {
-  flex: 1;
-  padding: 0.5rem 0.75rem;
-  border: 1px solid var(--border);
-  border-radius: 8px;
-  background: var(--bg);
-  color: var(--text);
-  font-family: var(--font);
-  font-size: 0.875rem;
-  resize: none;
-  outline: none;
-  transition: border-color 0.15s;
-}
-
-.input-bar textarea:focus {
-  border-color: var(--ring);
-  box-shadow: 0 0 0 2px color-mix(in srgb, var(--ring) 25%, transparent);
-}
-
-.input-bar textarea:disabled {
-  opacity: 0.5;
-}
-
-.input-bar button {
-  padding: 0.5rem 1rem;
-  border: none;
-  border-radius: 8px;
-  background: var(--primary);
-  color: var(--primary-fg);
-  font-family: var(--font);
-  font-size: 0.875rem;
-  font-weight: 500;
-  cursor: pointer;
-  transition: opacity 0.15s;
-  align-self: flex-end;
-}
-
-.input-bar button:hover:not(:disabled) {
-  opacity: 0.9;
-}
-
-.input-bar button:disabled {
-  opacity: 0.4;
-  cursor: not-allowed;
-}
-
-.event-panel {
-  width: 300px;
-  flex-shrink: 0;
-  display: flex;
-  flex-direction: column;
-  border: 1px solid var(--border);
-  border-radius: var(--radius);
-  background: var(--card);
-  overflow: hidden;
-}
-
-.event-header {
-  padding: 0.625rem 0.875rem;
-  border-bottom: 1px solid var(--border);
-  font-size: 0.8rem;
-  font-weight: 600;
-  color: var(--text-muted);
-  text-transform: uppercase;
-  letter-spacing: 0.05em;
-}
-
-.event-list {
-  flex: 1;
-  overflow-y: auto;
-  padding: 0.75rem;
-  display: flex;
-  flex-direction: column;
-  gap: 0.25rem;
-}
-
-.event-empty {
-  text-align: center;
-  padding: 2.5rem 0;
-  font-size: 0.75rem;
-  color: var(--text-faint);
-}
-
-.event-row {
-  font-family: var(--mono);
-  font-size: 0.7rem;
-  line-height: 1.4;
-  display: flex;
-  gap: 0.5rem;
-}
-
-.event-type {
-  flex-shrink: 0;
-  width: 90px;
-  text-align: right;
-  color: var(--text-faint);
-}
-
-.event-detail {
-  color: var(--text-muted);
-  word-break: break-all;
-}
diff --git a/apps/agent-app/src/App.tsx b/apps/agent-app/src/App.tsx
deleted file mode 100644
index e969e2be8..000000000
--- a/apps/agent-app/src/App.tsx
+++ /dev/null
@@ -1,405 +0,0 @@
-import { TooltipProvider } from "@databricks/appkit-ui/react";
-import { useCallback, useEffect, useRef, useState } from "react";
-import "./App.css";
-import { ThemeSelector } from "./components/theme-selector";
-
-interface SSEEvent {
-  type: string;
-  delta?: string;
-  item_id?: string;
-  item?: {
-    type?: string;
-    id?: string;
-    call_id?: string;
-    name?: string;
-    arguments?: string;
-    output?: string;
-    status?: string;
-  };
-  content?: string;
-  data?: Record<string, unknown>;
-  error?: string;
-  sequence_number?: number;
-  output_index?: number;
-  approval_id?: string;
-  stream_id?: string;
-  tool_name?: string;
-  args?: unknown;
-  annotations?: {
-    readOnly?: boolean;
-    destructive?: boolean;
-    idempotent?: boolean;
-  };
-}
-
-interface ChatMessage {
-  id: number;
-  role: "user" | "assistant";
-  content: string;
-}
-
-interface PendingApproval {
-  approvalId: string;
-  streamId: string;
-  toolName: string;
-  args: unknown;
-  annotations?: {
-    readOnly?: boolean;
-    destructive?: boolean;
-    idempotent?: boolean;
-  };
-}
-
-export default function App() {
-  const [messages, setMessages] = useState<ChatMessage[]>([]);
-  const [events, setEvents] = useState<SSEEvent[]>([]);
-  const [input, setInput] = useState("");
-  const [isLoading, setIsLoading] = useState(false);
-  const [threadId, setThreadId] = useState<string | null>(null);
-  const [pendingApprovals, setPendingApprovals] = useState<PendingApproval[]>(
-    [],
-  );
-  const currentStreamIdRef = useRef<string | null>(null);
-  const messagesEndRef = useRef<HTMLDivElement>(null);
-  const idRef = useRef(0);
-
-  const [toolCount, setToolCount] = useState(0);
-
-  const decideApproval = useCallback(
-    async (approvalId: string, decision: "approve" | "deny") => {
-      const approval = pendingApprovals.find(
-        (a) => a.approvalId === approvalId,
-      );
-      if (!approval) return;
-      try {
-        await fetch("/api/agents/approve", {
-          method: "POST",
-          headers: { "Content-Type": "application/json" },
-          body: JSON.stringify({
-            streamId: approval.streamId,
-            approvalId,
-            decision,
-          }),
-        });
-      } finally {
-        setPendingApprovals((prev) =>
-          prev.filter((a) => a.approvalId !== approvalId),
-        );
-      }
-    },
-    [pendingApprovals],
-  );
-
-  useEffect(() => {
-    const timer = setTimeout(() => {
-      fetch("/api/agents/info")
-        .then((r) => r.json())
-        .then((data) => setToolCount(data.toolCount ?? 0))
-        .catch(() => {});
-    }, 500);
-    return () => clearTimeout(timer);
-  }, []);
-
-  // biome-ignore lint/correctness/useExhaustiveDependencies: scroll on new messages
-  useEffect(() => {
-    messagesEndRef.current?.scrollIntoView({ behavior: "smooth" });
-  }, [messages]);
-
-  const sendMessage = useCallback(async () => {
-    if (!input.trim() || isLoading) return;
-
-    const text = input.trim();
-    setInput("");
-    setMessages((prev) => [
-      ...prev,
-      { id: ++idRef.current, role: "user", content: text },
-    ]);
-    setEvents([]);
-    setIsLoading(true);
-
-    try {
-      const res = await fetch("/api/agents/chat", {
-        method: "POST",
-        headers: { "Content-Type": "application/json" },
-        body: JSON.stringify({
-          message: text,
-          ...(threadId && { threadId }),
-        }),
-      });
-
-      if (!res.ok) {
-        const err = await res.json();
-        setMessages((prev) => [
-          ...prev,
-          {
-            id: ++idRef.current,
-            role: "assistant",
-            content: `Error: ${err.error}`,
-          },
-        ]);
-        return;
-      }
-
-      const reader = res.body?.getReader();
-      if (!reader) return;
-
-      const decoder = new TextDecoder();
-      let content = "";
-      let buffer = "";
-
-      while (true) {
-        const { done, value } = await reader.read();
-        if (done) break;
-        buffer += decoder.decode(value, { stream: true });
-        const lines = buffer.split("\n");
-        buffer = lines.pop() ?? "";
-
-        for (const line of lines) {
-          if (!line.startsWith("data: ")) continue;
-          const data = line.slice(6).trim();
-          if (!data || data === "[DONE]") continue;
-          try {
-            const event: SSEEvent = JSON.parse(data);
-            if (!event.type) continue;
-            setEvents((prev) => [...prev, event]);
-
-            if (event.type === "appkit.metadata" && event.data?.threadId) {
-              setThreadId(event.data.threadId as string);
-              if (typeof event.data.streamId === "string") {
-                currentStreamIdRef.current = event.data.streamId;
-              }
-            }
-            if (
-              event.type === "appkit.approval_pending" &&
-              event.approval_id &&
-              event.stream_id &&
-              event.tool_name
-            ) {
-              currentStreamIdRef.current = event.stream_id;
-              setPendingApprovals((prev) => [
-                ...prev,
-                {
-                  approvalId: event.approval_id as string,
-                  streamId: event.stream_id as string,
-                  toolName: event.tool_name as string,
-                  args: event.args,
-                  annotations: event.annotations,
-                },
-              ]);
-            }
-            if (event.type === "response.output_text.delta" && event.delta) {
-              content += event.delta;
-              setMessages((prev) => {
-                const updated = [...prev];
-                const last = updated[updated.length - 1];
-                if (last?.role === "assistant") {
-                  updated[updated.length - 1] = { ...last, content };
-                } else {
-                  updated.push({
-                    id: ++idRef.current,
-                    role: "assistant",
-                    content,
-                  });
-                }
-                return updated;
-              });
-            }
-          } catch {
-            /* skip */
-          }
-        }
-      }
-    } catch (err) {
-      setMessages((prev) => [
-        ...prev,
-        {
-          id: ++idRef.current,
-          role: "assistant",
-          content: `Error: ${err instanceof Error ? err.message : "Unknown error"}`,
-        },
-      ]);
-    } finally {
-      setIsLoading(false);
-    }
-  }, [input, isLoading, threadId]);
-
-  return (
-    <TooltipProvider>
-      <div className="app">
-        <div className="container">
-          <header className="header">
-            <div>
-              <h1>Agent Chat</h1>
-              <p className="subtitle">
-                AI agent with {toolCount} auto-discovered tools
-                {threadId && (
-                  <span className="thread-id">
-                    {" "}
-                    · Thread {threadId.slice(0, 8)}
-                  </span>
-                )}
-              </p>
-            </div>
-            <ThemeSelector />
-          </header>
-
-          <div className="main-layout">
-            <div className="chat-panel">
-              <div className="messages">
-                {messages.length === 0 && (
-                  <div className="empty-state">
-                    <p className="empty-title">
-                      Send a message to start a conversation
-                    </p>
-                    <p className="empty-sub">
-                      The agent can query data, browse files, and more
-                    </p>
-                  </div>
-                )}
-
-                {messages.map((msg) => (
-                  <div
-                    key={msg.id}
-                    className={`message-row ${msg.role === "user" ? "user" : "assistant"}`}
-                  >
-                    <div className={`bubble ${msg.role}`}>
-                      <p className="whitespace-pre-wrap">{msg.content}</p>
-                    </div>
-                  </div>
-                ))}
-
-                {pendingApprovals.map((approval) => (
-                  <div
-                    key={approval.approvalId}
-                    className="message-row assistant"
-                  >
-                    <div className="bubble assistant approval-card">
-                      <div className="approval-header">
-                        <span className="approval-badge">
-                          Destructive tool — approval required
-                        </span>
-                      </div>
-                      <div className="approval-body">
-                        <strong>{approval.toolName}</strong>
-                        <pre className="approval-args">
-                          {JSON.stringify(approval.args, null, 2)}
-                        </pre>
-                      </div>
-                      <div className="approval-actions">
-                        <button
-                          type="button"
-                          className="approval-deny"
-                          onClick={() =>
-                            decideApproval(approval.approvalId, "deny")
-                          }
-                        >
-                          Deny
-                        </button>
-                        <button
-                          type="button"
-                          className="approval-approve"
-                          onClick={() =>
-                            decideApproval(approval.approvalId, "approve")
-                          }
-                        >
-                          Approve
-                        </button>
-                      </div>
-                    </div>
-                  </div>
-                ))}
-
-                {isLoading &&
-                  pendingApprovals.length === 0 &&
-                  messages[messages.length - 1]?.role === "user" && (
-                    <div className="message-row assistant">
-                      <div className="bubble assistant thinking">
-                        Thinking...
-                      </div>
-                    </div>
-                  )}
-
-                <div ref={messagesEndRef} />
-              </div>
-
-              <form
-                className="input-bar"
-                onSubmit={(e) => {
-                  e.preventDefault();
-                  sendMessage();
-                }}
-              >
-                <textarea
-                  value={input}
-                  onChange={(e) => setInput(e.target.value)}
-                  onKeyDown={(e) => {
-                    if (e.key === "Enter" && !e.shiftKey) {
-                      e.preventDefault();
-                      sendMessage();
-                    }
-                  }}
-                  placeholder="Ask a question..."
-                  disabled={isLoading}
-                  rows={1}
-                />
-                <button type="submit" disabled={isLoading || !input.trim()}>
-                  Send
-                </button>
-              </form>
-            </div>
-
-            <div className="event-panel">
-              <div className="event-header">Event Stream</div>
-              <div className="event-list">
-                {events.length === 0 && (
-                  <p className="event-empty">Events will appear here</p>
-                )}
-                {events.map((event, i) => {
-                  let detail: string;
-                  switch (event.type) {
-                    case "response.output_text.delta":
-                      detail = event.delta?.slice(0, 60) ?? "";
-                      break;
-                    case "response.output_item.added":
-                    case "response.output_item.done":
-                      detail =
-                        event.item?.type === "function_call"
-                          ? `${event.item.name}(${(event.item.arguments ?? "").slice(0, 40)})`
-                          : event.item?.type === "function_call_output"
-                            ? (event.item.output?.slice(0, 60) ?? "")
-                            : (event.item?.status ?? event.item?.type ?? "");
-                      break;
-                    case "response.completed":
-                      detail = "done";
-                      break;
-                    case "error":
-                      detail = event.error ?? "unknown";
-                      break;
-                    case "appkit.metadata":
-                      detail = JSON.stringify(event.data).slice(0, 60);
-                      break;
-                    case "appkit.thinking":
-                      detail = event.content?.slice(0, 60) ?? "";
-                      break;
-                    default:
-                      detail = JSON.stringify(event).slice(0, 60);
-                  }
-                  return (
-                    <div key={`${event.type}-${i}`} className="event-row">
-                      <span className="event-type">
-                        {event.type
-                          .replace("response.", "")
-                          .replace("appkit.", "")}
-                      </span>
-                      <span className="event-detail">{detail}</span>
-                    </div>
-                  );
-                })}
-              </div>
-            </div>
-          </div>
-        </div>
-      </div>
-    </TooltipProvider>
-  );
-}
diff --git a/apps/agent-app/src/components/theme-selector.tsx b/apps/agent-app/src/components/theme-selector.tsx
deleted file mode 100644
index 18bb4f142..000000000
--- a/apps/agent-app/src/components/theme-selector.tsx
+++ /dev/null
@@ -1,135 +0,0 @@
-import {
-  Button,
-  DropdownMenu,
-  DropdownMenuContent,
-  DropdownMenuItem,
-  DropdownMenuTrigger,
-} from "@databricks/appkit-ui/react";
-import { MonitorIcon, MoonIcon, SunIcon } from "lucide-react";
-import { useEffect, useState } from "react";
-
-type Theme = "light" | "dark" | "system";
-
-const THEME_STORAGE_KEY = "agent-app-theme";
-
-function getSystemTheme(): "light" | "dark" {
-  if (typeof window === "undefined") return "light";
-  return window.matchMedia("(prefers-color-scheme: dark)").matches
-    ? "dark"
-    : "light";
-}
-
-function getStoredTheme(): Theme {
-  if (typeof window === "undefined") return "system";
-  const stored = localStorage.getItem(THEME_STORAGE_KEY);
-  return (stored as Theme) || "system";
-}
-
-function applyTheme(theme: Theme) {
-  if (typeof window === "undefined") return;
-
-  const root = document.documentElement;
-  root.classList.remove("light", "dark");
-
-  if (theme === "system") {
-    const systemTheme = getSystemTheme();
-    root.classList.add(systemTheme);
-  } else {
-    root.classList.add(theme);
-  }
-}
-
-export function ThemeSelector() {
-  const [theme, setTheme] = useState<Theme>(() => getStoredTheme());
-  const [mounted, setMounted] = useState(false);
-  const [systemTheme, setSystemTheme] = useState<"light" | "dark">(() =>
-    getSystemTheme(),
-  );
-
-  useEffect(() => {
-    setMounted(true);
-    applyTheme(theme);
-  }, [theme]);
-
-  useEffect(() => {
-    const mediaQuery = window.matchMedia("(prefers-color-scheme: dark)");
-    const handleChange = (e: MediaQueryListEvent | MediaQueryList) => {
-      const isDark = e.matches;
-      setSystemTheme(isDark ? "dark" : "light");
-      if (theme === "system") {
-        applyTheme("system");
-      }
-    };
-
-    handleChange(mediaQuery);
-
-    if (mediaQuery.addEventListener) {
-      mediaQuery.addEventListener("change", handleChange);
-      return () => mediaQuery.removeEventListener("change", handleChange);
-    } else {
-      mediaQuery.addListener(handleChange);
-      return () => mediaQuery.removeListener(handleChange);
-    }
-  }, [theme]);
-
-  const handleThemeChange = (newTheme: Theme) => {
-    setTheme(newTheme);
-    localStorage.setItem(THEME_STORAGE_KEY, newTheme);
-    applyTheme(newTheme);
-  };
-
-  const effectiveTheme = theme === "system" ? systemTheme : theme;
-
-  if (!mounted) {
-    return (
-      <Button variant="ghost" size="icon" className="h-9 w-9">
-        <SunIcon className="h-4 w-4" />
-      </Button>
-    );
-  }
-
-  return (
-    <DropdownMenu>
-      <DropdownMenuTrigger asChild>
-        <Button
-          variant="ghost"
-          size="icon"
-          className="h-9 w-9 text-foreground hover:text-secondary-foreground"
-          aria-label="Toggle theme"
-        >
-          {effectiveTheme === "dark" ? (
-            <MoonIcon className="h-4 w-4" />
-          ) : (
-            <SunIcon className="h-4 w-4" />
-          )}
-        </Button>
-      </DropdownMenuTrigger>
-      <DropdownMenuContent align="end">
-        <DropdownMenuItem
-          onClick={() => handleThemeChange("light")}
-          className="cursor-pointer"
-        >
-          <SunIcon className="mr-2 h-4 w-4" />
-          <span>Light</span>
-          {theme === "light" && <span className="ml-auto text-xs">✓</span>}
-        </DropdownMenuItem>
-        <DropdownMenuItem
-          onClick={() => handleThemeChange("dark")}
-          className="cursor-pointer"
-        >
-          <MoonIcon className="mr-2 h-4 w-4" />
-          <span>Dark</span>
-          {theme === "dark" && <span className="ml-auto text-xs">✓</span>}
-        </DropdownMenuItem>
-        <DropdownMenuItem
-          onClick={() => handleThemeChange("system")}
-          className="cursor-pointer"
-        >
-          <MonitorIcon className="mr-2 h-4 w-4" />
-          <span>System</span>
-          {theme === "system" && <span className="ml-auto text-xs">✓</span>}
-        </DropdownMenuItem>
-      </DropdownMenuContent>
-    </DropdownMenu>
-  );
-}
diff --git a/apps/agent-app/src/index.css b/apps/agent-app/src/index.css
deleted file mode 100644
index 5dcc4cf86..000000000
--- a/apps/agent-app/src/index.css
+++ /dev/null
@@ -1 +0,0 @@
-@import "@databricks/appkit-ui/styles.css";
diff --git a/apps/agent-app/src/main.tsx b/apps/agent-app/src/main.tsx
deleted file mode 100644
index 98b62364b..000000000
--- a/apps/agent-app/src/main.tsx
+++ /dev/null
@@ -1,15 +0,0 @@
-import { StrictMode } from "react";
-import { createRoot } from "react-dom/client";
-import App from "./App.tsx";
-import "./index.css";
-
-const rootElement = document.getElementById("root");
-if (!rootElement) {
-  throw new Error("Root element not found");
-}
-
-createRoot(rootElement).render(
-  <StrictMode>
-    <App />
-  </StrictMode>,
-);
diff --git a/apps/agent-app/tailwind.config.ts b/apps/agent-app/tailwind.config.ts
deleted file mode 100644
index fad89bf65..000000000
--- a/apps/agent-app/tailwind.config.ts
+++ /dev/null
@@ -1,11 +0,0 @@
-import path from "node:path";
-import type { Config } from "tailwindcss";
-
-export default {
-  darkMode: ["class", "media"],
-  content: [
-    path.resolve(__dirname, "./index.html"),
-    path.resolve(__dirname, "./src/**/*.{js,ts,jsx,tsx}"),
-  ],
-  plugins: [require("tailwindcss-animate")],
-} satisfies Config;
diff --git a/apps/agent-app/tsconfig.app.json b/apps/agent-app/tsconfig.app.json
deleted file mode 100644
index 2877c2180..000000000
--- a/apps/agent-app/tsconfig.app.json
+++ /dev/null
@@ -1,24 +0,0 @@
-{
-  "compilerOptions": {
-    "tsBuildInfoFile": "./node_modules/.tmp/tsconfig.app.tsbuildinfo",
-    "target": "ES2022",
-    "useDefineForClassFields": true,
-    "lib": ["ES2022", "DOM", "DOM.Iterable"],
-    "module": "ESNext",
-    "types": ["vite/client"],
-    "skipLibCheck": true,
-    "moduleResolution": "bundler",
-    "allowImportingTsExtensions": true,
-    "verbatimModuleSyntax": true,
-    "moduleDetection": "force",
-    "noEmit": true,
-    "jsx": "react-jsx",
-    "strict": true,
-    "noUnusedLocals": true,
-    "noUnusedParameters": true,
-    "erasableSyntaxOnly": true,
-    "noFallthroughCasesInSwitch": true,
-    "noUncheckedSideEffectImports": true
-  },
-  "include": ["src"]
-}
diff --git a/apps/agent-app/tsconfig.json b/apps/agent-app/tsconfig.json
deleted file mode 100644
index 1ffef600d..000000000
--- a/apps/agent-app/tsconfig.json
+++ /dev/null
@@ -1,7 +0,0 @@
-{
-  "files": [],
-  "references": [
-    { "path": "./tsconfig.app.json" },
-    { "path": "./tsconfig.node.json" }
-  ]
-}
diff --git a/apps/agent-app/tsconfig.node.json b/apps/agent-app/tsconfig.node.json
deleted file mode 100644
index 35bcd1182..000000000
--- a/apps/agent-app/tsconfig.node.json
+++ /dev/null
@@ -1,22 +0,0 @@
-{
-  "compilerOptions": {
-    "tsBuildInfoFile": "./node_modules/.tmp/tsconfig.node.tsbuildinfo",
-    "target": "ES2023",
-    "lib": ["ES2023"],
-    "module": "ESNext",
-    "types": ["node"],
-    "skipLibCheck": true,
-    "moduleResolution": "bundler",
-    "allowImportingTsExtensions": true,
-    "verbatimModuleSyntax": true,
-    "moduleDetection": "force",
-    "noEmit": true,
-    "strict": true,
-    "noUnusedLocals": true,
-    "noUnusedParameters": true,
-    "erasableSyntaxOnly": true,
-    "noFallthroughCasesInSwitch": true,
-    "noUncheckedSideEffectImports": true
-  },
-  "include": ["vite.config.ts"]
-}
diff --git a/apps/agent-app/vite.config.ts b/apps/agent-app/vite.config.ts
deleted file mode 100644
index bd1cea62c..000000000
--- a/apps/agent-app/vite.config.ts
+++ /dev/null
@@ -1,31 +0,0 @@
-import path from "node:path";
-import react from "@vitejs/plugin-react";
-import { defineConfig } from "vite";
-
-export default defineConfig({
-  plugins: [react()],
-  optimizeDeps: {
-    include: [
-      "react",
-      "react-dom",
-      "react/jsx-dev-runtime",
-      "react/jsx-runtime",
-    ],
-    exclude: ["@databricks/appkit-ui", "@databricks/appkit"],
-  },
-  server: {
-    hmr: {
-      port: 24679,
-    },
-  },
-  resolve: {
-    dedupe: ["react", "react-dom"],
-    preserveSymlinks: true,
-    alias: {
-      "@databricks/appkit-ui": path.resolve(
-        __dirname,
-        "../../packages/appkit-ui/dist",
-      ),
-    },
-  },
-});
diff --git a/apps/dev-playground/client/src/routeTree.gen.ts b/apps/dev-playground/client/src/routeTree.gen.ts
index 378a77ea6..8b953ed98 100644
--- a/apps/dev-playground/client/src/routeTree.gen.ts
+++ b/apps/dev-playground/client/src/routeTree.gen.ts
@@ -13,6 +13,7 @@ import { Route as VectorSearchRouteRouteImport } from './routes/vector-search.ro
 import { Route as TypeSafetyRouteRouteImport } from './routes/type-safety.route'
 import { Route as TelemetryRouteRouteImport } from './routes/telemetry.route'
 import { Route as SqlHelpersRouteRouteImport } from './routes/sql-helpers.route'
+import { Route as SmartDashboardRouteRouteImport } from './routes/smart-dashboard.route'
 import { Route as ServingRouteRouteImport } from './routes/serving.route'
 import { Route as ReconnectRouteRouteImport } from './routes/reconnect.route'
 import { Route as PolicyMatrixRouteRouteImport } from './routes/policy-matrix.route'
@@ -47,6 +48,11 @@ const SqlHelpersRouteRoute = SqlHelpersRouteRouteImport.update({
   path: '/sql-helpers',
   getParentRoute: () => rootRouteImport,
 } as any)
+const SmartDashboardRouteRoute = SmartDashboardRouteRouteImport.update({
+  id: '/smart-dashboard',
+  path: '/smart-dashboard',
+  getParentRoute: () => rootRouteImport,
+} as any)
 const ServingRouteRoute = ServingRouteRouteImport.update({
   id: '/serving',
   path: '/serving',
@@ -127,6 +133,7 @@ export interface FileRoutesByFullPath {
   '/policy-matrix': typeof PolicyMatrixRouteRoute
   '/reconnect': typeof ReconnectRouteRoute
   '/serving': typeof ServingRouteRoute
+  '/smart-dashboard': typeof SmartDashboardRouteRoute
   '/sql-helpers': typeof SqlHelpersRouteRoute
   '/telemetry': typeof TelemetryRouteRoute
   '/type-safety': typeof TypeSafetyRouteRoute
@@ -146,6 +153,7 @@ export interface FileRoutesByTo {
   '/policy-matrix': typeof PolicyMatrixRouteRoute
   '/reconnect': typeof ReconnectRouteRoute
   '/serving': typeof ServingRouteRoute
+  '/smart-dashboard': typeof SmartDashboardRouteRoute
   '/sql-helpers': typeof SqlHelpersRouteRoute
   '/telemetry': typeof TelemetryRouteRoute
   '/type-safety': typeof TypeSafetyRouteRoute
@@ -166,6 +174,7 @@ export interface FileRoutesById {
   '/policy-matrix': typeof PolicyMatrixRouteRoute
   '/reconnect': typeof ReconnectRouteRoute
   '/serving': typeof ServingRouteRoute
+  '/smart-dashboard': typeof SmartDashboardRouteRoute
   '/sql-helpers': typeof SqlHelpersRouteRoute
   '/telemetry': typeof TelemetryRouteRoute
   '/type-safety': typeof TypeSafetyRouteRoute
@@ -187,6 +196,7 @@ export interface FileRouteTypes {
     | '/policy-matrix'
     | '/reconnect'
     | '/serving'
+    | '/smart-dashboard'
     | '/sql-helpers'
     | '/telemetry'
     | '/type-safety'
@@ -206,6 +216,7 @@ export interface FileRouteTypes {
     | '/policy-matrix'
     | '/reconnect'
     | '/serving'
+    | '/smart-dashboard'
     | '/sql-helpers'
     | '/telemetry'
     | '/type-safety'
@@ -225,6 +236,7 @@ export interface FileRouteTypes {
     | '/policy-matrix'
     | '/reconnect'
     | '/serving'
+    | '/smart-dashboard'
     | '/sql-helpers'
     | '/telemetry'
     | '/type-safety'
@@ -245,6 +257,7 @@ export interface RootRouteChildren {
   PolicyMatrixRouteRoute: typeof PolicyMatrixRouteRoute
   ReconnectRouteRoute: typeof ReconnectRouteRoute
   ServingRouteRoute: typeof ServingRouteRoute
+  SmartDashboardRouteRoute: typeof SmartDashboardRouteRoute
   SqlHelpersRouteRoute: typeof SqlHelpersRouteRoute
   TelemetryRouteRoute: typeof TelemetryRouteRoute
   TypeSafetyRouteRoute: typeof TypeSafetyRouteRoute
@@ -281,6 +294,13 @@ declare module '@tanstack/react-router' {
       preLoaderRoute: typeof SqlHelpersRouteRouteImport
       parentRoute: typeof rootRouteImport
     }
+    '/smart-dashboard': {
+      id: '/smart-dashboard'
+      path: '/smart-dashboard'
+      fullPath: '/smart-dashboard'
+      preLoaderRoute: typeof SmartDashboardRouteRouteImport
+      parentRoute: typeof rootRouteImport
+    }
     '/serving': {
       id: '/serving'
       path: '/serving'
@@ -389,6 +409,7 @@ const rootRouteChildren: RootRouteChildren = {
   PolicyMatrixRouteRoute: PolicyMatrixRouteRoute,
   ReconnectRouteRoute: ReconnectRouteRoute,
   ServingRouteRoute: ServingRouteRoute,
+  SmartDashboardRouteRoute: SmartDashboardRouteRoute,
   SqlHelpersRouteRoute: SqlHelpersRouteRoute,
   TelemetryRouteRoute: TelemetryRouteRoute,
   TypeSafetyRouteRoute: TypeSafetyRouteRoute,
diff --git a/apps/dev-playground/client/src/routes/__root.tsx b/apps/dev-playground/client/src/routes/__root.tsx
index 6ce0c0756..1e941cd2f 100644
--- a/apps/dev-playground/client/src/routes/__root.tsx
+++ b/apps/dev-playground/client/src/routes/__root.tsx
@@ -144,6 +144,14 @@ function RootComponent() {
                     Agent
                   </Button>
                 </Link>
+                <Link to="/smart-dashboard" className="no-underline">
+                  <Button
+                    variant="ghost"
+                    className="text-foreground hover:text-secondary-foreground"
+                  >
+                    Smart Dashboard
+                  </Button>
+                </Link>
                 <ThemeSelector />
               </div>
             </nav>
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx b/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
new file mode 100644
index 000000000..16c39069c
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
@@ -0,0 +1,100 @@
+import { createFileRoute } from "@tanstack/react-router";
+import { LayoutDashboardIcon } from "lucide-react";
+import { useCallback, useState } from "react";
+import { ActiveFilters } from "./smart-dashboard/components/active-filters";
+import { AgentSidebar } from "./smart-dashboard/components/agent-sidebar";
+import { FareChart } from "./smart-dashboard/components/fare-chart";
+import { KPICards } from "./smart-dashboard/components/kpi-cards";
+import { QuerySection } from "./smart-dashboard/components/query-section";
+import { TripChart } from "./smart-dashboard/components/trip-chart";
+import type { Highlight } from "./smart-dashboard/hooks/use-action-dispatcher";
+import { useActionDispatcher } from "./smart-dashboard/hooks/use-action-dispatcher";
+import type { DashboardFilters } from "./smart-dashboard/hooks/use-dashboard-data";
+import { useDashboardData } from "./smart-dashboard/hooks/use-dashboard-data";
+// Registers SmartDashboardRoute as the component rendered for the "/smart-dashboard" file route.
+export const Route = createFileRoute("/smart-dashboard")({
+  component: SmartDashboardRoute,
+});
+/** Page component for the /smart-dashboard route: owns the filter and highlight state and renders the filter bar, KPI cards, the two charts, the agent sidebar and the query section. */
+function SmartDashboardRoute() {
+  const [filters, setFilters] = useState<DashboardFilters>({});
+  const [highlights, setHighlights] = useState<Highlight[]>([]);
+  // useDashboardData receives the current filters and supplies the KPI/chart data plus one shared loading flag.
+  const { kpis, tripsOverTime, fareDistribution, isLoading } =
+    useDashboardData(filters);
+  // Replaces the whole filter set with the one it is given (no merge with the previous filters).
+  const handleFilterChange = useCallback((newFilters: DashboardFilters) => {
+    setFilters(newFilters);
+  }, []);
+  // Highlights accumulate; within this component they are only reset by handleClearAllFilters.
+  const handleHighlight = useCallback((highlight: Highlight) => {
+    setHighlights((prev) => [...prev, highlight]);
+  }, []);
+  // handleEvent is passed to QuerySection as onEvent. NOTE(review): presumably the dispatcher maps agent events onto the two callbacks above — confirm in use-action-dispatcher.
+  const { handleEvent } = useActionDispatcher({
+    onFilterChange: handleFilterChange,
+    onHighlight: handleHighlight,
+    currentFilters: filters,
+  });
+  // Drops a single key from a shallow copy of the filters, so the previous state object is never mutated.
+  const handleClearFilter = useCallback((key: keyof DashboardFilters) => {
+    setFilters((prev) => {
+      const next = { ...prev };
+      delete next[key];
+      return next;
+    });
+  }, []);
+  // "Clear all" resets the chart highlights together with the filters.
+  const handleClearAllFilters = useCallback(() => {
+    setFilters({});
+    setHighlights([]);
+  }, []);
+
+  return (
+    <div className="min-h-screen bg-background text-foreground">
+      <div className="max-w-[1400px] mx-auto px-4 py-4">
+        <header className="flex items-center gap-3 mb-5">
+          <div className="rounded-lg bg-primary/10 p-2">
+            <LayoutDashboardIcon className="h-5 w-5 text-primary" />
+          </div>
+          <div>
+            <h1 className="text-xl font-bold text-foreground">
+              Smart Dashboard
+            </h1>
+            <p className="text-xs text-muted-foreground">
+              NYC Taxi Analytics — powered by 3 AI agents
+            </p>
+          </div>
+        </header>
+
+        <div className="mb-4">
+          <ActiveFilters
+            filters={filters}
+            onClear={handleClearFilter}
+            onClearAll={handleClearAllFilters}
+          />
+        </div>
+
+        <div className="mb-5">
+          <KPICards data={kpis} isLoading={isLoading} />
+        </div>
+
+        <div className="grid grid-cols-1 lg:grid-cols-[1fr_320px] gap-5 mb-5">
+          <div className="space-y-5">
+            <TripChart
+              data={tripsOverTime}
+              highlights={highlights}
+              isLoading={isLoading}
+            />
+            <FareChart data={fareDistribution} isLoading={isLoading} />
+          </div>
+          <div className="lg:h-[580px]">
+            <AgentSidebar kpis={kpis} kpisLoaded={!isLoading} />
+          </div>
+        </div>
+
+        <QuerySection onEvent={handleEvent} />
+      </div>
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/active-filters.tsx b/apps/dev-playground/client/src/routes/smart-dashboard/components/active-filters.tsx
new file mode 100644
index 000000000..f5fe96a2a
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/smart-dashboard/components/active-filters.tsx
@@ -0,0 +1,63 @@
+import { FilterIcon, XIcon } from "lucide-react";
+import type { DashboardFilters } from "../hooks/use-dashboard-data";
+/** Props for ActiveFilters. */
+interface ActiveFiltersProps {
+  filters: DashboardFilters; // entries whose value is undefined or "" are not shown
+  onClear: (key: keyof DashboardFilters) => void; // called with a chip's key by its remove button
+  onClearAll: () => void; // called by the "Clear all" button
+}
+/** Formats one filter as "<label>: <value>"; keys without a display label are shown as-is. */
+function formatFilterEntry(key: string, value: string): string {
+  const displayNames: Record<string, string> = {
+    date_from: "From",
+    date_to: "To",
+    pickup_zip: "Zone",
+    fare_min: "Min fare",
+    fare_max: "Max fare",
+  };
+  return `${displayNames[key] ?? key}: ${value}`;
+}
+/** Row of chips, one per non-empty filter, each with a remove button, followed by a "Clear all" button. */
+export function ActiveFilters({
+  filters,
+  onClear,
+  onClearAll,
+}: ActiveFiltersProps) {
+  const activeEntries = Object.entries(filters).filter(
+    ([, filterValue]) => filterValue !== undefined && filterValue !== "",
+  );
+
+  if (activeEntries.length === 0) return null;
+
+  return (
+    <div className="flex items-center gap-2 flex-wrap rounded-lg border border-border bg-card px-3 py-2">
+      <FilterIcon className="h-3.5 w-3.5 text-muted-foreground shrink-0" />
+      <span className="text-xs font-medium text-muted-foreground">
+        Active Filters:
+      </span>
+      {activeEntries.map(([filterKey, filterValue]) => (
+        <span
+          key={filterKey}
+          className="inline-flex items-center gap-1 rounded-md bg-primary/10 text-primary px-2 py-0.5 text-xs font-medium"
+        >
+          {formatFilterEntry(filterKey, filterValue ?? "")}
+          <button
+            type="button"
+            onClick={() => onClear(filterKey as keyof DashboardFilters)}
+            className="hover:text-primary/70 transition-colors"
+            aria-label={`Remove ${filterKey} filter`}
+          >
+            <XIcon className="h-3 w-3" />
+          </button>
+        </span>
+      ))}
+      <button
+        type="button"
+        onClick={onClearAll}
+        className="text-xs text-muted-foreground hover:text-foreground transition-colors ml-1"
+      >
+        Clear all
+      </button>
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/agent-sidebar.tsx b/apps/dev-playground/client/src/routes/smart-dashboard/components/agent-sidebar.tsx
new file mode 100644
index 000000000..1c3426f88
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/smart-dashboard/components/agent-sidebar.tsx
@@ -0,0 +1,168 @@
+import { BrainIcon, Loader2Icon, RefreshCwIcon } from "lucide-react";
+import { useCallback, useEffect, useRef, useState } from "react";
+import { useAgentStream } from "../hooks/use-agent-stream";
+import type { KPIData } from "../hooks/use-dashboard-data";
+import { AnomalyCard } from "./anomaly-card";
+import { InsightCard } from "./insight-card";
+/** One insight entry; rendered as an InsightCard. */
+interface Insight {
+  title: string;
+  description: string;
+}
+/** One anomaly entry; rendered as an AnomalyCard. */
+interface Anomaly {
+  title: string;
+  description: string;
+  severity: "low" | "medium" | "high";
+}
+/** Props for AgentSidebar. */
+interface AgentSidebarProps {
+  kpis: KPIData | null; // metrics summarized into the prompts sent to both agents
+  kpisLoaded: boolean; // the automatic analysis starts once this is true and kpis is non-null
+}
+/** Parses the first-"[" to last-"]" span of `content` as JSON and returns its object entries ([] if none). */
+function parseAgentJSON<T>(content: string): T[] {
+  const jsonText = content.match(/\[[\s\S]*\]/)?.[0] ?? "[]";
+  try {
+    const parsed: unknown = JSON.parse(jsonText);
+    if (!Array.isArray(parsed)) return [];
+    // Entries are dereferenced (`.title`, ...) during render, so null and primitives are dropped.
+    return parsed.filter((entry) => typeof entry === "object" && entry !== null);
+  } catch {
+    return []; // span was not valid JSON: treat as "no results"
+  }
+}
+/** Builds the comma-separated KPI sentence that is embedded in the prompts sent to the agents. */
+function buildKPISummary(kpis: KPIData): string {
+  const totalTrips = kpis.total_trips.toLocaleString();
+  const zoneTrips = kpis.top_zone_trips.toLocaleString();
+  return (
+    `Total trips: ${totalTrips}, Average fare: $${kpis.avg_fare}, ` +
+    `Average distance: ${kpis.avg_distance} miles, Fare range: $${kpis.min_fare} - $${kpis.max_fare}, ` +
+    `Top pickup zone: ${kpis.top_pickup_zone} (${zoneTrips} trips)`
+  );
+}
+/** Sidebar that sends a KPI summary to the "insights" and "anomaly" agents and lists their parsed results as cards. */
+export function AgentSidebar({ kpis, kpisLoaded }: AgentSidebarProps) {
+  const [insights, setInsights] = useState<Insight[]>([]);
+  const [anomalies, setAnomalies] = useState<Anomaly[]>([]);
+  const hasFired = useRef(false);
+  // One stream per agent; analyze() sends a prompt on each.
+  const insightsStream = useAgentStream({ agentName: "insights" });
+  const anomalyStream = useAgentStream({ agentName: "anomaly" });
+  // Mirror the latest streams and kpis into refs so analyze() can read them with an empty dependency list.
+  const insightsRef = useRef(insightsStream);
+  insightsRef.current = insightsStream;
+  const anomalyRef = useRef(anomalyStream);
+  anomalyRef.current = anomalyStream;
+  const kpisRef = useRef(kpis);
+  kpisRef.current = kpis;
+  // Clears the current cards, resets both streams, then sends each agent its prompt. No-op while kpis is null.
+  const analyze = useCallback(() => {
+    const currentKpis = kpisRef.current;
+    if (!currentKpis) return;
+    const summary = buildKPISummary(currentKpis);
+    setInsights([]);
+    setAnomalies([]);
+    insightsRef.current.reset();
+    anomalyRef.current.reset();
+    insightsRef.current.send(
+      `Here are the current taxi trip metrics: ${summary}. Analyze for interesting patterns and insights.`,
+    );
+    anomalyRef.current.send(
+      `Here are the current taxi trip metrics: ${summary}. Check for anomalies, outliers, or unusual patterns.`,
+    );
+  }, []);
+  // Runs analyze() automatically when KPIs are loaded and hasFired is still false.
+  useEffect(() => {
+    if (kpisLoaded && kpis && !hasFired.current) {
+      hasFired.current = true;
+      analyze();
+    }
+  }, [kpisLoaded, kpis, analyze]);
+  // Once the insights stream is no longer loading and has content, parse that content into cards.
+  useEffect(() => {
+    if (!insightsStream.isLoading && insightsStream.content) {
+      setInsights(parseAgentJSON<Insight>(insightsStream.content));
+    }
+  }, [insightsStream.isLoading, insightsStream.content]);
+  // Same handling for the anomaly stream.
+  useEffect(() => {
+    if (!anomalyStream.isLoading && anomalyStream.content) {
+      setAnomalies(parseAgentJSON<Anomaly>(anomalyStream.content));
+    }
+  }, [anomalyStream.isLoading, anomalyStream.content]);
+
+  const isAnalyzing = insightsStream.isLoading || anomalyStream.isLoading;
+
+  return (
+    <div className="rounded-xl border border-border bg-card shadow-sm flex flex-col h-full">
+      <div className="flex items-center justify-between px-4 py-3 border-b border-border">
+        <div className="flex items-center gap-2">
+          <BrainIcon className="h-4 w-4 text-primary" />
+          <span className="text-sm font-semibold text-foreground">
+            Agent Feed
+          </span>
+        </div>
+        <button
+          type="button"
+          onClick={() => {
+            hasFired.current = false; // NOTE(review): analyze() does not set this back, so the auto-run effect can fire again on the next kpis change — confirm intended
+            analyze();
+          }}
+          disabled={isAnalyzing}
+          className="p-1.5 rounded-md hover:bg-muted text-muted-foreground hover:text-foreground transition-colors disabled:opacity-50"
+          aria-label="Refresh analysis"
+        >
+          <RefreshCwIcon
+            className={`h-3.5 w-3.5 ${isAnalyzing ? "animate-spin" : ""}`}
+          />
+        </button>
+      </div>
+
+      <div className="flex-1 overflow-y-auto p-3 space-y-2.5">
+        {isAnalyzing && insights.length === 0 && anomalies.length === 0 && (
+          <div className="flex flex-col items-center justify-center py-8 text-muted-foreground">
+            <Loader2Icon className="h-5 w-5 animate-spin mb-2" />
+            <p className="text-xs">Analyzing data...</p>
+          </div>
+        )}
+
+        {!isAnalyzing &&
+          insights.length === 0 &&
+          anomalies.length === 0 &&
+          !kpisLoaded && (
+            <p className="text-xs text-muted-foreground text-center py-8">
+              Loading dashboard data...
+            </p>
+          )}
+
+        {!isAnalyzing &&
+          insights.length === 0 &&
+          anomalies.length === 0 &&
+          kpisLoaded && (
+            <p className="text-xs text-muted-foreground text-center py-8">
+              Click refresh to analyze the data
+            </p>
+          )}
+
+        {insights.map((insight) => (
+          <InsightCard
+            key={`insight-${insight.title}`}
+            title={insight.title}
+            description={insight.description}
+          />
+        ))}
+
+        {anomalies.map((anomaly) => (
+          <AnomalyCard
+            key={`anomaly-${anomaly.title}`}
+            title={anomaly.title}
+            description={anomaly.description}
+            severity={anomaly.severity}
+          />
+        ))}
+      </div>
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/anomaly-card.tsx b/apps/dev-playground/client/src/routes/smart-dashboard/components/anomaly-card.tsx
new file mode 100644
index 000000000..72c8f0ef2
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/smart-dashboard/components/anomaly-card.tsx
@@ -0,0 +1,68 @@
+import { AlertTriangleIcon } from "lucide-react";
+/** Severity levels that have an entry in SEVERITY_STYLES. */
+type Severity = "low" | "medium" | "high";
+/** Props for AnomalyCard; all three values are rendered as text, and severity also selects the colors. */
+interface AnomalyCardProps {
+  title: string;
+  description: string;
+  severity: Severity;
+}
+/** Class names per severity: card border, card background, icon color, and severity badge colors. */
+const SEVERITY_STYLES: Record<
+  Severity,
+  { border: string; bg: string; icon: string; badge: string }
+> = {
+  low: {
+    border: "border-yellow-200 dark:border-yellow-900",
+    bg: "bg-yellow-50/50 dark:bg-yellow-950/30",
+    icon: "text-yellow-500",
+    badge:
+      "bg-yellow-100 text-yellow-700 dark:bg-yellow-900/50 dark:text-yellow-400",
+  },
+  medium: {
+    border: "border-orange-200 dark:border-orange-900",
+    bg: "bg-orange-50/50 dark:bg-orange-950/30",
+    icon: "text-orange-500",
+    badge:
+      "bg-orange-100 text-orange-700 dark:bg-orange-900/50 dark:text-orange-400",
+  },
+  high: {
+    border: "border-red-200 dark:border-red-900",
+    bg: "bg-red-50/50 dark:bg-red-950/30",
+    icon: "text-red-500",
+    badge: "bg-red-100 text-red-700 dark:bg-red-900/50 dark:text-red-400",
+  },
+};
+/** Card for one anomaly: warning icon, title with a severity badge, and description, colored by severity. */
+export function AnomalyCard({
+  title,
+  description,
+  severity,
+}: AnomalyCardProps) {
+  // severity is not validated at runtime; an unknown value falls back to "low" styling instead of throwing below.
+  const styles = SEVERITY_STYLES[severity] ?? SEVERITY_STYLES.low;
+  return (
+    <div className={`rounded-lg border ${styles.border} ${styles.bg} p-3`}>
+      <div className="flex items-start gap-2">
+        <AlertTriangleIcon
+          className={`h-4 w-4 ${styles.icon} mt-0.5 shrink-0`}
+        />
+        <div className="min-w-0">
+          <div className="flex items-center gap-2">
+            <p className="text-sm font-medium text-foreground leading-tight">
+              {title}
+            </p>
+            <span
+              className={`text-[10px] font-medium px-1.5 py-0.5 rounded ${styles.badge}`}
+            >
+              {severity}
+            </span>
+          </div>
+          <p className="text-xs text-muted-foreground mt-1 leading-relaxed">
+            {description}
+          </p>
+        </div>
+      </div>
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/fare-chart.tsx b/apps/dev-playground/client/src/routes/smart-dashboard/components/fare-chart.tsx
new file mode 100644
index 000000000..383174aec
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/smart-dashboard/components/fare-chart.tsx
@@ -0,0 +1,78 @@
+import {
+  Bar,
+  BarChart,
+  CartesianGrid,
+  ResponsiveContainer,
+  Tooltip,
+  XAxis,
+  YAxis,
+} from "recharts";
+import { useChartColors } from "../hooks/use-chart-colors";
+import type { FareBucket } from "../hooks/use-dashboard-data";
+/** Props for FareChart. */
+interface FareChartProps {
+  data: FareBucket[]; // charted with `fare_bucket` on the x-axis and `trip_count` as the bar value
+  isLoading: boolean; // when true a pulsing placeholder is rendered instead of the chart
+}
+/** "Fare Distribution" card: a pulsing placeholder while loading, otherwise a bar chart of trip_count per fare_bucket. */
+export function FareChart({ data, isLoading }: FareChartProps) {
+  const colors = useChartColors();
+  const axisTick = { fontSize: 11, fill: colors.axis };
+  const tooltipText = { color: colors.tooltipFg };
+  // Y-axis ticks of 1000 or more are abbreviated to whole thousands, e.g. "12K".
+  const formatTick = (v: number) =>
+    v >= 1000 ? `${(v / 1000).toFixed(0)}K` : String(v);
+
+  return (
+    <div className="rounded-xl border border-border bg-card p-5 shadow-sm">
+      <h3 className="text-sm font-medium text-muted-foreground mb-4">
+        Fare Distribution
+      </h3>
+      {isLoading ? (
+        <div className="h-[260px] flex items-center justify-center">
+          <div className="h-full w-full animate-pulse rounded bg-muted" />
+        </div>
+      ) : (
+        <ResponsiveContainer width="100%" height={260}>
+          <BarChart
+            data={data}
+            margin={{ top: 5, right: 20, bottom: 5, left: 0 }}
+          >
+            <CartesianGrid strokeDasharray="3 3" stroke={colors.grid} />
+            <XAxis
+              dataKey="fare_bucket"
+              tick={axisTick}
+              stroke={colors.grid}
+            />
+            <YAxis
+              tick={axisTick}
+              stroke={colors.grid}
+              tickFormatter={formatTick}
+            />
+            <Tooltip
+              contentStyle={{
+                backgroundColor: colors.tooltipBg,
+                color: colors.tooltipFg,
+                border: `1px solid ${colors.grid}`,
+                borderRadius: "8px",
+                fontSize: "12px",
+              }}
+              labelStyle={tooltipText}
+              itemStyle={tooltipText}
+              formatter={(value: number, name: string) =>
+                name === "trip_count"
+                  ? [value.toLocaleString(), "Trips"]
+                  : [value, name]
+              }
+            />
+            <Bar
+              dataKey="trip_count"
+              fill={colors.secondary}
+              radius={[4, 4, 0, 0]}
+            />
+          </BarChart>
+        </ResponsiveContainer>
+      )}
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/insight-card.tsx b/apps/dev-playground/client/src/routes/smart-dashboard/components/insight-card.tsx
new file mode 100644
index 000000000..b17b44d70
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/smart-dashboard/components/insight-card.tsx
@@ -0,0 +1,24 @@
+import { LightbulbIcon } from "lucide-react";
+/** Props for InsightCard; both strings are rendered as text. */
+interface InsightCardProps {
+  title: string;
+  description: string;
+}
+/** Blue-tinted card showing a lightbulb icon beside an insight's title and description. */
+export function InsightCard(props: InsightCardProps) {
+  const { title, description } = props;
+
+  return (
+    <div className="rounded-lg border border-blue-200 dark:border-blue-900 bg-blue-50/50 dark:bg-blue-950/30 p-3">
+      <div className="flex items-start gap-2">
+        <LightbulbIcon className="h-4 w-4 text-blue-500 mt-0.5 shrink-0" />
+        <div className="min-w-0">
+          <p className="text-sm font-medium text-foreground leading-tight">{title}</p>
+          <p className="text-xs text-muted-foreground mt-1 leading-relaxed">
+            {description}
+          </p>
+        </div>
+      </div>
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/kpi-cards.tsx b/apps/dev-playground/client/src/routes/smart-dashboard/components/kpi-cards.tsx
new file mode 100644
index 000000000..9ef8e932a
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/smart-dashboard/components/kpi-cards.tsx
@@ -0,0 +1,81 @@
+import { CarIcon, DollarSignIcon, MapPinIcon, RulerIcon } from "lucide-react";
+import type { KPIData } from "../hooks/use-dashboard-data";
+/** Props for KPICards. */
+interface KPICardsProps {
+  data: KPIData | null; // while null every card shows "--"
+  isLoading: boolean; // forwarded to every card
+}
+/** Props for a single KPICard. */
+interface CardProps {
+  title: string;
+  value: string;
+  subtitle?: string; // rendered under the value only when truthy
+  icon: React.ReactNode;
+  isLoading: boolean; // when true a pulsing bar replaces value and subtitle
+}
+/** One metric tile: title and icon on top, then the value (with optional subtitle) or a loading bar. */
+function KPICard({ title, value, subtitle, icon, isLoading }: CardProps) {
+  // While loading, a pulsing bar stands in for the value and subtitle.
+  const body = isLoading ? (
+    <div className="h-8 w-24 animate-pulse rounded bg-muted" />
+  ) : (
+    <>
+      <p className="text-2xl font-bold text-foreground">{value}</p>
+      {subtitle && (
+        <p className="text-xs text-muted-foreground mt-1">{subtitle}</p>
+      )}
+    </>
+  );
+  return (
+    <div className="rounded-xl border border-border bg-card p-5 shadow-sm">
+      <div className="flex items-center justify-between mb-3">
+        <span className="text-sm font-medium text-muted-foreground">{title}</span>
+        <span className="text-muted-foreground/60">{icon}</span>
+      </div>
+      {body}
+    </div>
+  );
+}
+/** Compact count label: "1.2M", "3.4K", or the plain localized number below 1,000. */
+function formatNumber(n: number): string {
+  if (n >= 1_000_000) return `${(n / 1_000_000).toFixed(1)}M`;
+  const thousands = (n / 1_000).toFixed(1); // "1000.0" means rounding reached the millions tier
+  if (n >= 1_000) return thousands === "1000.0" ? "1.0M" : `${thousands}K`;
+  return n.toLocaleString();
+}
+/** Grid of the four KPI tiles; values show "--" while `data` is null. */
+export function KPICards({ data, isLoading }: KPICardsProps) {
+  const iconClass = "h-5 w-5";
+  const cards: Omit<CardProps, "isLoading">[] = [
+    {
+      title: "Total Trips",
+      value: data ? formatNumber(data.total_trips) : "--",
+      icon: <CarIcon className={iconClass} />,
+    },
+    {
+      title: "Avg Fare",
+      value: data ? `$${data.avg_fare}` : "--",
+      subtitle: data ? `Range: $${data.min_fare} - $${data.max_fare}` : undefined,
+      icon: <DollarSignIcon className={iconClass} />,
+    },
+    {
+      title: "Avg Distance",
+      value: data ? `${data.avg_distance} mi` : "--",
+      icon: <RulerIcon className={iconClass} />,
+    },
+    {
+      title: "Top Pickup Zone",
+      value: data?.top_pickup_zone ?? "--",
+      subtitle: data ? `${formatNumber(data.top_zone_trips)} trips` : undefined,
+      icon: <MapPinIcon className={iconClass} />,
+    },
+  ];
+
+  return (
+    <div className="grid grid-cols-2 lg:grid-cols-4 gap-4">
+      {cards.map((card) => (
+        <KPICard key={card.title} {...card} isLoading={isLoading} />
+      ))}
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/query-section.tsx b/apps/dev-playground/client/src/routes/smart-dashboard/components/query-section.tsx
new file mode 100644
index 000000000..80612ff6a
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/smart-dashboard/components/query-section.tsx
@@ -0,0 +1,163 @@
+import {
+  FilterIcon,
+  HighlighterIcon,
+  Loader2Icon,
+  SearchIcon,
+  SendIcon,
+  SparklesIcon,
+} from "lucide-react";
+import { useCallback, useState } from "react";
+import type { SSEEvent } from "../hooks/use-agent-stream";
+import { useAgentStream } from "../hooks/use-agent-stream";
+/** Props for QuerySection. */
+interface QuerySectionProps {
+  onEvent?: (event: SSEEvent) => void; // forwarded to useAgentStream
+}
+/** Sample prompts rendered as one-click buttons in the tips panel. */
+const EXAMPLE_QUERIES = [
+  "What's the busiest day of the week?",
+  "Filter to only trips from February 2016",
+  "Highlight Jan 10-15 on the chart",
+  "Show trips over $50 and highlight the peak",
+];
+/** Query box for the "query" agent: tips panel with example prompts, input form, and the agent's reply text. */
+export function QuerySection({ onEvent }: QuerySectionProps) {
+  const [input, setInput] = useState("");
+  const [showTips, setShowTips] = useState(true);
+  const { content, isLoading, send } = useAgentStream({
+    agentName: "query",
+    onEvent,
+  });
+  // Form submit: ignore blank input or an in-flight request; otherwise clear the input, hide the tips and send.
+  const handleSubmit = useCallback(
+    (e: React.FormEvent) => {
+      e.preventDefault();
+      if (!input.trim() || isLoading) return;
+      const message = input.trim();
+      setInput("");
+      setShowTips(false);
+      send(message);
+    },
+    [input, isLoading, send],
+  );
+  // Example button: same flow as submit, but sends the clicked example text.
+  const handleExample = useCallback(
+    (query: string) => {
+      if (isLoading) return;
+      setInput("");
+      setShowTips(false);
+      send(query);
+    },
+    [isLoading, send],
+  );
+
+  return (
+    <div className="rounded-xl border border-border bg-card p-5 shadow-sm">
+      <div className="flex items-center justify-between mb-4">
+        <div className="flex items-center gap-2">
+          <SearchIcon className="h-4 w-4 text-primary" />
+          <h3 className="text-sm font-semibold text-foreground">
+            Ask about the data
+          </h3>
+          <span className="text-xs text-muted-foreground">
+            — powered by the Query Agent
+          </span>
+        </div>
+        <button
+          type="button"
+          onClick={() => setShowTips((v) => !v)}
+          className="text-xs text-muted-foreground hover:text-foreground transition-colors"
+        >
+          {showTips ? "Hide tips" : "Show tips"}
+        </button>
+      </div>
+
+      {showTips && (
+        <div className="mb-4 rounded-lg border border-dashed border-border bg-muted/20 p-3">
+          <p className="text-xs font-medium text-muted-foreground mb-2 flex items-center gap-1.5">
+            <SparklesIcon className="h-3.5 w-3.5" />
+            This agent can control the dashboard directly
+          </p>
+          <div className="grid grid-cols-1 sm:grid-cols-2 gap-2 mb-3">
+            <div className="flex items-start gap-2">
+              <FilterIcon className="h-3.5 w-3.5 text-blue-500 mt-0.5 shrink-0" />
+              <div>
+                <p className="text-xs font-medium text-foreground">
+                  Filter data
+                </p>
+                <p className="text-[11px] text-muted-foreground">
+                  Ask to filter by date range, zone, or fare amount and the
+                  dashboard KPIs and charts will update live.
+                </p>
+              </div>
+            </div>
+            <div className="flex items-start gap-2">
+              <HighlighterIcon className="h-3.5 w-3.5 text-amber-500 mt-0.5 shrink-0" />
+              <div>
+                <p className="text-xs font-medium text-foreground">
+                  Highlight periods
+                </p>
+                <p className="text-[11px] text-muted-foreground">
+                  Ask to highlight a date range and a shaded overlay will appear
+                  on the Trips Over Time chart.
+                </p>
+              </div>
+            </div>
+          </div>
+          <div className="flex flex-wrap gap-1.5">
+            {EXAMPLE_QUERIES.map((q) => (
+              <button
+                key={q}
+                type="button"
+                onClick={() => handleExample(q)}
+                disabled={isLoading}
+                className="rounded-md border border-border bg-background px-2 py-1 text-[11px] text-muted-foreground hover:text-foreground hover:border-primary/40 transition-colors disabled:opacity-50"
+              >
+                {q}
+              </button>
+            ))}
+          </div>
+        </div>
+      )}
+
+      <form onSubmit={handleSubmit} className="flex gap-2 mb-4">
+        <input
+          type="text"
+          value={input}
+          onChange={(e) => setInput(e.target.value)}
+          placeholder='Try "Filter to January 2016" or "Highlight the busiest week"'
+          disabled={isLoading}
+          className="flex-1 rounded-lg border border-border bg-background px-3 py-2 text-sm text-foreground placeholder:text-muted-foreground focus:outline-none focus:ring-2 focus:ring-ring disabled:opacity-50"
+        />
+        <button
+          type="submit"
+          disabled={isLoading || !input.trim()}
+          className="inline-flex items-center gap-1.5 rounded-lg bg-primary px-4 py-2 text-sm font-medium text-primary-foreground hover:bg-primary/90 disabled:opacity-50 transition-colors"
+        >
+          {isLoading ? (
+            <Loader2Icon className="h-4 w-4 animate-spin" />
+          ) : (
+            <SendIcon className="h-4 w-4" />
+          )}
+          Ask
+        </button>
+      </form>
+
+      {(content || isLoading) && (
+        <div className="rounded-lg border border-border bg-muted/30 p-4 max-h-[300px] overflow-y-auto">
+          {isLoading && !content && (
+            <div className="flex items-center gap-2 text-muted-foreground">
+              <Loader2Icon className="h-4 w-4 animate-spin" />
+              <span className="text-sm">Thinking...</span>
+            </div>
+          )}
+          {content && (
+            <div className="text-sm text-foreground whitespace-pre-wrap leading-relaxed">
+              {content}
+            </div>
+          )}
+        </div>
+      )}
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/trip-chart.tsx b/apps/dev-playground/client/src/routes/smart-dashboard/components/trip-chart.tsx
new file mode 100644
index 000000000..89f365f10
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/smart-dashboard/components/trip-chart.tsx
@@ -0,0 +1,144 @@
+import { useId } from "react";
+import {
+  Area,
+  AreaChart,
+  CartesianGrid,
+  ReferenceArea,
+  ResponsiveContainer,
+  Tooltip,
+  XAxis,
+  YAxis,
+} from "recharts";
+import type { Highlight } from "../hooks/use-action-dispatcher";
+import { useChartColors } from "../hooks/use-chart-colors";
+import type { TripOverTime } from "../hooks/use-dashboard-data";
+/** Props for TripChart. */
+interface TripChartProps {
+  data: TripOverTime[]; // plotted with `trip_date` on the x-axis and `trip_count` as the area value
+  highlights: Highlight[]; // each one is drawn as a shaded ReferenceArea
+  isLoading: boolean; // when true a pulsing placeholder is rendered instead of the chart
+}
+/** Fill color used for each Highlight color name. */
+const HIGHLIGHT_COLORS: Record<Highlight["color"], string> = {
+  blue: "rgba(96, 165, 250, 0.25)",
+  red: "rgba(248, 113, 113, 0.25)",
+  yellow: "rgba(250, 204, 21, 0.25)",
+};
+/** Formats a date string as e.g. "Jan 10". Date-only strings are parsed as UTC, so they are rendered in UTC too. */
+function formatDate(dateStr: string): string {
+  const timeZone = /^\d{4}-\d{2}-\d{2}$/.test(dateStr) ? "UTC" : undefined;
+  return new Date(dateStr).toLocaleDateString("en-US", { month: "short", day: "numeric", timeZone });
+}
+/** Picks the date nearest `target` on the allowed side ("start": at/before, "end": at/after), else the first/last entry. */
+function findClosestDate(
+  target: string,
+  dates: string[],
+  direction: "start" | "end",
+): string | undefined {
+  if (dates.length === 0) return undefined;
+  const wantStart = direction === "start";
+  const targetMs = new Date(target).getTime();
+  let winner: string | undefined;
+  let smallestGap = Number.POSITIVE_INFINITY;
+  for (const candidate of dates) {
+    const candidateMs = new Date(candidate).getTime();
+    const onAllowedSide = wantStart ? candidateMs <= targetMs : candidateMs >= targetMs;
+    const gap = Math.abs(candidateMs - targetMs);
+    if (!onAllowedSide || !(gap < smallestGap)) continue;
+    winner = candidate;
+    smallestGap = gap;
+  }
+  return winner ?? dates[wantStart ? 0 : dates.length - 1];
+}
+/** "Trips Over Time" area chart with optional shaded highlight ranges; shows a pulsing placeholder while loading. */
+export function TripChart({ data, highlights, isLoading }: TripChartProps) {
+  const gradientId = useId();
+  const c = useChartColors();
+  const dates = data.map((d) => d.trip_date);
+  // Loading state: card shell with a pulsing placeholder instead of the chart.
+  if (isLoading) {
+    return (
+      <div className="rounded-xl border border-border bg-card p-5 shadow-sm">
+        <h3 className="text-sm font-medium text-muted-foreground mb-4">
+          Trips Over Time
+        </h3>
+        <div className="h-[260px] flex items-center justify-center">
+          <div className="h-full w-full animate-pulse rounded bg-muted" />
+        </div>
+      </div>
+    );
+  }
+  // Loaded state: area chart of trip_count by trip_date, with highlight bounds snapped to plotted dates.
+  return (
+    <div className="rounded-xl border border-border bg-card p-5 shadow-sm">
+      <h3 className="text-sm font-medium text-muted-foreground mb-4">
+        Trips Over Time
+      </h3>
+      <ResponsiveContainer width="100%" height={260}>
+        <AreaChart
+          data={data}
+          margin={{ top: 5, right: 20, bottom: 5, left: 0 }}
+        >
+          <defs>
+            <linearGradient id={gradientId} x1="0" y1="0" x2="0" y2="1">
+              <stop offset="5%" stopColor={c.primary} stopOpacity={0.3} />
+              <stop offset="95%" stopColor={c.primary} stopOpacity={0} />
+            </linearGradient>
+          </defs>
+          <CartesianGrid strokeDasharray="3 3" stroke={c.grid} />
+          <XAxis
+            dataKey="trip_date"
+            tickFormatter={formatDate}
+            tick={{ fontSize: 11, fill: c.axis }}
+            stroke={c.grid}
+          />
+          <YAxis
+            tick={{ fontSize: 11, fill: c.axis }}
+            stroke={c.grid}
+            tickFormatter={(v: number) =>
+              v >= 1000 ? `${(v / 1000).toFixed(0)}K` : String(v)
+            }
+          />
+          <Tooltip
+            contentStyle={{
+              backgroundColor: c.tooltipBg,
+              color: c.tooltipFg,
+              border: `1px solid ${c.grid}`,
+              borderRadius: "8px",
+              fontSize: "12px",
+            }}
+            labelStyle={{ color: c.tooltipFg }}
+            itemStyle={{ color: c.tooltipFg }}
+            labelFormatter={formatDate}
+            formatter={(value: number) => [value.toLocaleString(), "Trips"]}
+          />
+          {highlights.map((h, i) => {
+            const x1 = findClosestDate(h.start, dates, "start");
+            const x2 = findClosestDate(h.end, dates, "end");
+            if (!x1 || !x2) return null; // no plotted date to anchor this highlight to
+            return (
+              <ReferenceArea
+                key={`${h.start}-${h.end}-${i}`}
+                x1={x1}
+                x2={x2}
+                fill={HIGHLIGHT_COLORS[h.color]}
+                label={
+                  h.label
+                    ? { value: h.label, position: "top", fontSize: 11 }
+                    : undefined
+                }
+              />
+            );
+          })}
+          <Area
+            type="monotone"
+            dataKey="trip_count"
+            stroke={c.primary}
+            fill={`url(#${gradientId})`}
+            strokeWidth={2}
+          />
+        </AreaChart>
+      </ResponsiveContainer>
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-action-dispatcher.ts b/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-action-dispatcher.ts
new file mode 100644
index 000000000..c15b86379
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-action-dispatcher.ts
@@ -0,0 +1,88 @@
+import { useCallback } from "react";
+import type { SSEEvent } from "./use-agent-stream";
+import type { DashboardFilters } from "./use-dashboard-data";
+/** A date span to highlight, as passed to onHighlight. */
+export interface Highlight {
+  start: string;
+  end: string;
+  color: "blue" | "red" | "yellow";
+  label?: string;
+}
+/** Tool names this dispatcher reacts to; function calls with any other name are ignored. */
+const DASHBOARD_TOOLS = new Set(["apply_filter", "highlight_period"]);
+/** Inputs to useActionDispatcher. */
+interface UseActionDispatcherOptions {
+  onFilterChange: (filters: DashboardFilters) => void; // receives a copy of currentFilters with the tool's change applied
+  onHighlight: (highlight: Highlight) => void; // receives the highlight described by a highlight_period call
+  currentFilters: DashboardFilters; // base that apply_filter changes are merged onto
+}
+/** Returns `handleEvent`, which maps apply_filter / highlight_period tool calls in agent events onto the callbacks. */
+export function useActionDispatcher({
+  onFilterChange,
+  onHighlight,
+  currentFilters,
+}: UseActionDispatcherOptions) {
+  const handleEvent = useCallback(
+    (event: SSEEvent) => {
+      if (
+        event.type !== "response.output_item.added" &&
+        event.type !== "response.output_item.done"
+      )
+        return;
+      if (event.item?.type !== "function_call") return;
+      const toolName = event.item.name;
+      if (!toolName || !DASHBOARD_TOOLS.has(toolName)) return;
+
+      let args: Record<string, unknown>;
+      try {
+        args = JSON.parse(event.item.arguments ?? "{}");
+      } catch {
+        return;
+      }
+      if (typeof args !== "object" || args === null) return; // valid JSON that is not an object (e.g. null) is ignored too
+
+      if (toolName === "apply_filter") {
+        const field = args.field as string;
+        const operator = args.operator as string;
+        const value = args.value as string | string[];
+        const newFilters = { ...currentFilters };
+        if (field === "date") {
+          if (operator === "between" && Array.isArray(value)) {
+            newFilters.date_from = value[0];
+            newFilters.date_to = value[1];
+          } else if (operator === "gt") {
+            newFilters.date_from = value as string;
+          } else if (operator === "lt") {
+            newFilters.date_to = value as string;
+          }
+        } else if (field === "pickup_zone" || field === "dropoff_zone") {
+          const zones = Array.isArray(value) ? value.join(",") : value;
+          newFilters.pickup_zip = zones as string;
+        } else if (field === "fare_range") {
+          if (operator === "between" && Array.isArray(value)) {
+            newFilters.fare_min = value[0];
+            newFilters.fare_max = value[1];
+          } else if (operator === "gt") {
+            newFilters.fare_min = value as string;
+          } else if (operator === "lt") {
+            newFilters.fare_max = value as string;
+          }
+        }
+
+        onFilterChange(newFilters);
+      } else if (toolName === "highlight_period") {
+        const { start, end, color, label } = args;
+        if (typeof start !== "string" || typeof end !== "string") return; // a highlight needs both bounds
+        onHighlight({
+          start,
+          end,
+          color: color === "red" || color === "yellow" ? color : "blue",
+          label: typeof label === "string" ? label : undefined,
+        });
+      }
+    },
+    [onFilterChange, onHighlight, currentFilters],
+  );
+
+  return { handleEvent };
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-agent-stream.ts b/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-agent-stream.ts
new file mode 100644
index 000000000..871b8b43c
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-agent-stream.ts
@@ -0,0 +1,177 @@
+import { useCallback, useRef, useState } from "react";
+
+/** One JSON payload parsed from a `data:` line of the agent chat SSE stream. */
+export interface SSEEvent {
+  type: string;
+  delta?: string;
+  item_id?: string;
+  item?: {
+    type?: string;
+    id?: string;
+    call_id?: string;
+    name?: string;
+    arguments?: string;
+    output?: string;
+    status?: string;
+  };
+  content?: string;
+  data?: Record<string, unknown>;
+  error?: string;
+  sequence_number?: number;
+  output_index?: number;
+}
+
+interface UseAgentStreamOptions {
+  /** Sent as `agent` in the chat request body. */
+  agentName: string;
+  /** Invoked once per parsed event, in arrival order. */
+  onEvent?: (event: SSEEvent) => void;
+}
+
+interface UseAgentStreamReturn {
+  /** Concatenated `response.output_text.delta` text, or an `Error: …` message. */
+  content: string;
+  events: SSEEvent[];
+  isLoading: boolean;
+  /** Thread id reported by the latest `appkit.metadata` event, if any. */
+  threadId: string | null;
+  send: (message: string) => Promise<void>;
+  /** Clears `content` and `events`; `threadId` is kept. */
+  reset: () => void;
+}
+
+/**
+ * Parses one line of the SSE body into an event.
+ *
+ * Returns `null` for anything that is not a usable event: non-`data` lines,
+ * empty payloads, the `[DONE]` sentinel, malformed JSON, and payloads that
+ * lack a `type`. The space after `data:` is optional.
+ */
+function parseSSELine(line: string): SSEEvent | null {
+  if (!line.startsWith("data:")) return null;
+  const payload = line.slice(5).trim();
+  if (!payload || payload === "[DONE]") return null;
+  try {
+    const parsed: unknown = JSON.parse(payload);
+    if (typeof parsed !== "object" || parsed === null) return null;
+    const event = parsed as SSEEvent;
+    return event.type ? event : null;
+  } catch {
+    return null;
+  }
+}
+
+/**
+ * Streams a chat turn from `POST /api/agents/chat` and exposes the
+ * accumulated text, the raw event list, and the thread id for follow-ups.
+ */
+export function useAgentStream({
+  agentName,
+  onEvent,
+}: UseAgentStreamOptions): UseAgentStreamReturn {
+  const [content, setContent] = useState("");
+  const [events, setEvents] = useState<SSEEvent[]>([]);
+  const [isLoading, setIsLoading] = useState(false);
+  const [threadId, setThreadId] = useState<string | null>(null);
+  const contentRef = useRef("");
+  // Always call the latest `onEvent` without making `send` depend on it.
+  const onEventRef = useRef(onEvent);
+  onEventRef.current = onEvent;
+
+  const reset = useCallback(() => {
+    setContent("");
+    setEvents([]);
+    contentRef.current = "";
+  }, []);
+
+  const send = useCallback(
+    async (message: string) => {
+      setIsLoading(true);
+      setContent("");
+      setEvents([]);
+      contentRef.current = "";
+
+      const handleLine = (line: string) => {
+        const event = parseSSELine(line);
+        if (!event) return;
+        setEvents((prev) => [...prev, event]);
+        try {
+          onEventRef.current?.(event);
+        } catch (err) {
+          // A faulty consumer must not abort the stream, but should be visible.
+          console.error("useAgentStream: onEvent handler threw", err);
+        }
+
+        if (event.type === "appkit.metadata" && event.data?.threadId) {
+          setThreadId(event.data.threadId as string);
+        }
+        if (event.type === "response.output_text.delta" && event.delta) {
+          contentRef.current += event.delta;
+          setContent(contentRef.current);
+        }
+      };
+
+      try {
+        const res = await fetch("/api/agents/chat", {
+          method: "POST",
+          headers: { "Content-Type": "application/json" },
+          body: JSON.stringify({
+            message,
+            agent: agentName,
+            ...(threadId && { threadId }),
+          }),
+        });
+
+        if (!res.ok) {
+          const errText = await res.text();
+          // Prefer the server's `error` string; otherwise report the status.
+          let detail = `Server returned ${res.status}`;
+          try {
+            const parsed: unknown = JSON.parse(errText);
+            if (
+              typeof parsed === "object" &&
+              parsed !== null &&
+              "error" in parsed &&
+              typeof parsed.error === "string"
+            ) {
+              detail = parsed.error;
+            }
+          } catch {
+            /* non-JSON error body: keep the status fallback */
+          }
+          setContent(`Error: ${detail}`);
+          return;
+        }
+
+        const reader = res.body?.getReader();
+        if (!reader) return;
+
+        const decoder = new TextDecoder();
+        let buffer = "";
+
+        while (true) {
+          const { done, value } = await reader.read();
+          if (done) break;
+          buffer += decoder.decode(value, { stream: true });
+          const lines = buffer.split("\n");
+          buffer = lines.pop() ?? "";
+          for (const line of lines) handleLine(line);
+        }
+
+        // Flush bytes the decoder is still holding, then the final line if
+        // the stream ended without a trailing newline.
+        buffer += decoder.decode();
+        if (buffer) handleLine(buffer);
+      } catch (err) {
+        setContent(
+          `Error: ${err instanceof Error ? err.message : "Unknown error"}`,
+        );
+      } finally {
+        setIsLoading(false);
+      }
+    },
+    [agentName, threadId],
+  );
+
+  return { content, events, isLoading, threadId, send, reset };
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-chart-colors.ts b/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-chart-colors.ts
new file mode 100644
index 000000000..3403b1c1e
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-chart-colors.ts
@@ -0,0 +1,63 @@
+import { useEffect, useState } from "react";
+
+/** Colour tokens consumed by the dashboard charts. */
+interface ChartColors {
+  primary: string;
+  secondary: string;
+  grid: string;
+  axis: string;
+  tooltipBg: string;
+  tooltipFg: string;
+}
+
+const LIGHT: ChartColors = {
+  primary: "hsl(221, 83%, 53%)",
+  secondary: "hsl(142, 71%, 45%)",
+  grid: "hsl(220, 13%, 91%)",
+  axis: "hsl(215, 16%, 47%)",
+  tooltipBg: "hsl(0, 0%, 100%)",
+  tooltipFg: "hsl(222, 47%, 11%)",
+};
+
+const DARK: ChartColors = {
+  primary: "hsl(217, 91%, 70%)",
+  secondary: "hsl(152, 69%, 55%)",
+  grid: "hsl(215, 14%, 25%)",
+  axis: "hsl(217, 20%, 70%)",
+  tooltipBg: "hsl(224, 71%, 4%)",
+  tooltipFg: "hsl(210, 40%, 96%)",
+};
+
+/** True when the root element carries the `dark` class. */
+function isDark(): boolean {
+  const { classList } = document.documentElement;
+  return classList.contains("dark");
+}
+
+/** Palette for whichever theme is active right now. */
+function activePalette(): ChartColors {
+  return isDark() ? DARK : LIGHT;
+}
+
+/**
+ * Returns the palette for the current theme and swaps it whenever the
+ * root element's `class` attribute changes.
+ */
+export function useChartColors(): ChartColors {
+  const [colors, setColors] = useState<ChartColors>(activePalette);
+
+  useEffect(() => {
+    const themeObserver = new MutationObserver(() => {
+      setColors(activePalette());
+    });
+    themeObserver.observe(document.documentElement, {
+      attributes: true,
+      attributeFilter: ["class"],
+    });
+    return () => {
+      themeObserver.disconnect();
+    };
+  }, []);
+
+  return colors;
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-dashboard-data.ts b/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-dashboard-data.ts
new file mode 100644
index 000000000..5a3a89fd1
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-dashboard-data.ts
@@ -0,0 +1,131 @@
+import { sql } from "@databricks/appkit-ui/js";
+import { useAnalyticsQuery } from "@databricks/appkit-ui/react";
+import { useMemo } from "react";
+
+/** Row returned by the `dashboard_kpis` query. */
+interface KPIRawRow {
+  total_trips: number;
+  avg_fare: number;
+  avg_distance: number;
+  max_fare: number;
+  min_fare: number;
+}
+
+/** Row returned by the `dashboard_top_zone` query. */
+interface TopZoneData {
+  pickup_zip: string;
+  trip_count: number;
+}
+
+/** KPI row merged with the busiest pickup zone. */
+export type KPIData = KPIRawRow & {
+  top_pickup_zone: string;
+  top_zone_trips: number;
+};
+
+/** Row returned by the `dashboard_trips_over_time` query. */
+export interface TripOverTime {
+  trip_date: string;
+  trip_count: number;
+  avg_fare: number;
+  total_revenue: number;
+}
+
+/** Row returned by the `dashboard_fare_distribution` query. */
+export interface FareBucket {
+  fare_bucket: string;
+  trip_count: number;
+  avg_distance: number;
+}
+
+/** Optional dashboard filters; an unset field is sent as "all". */
+export interface DashboardFilters {
+  date_from?: string;
+  date_to?: string;
+  pickup_zip?: string;
+  fare_min?: string;
+  fare_max?: string;
+}
+
+/** Shape every `useAnalyticsQuery` result is narrowed to in this module. */
+type QueryResult<Row> = {
+  data: Row[] | null;
+  loading: boolean;
+  error: string | null;
+};
+
+/** Value sent for a filter that is not set. */
+const NO_FILTER = "all";
+
+/** Maps filters to query parameters, using `NO_FILTER` for unset fields. */
+function buildParams(filters: DashboardFilters) {
+  const { date_from, date_to, pickup_zip, fare_min, fare_max } = filters;
+  return {
+    dateFrom: sql.string(date_from ?? NO_FILTER),
+    dateTo: sql.string(date_to ?? NO_FILTER),
+    pickupZip: sql.string(pickup_zip ?? NO_FILTER),
+    fareMin: sql.string(fare_min ?? NO_FILTER),
+    fareMax: sql.string(fare_max ?? NO_FILTER),
+  };
+}
+
+/**
+ * Runs the four dashboard queries for `filters` and returns the merged KPI
+ * row, both chart series, a combined loading flag and the first error.
+ */
+export function useDashboardData(filters: DashboardFilters) {
+  const params = useMemo(() => buildParams(filters), [filters]);
+
+  const kpiQuery = useAnalyticsQuery(
+    "dashboard_kpis",
+    params,
+  ) as QueryResult<KPIRawRow>;
+  const topZoneQuery = useAnalyticsQuery(
+    "dashboard_top_zone",
+    params,
+  ) as QueryResult<TopZoneData>;
+
+  // The chart queries receive only the date and zip parameters.
+  const { dateFrom, dateTo, pickupZip } = params;
+  const tripsParams = useMemo(
+    () => ({ dateFrom, dateTo, pickupZip }),
+    [dateFrom, dateTo, pickupZip],
+  );
+
+  const tripsQuery = useAnalyticsQuery(
+    "dashboard_trips_over_time",
+    tripsParams,
+  ) as QueryResult<TripOverTime>;
+  const fareQuery = useAnalyticsQuery(
+    "dashboard_fare_distribution",
+    tripsParams,
+  ) as QueryResult<FareBucket>;
+
+  const kpiRows = kpiQuery.data;
+  const topZoneRows = topZoneQuery.data;
+  const kpis = useMemo(() => {
+    if (!kpiRows || kpiRows.length === 0) return null;
+    const busiest = topZoneRows?.[0];
+    return {
+      ...kpiRows[0],
+      top_pickup_zone: busiest?.pickup_zip ?? "N/A",
+      top_zone_trips: busiest?.trip_count ?? 0,
+    };
+  }, [kpiRows, topZoneRows]);
+
+  return {
+    kpis,
+    tripsOverTime: tripsQuery.data ?? [],
+    fareDistribution: fareQuery.data ?? [],
+    isLoading:
+      kpiQuery.loading ||
+      topZoneQuery.loading ||
+      tripsQuery.loading ||
+      fareQuery.loading,
+    error:
+      kpiQuery.error ||
+      topZoneQuery.error ||
+      tripsQuery.error ||
+      fareQuery.error,
+  };
+}
diff --git a/apps/dev-playground/config/agents/anomaly/agent.md b/apps/dev-playground/config/agents/anomaly/agent.md
new file mode 100644
index 000000000..8dc34c529
--- /dev/null
+++ b/apps/dev-playground/config/agents/anomaly/agent.md
@@ -0,0 +1,9 @@
+---
+endpoint: databricks-gemini-3-1-flash-lite
+maxSteps: 1
+ephemeral: true
+---
+
+You are a data quality monitor for NYC taxi trip data. Given summary statistics, identify anomalies, outliers, or unusual patterns.
+
+Return findings as a JSON array of objects with `title` (string), `severity` ('low' | 'medium' | 'high'), and `description` (string) fields. Output ONLY the JSON array, no other text.
diff --git a/apps/dev-playground/config/agents/insights/agent.md b/apps/dev-playground/config/agents/insights/agent.md
new file mode 100644
index 000000000..dbb02c013
--- /dev/null
+++ b/apps/dev-playground/config/agents/insights/agent.md
@@ -0,0 +1,9 @@
+---
+endpoint: databricks-gemini-3-1-flash-lite
+maxSteps: 1
+ephemeral: true
+---
+
+You are a data analyst specializing in NYC taxi trip data. Given summary statistics, identify the 3-5 most interesting patterns, trends, and notable findings. Be specific with numbers.
+
+Return your findings as a JSON array of objects, each with `title` (string) and `description` (string) fields. Output ONLY the JSON array, no other text.
diff --git a/apps/dev-playground/config/agents/query/agent.md b/apps/dev-playground/config/agents/query/agent.md
new file mode 100644
index 000000000..c60fa0d16
--- /dev/null
+++ b/apps/dev-playground/config/agents/query/agent.md
@@ -0,0 +1,24 @@
+---
+endpoint: databricks-claude-sonnet-4-5
+agents:
+  - sql_analyst
+  - dashboard_pilot
+---
+
+You are the dispatcher for the Smart Dashboard — NYC taxi analytics
+(`samples.nyctaxi.trips`, year 2016 only).
+
+You have two specialists. Delegate by calling the corresponding
+`agent-<name>` tool; do not answer directly when a specialist is a better
+fit.
+
+- `agent-sql_analyst` — writes and runs Databricks SQL to answer data
+  questions ("how many trips last Friday?", "top 5 pickup zones by revenue").
+  Use for any analytical query that requires reading the database.
+- `agent-dashboard_pilot` — manipulates the dashboard UI directly: applies
+  filters, highlights time ranges, scrolls the user to a specific chart.
+  Use when the user says "show me…", "filter to…", "highlight…", "focus
+  on…".
+
+Always explain briefly what you did after a specialist returns. Keep your
+own responses short; the specialists do the heavy lifting.
diff --git a/apps/dev-playground/config/queries/dashboard_fare_distribution.sql b/apps/dev-playground/config/queries/dashboard_fare_distribution.sql
new file mode 100644
index 000000000..98f5ad94e
--- /dev/null
+++ b/apps/dev-playground/config/queries/dashboard_fare_distribution.sql
@@ -0,0 +1,23 @@
+-- @param dateFrom STRING
+-- @param dateTo STRING
+-- @param pickupZip STRING
+SELECT
+  CASE
+    WHEN fare_amount < 5 THEN '$0-5'
+    WHEN fare_amount < 10 THEN '$5-10'
+    WHEN fare_amount < 15 THEN '$10-15'
+    WHEN fare_amount < 20 THEN '$15-20'
+    WHEN fare_amount < 30 THEN '$20-30'
+    WHEN fare_amount < 50 THEN '$30-50'
+    ELSE '$50+'
+  END as fare_bucket,
+  COUNT(*) as trip_count,
+  ROUND(AVG(trip_distance), 2) as avg_distance
+FROM samples.nyctaxi.trips
+WHERE 1 = 1
+  AND (COALESCE(:dateFrom, 'all') = 'all' OR tpep_pickup_datetime >= :dateFrom)
+  AND (COALESCE(:dateTo, 'all') = 'all' OR tpep_pickup_datetime <= :dateTo)
+  -- The zip filter may carry several comma-separated zips - split it so each one is matched
+  AND (COALESCE(:pickupZip, 'all') = 'all' OR pickup_zip IN (SELECT TRIM(zip) FROM (SELECT EXPLODE(SPLIT(:pickupZip, ',')) AS zip) AS zips))
+GROUP BY fare_bucket
+ORDER BY MIN(fare_amount)
diff --git a/apps/dev-playground/config/queries/dashboard_kpis.sql b/apps/dev-playground/config/queries/dashboard_kpis.sql
new file mode 100644
index 000000000..49cd35001
--- /dev/null
+++ b/apps/dev-playground/config/queries/dashboard_kpis.sql
@@ -0,0 +1,19 @@
+-- @param dateFrom STRING
+-- @param dateTo STRING
+-- @param pickupZip STRING
+-- @param fareMin STRING
+-- @param fareMax STRING
+SELECT
+  COUNT(*) as total_trips,
+  ROUND(AVG(fare_amount), 2) as avg_fare,
+  ROUND(AVG(trip_distance), 2) as avg_distance,
+  ROUND(MAX(fare_amount), 2) as max_fare,
+  ROUND(MIN(fare_amount), 2) as min_fare
+FROM samples.nyctaxi.trips
+WHERE 1 = 1
+  AND (COALESCE(:dateFrom, 'all') = 'all' OR tpep_pickup_datetime >= :dateFrom)
+  AND (COALESCE(:dateTo, 'all') = 'all' OR tpep_pickup_datetime <= :dateTo)
+  -- The zip filter may carry several comma-separated zips - split it so each one is matched
+  AND (COALESCE(:pickupZip, 'all') = 'all' OR pickup_zip IN (SELECT TRIM(zip) FROM (SELECT EXPLODE(SPLIT(:pickupZip, ',')) AS zip) AS zips))
+  AND (COALESCE(:fareMin, 'all') = 'all' OR fare_amount >= CAST(:fareMin AS DOUBLE))
+  AND (COALESCE(:fareMax, 'all') = 'all' OR fare_amount <= CAST(:fareMax AS DOUBLE))
diff --git a/apps/dev-playground/config/queries/dashboard_top_zone.sql b/apps/dev-playground/config/queries/dashboard_top_zone.sql
new file mode 100644
index 000000000..2d834ab84
--- /dev/null
+++ b/apps/dev-playground/config/queries/dashboard_top_zone.sql
@@ -0,0 +1,17 @@
+-- @param dateFrom STRING
+-- @param dateTo STRING
+-- @param pickupZip STRING
+-- @param fareMin STRING
+-- @param fareMax STRING
+SELECT pickup_zip, COUNT(*) as trip_count
+FROM samples.nyctaxi.trips
+WHERE 1 = 1
+  AND (COALESCE(:dateFrom, 'all') = 'all' OR tpep_pickup_datetime >= :dateFrom)
+  AND (COALESCE(:dateTo, 'all') = 'all' OR tpep_pickup_datetime <= :dateTo)
+  -- The zip filter may carry several comma-separated zips - split it so each one is matched
+  AND (COALESCE(:pickupZip, 'all') = 'all' OR pickup_zip IN (SELECT TRIM(zip) FROM (SELECT EXPLODE(SPLIT(:pickupZip, ',')) AS zip) AS zips))
+  AND (COALESCE(:fareMin, 'all') = 'all' OR fare_amount >= CAST(:fareMin AS DOUBLE))
+  AND (COALESCE(:fareMax, 'all') = 'all' OR fare_amount <= CAST(:fareMax AS DOUBLE))
+GROUP BY pickup_zip
+ORDER BY trip_count DESC
+LIMIT 1
diff --git a/apps/dev-playground/config/queries/dashboard_trips_over_time.sql b/apps/dev-playground/config/queries/dashboard_trips_over_time.sql
new file mode 100644
index 000000000..d65b3c944
--- /dev/null
+++ b/apps/dev-playground/config/queries/dashboard_trips_over_time.sql
@@ -0,0 +1,17 @@
+-- @param dateFrom STRING
+-- @param dateTo STRING
+-- @param pickupZip STRING
+SELECT
+  DATE(tpep_pickup_datetime) as trip_date,
+  COUNT(*) as trip_count,
+  ROUND(AVG(fare_amount), 2) as avg_fare,
+  ROUND(SUM(fare_amount), 2) as total_revenue
+FROM samples.nyctaxi.trips
+WHERE 1 = 1
+  AND (COALESCE(:dateFrom, 'all') = 'all' OR tpep_pickup_datetime >= :dateFrom)
+  AND (COALESCE(:dateTo, 'all') = 'all' OR tpep_pickup_datetime <= :dateTo)
+  -- The zip filter may carry several comma-separated zips - split it so each one is matched
+  AND (COALESCE(:pickupZip, 'all') = 'all' OR pickup_zip IN (SELECT TRIM(zip) FROM (SELECT EXPLODE(SPLIT(:pickupZip, ',')) AS zip) AS zips))
+GROUP BY DATE(tpep_pickup_datetime)
+ORDER BY trip_date
+LIMIT 60
diff --git a/apps/dev-playground/server/index.ts b/apps/dev-playground/server/index.ts
index cfd6c9eae..6a36ba734 100644
--- a/apps/dev-playground/server/index.ts
+++ b/apps/dev-playground/server/index.ts
@@ -69,6 +69,105 @@ const helper = createAgent({
   },
 });
 
+/*
+ * Smart-Dashboard agents.
+ *
+ * The three agents form a dispatcher pattern for the /smart-dashboard route.
+ * The `query` agent (markdown, in config/agents/query/) routes user
+ * questions to one of two specialists:
+ *
+ * - `sql_analyst` — writes Databricks SQL against `samples.nyctaxi.trips`
+ *   using the analytics plugin's query tool.
+ * - `dashboard_pilot` — emits UI-action tool calls (`apply_filter`,
+ *   `highlight_period`) that the client reads off the SSE stream and
+ *   translates into React state mutations. The server-side handlers are
+ *   intentionally stubs — the tool-call JSON is the action payload.
+ */
+
+/**
+ * UI-action tool: the client applies the filter from the streamed call
+ * arguments; `execute` only returns confirmation text for the model.
+ */
+const apply_filter = tool({
+  name: "apply_filter",
+  description:
+    "Apply a filter to the dashboard data. This updates the KPIs and charts to reflect only the filtered data.",
+  schema: z.object({
+    field: z
+      .enum(["date", "pickup_zone", "dropoff_zone", "fare_range"])
+      .describe("The field to filter on"),
+    operator: z
+      .enum(["eq", "gt", "lt", "between", "in"])
+      .describe("The comparison operator"),
+    value: z
+      .union([z.string(), z.array(z.string())])
+      .describe(
+        "Filter value. For 'between', use an array of two values [start, end]. For 'in', use an array of values.",
+      ),
+  }),
+  execute: async ({ field, operator, value }) => {
+    // Only a "between" pair is a range; other arrays (e.g. "in") are lists.
+    const separator = operator === "between" ? " to " : ", ";
+    const valueStr = Array.isArray(value) ? value.join(separator) : value;
+    return `Filter applied: ${field} ${operator} ${valueStr}. The dashboard will update to reflect this filter.`;
+  },
+});
+
+/**
+ * UI-action tool: the client draws the highlight from the streamed call
+ * arguments; `execute` only returns confirmation text for the model.
+ */
+const highlight_period = tool({
+  name: "highlight_period",
+  description:
+    "Highlight a time period on the dashboard charts to draw attention to a specific date range.",
+  schema: z.object({
+    start: z.string().describe("Start date in ISO format (YYYY-MM-DD)"),
+    end: z.string().describe("End date in ISO format (YYYY-MM-DD)"),
+    color: z
+      .enum(["blue", "red", "yellow"])
+      .optional()
+      .describe("Highlight color. Defaults to blue."),
+    label: z
+      .string()
+      .optional()
+      .describe("Optional label for the highlighted period"),
+  }),
+  execute: async ({ start, end, label }) => {
+    const suffix = label ? ` (${label})` : "";
+    return `Highlighted period ${start} to ${end}${suffix} on the dashboard charts.`;
+  },
+});
+
+/** Specialist that answers data questions with the analytics plugin's tools. */
+const sql_analyst = createAgent({
+  instructions: [
+    "You are a SQL expert for NYC taxi trip data (`samples.nyctaxi.trips`).",
+    "Write Databricks SQL to answer the user's question and summarize the results clearly.",
+    "IMPORTANT: The dataset only contains trips from 2016. Always add `WHERE tpep_pickup_datetime >= '2016-01-01' AND tpep_pickup_datetime < '2017-01-01'` unless the user specifies a narrower date range within 2016.",
+    "If the user asks about dates outside 2016, say the dataset only covers 2016.",
+    "Available columns: tpep_pickup_datetime, tpep_dropoff_datetime, trip_distance, fare_amount, pickup_zip, dropoff_zip.",
+  ].join(" "),
+  tools: {
+    ...fromPlugin(analytics),
+  },
+});
+
+/** Specialist given only the two UI-action tools; it has no query tools. */
+const dashboard_pilot = createAgent({
+  instructions: [
+    "You are the Smart Dashboard pilot. You do not query data — you manipulate the UI.",
+    "Use `apply_filter` to filter the dashboard by date range, zone, or fare range.",
+    "Use `highlight_period` to highlight a time range on the charts.",
+    "When the user asks to 'show me', 'filter to', or 'highlight' something, pick the matching tool and call it.",
+    "Always briefly state what you did after applying an action.",
+  ].join(" "),
+  tools: {
+    apply_filter,
+    highlight_period,
+  },
+});
+
 createApp({
   plugins: [
     server(),
@@ -104,7 +203,12 @@ createApp({
     }),
     jobs(),
     serving(),
-    agents({ agents: { helper } }),
+    agents({
+      agents: { helper, sql_analyst, dashboard_pilot },
+      // `query` (markdown dispatcher) + `sql_analyst` + `dashboard_pilot`
+      // wire the /smart-dashboard route. `insights` and `anomaly` are
+      // ephemeral markdown agents auto-fired by the route's AgentSidebar.
+    }),
     // TODO: re-enable once vector-search is exported from @databricks/appkit
     // vectorSearch({
     //   indexes: {
diff --git a/plans/smart-dashboard-demo.md b/plans/smart-dashboard-demo.md
new file mode 100644
index 000000000..5a7be794e
--- /dev/null
+++ b/plans/smart-dashboard-demo.md
@@ -0,0 +1,365 @@
+# Plan: Smart-Dashboard demo route (retires `agent-app`)
+
+## Goal
+
+Replace `apps/agent-app` with a **new `/smart-dashboard` route inside
+`dev-playground`** that doubles as the integration test for every feature
+in the agents-plugin v2 stack. An analytics dashboard (NYC Taxi data)
+where multiple agents help the user interpret, filter, and highlight data
+in real time, plus a hidden-by-default **Stream Inspector** for observability
+of the SSE pipeline.
+
+The route is **the demo** that makes branches 4/5/6 reviewable end-to-end:
+folder-based markdown agents, `createAgent`, `fromPlugin`, sub-agent
+delegation, human-in-the-loop approval, MCP host policy, DoS limits,
+ephemeral agents — all exercised by one app.
+
+## Locked decisions
+
+| Topic | Choice |
+|---|---|
+| Location | `apps/dev-playground/client/src/routes/smart-dashboard/` + server wiring in `apps/dev-playground/server/index.ts`. **No new app.** |
+| Fate of `agent-app` | **Delete.** Replaced by this route as the sole end-to-end demo. |
+| Domain / data | NYC Taxi samples (`samples.nyctaxi.trips`). Directly reusable from the `p3ju` prototype. |
+| Agent ↔ UI protocol | **SSE tool-call args as action payload.** Agent `tool.execute` is a stub returning confirmation text; the UI reads `function_call` items from the SSE stream and mutates client state. No new primitive. |
+| Interaction level | (c) emitted actions — agent can apply filters, highlight time ranges, focus charts, save views. No server-side dashboard mutation. |
+| Agents (3 + dispatcher) | `query` (markdown dispatcher), `sql_analyst` (code, `fromPlugin(analytics)` + `save_view`), `dashboard_pilot` (code, UI action tools), `insights` + `anomaly` (ephemeral markdown, auto-fire on KPI load) |
+| Sub-agent definition style | **Code** for `sql_analyst` / `dashboard_pilot`. Markdown narrative is already covered by the three markdown agents; code demonstrates the `createAgent` + `fromPlugin` + inline `tool()` engineer path that dev-playground currently doesn't exercise. |
+| Approval flow | `save_view({ name, description? })` annotated `destructive: true`. Fires the HITL card. Server handler is a stub. |
+| Stream inspector | Slide-in right drawer, toggled by ⌘K or a small floating icon. Shows filtered SSE event timeline with args + expandable JSON. **Demo-scoped** — lives under the route directory, not promoted to `appkit-ui`. |
+| Merge strategy | **Into `agent/v2/6-apps-docs`** as the "integration test" payoff of the stack. Not a follow-up PR. |
+| Dev-playground character | Accept that it grows from "feature grab-bag" into "feature grab-bag + one flagship demo route." The route lives in its own subdirectory and doesn't leak into other routes. |
+
+## Non-goals (this iteration)
+
+- Real Databricks AI/BI dashboard embedding.
+- Server-side dashboard state (named views shared across users).
+- WebSocket / bidirectional agent ↔ UI channel. SSE-only.
+- Agents reading dashboard state via tool calls. State flows to the agent
+  via system-prompt context injection only (static).
+- Promoting the stream inspector into `appkit-ui`. Follow-up if the demo lands.
+- MCP hosted tools in this route. The v2 stack already has MCP coverage
+  elsewhere; not worth the extra env-var setup for this demo.
+
+## What exists today (prototype to port)
+
+Source: `/Users/mario.cadenas/.cursor/worktrees/app-kit/p3ju/apps/smart-dashboard/`
+
+- **Server** (`server.ts`, 97 lines) — `query` agent code-defined with
+  `apply_filter` + `highlight_period` tools + `fromPlugin(analytics)`.
+- **Markdown agents** (`config/agents/`) — `anomaly.md` and `insights.md`,
+  ephemeral, `maxSteps: 1`, return JSON.
+- **SQL queries** (`config/queries/`) — `dashboard_kpis.sql`,
+  `dashboard_trips_over_time.sql`, `dashboard_fare_distribution.sql`,
+  `dashboard_top_zone.sql`.
+- **Client** (`src/`, 16 files, 1,544 lines) — `App.tsx`, component set
+  (active-filters, agent-sidebar, anomaly-card, fare-chart, insight-card,
+  kpi-cards, query-section, trip-chart), hooks (`use-agent-stream`,
+  `use-action-dispatcher`, `use-chart-colors`, `use-dashboard-data`).
+
+**~80% copy-forward.** The 20% new is stream inspector, multi-agent
+delegation, dashboard-context injection, `focus_chart`, approval card,
+polish.
+
+## What this plan adds
+
+### 1. Stream Inspector (NEW)
+
+Hidden-by-default right-edge drawer showing the SSE timeline of the latest
+run. Reviewers see tool-calls, message deltas, sub-agent invocations, and
+approval gates inline — the "inside the black box" view.
+
+- **Trigger:** ⌘K (macOS) / Ctrl+K, or a small debug icon in the bottom-right.
+- **Layout:** 420px right drawer, backdrop-blur, slides in.
+- **Content per event:** timestamp (ms relative to stream start), event
+  type, tool name + args table when it's a function call, collapsible
+  full-JSON view.
+- **Filter chips:** `all` / `tool calls` / `messages` / `approvals` / `sub-agents`.
+- **Implementation:** extend `use-agent-stream` to push every event into a
+  module-level store; new `<StreamInspector>` component consumes it.
+- **Scope:** session-only. No persistence, no export.
+
+### 2. Approval-gate demo path
+
+One destructive tool so HITL fires visibly:
+
+- `save_view({ name, description? })` annotated
+  `{ destructive: true, readOnly: false }`.
+- Prompt it with *"save this as 'High-fare Friday 2016'"*.
+- UI renders a rich `<ApprovalCard>` with the view name, description,
+  current filters + highlights summary, annotations chip.
+- Approve → tool returns success, agent confirms. Deny → agent receives
+  the denial string, apologises, replans.
+
+Handler is a stub (console.log + return).
+
+### 3. Dashboard context injection (static)
+
+Every chat message gets a prefix block describing what the user is looking
+at: active filters, highlight ranges, current timerange.
+
+- `buildDashboardContext(filters, highlights): string` utility.
+- `use-agent-stream.send(message, { contextPrefix })` signature extension.
+- `<QuerySection>` composes the prefix before each send.
+
+Pure UX change. No new AppKit primitive.
+
+### 4. Multi-agent delegation (upgrades the `query` agent)
+
+Prototype's `query` is a flat agent with four tools. Upgrade:
+
+- `query` (markdown dispatcher) — decides which specialist to call, never
+  calls tools directly.
+- `sql_analyst` (code) — tools: `...fromPlugin(analytics)`, `save_view`.
+- `dashboard_pilot` (code) — tools: `apply_filter`, `highlight_period`,
+  `focus_chart`.
+
+Dispatcher exposes `agent-sql_analyst` and `agent-dashboard_pilot` as
+sub-agent tools. Default agent: `query`.
+
+This demonstrates:
+- Sub-agent delegation (`agents:` in def)
+- `fromPlugin` + inline `tool()` in code (`sql_analyst`)
+- Tool-only sub-agent with no plugin deps (`dashboard_pilot`)
+- The flat-vs-delegated trade-off (risk: extra round-trip latency — see Risks)
+
+### 5. New UI action tool: `focus_chart({ chart_id })`
+
+Scrolls to the named chart and pulses it. Chart IDs:
+`trips_over_time`, `fare_distribution`, `kpis`.
+
+- `tool()` handler returns a confirmation string.
+- Client `useFocusRegistry` hook: chart components register refs by id.
+- `use-action-dispatcher` listens for `focus_chart` function_call events
+  and triggers the pulse animation.
+
+Zero server logic. Pure action-dispatch demo.
+
+### 6. Polish
+
+- `<ApprovalCard>` renders annotations prominently (red badge for
+  `destructive: true`) plus filter/highlight context.
+- KPI cards use shimmer loading instead of `isLoading` text.
+- Error toasts when SQL fails / agent errors / model endpoint 4xx/5xx.
+- Keyboard: ⌘K (inspector), ⌘L (focus chat input), `Esc` (close drawer).
+- Top-of-route hero: "Smart Dashboard — NYC Taxi analytics, powered by
+  3 AI agents" with tiny indicators for each agent's state.
+
+## Architecture notes
+
+### The agent → UI action pattern
+
+The prototype's core insight: **the agent's tool-call JSON is the action
+payload.** No new AppKit primitive.
+
+```
+Agent emits:   tool_call { name: "apply_filter", args: { field: "date", ... } }
+              ↓ (via SSE response.output_item.added)
+Client reads:  SSEEvent { item: { type: "function_call", name, arguments } }
+Client applies: setFilters(deriveFiltersFromArgs(args))
+Server tool:   execute() returns confirmation text for the LLM log
+```
+
+Benefits preserved:
+- Agent control flow: LLM sees confirmation, plans next step.
+- Client latency: UI updates as tokens stream.
+- Security: no new attack surface; existing SSE pipeline already authed.
+- Observability: stream inspector sees every action inline with everything else.
+
+### Dashboard state flow
+
+```
+User action ─→ useState (filters, highlights) ─→ useDashboardData() ─→ SQL
+                              ↑                                           ↓
+                              └──── tool_call dispatch ←──── SSE ←──── agent
+                                                                          ↑
+                              buildDashboardContext() ─────→ send() ──────┘
+```
+
+One-way reactive loop. Simple, testable.
+
+### File layout (target)
+
+```
+apps/dev-playground/
+  config/
+    agents/
+      query/agent.md              # dispatcher (NEW)
+      insights/agent.md           # ported from prototype
+      anomaly/agent.md            # ported from prototype
+      assistant/agent.md          # existing — unchanged
+      autocomplete/agent.md       # existing — unchanged
+    queries/                      # NEW if not present; check
+      dashboard_kpis.sql
+      dashboard_trips_over_time.sql
+      dashboard_fare_distribution.sql
+      dashboard_top_zone.sql
+  server/
+    index.ts                      # add sql_analyst + dashboard_pilot,
+                                  # wire apply_filter, highlight_period,
+                                  # focus_chart, save_view
+  client/
+    src/
+      routes/
+        smart-dashboard.route.tsx # NEW route entry (registers under /smart-dashboard)
+        smart-dashboard/          # NEW subdirectory
+          components/
+            active-filters.tsx    # ported
+            agent-sidebar.tsx     # ported + inspector toggle
+            approval-card.tsx     # NEW
+            anomaly-card.tsx      # ported
+            fare-chart.tsx        # ported
+            insight-card.tsx      # ported
+            kpi-cards.tsx         # ported + shimmer
+            query-section.tsx     # ported + dashboard-context injection
+            stream-inspector.tsx  # NEW
+            trip-chart.tsx        # ported + focus-pulse
+          hooks/
+            use-action-dispatcher.ts  # ported + focus_chart + save_view
+            use-agent-stream.ts       # ported + context-prefix + inspector feed
+            use-chart-colors.ts       # ported
+            use-dashboard-data.ts     # ported
+            use-focus-registry.ts     # NEW
+            use-stream-inspector.ts   # NEW
+          lib/
+            dashboard-context.ts      # NEW (buildDashboardContext)
+```
+
+## Implementation stages
+
+Each stage independently shippable. Stop at Stage 2 for MVP demo; go
+through Stage 5 for wow.
+
+### Stage 0 — Port prototype + retire agent-app (2h)
+
+- [ ] Port `config/queries/*.sql` into `apps/dev-playground/config/queries/`
+- [ ] Port `config/agents/anomaly.md` + `insights.md` into folder layout:
+      `config/agents/anomaly/agent.md`, `config/agents/insights/agent.md`
+- [ ] Port 16 client files into `client/src/routes/smart-dashboard/`
+- [ ] Register the route in TanStack Router (`smart-dashboard.route.tsx`)
+- [ ] Add `query` markdown agent + `sql_analyst`/`dashboard_pilot` code
+      agents to `server/index.ts`, including the ambient tools
+- [ ] Delete `apps/agent-app/`
+- [ ] Grep repo for `agent-app` references (docs, template, scripts,
+      `docs/docs/plugins/agents.md`, tests)
+- [ ] Verify `pnpm --filter=dev-playground dev` boots, `/smart-dashboard`
+      renders the dashboard, KPIs load, default chat works
+
+### Stage 1 — Dispatcher + sub-agents (3h)
+
+- [ ] Split the flat `query` agent into `query` dispatcher + `sql_analyst`
+      + `dashboard_pilot`
+- [ ] Dispatcher prompt: "decide which specialist to call; do not call
+      tools directly"
+- [ ] `query.md` has `agents: [sql_analyst, dashboard_pilot]` frontmatter
+- [ ] Benchmark TTFT against the flat agent — if p90 > 3s, revert to flat
+      and use delegation only for pilot commands
+
+### Stage 2 — Destructive action + approval card (3h)
+
+- [ ] Implement `save_view({ name, description? })` tool with
+      `annotations: { destructive: true }`
+- [ ] Build `<ApprovalCard>`: name/description fields visible, filters +
+      highlights context block, red destructive chip, approve/deny
+- [ ] Wire to `POST /api/agent/approve`
+- [ ] Deny path: confirm agent receives denial string and gracefully
+      replans
+
+### Stage 3 — Dashboard context injection + `focus_chart` (2h)
+
+- [ ] `lib/dashboard-context.ts` — `buildDashboardContext(filters, highlights)`
+- [ ] `use-agent-stream.send` accepts `{ contextPrefix }`
+- [ ] `<QuerySection>` composes prefix before every send
+- [ ] `focus_chart` tool + `use-focus-registry` hook
+- [ ] Chart components register refs, pulse animation on focus
+
+### Stage 4 — Stream Inspector (4h)
+
+- [ ] `use-stream-inspector` — module-level event store, ⌘K toggle, clear-on-new-run
+- [ ] `use-agent-stream` pushes every SSE event into the store
+- [ ] `<StreamInspector>` component — drawer, filter chips, event timeline,
+      expandable JSON, per-event timestamp relative to stream start
+- [ ] Focus trap, `Esc` to close, restore focus on close
+- [ ] Floating debug icon in bottom-right (discoverability alongside ⌘K)
+
+### Stage 5 — Polish (2h)
+
+- [ ] KPI shimmer loading
+- [ ] Error toasts for SQL failures, agent errors
+- [ ] Keyboard shortcuts: ⌘K, ⌘L, `Esc`
+- [ ] Route-level README: `client/src/routes/smart-dashboard/README.md` —
+      architecture, demo script, known limitations
+- [ ] `docs/docs/plugins/agents.md` — add a "See it all together" pointer
+
+### Stage 6 — Demo script + rehearsal (1h)
+
+- [ ] `DEMO.md` at repo root or route directory — step-by-step, 15 min,
+      one block per feature
+- [ ] Dry-run with someone who hasn't seen it; flag rough edges
+
+**Total: ~17h focused.** Realistic wall-clock: ~2.5 days.
+
+## Acceptance criteria
+
+- [ ] `pnpm --filter=dev-playground dev` boots and `/smart-dashboard` renders
+- [ ] "show me fares above $50" → filter applied, charts update
+- [ ] "highlight November 2016" → trip chart gets a shaded band
+- [ ] "focus on the fare distribution" → fare chart scrolls into view + pulses
+- [ ] "save this as 'high-fare-fridays'" → approval card appears; deny → apology; approve → view logged
+- [ ] Default page load: insights + anomalies populate within ~5s of KPI data
+- [ ] ⌘K opens stream inspector; filter chips work; tool-call events show args + result
+- [ ] Delegation: "compare Dec vs Nov fares" routes to `sql_analyst`;
+      "highlight peak hours" routes to `dashboard_pilot`
+- [ ] `apps/agent-app/` deleted; `rg "agent-app"` across repo returns only
+      historical CHANGELOG entries
+- [ ] `pnpm --filter=appkit test` still passes (no regressions in the v2 stack)
+
+## Git
+
+- Branch: **`agent/v2/6-apps-docs`** (this stack's tip).
+- Ideally one commit per stage, for reviewable chunks.
+- Rebase 5→4 shouldn't be needed; this is additive on top of the stack.
+- After the stack merges, the work stays as-is on `main`.
+
+## Risk
+
+- **Prototype drift.** Built against AppKit 0.24.0 vendored tgz; current
+  stack is also 0.24.0 but we've refactored internals (MCP connector move,
+  helper extractions). Risk: minor import/type tweaks on port. Mitigation:
+  Stage 0 is port-and-boot first, nothing added until green.
+
+- **Stream inspector scope creep.** Easy to make a week of work. Mitigation:
+  v1 is "dump JSON events with filter chips." No search, no diff, no export.
+
+- **Delegation latency.** Dispatcher → sub-agent is 2 model round-trips. May
+  feel laggier than prototype's flat agent. Mitigation: benchmark in Stage 1;
+  fall back to flat if p90 TTFT > 3s.
+
+- **Dev-playground bloat.** Adding ~1,500 client lines in a subdirectory.
+  Mitigation: everything lives under `routes/smart-dashboard/`, so the
+  playground's other routes are unaffected.
+
+- **v2 stack size.** Branch 6 gets bigger. Acceptable trade-off for having
+  a single end-to-end integration demo that reviewers can run and in which
+  every feature is visible.
+
+## Next step
+
+Stage 0 port + boot verification. One commit on `agent/v2/6-apps-docs`:
+
+```
+feat(dev-playground): port Smart Dashboard as /smart-dashboard route; retire agent-app
+
+Ports the p3ju Smart Dashboard prototype into apps/dev-playground as a new
+route. Migrates markdown agents to folder layout. Deletes apps/agent-app
+(superseded by this demo).
+
+Verifies that the route boots, KPIs load from samples.nyctaxi.trips, and
+the flat `query` agent answers and applies filters.
+
+Stages 1-6 (delegation, approval, context injection, stream inspector,
+polish, demo script) land as follow-up commits on the same branch.
+```
+
+If approved, I run Stage 0, report the diff size and any porting surprises,
+then proceed stage by stage.
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index 7d8efbf52..937ec4fc4 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -81,76 +81,6 @@ importers:
         specifier: 3.2.4
         version: 3.2.4(@types/debug@4.1.12)(@types/node@24.7.2)(jiti@2.6.1)(jsdom@27.0.0(bufferutil@4.0.9)(postcss@8.5.6))(lightningcss@1.30.2)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2)
 
-  apps/agent-app:
-    dependencies:
-      '@databricks/appkit':
-        specifier: workspace:*
-        version: link:../../packages/appkit
-      '@databricks/appkit-ui':
-        specifier: workspace:*
-        version: link:../../packages/appkit-ui
-      '@databricks/sdk-experimental':
-        specifier: ^0.16.0
-        version: 0.16.0
-      dotenv:
-        specifier: ^16.6.1
-        version: 16.6.1
-      lucide-react:
-        specifier: ^0.511.0
-        version: 0.511.0(react@19.2.0)
-      marked:
-        specifier: ^15.0.0
-        version: 15.0.12
-      react:
-        specifier: 19.2.0
-        version: 19.2.0
-      react-dom:
-        specifier: 19.2.0
-        version: 19.2.0(react@19.2.0)
-      zod:
-        specifier: ^4.0.0
-        version: 4.1.13
-    devDependencies:
-      '@tailwindcss/postcss':
-        specifier: 4.1.17
-        version: 4.1.17
-      '@types/node':
-        specifier: 24.10.1
-        version: 24.10.1
-      '@types/react':
-        specifier: 19.2.7
-        version: 19.2.7
-      '@types/react-dom':
-        specifier: 19.2.3
-        version: 19.2.3(@types/react@19.2.7)
-      '@vitejs/plugin-react':
-        specifier: 5.1.1
-        version: 5.1.1(rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2))
-      autoprefixer:
-        specifier: 10.4.21
-        version: 10.4.21(postcss@8.5.6)
-      postcss:
-        specifier: 8.5.6
-        version: 8.5.6
-      tailwindcss:
-        specifier: 4.1.17
-        version: 4.1.17
-      tailwindcss-animate:
-        specifier: 1.0.7
-        version: 1.0.7(tailwindcss@4.1.17)
-      tsx:
-        specifier: 4.20.6
-        version: 4.20.6
-      tw-animate-css:
-        specifier: 1.4.0
-        version: 1.4.0
-      typescript:
-        specifier: 5.9.3
-        version: 5.9.3
-      vite:
-        specifier: npm:rolldown-vite@7.1.14
-        version: rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2)
-
   apps/clean-app:
     dependencies:
       '@databricks/appkit':
@@ -4650,136 +4580,63 @@ packages:
     resolution: {integrity: sha512-+PmQX0PiAYPMeVYe237LJAYvOMYW1j2rH5YROyS3b4CTVJum34HfRvKvAzozHAQG0TnHNdUfY9nCeUyRAs//cw==}
     engines: {node: '>=14.16'}
 
-  '@tailwindcss/node@4.1.17':
-    resolution: {integrity: sha512-csIkHIgLb3JisEFQ0vxr2Y57GUNYh447C8xzwj89U/8fdW8LhProdxvnVH6U8M2Y73QKiTIH+LWbK3V2BBZsAg==}
-
   '@tailwindcss/node@4.1.18':
     resolution: {integrity: sha512-DoR7U1P7iYhw16qJ49fgXUlry1t4CpXeErJHnQ44JgTSKMaZUdf17cfn5mHchfJ4KRBZRFA/Coo+MUF5+gOaCQ==}
 
-  '@tailwindcss/oxide-android-arm64@4.1.17':
-    resolution: {integrity: sha512-BMqpkJHgOZ5z78qqiGE6ZIRExyaHyuxjgrJ6eBO5+hfrfGkuya0lYfw8fRHG77gdTjWkNWEEm+qeG2cDMxArLQ==}
-    engines: {node: '>= 10'}
-    cpu: [arm64]
-    os: [android]
-
   '@tailwindcss/oxide-android-arm64@4.1.18':
     resolution: {integrity: sha512-dJHz7+Ugr9U/diKJA0W6N/6/cjI+ZTAoxPf9Iz9BFRF2GzEX8IvXxFIi/dZBloVJX/MZGvRuFA9rqwdiIEZQ0Q==}
     engines: {node: '>= 10'}
     cpu: [arm64]
     os: [android]
 
-  '@tailwindcss/oxide-darwin-arm64@4.1.17':
-    resolution: {integrity: sha512-EquyumkQweUBNk1zGEU/wfZo2qkp/nQKRZM8bUYO0J+Lums5+wl2CcG1f9BgAjn/u9pJzdYddHWBiFXJTcxmOg==}
-    engines: {node: '>= 10'}
-    cpu: [arm64]
-    os: [darwin]
-
   '@tailwindcss/oxide-darwin-arm64@4.1.18':
     resolution: {integrity: sha512-Gc2q4Qhs660bhjyBSKgq6BYvwDz4G+BuyJ5H1xfhmDR3D8HnHCmT/BSkvSL0vQLy/nkMLY20PQ2OoYMO15Jd0A==}
     engines: {node: '>= 10'}
     cpu: [arm64]
     os: [darwin]
 
-  '@tailwindcss/oxide-darwin-x64@4.1.17':
-    resolution: {integrity: sha512-gdhEPLzke2Pog8s12oADwYu0IAw04Y2tlmgVzIN0+046ytcgx8uZmCzEg4VcQh+AHKiS7xaL8kGo/QTiNEGRog==}
-    engines: {node: '>= 10'}
-    cpu: [x64]
-    os: [darwin]
-
   '@tailwindcss/oxide-darwin-x64@4.1.18':
     resolution: {integrity: sha512-FL5oxr2xQsFrc3X9o1fjHKBYBMD1QZNyc1Xzw/h5Qu4XnEBi3dZn96HcHm41c/euGV+GRiXFfh2hUCyKi/e+yw==}
     engines: {node: '>= 10'}
     cpu: [x64]
     os: [darwin]
 
-  '@tailwindcss/oxide-freebsd-x64@4.1.17':
-    resolution: {integrity: sha512-hxGS81KskMxML9DXsaXT1H0DyA+ZBIbyG/sSAjWNe2EDl7TkPOBI42GBV3u38itzGUOmFfCzk1iAjDXds8Oh0g==}
-    engines: {node: '>= 10'}
-    cpu: [x64]
-    os: [freebsd]
-
   '@tailwindcss/oxide-freebsd-x64@4.1.18':
     resolution: {integrity: sha512-Fj+RHgu5bDodmV1dM9yAxlfJwkkWvLiRjbhuO2LEtwtlYlBgiAT4x/j5wQr1tC3SANAgD+0YcmWVrj8R9trVMA==}
     engines: {node: '>= 10'}
     cpu: [x64]
     os: [freebsd]
 
-  '@tailwindcss/oxide-linux-arm-gnueabihf@4.1.17':
-    resolution: {integrity: sha512-k7jWk5E3ldAdw0cNglhjSgv501u7yrMf8oeZ0cElhxU6Y2o7f8yqelOp3fhf7evjIS6ujTI3U8pKUXV2I4iXHQ==}
-    engines: {node: '>= 10'}
-    cpu: [arm]
-    os: [linux]
-
   '@tailwindcss/oxide-linux-arm-gnueabihf@4.1.18':
     resolution: {integrity: sha512-Fp+Wzk/Ws4dZn+LV2Nqx3IilnhH51YZoRaYHQsVq3RQvEl+71VGKFpkfHrLM/Li+kt5c0DJe/bHXK1eHgDmdiA==}
     engines: {node: '>= 10'}
     cpu: [arm]
     os: [linux]
 
-  '@tailwindcss/oxide-linux-arm64-gnu@4.1.17':
-    resolution: {integrity: sha512-HVDOm/mxK6+TbARwdW17WrgDYEGzmoYayrCgmLEw7FxTPLcp/glBisuyWkFz/jb7ZfiAXAXUACfyItn+nTgsdQ==}
-    engines: {node: '>= 10'}
-    cpu: [arm64]
-    os: [linux]
-    libc: [glibc]
-
   '@tailwindcss/oxide-linux-arm64-gnu@4.1.18':
     resolution: {integrity: sha512-S0n3jboLysNbh55Vrt7pk9wgpyTTPD0fdQeh7wQfMqLPM/Hrxi+dVsLsPrycQjGKEQk85Kgbx+6+QnYNiHalnw==}
     engines: {node: '>= 10'}
     cpu: [arm64]
     os: [linux]
 
-  '@tailwindcss/oxide-linux-arm64-musl@4.1.17':
-    resolution: {integrity: sha512-HvZLfGr42i5anKtIeQzxdkw/wPqIbpeZqe7vd3V9vI3RQxe3xU1fLjss0TjyhxWcBaipk7NYwSrwTwK1hJARMg==}
-    engines: {node: '>= 10'}
-    cpu: [arm64]
-    os: [linux]
-    libc: [musl]
-
   '@tailwindcss/oxide-linux-arm64-musl@4.1.18':
     resolution: {integrity: sha512-1px92582HkPQlaaCkdRcio71p8bc8i/ap5807tPRDK/uw953cauQBT8c5tVGkOwrHMfc2Yh6UuxaH4vtTjGvHg==}
     engines: {node: '>= 10'}
     cpu: [arm64]
     os: [linux]
 
-  '@tailwindcss/oxide-linux-x64-gnu@4.1.17':
-    resolution: {integrity: sha512-M3XZuORCGB7VPOEDH+nzpJ21XPvK5PyjlkSFkFziNHGLc5d6g3di2McAAblmaSUNl8IOmzYwLx9NsE7bplNkwQ==}
-    engines: {node: '>= 10'}
-    cpu: [x64]
-    os: [linux]
-    libc: [glibc]
-
   '@tailwindcss/oxide-linux-x64-gnu@4.1.18':
     resolution: {integrity: sha512-v3gyT0ivkfBLoZGF9LyHmts0Isc8jHZyVcbzio6Wpzifg/+5ZJpDiRiUhDLkcr7f/r38SWNe7ucxmGW3j3Kb/g==}
     engines: {node: '>= 10'}
     cpu: [x64]
     os: [linux]
 
-  '@tailwindcss/oxide-linux-x64-musl@4.1.17':
-    resolution: {integrity: sha512-k7f+pf9eXLEey4pBlw+8dgfJHY4PZ5qOUFDyNf7SI6lHjQ9Zt7+NcscjpwdCEbYi6FI5c2KDTDWyf2iHcCSyyQ==}
-    engines: {node: '>= 10'}
-    cpu: [x64]
-    os: [linux]
-    libc: [musl]
-
   '@tailwindcss/oxide-linux-x64-musl@4.1.18':
     resolution: {integrity: sha512-bhJ2y2OQNlcRwwgOAGMY0xTFStt4/wyU6pvI6LSuZpRgKQwxTec0/3Scu91O8ir7qCR3AuepQKLU/kX99FouqQ==}
     engines: {node: '>= 10'}
     cpu: [x64]
     os: [linux]
 
-  '@tailwindcss/oxide-wasm32-wasi@4.1.17':
-    resolution: {integrity: sha512-cEytGqSSoy7zK4JRWiTCx43FsKP/zGr0CsuMawhH67ONlH+T79VteQeJQRO/X7L0juEUA8ZyuYikcRBf0vsxhg==}
-    engines: {node: '>=14.0.0'}
-    cpu: [wasm32]
-    bundledDependencies:
-      - '@napi-rs/wasm-runtime'
-      - '@emnapi/core'
-      - '@emnapi/runtime'
-      - '@tybys/wasm-util'
-      - '@emnapi/wasi-threads'
-      - tslib
-
   '@tailwindcss/oxide-wasm32-wasi@4.1.18':
     resolution: {integrity: sha512-LffYTvPjODiP6PT16oNeUQJzNVyJl1cjIebq/rWWBF+3eDst5JGEFSc5cWxyRCJ0Mxl+KyIkqRxk1XPEs9x8TA==}
     engines: {node: '>=14.0.0'}
@@ -4792,41 +4649,22 @@ packages:
       - '@emnapi/wasi-threads'
       - tslib
 
-  '@tailwindcss/oxide-win32-arm64-msvc@4.1.17':
-    resolution: {integrity: sha512-JU5AHr7gKbZlOGvMdb4722/0aYbU+tN6lv1kONx0JK2cGsh7g148zVWLM0IKR3NeKLv+L90chBVYcJ8uJWbC9A==}
-    engines: {node: '>= 10'}
-    cpu: [arm64]
-    os: [win32]
-
   '@tailwindcss/oxide-win32-arm64-msvc@4.1.18':
     resolution: {integrity: sha512-HjSA7mr9HmC8fu6bdsZvZ+dhjyGCLdotjVOgLA2vEqxEBZaQo9YTX4kwgEvPCpRh8o4uWc4J/wEoFzhEmjvPbA==}
     engines: {node: '>= 10'}
     cpu: [arm64]
     os: [win32]
 
-  '@tailwindcss/oxide-win32-x64-msvc@4.1.17':
-    resolution: {integrity: sha512-SKWM4waLuqx0IH+FMDUw6R66Hu4OuTALFgnleKbqhgGU30DY20NORZMZUKgLRjQXNN2TLzKvh48QXTig4h4bGw==}
-    engines: {node: '>= 10'}
-    cpu: [x64]
-    os: [win32]
-
   '@tailwindcss/oxide-win32-x64-msvc@4.1.18':
     resolution: {integrity: sha512-bJWbyYpUlqamC8dpR7pfjA0I7vdF6t5VpUGMWRkXVE3AXgIZjYUYAK7II1GNaxR8J1SSrSrppRar8G++JekE3Q==}
     engines: {node: '>= 10'}
     cpu: [x64]
     os: [win32]
 
-  '@tailwindcss/oxide@4.1.17':
-    resolution: {integrity: sha512-F0F7d01fmkQhsTjXezGBLdrl1KresJTcI3DB8EkScCldyKp3Msz4hub4uyYaVnk88BAS1g5DQjjF6F5qczheLA==}
-    engines: {node: '>= 10'}
-
   '@tailwindcss/oxide@4.1.18':
     resolution: {integrity: sha512-EgCR5tTS5bUSKQgzeMClT6iCY3ToqE1y+ZB0AKldj809QXk1Y+3jB0upOYZrn9aGIzPtUsP7sX4QQ4XtjBB95A==}
     engines: {node: '>= 10'}
 
-  '@tailwindcss/postcss@4.1.17':
-    resolution: {integrity: sha512-+nKl9N9mN5uJ+M7dBOOCzINw94MPstNR/GtIhz1fpZysxL/4a+No64jCBD6CPN+bIHWFx3KWuu8XJRrj/572Dw==}
-
   '@tailwindcss/postcss@4.1.18':
     resolution: {integrity: sha512-Ce0GFnzAOuPyfV5SxjXGn0CubwGcuDB0zcdaPuCSzAa/2vII24JTkH+I6jcbXLb1ctjZMZZI6OjDaLPJQL1S0g==}
 
@@ -8598,11 +8436,6 @@ packages:
     resolution: {integrity: sha512-jumlc0BIUrS3qJGgIkWZsyfAM7NCWiBcCDhnd+3NNM5KbBmLTgHVfWBcg6W+rLUsIpzpERPsvwUP7CckAQSOoA==}
     engines: {node: '>=12'}
 
-  lucide-react@0.511.0:
-    resolution: {integrity: sha512-VK5a2ydJ7xm8GvBeKLS9mu1pVK6ucef9780JVUjw6bAjJL/QXnd4Y0p7SPeOUMC27YhzNCZvm5d/QX0Tp3rc0w==}
-    peerDependencies:
-      react: ^16.5.1 || ^17.0.0 || ^18.0.0 || ^19.0.0
-
   lucide-react@0.554.0:
     resolution: {integrity: sha512-St+z29uthEJVx0Is7ellNkgTEhaeSoA42I7JjOCBCrc5X6LYMGSv0P/2uS5HDLTExP5tpiqRD2PyUEOS6s9UXA==}
     peerDependencies:
@@ -8653,11 +8486,6 @@ packages:
   markdown-table@3.0.4:
     resolution: {integrity: sha512-wiYz4+JrLyb/DqW2hkFJxP7Vd7JuTDm77fvbM8VfEQdmSMqcImWeeRbHwZjBjIFki/VaMK2BhFi7oUUZeM5bqw==}
 
-  marked@15.0.12:
-    resolution: {integrity: sha512-8dD6FusOQSrpv9Z1rdNMdlSgQOIP880DHqnohobOmYLElGEqAL/JvxvuxZO16r4HtjTlfPRDC1hbvxC9dPN2nA==}
-    engines: {node: '>= 18'}
-    hasBin: true
-
   marked@16.4.2:
     resolution: {integrity: sha512-TI3V8YYWvkVf3KJe1dRkpnjs68JUPyEa5vjKrp1XEEJUAOaQc+Qj+L1qWbPd0SJuAdQkFU0h73sXXqwDYxsiDA==}
     engines: {node: '>= 20'}
@@ -17063,16 +16891,6 @@ snapshots:
     dependencies:
       defer-to-connect: 2.0.1
 
-  '@tailwindcss/node@4.1.17':
-    dependencies:
-      '@jridgewell/remapping': 2.3.5
-      enhanced-resolve: 5.18.3
-      jiti: 2.6.1
-      lightningcss: 1.30.2
-      magic-string: 0.30.21
-      source-map-js: 1.2.1
-      tailwindcss: 4.1.17
-
   '@tailwindcss/node@4.1.18':
     dependencies:
       '@jridgewell/remapping': 2.3.5
@@ -17083,93 +16901,42 @@ snapshots:
       source-map-js: 1.2.1
       tailwindcss: 4.1.18
 
-  '@tailwindcss/oxide-android-arm64@4.1.17':
-    optional: true
-
   '@tailwindcss/oxide-android-arm64@4.1.18':
     optional: true
 
-  '@tailwindcss/oxide-darwin-arm64@4.1.17':
-    optional: true
-
   '@tailwindcss/oxide-darwin-arm64@4.1.18':
     optional: true
 
-  '@tailwindcss/oxide-darwin-x64@4.1.17':
-    optional: true
-
   '@tailwindcss/oxide-darwin-x64@4.1.18':
     optional: true
 
-  '@tailwindcss/oxide-freebsd-x64@4.1.17':
-    optional: true
-
   '@tailwindcss/oxide-freebsd-x64@4.1.18':
     optional: true
 
-  '@tailwindcss/oxide-linux-arm-gnueabihf@4.1.17':
-    optional: true
-
   '@tailwindcss/oxide-linux-arm-gnueabihf@4.1.18':
     optional: true
 
-  '@tailwindcss/oxide-linux-arm64-gnu@4.1.17':
-    optional: true
-
   '@tailwindcss/oxide-linux-arm64-gnu@4.1.18':
     optional: true
 
-  '@tailwindcss/oxide-linux-arm64-musl@4.1.17':
-    optional: true
-
   '@tailwindcss/oxide-linux-arm64-musl@4.1.18':
     optional: true
 
-  '@tailwindcss/oxide-linux-x64-gnu@4.1.17':
-    optional: true
-
   '@tailwindcss/oxide-linux-x64-gnu@4.1.18':
     optional: true
 
-  '@tailwindcss/oxide-linux-x64-musl@4.1.17':
-    optional: true
-
   '@tailwindcss/oxide-linux-x64-musl@4.1.18':
     optional: true
 
-  '@tailwindcss/oxide-wasm32-wasi@4.1.17':
-    optional: true
-
   '@tailwindcss/oxide-wasm32-wasi@4.1.18':
     optional: true
 
-  '@tailwindcss/oxide-win32-arm64-msvc@4.1.17':
-    optional: true
-
   '@tailwindcss/oxide-win32-arm64-msvc@4.1.18':
     optional: true
 
-  '@tailwindcss/oxide-win32-x64-msvc@4.1.17':
-    optional: true
-
   '@tailwindcss/oxide-win32-x64-msvc@4.1.18':
     optional: true
 
-  '@tailwindcss/oxide@4.1.17':
-    optionalDependencies:
-      '@tailwindcss/oxide-android-arm64': 4.1.17
-      '@tailwindcss/oxide-darwin-arm64': 4.1.17
-      '@tailwindcss/oxide-darwin-x64': 4.1.17
-      '@tailwindcss/oxide-freebsd-x64': 4.1.17
-      '@tailwindcss/oxide-linux-arm-gnueabihf': 4.1.17
-      '@tailwindcss/oxide-linux-arm64-gnu': 4.1.17
-      '@tailwindcss/oxide-linux-arm64-musl': 4.1.17
-      '@tailwindcss/oxide-linux-x64-gnu': 4.1.17
-      '@tailwindcss/oxide-linux-x64-musl': 4.1.17
-      '@tailwindcss/oxide-wasm32-wasi': 4.1.17
-      '@tailwindcss/oxide-win32-arm64-msvc': 4.1.17
-      '@tailwindcss/oxide-win32-x64-msvc': 4.1.17
-
   '@tailwindcss/oxide@4.1.18':
     optionalDependencies:
       '@tailwindcss/oxide-android-arm64': 4.1.18
@@ -17185,14 +16952,6 @@ snapshots:
       '@tailwindcss/oxide-win32-arm64-msvc': 4.1.18
       '@tailwindcss/oxide-win32-x64-msvc': 4.1.18
 
-  '@tailwindcss/postcss@4.1.17':
-    dependencies:
-      '@alloc/quick-lru': 5.2.0
-      '@tailwindcss/node': 4.1.17
-      '@tailwindcss/oxide': 4.1.17
-      postcss: 8.5.6
-      tailwindcss: 4.1.17
-
   '@tailwindcss/postcss@4.1.18':
     dependencies:
       '@alloc/quick-lru': 5.2.0
@@ -17772,18 +17531,6 @@ snapshots:
     transitivePeerDependencies:
       - supports-color
 
-  '@vitejs/plugin-react@5.1.1(rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2))':
-    dependencies:
-      '@babel/core': 7.28.5
-      '@babel/plugin-transform-react-jsx-self': 7.27.1(@babel/core@7.28.5)
-      '@babel/plugin-transform-react-jsx-source': 7.27.1(@babel/core@7.28.5)
-      '@rolldown/pluginutils': 1.0.0-beta.47
-      '@types/babel__core': 7.20.5
-      react-refresh: 0.18.0
-      vite: rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2)
-    transitivePeerDependencies:
-      - supports-color
-
   '@vitejs/plugin-react@5.1.1(rolldown-vite@7.1.14(@types/node@25.2.3)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2))':
     dependencies:
       '@babel/core': 7.28.5
@@ -21445,10 +21192,6 @@ snapshots:
 
   lru-cache@7.18.3: {}
 
-  lucide-react@0.511.0(react@19.2.0):
-    dependencies:
-      react: 19.2.0
-
   lucide-react@0.554.0(react@19.2.0):
     dependencies:
       react: 19.2.0
@@ -21512,8 +21255,6 @@ snapshots:
 
   markdown-table@3.0.4: {}
 
-  marked@15.0.12: {}
-
   marked@16.4.2: {}
 
   marked@17.0.3: {}
@@ -23820,24 +23561,6 @@ snapshots:
       tsx: 4.20.6
       yaml: 2.8.2
 
-  rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2):
-    dependencies:
-      '@oxc-project/runtime': 0.92.0
-      fdir: 6.5.0(picomatch@4.0.3)
-      lightningcss: 1.30.2
-      picomatch: 4.0.3
-      postcss: 8.5.6
-      rolldown: 1.0.0-beta.41
-      tinyglobby: 0.2.15
-    optionalDependencies:
-      '@types/node': 24.10.1
-      esbuild: 0.25.10
-      fsevents: 2.3.3
-      jiti: 2.6.1
-      terser: 5.44.1
-      tsx: 4.20.6
-      yaml: 2.8.2
-
   rolldown-vite@7.1.14(@types/node@25.2.3)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2):
     dependencies:
       '@oxc-project/runtime': 0.92.0

From 85f221ac2c68e4ceb15d7e4a862059a5caa643a5 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 12:09:46 +0200
Subject: [PATCH 24/46] feat(dev-playground): stage 2-4 of smart-dashboard demo

Stage 0 ported the dashboard shell verbatim from the prototype; this
commit layers every v2-stack feature on top, moves the feature dir out
of routes/ (TanStack was flagging files as stray routes), rewrites the
agent -> UI action pipeline for correctness, and adds discoverability
for the HITL flow.

Server (apps/dev-playground/server/index.ts)

- Split the polymorphic apply_filter into four narrower tools:
  filter_by_date_range, filter_by_pickup_zip, filter_by_fare,
  clear_filters. Each has exactly one client-side effect; removes the
  whole class of 'agent said it worked but nothing moved' bugs.
- Add clear_highlights, focus_chart, save_view (destructive; triggers
  the approval gate).
- dashboard_pilot instructions rewritten with a compact verb-per-line
  reference so the LLM picks the right single tool for each intent.

Client - moved out of routes/

- Feature code relocates to client/src/features/smart-dashboard/
  (components/, hooks/, lib/). TanStack Router was warning that every
  non-route file under routes/ 'does not contain any route piece.'
- smart-dashboard.route.tsx uses @/features/ aliases; the route file
  is now the only thing under routes/.

Client - correctness fixes in the action dispatcher

- Act only on response.output_item.done (never .added, which fires
  with partial arguments and caused double-applied highlights plus
  silent JSON-parse races).
- Dedupe by call_id with a bounded LRU; reset on appkit.metadata
  (new-run signal).
- Use updater callbacks (onFilterUpdate(prev => ...)) instead of a
  currentFilters prop to eliminate stale-closure bugs when the agent
  fires multiple tool calls in one render cycle.
- Validate arg shapes per tool; anything malformed or unrecognized
  surfaces through onUnknownTool (route renders as a red banner +
  console.warn). Silent failure was the worst failure mode.
- Emit a human-readable summary for every applied action (onAction).

Client - discoverability / HITL

- New QuickActionsBar with Save view... (inline name input), Clear
  filters, Clear highlights. Each dispatches through the chat
  pipeline so the agent still reasons and the approval gate still
  fires for destructive actions - the bar just saves typing.
- ActionToast (bottom-left) confirms every dispatcher-applied action
  for ~3s. Answers 'did it work?' without opening the inspector.
- QuerySection refactored into a view: content/isLoading/onSend come
  from the route. Lifting useAgentStream one level up lets the Quick
  Actions bar and the chat input share a single agent stream.
- QuerySection example queries refreshed to cover the new tools.

Client - stream-inspector wiring

- SSEEvent extended with approval_pending payload fields.
- use-stream-inspector threaded through so every run's events flow
  into the inspector's module-level store.
- FocusableChart renamed its 'id' prop to 'chartId' (logical
  registry key, not a DOM id - biome was right to complain).

Verification

- pnpm --filter=dev-playground client tsc --noEmit: clean.
- pnpm --filter=dev-playground client vite build: clean.
- Server typecheck: same pre-existing errors as main; no new
  regressions.
- apps/dev-playground/shared/appkit-types/analytics.d.ts regenerated
  by vite build to register the four dashboard_* queries; kept in
  the commit so CI and downstream consumers have typed
  useAnalyticsQuery access out of the box.
---
 .../components/action-toast.tsx               |  48 ++++
 .../components/active-filters.tsx             |   0
 .../components/agent-sidebar.tsx              |   0
 .../components/anomaly-card.tsx               |   0
 .../components/approval-card.tsx              | 137 ++++++++++
 .../smart-dashboard/components/fare-chart.tsx |   0
 .../components/focusable-chart.tsx            |  36 +++
 .../components/insight-card.tsx               |   0
 .../components/inspector-toggle.tsx           |  31 +++
 .../smart-dashboard/components/kpi-cards.tsx  |   0
 .../components/query-section.tsx              |  56 ++--
 .../components/quick-actions-bar.tsx          | 119 +++++++++
 .../components/stream-inspector.tsx           | 246 ++++++++++++++++++
 .../smart-dashboard/components/trip-chart.tsx |   0
 .../hooks/use-action-dispatcher.ts            | 227 ++++++++++++++++
 .../smart-dashboard/hooks/use-agent-stream.ts |  33 ++-
 .../smart-dashboard/hooks/use-chart-colors.ts |   0
 .../hooks/use-dashboard-data.ts               |   0
 .../hooks/use-focus-registry.ts               |  51 ++++
 .../hooks/use-stream-inspector.ts             | 141 ++++++++++
 .../smart-dashboard/lib/dashboard-context.ts  |  41 +++
 .../src/routes/smart-dashboard.route.tsx      | 246 +++++++++++++++---
 .../hooks/use-action-dispatcher.ts            |  88 -------
 apps/dev-playground/server/index.ts           | 151 +++++++++--
 .../shared/appkit-types/analytics.d.ts        |  88 +++++++
 25 files changed, 1565 insertions(+), 174 deletions(-)
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/components/action-toast.tsx
 rename apps/dev-playground/client/src/{routes => features}/smart-dashboard/components/active-filters.tsx (100%)
 rename apps/dev-playground/client/src/{routes => features}/smart-dashboard/components/agent-sidebar.tsx (100%)
 rename apps/dev-playground/client/src/{routes => features}/smart-dashboard/components/anomaly-card.tsx (100%)
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx
 rename apps/dev-playground/client/src/{routes => features}/smart-dashboard/components/fare-chart.tsx (100%)
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/components/focusable-chart.tsx
 rename apps/dev-playground/client/src/{routes => features}/smart-dashboard/components/insight-card.tsx (100%)
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/components/inspector-toggle.tsx
 rename apps/dev-playground/client/src/{routes => features}/smart-dashboard/components/kpi-cards.tsx (100%)
 rename apps/dev-playground/client/src/{routes => features}/smart-dashboard/components/query-section.tsx (78%)
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/components/quick-actions-bar.tsx
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/components/stream-inspector.tsx
 rename apps/dev-playground/client/src/{routes => features}/smart-dashboard/components/trip-chart.tsx (100%)
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/hooks/use-action-dispatcher.ts
 rename apps/dev-playground/client/src/{routes => features}/smart-dashboard/hooks/use-agent-stream.ts (78%)
 rename apps/dev-playground/client/src/{routes => features}/smart-dashboard/hooks/use-chart-colors.ts (100%)
 rename apps/dev-playground/client/src/{routes => features}/smart-dashboard/hooks/use-dashboard-data.ts (100%)
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/hooks/use-focus-registry.ts
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/hooks/use-stream-inspector.ts
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/lib/dashboard-context.ts
 delete mode 100644 apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-action-dispatcher.ts

diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/action-toast.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/action-toast.tsx
new file mode 100644
index 000000000..311ecdc23
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/action-toast.tsx
@@ -0,0 +1,48 @@
+import { CheckCircle2Icon } from "lucide-react";
+import { useEffect, useState } from "react";
+
+interface ActionToastProps {
+  /**
+   * Latest dispatcher-surfaced action summary. Each change of value shows
+   * the toast under a fresh render key. An identical consecutive message
+   * does not re-run the effect, so it will not re-animate the toast.
+   */
+  message: string | null;
+  durationMs?: number;
+}
+
+/**
+ * Non-intrusive bottom-left toast that confirms agent-driven UI actions,
+ * hiding itself after `durationMs` ms. Without it, an action silently not
+ * applied looked identical to one that worked but didn't show its effect.
+ */
+export function ActionToast({ message, durationMs = 2800 }: ActionToastProps) {
+  const [visible, setVisible] = useState<{ key: number; text: string } | null>(
+    null,
+  );
+
+  useEffect(() => {
+    if (!message) {
+      setVisible(null); // prior cleanup already cancelled the hide timer
+      return;
+    }
+    const key = Date.now();
+    setVisible({ key, text: message });
+    const t = setTimeout(() => {
+      setVisible((v) => (v?.key === key ? null : v));
+    }, durationMs);
+    return () => clearTimeout(t);
+  }, [message, durationMs]);
+
+  if (!visible) return null;
+
+  return (
+    <div
+      key={visible.key}
+      className="fixed bottom-20 left-4 z-30 rounded-full bg-card border border-border shadow-lg px-3 py-1.5 flex items-center gap-2 animate-in fade-in slide-in-from-bottom-2 duration-200"
+    >
+      <CheckCircle2Icon className="h-3.5 w-3.5 text-green-500 shrink-0" />
+      <span className="text-xs text-foreground">{visible.text}</span>
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/active-filters.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/active-filters.tsx
similarity index 100%
rename from apps/dev-playground/client/src/routes/smart-dashboard/components/active-filters.tsx
rename to apps/dev-playground/client/src/features/smart-dashboard/components/active-filters.tsx
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/agent-sidebar.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/agent-sidebar.tsx
similarity index 100%
rename from apps/dev-playground/client/src/routes/smart-dashboard/components/agent-sidebar.tsx
rename to apps/dev-playground/client/src/features/smart-dashboard/components/agent-sidebar.tsx
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/anomaly-card.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/anomaly-card.tsx
similarity index 100%
rename from apps/dev-playground/client/src/routes/smart-dashboard/components/anomaly-card.tsx
rename to apps/dev-playground/client/src/features/smart-dashboard/components/anomaly-card.tsx
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx
new file mode 100644
index 000000000..70ff99130
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx
@@ -0,0 +1,137 @@
+import { ShieldAlertIcon } from "lucide-react";
+import type { Highlight } from "../hooks/use-action-dispatcher";
+import type { DashboardFilters } from "../hooks/use-dashboard-data";
+
+export interface PendingApproval {
+  approvalId: string;
+  streamId: string;
+  toolName: string;
+  args: unknown;
+  annotations?: {
+    readOnly?: boolean;
+    destructive?: boolean;
+    idempotent?: boolean;
+  };
+}
+
+interface ApprovalCardProps {
+  approval: PendingApproval;
+  filters: DashboardFilters;
+  highlights: Highlight[];
+  onDecide: (approvalId: string, decision: "approve" | "deny") => void;
+}
+
+/** Lists the set (non-empty) filters as `key=value` pairs, or "(none)". */
+function formatFilters(filters: DashboardFilters): string {
+  const pairs = Object.entries(filters)
+    .filter(([, value]) => !(value === undefined || value === ""))
+    .map(([key, value]) => `${key}=${value}`);
+  return pairs.length > 0 ? pairs.join(", ") : "(none)";
+}
+
+/** Renders each highlight as `start..end (label) [color]`, "; "-separated. */
+function formatHighlights(highlights: Highlight[]): string {
+  const describe = ({ start, end, label, color }: Highlight): string => {
+    const labelPart = label ? ` (${label})` : "";
+    return `${start}..${end}${labelPart} [${color}]`;
+  };
+  const parts = highlights.map(describe);
+  return parts.length === 0 ? "(none)" : parts.join("; ");
+}
+
+/** Card asking the user to approve or deny one pending agent tool call. */
+export function ApprovalCard({
+  approval,
+  filters,
+  highlights,
+  onDecide,
+}: ApprovalCardProps) {
+  // Only object-shaped args are tabulated; any other shape yields no table.
+  const isRecord = typeof approval.args === "object" && approval.args !== null;
+  const args = isRecord ? (approval.args as Record<string, unknown>) : {};
+  const isDestructive = approval.annotations?.destructive === true;
+
+  return (
+    <div className="rounded-xl border border-red-500/40 bg-red-500/[0.06] p-4 shadow-sm">
+      <div className="flex items-start gap-2 mb-3">
+        <ShieldAlertIcon className="h-4 w-4 text-red-500 mt-0.5 shrink-0" />
+        <div className="flex-1 min-w-0">
+          <div className="flex items-center gap-2 mb-1 flex-wrap">
+            <h3 className="font-semibold text-sm text-foreground">
+              Approval required
+            </h3>
+            {isDestructive && (
+              <span className="text-[10px] uppercase tracking-wide bg-red-500/20 text-red-600 px-2 py-0.5 rounded-full font-medium">
+                destructive
+              </span>
+            )}
+          </div>
+          <p className="text-xs text-muted-foreground">
+            The agent wants to call{" "}
+            <code className="font-mono text-foreground">
+              {approval.toolName}
+            </code>
+            . Review the arguments before approving.
+          </p>
+        </div>
+      </div>
+
+      {Object.keys(args).length > 0 && (
+        <div className="mb-3">
+          <div className="text-xs font-medium text-foreground mb-1.5">
+            Arguments
+          </div>
+          <table className="w-full text-xs">
+            <tbody>
+              {Object.entries(args).map(([key, value]) => (
+                <tr
+                  key={key}
+                  className="border-b border-border/40 last:border-0"
+                >
+                  <td className="py-1.5 pr-3 font-mono text-muted-foreground w-[30%] align-top">
+                    {key}
+                  </td>
+                  <td className="py-1.5 text-foreground break-words whitespace-pre-wrap">
+                    {typeof value === "string"
+                      ? value
+                      : JSON.stringify(value, null, 2)}
+                  </td>
+                </tr>
+              ))}
+            </tbody>
+          </table>
+        </div>
+      )}
+
+      <div className="mb-3 space-y-1 text-xs">
+        <div className="text-foreground font-medium">
+          Current dashboard state
+        </div>
+        <div className="text-muted-foreground">
+          <span className="font-mono">filters</span>: {formatFilters(filters)}
+        </div>
+        <div className="text-muted-foreground">
+          <span className="font-mono">highlights</span>:{" "}
+          {formatHighlights(highlights)}
+        </div>
+      </div>
+
+      <div className="flex gap-2 justify-end">
+        <button
+          type="button"
+          onClick={() => onDecide(approval.approvalId, "deny")}
+          className="px-3 py-1.5 text-xs border border-border rounded-md hover:bg-muted transition-colors"
+        >
+          Deny
+        </button>
+        <button
+          type="button"
+          onClick={() => onDecide(approval.approvalId, "approve")}
+          className="px-3 py-1.5 text-xs bg-primary text-primary-foreground rounded-md hover:bg-primary/90 transition-colors font-medium"
+        >
+          Approve
+        </button>
+      </div>
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/fare-chart.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/fare-chart.tsx
similarity index 100%
rename from apps/dev-playground/client/src/routes/smart-dashboard/components/fare-chart.tsx
rename to apps/dev-playground/client/src/features/smart-dashboard/components/fare-chart.tsx
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/focusable-chart.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/focusable-chart.tsx
new file mode 100644
index 000000000..689145a4b
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/focusable-chart.tsx
@@ -0,0 +1,36 @@
+import type { ReactNode } from "react";
+import {
+  type FocusableChartId,
+  useFocusable,
+} from "../hooks/use-focus-registry";
+
+interface FocusableChartProps {
+  chartId: FocusableChartId;
+  children: ReactNode;
+}
+
+/**
+ * Wraps a chart with a focus-ring pulse effect. Pairs with `focusChart(id)`
+ * — when the `dashboard_pilot` agent emits a `focus_chart({ chart_id })`
+ * tool call, the dispatcher invokes the registered callback here, which
+ * scrolls into view and flips `focused` true for 1.2s.
+ *
+ * Named `chartId` (not `id`) because this is a logical focus-registry key,
+ * not a DOM id attribute.
+ */
+export function FocusableChart({ chartId, children }: FocusableChartProps) {
+  const { setRef, focused } = useFocusable(chartId);
+
+  // Ring + slight scale-up are applied only while `focused` is true.
+  const focusClasses = focused
+    ? "ring-4 ring-primary ring-offset-2 ring-offset-background scale-[1.01]"
+    : "";
+  const baseClasses =
+    "rounded-xl transition-[box-shadow,transform] duration-500";
+
+  return (
+    <div ref={setRef} className={`${baseClasses} ${focusClasses}`}>
+      {children}
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/insight-card.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/insight-card.tsx
similarity index 100%
rename from apps/dev-playground/client/src/routes/smart-dashboard/components/insight-card.tsx
rename to apps/dev-playground/client/src/features/smart-dashboard/components/insight-card.tsx
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/inspector-toggle.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/inspector-toggle.tsx
new file mode 100644
index 000000000..4a0388b6b
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/inspector-toggle.tsx
@@ -0,0 +1,31 @@
+import { ActivityIcon } from "lucide-react";
+import {
+  toggleInspector,
+  useStreamInspector,
+} from "../hooks/use-stream-inspector";
+
+/**
+ * Floating icon in the bottom-right that opens the Stream Inspector.
+ * Complements the ⌘K keyboard shortcut with a discoverable affordance.
+ */
+export function InspectorToggle() {
+  const { records } = useStreamInspector();
+  // Badge counts the events of the first record only (0 when there is none).
+  const eventCount = records[0]?.events.length ?? 0;
+  return (
+    <button
+      type="button"
+      onClick={toggleInspector}
+      aria-label="Toggle stream inspector (⌘K)"
+      title="Stream Inspector (⌘K)"
+      className="fixed bottom-4 right-4 z-30 rounded-full bg-card border border-border shadow-lg p-3 hover:bg-muted transition-colors flex items-center gap-2"
+    >
+      <ActivityIcon className="h-4 w-4 text-foreground" />
+      {eventCount > 0 ? (
+        <span className="text-[10px] font-mono text-muted-foreground tabular-nums">
+          {eventCount}
+        </span>
+      ) : null}
+    </button>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/kpi-cards.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/kpi-cards.tsx
similarity index 100%
rename from apps/dev-playground/client/src/routes/smart-dashboard/components/kpi-cards.tsx
rename to apps/dev-playground/client/src/features/smart-dashboard/components/kpi-cards.tsx
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/query-section.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/query-section.tsx
similarity index 78%
rename from apps/dev-playground/client/src/routes/smart-dashboard/components/query-section.tsx
rename to apps/dev-playground/client/src/features/smart-dashboard/components/query-section.tsx
index 80612ff6a..9f0d60c24 100644
--- a/apps/dev-playground/client/src/routes/smart-dashboard/components/query-section.tsx
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/query-section.tsx
@@ -7,38 +7,42 @@ import {
   SparklesIcon,
 } from "lucide-react";
 import { useCallback, useState } from "react";
-import type { SSEEvent } from "../hooks/use-agent-stream";
-import { useAgentStream } from "../hooks/use-agent-stream";
 
 interface QuerySectionProps {
-  onEvent?: (event: SSEEvent) => void;
+  /** Dispatch a message through the chat pipeline. Owned by the route. */
+  onSend: (message: string) => void;
+  /** Streaming assistant text for the current run. */
+  content: string;
+  /** Whether a run is in flight. */
+  isLoading: boolean;
 }
 
 const EXAMPLE_QUERIES = [
-  "What's the busiest day of the week?",
-  "Filter to only trips from February 2016",
-  "Highlight Jan 10-15 on the chart",
-  "Show trips over $50 and highlight the peak",
+  "What's the busiest day of the week in 2016?",
+  "Filter to November 2016 only",
+  "Highlight the first week of Jan 2016 in red",
+  "Focus on the fare distribution chart",
+  "Clear all filters and highlights",
 ];
 
-export function QuerySection({ onEvent }: QuerySectionProps) {
+export function QuerySection({
+  onSend,
+  content,
+  isLoading,
+}: QuerySectionProps) {
   const [input, setInput] = useState("");
   const [showTips, setShowTips] = useState(true);
-  const { content, isLoading, send } = useAgentStream({
-    agentName: "query",
-    onEvent,
-  });
 
   const handleSubmit = useCallback(
     (e: React.FormEvent) => {
       e.preventDefault();
-      if (!input.trim() || isLoading) return;
       const message = input.trim();
+      if (!message || isLoading) return;
       setInput("");
       setShowTips(false);
-      send(message);
+      onSend(message);
     },
-    [input, isLoading, send],
+    [input, isLoading, onSend],
   );
 
   const handleExample = useCallback(
@@ -46,9 +50,9 @@ export function QuerySection({ onEvent }: QuerySectionProps) {
       if (isLoading) return;
       setInput("");
       setShowTips(false);
-      send(query);
+      onSend(query);
     },
-    [isLoading, send],
+    [isLoading, onSend],
   );
 
   return (
@@ -60,7 +64,7 @@ export function QuerySection({ onEvent }: QuerySectionProps) {
             Ask about the data
           </h3>
           <span className="text-xs text-muted-foreground">
-            — powered by the Query Agent
+            — query dispatcher routes to SQL analyst or dashboard pilot
           </span>
         </div>
         <button
@@ -76,18 +80,18 @@ export function QuerySection({ onEvent }: QuerySectionProps) {
         <div className="mb-4 rounded-lg border border-dashed border-border bg-muted/20 p-3">
           <p className="text-xs font-medium text-muted-foreground mb-2 flex items-center gap-1.5">
             <SparklesIcon className="h-3.5 w-3.5" />
-            This agent can control the dashboard directly
+            This agent can query data and control the dashboard
           </p>
           <div className="grid grid-cols-1 sm:grid-cols-2 gap-2 mb-3">
             <div className="flex items-start gap-2">
               <FilterIcon className="h-3.5 w-3.5 text-blue-500 mt-0.5 shrink-0" />
               <div>
                 <p className="text-xs font-medium text-foreground">
-                  Filter data
+                  Filter & highlight
                 </p>
                 <p className="text-[11px] text-muted-foreground">
-                  Ask to filter by date range, zone, or fare amount and the
-                  dashboard KPIs and charts will update live.
+                  Ask to filter by date, ZIP, or fare, or highlight a period.
+                  Dashboard updates live as the agent acts.
                 </p>
               </div>
             </div>
@@ -95,11 +99,11 @@ export function QuerySection({ onEvent }: QuerySectionProps) {
               <HighlighterIcon className="h-3.5 w-3.5 text-amber-500 mt-0.5 shrink-0" />
               <div>
                 <p className="text-xs font-medium text-foreground">
-                  Highlight periods
+                  Save view (approval gate)
                 </p>
                 <p className="text-[11px] text-muted-foreground">
-                  Ask to highlight a date range and a shaded overlay will appear
-                  on the Trips Over Time chart.
+                  Ask to save the current view — it's destructive, so you'll see
+                  an approval card before the agent can proceed.
                 </p>
               </div>
             </div>
@@ -125,7 +129,7 @@ export function QuerySection({ onEvent }: QuerySectionProps) {
           type="text"
           value={input}
           onChange={(e) => setInput(e.target.value)}
-          placeholder='Try "Filter to January 2016" or "Highlight the busiest week"'
+          placeholder='Try "Filter to January 2016" or "Save this view as Peak Week"'
           disabled={isLoading}
           className="flex-1 rounded-lg border border-border bg-background px-3 py-2 text-sm text-foreground placeholder:text-muted-foreground focus:outline-none focus:ring-2 focus:ring-ring disabled:opacity-50"
         />
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/quick-actions-bar.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/quick-actions-bar.tsx
new file mode 100644
index 000000000..c67aa0662
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/quick-actions-bar.tsx
@@ -0,0 +1,119 @@
+import { BookmarkPlusIcon, EraserIcon, FilterXIcon, XIcon } from "lucide-react";
+import { useCallback, useRef, useState } from "react";
+
+interface QuickActionsBarProps {
+  /**
+   * Dispatches a message through the chat pipeline (same `useAgentStream`
+   * the text input uses). Keeps the demo narrative honest: clicks are just
+   * prefilled prompts — the agent still reasons and the approval gate
+   * still fires for destructive actions.
+   */
+  onSend: (message: string) => void;
+  disabled?: boolean;
+}
+
+/**
+ * Row of one-click prompts; every action is sent through `onSend`.
+ */
+export function QuickActionsBar({
+  onSend,
+  disabled = false,
+}: QuickActionsBarProps) {
+  const [savingName, setSavingName] = useState<string | null>(null);
+  const saveInputRef = useRef<HTMLInputElement>(null);
+
+  const startSave = useCallback(() => {
+    setSavingName("");
+    // Deferred: the input only mounts after the state update re-renders.
+    setTimeout(() => saveInputRef.current?.focus(), 0);
+  }, []);
+
+  const cancelSave = useCallback(() => setSavingName(null), []);
+
+  const submitSave = useCallback(() => {
+    const name = savingName?.trim();
+    // Blank names just close the editor without sending anything.
+    if (name) onSend(`Save the current view as "${name}"`);
+    setSavingName(null);
+  }, [savingName, onSend]);
+
+  return (
+    <div className="flex items-center gap-2 flex-wrap">
+      <span className="text-[11px] uppercase tracking-wide text-muted-foreground font-medium mr-1">
+        Quick actions
+      </span>
+
+      {savingName === null ? (
+        <button
+          type="button"
+          onClick={startSave}
+          disabled={disabled}
+          className="inline-flex items-center gap-1.5 rounded-md border border-red-500/40 bg-red-500/5 px-2.5 py-1 text-xs text-red-700 dark:text-red-400 hover:bg-red-500/10 transition-colors disabled:opacity-50"
+          title="Save current view (destructive — requires approval)"
+        >
+          <BookmarkPlusIcon className="h-3.5 w-3.5" />
+          Save view…
+        </button>
+      ) : (
+        <div className="inline-flex items-center gap-1 rounded-md border border-red-500/40 bg-red-500/5 pl-2 pr-1 py-0.5">
+          <BookmarkPlusIcon className="h-3.5 w-3.5 text-red-600 shrink-0" />
+          <input
+            ref={saveInputRef}
+            type="text"
+            aria-label="View name"
+            value={savingName}
+            onChange={(e) => setSavingName(e.target.value)}
+            onKeyDown={(e) => {
+              if (e.key === "Enter") {
+                e.preventDefault();
+                submitSave();
+              } else if (e.key === "Escape") {
+                e.preventDefault();
+                cancelSave();
+              }
+            }}
+            placeholder="Name this view…"
+            disabled={disabled}
+            className="w-44 bg-transparent border-0 outline-none text-xs text-foreground placeholder:text-muted-foreground"
+          />
+          <button
+            type="button"
+            onClick={submitSave}
+            disabled={disabled || !savingName.trim()}
+            className="text-xs px-2 py-0.5 rounded bg-red-600 text-white hover:bg-red-700 disabled:opacity-40"
+          >
+            Save
+          </button>
+          <button
+            type="button"
+            onClick={cancelSave}
+            className="p-0.5 rounded text-muted-foreground hover:text-foreground"
+            aria-label="Cancel"
+          >
+            <XIcon className="h-3.5 w-3.5" />
+          </button>
+        </div>
+      )}
+
+      <button
+        type="button"
+        onClick={() => onSend("Clear all filters on the dashboard.")}
+        disabled={disabled}
+        className="inline-flex items-center gap-1.5 rounded-md border border-border bg-background px-2.5 py-1 text-xs text-foreground hover:bg-muted transition-colors disabled:opacity-50"
+      >
+        <FilterXIcon className="h-3.5 w-3.5" />
+        Clear filters
+      </button>
+
+      <button
+        type="button"
+        onClick={() => onSend("Clear all highlights from the charts.")}
+        disabled={disabled}
+        className="inline-flex items-center gap-1.5 rounded-md border border-border bg-background px-2.5 py-1 text-xs text-foreground hover:bg-muted transition-colors disabled:opacity-50"
+      >
+        <EraserIcon className="h-3.5 w-3.5" />
+        Clear highlights
+      </button>
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/stream-inspector.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/stream-inspector.tsx
new file mode 100644
index 000000000..adf15dccc
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/stream-inspector.tsx
@@ -0,0 +1,246 @@
+import { ChevronDownIcon, ChevronRightIcon, XIcon } from "lucide-react";
+import { useMemo, useState } from "react";
+import {
+  clearInspectorHistory,
+  closeInspector,
+  type StreamEventRecord,
+  type StreamRecord,
+  useStreamInspector,
+} from "../hooks/use-stream-inspector";
+
+type FilterMode =
+  | "all"
+  | "tool_calls"
+  | "messages"
+  | "approvals"
+  | "sub_agents";
+
+const FILTER_OPTIONS: Array<{ id: FilterMode; label: string }> = [
+  { id: "all", label: "All" },
+  { id: "tool_calls", label: "Tool calls" },
+  { id: "messages", label: "Messages" },
+  { id: "approvals", label: "Approvals" },
+  { id: "sub_agents", label: "Sub-agents" },
+];
+
+function matchesFilter(
+  event: StreamEventRecord["event"],
+  mode: FilterMode,
+): boolean {
+  if (mode === "all") return true;
+  if (mode === "messages") {
+    return (
+      event.type === "response.output_text.delta" ||
+      event.type === "response.output_item.added" ||
+      event.type === "response.output_item.done" ||
+      event.type === "response.completed"
+    );
+  }
+  if (mode === "tool_calls") {
+    return (
+      (event.type === "response.output_item.added" ||
+        event.type === "response.output_item.done") &&
+      event.item?.type === "function_call"
+    );
+  }
+  if (mode === "approvals") {
+    return event.type === "appkit.approval_pending";
+  }
+  if (mode === "sub_agents") {
+    // Sub-agent invocations surface as `agent-<key>` function_calls.
+    // NOTE(review): `appkit.metadata` events are NOT matched by this branch.
+    if (event.item?.type === "function_call") {
+      return event.item.name?.startsWith("agent-") ?? false;
+    }
+    return false;
+  }
+  return true;
+}
+
+function shortType(type: string): string {
+  // Strip a leading `response.` and then a leading `appkit.` for legibility.
+  return type.replace(/^response\./, "").replace(/^appkit\./, "");
+}
+
+function formatTimestamp(relMs: number): string {
+  const ms = Math.round(relMs); // round first: 999.6 → "1.00s", not "1000ms"
+  return ms < 1000 ? `${ms}ms` : `${(relMs / 1000).toFixed(2)}s`;
+}
+
+/** One collapsible timeline row: offset, event type, preview, raw JSON. */
+function EventRow({
+  event,
+  receivedAt,
+  startedAt,
+}: StreamEventRecord & { startedAt: number }) {
+  const [expanded, setExpanded] = useState(false);
+  const rel = receivedAt - startedAt;
+
+  const isFunctionCall = event.item?.type === "function_call";
+  const isApproval = event.type === "appkit.approval_pending";
+
+  // Short preview text; stays empty for event kinds without one.
+  const summary: string = isApproval
+    ? `approval: ${event.tool_name}`
+    : isFunctionCall
+      ? `${event.item?.name ?? "(unnamed)"}`
+      : event.type === "response.output_text.delta"
+        ? (event.delta ?? "")
+        : "";
+
+  return (
+    <div className="border-b border-border/40 last:border-0">
+      <button
+        type="button"
+        onClick={() => setExpanded((v) => !v)}
+        aria-expanded={expanded}
+        className="w-full px-3 py-2 flex items-start gap-2 text-left hover:bg-muted/40 transition-colors"
+      >
+        {expanded ? (
+          <ChevronDownIcon className="h-3.5 w-3.5 mt-0.5 shrink-0 text-muted-foreground" />
+        ) : (
+          <ChevronRightIcon className="h-3.5 w-3.5 mt-0.5 shrink-0 text-muted-foreground" />
+        )}
+        <div className="flex-1 min-w-0">
+          <div className="flex items-baseline gap-2">
+            <span className="text-[10px] font-mono text-muted-foreground tabular-nums w-12 shrink-0">
+              {formatTimestamp(rel)}
+            </span>
+            <span
+              className={`text-xs font-mono shrink-0 ${
+                isApproval
+                  ? "text-red-600"
+                  : isFunctionCall
+                    ? "text-primary"
+                    : "text-foreground"
+              }`}
+            >
+              {shortType(event.type)}
+            </span>
+            {summary && (
+              <span className="text-xs text-muted-foreground truncate">
+                {summary}
+              </span>
+            )}
+          </div>
+          {expanded && (
+            <pre className="mt-2 p-2 bg-muted/50 rounded text-[10px] font-mono text-foreground whitespace-pre-wrap break-all overflow-x-auto">
+              {JSON.stringify(event, null, 2)}
+            </pre>
+          )}
+        </div>
+      </button>
+    </div>
+  );
+}
+
+function RunBlock({ record }: { record: StreamRecord }) {
+  return (
+    <div className="mb-4">
+      <div className="px-3 py-2 bg-muted/60 border-y border-border text-xs">
+        <div className="font-medium text-foreground truncate">
+          {record.label}
+        </div>
+        <div className="text-[10px] text-muted-foreground mt-0.5">
+          {record.events.length} events · started{" "}
+          {new Date(
+            Date.now() - (performance.now() - record.startedAt),
+          ).toLocaleTimeString()}
+        </div>
+      </div>
+      <div>
+        {record.events.map((er, idx) => (
+          <EventRow
+            key={`${record.id}-${er.receivedAt}-${idx}`} // idx alone shifts when the list is filtered
+            event={er.event}
+            receivedAt={er.receivedAt}
+            startedAt={record.startedAt}
+          />
+        ))}
+      </div>
+    </div>
+  );
+}
+
+export function StreamInspector() {
+  const { isOpen, records } = useStreamInspector();
+  const [filter, setFilter] = useState<FilterMode>("all");
+  // Narrow each run's events to the active filter; "all" reuses `records`.
+  const filteredRecords = useMemo(() => {
+    if (filter === "all") return records;
+    return records.map((r) => ({
+      ...r,
+      events: r.events.filter((er) => matchesFilter(er.event, filter)),
+    }));
+  }, [records, filter]);
+  // Bail out only after the hooks above so they run on every render.
+  if (!isOpen) return null;
+
+  return (
+    <>
+      {/* biome-ignore lint/a11y/noStaticElementInteractions: backdrop dismiss */}
+      {/* biome-ignore lint/a11y/useKeyWithClickEvents: backdrop dismiss handled globally via Esc */}
+      <div
+        onClick={closeInspector}
+        className="fixed inset-0 bg-black/30 backdrop-blur-sm z-40"
+      />
+      <aside className="fixed top-0 right-0 bottom-0 w-[420px] bg-card border-l border-border shadow-2xl z-50 flex flex-col animate-in slide-in-from-right duration-200">
+        <header className="px-4 py-3 border-b border-border flex items-center justify-between shrink-0">
+          <div>
+            <h2 className="text-sm font-semibold text-foreground">
+              Stream Inspector
+            </h2>
+            <p className="text-[11px] text-muted-foreground">
+              Agent SSE timeline · ⌘K to toggle · Esc to close
+            </p>
+          </div>
+          <button
+            type="button"
+            onClick={closeInspector}
+            className="p-1 rounded-md hover:bg-muted text-muted-foreground hover:text-foreground transition-colors"
+            aria-label="Close inspector"
+          >
+            <XIcon className="h-4 w-4" />
+          </button>
+        </header>
+        <div className="px-3 py-2 border-b border-border flex items-center gap-1 flex-wrap shrink-0">
+          {FILTER_OPTIONS.map((opt) => (
+            <button
+              key={opt.id}
+              type="button"
+              onClick={() => setFilter(opt.id)}
+              aria-pressed={filter === opt.id}
+              className={`text-[11px] px-2 py-1 rounded-full transition-colors ${
+                filter === opt.id
+                  ? "bg-primary text-primary-foreground"
+                  : "bg-muted text-muted-foreground hover:bg-muted/70"
+              }`}
+            >
+              {opt.label}
+            </button>
+          ))}
+          <div className="flex-1" />
+          {records.length > 0 && (
+            <button
+              type="button"
+              onClick={clearInspectorHistory}
+              className="text-[11px] px-2 py-1 rounded-full text-muted-foreground hover:bg-muted transition-colors"
+            >
+              Clear
+            </button>
+          )}
+        </div>
+
+        <div className="flex-1 overflow-y-auto">
+          {filteredRecords.length === 0 ? (
+            <div className="p-6 text-center text-xs text-muted-foreground">
+              No events yet. Ask the agent something to see the SSE stream here.
+            </div>
+          ) : (
+            filteredRecords.map((r) => <RunBlock key={r.id} record={r} />)
+          )}
+        </div>
+      </aside>
+    </>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/components/trip-chart.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/trip-chart.tsx
similarity index 100%
rename from apps/dev-playground/client/src/routes/smart-dashboard/components/trip-chart.tsx
rename to apps/dev-playground/client/src/features/smart-dashboard/components/trip-chart.tsx
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-action-dispatcher.ts b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-action-dispatcher.ts
new file mode 100644
index 000000000..70981b6b8
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-action-dispatcher.ts
@@ -0,0 +1,227 @@
+import { useCallback, useRef } from "react";
+import type { SSEEvent } from "./use-agent-stream";
+import type { DashboardFilters } from "./use-dashboard-data";
+import { type FocusableChartId, focusChart } from "./use-focus-registry";
+
+export interface Highlight {
+  start: string; // period start, taken from the tool call's `start` argument
+  end: string; // period end, taken from the tool call's `end` argument
+  color: "blue" | "red" | "yellow"; // the dispatcher falls back to "blue"
+  label?: string; // optional caption; the dispatcher drops empty strings
+}
+
+const DASHBOARD_TOOLS = new Set<string>([
+  "filter_by_date_range",
+  "filter_by_pickup_zip",
+  "filter_by_fare",
+  "clear_filters",
+  "highlight_period",
+  "clear_highlights",
+  "focus_chart",
+]); // tool names the dispatcher acts on; any other name is ignored silently
+
+interface UseActionDispatcherOptions {
+  /** Receives an updater fn; avoids stale-closure bugs when the agent fires multiple tool calls back-to-back. */
+  onFilterUpdate: (
+    updater: (prev: DashboardFilters) => DashboardFilters,
+  ) => void;
+  onAddHighlight: (highlight: Highlight) => void; // one call per valid `highlight_period`
+  onClearFilters: () => void; // called for `clear_filters`
+  onClearHighlights: () => void; // called for `clear_highlights`
+  /** Called once per applied action with a short human-readable summary. Route surfaces it as a toast. */
+  onAction?: (summary: string) => void;
+  /** Called when a dashboard tool call cannot be applied (unparseable or invalid arguments). Tools outside DASHBOARD_TOOLS are ignored without calling this. */
+  onUnknownTool?: (name: string, args: unknown) => void;
+}
+
+/** Parses tool-call JSON `arguments`: `{}` when absent, `null` when malformed or not a keyed object (arrays are rejected). */
+function parseArgs(raw: string | undefined): Record<string, unknown> | null {
+  if (!raw) return {};
+  try {
+    const parsed: unknown = JSON.parse(raw);
+    if (typeof parsed !== "object" || parsed === null) return null;
+    return Array.isArray(parsed) ? null : (parsed as Record<string, unknown>);
+  } catch {
+    return null;
+  }
+}
+
+const CALL_ID_LRU_CAP = 128; // max call_ids remembered for dedupe; oldest are dropped first
+
+/**
+ * Translates `function_call` tool events from the agent's SSE stream into
+ * dashboard state mutations. Returns `{ handleEvent }` to feed events into.
+ *
+ * Correctness rules (learned the hard way):
+ *
+ * - Only acts on `response.output_item.done`, never `.added`. `.added` fires
+ *   with incomplete `arguments`, causing spurious JSON parse failures and,
+ *   worse, double-firing: `highlight_period` used to append the same band
+ *   twice because both events passed.
+ * - Dedupes by `call_id`. Keeps a bounded list (oldest ids evicted first;
+ *   a repeat hit does not refresh its position) so memory stays finite. A
+ *   new run clears the cache on `appkit.metadata`, each stream's first event.
+ * - Uses updater callbacks (`onFilterUpdate(prev => ...)`) instead of reading
+ *   `currentFilters` from props. Multi-tool-call runs within a single
+ *   render cycle would otherwise see stale filter state.
+ * - Emits a summary for every applied action via `onAction`. Silent success
+ *   is the worst failure mode here — if the user can't see what changed,
+ *   they can't tell whether the agent misfired.
+ */
+export function useActionDispatcher({
+  onFilterUpdate,
+  onAddHighlight,
+  onClearFilters,
+  onClearHighlights,
+  onAction,
+  onUnknownTool,
+}: UseActionDispatcherOptions) {
+  const seen = useRef<string[]>([]);
+
+  const markSeen = useCallback((callId: string): boolean => {
+    if (seen.current.includes(callId)) return true;
+    seen.current.push(callId);
+    if (seen.current.length > CALL_ID_LRU_CAP) {
+      seen.current.splice(0, seen.current.length - CALL_ID_LRU_CAP);
+    }
+    return false;
+  }, []);
+
+  const handleEvent = useCallback(
+    (event: SSEEvent) => {
+      // New run → fresh dedupe cache. `appkit.metadata` is the very first
+      // event the agents plugin emits for each stream.
+      if (event.type === "appkit.metadata") {
+        seen.current = [];
+        return;
+      }
+
+      if (event.type !== "response.output_item.done") return;
+      if (event.item?.type !== "function_call") return;
+
+      const name = event.item.name;
+      if (!name) return;
+
+      // Tools not owned by the dashboard (e.g. `analytics.query`, sub-agent
+      // `agent-sql_analyst`) flow through without a dispatcher side-effect.
+      if (!DASHBOARD_TOOLS.has(name)) return;
+
+      const callId = event.item.call_id;
+      if (callId && markSeen(callId)) return; // no call_id → never deduped
+
+      const args = parseArgs(event.item.arguments);
+      if (args === null) {
+        onUnknownTool?.(name, event.item.arguments);
+        return;
+      }
+
+      switch (name) {
+        case "filter_by_date_range": {
+          const start = args.start;
+          const end = args.end;
+          if (typeof start !== "string" || typeof end !== "string") {
+            onUnknownTool?.(name, args);
+            return;
+          }
+          onFilterUpdate((prev) => ({
+            ...prev,
+            date_from: start,
+            date_to: end,
+          }));
+          onAction?.(`Filtered to ${start} → ${end}`);
+          return;
+        }
+        case "filter_by_pickup_zip": {
+          const zip = args.zip;
+          if (typeof zip !== "string") {
+            onUnknownTool?.(name, args);
+            return;
+          }
+          onFilterUpdate((prev) => ({ ...prev, pickup_zip: zip }));
+          onAction?.(`Filtered to pickup ZIP ${zip}`);
+          return;
+        }
+        case "filter_by_fare": {
+          const min = typeof args.min === "number" ? args.min : undefined;
+          const max = typeof args.max === "number" ? args.max : undefined;
+          if (min === undefined && max === undefined) {
+            onUnknownTool?.(name, args);
+            return;
+          }
+          onFilterUpdate((prev) => ({
+            ...prev,
+            ...(min !== undefined ? { fare_min: String(min) } : {}),
+            ...(max !== undefined ? { fare_max: String(max) } : {}),
+          }));
+          const parts: string[] = [];
+          if (min !== undefined) parts.push(`≥ $${min}`);
+          if (max !== undefined) parts.push(`≤ $${max}`);
+          onAction?.(`Filtered by fare ${parts.join(" and ")}`);
+          return;
+        }
+        case "clear_filters": {
+          onClearFilters();
+          onAction?.("Filters cleared");
+          return;
+        }
+        case "highlight_period": {
+          const start = args.start;
+          const end = args.end;
+          if (typeof start !== "string" || typeof end !== "string") {
+            onUnknownTool?.(name, args);
+            return;
+          }
+          const color =
+            args.color === "red" || args.color === "yellow"
+              ? args.color
+              : "blue";
+          const label =
+            typeof args.label === "string" && args.label !== ""
+              ? args.label
+              : undefined;
+          onAddHighlight({ start, end, color, label });
+          onAction?.(
+            `Highlighted ${start} → ${end}${label ? ` (${label})` : ""}`,
+          );
+          return;
+        }
+        case "clear_highlights": {
+          onClearHighlights();
+          onAction?.("Highlights cleared");
+          return;
+        }
+        case "focus_chart": {
+          const id = args.chart_id;
+          if (
+            id !== "kpis" &&
+            id !== "trips_over_time" &&
+            id !== "fare_distribution"
+          ) {
+            onUnknownTool?.(name, args);
+            return;
+          }
+          focusChart(id as FocusableChartId);
+          onAction?.(`Focused ${id.replace(/_/g, " ")}`);
+          return;
+        }
+        default: {
+          // Runtime safety net, not a compile-time check (`name` is a plain
+          // string): reached only if DASHBOARD_TOOLS gains a tool without a case.
+          onUnknownTool?.(name, args);
+          return;
+        }
+      }
+    },
+    [
+      markSeen,
+      onFilterUpdate,
+      onAddHighlight,
+      onClearFilters,
+      onClearHighlights,
+      onAction,
+      onUnknownTool,
+    ],
+  );
+
+  return { handleEvent };
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-agent-stream.ts b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-agent-stream.ts
similarity index 78%
rename from apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-agent-stream.ts
rename to apps/dev-playground/client/src/features/smart-dashboard/hooks/use-agent-stream.ts
index 871b8b43c..9810b2618 100644
--- a/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-agent-stream.ts
+++ b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-agent-stream.ts
@@ -1,4 +1,5 @@
 import { useCallback, useRef, useState } from "react";
+import { beginStreamRun, recordStreamEvent } from "./use-stream-inspector";
 
 export interface SSEEvent {
   type: string;
@@ -18,6 +19,16 @@ export interface SSEEvent {
   error?: string;
   sequence_number?: number;
   output_index?: number;
+  // appkit.approval_pending payload
+  approval_id?: string;
+  stream_id?: string;
+  tool_name?: string;
+  args?: unknown;
+  annotations?: {
+    readOnly?: boolean;
+    destructive?: boolean;
+    idempotent?: boolean;
+  };
 }
 
 interface UseAgentStreamOptions {
@@ -25,12 +36,21 @@ interface UseAgentStreamOptions {
   onEvent?: (event: SSEEvent) => void;
 }
 
+interface SendOptions {
+  /**
+   * Text prepended to the user's message on the wire. Used by the Smart
+   * Dashboard route to inject active filters / highlights ahead of the
+   * user's question so the agent always knows what the user is looking at.
+   */
+  contextPrefix?: string;
+}
+
 interface UseAgentStreamReturn {
   content: string;
   events: SSEEvent[];
   isLoading: boolean;
   threadId: string | null;
-  send: (message: string) => Promise<void>;
+  send: (message: string, opts?: SendOptions) => Promise<void>;
   reset: () => void;
 }
 
@@ -53,18 +73,24 @@ export function useAgentStream({
   }, []);
 
   const send = useCallback(
-    async (message: string) => {
+    async (message: string, opts?: SendOptions) => {
       setIsLoading(true);
       setContent("");
       setEvents([]);
       contentRef.current = "";
 
+      const wire = opts?.contextPrefix
+        ? `${opts.contextPrefix}${message}`
+        : message;
+
+      const runId = beginStreamRun(`${agentName}: ${message.slice(0, 80)}`);
+
       try {
         const res = await fetch("/api/agents/chat", {
           method: "POST",
           headers: { "Content-Type": "application/json" },
           body: JSON.stringify({
-            message,
+            message: wire,
             agent: agentName,
             ...(threadId && { threadId }),
           }),
@@ -102,6 +128,7 @@ export function useAgentStream({
               const event: SSEEvent = JSON.parse(data);
               if (!event.type) continue;
               setEvents((prev) => [...prev, event]);
+              recordStreamEvent(runId, event);
               onEventRef.current?.(event);
 
               if (event.type === "appkit.metadata" && event.data?.threadId) {
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-chart-colors.ts b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-chart-colors.ts
similarity index 100%
rename from apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-chart-colors.ts
rename to apps/dev-playground/client/src/features/smart-dashboard/hooks/use-chart-colors.ts
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-dashboard-data.ts b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-dashboard-data.ts
similarity index 100%
rename from apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-dashboard-data.ts
rename to apps/dev-playground/client/src/features/smart-dashboard/hooks/use-dashboard-data.ts
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-focus-registry.ts b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-focus-registry.ts
new file mode 100644
index 000000000..6c1dc3773
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-focus-registry.ts
@@ -0,0 +1,51 @@
+import { useEffect, useRef, useState } from "react";
+
+/**
+ * Module-level focus registry. Chart wrappers register a callback under a
+ * stable id; `focusChart(id)` looks up the callback and invokes it to
+ * scroll the user's viewport to the chart and pulse a ring around it.
+ *
+ * Registrations live outside React state so the agent's SSE stream (which
+ * hands off to `focusChart` via `use-action-dispatcher`) never needs to
+ * thread a ref through the component tree.
+ */
+const registry = new Map<string, () => void>();
+
+export type FocusableChartId = "kpis" | "trips_over_time" | "fare_distribution";
+
+export function focusChart(id: FocusableChartId): void {
+  registry.get(id)?.(); // does nothing when no callback is registered under `id`
+}
+
+/**
+ * Registers `id` as a focusable chart. Returns a `setRef` callback for the
+ * wrapping element and a `focused` boolean that stays true for 1.2s after the
+ * latest `focusChart(id)` call; re-focusing restarts that window.
+ */
+export function useFocusable(id: FocusableChartId): {
+  setRef: (el: HTMLElement | null) => void;
+  focused: boolean;
+} {
+  const elRef = useRef<HTMLElement | null>(null);
+  const timerRef = useRef<number | undefined>(undefined);
+  const [focused, setFocused] = useState(false);
+  useEffect(() => {
+    const onFocus = (): void => {
+      const el = elRef.current;
+      if (!el) return;
+      el.scrollIntoView({ behavior: "smooth", block: "center" });
+      setFocused(true);
+      window.clearTimeout(timerRef.current); // an older reset must not cut this pulse short
+      timerRef.current = window.setTimeout(() => setFocused(false), 1200);
+    };
+    registry.set(id, onFocus);
+    return () => {
+      if (registry.get(id) === onFocus) registry.delete(id);
+    };
+  }, [id]);
+
+  const setRef = (el: HTMLElement | null): void => {
+    elRef.current = el;
+  };
+  return { setRef, focused };
+}
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-stream-inspector.ts b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-stream-inspector.ts
new file mode 100644
index 000000000..38b672138
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-stream-inspector.ts
@@ -0,0 +1,141 @@
+import { useCallback, useEffect, useSyncExternalStore } from "react";
+import type { SSEEvent } from "./use-agent-stream";
+
+/**
+ * Observability store for the agent SSE stream. Every chat message the
+ * dashboard sends gets a `StreamRecord`; each event the adapter yields is
+ * appended to that record with a `performance.now()` timestamp (same clock
+ * as `startedAt`). The Stream Inspector drawer renders these as a timeline.
+ *
+ * State is module-level on purpose — multiple components (the chat section,
+ * the agent sidebar, the inspector drawer itself) feed and read from the
+ * same store without wiring props or context. React only re-renders when
+ * `version` changes.
+ */
+
+export interface StreamEventRecord {
+  event: SSEEvent;
+  receivedAt: number; // `performance.now()` reading taken when the event was recorded
+}
+
+export interface StreamRecord {
+  id: string; // run id handed back by beginStreamRun
+  label: string;
+  startedAt: number; // `performance.now()` reading taken when the run began
+  events: StreamEventRecord[]; // appended in arrival order
+}
+
+const MAX_RECORDS = 5; // history cap; older runs fall off the end
+
+const state = {
+  isOpen: false,
+  records: [] as StreamRecord[], // newest run first
+};
+const listeners = new Set<() => void>();
+let version = 0; // bumped by notify(); serves as the useSyncExternalStore snapshot
+
+function notify(): void {
+  version++; // change the snapshot first so subscribers observe a new value
+  for (const fn of listeners) fn();
+}
+
+function subscribe(fn: () => void): () => void {
+  listeners.add(fn);
+  return () => {
+    listeners.delete(fn); // unsubscribe handle returned to the caller
+  };
+}
+
+function getVersion(): number {
+  return version; // snapshot getter; the value changes on every notify()
+}
+
+export function useStreamInspector(): {
+  isOpen: boolean;
+  records: StreamRecord[];
+} {
+  useSyncExternalStore(subscribe, getVersion, getVersion); // re-render whenever notify() bumps the version
+  return { isOpen: state.isOpen, records: state.records }; // live references into the module store
+}
+
+/** Opens a new run record (newest first, capped at MAX_RECORDS); returns its id. */
+export function beginStreamRun(label: string): string {
+  // Prefer a real UUID; otherwise build an id from the clock plus randomness.
+  const uuid = globalThis.crypto?.randomUUID?.() as string | undefined;
+  const fallbackId = (): string =>
+    `run_${Date.now().toString(36)}_${Math.random().toString(36).slice(2, 8)}`;
+  const runId = uuid ?? fallbackId();
+  const startedAt = performance.now();
+  const entry: StreamRecord = { id: runId, label, startedAt, events: [] };
+  const history = [entry, ...state.records];
+  state.records = history.slice(0, MAX_RECORDS);
+  notify();
+  return runId;
+}
+
+export function recordStreamEvent(runId: string, event: SSEEvent): void {
+  // Events for runs no longer in the history (evicted or cleared) are dropped.
+  const target = state.records.find(({ id }) => id === runId);
+  target?.events.push({ event, receivedAt: performance.now() });
+  if (target) notify();
+}
+
+export function openInspector(): void {
+  state.isOpen = true;
+  notify();
+}
+
+export function closeInspector(): void {
+  state.isOpen = false;
+  notify();
+}
+
+export function toggleInspector(): void {
+  state.isOpen = !state.isOpen;
+  notify();
+}
+
+export function clearInspectorHistory(): void {
+  state.records = []; // recordStreamEvent ignores later events for runs removed here
+  notify();
+}
+
+/**
+ * Binds ⌘K / Ctrl+K (case-insensitive, so Caps Lock does not break it) to
+ * toggle the inspector and `Esc` to close it. Mount once inside the route.
+ */
+export function useInspectorShortcuts(): void {
+  useEffect(() => {
+    const onKey = (e: KeyboardEvent): void => {
+      if (
+        e.key?.toLowerCase() === "k" && // `key` can be missing on synthetic events
+        (e.metaKey || e.ctrlKey) &&
+        !e.altKey &&
+        !e.shiftKey
+      ) {
+        e.preventDefault();
+        toggleInspector();
+      } else if (e.key === "Escape" && state.isOpen) {
+        closeInspector();
+      }
+    };
+    window.addEventListener("keydown", onKey);
+    return () => {
+      window.removeEventListener("keydown", onKey);
+    };
+  }, []);
+}
+
+/**
+ * Convenience hook returning the most recent run (`records[0]`; records are
+ * newest-first) or `null` if there is none. Meant for the sidebar's "pulse".
+ */
+export function useCurrentRun(): StreamRecord | null {
+  const { records } = useStreamInspector();
+  return records[0] ?? null;
+}
+
+// Hook form of the toggle: returns a memoised callback that calls
+// `toggleInspector()`. Per the original note, no caller uses it today.
+export const useStreamInspectorToggle: () => () => void = () =>
+  useCallback(() => toggleInspector(), []);
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/lib/dashboard-context.ts b/apps/dev-playground/client/src/features/smart-dashboard/lib/dashboard-context.ts
new file mode 100644
index 000000000..2348f6fef
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/lib/dashboard-context.ts
@@ -0,0 +1,41 @@
+import type { Highlight } from "../hooks/use-action-dispatcher";
+import type { DashboardFilters } from "../hooks/use-dashboard-data";
+
+/**
+ * Renders the dashboard's active filters and highlighted periods as a short
+ * text preamble for a chat message, ending in "User question: " so the
+ * caller can append the user's text directly.
+ *
+ * Filters whose value is `undefined` or `""` are omitted. Returns `""` when
+ * there is nothing to report, in which case nothing should be prepended.
+ */
+export function buildDashboardContext(
+  filters: DashboardFilters,
+  highlights: Highlight[],
+): string {
+  const sections: string[] = [];
+
+  const filterPairs: string[] = [];
+  for (const [name, setting] of Object.entries(filters)) {
+    if (setting === undefined || setting === "") continue;
+    filterPairs.push(`${name}=${setting}`);
+  }
+  if (filterPairs.length > 0) {
+    sections.push(`active filters: ${filterPairs.join(", ")}`);
+  }
+
+  const periods: string[] = [];
+  for (const { start, end, color, label } of highlights) {
+    // Only non-blue colours are spelled out in the preamble.
+    const colorTag = color === "blue" ? "" : ` [${color}]`;
+    const labelTag = label ? ` (${label})` : "";
+    periods.push(`${start}..${end}${colorTag}${labelTag}`);
+  }
+  if (periods.length > 0) {
+    sections.push(`highlighted periods: ${periods.join("; ")}`);
+  }
+
+  if (sections.length === 0) return "";
+
+  return `[Dashboard state] ${sections.join(". ")}.\n\nUser question: `;
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx b/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
index 16c39069c..4417d7669 100644
--- a/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
+++ b/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
@@ -1,16 +1,29 @@
 import { createFileRoute } from "@tanstack/react-router";
 import { LayoutDashboardIcon } from "lucide-react";
-import { useCallback, useState } from "react";
-import { ActiveFilters } from "./smart-dashboard/components/active-filters";
-import { AgentSidebar } from "./smart-dashboard/components/agent-sidebar";
-import { FareChart } from "./smart-dashboard/components/fare-chart";
-import { KPICards } from "./smart-dashboard/components/kpi-cards";
-import { QuerySection } from "./smart-dashboard/components/query-section";
-import { TripChart } from "./smart-dashboard/components/trip-chart";
-import type { Highlight } from "./smart-dashboard/hooks/use-action-dispatcher";
-import { useActionDispatcher } from "./smart-dashboard/hooks/use-action-dispatcher";
-import type { DashboardFilters } from "./smart-dashboard/hooks/use-dashboard-data";
-import { useDashboardData } from "./smart-dashboard/hooks/use-dashboard-data";
+import { useCallback, useMemo, useRef, useState } from "react";
+import { ActionToast } from "@/features/smart-dashboard/components/action-toast";
+import { ActiveFilters } from "@/features/smart-dashboard/components/active-filters";
+import { AgentSidebar } from "@/features/smart-dashboard/components/agent-sidebar";
+import {
+  ApprovalCard,
+  type PendingApproval,
+} from "@/features/smart-dashboard/components/approval-card";
+import { FareChart } from "@/features/smart-dashboard/components/fare-chart";
+import { FocusableChart } from "@/features/smart-dashboard/components/focusable-chart";
+import { InspectorToggle } from "@/features/smart-dashboard/components/inspector-toggle";
+import { KPICards } from "@/features/smart-dashboard/components/kpi-cards";
+import { QuerySection } from "@/features/smart-dashboard/components/query-section";
+import { QuickActionsBar } from "@/features/smart-dashboard/components/quick-actions-bar";
+import { StreamInspector } from "@/features/smart-dashboard/components/stream-inspector";
+import { TripChart } from "@/features/smart-dashboard/components/trip-chart";
+import type { Highlight } from "@/features/smart-dashboard/hooks/use-action-dispatcher";
+import { useActionDispatcher } from "@/features/smart-dashboard/hooks/use-action-dispatcher";
+import type { SSEEvent } from "@/features/smart-dashboard/hooks/use-agent-stream";
+import { useAgentStream } from "@/features/smart-dashboard/hooks/use-agent-stream";
+import type { DashboardFilters } from "@/features/smart-dashboard/hooks/use-dashboard-data";
+import { useDashboardData } from "@/features/smart-dashboard/hooks/use-dashboard-data";
+import { useInspectorShortcuts } from "@/features/smart-dashboard/hooks/use-stream-inspector";
+import { buildDashboardContext } from "@/features/smart-dashboard/lib/dashboard-context";
 
 export const Route = createFileRoute("/smart-dashboard")({
   component: SmartDashboardRoute,
@@ -19,24 +32,148 @@ export const Route = createFileRoute("/smart-dashboard")({
 function SmartDashboardRoute() {
   const [filters, setFilters] = useState<DashboardFilters>({});
   const [highlights, setHighlights] = useState<Highlight[]>([]);
+  const [pendingApprovals, setPendingApprovals] = useState<PendingApproval[]>(
+    [],
+  );
+  const [lastAction, setLastAction] = useState<string | null>(null);
+  const [error, setError] = useState<string | null>(null);
+
+  useInspectorShortcuts();
 
-  const { kpis, tripsOverTime, fareDistribution, isLoading } =
-    useDashboardData(filters);
+  // Dashboard data is keyed on the *current* filter state; the dispatcher
+  // mutates `filters` via setState updaters, so every new filter triggers
+  // a re-query automatically.
+  const {
+    kpis,
+    tripsOverTime,
+    fareDistribution,
+    isLoading: dataLoading,
+    error: dataError,
+  } = useDashboardData(filters);
+
+  // Dispatcher surfaces actions via `onAction`; toast shows them. A small
+  // stream of summaries arrives as the agent makes calls on `.done` events.
+  const pushAction = useCallback((summary: string) => {
+    setLastAction(summary);
+  }, []);
 
-  const handleFilterChange = useCallback((newFilters: DashboardFilters) => {
-    setFilters(newFilters);
+  const pushUnknown = useCallback((name: string, args: unknown) => {
+    const argsPreview = typeof args === "string" ? args : JSON.stringify(args);
+    setError(
+      `Agent emitted an unhandled tool call '${name}' with args ${argsPreview}. Ignoring — the dispatcher only handles the declared dashboard tools.`,
+    );
+    // Keep the inspector warning visible too:
+    // eslint-disable-next-line no-console
+    console.warn(`[dispatcher] unknown/invalid tool '${name}':`, args);
   }, []);
 
-  const handleHighlight = useCallback((highlight: Highlight) => {
-    setHighlights((prev) => [...prev, highlight]);
+  const handleFilterUpdate = useCallback(
+    (updater: (prev: DashboardFilters) => DashboardFilters) => {
+      setFilters(updater);
+    },
+    [],
+  );
+  const handleAddHighlight = useCallback((h: Highlight) => {
+    setHighlights((prev) => [...prev, h]);
   }, []);
+  const handleClearFilters = useCallback(() => setFilters({}), []);
+  const handleClearHighlights = useCallback(() => setHighlights([]), []);
+
+  const { handleEvent: handleDispatcherEvent } = useActionDispatcher({
+    onFilterUpdate: handleFilterUpdate,
+    onAddHighlight: handleAddHighlight,
+    onClearFilters: handleClearFilters,
+    onClearHighlights: handleClearHighlights,
+    onAction: pushAction,
+    onUnknownTool: pushUnknown,
+  });
+
+  const decideApproval = useCallback(
+    async (approvalId: string, decision: "approve" | "deny") => {
+      const approval = pendingApprovals.find(
+        (a) => a.approvalId === approvalId,
+      );
+      if (!approval) return;
+      try {
+        await fetch("/api/agents/approve", {
+          method: "POST",
+          headers: { "Content-Type": "application/json" },
+          body: JSON.stringify({
+            streamId: approval.streamId,
+            approvalId,
+            decision,
+          }),
+        });
+      } catch (e) {
+        setError(
+          `Approval failed: ${e instanceof Error ? e.message : "unknown"}`,
+        );
+      } finally {
+        setPendingApprovals((prev) =>
+          prev.filter((a) => a.approvalId !== approvalId),
+        );
+      }
+    },
+    [pendingApprovals],
+  );
+
+  // Context prefix is recomputed when filter/highlight state changes, so
+  // every `send()` carries the freshest snapshot even though useAgentStream
+  // is mounted once at the route level.
+  const contextPrefix = useMemo(
+    () => buildDashboardContext(filters, highlights),
+    [filters, highlights],
+  );
+  const contextPrefixRef = useRef(contextPrefix);
+  contextPrefixRef.current = contextPrefix;
+
+  const handleStreamEvent = useCallback(
+    (event: SSEEvent) => {
+      handleDispatcherEvent(event);
+
+      if (
+        event.type === "appkit.approval_pending" &&
+        event.approval_id &&
+        event.stream_id &&
+        event.tool_name
+      ) {
+        setPendingApprovals((prev) => [
+          ...prev,
+          {
+            approvalId: event.approval_id as string,
+            streamId: event.stream_id as string,
+            toolName: event.tool_name as string,
+            args: event.args,
+            annotations: event.annotations,
+          },
+        ]);
+      }
+
+      if (event.type === "error" && event.error) {
+        setError(event.error);
+      }
+    },
+    [handleDispatcherEvent],
+  );
 
-  const { handleEvent } = useActionDispatcher({
-    onFilterChange: handleFilterChange,
-    onHighlight: handleHighlight,
-    currentFilters: filters,
+  // Lifted to the route so the Quick Actions bar can dispatch through the
+  // same pipeline as the chat input. One agent stream, two callers.
+  const {
+    content,
+    isLoading: agentLoading,
+    send,
+  } = useAgentStream({
+    agentName: "query",
+    onEvent: handleStreamEvent,
   });
 
+  const dispatchToAgent = useCallback(
+    (message: string) => {
+      send(message, { contextPrefix: contextPrefixRef.current });
+    },
+    [send],
+  );
+
   const handleClearFilter = useCallback((key: keyof DashboardFilters) => {
     setFilters((prev) => {
       const next = { ...prev };
@@ -53,7 +190,7 @@ function SmartDashboardRoute() {
   return (
     <div className="min-h-screen bg-background text-foreground">
       <div className="max-w-[1400px] mx-auto px-4 py-4">
-        <header className="flex items-center gap-3 mb-5">
+        <header className="flex items-center gap-3 mb-4">
           <div className="rounded-lg bg-primary/10 p-2">
             <LayoutDashboardIcon className="h-5 w-5 text-primary" />
           </div>
@@ -62,11 +199,31 @@ function SmartDashboardRoute() {
               Smart Dashboard
             </h1>
             <p className="text-xs text-muted-foreground">
-              NYC Taxi Analytics — powered by 3 AI agents
+              NYC Taxi Analytics — powered by agents · press ⌘K for the stream
+              inspector
             </p>
           </div>
         </header>
 
+        <div className="mb-4">
+          <QuickActionsBar onSend={dispatchToAgent} disabled={agentLoading} />
+        </div>
+
+        {(error || dataError) && (
+          <div className="mb-4 rounded-lg border border-red-500/40 bg-red-500/5 p-3 text-xs text-red-700 dark:text-red-400">
+            <div className="flex items-start justify-between gap-3">
+              <div className="flex-1">{error ?? dataError}</div>
+              <button
+                type="button"
+                onClick={() => setError(null)}
+                className="text-red-600/70 hover:text-red-700 font-medium"
+              >
+                dismiss
+              </button>
+            </div>
+          </div>
+        )}
+
         <div className="mb-4">
           <ActiveFilters
             filters={filters}
@@ -76,25 +233,50 @@ function SmartDashboardRoute() {
         </div>
 
         <div className="mb-5">
-          <KPICards data={kpis} isLoading={isLoading} />
+          <FocusableChart chartId="kpis">
+            <KPICards data={kpis} isLoading={dataLoading} />
+          </FocusableChart>
         </div>
 
         <div className="grid grid-cols-1 lg:grid-cols-[1fr_320px] gap-5 mb-5">
           <div className="space-y-5">
-            <TripChart
-              data={tripsOverTime}
-              highlights={highlights}
-              isLoading={isLoading}
-            />
-            <FareChart data={fareDistribution} isLoading={isLoading} />
+            <FocusableChart chartId="trips_over_time">
+              <TripChart
+                data={tripsOverTime}
+                highlights={highlights}
+                isLoading={dataLoading}
+              />
+            </FocusableChart>
+            <FocusableChart chartId="fare_distribution">
+              <FareChart data={fareDistribution} isLoading={dataLoading} />
+            </FocusableChart>
           </div>
           <div className="lg:h-[580px]">
-            <AgentSidebar kpis={kpis} kpisLoaded={!isLoading} />
+            <AgentSidebar kpis={kpis} kpisLoaded={!dataLoading} />
           </div>
         </div>
 
-        <QuerySection onEvent={handleEvent} />
+        <div className="space-y-4">
+          <QuerySection
+            onSend={dispatchToAgent}
+            content={content}
+            isLoading={agentLoading}
+          />
+          {pendingApprovals.map((approval) => (
+            <ApprovalCard
+              key={approval.approvalId}
+              approval={approval}
+              filters={filters}
+              highlights={highlights}
+              onDecide={decideApproval}
+            />
+          ))}
+        </div>
       </div>
+
+      <InspectorToggle />
+      <StreamInspector />
+      <ActionToast message={lastAction} />
     </div>
   );
 }
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-action-dispatcher.ts b/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-action-dispatcher.ts
deleted file mode 100644
index c15b86379..000000000
--- a/apps/dev-playground/client/src/routes/smart-dashboard/hooks/use-action-dispatcher.ts
+++ /dev/null
@@ -1,88 +0,0 @@
-import { useCallback } from "react";
-import type { SSEEvent } from "./use-agent-stream";
-import type { DashboardFilters } from "./use-dashboard-data";
-
-export interface Highlight {
-  start: string;
-  end: string;
-  color: "blue" | "red" | "yellow";
-  label?: string;
-}
-
-const DASHBOARD_TOOLS = new Set(["apply_filter", "highlight_period"]);
-
-interface UseActionDispatcherOptions {
-  onFilterChange: (filters: DashboardFilters) => void;
-  onHighlight: (highlight: Highlight) => void;
-  currentFilters: DashboardFilters;
-}
-
-export function useActionDispatcher({
-  onFilterChange,
-  onHighlight,
-  currentFilters,
-}: UseActionDispatcherOptions) {
-  const handleEvent = useCallback(
-    (event: SSEEvent) => {
-      if (
-        event.type !== "response.output_item.added" &&
-        event.type !== "response.output_item.done"
-      )
-        return;
-      if (event.item?.type !== "function_call") return;
-
-      const toolName = event.item.name;
-      if (!toolName || !DASHBOARD_TOOLS.has(toolName)) return;
-
-      let args: Record<string, unknown>;
-      try {
-        args = JSON.parse(event.item.arguments ?? "{}");
-      } catch {
-        return;
-      }
-
-      if (toolName === "apply_filter") {
-        const field = args.field as string;
-        const operator = args.operator as string;
-        const value = args.value as string | string[];
-
-        const newFilters = { ...currentFilters };
-
-        if (field === "date") {
-          if (operator === "between" && Array.isArray(value)) {
-            newFilters.date_from = value[0];
-            newFilters.date_to = value[1];
-          } else if (operator === "gt") {
-            newFilters.date_from = value as string;
-          } else if (operator === "lt") {
-            newFilters.date_to = value as string;
-          }
-        } else if (field === "pickup_zone" || field === "dropoff_zone") {
-          const zones = Array.isArray(value) ? value.join(",") : value;
-          newFilters.pickup_zip = zones as string;
-        } else if (field === "fare_range") {
-          if (operator === "between" && Array.isArray(value)) {
-            newFilters.fare_min = value[0];
-            newFilters.fare_max = value[1];
-          } else if (operator === "gt") {
-            newFilters.fare_min = value as string;
-          } else if (operator === "lt") {
-            newFilters.fare_max = value as string;
-          }
-        }
-
-        onFilterChange(newFilters);
-      } else if (toolName === "highlight_period") {
-        onHighlight({
-          start: args.start as string,
-          end: args.end as string,
-          color: (args.color as Highlight["color"]) ?? "blue",
-          label: args.label as string | undefined,
-        });
-      }
-    },
-    [onFilterChange, onHighlight, currentFilters],
-  );
-
-  return { handleEvent };
-}
diff --git a/apps/dev-playground/server/index.ts b/apps/dev-playground/server/index.ts
index 6a36ba734..2bb8c3a6a 100644
--- a/apps/dev-playground/server/index.ts
+++ b/apps/dev-playground/server/index.ts
@@ -84,33 +84,74 @@ const helper = createAgent({
  *   intentionally stubs — the tool-call JSON is the action payload.
  */
 
-const apply_filter = tool({
-  name: "apply_filter",
+// Narrow, single-purpose tools.
+//
+// The earlier polymorphic `apply_filter({ field, operator, value })` was
+// too expressive — the LLM could emit valid-looking calls the dispatcher
+// couldn't faithfully apply (e.g. `field: "dropoff_zone"` when the
+// dashboard only has a `pickup_zip` filter; `operator: "eq"` with a date).
+// Splitting into one tool per filter verb removes the whole class of
+// "agent said it worked but nothing moved" bugs.
+//
+// Each tool has exactly one client-side effect, rendered by
+// use-action-dispatcher. Server handlers are still stubs — the tool-call
+// JSON is the action payload.
+
+const filter_by_date_range = tool({ // UI tool: narrows the dashboard to a start/end date window
+  name: "filter_by_date_range",
+  description:
+    "Filter the dashboard to trips within a date range. Both start and end are required and must be ISO dates (YYYY-MM-DD) within 2016.",
+  schema: z.object({ // NOTE(review): plain strings; the ISO-format / 2016 constraint is stated in the description only, not enforced here
+    start: z.string().describe("Start date in ISO format, e.g. 2016-03-01"),
+    end: z.string().describe("End date in ISO format, e.g. 2016-03-31"),
+  }),
+  execute: async ({ start, end }) =>
+    `Filtered dashboard to trips between ${start} and ${end}.`, // confirmation text only; this handler does no filtering itself
+});
+
+const filter_by_pickup_zip = tool({
+  name: "filter_by_pickup_zip",
   description:
-    "Apply a filter to the dashboard data. This updates the KPIs and charts to reflect only the filtered data.",
+    "Filter the dashboard to trips originating from a specific pickup ZIP code. Use when the user asks about a specific pickup zone or ZIP.",
   schema: z.object({
-    field: z
-      .enum(["date", "pickup_zone", "dropoff_zone", "fare_range"])
-      .describe("The field to filter on"),
-    operator: z
-      .enum(["eq", "gt", "lt", "between", "in"])
-      .describe("The comparison operator"),
-    value: z
-      .union([z.string(), z.array(z.string())])
-      .describe(
-        "Filter value. For 'between', use an array of two values [start, end]. For 'in', use an array of values.",
-      ),
+    zip: z.string().describe("Pickup ZIP code, e.g. 10001"),
   }),
-  execute: async ({ field, operator, value }) => {
-    const valueStr = Array.isArray(value) ? value.join(" to ") : value;
-    return `Filter applied: ${field} ${operator} ${valueStr}. The dashboard will update to reflect this filter.`;
+  execute: async ({ zip }) =>
+    `Filtered dashboard to trips picked up in ${zip}.`,
+});
+
+const filter_by_fare = tool({ // UI tool: narrows the dashboard by a minimum and/or maximum fare
+  name: "filter_by_fare",
+  description:
+    "Filter the dashboard to trips within a fare range. At least one of min or max must be provided.",
+  schema: z
+    .object({
+      min: z.number().optional().describe("Minimum fare in USD"),
+      max: z.number().optional().describe("Maximum fare in USD"),
+    })
+    .refine((v) => v.min !== undefined || v.max !== undefined, { // rejects calls with neither bound; does not compare min against max
+      message: "Provide at least one of min or max.",
+    }),
+  execute: async ({ min, max }) => {
+    const parts = [] as string[]; // one clause per supplied bound
+    if (min !== undefined) parts.push(`>= $${min}`);
+    if (max !== undefined) parts.push(`<= $${max}`);
+    return `Filtered dashboard to trips with fare ${parts.join(" and ")}.`; // confirmation text only
   },
 });
 
+const clear_filters = tool({ // UI tool: asks the dashboard to drop every active filter
+  name: "clear_filters",
+  description:
+    "Remove all active filters from the dashboard. Use when the user asks to reset, clear, or remove filters.",
+  schema: z.object({}), // takes no arguments
+  execute: async () => "All filters cleared.", // stub: returns confirmation text only
+});
+
 const highlight_period = tool({
   name: "highlight_period",
   description:
-    "Highlight a time period on the dashboard charts to draw attention to a specific date range.",
+    "Highlight a time period on the Trips Over Time chart to draw attention to a specific date range.",
   schema: z.object({
     start: z.string().describe("Start date in ISO format (YYYY-MM-DD)"),
     end: z.string().describe("End date in ISO format (YYYY-MM-DD)"),
@@ -125,7 +166,50 @@ const highlight_period = tool({
   }),
   execute: async ({ start, end, color: _color, label }) => {
     const suffix = label ? ` (${label})` : "";
-    return `Highlighted period ${start} to ${end}${suffix} on the dashboard charts.`;
+    return `Highlighted period ${start} to ${end}${suffix} on the dashboard.`;
+  },
+});
+
+const clear_highlights = tool({ // UI tool: asks the dashboard to drop every highlight overlay
+  name: "clear_highlights",
+  description:
+    "Remove all highlight overlays from the charts. Use when the user asks to clear, reset, or remove highlights.",
+  schema: z.object({}), // takes no arguments
+  execute: async () => "All highlights cleared.", // stub: returns confirmation text only
+});
+
+const focus_chart = tool({ // UI tool: scroll to one chart and pulse it (behaviour as stated in the description)
+  name: "focus_chart",
+  description:
+    "Scroll the user's viewport to a specific chart on the dashboard and briefly pulse it to draw attention. Use when the user asks to 'look at' or 'focus on' a specific visualization.",
+  schema: z.object({ // NOTE(review): ids presumably mirror the client's FocusableChart chartId values; confirm "kpis" is wired up
+    chart_id: z
+      .enum(["kpis", "trips_over_time", "fare_distribution"])
+      .describe("Which chart to focus on"),
+  }),
+  execute: async ({ chart_id }) => `Focused on ${chart_id}.`, // stub: returns confirmation text only
+});
+
+// Destructive tool: exercises the approval gate. Server handler is a
+// stub — no view persistence — but `destructive: true` forces the
+// human-in-the-loop flow before the agent can call it.
+const save_view = tool({
+  name: "save_view",
+  description:
+    "Persist the current dashboard configuration (filters + highlights) as a named view the user can recall later. Destructive because it writes persistent user state; always surfaces the approval gate.",
+  annotations: { destructive: true, readOnly: false },
+  schema: z.object({
+    name: z.string().describe("Short human-readable name for the saved view"),
+    description: z
+      .string()
+      .optional()
+      .describe("Optional longer description for the saved view"),
+  }),
+  execute: async ({ name, description }) => {
+    const suffix = description ? `: ${description}` : ""; // a missing or empty description adds nothing
+    // Stub for the demo. A real impl would insert into a views table.
+    console.log(`[save_view] Saving view "${name}"${suffix}`);
+    return `Saved view "${name}"${suffix}.`; // same name/suffix as the log line; nothing is persisted here
   },
 });
 
@@ -145,14 +229,31 @@ const sql_analyst = createAgent({
 const dashboard_pilot = createAgent({
   instructions: [
     "You are the Smart Dashboard pilot. You do not query data — you manipulate the UI.",
-    "Use `apply_filter` to filter the dashboard by date range, zone, or fare range.",
-    "Use `highlight_period` to highlight a time range on the charts.",
-    "When the user asks to 'show me', 'filter to', or 'highlight' something, pick the matching tool and call it.",
-    "Always briefly state what you did after applying an action.",
-  ].join(" "),
+    "Filters:",
+    "- `filter_by_date_range({start, end})` — narrow to a date window within 2016.",
+    "- `filter_by_pickup_zip({zip})` — narrow to trips from a specific ZIP.",
+    "- `filter_by_fare({min?, max?})` — narrow by fare range (at least one bound required).",
+    "- `clear_filters()` — remove all active filters.",
+    "Highlights:",
+    "- `highlight_period({start, end, color?, label?})` — shade a date window on the trips chart.",
+    "- `clear_highlights()` — remove all shaded overlays.",
+    "Focus & save:",
+    "- `focus_chart({chart_id})` — scroll the viewport to `kpis`, `trips_over_time`, or `fare_distribution` and briefly pulse it.",
+    "- `save_view({name, description?})` — persist the current configuration. Destructive; the user will see an approval card.",
+    "Rules:",
+    "1. Pick the single tool that matches the user's intent. Do not chain filters unless the user asks for a compound filter.",
+    "2. Briefly state what you did after the tool returns. Do not narrate before calling the tool.",
+    "3. If the user's request is ambiguous (e.g. 'filter to last month' without a 2016 context), ask one clarifying question before calling any tool.",
+  ].join("\n"),
   tools: {
-    apply_filter,
+    filter_by_date_range,
+    filter_by_pickup_zip,
+    filter_by_fare,
+    clear_filters,
     highlight_period,
+    clear_highlights,
+    focus_chart,
+    save_view,
   },
 });
 
diff --git a/apps/dev-playground/shared/appkit-types/analytics.d.ts b/apps/dev-playground/shared/appkit-types/analytics.d.ts
index 43666dd06..6db948f81 100644
--- a/apps/dev-playground/shared/appkit-types/analytics.d.ts
+++ b/apps/dev-playground/shared/appkit-types/analytics.d.ts
@@ -48,6 +48,94 @@ declare module "@databricks/appkit-ui/react" {
           dummy: number;
         }>;
       };
+    dashboard_fare_distribution: {
+        name: "dashboard_fare_distribution";
+        parameters: {
+          /** STRING - use sql.string() */
+          dateFrom: SQLStringMarker;
+          /** STRING - use sql.string() */
+          dateTo: SQLStringMarker;
+          /** STRING - use sql.string() */
+          pickupZip: SQLStringMarker;
+        };
+        result: Array<{
+          /** @sqlType STRING */
+          fare_bucket: string;
+          /** @sqlType BIGINT */
+          trip_count: number;
+          /** @sqlType DOUBLE */
+          avg_distance: number;
+        }>;
+      };
+    dashboard_kpis: {
+        name: "dashboard_kpis";
+        parameters: {
+          /** STRING - use sql.string() */
+          dateFrom: SQLStringMarker;
+          /** STRING - use sql.string() */
+          dateTo: SQLStringMarker;
+          /** STRING - use sql.string() */
+          pickupZip: SQLStringMarker;
+          /** STRING - use sql.string() */
+          fareMin: SQLStringMarker;
+          /** STRING - use sql.string() */
+          fareMax: SQLStringMarker;
+        };
+        result: Array<{
+          /** @sqlType BIGINT */
+          total_trips: number;
+          /** @sqlType DOUBLE */
+          avg_fare: number;
+          /** @sqlType DOUBLE */
+          avg_distance: number;
+          /** @sqlType DOUBLE */
+          max_fare: number;
+          /** @sqlType DOUBLE */
+          min_fare: number;
+        }>;
+      };
+    dashboard_top_zone: {
+        name: "dashboard_top_zone";
+        parameters: {
+          /** STRING - use sql.string() */
+          dateFrom: SQLStringMarker;
+          /** STRING - use sql.string() */
+          dateTo: SQLStringMarker;
+          /** STRING - use sql.string() */
+          pickupZip: SQLStringMarker;
+          /** STRING - use sql.string() */
+          fareMin: SQLStringMarker;
+          /** STRING - use sql.string() */
+          fareMax: SQLStringMarker;
+        };
+        result: Array<{
+          /** @sqlType INT */
+          pickup_zip: number;
+          /** @sqlType BIGINT */
+          trip_count: number;
+        }>;
+      };
+    dashboard_trips_over_time: {
+        name: "dashboard_trips_over_time";
+        parameters: {
+          /** STRING - use sql.string() */
+          dateFrom: SQLStringMarker;
+          /** STRING - use sql.string() */
+          dateTo: SQLStringMarker;
+          /** STRING - use sql.string() */
+          pickupZip: SQLStringMarker;
+        };
+        result: Array<{
+          /** @sqlType DATE */
+          trip_date: string;
+          /** @sqlType BIGINT */
+          trip_count: number;
+          /** @sqlType DOUBLE */
+          avg_fare: number;
+          /** @sqlType DOUBLE */
+          total_revenue: number;
+        }>;
+      };
     example: {
         name: "example";
         parameters: Record<string, never>;

From 60c8ea6c9349277d3be349b7855c5ac16faf2c4f Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Mon, 4 May 2026 19:52:08 +0200
Subject: [PATCH 25/46] feat(appkit): sub-agent approval gate + save view to
 volume + saved views panel + floating chat

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 apps/dev-playground/client/package-lock.json  |  50 ++++
 apps/dev-playground/client/package.json       |   3 +-
 .../components/approval-card.tsx              | 147 +++++++++-
 .../components/chat-drawer.tsx                | 242 +++++++++++++++++
 .../components/query-section.tsx              | 167 ------------
 .../components/saved-views-panel.tsx          | 176 ++++++++++++
 .../hooks/use-action-dispatcher.ts            |  43 +++
 .../smart-dashboard/lib/capture-dashboard.ts  |  45 ++++
 .../src/routes/smart-dashboard.route.tsx      | 247 +++++++++++++----
 .../config/agents/query/agent.md              |   9 +-
 apps/dev-playground/server/index.ts           | 251 +++++++++++++++++-
 11 files changed, 1138 insertions(+), 242 deletions(-)
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/components/chat-drawer.tsx
 delete mode 100644 apps/dev-playground/client/src/features/smart-dashboard/components/query-section.tsx
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/components/saved-views-panel.tsx
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/lib/capture-dashboard.ts

diff --git a/apps/dev-playground/client/package-lock.json b/apps/dev-playground/client/package-lock.json
index 80bd5ad40..fb7e267b5 100644
--- a/apps/dev-playground/client/package-lock.json
+++ b/apps/dev-playground/client/package-lock.json
@@ -18,6 +18,7 @@
         "@tanstack/router-plugin": "1.133.22",
         "class-variance-authority": "0.7.1",
         "clsx": "2.1.1",
+        "html2canvas": "^1.4.1",
         "lucide-react": "0.546.0",
         "react": "19.2.0",
         "react-dom": "19.2.0",
@@ -3559,6 +3560,15 @@
       "dev": true,
       "license": "MIT"
     },
+    "node_modules/base64-arraybuffer": {
+      "version": "1.0.2",
+      "resolved": "https://registry.npmjs.org/base64-arraybuffer/-/base64-arraybuffer-1.0.2.tgz",
+      "integrity": "sha512-I3yl4r9QB5ZRY3XuJVEPfc2XhZO6YweFPI+UovAzn+8/hb3oJ6lnysaFcjVpkCPfVWFUDvoZ8kmVDP7WyRtYtQ==",
+      "license": "MIT",
+      "engines": {
+        "node": ">= 0.6.0"
+      }
+    },
     "node_modules/baseline-browser-mapping": {
       "version": "2.8.16",
       "resolved": "https://registry.npmjs.org/baseline-browser-mapping/-/baseline-browser-mapping-2.8.16.tgz",
@@ -3916,6 +3926,15 @@
         "node": ">= 8"
       }
     },
+    "node_modules/css-line-break": {
+      "version": "2.1.0",
+      "resolved": "https://registry.npmjs.org/css-line-break/-/css-line-break-2.1.0.tgz",
+      "integrity": "sha512-FHcKFCZcAha3LwfVBhCQbW2nCNbkZXn7KVUJcsT5/P8YmfsVja0FMPJr0B903j/E69HUphKiV9iQArX8SDYA4w==",
+      "license": "MIT",
+      "dependencies": {
+        "utrie": "^1.0.2"
+      }
+    },
     "node_modules/csstype": {
       "version": "3.1.3",
       "resolved": "https://registry.npmjs.org/csstype/-/csstype-3.1.3.tgz",
@@ -4711,6 +4730,19 @@
         "url": "https://github.com/sponsors/wooorm"
       }
     },
+    "node_modules/html2canvas": {
+      "version": "1.4.1",
+      "resolved": "https://registry.npmjs.org/html2canvas/-/html2canvas-1.4.1.tgz",
+      "integrity": "sha512-fPU6BHNpsyIhr8yyMpTLLxAbkaK8ArIBcmZIRiBLiDhjeqvXolaEmDGmELFuX9I4xDcaKKcJl+TKZLqruBbmWA==",
+      "license": "MIT",
+      "dependencies": {
+        "css-line-break": "^2.1.0",
+        "text-segmentation": "^1.0.3"
+      },
+      "engines": {
+        "node": ">=8.0.0"
+      }
+    },
     "node_modules/ignore": {
       "version": "5.3.2",
       "resolved": "https://registry.npmjs.org/ignore/-/ignore-5.3.2.tgz",
@@ -6215,6 +6247,15 @@
         "url": "https://opencollective.com/webpack"
       }
     },
+    "node_modules/text-segmentation": {
+      "version": "1.0.3",
+      "resolved": "https://registry.npmjs.org/text-segmentation/-/text-segmentation-1.0.3.tgz",
+      "integrity": "sha512-iOiPUo/BGnZ6+54OsWxZidGCsdU8YbE4PSpdPinp7DeMtUJNJBoJ/ouUSTJjHkh1KntHaltHl/gDs2FC4i5+Nw==",
+      "license": "MIT",
+      "dependencies": {
+        "utrie": "^1.0.2"
+      }
+    },
     "node_modules/tiny-invariant": {
       "version": "1.3.3",
       "resolved": "https://registry.npmjs.org/tiny-invariant/-/tiny-invariant-1.3.3.tgz",
@@ -6592,6 +6633,15 @@
         "react": "^16.8.0 || ^17.0.0 || ^18.0.0 || ^19.0.0"
       }
     },
+    "node_modules/utrie": {
+      "version": "1.0.2",
+      "resolved": "https://registry.npmjs.org/utrie/-/utrie-1.0.2.tgz",
+      "integrity": "sha512-1MLa5ouZiOmQzUbjbu9VmjLzn1QLXBhwpUa7kdLUQK+KQ5KA9I1vk5U4YHe/X2Ch7PYnJfWuWT+VbuxbGwljhw==",
+      "license": "MIT",
+      "dependencies": {
+        "base64-arraybuffer": "^1.0.2"
+      }
+    },
     "node_modules/vfile": {
       "version": "6.0.3",
       "resolved": "https://registry.npmjs.org/vfile/-/vfile-6.0.3.tgz",
diff --git a/apps/dev-playground/client/package.json b/apps/dev-playground/client/package.json
index 9bf90c3fd..98ea9f00c 100644
--- a/apps/dev-playground/client/package.json
+++ b/apps/dev-playground/client/package.json
@@ -20,6 +20,7 @@
     "@tanstack/router-plugin": "1.133.22",
     "class-variance-authority": "0.7.1",
     "clsx": "2.1.1",
+    "html2canvas": "^1.4.1",
     "lucide-react": "0.546.0",
     "react": "19.2.0",
     "react-dom": "19.2.0",
@@ -30,6 +31,7 @@
   },
   "devDependencies": {
     "@eslint/js": "9.36.0",
+    "@tailwindcss/postcss": "4.1.17",
     "@tanstack/router-cli": "1.133.20",
     "@types/node": "24.6.0",
     "@types/react": "19.2.2",
@@ -43,7 +45,6 @@
     "postcss": "8.5.6",
     "shiki": "3.15.0",
     "tailwindcss": "4.1.17",
-    "@tailwindcss/postcss": "4.1.17",
     "typescript": "5.9.3",
     "typescript-eslint": "8.45.0",
     "vite": "npm:rolldown-vite@7.1.14"
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx
index 70ff99130..dcb55e3fd 100644
--- a/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx
@@ -1,6 +1,8 @@
-import { ShieldAlertIcon } from "lucide-react";
+import { CheckCircle2Icon, ShieldAlertIcon } from "lucide-react";
+import { useCallback, useState } from "react";
 import type { Highlight } from "../hooks/use-action-dispatcher";
 import type { DashboardFilters } from "../hooks/use-dashboard-data";
+import { captureDashboardAsDataUrl } from "../lib/capture-dashboard";
 
 export interface PendingApproval {
   approvalId: string;
@@ -18,7 +20,11 @@ interface ApprovalCardProps {
   approval: PendingApproval;
   filters: DashboardFilters;
   highlights: Highlight[];
+  /** Root element to capture when the approved tool is `save_view`. */
+  dashboardRef: React.RefObject<HTMLElement | null>;
   onDecide: (approvalId: string, decision: "approve" | "deny") => void;
+  /** Notification surfaced back to the route for the toast. */
+  onSaved?: (info: { name: string; volumePath: string }) => void;
 }
 
 function formatFilters(filters: DashboardFilters): string {
@@ -43,13 +49,102 @@ export function ApprovalCard({
   approval,
   filters,
   highlights,
+  dashboardRef,
   onDecide,
+  onSaved,
 }: ApprovalCardProps) {
   const args =
     typeof approval.args === "object" && approval.args !== null
       ? (approval.args as Record<string, unknown>)
       : {};
   const isDestructive = approval.annotations?.destructive === true;
+  const isSaveView = approval.toolName === "save_view";
+
+  const [phase, setPhase] = useState<
+    | { kind: "idle" }
+    | { kind: "capturing" }
+    | { kind: "uploading"; previewUrl: string }
+    | { kind: "done"; volumePath: string }
+    | { kind: "error"; message: string }
+  >({ kind: "idle" });
+
+  // Approve handler. For every tool except `save_view` it only forwards
+  // the decision. For `save_view` it captures the dashboard, uploads it
+  // with the current filters/highlights, and approves only on success.
+  const handleApprove = useCallback(async () => {
+    if (!isSaveView) {
+      onDecide(approval.approvalId, "approve");
+      return;
+    }
+
+    const root = dashboardRef.current;
+    if (!root) {
+      setPhase({
+        kind: "error",
+        message:
+          "Cannot locate the dashboard element to capture. Contact support.",
+      });
+      return;
+    }
+
+    try {
+      setPhase({ kind: "capturing" });
+      // Conservative capture settings: AppKit's server plugin caps JSON
+      // bodies at 100kb by default. JPEG @ quality 0.75 + scale 0.6 keeps
+      // base64 payloads in the 25-60kb range for typical dashboard
+      // viewports with room for metadata (sent as `pngBase64` below).
+      const { dataUrl } = await captureDashboardAsDataUrl(root, {
+        quality: 0.75,
+        scale: 0.6,
+      });
+      setPhase({ kind: "uploading", previewUrl: dataUrl });
+
+      const name =
+        typeof args.name === "string" && args.name.trim() !== ""
+          ? args.name.trim()
+          : "Untitled view";
+      const description =
+        typeof args.description === "string" ? args.description : undefined;
+
+      const uploadRes = await fetch("/api/dashboard/save-view", {
+        method: "POST",
+        headers: { "Content-Type": "application/json" },
+        body: JSON.stringify({
+          name,
+          description,
+          filters,
+          highlights,
+          pngBase64: dataUrl,
+        }),
+      });
+
+      if (!uploadRes.ok) {
+        const err = await uploadRes.text();
+        throw new Error(`Upload failed (${uploadRes.status}): ${err}`);
+      }
+
+      const uploadJson = (await uploadRes.json()) as { volumePath: string };
+      setPhase({ kind: "done", volumePath: uploadJson.volumePath });
+      onSaved?.({ name, volumePath: uploadJson.volumePath });
+      onDecide(approval.approvalId, "approve");
+    } catch (err) {
+      setPhase({
+        kind: "error",
+        message: err instanceof Error ? err.message : String(err),
+      });
+    }
+  }, [
+    isSaveView,
+    args,
+    filters,
+    highlights,
+    dashboardRef,
+    onDecide,
+    onSaved,
+    approval.approvalId,
+  ]);
+
+  const busy = phase.kind === "capturing" || phase.kind === "uploading";
 
   return (
     <div className="rounded-xl border border-red-500/40 bg-red-500/[0.06] p-4 shadow-sm">
@@ -71,7 +166,9 @@ export function ApprovalCard({
             <code className="font-mono text-foreground">
               {approval.toolName}
             </code>
-            . Review the arguments before approving.
+            {isSaveView
+              ? ". Approving captures the current dashboard and uploads it as a saved view."
+              : ". Review the arguments before approving."}
           </p>
         </div>
       </div>
@@ -116,20 +213,58 @@ export function ApprovalCard({
         </div>
       </div>
 
+      {phase.kind === "uploading" && (
+        <div className="mb-3 rounded-md border border-border bg-muted/40 p-2">
+          <div className="text-[11px] text-muted-foreground mb-1.5 font-medium">
+            Captured preview (uploading…)
+          </div>
+          <img
+            src={phase.previewUrl}
+            alt="Dashboard preview"
+            className="max-h-40 w-full object-contain rounded border border-border bg-background"
+          />
+        </div>
+      )}
+
+      {phase.kind === "done" && (
+        <div className="mb-3 rounded-md border border-green-500/40 bg-green-500/10 p-2 flex items-center gap-2 text-xs text-green-700 dark:text-green-400">
+          <CheckCircle2Icon className="h-3.5 w-3.5 shrink-0" />
+          <span>
+            Saved to <code className="font-mono">{phase.volumePath}</code>
+          </span>
+        </div>
+      )}
+
+      {phase.kind === "error" && (
+        <div className="mb-3 rounded-md border border-red-500/40 bg-red-500/10 p-2 text-xs text-red-700 dark:text-red-400">
+          {phase.message}
+        </div>
+      )}
+
       <div className="flex gap-2 justify-end">
         <button
           type="button"
           onClick={() => onDecide(approval.approvalId, "deny")}
-          className="px-3 py-1.5 text-xs border border-border rounded-md hover:bg-muted transition-colors"
+          disabled={busy}
+          className="px-3 py-1.5 text-xs border border-border rounded-md hover:bg-muted transition-colors disabled:opacity-50"
         >
           Deny
         </button>
         <button
           type="button"
-          onClick={() => onDecide(approval.approvalId, "approve")}
-          className="px-3 py-1.5 text-xs bg-primary text-primary-foreground rounded-md hover:bg-primary/90 transition-colors font-medium"
+          onClick={handleApprove}
+          disabled={busy || phase.kind === "done"}
+          className="px-3 py-1.5 text-xs bg-primary text-primary-foreground rounded-md hover:bg-primary/90 transition-colors font-medium disabled:opacity-50"
         >
-          Approve
+          {phase.kind === "capturing"
+            ? "Capturing…"
+            : phase.kind === "uploading"
+              ? "Uploading…"
+              : phase.kind === "done"
+                ? "Approved"
+                : isSaveView
+                  ? "Approve & save"
+                  : "Approve"}
         </button>
       </div>
     </div>
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/chat-drawer.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/chat-drawer.tsx
new file mode 100644
index 000000000..0a37523a2
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/chat-drawer.tsx
@@ -0,0 +1,242 @@
+import {
+  FilterIcon,
+  Loader2Icon,
+  MessageSquareIcon,
+  SendIcon,
+  SparklesIcon,
+  XIcon,
+} from "lucide-react";
+import { useCallback, useEffect, useRef, useState } from "react";
+import type { PendingApproval } from "./approval-card";
+
+export interface ChatMessage {
+  id: string;
+  role: "user" | "assistant" | "system";
+  content: string;
+  /** True while this turn is still being streamed; MessageBubble pulses it. */
+  streaming?: boolean;
+}
+
+interface ChatDrawerProps {
+  messages: ChatMessage[];
+  isLoading: boolean;
+  onSend: (message: string) => void;
+  /** Called for every message; the result renders directly below that bubble. */
+  approvalCardForMessage: (messageId: string) => React.ReactNode | null;
+  pendingApprovals: PendingApproval[];
+  /** When greater than zero, shown as a red count badge on the floating toggle. */
+  unreadCount?: number;
+}
+
+const EXAMPLE_QUERIES = [
+  "Filter to November 2016",
+  "Highlight the first week of Jan 2016 in red",
+  "Save this view as Peak Week",
+  "Focus on the fare distribution",
+  "Clear all filters and highlights",
+];
+
+/**
+ * Floating chat drawer. Toggled by the ⌘J / Ctrl+J keyboard shortcut or the
+ * floating message-square button in the bottom-right; Escape closes it, and
+ * it opens itself whenever the pending-approval count changes to a non-zero
+ * value. The transcript is rendered from the `messages` prop, so earlier
+ * turns stay visible for as long as the parent keeps them; each bubble is
+ * followed by whatever `approvalCardForMessage` returns for its id.
+ */
+export function ChatDrawer({
+  messages,
+  isLoading,
+  onSend,
+  approvalCardForMessage,
+  pendingApprovals,
+  unreadCount,
+}: ChatDrawerProps) {
+  const [open, setOpen] = useState(false);
+  const [input, setInput] = useState("");
+  const [showTips, setShowTips] = useState(true);
+  const bottomRef = useRef<HTMLDivElement>(null);
+
+  useEffect(() => {
+    const onKey = (e: KeyboardEvent) => {
+      // Compare case-insensitively: with Caps Lock on, `e.key` reports "J".
+      const isChord = (e.metaKey || e.ctrlKey) && !e.altKey && !e.shiftKey;
+      if (isChord && e.key.toLowerCase() === "j") {
+        e.preventDefault();
+        setOpen((v) => !v);
+      } else if (e.key === "Escape" && open) {
+        setOpen(false);
+      }
+    };
+    window.addEventListener("keydown", onKey);
+    return () => window.removeEventListener("keydown", onKey);
+  }, [open]);
+
+  // Auto-open when a new approval arrives so users don't miss it.
+  useEffect(() => {
+    if (pendingApprovals.length > 0) setOpen(true);
+  }, [pendingApprovals.length]);
+
+  // biome-ignore lint/correctness/useExhaustiveDependencies: scroll on new messages
+  useEffect(() => {
+    bottomRef.current?.scrollIntoView({ behavior: "smooth" });
+  }, [messages.length, messages[messages.length - 1]?.content]);
+
+  const handleSubmit = useCallback(
+    (e: React.FormEvent) => {
+      e.preventDefault();
+      const msg = input.trim();
+      if (!msg || isLoading) return;
+      setInput("");
+      setShowTips(false);
+      onSend(msg);
+    },
+    [input, isLoading, onSend],
+  );
+
+  const handleExample = useCallback(
+    (q: string) => {
+      if (isLoading) return;
+      setShowTips(false);
+      onSend(q);
+    },
+    [isLoading, onSend],
+  );
+
+  return (
+    <>
+      <button
+        type="button"
+        onClick={() => setOpen((v) => !v)}
+        aria-label="Toggle chat (⌘J)"
+        aria-expanded={open}
+        title="Chat with the agent (⌘J)"
+        className="fixed bottom-4 right-20 z-30 rounded-full bg-primary text-primary-foreground shadow-lg hover:bg-primary/90 transition-colors p-3 flex items-center gap-1.5"
+      >
+        <MessageSquareIcon className="h-4 w-4" />
+        <span className="text-xs font-medium">Chat</span>
+        {(unreadCount ?? 0) > 0 && (
+          <span className="ml-1 inline-flex items-center justify-center w-4 h-4 text-[10px] bg-red-500 text-white rounded-full">
+            {unreadCount}
+          </span>
+        )}
+      </button>
+
+      {open && (
+        <aside className="fixed bottom-20 right-4 z-40 w-[420px] max-h-[calc(100vh-120px)] flex flex-col rounded-xl border border-border bg-card shadow-2xl animate-in slide-in-from-bottom-4 fade-in duration-200">
+          <header className="px-4 py-3 border-b border-border flex items-center justify-between shrink-0">
+            <div>
+              <h2 className="text-sm font-semibold text-foreground flex items-center gap-2">
+                <SparklesIcon className="h-4 w-4 text-primary" />
+                Dashboard Agent
+              </h2>
+              <p className="text-[11px] text-muted-foreground">
+                ⌘J toggle · Esc close · full history preserved
+              </p>
+            </div>
+            <button
+              type="button"
+              onClick={() => setOpen(false)}
+              className="p-1 rounded-md hover:bg-muted text-muted-foreground hover:text-foreground transition-colors"
+              aria-label="Close chat"
+            >
+              <XIcon className="h-4 w-4" />
+            </button>
+          </header>
+
+          <div className="flex-1 overflow-y-auto px-4 py-3 space-y-3 min-h-0">
+            {messages.length === 0 && (
+              <div className="text-xs text-muted-foreground text-center py-6">
+                Ask the agent to filter, highlight, focus, or save the
+                dashboard.
+              </div>
+            )}
+
+            {messages.map((m) => (
+              <div key={m.id} className="space-y-1">
+                <MessageBubble message={m} />
+                {approvalCardForMessage(m.id)}
+              </div>
+            ))}
+
+            {isLoading &&
+              messages[messages.length - 1]?.role !== "assistant" && (
+                <div className="flex items-center gap-2 text-xs text-muted-foreground pl-2">
+                  <Loader2Icon className="h-3 w-3 animate-spin" />
+                  Thinking…
+                </div>
+              )}
+
+            <div ref={bottomRef} />
+          </div>
+
+          {showTips && messages.length === 0 && (
+            <div className="px-4 pb-3 border-t border-border">
+              <div className="flex items-center gap-1.5 mt-3 mb-2 text-[11px] font-medium text-muted-foreground">
+                <FilterIcon className="h-3 w-3" />
+                Try one of these
+              </div>
+              <div className="flex flex-wrap gap-1.5">
+                {EXAMPLE_QUERIES.map((q) => (
+                  <button
+                    key={q}
+                    type="button"
+                    onClick={() => handleExample(q)}
+                    disabled={isLoading}
+                    className="rounded-md border border-border bg-background px-2 py-0.5 text-[11px] text-muted-foreground hover:text-foreground hover:border-primary/40 transition-colors disabled:opacity-50"
+                  >
+                    {q}
+                  </button>
+                ))}
+              </div>
+            </div>
+          )}
+
+          <form
+            onSubmit={handleSubmit}
+            className="px-4 py-3 border-t border-border flex gap-2 shrink-0"
+          >
+            <input
+              type="text"
+              value={input}
+              onChange={(e) => setInput(e.target.value)}
+              placeholder="Ask the dashboard…"
+              aria-label="Message the dashboard agent"
+              disabled={isLoading}
+              className="flex-1 rounded-lg border border-border bg-background px-3 py-1.5 text-sm focus:outline-none focus:ring-2 focus:ring-ring disabled:opacity-50"
+            />
+            <button
+              type="submit"
+              aria-label="Send message"
+              disabled={isLoading || !input.trim()}
+              className="inline-flex items-center gap-1 rounded-lg bg-primary px-3 py-1.5 text-xs font-medium text-primary-foreground hover:bg-primary/90 disabled:opacity-50 transition-colors"
+            >
+              {isLoading ? (
+                <Loader2Icon className="h-3.5 w-3.5 animate-spin" />
+              ) : (
+                <SendIcon className="h-3.5 w-3.5" />
+              )}
+            </button>
+          </form>
+        </aside>
+      )}
+    </>
+  );
+}
+
+/** One chat turn: user turns sit on the right, every other role on the left. */
+function MessageBubble({ message }: { message: ChatMessage }) {
+  const fromUser = message.role === "user";
+  const tone = fromUser
+    ? "bg-primary text-primary-foreground rounded-br-sm"
+    : "bg-muted text-foreground rounded-bl-sm";
+  const pulse = message.streaming ? "animate-pulse" : "";
+  // An empty bubble shows "…" only while the turn is still streaming.
+  const body = message.content || (message.streaming ? "…" : "");
+  const bubble = `max-w-[85%] px-3 py-2 rounded-lg text-sm whitespace-pre-wrap ${tone} ${pulse}`;
+  return (
+    <div className={`flex ${fromUser ? "justify-end" : "justify-start"}`}>
+      <div className={bubble}>{body}</div>
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/query-section.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/query-section.tsx
deleted file mode 100644
index 9f0d60c24..000000000
--- a/apps/dev-playground/client/src/features/smart-dashboard/components/query-section.tsx
+++ /dev/null
@@ -1,167 +0,0 @@
-import {
-  FilterIcon,
-  HighlighterIcon,
-  Loader2Icon,
-  SearchIcon,
-  SendIcon,
-  SparklesIcon,
-} from "lucide-react";
-import { useCallback, useState } from "react";
-
-interface QuerySectionProps {
-  /** Dispatch a message through the chat pipeline. Owned by the route. */
-  onSend: (message: string) => void;
-  /** Streaming assistant text for the current run. */
-  content: string;
-  /** Whether a run is in flight. */
-  isLoading: boolean;
-}
-
-const EXAMPLE_QUERIES = [
-  "What's the busiest day of the week in 2016?",
-  "Filter to November 2016 only",
-  "Highlight the first week of Jan 2016 in red",
-  "Focus on the fare distribution chart",
-  "Clear all filters and highlights",
-];
-
-export function QuerySection({
-  onSend,
-  content,
-  isLoading,
-}: QuerySectionProps) {
-  const [input, setInput] = useState("");
-  const [showTips, setShowTips] = useState(true);
-
-  const handleSubmit = useCallback(
-    (e: React.FormEvent) => {
-      e.preventDefault();
-      const message = input.trim();
-      if (!message || isLoading) return;
-      setInput("");
-      setShowTips(false);
-      onSend(message);
-    },
-    [input, isLoading, onSend],
-  );
-
-  const handleExample = useCallback(
-    (query: string) => {
-      if (isLoading) return;
-      setInput("");
-      setShowTips(false);
-      onSend(query);
-    },
-    [isLoading, onSend],
-  );
-
-  return (
-    <div className="rounded-xl border border-border bg-card p-5 shadow-sm">
-      <div className="flex items-center justify-between mb-4">
-        <div className="flex items-center gap-2">
-          <SearchIcon className="h-4 w-4 text-primary" />
-          <h3 className="text-sm font-semibold text-foreground">
-            Ask about the data
-          </h3>
-          <span className="text-xs text-muted-foreground">
-            — query dispatcher routes to SQL analyst or dashboard pilot
-          </span>
-        </div>
-        <button
-          type="button"
-          onClick={() => setShowTips((v) => !v)}
-          className="text-xs text-muted-foreground hover:text-foreground transition-colors"
-        >
-          {showTips ? "Hide tips" : "Show tips"}
-        </button>
-      </div>
-
-      {showTips && (
-        <div className="mb-4 rounded-lg border border-dashed border-border bg-muted/20 p-3">
-          <p className="text-xs font-medium text-muted-foreground mb-2 flex items-center gap-1.5">
-            <SparklesIcon className="h-3.5 w-3.5" />
-            This agent can query data and control the dashboard
-          </p>
-          <div className="grid grid-cols-1 sm:grid-cols-2 gap-2 mb-3">
-            <div className="flex items-start gap-2">
-              <FilterIcon className="h-3.5 w-3.5 text-blue-500 mt-0.5 shrink-0" />
-              <div>
-                <p className="text-xs font-medium text-foreground">
-                  Filter & highlight
-                </p>
-                <p className="text-[11px] text-muted-foreground">
-                  Ask to filter by date, ZIP, or fare, or highlight a period.
-                  Dashboard updates live as the agent acts.
-                </p>
-              </div>
-            </div>
-            <div className="flex items-start gap-2">
-              <HighlighterIcon className="h-3.5 w-3.5 text-amber-500 mt-0.5 shrink-0" />
-              <div>
-                <p className="text-xs font-medium text-foreground">
-                  Save view (approval gate)
-                </p>
-                <p className="text-[11px] text-muted-foreground">
-                  Ask to save the current view — it's destructive, so you'll see
-                  an approval card before the agent can proceed.
-                </p>
-              </div>
-            </div>
-          </div>
-          <div className="flex flex-wrap gap-1.5">
-            {EXAMPLE_QUERIES.map((q) => (
-              <button
-                key={q}
-                type="button"
-                onClick={() => handleExample(q)}
-                disabled={isLoading}
-                className="rounded-md border border-border bg-background px-2 py-1 text-[11px] text-muted-foreground hover:text-foreground hover:border-primary/40 transition-colors disabled:opacity-50"
-              >
-                {q}
-              </button>
-            ))}
-          </div>
-        </div>
-      )}
-
-      <form onSubmit={handleSubmit} className="flex gap-2 mb-4">
-        <input
-          type="text"
-          value={input}
-          onChange={(e) => setInput(e.target.value)}
-          placeholder='Try "Filter to January 2016" or "Save this view as Peak Week"'
-          disabled={isLoading}
-          className="flex-1 rounded-lg border border-border bg-background px-3 py-2 text-sm text-foreground placeholder:text-muted-foreground focus:outline-none focus:ring-2 focus:ring-ring disabled:opacity-50"
-        />
-        <button
-          type="submit"
-          disabled={isLoading || !input.trim()}
-          className="inline-flex items-center gap-1.5 rounded-lg bg-primary px-4 py-2 text-sm font-medium text-primary-foreground hover:bg-primary/90 disabled:opacity-50 transition-colors"
-        >
-          {isLoading ? (
-            <Loader2Icon className="h-4 w-4 animate-spin" />
-          ) : (
-            <SendIcon className="h-4 w-4" />
-          )}
-          Ask
-        </button>
-      </form>
-
-      {(content || isLoading) && (
-        <div className="rounded-lg border border-border bg-muted/30 p-4 max-h-[300px] overflow-y-auto">
-          {isLoading && !content && (
-            <div className="flex items-center gap-2 text-muted-foreground">
-              <Loader2Icon className="h-4 w-4 animate-spin" />
-              <span className="text-sm">Thinking...</span>
-            </div>
-          )}
-          {content && (
-            <div className="text-sm text-foreground whitespace-pre-wrap leading-relaxed">
-              {content}
-            </div>
-          )}
-        </div>
-      )}
-    </div>
-  );
-}
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/saved-views-panel.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/saved-views-panel.tsx
new file mode 100644
index 000000000..a04a86121
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/saved-views-panel.tsx
@@ -0,0 +1,176 @@
+import {
+  BookmarkIcon,
+  ChevronDownIcon,
+  ChevronUpIcon,
+  Loader2Icon,
+  RefreshCwIcon,
+} from "lucide-react";
+import { useCallback, useEffect, useState } from "react";
+
+export interface SavedView {
+  pngPath: string;
+  metaPath: string;
+  metadata: {
+    name?: string;
+    description?: string | null;
+    filters?: Record<string, unknown>;
+    highlights?: unknown[];
+    savedAt?: string;
+    savedBy?: string;
+    pngPath?: string;
+  };
+}
+
+interface SavedViewsPanelProps {
+  /**
+   * Send-to-chat callback. Clicking a saved view dispatches a load request
+   * through the agent so the approval/action trail stays consistent.
+   */
+  onLoad: (view: SavedView) => void;
+  /** Incrementing counter bumped by the route after each successful save. */
+  refreshToken: number;
+}
+
+/**
+ * Collapsible strip of saved dashboard views loaded from
+ * `/api/dashboard/saved-views`; clicking a card passes that view to `onLoad`.
+ */
+export function SavedViewsPanel({
+  onLoad,
+  refreshToken,
+}: SavedViewsPanelProps) {
+  const [open, setOpen] = useState(true);
+  const [views, setViews] = useState<SavedView[]>([]);
+  const [loading, setLoading] = useState(false);
+  const [error, setError] = useState<string | null>(null);
+  const ChevronIcon = open ? ChevronUpIcon : ChevronDownIcon;
+
+  const load = useCallback(async () => {
+    setLoading(true);
+    setError(null);
+    try {
+      const res = await fetch("/api/dashboard/saved-views");
+      if (!res.ok) {
+        const txt = await res.text();
+        throw new Error(`${res.status}: ${txt}`);
+      }
+      const data = (await res.json()) as { views?: SavedView[] };
+      setViews(Array.isArray(data.views) ? data.views : []);
+    } catch (err) {
+      setError(err instanceof Error ? err.message : String(err));
+    } finally {
+      setLoading(false);
+    }
+  }, []);
+
+  // biome-ignore lint/correctness/useExhaustiveDependencies: refreshToken is never read; bumping it re-runs the fetch
+  useEffect(() => {
+    load();
+  }, [load, refreshToken]);
+
+  return (
+    <div className="rounded-xl border border-border bg-card shadow-sm">
+      {/* Sibling buttons: a <button> must not be nested inside another. */}
+      <div className="flex items-center justify-between px-4 py-3">
+        <button
+          type="button"
+          onClick={() => setOpen((v) => !v)}
+          aria-expanded={open}
+          className="flex flex-1 items-center gap-2 text-left"
+        >
+          <BookmarkIcon className="h-4 w-4 text-primary" />
+          <span className="text-sm font-semibold text-foreground">
+            Saved views
+          </span>
+          <span className="text-xs text-muted-foreground">
+            {views.length > 0 ? `(${views.length})` : ""}
+          </span>
+        </button>
+        <div className="flex items-center gap-2">
+          {loading ? (
+            <Loader2Icon className="h-3.5 w-3.5 text-muted-foreground animate-spin" />
+          ) : (
+            <button
+              type="button"
+              onClick={() => load()}
+              className="p-1 rounded hover:bg-muted text-muted-foreground hover:text-foreground transition-colors"
+              aria-label="Refresh saved views"
+            >
+              <RefreshCwIcon className="h-3.5 w-3.5" />
+            </button>
+          )}
+          <button
+            type="button"
+            onClick={() => setOpen((v) => !v)}
+            aria-label={open ? "Collapse saved views" : "Expand saved views"}
+          >
+            <ChevronIcon className="h-4 w-4 text-muted-foreground" />
+          </button>
+        </div>
+      </div>
+      {open && (
+        <div className="px-4 pb-4">
+          {error && (
+            <div className="text-xs text-red-600 mb-2">
+              Failed to load: {error}
+            </div>
+          )}
+
+          {!error && views.length === 0 && !loading && (
+            <div className="text-xs text-muted-foreground py-3">
+              No saved views yet. Use the <em>Save view…</em> quick action or
+              ask the agent to save the current configuration.
+            </div>
+          )}
+
+          {views.length > 0 && (
+            <div className="flex gap-3 overflow-x-auto pb-1">
+              {views.map((view) => (
+                <SavedViewCard
+                  key={view.pngPath}
+                  view={view}
+                  onLoad={() => onLoad(view)}
+                />
+              ))}
+            </div>
+          )}
+        </div>
+      )}
+    </div>
+  );
+}
+
+/** Card for one saved view: the whole card is a button that calls `onLoad`. */
+function SavedViewCard({
+  view,
+  onLoad,
+}: {
+  view: SavedView;
+  onLoad: () => void;
+}) {
+  const parsed = new Date(view.metadata.savedAt ?? "");
+  // Missing or unparseable timestamps render blank, not "Invalid Date".
+  const savedAt = Number.isNaN(parsed.getTime()) ? "" : parsed.toLocaleString();
+  return (
+    <button
+      type="button"
+      onClick={onLoad}
+      className="shrink-0 w-56 rounded-lg border border-border bg-background hover:border-primary/40 hover:shadow-sm transition-all text-left overflow-hidden group"
+    >
+      <img
+        src={`/api/dashboard/saved-view-png?path=${encodeURIComponent(view.pngPath)}`}
+        alt={view.metadata.name ?? "saved view"}
+        className="w-full h-24 object-cover bg-muted border-b border-border"
+        loading="lazy"
+      />
+      <div className="p-2">
+        <div className="text-xs font-medium text-foreground truncate">
+          {view.metadata.name ?? "Untitled view"}
+        </div>
+        <div className="text-[10px] text-muted-foreground truncate">
+          {savedAt}
+        </div>
+      </div>
+    </button>
+  );
+}
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-action-dispatcher.ts b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-action-dispatcher.ts
index 70981b6b8..227cee81b 100644
--- a/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-action-dispatcher.ts
+++ b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-action-dispatcher.ts
@@ -18,6 +18,7 @@ const DASHBOARD_TOOLS = new Set<string>([
   "highlight_period",
   "clear_highlights",
   "focus_chart",
+  "load_view",
 ]);
 
 interface UseActionDispatcherOptions {
@@ -204,6 +205,48 @@ export function useActionDispatcher({
           onAction?.(`Focused ${id.replace(/_/g, " ")}`);
           return;
         }
+        case "load_view": {
+          const rawFilters = (args.filters ?? {}) as Record<string, unknown>;
+          const nextFilters: DashboardFilters = {};
+          if (typeof rawFilters.date_from === "string")
+            nextFilters.date_from = rawFilters.date_from;
+          if (typeof rawFilters.date_to === "string")
+            nextFilters.date_to = rawFilters.date_to;
+          if (typeof rawFilters.pickup_zip === "string")
+            nextFilters.pickup_zip = rawFilters.pickup_zip;
+          if (typeof rawFilters.fare_min === "string")
+            nextFilters.fare_min = rawFilters.fare_min;
+          if (typeof rawFilters.fare_max === "string")
+            nextFilters.fare_max = rawFilters.fare_max;
+
+          const rawHighlights = Array.isArray(args.highlights)
+            ? (args.highlights as Array<Record<string, unknown>>)
+            : [];
+          const nextHighlights: Highlight[] = rawHighlights.flatMap((h) => {
+            const start = h.start;
+            const end = h.end;
+            if (typeof start !== "string" || typeof end !== "string") return [];
+            const color: Highlight["color"] =
+              h.color === "red" || h.color === "yellow" ? h.color : "blue";
+            const label = typeof h.label === "string" ? h.label : undefined;
+            return [{ start, end, color, label }];
+          });
+
+          // Restore: clear then re-apply both filters and highlights in one
+          // shot so partial states don't linger.
+          onClearFilters();
+          onClearHighlights();
+          if (Object.keys(nextFilters).length > 0) {
+            onFilterUpdate(() => nextFilters);
+          }
+          for (const h of nextHighlights) {
+            onAddHighlight(h);
+          }
+          const viewName =
+            typeof args.name === "string" ? args.name : "saved view";
+          onAction?.(`Loaded "${viewName}"`);
+          return;
+        }
         default: {
           // DASHBOARD_TOOLS membership already filtered unknowns; this branch
           // is a compile-time exhaustiveness check.
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/lib/capture-dashboard.ts b/apps/dev-playground/client/src/features/smart-dashboard/lib/capture-dashboard.ts
new file mode 100644
index 000000000..90c892f91
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/lib/capture-dashboard.ts
@@ -0,0 +1,45 @@
+import html2canvas from "html2canvas";
+
+/**
+ * Captures an element to a compressed JPEG data URL and reports the
+ * rendered canvas size in pixels.
+ *
+ * We deliberately use JPEG at `scale` 1 (`quality` 0.85 by default) instead
+ * of PNG because AppKit's server plugin applies `express.json()` globally
+ * with its default 100kb body limit. A full-fidelity dashboard PNG encoded
+ * in base64 is typically 200-600kb — over the limit — while the JPEG keeps
+ * payloads to ~40-80kb base64 for the Smart Dashboard viewport,
+ * comfortably under it.
+ *
+ * If the payload ever needs to grow (higher fidelity, larger viewports),
+ * switch to a raw body route (`express.raw`) with an explicit larger limit.
+ */
+export async function captureDashboardAsDataUrl(
+  el: HTMLElement,
+  opts: { quality?: number; scale?: number } = {},
+): Promise<{ dataUrl: string; widthPx: number; heightPx: number }> {
+  const quality = opts.quality ?? 0.85;
+  const scale = opts.scale ?? 1;
+
+  const canvas = await html2canvas(el, {
+    backgroundColor: readCssVar(el, "--background") ?? "#ffffff",
+    scale,
+    // Load any images via CORS; charts are same-origin SVG/canvas.
+    useCORS: true,
+    // Never taint the canvas: a tainted canvas cannot be read by toDataURL.
+    allowTaint: false,
+    logging: false,
+  });
+
+  const dataUrl = canvas.toDataURL("image/jpeg", quality);
+  return { dataUrl, widthPx: canvas.width, heightPx: canvas.height };
+}
+
+function readCssVar(el: HTMLElement, name: string): string | null {
+  // Resolve the custom property on `el`; an unset variable reads back as "".
+  const value = getComputedStyle(el).getPropertyValue(name).trim();
+  if (value === "") return null;
+  // A leading digit means a bare HSL triplet ("0 0% 100%") rather than a
+  // complete color such as hsl(...); wrap it so it parses as a color.
+  return /^\d/.test(value) ? `hsl(${value})` : value;
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx b/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
index 4417d7669..050428b8e 100644
--- a/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
+++ b/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
@@ -8,12 +8,19 @@ import {
   ApprovalCard,
   type PendingApproval,
 } from "@/features/smart-dashboard/components/approval-card";
+import {
+  ChatDrawer,
+  type ChatMessage,
+} from "@/features/smart-dashboard/components/chat-drawer";
 import { FareChart } from "@/features/smart-dashboard/components/fare-chart";
 import { FocusableChart } from "@/features/smart-dashboard/components/focusable-chart";
 import { InspectorToggle } from "@/features/smart-dashboard/components/inspector-toggle";
 import { KPICards } from "@/features/smart-dashboard/components/kpi-cards";
-import { QuerySection } from "@/features/smart-dashboard/components/query-section";
 import { QuickActionsBar } from "@/features/smart-dashboard/components/quick-actions-bar";
+import {
+  type SavedView,
+  SavedViewsPanel,
+} from "@/features/smart-dashboard/components/saved-views-panel";
 import { StreamInspector } from "@/features/smart-dashboard/components/stream-inspector";
 import { TripChart } from "@/features/smart-dashboard/components/trip-chart";
 import type { Highlight } from "@/features/smart-dashboard/hooks/use-action-dispatcher";
@@ -29,6 +36,13 @@ export const Route = createFileRoute("/smart-dashboard")({
   component: SmartDashboardRoute,
 });
 
+// Lightweight id factory for chat messages. Not using crypto.randomUUID
+// because the value is only meaningful for React keys + approval lookup
+// inside a single session.
+let messageIdCounter = 0;
+const nextMessageId = (): string =>
+  `msg_${++messageIdCounter}_${Math.random().toString(36).slice(2, 8)}`;
+
 function SmartDashboardRoute() {
   const [filters, setFilters] = useState<DashboardFilters>({});
   const [highlights, setHighlights] = useState<Highlight[]>([]);
@@ -38,11 +52,19 @@ function SmartDashboardRoute() {
   const [lastAction, setLastAction] = useState<string | null>(null);
   const [error, setError] = useState<string | null>(null);
 
+  // Multi-turn chat history. Messages accumulate across sends so the user
+  // can scroll back through the conversation rather than having the UI
+  // wipe itself after every reply.
+  const [messages, setMessages] = useState<ChatMessage[]>([]);
+  const activeAssistantIdRef = useRef<string | null>(null);
+  const lastUserMessageIdRef = useRef<string | null>(null);
+
+  // Saved-views panel bumps this token after an upload to force a list
+  // refresh without pushing props down through ApprovalCard manually.
+  const [savedViewsVersion, setSavedViewsVersion] = useState(0);
+
   useInspectorShortcuts();
 
-  // Dashboard data is keyed on the *current* filter state; the dispatcher
-  // mutates `filters` via setState updaters, so every new filter triggers
-  // a re-query automatically.
   const {
     kpis,
     tripsOverTime,
@@ -51,8 +73,6 @@ function SmartDashboardRoute() {
     error: dataError,
   } = useDashboardData(filters);
 
-  // Dispatcher surfaces actions via `onAction`; toast shows them. A small
-  // stream of summaries arrives as the agent makes calls on `.done` events.
   const pushAction = useCallback((summary: string) => {
     setLastAction(summary);
   }, []);
@@ -60,10 +80,8 @@ function SmartDashboardRoute() {
   const pushUnknown = useCallback((name: string, args: unknown) => {
     const argsPreview = typeof args === "string" ? args : JSON.stringify(args);
     setError(
-      `Agent emitted an unhandled tool call '${name}' with args ${argsPreview}. Ignoring — the dispatcher only handles the declared dashboard tools.`,
+      `Agent emitted an unhandled tool call '${name}' with args ${argsPreview}. Ignoring.`,
     );
-    // Keep the inspector warning visible too:
-    // eslint-disable-next-line no-console
     console.warn(`[dispatcher] unknown/invalid tool '${name}':`, args);
   }, []);
 
@@ -117,9 +135,6 @@ function SmartDashboardRoute() {
     [pendingApprovals],
   );
 
-  // Context prefix is recomputed when filter/highlight state changes, so
-  // every `send()` carries the freshest snapshot even though useAgentStream
-  // is mounted once at the route level.
   const contextPrefix = useMemo(
     () => buildDashboardContext(filters, highlights),
     [filters, highlights],
@@ -131,12 +146,15 @@ function SmartDashboardRoute() {
     (event: SSEEvent) => {
       handleDispatcherEvent(event);
 
+      // Capture pending approvals and pin them to the user turn that
+      // triggered them so the ChatDrawer can render the card inline.
       if (
         event.type === "appkit.approval_pending" &&
         event.approval_id &&
         event.stream_id &&
         event.tool_name
       ) {
+        const pinnedToMessageId = lastUserMessageIdRef.current;
         setPendingApprovals((prev) => [
           ...prev,
           {
@@ -145,10 +163,38 @@ function SmartDashboardRoute() {
             toolName: event.tool_name as string,
             args: event.args,
             annotations: event.annotations,
-          },
+            ...(pinnedToMessageId
+              ? { _pinnedToMessageId: pinnedToMessageId }
+              : {}),
+          } as PendingApproval & { _pinnedToMessageId?: string },
         ]);
       }
 
+      // Stream assistant text into the in-progress assistant message.
+      if (event.type === "response.output_text.delta" && event.delta) {
+        const id = activeAssistantIdRef.current;
+        if (id) {
+          setMessages((prev) =>
+            prev.map((m) =>
+              m.id === id
+                ? { ...m, content: m.content + (event.delta ?? "") }
+                : m,
+            ),
+          );
+        }
+      }
+
+      // Finalize the streaming assistant message when the run completes.
+      if (event.type === "response.completed") {
+        const id = activeAssistantIdRef.current;
+        if (id) {
+          setMessages((prev) =>
+            prev.map((m) => (m.id === id ? { ...m, streaming: false } : m)),
+          );
+          activeAssistantIdRef.current = null;
+        }
+      }
+
       if (event.type === "error" && event.error) {
         setError(event.error);
       }
@@ -156,24 +202,43 @@ function SmartDashboardRoute() {
     [handleDispatcherEvent],
   );
 
-  // Lifted to the route so the Quick Actions bar can dispatch through the
-  // same pipeline as the chat input. One agent stream, two callers.
-  const {
-    content,
-    isLoading: agentLoading,
-    send,
-  } = useAgentStream({
+  const { isLoading: agentLoading, send } = useAgentStream({
     agentName: "query",
     onEvent: handleStreamEvent,
   });
 
   const dispatchToAgent = useCallback(
     (message: string) => {
+      const userMsgId = nextMessageId();
+      const assistantMsgId = nextMessageId();
+      lastUserMessageIdRef.current = userMsgId;
+      activeAssistantIdRef.current = assistantMsgId;
+      setMessages((prev) => [
+        ...prev,
+        { id: userMsgId, role: "user", content: message },
+        { id: assistantMsgId, role: "assistant", content: "", streaming: true },
+      ]);
       send(message, { contextPrefix: contextPrefixRef.current });
     },
     [send],
   );
 
+  const handleLoadSavedView = useCallback(
+    (view: SavedView) => {
+      const name = view.metadata.name ?? "saved view";
+      dispatchToAgent(`Load the saved view '${name}'`);
+    },
+    [dispatchToAgent],
+  );
+
+  const handleSavedNotification = useCallback(
+    (info: { name: string; volumePath: string }) => {
+      setLastAction(`Saved "${info.name}" to volume`);
+      setSavedViewsVersion((v) => v + 1);
+    },
+    [],
+  );
+
   const handleClearFilter = useCallback((key: keyof DashboardFilters) => {
     setFilters((prev) => {
       const next = { ...prev };
@@ -187,6 +252,56 @@ function SmartDashboardRoute() {
     setHighlights([]);
   }, []);
 
+  // Ref to the captured region for save_view. Kept on the dashboard body
+  // (not the header/chat) so the screenshot is the analytics surface only.
+  const dashboardRef = useRef<HTMLDivElement | null>(null);
+
+  // ApprovalCards render inline in the chat drawer, pinned to the user
+  // turn that triggered them. Lookup rebuilds when pendingApprovals changes.
+  const approvalsByMessage = useMemo(() => {
+    const map = new Map<string, PendingApproval[]>();
+    for (const a of pendingApprovals) {
+      const pinId =
+        (a as PendingApproval & { _pinnedToMessageId?: string })
+          ._pinnedToMessageId ?? "__loose";
+      const arr = map.get(pinId) ?? [];
+      arr.push(a);
+      map.set(pinId, arr);
+    }
+    return map;
+  }, [pendingApprovals]);
+
+  const approvalCardForMessage = useCallback(
+    (messageId: string): React.ReactNode | null => {
+      const bucket = approvalsByMessage.get(messageId);
+      if (!bucket || bucket.length === 0) return null;
+      return (
+        <div className="space-y-2">
+          {bucket.map((approval) => (
+            <ApprovalCard
+              key={approval.approvalId}
+              approval={approval}
+              filters={filters}
+              highlights={highlights}
+              dashboardRef={dashboardRef}
+              onDecide={decideApproval}
+              onSaved={handleSavedNotification}
+            />
+          ))}
+        </div>
+      );
+    },
+    [
+      approvalsByMessage,
+      filters,
+      highlights,
+      decideApproval,
+      handleSavedNotification,
+    ],
+  );
+
+  const looseApprovals = approvalsByMessage.get("__loose") ?? [];
+
   return (
     <div className="min-h-screen bg-background text-foreground">
       <div className="max-w-[1400px] mx-auto px-4 py-4">
@@ -199,8 +314,7 @@ function SmartDashboardRoute() {
               Smart Dashboard
             </h1>
             <p className="text-xs text-muted-foreground">
-              NYC Taxi Analytics — powered by agents · press ⌘K for the stream
-              inspector
+              NYC Taxi Analytics · ⌘J chat · ⌘K stream inspector
             </p>
           </div>
         </header>
@@ -224,6 +338,13 @@ function SmartDashboardRoute() {
           </div>
         )}
 
+        <div className="mb-4">
+          <SavedViewsPanel
+            onLoad={handleLoadSavedView}
+            refreshToken={savedViewsVersion}
+          />
+        </div>
+
         <div className="mb-4">
           <ActiveFilters
             filters={filters}
@@ -232,51 +353,63 @@ function SmartDashboardRoute() {
           />
         </div>
 
-        <div className="mb-5">
-          <FocusableChart chartId="kpis">
-            <KPICards data={kpis} isLoading={dataLoading} />
-          </FocusableChart>
-        </div>
-
-        <div className="grid grid-cols-1 lg:grid-cols-[1fr_320px] gap-5 mb-5">
-          <div className="space-y-5">
-            <FocusableChart chartId="trips_over_time">
-              <TripChart
-                data={tripsOverTime}
-                highlights={highlights}
-                isLoading={dataLoading}
-              />
-            </FocusableChart>
-            <FocusableChart chartId="fare_distribution">
-              <FareChart data={fareDistribution} isLoading={dataLoading} />
+        {/* Everything below this ref is what gets captured for save_view. */}
+        <div ref={dashboardRef}>
+          <div className="mb-5">
+            <FocusableChart chartId="kpis">
+              <KPICards data={kpis} isLoading={dataLoading} />
             </FocusableChart>
           </div>
-          <div className="lg:h-[580px]">
-            <AgentSidebar kpis={kpis} kpisLoaded={!dataLoading} />
+
+          <div className="grid grid-cols-1 lg:grid-cols-[1fr_320px] gap-5 mb-5">
+            <div className="space-y-5">
+              <FocusableChart chartId="trips_over_time">
+                <TripChart
+                  data={tripsOverTime}
+                  highlights={highlights}
+                  isLoading={dataLoading}
+                />
+              </FocusableChart>
+              <FocusableChart chartId="fare_distribution">
+                <FareChart data={fareDistribution} isLoading={dataLoading} />
+              </FocusableChart>
+            </div>
+            <div className="lg:h-[580px]">
+              <AgentSidebar kpis={kpis} kpisLoaded={!dataLoading} />
+            </div>
           </div>
         </div>
 
-        <div className="space-y-4">
-          <QuerySection
-            onSend={dispatchToAgent}
-            content={content}
-            isLoading={agentLoading}
-          />
-          {pendingApprovals.map((approval) => (
-            <ApprovalCard
-              key={approval.approvalId}
-              approval={approval}
-              filters={filters}
-              highlights={highlights}
-              onDecide={decideApproval}
-            />
-          ))}
-        </div>
+        {/* Any approvals not pinned to a chat message (defensive fallback). */}
+        {looseApprovals.length > 0 && (
+          <div className="space-y-3">
+            {looseApprovals.map((approval) => (
+              <ApprovalCard
+                key={approval.approvalId}
+                approval={approval}
+                filters={filters}
+                highlights={highlights}
+                dashboardRef={dashboardRef}
+                onDecide={decideApproval}
+                onSaved={handleSavedNotification}
+              />
+            ))}
+          </div>
+        )}
       </div>
 
       <InspectorToggle />
       <StreamInspector />
       <ActionToast message={lastAction} />
+
+      <ChatDrawer
+        messages={messages}
+        isLoading={agentLoading}
+        onSend={dispatchToAgent}
+        approvalCardForMessage={approvalCardForMessage}
+        pendingApprovals={pendingApprovals}
+        unreadCount={pendingApprovals.length}
+      />
     </div>
   );
 }
diff --git a/apps/dev-playground/config/agents/query/agent.md b/apps/dev-playground/config/agents/query/agent.md
index c60fa0d16..d32c74331 100644
--- a/apps/dev-playground/config/agents/query/agent.md
+++ b/apps/dev-playground/config/agents/query/agent.md
@@ -16,9 +16,12 @@ fit.
   questions ("how many trips last Friday?", "top 5 pickup zones by revenue").
   Use for any analytical query that requires reading the database.
 - `agent-dashboard_pilot` — manipulates the dashboard UI directly: applies
-  filters, highlights time ranges, scrolls the user to a specific chart.
-  Use when the user says "show me…", "filter to…", "highlight…", "focus
-  on…".
+  or clears filters, highlights or clears time ranges, focuses a specific
+  chart, and saves the current configuration as a named view. Use when
+  the user says "show me…", "filter to…", "highlight…", "focus on…",
+  "clear…", "save…", or any request to modify the dashboard's visual
+  state. Do not answer these yourself — always delegate to the pilot
+  even if you think you lack the tool.
 
 Always explain briefly what you did after a specialist returns. Keep your
 own responses short; the specialists do the heavy lifting.
diff --git a/apps/dev-playground/server/index.ts b/apps/dev-playground/server/index.ts
index 2bb8c3a6a..498f6e47a 100644
--- a/apps/dev-playground/server/index.ts
+++ b/apps/dev-playground/server/index.ts
@@ -8,7 +8,6 @@ import {
   files,
   fromPlugin,
   genie,
-  jobs,
   PolicyDeniedError,
   server,
   serving,
@@ -178,6 +177,42 @@ const clear_highlights = tool({
   execute: async () => "All highlights cleared.",
 });
 
+// Restores a previously saved view. The tool-call arguments are the
+// authoritative state: the client listens for this function_call on SSE
+// and applies the filters + highlights directly without needing a round
+// trip back for metadata. The agent is expected to have looked up the
+// saved view server-side before emitting this call (it passes the
+// already-resolved state through).
+const load_view = tool({
+  name: "load_view",
+  description:
+    "Restore a previously saved dashboard view by applying its filters and highlights. The caller supplies the already-resolved state so the client can apply it from this tool call without a second round trip.",
+  schema: z.object({
+    name: z.string().describe("The saved view's name (for UI feedback)"),
+    filters: z
+      .object({
+        date_from: z.string().optional(),
+        date_to: z.string().optional(),
+        pickup_zip: z.string().optional(),
+        fare_min: z.string().optional(),
+        fare_max: z.string().optional(),
+      })
+      .passthrough()
+      .describe("Filters to restore. Omit fields that should not be set."),
+    highlights: z
+      .array(
+        z.object({
+          start: z.string(),
+          end: z.string(),
+          color: z.enum(["blue", "red", "yellow"]).optional(),
+          label: z.string().optional(),
+        }),
+      )
+      .describe("Highlight ranges to restore."),
+  }),
+  execute: async ({ name }) => `Restored saved view "${name}".`,
+});
+
 const focus_chart = tool({
   name: "focus_chart",
   description:
@@ -240,6 +275,7 @@ const dashboard_pilot = createAgent({
     "Focus & save:",
     "- `focus_chart({chart_id})` — scroll the viewport to `kpis`, `trips_over_time`, or `fare_distribution` and briefly pulse it.",
     "- `save_view({name, description?})` — persist the current configuration. Destructive; the user will see an approval card.",
+    "- `load_view({name, filters, highlights})` — restore a previously saved view. Always pass the resolved state; never leave fields unset.",
     "Rules:",
     "1. Pick the single tool that matches the user's intent. Do not chain filters unless the user asks for a compound filter.",
     "2. Briefly state what you did after the tool returns. Do not narrate before calling the tool.",
@@ -254,12 +290,13 @@ const dashboard_pilot = createAgent({
     clear_highlights,
     focus_chart,
     save_view,
+    load_view,
   },
 });
 
 createApp({
   plugins: [
-    server(),
+    server({ autoStart: false }),
     reconnect(),
     telemetryExamples(),
     analytics({}),
@@ -269,6 +306,10 @@ createApp({
     lakebaseExamples(),
     files({
       volumes: {
+        // Smart Dashboard saved views land here. Backed by
+        // DATABRICKS_VOLUME_FILES (see app.yaml / .env). Open policy for
+        // the demo — production apps should narrow this.
+        files: { policy: files.policy.allowAll() },
         // baseline: everything allowed
         allow_all: { policy: files.policy.allowAll() },
         // read-only: uploads/mkdir/delete return 403
@@ -290,7 +331,6 @@ createApp({
         implicit: {},
       },
     }),
-    jobs(),
     serving(),
     agents({
       agents: { helper, sql_analyst, dashboard_pilot },
@@ -311,8 +351,9 @@ createApp({
     // }),
   ],
   ...(process.env.APPKIT_E2E_TEST && { client: createMockClient() }),
-  onPluginsReady(appkit) {
-    appkit.server.extend((app) => {
+}).then((appkit) => {
+  appkit.server
+    .extend((app) => {
       app.get("/sp", (_req, res) => {
         appkit.analytics
           .query("SELECT * FROM samples.nyctaxi.trips;")
@@ -410,9 +451,203 @@ createApp({
           results,
         });
       });
-    });
-  },
-}).catch(console.error);
+
+      /**
+       * Smart-Dashboard saved-view storage.
+       *
+       * Writes a PNG snapshot of the dashboard plus a sidecar JSON of the
+       * filter/highlight state into the `files` volume
+       * (`DATABRICKS_VOLUME_FILES` — `/Volumes/<catalog>/<schema>/...`).
+       * Body is JSON with a base64-encoded PNG so we avoid adding a
+       * multipart library just for this route. The ~33% size overhead is
+       * fine for demo payloads.
+       *
+       * This endpoint is only reachable AFTER the `save_view` approval
+       * gate has resolved client-side — the agent's text confirmation
+       * depends on the client first uploading the screenshot, then POSTing
+       * the approval.
+       */
+      app.post("/api/dashboard/save-view", async (req, res) => {
+        const body = req.body as {
+          name?: string;
+          description?: string;
+          filters?: Record<string, unknown>;
+          highlights?: unknown[];
+          pngBase64?: string;
+        } | null;
+
+        if (
+          !body?.name ||
+          typeof body.name !== "string" ||
+          !body.pngBase64 ||
+          typeof body.pngBase64 !== "string"
+        ) {
+          res
+            .status(400)
+            .json({ error: "Missing required fields: name, pngBase64." });
+          return;
+        }
+
+        const slug = toSlug(body.name);
+        const timestamp = new Date().toISOString().replace(/[:.]/g, "-");
+        const baseName = `saved-views/${timestamp}_${slug}`;
+        const pngPath = `${baseName}.png`;
+        const metaPath = `${baseName}.json`;
+
+        const pngBytes = decodeDataUrlOrBase64(body.pngBase64);
+        if (!pngBytes) {
+          res.status(400).json({ error: "pngBase64 is not valid base64." });
+          return;
+        }
+
+        const metadata = {
+          name: body.name,
+          description: body.description ?? null,
+          filters: body.filters ?? {},
+          highlights: body.highlights ?? [],
+          savedAt: new Date().toISOString(),
+          savedBy: req.header("x-forwarded-user") ?? "unknown",
+          pngPath,
+        };
+
+        try {
+          const volume = appkit.files("files").asUser(req);
+          await volume.upload(pngPath, pngBytes, { overwrite: true });
+          await volume.upload(
+            metaPath,
+            Buffer.from(JSON.stringify(metadata, null, 2), "utf8"),
+            { overwrite: true },
+          );
+          res.json({
+            volumePath: pngPath,
+            metaPath,
+            bytes: pngBytes.length,
+            metadata,
+          });
+        } catch (err) {
+          console.error("[save-view] upload failed:", err);
+          const msg = err instanceof Error ? err.message : String(err);
+          res.status(500).json({ error: `Upload failed: ${msg}` });
+        }
+      });
+
+      /**
+       * Lists saved views in the `files` volume.
+       *
+       * Pairs the `.png` and `.json` entries into a single record per
+       * saved view; skips any `.png` or `.json` without its counterpart,
+       * and any view whose metadata sidecar fails to read or parse.
+       */
+      app.get("/api/dashboard/saved-views", async (req, res) => {
+        try {
+          const volume = appkit.files("files").asUser(req);
+          const entries = await volume.list("saved-views");
+          const pngs = new Map<string, (typeof entries)[number]>();
+          const metas = new Map<string, (typeof entries)[number]>();
+          for (const e of entries) {
+            if (e.path.endsWith(".png")) {
+              pngs.set(e.path.replace(/\.png$/, ""), e);
+            } else if (e.path.endsWith(".json")) {
+              metas.set(e.path.replace(/\.json$/, ""), e);
+            }
+          }
+          const views = await Promise.all(
+            Array.from(pngs.entries())
+              .filter(([base]) => metas.has(base))
+              .sort(([a], [b]) => (a < b ? 1 : -1))
+              .map(async ([base, pngEntry]) => {
+                try {
+                  const metaText = await volume.read(`${base}.json`);
+                  const metaJson =
+                    typeof metaText === "string"
+                      ? metaText
+                      : new TextDecoder().decode(metaText);
+                  const parsed = JSON.parse(metaJson) as Record<
+                    string,
+                    unknown
+                  >;
+                  return {
+                    pngPath: pngEntry.path,
+                    metaPath: `${base}.json`,
+                    metadata: parsed,
+                  };
+                } catch {
+                  return null;
+                }
+              }),
+          );
+          res.json({ views: views.filter((v) => v !== null) });
+        } catch (err) {
+          console.error("[saved-views] list failed:", err);
+          const msg = err instanceof Error ? err.message : String(err);
+          res.status(500).json({ error: msg });
+        }
+      });
+
+      /**
+       * Streams the PNG bytes of a saved view so `<img src>` tags in the
+       * UI can render thumbnails without exposing a general-purpose file
+       * download endpoint. Path is the volume-relative key returned by
+       * /api/dashboard/saved-views.
+       */
+      app.get("/api/dashboard/saved-view-png", async (req, res) => {
+        const path = req.query.path;
+        if (typeof path !== "string" || !path.endsWith(".png")) {
+          res
+            .status(400)
+            .json({ error: "path query param required, .png only" });
+          return;
+        }
+        try {
+          const volume = appkit.files("files").asUser(req);
+          const contents = await volume.download(path);
+          res.setHeader("Content-Type", "image/png");
+          res.setHeader("Cache-Control", "private, max-age=60");
+          if (contents instanceof Uint8Array || Buffer.isBuffer(contents)) {
+            res.end(contents);
+          } else if (typeof contents === "string") {
+            res.end(contents);
+          } else {
+            // ReadableStream fallback
+            const reader = (contents as ReadableStream<Uint8Array>).getReader();
+            const chunks: Uint8Array[] = [];
+            while (true) {
+              const { done, value } = await reader.read();
+              if (done) break;
+              if (value) chunks.push(value);
+            }
+            res.end(Buffer.concat(chunks));
+          }
+        } catch (err) {
+          console.error("[saved-view-png] fetch failed:", err);
+          const msg = err instanceof Error ? err.message : String(err);
+          res.status(404).json({ error: msg });
+        }
+      });
+    })
+    .start();
+});
+
+function toSlug(s: string): string {
+  return (
+    s
+      .toLowerCase()
+      .replace(/[^a-z0-9-]+/g, "-")
+      .replace(/^-+|-+$/g, "")
+      .slice(0, 60) || "view"
+  );
+}
+
+function decodeDataUrlOrBase64(input: string): Buffer | null {
+  const stripped = input.startsWith("data:")
+    ? input.substring(input.indexOf(",") + 1)
+    : input;
+  try {
+    return Buffer.from(stripped, "base64");
+  } catch {
+    return null;
+  }
+}
 
 type ProbeResult = {
   volume: string;

From 63a19d166dccf9d24ae43949e7593df638d9b61a Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 14:29:47 +0200
Subject: [PATCH 26/46] fix(playground): treat missing saved-views dir as empty
 list, not 500

Fresh UC volumes don't have a saved-views/ subdirectory until the first
save; the SDK throws FILES_API_DIRECTORY_IS_NOT_FOUND on list. The
route was propagating that as a 500 which rendered as a red error
banner in the SavedViewsPanel on first load.

Catch the error explicitly and return { views: [] } so the panel renders
its 'no saved views yet' empty state cleanly. Uploads still work the
first time because the SDK auto-creates parent dirs on upload.
---
 apps/dev-playground/server/index.ts | 30 ++++++++++++++++++++++++++++-
 1 file changed, 29 insertions(+), 1 deletion(-)

diff --git a/apps/dev-playground/server/index.ts b/apps/dev-playground/server/index.ts
index 498f6e47a..b1acbf088 100644
--- a/apps/dev-playground/server/index.ts
+++ b/apps/dev-playground/server/index.ts
@@ -541,7 +541,19 @@ createApp({
       app.get("/api/dashboard/saved-views", async (req, res) => {
         try {
           const volume = appkit.files("files").asUser(req);
-          const entries = await volume.list("saved-views");
+          let entries: Awaited<ReturnType<typeof volume.list>>;
+          try {
+            entries = await volume.list("saved-views");
+          } catch (err) {
+            // Fresh volume — the `saved-views/` subdirectory only exists
+            // after the first save. Treat "not found" as an empty list so
+            // the panel renders cleanly instead of showing a 500.
+            if (isNotFoundError(err)) {
+              res.json({ views: [] });
+              return;
+            }
+            throw err;
+          }
           const pngs = new Map<string, (typeof entries)[number]>();
           const metas = new Map<string, (typeof entries)[number]>();
           for (const e of entries) {
@@ -628,6 +640,22 @@ createApp({
     .start();
 });
 
+/**
+ * Heuristic match for Databricks Files API's "directory not found" error.
+ * The SDK surfaces it as a wrapped Error whose message contains the
+ * `FILES_API_DIRECTORY_IS_NOT_FOUND` reason + `NOT_FOUND` error code.
+ * Happy to be more specific if the SDK exposes a typed error class later.
+ */
+function isNotFoundError(err: unknown): boolean {
+  if (!(err instanceof Error)) return false;
+  const msg = err.message;
+  return (
+    msg.includes("FILES_API_DIRECTORY_IS_NOT_FOUND") ||
+    msg.includes("directory being accessed is not found") ||
+    /\bNOT_FOUND\b/.test(msg)
+  );
+}
+
 function toSlug(s: string): string {
   return (
     s

From 014e5290751f361af825df08f078bef974e73f84 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Mon, 4 May 2026 19:52:08 +0200
Subject: [PATCH 27/46] fix(appkit): forward all sub-agent events except
 metadata

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 apps/dev-playground/config/agents/query/agent.md | 13 +++++++++++--
 1 file changed, 11 insertions(+), 2 deletions(-)

diff --git a/apps/dev-playground/config/agents/query/agent.md b/apps/dev-playground/config/agents/query/agent.md
index d32c74331..6f13584ad 100644
--- a/apps/dev-playground/config/agents/query/agent.md
+++ b/apps/dev-playground/config/agents/query/agent.md
@@ -23,5 +23,14 @@ fit.
   state. Do not answer these yourself — always delegate to the pilot
   even if you think you lack the tool.
 
-Always explain briefly what you did after a specialist returns. Keep your
-own responses short; the specialists do the heavy lifting.
+The specialists stream their own confirmation text back to the user
+while they work — their text is already visible in the chat by the time
+they return. **Do not echo or restate what they said.** Only speak
+yourself when you need to:
+
+- Route a request (one short sentence: "Handing this to the pilot…").
+- Combine results from multiple specialists.
+- Add context the user needs that the specialist didn't cover.
+
+If the specialist's response already answers the user, say nothing and
+let their text stand.

From 6879ecec387082cf09e11d1ed82d3f049fd9089a Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 16:22:33 +0200
Subject: [PATCH 28/46] fix(playground): use html2canvas-pro to support oklch()
 colors

html2canvas 1.x throws on `oklch()` color values, which Tailwind v4 emits
everywhere in computed styles. Swap to the maintained html2canvas-pro
fork (drop-in API) so dashboard captures render without
"Attempting to parse an unsupported color function 'oklch'" errors in
the approval card. Keeps html2canvas pinned so types still resolve.
---
 apps/dev-playground/client/package-lock.json     | 16 +++++++++++++++-
 apps/dev-playground/client/package.json          |  3 ++-
 .../smart-dashboard/components/approval-card.tsx |  3 ++-
 .../smart-dashboard/lib/capture-dashboard.ts     | 11 +++++++----
 4 files changed, 26 insertions(+), 7 deletions(-)

diff --git a/apps/dev-playground/client/package-lock.json b/apps/dev-playground/client/package-lock.json
index fb7e267b5..7a34b5b28 100644
--- a/apps/dev-playground/client/package-lock.json
+++ b/apps/dev-playground/client/package-lock.json
@@ -18,7 +18,8 @@
         "@tanstack/router-plugin": "1.133.22",
         "class-variance-authority": "0.7.1",
         "clsx": "2.1.1",
-        "html2canvas": "^1.4.1",
+        "html2canvas": "1.4.1",
+        "html2canvas-pro": "2.0.2",
         "lucide-react": "0.546.0",
         "react": "19.2.0",
         "react-dom": "19.2.0",
@@ -4743,6 +4744,19 @@
         "node": ">=8.0.0"
       }
     },
+    "node_modules/html2canvas-pro": {
+      "version": "2.0.2",
+      "resolved": "https://npm-proxy.dev.databricks.com/html2canvas-pro/-/html2canvas-pro-2.0.2.tgz",
+      "integrity": "sha512-9G/t0XgCZWonLwL0JwI7su6NdbOPUY7Ur4Ihpp8+XMaW9ibA2nDXF181Jr6tm94k8lX6sthpaXB3XqEnsMd5Cw==",
+      "license": "MIT",
+      "dependencies": {
+        "css-line-break": "^2.1.0",
+        "text-segmentation": "^1.0.3"
+      },
+      "engines": {
+        "node": ">=16.0.0"
+      }
+    },
     "node_modules/ignore": {
       "version": "5.3.2",
       "resolved": "https://registry.npmjs.org/ignore/-/ignore-5.3.2.tgz",
diff --git a/apps/dev-playground/client/package.json b/apps/dev-playground/client/package.json
index 98ea9f00c..e69a49a3c 100644
--- a/apps/dev-playground/client/package.json
+++ b/apps/dev-playground/client/package.json
@@ -20,7 +20,8 @@
     "@tanstack/router-plugin": "1.133.22",
     "class-variance-authority": "0.7.1",
     "clsx": "2.1.1",
-    "html2canvas": "^1.4.1",
+    "html2canvas": "1.4.1",
+    "html2canvas-pro": "2.0.2",
     "lucide-react": "0.546.0",
     "react": "19.2.0",
     "react-dom": "19.2.0",
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx
index dcb55e3fd..06f5f6582 100644
--- a/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx
@@ -128,9 +128,10 @@ export function ApprovalCard({
       onSaved?.({ name, volumePath: uploadJson.volumePath });
       onDecide(approval.approvalId, "approve");
     } catch (err) {
+      const msg = err instanceof Error ? err.message : String(err);
       setPhase({
         kind: "error",
-        message: err instanceof Error ? err.message : String(err),
+        message: msg,
       });
     }
   }, [
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/lib/capture-dashboard.ts b/apps/dev-playground/client/src/features/smart-dashboard/lib/capture-dashboard.ts
index 90c892f91..a00f8799b 100644
--- a/apps/dev-playground/client/src/features/smart-dashboard/lib/capture-dashboard.ts
+++ b/apps/dev-playground/client/src/features/smart-dashboard/lib/capture-dashboard.ts
@@ -1,4 +1,4 @@
-import html2canvas from "html2canvas";
+import html2canvas from "html2canvas-pro";
 
 /**
  * Captures an element to a compressed JPEG data URL.
@@ -13,6 +13,10 @@ import html2canvas from "html2canvas";
  *
  * If the payload ever needs to grow (higher fidelity, larger viewports),
  * switch to a raw body route (`express.raw`) with an explicit larger limit.
+ *
+ * `html2canvas-pro` (drop-in fork of html2canvas) is required because
+ * Tailwind v4 emits `oklch()` colors throughout the computed styles of
+ * every node, which the original html2canvas 1.x cannot parse.
  */
 export async function captureDashboardAsDataUrl(
   el: HTMLElement,
@@ -20,13 +24,12 @@ export async function captureDashboardAsDataUrl(
 ): Promise<{ dataUrl: string; widthPx: number; heightPx: number }> {
   const quality = opts.quality ?? 0.85;
   const scale = opts.scale ?? 1;
+  const backgroundColor = readCssVar(el, "--background") ?? "#ffffff";
 
   const canvas = await html2canvas(el, {
-    backgroundColor: readCssVar(el, "--background") ?? "#ffffff",
+    backgroundColor,
     scale,
-    // Disable CORS image proxying — charts are same-origin SVG/canvas.
     useCORS: true,
-    // Don't taint; we only render DOM we own.
     allowTaint: false,
     logging: false,
   });

From af760e239398fb5e39e9506bf19cc34d25167e1d Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 16:22:45 +0200
Subject: [PATCH 29/46] fix(playground): unwrap DownloadResponse when serving
 saved-view PNGs

Databricks SDK `volume.download(path)` returns a wrapper
`{ contents: ReadableStream, "content-type": string }`, not the stream
itself. The previous handler tried to write the wrapper directly, which
produced an empty body and broke thumbnails in the saved-views panel.
Now we read `.contents`, drain the stream, and respond with the
server-reported content-type (falling back to `image/png`).

Also drops a couple of noisy console.logs left over from the debugging
session.
---
 apps/dev-playground/server/index.ts | 49 +++++++++++++++++------------
 1 file changed, 29 insertions(+), 20 deletions(-)

diff --git a/apps/dev-playground/server/index.ts b/apps/dev-playground/server/index.ts
index b1acbf088..37022f0bc 100644
--- a/apps/dev-playground/server/index.ts
+++ b/apps/dev-playground/server/index.ts
@@ -242,8 +242,6 @@ const save_view = tool({
   }),
   execute: async ({ name, description }) => {
     const suffix = description ? `: ${description}` : "";
-    // Stub for the demo. A real impl would insert into a views table.
-    console.log(`[save_view] Saving view "${name}"${suffix}`);
     return `Saved view "${name}"${suffix}.`;
   },
 });
@@ -525,7 +523,6 @@ createApp({
             metadata,
           });
         } catch (err) {
-          console.error("[save-view] upload failed:", err);
           const msg = err instanceof Error ? err.message : String(err);
           res.status(500).json({ error: `Upload failed: ${msg}` });
         }
@@ -612,24 +609,36 @@ createApp({
         }
         try {
           const volume = appkit.files("files").asUser(req);
-          const contents = await volume.download(path);
-          res.setHeader("Content-Type", "image/png");
-          res.setHeader("Cache-Control", "private, max-age=60");
-          if (contents instanceof Uint8Array || Buffer.isBuffer(contents)) {
-            res.end(contents);
-          } else if (typeof contents === "string") {
-            res.end(contents);
-          } else {
-            // ReadableStream fallback
-            const reader = (contents as ReadableStream<Uint8Array>).getReader();
-            const chunks: Uint8Array[] = [];
-            while (true) {
-              const { done, value } = await reader.read();
-              if (done) break;
-              if (value) chunks.push(value);
-            }
-            res.end(Buffer.concat(chunks));
+          /**
+           * Databricks `FilesAPI.download` returns a wrapper:
+           *   { contents: ReadableStream, "content-type": string, ... }
+           * NOT the stream itself. We must unwrap `.contents` and drain it
+           * before writing to the Express response. We use the server-reported
+           * content-type: our captures are JPEG under a `.png` key (historical).
+           */
+          const response = (await volume.download(path)) as unknown as {
+            contents?: ReadableStream<Uint8Array>;
+            "content-type"?: string;
+          };
+          const stream = response.contents;
+          if (!stream) {
+            res.status(404).json({ error: "empty download response" });
+            return;
+          }
+          const chunks: Uint8Array[] = [];
+          const reader = stream.getReader();
+          while (true) {
+            const { done, value } = await reader.read();
+            if (done) break;
+            if (value) chunks.push(value);
           }
+          const body = Buffer.concat(chunks);
+          res.setHeader(
+            "Content-Type",
+            response["content-type"] ?? "image/png",
+          );
+          res.setHeader("Cache-Control", "private, max-age=60");
+          res.end(body);
         } catch (err) {
           console.error("[saved-view-png] fetch failed:", err);
           const msg = err instanceof Error ? err.message : String(err);

From 887af6fc22daa4b7756acde860f4085e0717f812 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 16:22:58 +0200
Subject: [PATCH 30/46] fix(playground): apply saved view directly from
 metadata on thumbnail click

Clicking a saved-view thumbnail was sending a chat prompt like "Load the
saved view 'january'" and letting the agent reconstruct filters from the
view name. That dropped the highlights (agent had no tool to fetch the
stored metadata) so January-with-focus-on-week-1 came back as just
January-wide.

Since the client already holds the full authoritative metadata for the
clicked thumbnail, bypass the agent and apply `meta.filters` and
`meta.highlights` directly to local state, with a toast summarising
what was restored.

Also hardens the `appkit.approval_pending` handler: it now accepts
stream_id/tool_name in either snake_case or camelCase and checks that
approval_id and stream_id are non-empty strings (and tool_name is present)
before enqueuing, so a malformed event can't push a broken approval card.
---
 .../src/routes/smart-dashboard.route.tsx      | 109 +++++++++++++-----
 1 file changed, 82 insertions(+), 27 deletions(-)

diff --git a/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx b/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
index 050428b8e..eab0bf317 100644
--- a/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
+++ b/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
@@ -148,26 +148,36 @@ function SmartDashboardRoute() {
 
       // Capture pending approvals and pin them to the user turn that
       // triggered them so the ChatDrawer can render the card inline.
-      if (
-        event.type === "appkit.approval_pending" &&
-        event.approval_id &&
-        event.stream_id &&
-        event.tool_name
-      ) {
-        const pinnedToMessageId = lastUserMessageIdRef.current;
-        setPendingApprovals((prev) => [
-          ...prev,
-          {
-            approvalId: event.approval_id as string,
-            streamId: event.stream_id as string,
-            toolName: event.tool_name as string,
-            args: event.args,
-            annotations: event.annotations,
-            ...(pinnedToMessageId
-              ? { _pinnedToMessageId: pinnedToMessageId }
-              : {}),
-          } as PendingApproval & { _pinnedToMessageId?: string },
-        ]);
+      if (event.type === "appkit.approval_pending") {
+        const e = event as SSEEvent & {
+          streamId?: string;
+          toolName?: string;
+        };
+        const approvalId = e.approval_id;
+        const streamId = e.stream_id ?? e.streamId;
+        const toolName = e.tool_name ?? e.toolName;
+        if (
+          typeof approvalId === "string" &&
+          approvalId &&
+          toolName &&
+          typeof streamId === "string" &&
+          streamId
+        ) {
+          const pinnedToMessageId = lastUserMessageIdRef.current;
+          setPendingApprovals((prev) => [
+            ...prev,
+            {
+              approvalId,
+              streamId,
+              toolName,
+              args: e.args,
+              annotations: e.annotations,
+              ...(pinnedToMessageId
+                ? { _pinnedToMessageId: pinnedToMessageId }
+                : {}),
+            } as PendingApproval & { _pinnedToMessageId?: string },
+          ]);
+        }
       }
 
       // Stream assistant text into the in-progress assistant message.
@@ -223,13 +233,58 @@ function SmartDashboardRoute() {
     [send],
   );
 
-  const handleLoadSavedView = useCallback(
-    (view: SavedView) => {
-      const name = view.metadata.name ?? "saved view";
-      dispatchToAgent(`Load the saved view '${name}'`);
-    },
-    [dispatchToAgent],
-  );
+  /**
+   * Apply a saved view directly from its stored metadata. We don't round-trip
+   * through the agent here because the agent has no tool to fetch saved-view
+   * metadata — it would have to guess filters/highlights from the name alone.
+   * The client already holds the full authoritative state, so just apply it.
+   */
+  const handleLoadSavedView = useCallback((view: SavedView) => {
+    const meta = view.metadata;
+    const rawFilters = (meta.filters ?? {}) as Record<string, unknown>;
+    const nextFilters: DashboardFilters = {};
+    if (typeof rawFilters.date_from === "string")
+      nextFilters.date_from = rawFilters.date_from;
+    if (typeof rawFilters.date_to === "string")
+      nextFilters.date_to = rawFilters.date_to;
+    if (typeof rawFilters.pickup_zip === "string")
+      nextFilters.pickup_zip = rawFilters.pickup_zip;
+    if (typeof rawFilters.fare_min === "string")
+      nextFilters.fare_min = rawFilters.fare_min;
+    if (typeof rawFilters.fare_max === "string")
+      nextFilters.fare_max = rawFilters.fare_max;
+
+    const rawHighlights = Array.isArray(meta.highlights) ? meta.highlights : [];
+    const nextHighlights: Highlight[] = rawHighlights.flatMap((h) => {
+      if (typeof h !== "object" || h === null) return [];
+      const entry = h as Record<string, unknown>;
+      const start = entry.start;
+      const end = entry.end;
+      if (typeof start !== "string" || typeof end !== "string") return [];
+      const color: Highlight["color"] =
+        entry.color === "red" || entry.color === "yellow"
+          ? entry.color
+          : "blue";
+      const label = typeof entry.label === "string" ? entry.label : undefined;
+      return [{ start, end, color, label }];
+    });
+
+    setFilters(nextFilters);
+    setHighlights(nextHighlights);
+
+    const viewName = meta.name ?? "saved view";
+    const summary = [
+      Object.keys(nextFilters).length > 0
+        ? `${Object.keys(nextFilters).length} filter(s)`
+        : null,
+      nextHighlights.length > 0
+        ? `${nextHighlights.length} highlight(s)`
+        : null,
+    ]
+      .filter(Boolean)
+      .join(" + ");
+    setLastAction(`Loaded "${viewName}"${summary ? ` (${summary})` : ""}`);
+  }, []);
 
   const handleSavedNotification = useCallback(
     (info: { name: string; volumePath: string }) => {

From 912fbda1e43ca9d46009a911164868df025601c8 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 16:23:12 +0200
Subject: [PATCH 31/46] docs(appkit): regenerate typedoc for tool annotations

Picks up the new `annotations?: ToolAnnotations` field on `ToolConfig`
and `FunctionTool` introduced upstream in the annotations-propagation
fix.
---
 docs/docs/api/appkit/Interface.FunctionTool.md | 15 +++++++++++++++
 docs/docs/api/appkit/Interface.ToolConfig.md   | 15 +++++++++++++++
 2 files changed, 30 insertions(+)

diff --git a/docs/docs/api/appkit/Interface.FunctionTool.md b/docs/docs/api/appkit/Interface.FunctionTool.md
index c096dacac..499503060 100644
--- a/docs/docs/api/appkit/Interface.FunctionTool.md
+++ b/docs/docs/api/appkit/Interface.FunctionTool.md
@@ -2,6 +2,21 @@
 
 ## Properties
 
+### annotations?
+
+```ts
+optional annotations: ToolAnnotations;
+```
+
+Behavioural hints that drive the agents plugin's approval gate and the
+client's approval-card styling. Prefer setting `effect` (one of
+`"read" | "write" | "update" | "destructive"`) — any mutating value
+forces HITL approval before `execute()` runs. Legacy `destructive: true`
+is still honoured. Annotations must be preserved through `functionToolToDefinition`
+so the plugin sees them when building agent tool indexes.
+
+***
+
 ### description?
 
 ```ts
diff --git a/docs/docs/api/appkit/Interface.ToolConfig.md b/docs/docs/api/appkit/Interface.ToolConfig.md
index 48828a387..58855b4d4 100644
--- a/docs/docs/api/appkit/Interface.ToolConfig.md
+++ b/docs/docs/api/appkit/Interface.ToolConfig.md
@@ -8,6 +8,21 @@
 
 ## Properties
 
+### annotations?
+
+```ts
+optional annotations: ToolAnnotations;
+```
+
+Behavioural hints forwarded to the resolved tool definition. Prefer
+`effect` (`"read" | "write" | "update" | "destructive"`) — any mutating
+value forces the agents-plugin approval gate before `execute()` runs
+and the client's approval card will colour itself accordingly. Legacy
+`destructive: true` still gates. Before this field was added, annotations
+were silently dropped.
+
+***
+
 ### description?
 
 ```ts

From c888e300f19ad8271bf085cbe2f7f51fe65079a1 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 17:21:07 +0200
Subject: [PATCH 32/46] feat(playground): revamp smart dashboard with denser
 charts and actionable agent feed
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Reshapes the Smart Dashboard demo from a sparse 2-chart layout into a 2x2
chart grid with a right-rail agent feed, and turns the previously
read-only insights/anomaly cards into clickable actions that drive the
dashboard directly.

New visualisations:
- HourlyHeatmap: day-of-week × hour-of-day grid, click a cell to ask the
  agent to investigate that slot.
- TopZonesChart: hand-rolled horizontal bar leaderboard with click-to-
  filter and a `highlight_zone` ring driven by the agent.
- KPI sparklines: inline 7-day micro-charts with windowed trend deltas
  baked into each KPI card.

Agent feed becomes interactive:
- `feed-actions.ts` defines a structured action schema (filter_date,
  filter_zip, filter_fare, highlight_period, highlight_zone, focus_chart,
  ask) and a parser. The `insights` and `anomaly` ephemeral agents now
  emit JSON matching that schema.
- `ActionableCard` renders insights/anomalies with action chips that
  invoke `useActionDispatcher.dispatch` directly — same code path the
  SSE function-call handler uses, so UI clicks and agent tool calls
  behave identically.
- The feed re-runs (debounced) whenever filters or highlights change.

Server-side wiring:
- Adds `highlight_zone` and `clear_zone_highlights` tools.
- Extends the `focus_chart` enum with `hourly_heatmap` and `top_zones`.
- Updates `dashboard_pilot` instructions to prefer `highlight_zone` over
  `filter_by_pickup_zip` when calling out a single ZIP.
- Adds three SQL queries: `dashboard_hourly_heatmap`,
  `dashboard_top_zones`, `dashboard_kpi_sparklines`. The top-zones query
  casts `pickup_zip` (an INT in samples.nyctaxi.trips) to STRING so the
  client's highlight Map keys, the agent's `highlight_zone` arg, and the
  filter parameter all speak the same type.

Polish & defensive fixes:
- Defensive `Number()` coercion in `kpi-cards.tsx` for sparkline values
  so trend math doesn't render `NaN%` or string-concatenated revenue
  totals if a driver hands back DECIMAL-as-string.
- `Sparkline` reserves vertical space for intentionally-empty series
  (e.g. the categorical "Top Pickup Zone" KPI) instead of rendering a
  loading-style placeholder.
- 2x2 chart grid uses `items-start` + `auto-rows-min content-start` so
  the rail no longer stretches the chart column and creates dead space.
- `ChatDrawer` becomes a controlled component (`open` + `onOpenChange`)
  so any agent-triggering UI action can auto-open the chat — the user
  always sees the agent's response without manual disclosure.
---
 .../components/actionable-card.tsx            | 179 +++++++++++++
 .../components/agent-sidebar.tsx              | 252 ++++++++++++------
 .../components/chat-drawer.tsx                |  22 +-
 .../components/hourly-heatmap.tsx             | 186 +++++++++++++
 .../smart-dashboard/components/kpi-cards.tsx  | 201 +++++++++++++-
 .../components/top-zones-chart.tsx            | 164 ++++++++++++
 .../hooks/use-action-dispatcher.ts            | 134 ++++++----
 .../hooks/use-dashboard-data.ts               |  72 ++++-
 .../hooks/use-focus-registry.ts               |  22 +-
 .../smart-dashboard/lib/feed-actions.ts       | 206 ++++++++++++++
 .../src/routes/smart-dashboard.route.tsx      | 147 +++++++++-
 .../config/agents/anomaly/agent.md            |  30 ++-
 .../config/agents/insights/agent.md           |  31 ++-
 .../config/agents/query/agent.md              |  14 +-
 .../queries/dashboard_hourly_heatmap.sql      |  24 ++
 .../queries/dashboard_kpi_sparklines.sql      |  25 ++
 .../config/queries/dashboard_top_zones.sql    |  35 +++
 apps/dev-playground/server/index.ts           |  41 ++-
 .../shared/appkit-types/analytics.d.ts        |  77 ++++++
 19 files changed, 1692 insertions(+), 170 deletions(-)
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/components/actionable-card.tsx
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/components/hourly-heatmap.tsx
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/components/top-zones-chart.tsx
 create mode 100644 apps/dev-playground/client/src/features/smart-dashboard/lib/feed-actions.ts
 create mode 100644 apps/dev-playground/config/queries/dashboard_hourly_heatmap.sql
 create mode 100644 apps/dev-playground/config/queries/dashboard_kpi_sparklines.sql
 create mode 100644 apps/dev-playground/config/queries/dashboard_top_zones.sql

diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/actionable-card.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/actionable-card.tsx
new file mode 100644
index 000000000..41063defc
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/actionable-card.tsx
@@ -0,0 +1,179 @@
+import {
+  AlertTriangleIcon,
+  ArrowRightIcon,
+  CalendarIcon,
+  CrosshairIcon,
+  DollarSignIcon,
+  HighlighterIcon,
+  LightbulbIcon,
+  MapPinIcon,
+  MessageSquareIcon,
+} from "lucide-react";
+import type { FeedAction } from "../lib/feed-actions";
+
+type Variant = "insight" | "anomaly";
+type Severity = "low" | "medium" | "high";
+
+interface ActionableCardProps {
+  variant: Variant;
+  severity?: Severity;
+  title: string;
+  description: string;
+  actions: FeedAction[];
+  /** Fired for non-ask actions. Route applies them to dashboard state. */
+  onAction: (action: FeedAction) => void;
+  /** Fired for `ask` actions. Route forwards the prompt to the chat drawer. */
+  onAsk: (prompt: string) => void;
+}
+
+const INSIGHT_STYLES = {
+  border: "border-blue-200 dark:border-blue-900",
+  bg: "bg-blue-50/50 dark:bg-blue-950/30",
+  icon: "text-blue-500",
+};
+
+const ANOMALY_STYLES: Record<
+  Severity,
+  { border: string; bg: string; icon: string; badge: string }
+> = {
+  low: {
+    border: "border-yellow-200 dark:border-yellow-900",
+    bg: "bg-yellow-50/50 dark:bg-yellow-950/30",
+    icon: "text-yellow-500",
+    badge:
+      "bg-yellow-100 text-yellow-700 dark:bg-yellow-900/50 dark:text-yellow-400",
+  },
+  medium: {
+    border: "border-orange-200 dark:border-orange-900",
+    bg: "bg-orange-50/50 dark:bg-orange-950/30",
+    icon: "text-orange-500",
+    badge:
+      "bg-orange-100 text-orange-700 dark:bg-orange-900/50 dark:text-orange-400",
+  },
+  high: {
+    border: "border-red-200 dark:border-red-900",
+    bg: "bg-red-50/50 dark:bg-red-950/30",
+    icon: "text-red-500",
+    badge: "bg-red-100 text-red-700 dark:bg-red-900/50 dark:text-red-400",
+  },
+};
+
+function iconForAction(kind: FeedAction["kind"]): React.ReactNode {
+  const cls = "h-3 w-3";
+  switch (kind) {
+    case "filter_date":
+      return <CalendarIcon className={cls} />;
+    case "filter_zip":
+      return <MapPinIcon className={cls} />;
+    case "filter_fare":
+      return <DollarSignIcon className={cls} />;
+    case "highlight_period":
+      return <HighlighterIcon className={cls} />;
+    case "highlight_zone":
+      return <MapPinIcon className={cls} />;
+    case "focus_chart":
+      return <CrosshairIcon className={cls} />;
+    case "ask":
+      return <MessageSquareIcon className={cls} />;
+  }
+}
+
+/**
+ * Action chip for a single feed suggestion. The chip's visual weight depends
+ * on its kind: structural mutations (filter/highlight/focus) use the primary
+ * tint, `ask` uses a neutral outline so the user can tell "this opens the
+ * chat" from "this changes the dashboard" without reading the label.
+ */
+function ActionChip({
+  action,
+  onAction,
+  onAsk,
+}: {
+  action: FeedAction;
+  onAction: (a: FeedAction) => void;
+  onAsk: (prompt: string) => void;
+}) {
+  const isAsk = action.kind === "ask";
+  const isHighlight =
+    action.kind === "highlight_period" || action.kind === "highlight_zone";
+
+  return (
+    <button
+      type="button"
+      onClick={() => {
+        if (isAsk) onAsk(action.prompt);
+        else onAction(action);
+      }}
+      className={`inline-flex items-center gap-1 text-[11px] font-medium px-2 py-1 rounded-md transition-colors ${
+        isAsk
+          ? "border border-border bg-background text-foreground/80 hover:bg-muted hover:text-foreground"
+          : isHighlight
+            ? "bg-amber-100 text-amber-800 hover:bg-amber-200 dark:bg-amber-900/40 dark:text-amber-200 dark:hover:bg-amber-900/60"
+            : "bg-primary/10 text-primary hover:bg-primary/20"
+      }`}
+    >
+      {iconForAction(action.kind)}
+      <span>{action.label}</span>
+      {isAsk && <ArrowRightIcon className="h-3 w-3 opacity-70" />}
+    </button>
+  );
+}
+
+export function ActionableCard({
+  variant,
+  severity,
+  title,
+  description,
+  actions,
+  onAction,
+  onAsk,
+}: ActionableCardProps) {
+  const isAnomaly = variant === "anomaly";
+  const styles = isAnomaly
+    ? ANOMALY_STYLES[severity ?? "low"]
+    : { ...INSIGHT_STYLES, badge: "" };
+
+  return (
+    <div className={`rounded-lg border ${styles.border} ${styles.bg} p-3`}>
+      <div className="flex items-start gap-2 mb-2">
+        {isAnomaly ? (
+          <AlertTriangleIcon
+            className={`h-4 w-4 ${styles.icon} mt-0.5 shrink-0`}
+          />
+        ) : (
+          <LightbulbIcon className={`h-4 w-4 ${styles.icon} mt-0.5 shrink-0`} />
+        )}
+        <div className="min-w-0 flex-1">
+          <div className="flex items-start gap-2">
+            <p className="text-sm font-medium text-foreground leading-tight flex-1">
+              {title}
+            </p>
+            {isAnomaly && severity && (
+              <span
+                className={`text-[10px] font-medium px-1.5 py-0.5 rounded shrink-0 ${styles.badge}`}
+              >
+                {severity}
+              </span>
+            )}
+          </div>
+          <p className="text-xs text-muted-foreground mt-1 leading-relaxed">
+            {description}
+          </p>
+        </div>
+      </div>
+
+      {actions.length > 0 && (
+        <div className="flex flex-wrap gap-1.5 pl-6">
+          {actions.map((action, i) => (
+            <ActionChip
+              key={`${action.kind}-${i}-${action.label}`}
+              action={action}
+              onAction={onAction}
+              onAsk={onAsk}
+            />
+          ))}
+        </div>
+      )}
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/agent-sidebar.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/agent-sidebar.tsx
index 1c3426f88..0c14b501c 100644
--- a/apps/dev-playground/client/src/features/smart-dashboard/components/agent-sidebar.tsx
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/agent-sidebar.tsx
@@ -1,79 +1,122 @@
 import { BrainIcon, Loader2Icon, RefreshCwIcon } from "lucide-react";
-import { useCallback, useEffect, useRef, useState } from "react";
+import { useCallback, useEffect, useMemo, useRef, useState } from "react";
+import type { Highlight } from "../hooks/use-action-dispatcher";
 import { useAgentStream } from "../hooks/use-agent-stream";
-import type { KPIData } from "../hooks/use-dashboard-data";
-import { AnomalyCard } from "./anomaly-card";
-import { InsightCard } from "./insight-card";
-
-interface Insight {
-  title: string;
-  description: string;
-}
-
-interface Anomaly {
-  title: string;
-  description: string;
-  severity: "low" | "medium" | "high";
-}
+import type { DashboardFilters, KPIData } from "../hooks/use-dashboard-data";
+import {
+  type FeedAction,
+  type FeedAnomaly,
+  type FeedInsight,
+  parseFeedAnomalies,
+  parseFeedInsights,
+} from "../lib/feed-actions";
+import { ActionableCard } from "./actionable-card";
 
 interface AgentSidebarProps {
   kpis: KPIData | null;
   kpisLoaded: boolean;
+  filters: DashboardFilters;
+  highlights: Highlight[];
+  /** Dispatches a structured action back to the dashboard without an LLM round-trip. */
+  onAction: (action: FeedAction) => void;
+  /** Fires when the user clicks an `ask` chip — routes to the main chat drawer. */
+  onAsk: (prompt: string) => void;
 }
 
-function parseAgentJSON<T>(content: string): T[] {
-  try {
-    const jsonMatch = content.match(/\[[\s\S]*\]/);
-    if (jsonMatch) {
-      return JSON.parse(jsonMatch[0]);
-    }
-  } catch {
-    /* skip */
+function buildKPISummary(
+  kpis: KPIData,
+  filters: DashboardFilters,
+  highlights: Highlight[],
+): string {
+  const parts = [
+    `Total trips: ${kpis.total_trips.toLocaleString()}`,
+    `Avg fare: $${kpis.avg_fare}`,
+    `Avg distance: ${kpis.avg_distance} mi`,
+    `Fare range: $${kpis.min_fare}–$${kpis.max_fare}`,
+    `Top pickup zone: ${kpis.top_pickup_zone} (${kpis.top_zone_trips.toLocaleString()} trips)`,
+  ];
+  const activeFilters = Object.entries(filters)
+    .filter(([, v]) => typeof v === "string" && v)
+    .map(([k, v]) => `${k}=${v}`);
+  if (activeFilters.length > 0) {
+    parts.push(`Active filters: ${activeFilters.join(", ")}`);
+  } else {
+    parts.push("Active filters: none (full 2016 dataset)");
   }
-  return [];
+  if (highlights.length > 0) {
+    parts.push(
+      `Highlights: ${highlights
+        .map(
+          (h) =>
+            `${h.start}→${h.end}${h.label ? ` (${h.label})` : ""} [${h.color}]`,
+        )
+        .join(", ")}`,
+    );
+  }
+  return parts.join(". ");
 }
 
-function buildKPISummary(kpis: KPIData): string {
-  return [
-    `Total trips: ${kpis.total_trips.toLocaleString()}`,
-    `Average fare: $${kpis.avg_fare}`,
-    `Average distance: ${kpis.avg_distance} miles`,
-    `Fare range: $${kpis.min_fare} - $${kpis.max_fare}`,
-    `Top pickup zone: ${kpis.top_pickup_zone} (${kpis.top_zone_trips.toLocaleString()} trips)`,
-  ].join(", ");
+/**
+ * Debounce helper so a rapid sequence of filter/highlight changes collapses
+ * into one ephemeral agent re-run. 700ms is short enough to feel responsive
+ * but long enough to coalesce a typical click+click interaction.
+ */
+function useDebouncedSignal(dep: string, delayMs: number): string {
+  const [stable, setStable] = useState(dep);
+  useEffect(() => {
+    const t = setTimeout(() => setStable(dep), delayMs);
+    return () => clearTimeout(t);
+  }, [dep, delayMs]);
+  return stable;
 }
 
-export function AgentSidebar({ kpis, kpisLoaded }: AgentSidebarProps) {
-  const [insights, setInsights] = useState<Insight[]>([]);
-  const [anomalies, setAnomalies] = useState<Anomaly[]>([]);
-  const hasFired = useRef(false);
+const SUGGESTED_FOLLOWUPS = [
+  "Compare this slice to the prior month.",
+  "What ZIPs show the highest fare-per-mile?",
+  "Were there any days with abnormal trip counts?",
+];
+
+export function AgentSidebar({
+  kpis,
+  kpisLoaded,
+  filters,
+  highlights,
+  onAction,
+  onAsk,
+}: AgentSidebarProps) {
+  const [insights, setInsights] = useState<FeedInsight[]>([]);
+  const [anomalies, setAnomalies] = useState<FeedAnomaly[]>([]);
 
   const insightsStream = useAgentStream({ agentName: "insights" });
   const anomalyStream = useAgentStream({ agentName: "anomaly" });
 
+  // Hold the latest stream handles + context refs so `analyze()` is stable
+  // but still reads current state.
   const insightsRef = useRef(insightsStream);
   insightsRef.current = insightsStream;
   const anomalyRef = useRef(anomalyStream);
   anomalyRef.current = anomalyStream;
-  const kpisRef = useRef(kpis);
-  kpisRef.current = kpis;
+  const ctxRef = useRef({ kpis, filters, highlights });
+  ctxRef.current = { kpis, filters, highlights };
 
   const analyze = useCallback(() => {
-    const currentKpis = kpisRef.current;
+    const { kpis: currentKpis, filters: f, highlights: h } = ctxRef.current;
     if (!currentKpis) return;
-    const summary = buildKPISummary(currentKpis);
+    const summary = buildKPISummary(currentKpis, f, h);
     setInsights([]);
     setAnomalies([]);
     insightsRef.current.reset();
     anomalyRef.current.reset();
     insightsRef.current.send(
-      `Here are the current taxi trip metrics: ${summary}. Analyze for interesting patterns and insights.`,
+      `Current NYC taxi dashboard state: ${summary}. Surface the most interesting patterns and insights with actionable chips.`,
     );
     anomalyRef.current.send(
-      `Here are the current taxi trip metrics: ${summary}. Check for anomalies, outliers, or unusual patterns.`,
+      `Current NYC taxi dashboard state: ${summary}. Identify anomalies, outliers, or suspicious patterns with actionable chips.`,
     );
   }, []);
 
+  // Initial fire once KPIs load.
+  const hasFired = useRef(false);
   useEffect(() => {
     if (kpisLoaded && kpis && !hasFired.current) {
       hasFired.current = true;
@@ -81,38 +124,71 @@ export function AgentSidebar({ kpis, kpisLoaded }: AgentSidebarProps) {
     }
   }, [kpisLoaded, kpis, analyze]);
 
+  // Re-run whenever filters or highlights settle into a new value. Encoded as
+  // a string so useEffect gets a primitive dep and the debounce works off
+  // structural equality, not object identity.
+  const stateSignal = useMemo(
+    () =>
+      JSON.stringify({
+        f: filters,
+        h: highlights.map((hh) => `${hh.start}-${hh.end}-${hh.color}`),
+      }),
+    [filters, highlights],
+  );
+  const debouncedSignal = useDebouncedSignal(stateSignal, 700);
+  const lastAnalyzedSignal = useRef(stateSignal);
+  useEffect(() => {
+    if (!kpisLoaded || !kpis) return;
+    if (!hasFired.current) return; // initial fire is in the other effect
+    if (debouncedSignal === lastAnalyzedSignal.current) return;
+    lastAnalyzedSignal.current = debouncedSignal;
+    analyze();
+  }, [debouncedSignal, kpisLoaded, kpis, analyze]);
+
   useEffect(() => {
     if (!insightsStream.isLoading && insightsStream.content) {
-      setInsights(parseAgentJSON<Insight>(insightsStream.content));
+      setInsights(parseFeedInsights(insightsStream.content));
     }
   }, [insightsStream.isLoading, insightsStream.content]);
 
   useEffect(() => {
     if (!anomalyStream.isLoading && anomalyStream.content) {
-      setAnomalies(parseAgentJSON<Anomaly>(anomalyStream.content));
+      setAnomalies(parseFeedAnomalies(anomalyStream.content));
     }
   }, [anomalyStream.isLoading, anomalyStream.content]);
 
   const isAnalyzing = insightsStream.isLoading || anomalyStream.isLoading;
+  const totalFindings = insights.length + anomalies.length;
 
   return (
     <div className="rounded-xl border border-border bg-card shadow-sm flex flex-col h-full">
       <div className="flex items-center justify-between px-4 py-3 border-b border-border">
-        <div className="flex items-center gap-2">
-          <BrainIcon className="h-4 w-4 text-primary" />
+        <div className="flex items-center gap-2 min-w-0">
+          <BrainIcon className="h-4 w-4 text-primary shrink-0" />
           <span className="text-sm font-semibold text-foreground">
             Agent Feed
           </span>
+          {isAnalyzing ? (
+            <span className="inline-flex items-center gap-1 text-[10px] font-medium text-primary bg-primary/10 px-1.5 py-0.5 rounded">
+              <Loader2Icon className="h-2.5 w-2.5 animate-spin" />
+              analyzing
+            </span>
+          ) : totalFindings > 0 ? (
+            <span className="text-[10px] font-medium text-muted-foreground bg-muted/60 px-1.5 py-0.5 rounded">
+              {insights.length}
+              <span className="text-muted-foreground/70"> insights · </span>
+              {anomalies.length}
+              <span className="text-muted-foreground/70"> anomalies</span>
+            </span>
+          ) : null}
         </div>
         <button
           type="button"
-          onClick={() => {
-            hasFired.current = false;
-            analyze();
-          }}
+          onClick={analyze}
           disabled={isAnalyzing}
           className="p-1.5 rounded-md hover:bg-muted text-muted-foreground hover:text-foreground transition-colors disabled:opacity-50"
           aria-label="Refresh analysis"
+          title="Re-run insights & anomaly agents"
         >
           <RefreshCwIcon
             className={`h-3.5 w-3.5 ${isAnalyzing ? "animate-spin" : ""}`}
@@ -121,48 +197,70 @@ export function AgentSidebar({ kpis, kpisLoaded }: AgentSidebarProps) {
       </div>
 
       <div className="flex-1 overflow-y-auto p-3 space-y-2.5">
-        {isAnalyzing && insights.length === 0 && anomalies.length === 0 && (
+        {isAnalyzing && totalFindings === 0 && (
           <div className="flex flex-col items-center justify-center py-8 text-muted-foreground">
             <Loader2Icon className="h-5 w-5 animate-spin mb-2" />
-            <p className="text-xs">Analyzing data...</p>
+            <p className="text-xs">Analyzing data…</p>
           </div>
         )}
 
-        {!isAnalyzing &&
-          insights.length === 0 &&
-          anomalies.length === 0 &&
-          !kpisLoaded && (
-            <p className="text-xs text-muted-foreground text-center py-8">
-              Loading dashboard data...
-            </p>
-          )}
-
-        {!isAnalyzing &&
-          insights.length === 0 &&
-          anomalies.length === 0 &&
-          kpisLoaded && (
-            <p className="text-xs text-muted-foreground text-center py-8">
-              Click refresh to analyze the data
-            </p>
-          )}
-
-        {insights.map((insight) => (
-          <InsightCard
-            key={`insight-${insight.title}`}
+        {!isAnalyzing && totalFindings === 0 && !kpisLoaded && (
+          <p className="text-xs text-muted-foreground text-center py-8">
+            Loading dashboard data…
+          </p>
+        )}
+
+        {!isAnalyzing && totalFindings === 0 && kpisLoaded && (
+          <p className="text-xs text-muted-foreground text-center py-8">
+            No findings for this slice — try widening the filters.
+          </p>
+        )}
+
+        {insights.map((insight, i) => (
+          <ActionableCard
+            key={`insight-${i}-${insight.title}`}
+            variant="insight"
             title={insight.title}
             description={insight.description}
+            actions={insight.actions ?? []}
+            onAction={onAction}
+            onAsk={onAsk}
           />
         ))}
 
-        {anomalies.map((anomaly) => (
-          <AnomalyCard
-            key={`anomaly-${anomaly.title}`}
+        {anomalies.map((anomaly, i) => (
+          <ActionableCard
+            key={`anomaly-${i}-${anomaly.title}`}
+            variant="anomaly"
+            severity={anomaly.severity}
             title={anomaly.title}
             description={anomaly.description}
-            severity={anomaly.severity}
+            actions={anomaly.actions ?? []}
+            onAction={onAction}
+            onAsk={onAsk}
           />
         ))}
       </div>
+
+      {kpisLoaded && (
+        <div className="border-t border-border px-3 py-2.5">
+          <p className="text-[10px] font-medium text-muted-foreground uppercase tracking-wide mb-1.5">
+            Try asking
+          </p>
+          <div className="flex flex-wrap gap-1.5">
+            {SUGGESTED_FOLLOWUPS.map((prompt) => (
+              <button
+                key={prompt}
+                type="button"
+                onClick={() => onAsk(prompt)}
+                className="text-[11px] px-2 py-1 rounded-md border border-border bg-background hover:bg-muted text-foreground/80 hover:text-foreground transition-colors"
+              >
+                {prompt}
+              </button>
+            ))}
+          </div>
+        </div>
+      )}
     </div>
   );
 }
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/chat-drawer.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/chat-drawer.tsx
index 0a37523a2..4c5196489 100644
--- a/apps/dev-playground/client/src/features/smart-dashboard/components/chat-drawer.tsx
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/chat-drawer.tsx
@@ -26,6 +26,11 @@ interface ChatDrawerProps {
   pendingApprovals: PendingApproval[];
   /** Floating affordance: the toggle button also shows a pending-approval dot. */
   unreadCount?: number;
+  /** Controlled open state so the parent can auto-open the drawer when a
+   *  dashboard interaction (chips, heatmap cells, quick actions, follow-ups)
+   *  dispatches a turn the user needs to see. */
+  open: boolean;
+  onOpenChange: (open: boolean) => void;
 }
 
 const EXAMPLE_QUERIES = [
@@ -49,8 +54,9 @@ export function ChatDrawer({
   approvalCardForMessage,
   pendingApprovals,
   unreadCount,
+  open,
+  onOpenChange,
 }: ChatDrawerProps) {
-  const [open, setOpen] = useState(false);
   const [input, setInput] = useState("");
   const [showTips, setShowTips] = useState(true);
   const bottomRef = useRef<HTMLDivElement>(null);
@@ -64,21 +70,21 @@ export function ChatDrawer({
         !e.shiftKey
       ) {
         e.preventDefault();
-        setOpen((v) => !v);
+        onOpenChange(!open);
       } else if (e.key === "Escape" && open) {
-        setOpen(false);
+        onOpenChange(false);
       }
     };
     window.addEventListener("keydown", onKey);
     return () => {
       window.removeEventListener("keydown", onKey);
     };
-  }, [open]);
+  }, [open, onOpenChange]);
 
   // Auto-open when a new approval arrives so users don't miss it.
   useEffect(() => {
-    if (pendingApprovals.length > 0) setOpen(true);
-  }, [pendingApprovals.length]);
+    if (pendingApprovals.length > 0) onOpenChange(true);
+  }, [pendingApprovals.length, onOpenChange]);
 
   // biome-ignore lint/correctness/useExhaustiveDependencies: scroll on new messages
   useEffect(() => {
@@ -110,7 +116,7 @@ export function ChatDrawer({
     <>
       <button
         type="button"
-        onClick={() => setOpen((v) => !v)}
+        onClick={() => onOpenChange(!open)}
         aria-label="Toggle chat (⌘J)"
         title="Chat with the agent (⌘J)"
         className="fixed bottom-4 right-20 z-30 rounded-full bg-primary text-primary-foreground shadow-lg hover:bg-primary/90 transition-colors p-3 flex items-center gap-1.5"
@@ -138,7 +144,7 @@ export function ChatDrawer({
             </div>
             <button
               type="button"
-              onClick={() => setOpen(false)}
+              onClick={() => onOpenChange(false)}
               className="p-1 rounded-md hover:bg-muted text-muted-foreground hover:text-foreground transition-colors"
               aria-label="Close chat"
             >
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/hourly-heatmap.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/hourly-heatmap.tsx
new file mode 100644
index 000000000..51ce98ed8
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/hourly-heatmap.tsx
@@ -0,0 +1,186 @@
+import { useMemo } from "react";
+import type { HeatmapCell } from "../hooks/use-dashboard-data";
+
+interface HourlyHeatmapProps {
+  data: HeatmapCell[]; // rows keyed by (day_of_week, hour_of_day); missing slots render as empty tiles
+  isLoading: boolean; // true → the component renders a skeleton instead of the grid
+  /** Fires when the user clicks a non-empty cell. Receives a human-readable slot
+   *  label that the route typically forwards to `dispatchToAgent` to narrate. */
+  onCellClick?: (label: string, cell: HeatmapCell) => void;
+}
+
+// Spark's DAYOFWEEK returns 1..7 (Sunday=1, Saturday=7). The grid renders
+// Monday-first (Mon–Sun), so Sunday's number 1 appears last in this list.
+const DAY_ROW_ORDER: Array<{ label: string; dayOfWeek: number }> = [
+  { label: "Mon", dayOfWeek: 2 },
+  { label: "Tue", dayOfWeek: 3 },
+  { label: "Wed", dayOfWeek: 4 },
+  { label: "Thu", dayOfWeek: 5 },
+  { label: "Fri", dayOfWeek: 6 },
+  { label: "Sat", dayOfWeek: 7 },
+  { label: "Sun", dayOfWeek: 1 },
+];
+
+const FULL_DAY_LABEL: Record<number, string> = { // long day names, keyed by the same 1..7 numbering
+  1: "Sunday",
+  2: "Monday",
+  3: "Tuesday",
+  4: "Wednesday",
+  5: "Thursday",
+  6: "Friday",
+  7: "Saturday",
+};
+
+const HOURS = Array.from({ length: 24 }, (_, i) => i); // 0..23, one grid column per hour
+
+function formatHour(h: number): string {
+  // Midnight and noon both read as 12 on a 12-hour clock.
+  if (h === 0 || h === 12) return h === 0 ? "12a" : "12p";
+  const isMorning = h < 12;
+  return isMorning ? `${h}a` : `${h - 12}p`;
+}
+
+/**
+ * Picks the HSL fill for one heatmap cell from its trip count relative to the
+ * grid maximum. Intensity is expressed through lightness (not alpha) so tiles
+ * stay readable in light and dark themes alike. A zero count, or an all-zero
+ * grid, yields a flat muted tile so the matrix shape is still visible.
+ */
+function cellColor(value: number, max: number, isDark: boolean): string {
+  const isEmpty = max === 0 || value === 0;
+  if (isEmpty && isDark) return "hsl(215, 14%, 22%)";
+  if (isEmpty) return "hsl(220, 13%, 94%)";
+  // Clamp so values above `max` saturate at the hottest shade.
+  const ratio = Math.min(1, value / max);
+  // Dark theme brightens with intensity (18% → 60%); light theme darkens
+  // with intensity (90% → 40%).
+  return isDark
+    ? `hsl(217, 80%, ${18 + ratio * 42}%)`
+    : `hsl(221, 83%, ${90 - ratio * 50}%)`;
+}
+
+function isDarkTheme(): boolean {
+  const hasDom = typeof document !== "undefined"; // no DOM → report light theme
+  return hasDom && document.documentElement.classList.contains("dark");
+}
+
+export function HourlyHeatmap({ // day × hour grid of trip counts; each non-empty cell is a clickable button
+  data,
+  isLoading,
+  onCellClick,
+}: HourlyHeatmapProps) {
+  const dark = isDarkTheme(); // sampled on every render; there is no subscription to theme changes
+
+  const { cellByKey, maxCount } = useMemo(() => { // index cells by "day-hour" and find the peak trip count
+    const map = new Map<string, HeatmapCell>();
+    let max = 0;
+    for (const c of data) {
+      map.set(`${c.day_of_week}-${c.hour_of_day}`, c); // a later row for the same slot overwrites the earlier one
+      if (c.trip_count > max) max = c.trip_count;
+    }
+    return { cellByKey: map, maxCount: max };
+  }, [data]);
+
+  if (isLoading) { // skeleton placeholder with the same card chrome as the real chart
+    return (
+      <div className="rounded-xl border border-border bg-card p-5 shadow-sm">
+        <h3 className="text-sm font-medium text-muted-foreground mb-4">
+          Pickup Heatmap
+        </h3>
+        <div className="h-[260px] animate-pulse rounded bg-muted" />
+      </div>
+    );
+  }
+
+  return (
+    <div className="rounded-xl border border-border bg-card p-5 shadow-sm">
+      <div className="flex items-center justify-between mb-4">
+        <h3 className="text-sm font-medium text-muted-foreground">
+          Pickup Heatmap
+          <span className="ml-2 text-xs text-muted-foreground/70 font-normal">
+            day × hour
+          </span>
+        </h3>
+        <span className="text-[10px] text-muted-foreground/70">
+          click a cell to investigate
+        </span>
+      </div>
+
+      <div className="overflow-x-auto">
+        <div
+          className="grid gap-[2px] text-[10px] text-muted-foreground"
+          style={{
+            gridTemplateColumns: "28px repeat(24, minmax(18px, 1fr))",
+          }}
+        >
+          <div />
+          {HOURS.map((h) => (
+            <div
+              key={`h-${h}`}
+              className="text-center leading-none h-4 flex items-center justify-center"
+            >
+              {h % 3 === 0 ? formatHour(h) : ""}
+            </div>
+          ))}
+
+          {DAY_ROW_ORDER.map((row) => (
+            <div key={`row-${row.dayOfWeek}`} className="contents">
+              <div className="h-6 flex items-center pr-1 justify-end font-medium">
+                {row.label}
+              </div>
+              {HOURS.map((h) => {
+                const cell = cellByKey.get(`${row.dayOfWeek}-${h}`); // undefined when the slot has no row in `data`
+                const count = cell?.trip_count ?? 0; // slots without a row count as zero trips
+                const bg = cellColor(count, maxCount, dark);
+                const label = `${FULL_DAY_LABEL[row.dayOfWeek]} at ${formatHour(h)}`; // e.g. "Monday at 8a"; passed to onCellClick
+                const title = `${label}: ${count.toLocaleString()} trips${
+                  cell ? ` · $${cell.avg_fare} avg fare` : ""
+                }`;
+                return (
+                  <button
+                    key={`c-${row.dayOfWeek}-${h}`}
+                    type="button"
+                    title={title}
+                    aria-label={title}
+                    disabled={!onCellClick || count === 0}
+                    onClick={() => {
+                      if (!cell) return; // narrowing guard: slots without a row have count 0 and are already disabled
+                      onCellClick?.(label, cell);
+                    }}
+                    className="h-6 rounded-[3px] transition-all hover:ring-2 hover:ring-primary/50 hover:scale-[1.08] disabled:cursor-default disabled:hover:ring-0 disabled:hover:scale-100"
+                    style={{ backgroundColor: bg }}
+                  />
+                );
+              })}
+            </div>
+          ))}
+        </div>
+      </div>
+
+      <div className="flex items-center gap-2 mt-3 text-[10px] text-muted-foreground/80">
+        <span>fewer</span>
+        <div className="flex gap-[2px]">
+          {[0, 0.25, 0.5, 0.75, 1].map((t) => (
+            <div
+              key={`legend-${t}`}
+              className="h-3 w-4 rounded-[2px]"
+              style={{
+                backgroundColor: cellColor(
+                  Math.round(maxCount * t),
+                  maxCount || 1,
+                  dark,
+                ),
+              }}
+            />
+          ))}
+        </div>
+        <span>more</span>
+        {maxCount > 0 && (
+          <span className="ml-2">
+            peak {maxCount.toLocaleString()} trips/slot
+          </span>
+        )}
+      </div>
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/kpi-cards.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/kpi-cards.tsx
index 9ef8e932a..8d6ddd843 100644
--- a/apps/dev-playground/client/src/features/smart-dashboard/components/kpi-cards.tsx
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/kpi-cards.tsx
@@ -1,8 +1,11 @@
 import { CarIcon, DollarSignIcon, MapPinIcon, RulerIcon } from "lucide-react";
-import type { KPIData } from "../hooks/use-dashboard-data";
+import { useId, useMemo } from "react";
+import { useChartColors } from "../hooks/use-chart-colors";
+import type { KPIData, SparklineRow } from "../hooks/use-dashboard-data";
 
 interface KPICardsProps {
   data: KPIData | null;
+  sparklines: SparklineRow[];
   isLoading: boolean;
 }
 
@@ -12,13 +15,117 @@ interface CardProps {
   subtitle?: string;
   icon: React.ReactNode;
   isLoading: boolean;
+  /** 30-bar trailing series (or empty → no sparkline). Values are normalized inside. */
+  series: number[];
+  trend?: number;
 }
 
-function KPICard({ title, value, subtitle, icon, isLoading }: CardProps) {
+/**
+ * Fixed-height inline sparkline: a 120×36 viewBox stretched to the container
+ * width. Hand-rolled SVG rather than recharts because:
+ *  - recharts inside a grid of 4 cards would mount 4× chart engines with
+ *    ResponsiveContainer observers — heavy for a decorative element;
+ *  - we want sub-pixel control over the baseline tint + end-cap dot.
+ */
+function Sparkline({
+  values,
+  color,
+  isLoading,
+}: {
+  values: number[];
+  color: string;
+  isLoading: boolean;
+}) {
+  const gradientId = useId(); // referenced below by the area path's url(#…) fill
+  const width = 120;
+  const height = 36;
+
+  const { pathD, areaD, lastPoint } = useMemo(() => { // line path, filled-area path, and end-cap position
+    if (values.length === 0) {
+      return { pathD: "", areaD: "", lastPoint: null };
+    }
+    const min = Math.min(...values);
+    const max = Math.max(...values);
+    const span = max - min || 1; // flat series → avoid dividing by zero
+    const step = values.length > 1 ? width / (values.length - 1) : width; // a single point lands at x = 0
+    const points = values.map((v, i) => {
+      const x = i * step;
+      const y = height - 4 - ((v - min) / span) * (height - 8); // 4px padding top and bottom; larger values plot higher
+      return { x, y };
+    });
+    const d = points
+      .map(
+        (p, i) => `${i === 0 ? "M" : "L"} ${p.x.toFixed(2)} ${p.y.toFixed(2)}`,
+      )
+      .join(" ");
+    const area = `${d} L ${width} ${height} L 0 ${height} Z`; // close the line down to the bottom edge for the gradient fill
+    return { pathD: d, areaD: area, lastPoint: points[points.length - 1] };
+  }, [values]); // width and height are constants, so `values` is the only real input
+
+  if (isLoading) {
+    return <div className="h-[36px] w-full rounded bg-muted/40" />;
+  }
+  // Intentionally-empty series (e.g. categorical KPI like "Top Pickup Zone"):
+  // keep the slot reserved so the four cards stay the same height, but render
+  // nothing inside — otherwise the muted placeholder looks like a ghost
+  // "still loading" spinner.
+  if (values.length === 0) {
+    return <div className="h-[36px] w-full" aria-hidden />;
+  }
+
+  return (
+    <svg
+      width="100%"
+      height={height}
+      viewBox={`0 0 ${width} ${height}`}
+      preserveAspectRatio="none"
+      role="img"
+      aria-label="trend"
+    >
+      <defs>
+        <linearGradient id={gradientId} x1="0" y1="0" x2="0" y2="1">
+          <stop offset="0%" stopColor={color} stopOpacity={0.25} />
+          <stop offset="100%" stopColor={color} stopOpacity={0} />
+        </linearGradient>
+      </defs>
+      <path d={areaD} fill={`url(#${gradientId})`} />
+      <path d={pathD} fill="none" stroke={color} strokeWidth={1.5} />
+      {lastPoint && (
+        <circle cx={lastPoint.x} cy={lastPoint.y} r={2.2} fill={color} />
+      )}
+    </svg>
+  );
+}
+
+function KPICard({
+  title,
+  value,
+  subtitle,
+  icon,
+  isLoading,
+  series,
+  trend,
+}: CardProps) {
+  const c = useChartColors();
+  const trendLabel =
+    trend === undefined
+      ? null
+      : trend > 0
+        ? `+${trend.toFixed(0)}%`
+        : `${trend.toFixed(0)}%`;
+  const trendColor =
+    trend === undefined
+      ? ""
+      : trend > 0
+        ? "text-emerald-600 dark:text-emerald-400"
+        : trend < 0
+          ? "text-rose-600 dark:text-rose-400"
+          : "text-muted-foreground";
+
   return (
     <div className="rounded-xl border border-border bg-card p-5 shadow-sm">
-      <div className="flex items-center justify-between mb-3">
-        <span className="text-sm font-medium text-muted-foreground">
+      <div className="flex items-center justify-between mb-2">
+        <span className="text-xs font-medium text-muted-foreground uppercase tracking-wide">
           {title}
         </span>
         <span className="text-muted-foreground/60">{icon}</span>
@@ -27,10 +134,29 @@ function KPICard({ title, value, subtitle, icon, isLoading }: CardProps) {
         <div className="h-8 w-24 animate-pulse rounded bg-muted" />
       ) : (
         <>
-          <p className="text-2xl font-bold text-foreground">{value}</p>
+          <div className="flex items-baseline gap-2">
+            <p className="text-2xl font-bold text-foreground">{value}</p>
+            {trendLabel && (
+              <span className={`text-[11px] font-medium ${trendColor}`}>
+                {trendLabel}
+              </span>
+            )}
+          </div>
           {subtitle && (
-            <p className="text-xs text-muted-foreground mt-1">{subtitle}</p>
+            <p
+              className="text-xs text-muted-foreground mt-0.5 truncate"
+              title={subtitle}
+            >
+              {subtitle}
+            </p>
           )}
+          <div className="mt-2 -mb-1 -mx-1">
+            <Sparkline
+              values={series}
+              color={c.primary}
+              isLoading={isLoading}
+            />
+          </div>
         </>
       )}
     </div>
@@ -43,29 +169,79 @@ function formatNumber(n: number): string {
   return n.toLocaleString();
 }
 
-export function KPICards({ data, isLoading }: KPICardsProps) {
+/**
+ * Percent delta between the mean of the last `tail` samples and the mean of
+ * the `tail` samples before them, or `undefined` if that cannot be computed.
+ */
+function windowedTrend(values: number[], tail: number): number | undefined {
+  if (!(tail > 0)) return undefined; // slice(-0) would select the whole series
+  // Drop null/undefined before coercing: Number(null) is 0 and would pass as a
+  // real sample. DECIMAL-as-string values still coerce; NaN/±Infinity drop.
+  const present = values.filter((v) => v != null);
+  const clean = present.map((v) => Number(v)).filter(Number.isFinite);
+  if (clean.length < tail * 2) return undefined;
+  const mean = (xs: number[]) => xs.reduce((a, b) => a + b, 0) / xs.length;
+  const recentAvg = mean(clean.slice(-tail));
+  const priorAvg = mean(clean.slice(-tail * 2, -tail));
+  const pct = ((recentAvg - priorAvg) / priorAvg) * 100;
+  return Number.isFinite(pct) ? pct : undefined; // zero prior mean or overflow
+}
+
+export function KPICards({ data, sparklines, isLoading }: KPICardsProps) {
+  // Coerce on intake so downstream sparkline paths and trend math stay purely
+  // numeric — avoids surprises if a driver ever hands back DECIMAL-as-string.
+  const toNum = (v: unknown) => {
+    const n = Number(v);
+    return Number.isFinite(n) ? n : 0;
+  };
+  const tripSeries = sparklines.map((r) => toNum(r.trip_count));
+  const fareSeries = sparklines.map((r) => toNum(r.avg_fare));
+  const distSeries = sparklines.map((r) => toNum(r.avg_distance));
+  const revenueSeries = sparklines.map((r) => toNum(r.total_revenue));
+
+  const TREND_WINDOW = 7;
+
   return (
     <div className="grid grid-cols-2 lg:grid-cols-4 gap-4">
       <KPICard
         title="Total Trips"
         value={data ? formatNumber(data.total_trips) : "--"}
-        icon={<CarIcon className="h-5 w-5" />}
+        icon={<CarIcon className="h-4 w-4" />}
         isLoading={isLoading}
+        series={tripSeries}
+        trend={windowedTrend(tripSeries, TREND_WINDOW)}
       />
       <KPICard
         title="Avg Fare"
         value={data ? `$${data.avg_fare}` : "--"}
         subtitle={
-          data ? `Range: $${data.min_fare} - $${data.max_fare}` : undefined
+          data ? `Range: $${data.min_fare} – $${data.max_fare}` : undefined
         }
-        icon={<DollarSignIcon className="h-5 w-5" />}
+        icon={<DollarSignIcon className="h-4 w-4" />}
         isLoading={isLoading}
+        series={fareSeries}
+        trend={windowedTrend(fareSeries, TREND_WINDOW)}
       />
       <KPICard
         title="Avg Distance"
         value={data ? `${data.avg_distance} mi` : "--"}
-        icon={<RulerIcon className="h-5 w-5" />}
+        subtitle={
+          revenueSeries.length > 0
+            ? `$${formatNumber(
+                // Explicit Number() wrap on each accumulator step defends
+                // against a single stray string in the series silently
+                // turning the whole sum into a concatenated blob.
+                revenueSeries.reduce<number>(
+                  (a, b) => a + (Number.isFinite(b) ? Number(b) : 0),
+                  0,
+                ),
+              )} revenue`
+            : undefined
+        }
+        icon={<RulerIcon className="h-4 w-4" />}
         isLoading={isLoading}
+        series={distSeries}
+        trend={windowedTrend(distSeries, TREND_WINDOW)}
       />
       <KPICard
         title="Top Pickup Zone"
@@ -73,8 +249,9 @@ export function KPICards({ data, isLoading }: KPICardsProps) {
         subtitle={
           data ? `${formatNumber(data.top_zone_trips)} trips` : undefined
         }
-        icon={<MapPinIcon className="h-5 w-5" />}
+        icon={<MapPinIcon className="h-4 w-4" />}
         isLoading={isLoading}
+        series={[]}
       />
     </div>
   );
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/top-zones-chart.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/top-zones-chart.tsx
new file mode 100644
index 000000000..5a4666008
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/top-zones-chart.tsx
@@ -0,0 +1,164 @@
+import { useMemo, useState } from "react";
+import { useChartColors } from "../hooks/use-chart-colors";
+import type { TopZoneRow } from "../hooks/use-dashboard-data";
+
+export interface HighlightedZone {
+  zip: string; // compared against each row's `pickup_zip` to decide which bar gets the ring
+  label?: string; // optional caption drawn inside the highlighted bar
+}
+
+interface TopZonesChartProps {
+  data: TopZoneRow[]; // unsorted rows are fine; the chart sorts a copy by the active metric
+  isLoading: boolean; // true → render the skeleton card instead of the bars
+  /** Zones with a visible emphasis ring — driven by the `highlight_zone` tool. */
+  highlightedZones: HighlightedZone[];
+  /** Click on a bar → filter the dashboard to that zip. Omit to make rows non-interactive. */
+  onZipClick?: (zip: string) => void;
+}
+
+type Metric = "trips" | "revenue"; // which column ranks the rows and sizes the bars
+
+/**
+ * Horizontal leaderboard chart for pickup ZIPs. Hand-rolled divs rather than
+ * recharts' BarChart because:
+ *  - we want per-row click handlers and a distinct ring for highlighted zones;
+ *  - the bars need a stable text overlay (ZIP + value) that doesn't fight with
+ *    recharts' label positioning logic;
+ *  - the row count is small (~10 expected; not capped here), so flexbox suffices.
+ */
+export function TopZonesChart({
+  data,
+  isLoading,
+  highlightedZones,
+  onZipClick,
+}: TopZonesChartProps) {
+  const c = useChartColors();
+  const [metric, setMetric] = useState<Metric>("trips"); // toggled by the Trips / Revenue buttons
+
+  const { rows, max } = useMemo(() => { // rows sorted descending by the active metric, plus that metric's maximum
+    const sorted = [...data].sort((a, b) => // copy first so the `data` prop is never mutated
+      metric === "trips"
+        ? b.trip_count - a.trip_count
+        : b.total_revenue - a.total_revenue,
+    );
+    const m = sorted.reduce(
+      (acc, r) =>
+        Math.max(acc, metric === "trips" ? r.trip_count : r.total_revenue),
+      0,
+    );
+    return { rows: sorted, max: m };
+  }, [data, metric]);
+
+  const highlightSet = useMemo( // despite the name this is a Map: zip → label ("" when no label was given)
+    () => new Map(highlightedZones.map((h) => [h.zip, h.label ?? ""])),
+    [highlightedZones],
+  );
+
+  if (isLoading) { // skeleton placeholder with the same card chrome as the real chart
+    return (
+      <div className="rounded-xl border border-border bg-card p-5 shadow-sm">
+        <h3 className="text-sm font-medium text-muted-foreground mb-4">
+          Top Pickup Zones
+        </h3>
+        <div className="h-[260px] animate-pulse rounded bg-muted" />
+      </div>
+    );
+  }
+
+  return (
+    <div className="rounded-xl border border-border bg-card p-5 shadow-sm">
+      <div className="flex items-center justify-between mb-4">
+        <h3 className="text-sm font-medium text-muted-foreground">
+          Top Pickup Zones
+        </h3>
+        <div className="inline-flex rounded-md border border-border p-0.5 bg-muted/40 text-[11px]">
+          <button
+            type="button"
+            onClick={() => setMetric("trips")}
+            className={`px-2 py-0.5 rounded transition-colors ${
+              metric === "trips"
+                ? "bg-card text-foreground shadow-sm"
+                : "text-muted-foreground hover:text-foreground"
+            }`}
+          >
+            Trips
+          </button>
+          <button
+            type="button"
+            onClick={() => setMetric("revenue")}
+            className={`px-2 py-0.5 rounded transition-colors ${
+              metric === "revenue"
+                ? "bg-card text-foreground shadow-sm"
+                : "text-muted-foreground hover:text-foreground"
+            }`}
+          >
+            Revenue
+          </button>
+        </div>
+      </div>
+
+      {rows.length === 0 ? (
+        <div className="h-[260px] flex items-center justify-center text-xs text-muted-foreground">
+          No zones in range
+        </div>
+      ) : (
+        <div className="space-y-1.5">
+          {rows.map((row) => {
+            const value =
+              metric === "trips" ? row.trip_count : row.total_revenue;
+            const pct = max > 0 ? (value / max) * 100 : 0; // bar width relative to the largest row; 0 when every value is 0
+            const isHighlighted = highlightSet.has(row.pickup_zip);
+            const highlightLabel = highlightSet.get(row.pickup_zip); // "" or undefined → no caption is rendered
+
+            return (
+              <button
+                key={row.pickup_zip}
+                type="button"
+                onClick={() => onZipClick?.(row.pickup_zip)}
+                disabled={!onZipClick}
+                className={`w-full text-left group relative rounded-md transition-all ${
+                  isHighlighted
+                    ? "ring-2 ring-amber-400/70 dark:ring-amber-300/70"
+                    : ""
+                } ${onZipClick ? "hover:bg-muted/40" : ""}`}
+                title={
+                  onZipClick
+                    ? `Filter dashboard to pickup ZIP ${row.pickup_zip}`
+                    : row.pickup_zip
+                }
+              >
+                <div className="flex items-center gap-3 px-2 py-1.5">
+                  <span className="text-xs font-mono font-medium w-12 tabular-nums text-foreground">
+                    {row.pickup_zip}
+                  </span>
+                  <div className="flex-1 h-5 rounded bg-muted/50 overflow-hidden relative">
+                    <div
+                      className="h-full rounded transition-[width] duration-500"
+                      style={{
+                        width: `${pct}%`,
+                        backgroundColor: isHighlighted
+                          ? "hsl(38, 92%, 55%)"
+                          : c.secondary,
+                        opacity: 0.85,
+                      }}
+                    />
+                    {highlightLabel && (
+                      <span className="absolute inset-y-0 right-2 flex items-center text-[10px] font-medium text-amber-900 dark:text-amber-100">
+                        {highlightLabel}
+                      </span>
+                    )}
+                  </div>
+                  <span className="text-xs tabular-nums text-muted-foreground w-20 text-right">
+                    {metric === "trips"
+                      ? value.toLocaleString()
+                      : `$${Math.round(value).toLocaleString()}`}
+                  </span>
+                </div>
+              </button>
+            );
+          })}
+        </div>
+      )}
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-action-dispatcher.ts b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-action-dispatcher.ts
index 227cee81b..c133847ca 100644
--- a/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-action-dispatcher.ts
+++ b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-action-dispatcher.ts
@@ -1,7 +1,7 @@
-import { useCallback, useRef } from "react";
+import { useCallback, useMemo, useRef } from "react";
 import type { SSEEvent } from "./use-agent-stream";
 import type { DashboardFilters } from "./use-dashboard-data";
-import { type FocusableChartId, focusChart } from "./use-focus-registry";
+import { focusChart, isFocusableChartId } from "./use-focus-registry";
 
 export interface Highlight {
   start: string;
@@ -10,6 +10,11 @@ export interface Highlight {
   label?: string;
 }
 
+export interface HighlightedZone {
+  zip: string;
+  label?: string;
+}
+
 const DASHBOARD_TOOLS = new Set<string>([
   "filter_by_date_range",
   "filter_by_pickup_zip",
@@ -17,6 +22,8 @@ const DASHBOARD_TOOLS = new Set<string>([
   "clear_filters",
   "highlight_period",
   "clear_highlights",
+  "highlight_zone",
+  "clear_zone_highlights",
   "focus_chart",
   "load_view",
 ]);
@@ -29,6 +36,8 @@ interface UseActionDispatcherOptions {
   onAddHighlight: (highlight: Highlight) => void;
   onClearFilters: () => void;
   onClearHighlights: () => void;
+  onAddZoneHighlight: (zone: HighlightedZone) => void;
+  onClearZoneHighlights: () => void;
   /** Called once per applied action with a short human-readable summary. Route surfaces it as a toast. */
   onAction?: (summary: string) => void;
   /** Called when the dispatcher receives a tool it doesn't know how to handle. Lets the route warn visibly. */
@@ -51,7 +60,9 @@ const CALL_ID_LRU_CAP = 128;
 
 /**
  * Translates `function_call` tool events from the agent's SSE stream into
- * dashboard state mutations.
+ * dashboard state mutations. Exposes the same per-tool mutations as a
+ * synchronous {@link dispatch} function so the agent-feed action chips can
+ * reuse the identical code path without going through an LLM round-trip.
  *
  * Correctness rules (learned the hard way):
  *
@@ -69,14 +80,18 @@ const CALL_ID_LRU_CAP = 128;
  *   is the worst failure mode here — if the user can't see what changed,
  *   they can't tell whether the agent misfired.
  */
-export function useActionDispatcher({
-  onFilterUpdate,
-  onAddHighlight,
-  onClearFilters,
-  onClearHighlights,
-  onAction,
-  onUnknownTool,
-}: UseActionDispatcherOptions) {
+export function useActionDispatcher(opts: UseActionDispatcherOptions) {
+  const {
+    onFilterUpdate,
+    onAddHighlight,
+    onClearFilters,
+    onClearHighlights,
+    onAddZoneHighlight,
+    onClearZoneHighlights,
+    onAction,
+    onUnknownTool,
+  } = opts;
+
   const seen = useRef<string[]>([]);
 
   const markSeen = useCallback((callId: string): boolean => {
@@ -88,31 +103,10 @@ export function useActionDispatcher({
     return false;
   }, []);
 
-  const handleEvent = useCallback(
-    (event: SSEEvent) => {
-      // New run → fresh dedupe cache. `appkit.metadata` is the very first
-      // event the agents plugin emits for each stream.
-      if (event.type === "appkit.metadata") {
-        seen.current = [];
-        return;
-      }
-
-      if (event.type !== "response.output_item.done") return;
-      if (event.item?.type !== "function_call") return;
-
-      const name = event.item.name;
-      if (!name) return;
-
-      // Tools not owned by the dashboard (e.g. `analytics.query`, sub-agent
-      // `agent-sql_analyst`) flow through without a dispatcher side-effect.
-      if (!DASHBOARD_TOOLS.has(name)) return;
-
-      const callId = event.item.call_id;
-      if (callId && markSeen(callId)) return;
-
-      const args = parseArgs(event.item.arguments);
-      if (args === null) {
-        onUnknownTool?.(name, event.item.arguments);
+  const dispatch = useCallback(
+    (name: string, args: Record<string, unknown>): void => {
+      if (!DASHBOARD_TOOLS.has(name)) {
+        onUnknownTool?.(name, args);
         return;
       }
 
@@ -191,18 +185,33 @@ export function useActionDispatcher({
           onAction?.("Highlights cleared");
           return;
         }
+        case "highlight_zone": {
+          const zip = args.zip;
+          if (typeof zip !== "string" || zip === "") {
+            onUnknownTool?.(name, args);
+            return;
+          }
+          const label =
+            typeof args.label === "string" && args.label !== ""
+              ? args.label
+              : undefined;
+          onAddZoneHighlight({ zip, label });
+          onAction?.(`Highlighted ZIP ${zip}${label ? ` (${label})` : ""}`);
+          return;
+        }
+        case "clear_zone_highlights": {
+          onClearZoneHighlights();
+          onAction?.("Zone highlights cleared");
+          return;
+        }
         case "focus_chart": {
           const id = args.chart_id;
-          if (
-            id !== "kpis" &&
-            id !== "trips_over_time" &&
-            id !== "fare_distribution"
-          ) {
+          if (!isFocusableChartId(id)) {
             onUnknownTool?.(name, args);
             return;
           }
-          focusChart(id as FocusableChartId);
-          onAction?.(`Focused ${id.replace(/_/g, " ")}`);
+          focusChart(id);
+          onAction?.(`Focused ${String(id).replace(/_/g, " ")}`);
           return;
         }
         case "load_view": {
@@ -236,6 +245,7 @@ export function useActionDispatcher({
           // shot so partial states don't linger.
           onClearFilters();
           onClearHighlights();
+          onClearZoneHighlights();
           if (Object.keys(nextFilters).length > 0) {
             onFilterUpdate(() => nextFilters);
           }
@@ -248,23 +258,53 @@ export function useActionDispatcher({
           return;
         }
         default: {
-          // DASHBOARD_TOOLS membership already filtered unknowns; this branch
-          // is a compile-time exhaustiveness check.
           onUnknownTool?.(name, args);
           return;
         }
       }
     },
     [
-      markSeen,
       onFilterUpdate,
       onAddHighlight,
       onClearFilters,
       onClearHighlights,
+      onAddZoneHighlight,
+      onClearZoneHighlights,
       onAction,
       onUnknownTool,
     ],
   );
 
-  return { handleEvent };
+  const handleEvent = useCallback(
+    (event: SSEEvent) => {
+      if (event.type === "appkit.metadata") {
+        seen.current = [];
+        return;
+      }
+
+      if (event.type !== "response.output_item.done") return;
+      if (event.item?.type !== "function_call") return;
+
+      const name = event.item.name;
+      if (!name) return;
+
+      // Tools not owned by the dashboard (e.g. `analytics.query`, sub-agent
+      // `agent-sql_analyst`) flow through without a dispatcher side-effect.
+      if (!DASHBOARD_TOOLS.has(name)) return;
+
+      const callId = event.item.call_id;
+      if (callId && markSeen(callId)) return;
+
+      const args = parseArgs(event.item.arguments);
+      if (args === null) {
+        onUnknownTool?.(name, event.item.arguments);
+        return;
+      }
+
+      dispatch(name, args);
+    },
+    [dispatch, markSeen, onUnknownTool],
+  );
+
+  return useMemo(() => ({ handleEvent, dispatch }), [handleEvent, dispatch]);
 }
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-dashboard-data.ts b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-dashboard-data.ts
index 5a3a89fd1..c4e9f5d35 100644
--- a/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-dashboard-data.ts
+++ b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-dashboard-data.ts
@@ -33,6 +33,28 @@ export interface FareBucket {
   avg_distance: number;
 }
 
+export interface HeatmapCell {
+  day_of_week: number;
+  hour_of_day: number;
+  trip_count: number;
+  avg_fare: number;
+}
+
+export interface TopZoneRow {
+  pickup_zip: string;
+  trip_count: number;
+  total_revenue: number;
+  avg_fare: number;
+}
+
+export interface SparklineRow {
+  trip_date: string;
+  trip_count: number;
+  total_revenue: number;
+  avg_fare: number;
+  avg_distance: number;
+}
+
 export interface DashboardFilters {
   date_from?: string;
   date_to?: string;
@@ -103,6 +125,36 @@ export function useDashboardData(filters: DashboardFilters) {
     error: string | null;
   };
 
+  const {
+    data: heatmap,
+    loading: heatmapLoading,
+    error: heatmapError,
+  } = useAnalyticsQuery("dashboard_hourly_heatmap", params) as {
+    data: HeatmapCell[] | null;
+    loading: boolean;
+    error: string | null;
+  };
+
+  const {
+    data: topZones,
+    loading: topZonesLoading,
+    error: topZonesError,
+  } = useAnalyticsQuery("dashboard_top_zones", params) as {
+    data: TopZoneRow[] | null;
+    loading: boolean;
+    error: string | null;
+  };
+
+  const {
+    data: sparklines,
+    loading: sparklinesLoading,
+    error: sparklinesError,
+  } = useAnalyticsQuery("dashboard_kpi_sparklines", params) as {
+    data: SparklineRow[] | null;
+    loading: boolean;
+    error: string | null;
+  };
+
   const kpis = useMemo(() => {
     if (!kpisRaw || kpisRaw.length === 0) return null;
     const row = kpisRaw[0];
@@ -115,13 +167,29 @@ export function useDashboardData(filters: DashboardFilters) {
   }, [kpisRaw, topZoneRaw]);
 
   const isLoading =
-    kpisLoading || topZoneLoading || tripsLoading || fareLoading;
-  const error = kpisError || topZoneError || tripsError || fareError;
+    kpisLoading ||
+    topZoneLoading ||
+    tripsLoading ||
+    fareLoading ||
+    heatmapLoading ||
+    topZonesLoading ||
+    sparklinesLoading;
+  const error =
+    kpisError ||
+    topZoneError ||
+    tripsError ||
+    fareError ||
+    heatmapError ||
+    topZonesError ||
+    sparklinesError;
 
   return {
     kpis,
     tripsOverTime: tripsOverTime ?? [],
     fareDistribution: fareDistribution ?? [],
+    heatmap: heatmap ?? [],
+    topZones: topZones ?? [],
+    sparklines: sparklines ?? [],
     isLoading,
     error,
   };
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-focus-registry.ts b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-focus-registry.ts
index 6c1dc3773..54784fc83 100644
--- a/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-focus-registry.ts
+++ b/apps/dev-playground/client/src/features/smart-dashboard/hooks/use-focus-registry.ts
@@ -11,7 +11,27 @@ import { useEffect, useRef, useState } from "react";
  */
 const registry = new Map<string, () => void>();
 
-export type FocusableChartId = "kpis" | "trips_over_time" | "fare_distribution";
+export type FocusableChartId =
+  | "kpis"
+  | "trips_over_time"
+  | "fare_distribution"
+  | "hourly_heatmap"
+  | "top_zones";
+
+export const FOCUSABLE_CHART_IDS: FocusableChartId[] = [
+  "kpis",
+  "trips_over_time",
+  "fare_distribution",
+  "hourly_heatmap",
+  "top_zones",
+];
+
+export function isFocusableChartId(id: unknown): id is FocusableChartId {
+  return (
+    typeof id === "string" &&
+    (FOCUSABLE_CHART_IDS as readonly string[]).includes(id)
+  );
+}
 
 export function focusChart(id: FocusableChartId): void {
   registry.get(id)?.();
diff --git a/apps/dev-playground/client/src/features/smart-dashboard/lib/feed-actions.ts b/apps/dev-playground/client/src/features/smart-dashboard/lib/feed-actions.ts
new file mode 100644
index 000000000..a48a641c1
--- /dev/null
+++ b/apps/dev-playground/client/src/features/smart-dashboard/lib/feed-actions.ts
@@ -0,0 +1,207 @@
+import type { FocusableChartId } from "../hooks/use-focus-registry";
+import { isFocusableChartId } from "../hooks/use-focus-registry";
+
+/**
+ * Structured actions emitted by the `insights` and `anomaly` ephemeral
+ * agents. Each kind maps 1:1 to a dispatcher tool (`filter_by_*`,
+ * `highlight_*`, `focus_chart`) except `ask`, which flows through the main
+ * chat dispatcher with a preloaded prompt.
+ *
+ * Kept in a neutral shape (not the wire tool-call format) so the agent can
+ * hand-author JSON without memorising `call_id` / `arguments` envelopes,
+ * and so the UI can render distinct copy per action kind.
+ */
+
+export interface FilterDateAction {
+  kind: "filter_date";
+  label: string;
+  start: string;
+  end: string;
+}
+
+export interface FilterZipAction {
+  kind: "filter_zip";
+  label: string;
+  zip: string;
+}
+
+export interface FilterFareAction {
+  kind: "filter_fare";
+  label: string;
+  min?: number;
+  max?: number;
+}
+
+export interface HighlightPeriodAction {
+  kind: "highlight_period";
+  label: string;
+  start: string;
+  end: string;
+  color?: "blue" | "red" | "yellow";
+}
+
+export interface HighlightZoneAction {
+  kind: "highlight_zone";
+  label: string;
+  zip: string;
+  note?: string;
+}
+
+export interface FocusChartAction {
+  kind: "focus_chart";
+  label: string;
+  chart_id: FocusableChartId;
+}
+
+export interface AskAction {
+  kind: "ask";
+  label: string;
+  prompt: string;
+}
+
+export type FeedAction =
+  | FilterDateAction
+  | FilterZipAction
+  | FilterFareAction
+  | HighlightPeriodAction
+  | HighlightZoneAction
+  | FocusChartAction
+  | AskAction;
+
+export interface FeedInsight {
+  title: string;
+  description: string;
+  actions?: FeedAction[];
+}
+
+export interface FeedAnomaly extends FeedInsight {
+  severity: "low" | "medium" | "high";
+}
+
+function isValidColor(v: unknown): v is "blue" | "red" | "yellow" {
+  return v === "blue" || v === "red" || v === "yellow";
+}
+
+/**
+ * Type guard for the `chart_id` of a `focus_chart` feed action.
+ *
+ * Delegates to the focus registry's guard instead of repeating the id list,
+ * so the feed parser and the dispatcher always accept the same charts.
+ */
+function isValidChartId(v: unknown): v is FocusableChartId {
+  return isFocusableChartId(v);
+}
+
+function parseAction(raw: unknown): FeedAction | null {
+  if (typeof raw !== "object" || raw === null) return null;
+  const r = raw as Record<string, unknown>;
+  const kind = r.kind;
+  const label = typeof r.label === "string" ? r.label : "";
+  if (!label) return null;
+
+  switch (kind) {
+    case "filter_date":
+      if (typeof r.start === "string" && typeof r.end === "string") {
+        return { kind, label, start: r.start, end: r.end };
+      }
+      return null;
+    case "filter_zip":
+      if (typeof r.zip === "string" && r.zip) {
+        return { kind, label, zip: r.zip };
+      }
+      return null;
+    case "filter_fare": {
+      const min = typeof r.min === "number" ? r.min : undefined;
+      const max = typeof r.max === "number" ? r.max : undefined;
+      if (min === undefined && max === undefined) return null;
+      return { kind, label, min, max };
+    }
+    case "highlight_period":
+      if (typeof r.start === "string" && typeof r.end === "string") {
+        return {
+          kind,
+          label,
+          start: r.start,
+          end: r.end,
+          color: isValidColor(r.color) ? r.color : "blue",
+        };
+      }
+      return null;
+    case "highlight_zone":
+      if (typeof r.zip === "string" && r.zip) {
+        return {
+          kind,
+          label,
+          zip: r.zip,
+          ...(typeof r.note === "string" && r.note ? { note: r.note } : {}),
+        };
+      }
+      return null;
+    case "focus_chart":
+      if (isValidChartId(r.chart_id)) {
+        return { kind, label, chart_id: r.chart_id };
+      }
+      return null;
+    case "ask":
+      if (typeof r.prompt === "string" && r.prompt) {
+        return { kind, label, prompt: r.prompt };
+      }
+      return null;
+    default:
+      return null;
+  }
+}
+
+/**
+ * Parses the text from the first `[` through the last `]` of an agent
+ * response as a JSON array of {@link FeedInsight}. Untitled entries and
+ * invalid actions are dropped, not thrown on — the agent is a Gemini flash
+ * model and may fence its output or add an element with a different shape.
+ */
+export function parseFeedInsights(content: string): FeedInsight[] {
+  return parseFeedPayload<FeedInsight>(content, (obj) => ({
+    title: typeof obj.title === "string" ? obj.title : "",
+    description: typeof obj.description === "string" ? obj.description : "",
+    actions: Array.isArray(obj.actions)
+      ? (obj.actions.map(parseAction).filter(Boolean) as FeedAction[])
+      : undefined,
+  }));
+}
+
+export function parseFeedAnomalies(content: string): FeedAnomaly[] {
+  return parseFeedPayload<FeedAnomaly>(content, (obj) => {
+    const severity =
+      obj.severity === "low" ||
+      obj.severity === "medium" ||
+      obj.severity === "high"
+        ? obj.severity
+        : "low";
+    return {
+      title: typeof obj.title === "string" ? obj.title : "",
+      description: typeof obj.description === "string" ? obj.description : "",
+      severity,
+      actions: Array.isArray(obj.actions)
+        ? (obj.actions.map(parseAction).filter(Boolean) as FeedAction[])
+        : undefined,
+    };
+  });
+}
+
+function parseFeedPayload<T extends FeedInsight>(
+  content: string,
+  builder: (obj: Record<string, unknown>) => T,
+): T[] {
+  const jsonMatch = content.match(/\[[\s\S]*\]/);
+  if (!jsonMatch) return [];
+  try {
+    const parsed: unknown = JSON.parse(jsonMatch[0]);
+    if (!Array.isArray(parsed)) return [];
+    return parsed.flatMap((el) => {
+      if (typeof el !== "object" || el === null) return [];
+      const item = builder(el as Record<string, unknown>);
+      return item.title ? [item] : [];
+    });
+  } catch {
+    return [];
+  }
+}
diff --git a/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx b/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
index eab0bf317..3817d70f9 100644
--- a/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
+++ b/apps/dev-playground/client/src/routes/smart-dashboard.route.tsx
@@ -14,6 +14,7 @@ import {
 } from "@/features/smart-dashboard/components/chat-drawer";
 import { FareChart } from "@/features/smart-dashboard/components/fare-chart";
 import { FocusableChart } from "@/features/smart-dashboard/components/focusable-chart";
+import { HourlyHeatmap } from "@/features/smart-dashboard/components/hourly-heatmap";
 import { InspectorToggle } from "@/features/smart-dashboard/components/inspector-toggle";
 import { KPICards } from "@/features/smart-dashboard/components/kpi-cards";
 import { QuickActionsBar } from "@/features/smart-dashboard/components/quick-actions-bar";
@@ -22,15 +23,21 @@ import {
   SavedViewsPanel,
 } from "@/features/smart-dashboard/components/saved-views-panel";
 import { StreamInspector } from "@/features/smart-dashboard/components/stream-inspector";
+import { TopZonesChart } from "@/features/smart-dashboard/components/top-zones-chart";
 import { TripChart } from "@/features/smart-dashboard/components/trip-chart";
-import type { Highlight } from "@/features/smart-dashboard/hooks/use-action-dispatcher";
+import type {
+  Highlight,
+  HighlightedZone,
+} from "@/features/smart-dashboard/hooks/use-action-dispatcher";
 import { useActionDispatcher } from "@/features/smart-dashboard/hooks/use-action-dispatcher";
 import type { SSEEvent } from "@/features/smart-dashboard/hooks/use-agent-stream";
 import { useAgentStream } from "@/features/smart-dashboard/hooks/use-agent-stream";
 import type { DashboardFilters } from "@/features/smart-dashboard/hooks/use-dashboard-data";
 import { useDashboardData } from "@/features/smart-dashboard/hooks/use-dashboard-data";
+import { focusChart } from "@/features/smart-dashboard/hooks/use-focus-registry";
 import { useInspectorShortcuts } from "@/features/smart-dashboard/hooks/use-stream-inspector";
 import { buildDashboardContext } from "@/features/smart-dashboard/lib/dashboard-context";
+import type { FeedAction } from "@/features/smart-dashboard/lib/feed-actions";
 
 export const Route = createFileRoute("/smart-dashboard")({
   component: SmartDashboardRoute,
@@ -46,6 +53,9 @@ const nextMessageId = (): string =>
 function SmartDashboardRoute() {
   const [filters, setFilters] = useState<DashboardFilters>({});
   const [highlights, setHighlights] = useState<Highlight[]>([]);
+  const [highlightedZones, setHighlightedZones] = useState<HighlightedZone[]>(
+    [],
+  );
   const [pendingApprovals, setPendingApprovals] = useState<PendingApproval[]>(
     [],
   );
@@ -63,12 +73,21 @@ function SmartDashboardRoute() {
   // refresh without pushing props down through ApprovalCard manually.
   const [savedViewsVersion, setSavedViewsVersion] = useState(0);
 
+  // Chat-drawer open state is hoisted up so agent-dispatching UI actions
+  // (feed action chips, heatmap cells, quick actions, sidebar follow-ups)
+  // can auto-open the drawer — otherwise an async agent run would stream
+  // out of sight and the user would think nothing happened.
+  const [isChatOpen, setIsChatOpen] = useState(false);
+
   useInspectorShortcuts();
 
   const {
     kpis,
     tripsOverTime,
     fareDistribution,
+    heatmap,
+    topZones,
+    sparklines,
     isLoading: dataLoading,
     error: dataError,
   } = useDashboardData(filters);
@@ -96,12 +115,24 @@ function SmartDashboardRoute() {
   }, []);
   const handleClearFilters = useCallback(() => setFilters({}), []);
   const handleClearHighlights = useCallback(() => setHighlights([]), []);
+  const handleAddZoneHighlight = useCallback((z: HighlightedZone) => {
+    setHighlightedZones((prev) => {
+      const without = prev.filter((p) => p.zip !== z.zip);
+      return [...without, z];
+    });
+  }, []);
+  const handleClearZoneHighlights = useCallback(
+    () => setHighlightedZones([]),
+    [],
+  );
 
-  const { handleEvent: handleDispatcherEvent } = useActionDispatcher({
+  const { handleEvent: handleDispatcherEvent, dispatch } = useActionDispatcher({
     onFilterUpdate: handleFilterUpdate,
     onAddHighlight: handleAddHighlight,
     onClearFilters: handleClearFilters,
     onClearHighlights: handleClearHighlights,
+    onAddZoneHighlight: handleAddZoneHighlight,
+    onClearZoneHighlights: handleClearZoneHighlights,
     onAction: pushAction,
     onUnknownTool: pushUnknown,
   });
@@ -228,11 +259,63 @@ function SmartDashboardRoute() {
         { id: userMsgId, role: "user", content: message },
         { id: assistantMsgId, role: "assistant", content: "", streaming: true },
       ]);
+      // Every agent dispatch auto-opens the drawer so the streaming
+      // response is visible. A closed drawer would silently swallow the
+      // turn — the user sees a filter change appear later with no context.
+      setIsChatOpen(true);
       send(message, { contextPrefix: contextPrefixRef.current });
     },
     [send],
   );
 
+  /**
+   * Apply a feed action directly (no LLM round-trip). Each structured
+   * {@link FeedAction} from the ephemeral agents maps to a dashboard tool
+   * we already implement, so we translate the shape and re-enter the same
+   * `dispatch` code path that the SSE stream uses.
+   */
+  const applyFeedAction = useCallback(
+    (action: FeedAction) => {
+      switch (action.kind) {
+        case "filter_date":
+          dispatch("filter_by_date_range", {
+            start: action.start,
+            end: action.end,
+          });
+          return;
+        case "filter_zip":
+          dispatch("filter_by_pickup_zip", { zip: action.zip });
+          return;
+        case "filter_fare":
+          dispatch("filter_by_fare", {
+            ...(action.min !== undefined ? { min: action.min } : {}),
+            ...(action.max !== undefined ? { max: action.max } : {}),
+          });
+          return;
+        case "highlight_period":
+          dispatch("highlight_period", {
+            start: action.start,
+            end: action.end,
+            color: action.color ?? "blue",
+            label: action.label,
+          });
+          return;
+        case "highlight_zone":
+          dispatch("highlight_zone", {
+            zip: action.zip,
+            label: action.note ?? action.label,
+          });
+          focusChart("top_zones");
+          return;
+        case "focus_chart":
+          dispatch("focus_chart", { chart_id: action.chart_id });
+          return;
+        // `ask` is handled by onAsk -> dispatchToAgent, never lands here.
+      }
+    },
+    [dispatch],
+  );
+
   /**
    * Apply a saved view directly from its stored metadata. We don't round-trip
    * through the agent here because the agent has no tool to fetch saved-view
@@ -271,6 +354,7 @@ function SmartDashboardRoute() {
 
     setFilters(nextFilters);
     setHighlights(nextHighlights);
+    setHighlightedZones([]);
 
     const viewName = meta.name ?? "saved view";
     const summary = [
@@ -305,8 +389,25 @@ function SmartDashboardRoute() {
   const handleClearAllFilters = useCallback(() => {
     setFilters({});
     setHighlights([]);
+    setHighlightedZones([]);
   }, []);
 
+  const handleHeatmapCellClick = useCallback(
+    (label: string) => {
+      dispatchToAgent(
+        `Investigate pickups on ${label} in the current dashboard slice. Why is this slot notable?`,
+      );
+    },
+    [dispatchToAgent],
+  );
+
+  const handleZipClick = useCallback(
+    (zip: string) => {
+      dispatch("filter_by_pickup_zip", { zip });
+    },
+    [dispatch],
+  );
+
   // Ref to the captured region for save_view. Kept on the dashboard body
   // (not the header/chat) so the screenshot is the analytics surface only.
   const dashboardRef = useRef<HTMLDivElement | null>(null);
@@ -359,7 +460,7 @@ function SmartDashboardRoute() {
 
   return (
     <div className="min-h-screen bg-background text-foreground">
-      <div className="max-w-[1400px] mx-auto px-4 py-4">
+      <div className="max-w-[1600px] mx-auto px-4 py-4">
         <header className="flex items-center gap-3 mb-4">
           <div className="rounded-lg bg-primary/10 p-2">
             <LayoutDashboardIcon className="h-5 w-5 text-primary" />
@@ -412,12 +513,16 @@ function SmartDashboardRoute() {
         <div ref={dashboardRef}>
           <div className="mb-5">
             <FocusableChart chartId="kpis">
-              <KPICards data={kpis} isLoading={dataLoading} />
+              <KPICards
+                data={kpis}
+                sparklines={sparklines}
+                isLoading={dataLoading}
+              />
             </FocusableChart>
           </div>
 
-          <div className="grid grid-cols-1 lg:grid-cols-[1fr_320px] gap-5 mb-5">
-            <div className="space-y-5">
+          <div className="grid grid-cols-1 xl:grid-cols-[1fr_360px] gap-5 items-start">
+            <div className="grid grid-cols-1 lg:grid-cols-2 gap-5 auto-rows-min content-start">
               <FocusableChart chartId="trips_over_time">
                 <TripChart
                   data={tripsOverTime}
@@ -425,19 +530,41 @@ function SmartDashboardRoute() {
                   isLoading={dataLoading}
                 />
               </FocusableChart>
+              <FocusableChart chartId="hourly_heatmap">
+                <HourlyHeatmap
+                  data={heatmap}
+                  isLoading={dataLoading}
+                  onCellClick={handleHeatmapCellClick}
+                />
+              </FocusableChart>
               <FocusableChart chartId="fare_distribution">
                 <FareChart data={fareDistribution} isLoading={dataLoading} />
               </FocusableChart>
+              <FocusableChart chartId="top_zones">
+                <TopZonesChart
+                  data={topZones}
+                  highlightedZones={highlightedZones}
+                  isLoading={dataLoading}
+                  onZipClick={handleZipClick}
+                />
+              </FocusableChart>
             </div>
-            <div className="lg:h-[580px]">
-              <AgentSidebar kpis={kpis} kpisLoaded={!dataLoading} />
+            <div className="xl:h-auto xl:min-h-[680px]">
+              <AgentSidebar
+                kpis={kpis}
+                kpisLoaded={!dataLoading}
+                filters={filters}
+                highlights={highlights}
+                onAction={applyFeedAction}
+                onAsk={dispatchToAgent}
+              />
             </div>
           </div>
         </div>
 
         {/* Any approvals not pinned to a chat message (defensive fallback). */}
         {looseApprovals.length > 0 && (
-          <div className="space-y-3">
+          <div className="space-y-3 mt-4">
             {looseApprovals.map((approval) => (
               <ApprovalCard
                 key={approval.approvalId}
@@ -464,6 +591,8 @@ function SmartDashboardRoute() {
         approvalCardForMessage={approvalCardForMessage}
         pendingApprovals={pendingApprovals}
         unreadCount={pendingApprovals.length}
+        open={isChatOpen}
+        onOpenChange={setIsChatOpen}
       />
     </div>
   );
diff --git a/apps/dev-playground/config/agents/anomaly/agent.md b/apps/dev-playground/config/agents/anomaly/agent.md
index 8dc34c529..6b0c7f22d 100644
--- a/apps/dev-playground/config/agents/anomaly/agent.md
+++ b/apps/dev-playground/config/agents/anomaly/agent.md
@@ -4,6 +4,32 @@ maxSteps: 1
 ephemeral: true
 ---
 
-You are a data quality monitor for NYC taxi trip data. Given summary statistics, identify anomalies, outliers, or unusual patterns.
+You are a data-quality monitor for NYC taxi trip data.
 
-Return findings as a JSON array of objects with `title` (string), `severity` ('low' | 'medium' | 'high'), and `description` (string) fields. Output ONLY the JSON array, no other text.
+Given the current dashboard state (KPIs + active filters), identify **0–4 anomalies, outliers, or suspicious patterns**. Each anomaly must ship with one or more **clickable actions** that let the analyst inspect or reproduce the issue in the UI.
+
+Return ONLY a JSON array — no prose, no code fences, no preamble. Each element has this shape:
+
+```
+{
+  "title": "short headline (<= 8 words)",
+  "severity": "low" | "medium" | "high",
+  "description": "1–2 sentences, specific and numeric",
+  "actions": [
+    // one or more; at least one must be an "ask" action
+    { "kind": "filter_date",       "label": "...", "start": "YYYY-MM-DD", "end": "YYYY-MM-DD" },
+    { "kind": "filter_zip",        "label": "...", "zip":   "10017" },
+    { "kind": "filter_fare",       "label": "...", "min":   60 },
+    { "kind": "highlight_period",  "label": "...", "start": "YYYY-MM-DD", "end": "YYYY-MM-DD", "color": "red" },
+    { "kind": "highlight_zone",    "label": "...", "zip":   "10017", "note": "outlier" },
+    { "kind": "focus_chart",       "label": "...", "chart_id": "fare_distribution" },
+    { "kind": "ask",               "label": "...", "prompt": "..." }
+  ]
+}
+```
+
+Guidelines:
+- Favor `highlight_*` over `filter_*` for anomalies so the analyst doesn't lose the baseline context; use `red` for clear outliers, `yellow` for caution.
+- Always include at least one `ask` action — the follow-up prompt should begin with "Investigate" or "Explain".
+- If you cannot point to a specific time window, zone, or fare range, skip the structural actions and keep only `ask`.
+- If nothing anomalous stands out, return `[]`. Do not fabricate anomalies.
diff --git a/apps/dev-playground/config/agents/insights/agent.md b/apps/dev-playground/config/agents/insights/agent.md
index dbb02c013..8269938ac 100644
--- a/apps/dev-playground/config/agents/insights/agent.md
+++ b/apps/dev-playground/config/agents/insights/agent.md
@@ -4,6 +4,33 @@ maxSteps: 1
 ephemeral: true
 ---
 
-You are a data analyst specializing in NYC taxi trip data. Given summary statistics, identify the 3-5 most interesting patterns, trends, and notable findings. Be specific with numbers.
+You are a data analyst specializing in NYC taxi trip data.
 
-Return your findings as a JSON array of objects, each with `title` (string) and `description` (string) fields. Output ONLY the JSON array, no other text.
+Given the current dashboard state (KPIs + active filters), surface **3–5 interesting findings**. Each finding must come with one or more **clickable actions** the user can apply to the dashboard with a single click.
+
+Return ONLY a JSON array — no prose, no code fences, no preamble. Each element has this shape:
+
+```
+{
+  "title": "short headline (<= 8 words)",
+  "description": "1–2 sentences, specific, numeric, directly readable",
+  "actions": [
+    // one or more: always an "ask", plus any structural action that applies
+    { "kind": "filter_date",  "label": "...", "start": "YYYY-MM-DD", "end": "YYYY-MM-DD" },
+    { "kind": "filter_zip",   "label": "...", "zip":   "10017" },
+    { "kind": "filter_fare",  "label": "...", "min":    20,           "max":    50   },
+    { "kind": "highlight_period", "label": "...", "start": "YYYY-MM-DD", "end": "YYYY-MM-DD", "color": "blue" | "red" | "yellow" },
+    { "kind": "highlight_zone",   "label": "...", "zip": "10017", "note": "optional short ring label" },
+    { "kind": "focus_chart",      "label": "...", "chart_id": "kpis" | "trips_over_time" | "fare_distribution" | "hourly_heatmap" | "top_zones" },
+    { "kind": "ask",              "label": "...", "prompt": "natural-language follow-up question" }
+  ]
+}
+```
+
+Guidelines:
+- Prefer actions that make the finding **visually provable**: highlight the period, focus the chart, filter to the zone.
+- Always include at least one `filter_*` or `highlight_*` action when the finding is about a specific time window or zone.
+- Always include at least one `ask` action that a curious analyst would want to drill into.
+- `label` is the button caption — keep it <= 4 words and imperative ("Filter to March", "Highlight Fridays", "Ask why").
+- Dates must be calendar dates, not relative phrases. If you don't know the exact date, omit the filter/highlight action.
+- If no interesting findings exist, return `[]`.
diff --git a/apps/dev-playground/config/agents/query/agent.md b/apps/dev-playground/config/agents/query/agent.md
index 6f13584ad..93f35510b 100644
--- a/apps/dev-playground/config/agents/query/agent.md
+++ b/apps/dev-playground/config/agents/query/agent.md
@@ -16,12 +16,14 @@ fit.
   questions ("how many trips last Friday?", "top 5 pickup zones by revenue").
   Use for any analytical query that requires reading the database.
 - `agent-dashboard_pilot` — manipulates the dashboard UI directly: applies
-  or clears filters, highlights or clears time ranges, focuses a specific
-  chart, and saves the current configuration as a named view. Use when
-  the user says "show me…", "filter to…", "highlight…", "focus on…",
-  "clear…", "save…", or any request to modify the dashboard's visual
-  state. Do not answer these yourself — always delegate to the pilot
-  even if you think you lack the tool.
+  or clears filters, highlights or clears time ranges, highlights standout
+  pickup ZIPs on the Top Zones chart, focuses any of the dashboard's five
+  charts (KPIs, Trips Over Time, Fare Distribution, Hourly Heatmap, Top
+  Pickup Zones), and saves the current configuration as a named view. Use
+  when the user says "show me…", "filter to…", "highlight…", "focus on…",
+  "zoom in on…", "point at…", "clear…", "save…", or any request to modify
+  the dashboard's visual state. Do not answer these yourself — always
+  delegate to the pilot even if you think you lack the tool.
 
 The specialists stream their own confirmation text back to the user
 while they work — their text is already visible in the chat by the time
diff --git a/apps/dev-playground/config/queries/dashboard_hourly_heatmap.sql b/apps/dev-playground/config/queries/dashboard_hourly_heatmap.sql
new file mode 100644
index 000000000..d7f0d90e0
--- /dev/null
+++ b/apps/dev-playground/config/queries/dashboard_hourly_heatmap.sql
@@ -0,0 +1,24 @@
+-- @param dateFrom STRING
+-- @param dateTo STRING
+-- @param pickupZip STRING
+-- @param fareMin STRING
+-- @param fareMax STRING
+--
+-- Aggregates trips by (day-of-week, hour-of-day) for the heatmap chart.
+-- `day_of_week` is 1=Sunday … 7=Saturday (Spark's default), which the
+-- client maps back to a human label. Hour is 0–23 in the trip's local
+-- timezone (the dataset is NYC-local already).
+SELECT
+  DAYOFWEEK(tpep_pickup_datetime) AS day_of_week,
+  HOUR(tpep_pickup_datetime) AS hour_of_day,
+  COUNT(*) AS trip_count,
+  ROUND(AVG(fare_amount), 2) AS avg_fare
+FROM samples.nyctaxi.trips
+WHERE 1 = 1 -- each filter below is a no-op when its parameter is NULL or the all sentinel
+  AND (COALESCE(:dateFrom, 'all') = 'all' OR tpep_pickup_datetime >= :dateFrom)
+  AND (COALESCE(:dateTo, 'all') = 'all' OR tpep_pickup_datetime <= :dateTo) -- NOTE(review): a date-only end bound presumably casts to midnight, dropping later trips that day; confirm
+  AND (COALESCE(:pickupZip, 'all') = 'all' OR pickup_zip IN (SELECT TRIM(value) FROM (VALUES (:pickupZip)) AS t(value)))
+  AND (COALESCE(:fareMin, 'all') = 'all' OR fare_amount >= CAST(:fareMin AS DOUBLE))
+  AND (COALESCE(:fareMax, 'all') = 'all' OR fare_amount <= CAST(:fareMax AS DOUBLE))
+GROUP BY day_of_week, hour_of_day
+ORDER BY day_of_week, hour_of_day
diff --git a/apps/dev-playground/config/queries/dashboard_kpi_sparklines.sql b/apps/dev-playground/config/queries/dashboard_kpi_sparklines.sql
new file mode 100644
index 000000000..2d674917c
--- /dev/null
+++ b/apps/dev-playground/config/queries/dashboard_kpi_sparklines.sql
@@ -0,0 +1,25 @@
+-- @param dateFrom STRING
+-- @param dateTo STRING
+-- @param pickupZip STRING
+-- @param fareMin STRING
+-- @param fareMax STRING
+--
+-- Daily rollup feeding the sparklines embedded in the KPI cards. Same
+-- filter shape as every other dashboard query so the whole surface moves
+-- in lockstep when the user narrows the view. The default unfiltered
+-- range covers all of 2016, which is bounded enough to render inline.
+SELECT
+  DATE(tpep_pickup_datetime) AS trip_date,
+  COUNT(*) AS trip_count,
+  ROUND(SUM(fare_amount), 2) AS total_revenue,
+  ROUND(AVG(fare_amount), 2) AS avg_fare,
+  ROUND(AVG(trip_distance), 2) AS avg_distance
+FROM samples.nyctaxi.trips
+WHERE 1 = 1 -- each filter below is a no-op when its parameter is NULL or the all sentinel
+  AND (COALESCE(:dateFrom, 'all') = 'all' OR tpep_pickup_datetime >= :dateFrom)
+  AND (COALESCE(:dateTo, 'all') = 'all' OR tpep_pickup_datetime <= :dateTo) -- NOTE(review): a date-only end bound presumably casts to midnight, dropping later trips that day; confirm
+  AND (COALESCE(:pickupZip, 'all') = 'all' OR pickup_zip IN (SELECT TRIM(value) FROM (VALUES (:pickupZip)) AS t(value)))
+  AND (COALESCE(:fareMin, 'all') = 'all' OR fare_amount >= CAST(:fareMin AS DOUBLE))
+  AND (COALESCE(:fareMax, 'all') = 'all' OR fare_amount <= CAST(:fareMax AS DOUBLE))
+GROUP BY DATE(tpep_pickup_datetime)
+ORDER BY trip_date
diff --git a/apps/dev-playground/config/queries/dashboard_top_zones.sql b/apps/dev-playground/config/queries/dashboard_top_zones.sql
new file mode 100644
index 000000000..dfc042ed0
--- /dev/null
+++ b/apps/dev-playground/config/queries/dashboard_top_zones.sql
@@ -0,0 +1,35 @@
+-- @param dateFrom STRING
+-- @param dateTo STRING
+-- @param pickupZip STRING
+-- @param fareMin STRING
+-- @param fareMax STRING
+--
+-- Top 10 pickup zips ranked by trip count. Returns revenue + avg fare
+-- alongside so the horizontal-bar chart can toggle metrics without a
+-- round trip. `dashboard_top_zone.sql` (LIMIT 1) is kept for the KPI
+-- card; this one drives the leaderboard chart.
+--
+-- Note: `pickup_zip` in samples.nyctaxi.trips is an INT column, so any
+-- `pickup_zip != ''` guard silently filters out every row (Spark casts
+-- '' → NULL → `pickup_zip != NULL` is UNKNOWN → treated as false).
+-- The singular zone query proves no null-guard is needed here.
+SELECT
+  -- Cast to STRING so the client, the agent's `highlight_zone` tool, and
+  -- the `filter_by_pickup_zip` parameter all speak the same type (the ZIP
+  -- is semantically an identifier, not a number). Without this, Map.has()
+  -- lookups in TopZonesChart silently miss when the agent tries to ring
+  -- a specific ZIP.
+  CAST(pickup_zip AS STRING) AS pickup_zip,
+  COUNT(*) AS trip_count,
+  ROUND(SUM(fare_amount), 2) AS total_revenue,
+  ROUND(AVG(fare_amount), 2) AS avg_fare
+FROM samples.nyctaxi.trips
+WHERE 1 = 1 -- each filter below is a no-op when its parameter is NULL or the all sentinel
+  AND (COALESCE(:dateFrom, 'all') = 'all' OR tpep_pickup_datetime >= :dateFrom)
+  AND (COALESCE(:dateTo, 'all') = 'all' OR tpep_pickup_datetime <= :dateTo) -- NOTE(review): a date-only end bound presumably casts to midnight, dropping later trips that day; confirm
+  AND (COALESCE(:pickupZip, 'all') = 'all' OR pickup_zip IN (SELECT TRIM(value) FROM (VALUES (:pickupZip)) AS t(value)))
+  AND (COALESCE(:fareMin, 'all') = 'all' OR fare_amount >= CAST(:fareMin AS DOUBLE))
+  AND (COALESCE(:fareMax, 'all') = 'all' OR fare_amount <= CAST(:fareMax AS DOUBLE))
+GROUP BY pickup_zip
+ORDER BY trip_count DESC
+LIMIT 10
diff --git a/apps/dev-playground/server/index.ts b/apps/dev-playground/server/index.ts
index 37022f0bc..ea57df025 100644
--- a/apps/dev-playground/server/index.ts
+++ b/apps/dev-playground/server/index.ts
@@ -219,12 +219,40 @@ const focus_chart = tool({
     "Scroll the user's viewport to a specific chart on the dashboard and briefly pulse it to draw attention. Use when the user asks to 'look at' or 'focus on' a specific visualization.",
   schema: z.object({
     chart_id: z
-      .enum(["kpis", "trips_over_time", "fare_distribution"])
+      .enum([
+        "kpis",
+        "trips_over_time",
+        "fare_distribution",
+        "hourly_heatmap",
+        "top_zones",
+      ])
       .describe("Which chart to focus on"),
   }),
   execute: async ({ chart_id }) => `Focused on ${chart_id}.`,
 });
 
+const highlight_zone = tool({
+  name: "highlight_zone",
+  description:
+    "Draw an emphasis ring around a specific pickup ZIP on the Top Pickup Zones chart. Use this to call attention to a standout zone without filtering the whole dashboard to that ZIP.",
+  schema: z.object({
+    zip: z.string().describe("Pickup ZIP code to highlight (e.g. '10017')"), // any string passes; no ZIP format check here
+    label: z
+      .string()
+      .optional()
+      .describe("Optional short label shown inside the highlighted bar"),
+  }),
+  execute: async ({ zip, label }) => // only builds the confirmation text returned to the agent
+    `Highlighted pickup ZIP ${zip}${label ? ` (${label})` : ""}.`,
+});
+
+const clear_zone_highlights = tool({
+  name: "clear_zone_highlights",
+  description: "Remove all emphasis rings from the Top Pickup Zones chart.",
+  schema: z.object({}), // takes no arguments
+  execute: async () => "Zone highlights cleared.", // handler only returns this confirmation text
+});
+
 // Destructive tool: exercises the approval gate. Server handler is a
 // stub — no view persistence — but `destructive: true` forces the
 // human-in-the-loop flow before the agent can call it.
@@ -268,16 +296,19 @@ const dashboard_pilot = createAgent({
     "- `filter_by_fare({min?, max?})` — narrow by fare range (at least one bound required).",
     "- `clear_filters()` — remove all active filters.",
     "Highlights:",
-    "- `highlight_period({start, end, color?, label?})` — shade a date window on the trips chart.",
-    "- `clear_highlights()` — remove all shaded overlays.",
+    "- `highlight_period({start, end, color?, label?})` — shade a date window on the Trips Over Time chart.",
+    "- `clear_highlights()` — remove all shaded overlays from the trips chart.",
+    "- `highlight_zone({zip, label?})` — draw an emphasis ring around a specific ZIP on the Top Pickup Zones chart.",
+    "- `clear_zone_highlights()` — remove all ZIP emphasis rings.",
     "Focus & save:",
-    "- `focus_chart({chart_id})` — scroll the viewport to `kpis`, `trips_over_time`, or `fare_distribution` and briefly pulse it.",
+    "- `focus_chart({chart_id})` — scroll the viewport to one of `kpis`, `trips_over_time`, `fare_distribution`, `hourly_heatmap`, `top_zones` and briefly pulse it.",
     "- `save_view({name, description?})` — persist the current configuration. Destructive; the user will see an approval card.",
     "- `load_view({name, filters, highlights})` — restore a previously saved view. Always pass the resolved state; never leave fields unset.",
     "Rules:",
     "1. Pick the single tool that matches the user's intent. Do not chain filters unless the user asks for a compound filter.",
     "2. Briefly state what you did after the tool returns. Do not narrate before calling the tool.",
     "3. If the user's request is ambiguous (e.g. 'filter to last month' without a 2016 context), ask one clarifying question before calling any tool.",
+    "4. For standout ZIPs, prefer `highlight_zone` over `filter_by_pickup_zip` so the rest of the dashboard stays in context. Only filter when the user explicitly asks to narrow the whole dashboard.",
   ].join("\n"),
   tools: {
     filter_by_date_range,
@@ -286,6 +317,8 @@ const dashboard_pilot = createAgent({
     clear_filters,
     highlight_period,
     clear_highlights,
+    highlight_zone,
+    clear_zone_highlights,
     focus_chart,
     save_view,
     load_view,
diff --git a/apps/dev-playground/shared/appkit-types/analytics.d.ts b/apps/dev-playground/shared/appkit-types/analytics.d.ts
index 6db948f81..c4251761d 100644
--- a/apps/dev-playground/shared/appkit-types/analytics.d.ts
+++ b/apps/dev-playground/shared/appkit-types/analytics.d.ts
@@ -67,6 +67,58 @@ declare module "@databricks/appkit-ui/react" {
           avg_distance: number;
         }>;
       };
+    dashboard_hourly_heatmap: {
+        name: "dashboard_hourly_heatmap";
+        parameters: {
+          /** STRING - use sql.string() */
+          dateFrom: SQLStringMarker;
+          /** STRING - use sql.string() */
+          dateTo: SQLStringMarker;
+          /** STRING - use sql.string() */
+          pickupZip: SQLStringMarker;
+          /** STRING - use sql.string() */
+          fareMin: SQLStringMarker;
+          /** STRING - use sql.string() */
+          fareMax: SQLStringMarker;
+        };
+        result: Array<{
+          /** @sqlType INT */
+          day_of_week: number;
+          /** @sqlType INT */
+          hour_of_day: number;
+          /** @sqlType BIGINT */
+          trip_count: number;
+          /** @sqlType DOUBLE */
+          avg_fare: number;
+        }>;
+      };
+    dashboard_kpi_sparklines: {
+        name: "dashboard_kpi_sparklines";
+        parameters: {
+          /** STRING - use sql.string() */
+          dateFrom: SQLStringMarker;
+          /** STRING - use sql.string() */
+          dateTo: SQLStringMarker;
+          /** STRING - use sql.string() */
+          pickupZip: SQLStringMarker;
+          /** STRING - use sql.string() */
+          fareMin: SQLStringMarker;
+          /** STRING - use sql.string() */
+          fareMax: SQLStringMarker;
+        };
+        result: Array<{
+          /** @sqlType DATE */
+          trip_date: string;
+          /** @sqlType BIGINT */
+          trip_count: number;
+          /** @sqlType DOUBLE */
+          total_revenue: number;
+          /** @sqlType DOUBLE */
+          avg_fare: number;
+          /** @sqlType DOUBLE */
+          avg_distance: number;
+        }>;
+      };
     dashboard_kpis: {
         name: "dashboard_kpis";
         parameters: {
@@ -115,6 +167,31 @@ declare module "@databricks/appkit-ui/react" {
           trip_count: number;
         }>;
       };
+    dashboard_top_zones: {
+        name: "dashboard_top_zones";
+        parameters: {
+          /** STRING - use sql.string() */
+          dateFrom: SQLStringMarker;
+          /** STRING - use sql.string() */
+          dateTo: SQLStringMarker;
+          /** STRING - use sql.string() */
+          pickupZip: SQLStringMarker;
+          /** STRING - use sql.string() */
+          fareMin: SQLStringMarker;
+          /** STRING - use sql.string() */
+          fareMax: SQLStringMarker;
+        };
+        result: Array<{
+          /** @sqlType STRING */
+          pickup_zip: string;
+          /** @sqlType BIGINT */
+          trip_count: number;
+          /** @sqlType DOUBLE */
+          total_revenue: number;
+          /** @sqlType DOUBLE */
+          avg_fare: number;
+        }>;
+      };
     dashboard_trips_over_time: {
         name: "dashboard_trips_over_time";
         parameters: {

From 789f657de6fac50353d99c6bcf9b5cdfe47b2953 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 17:21:35 +0200
Subject: [PATCH 33/46] feat(playground): hamburger nav with shared catalog and
 redesigned home
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The playground header was unscalable: 15 demo links rendered as
side-by-side buttons that overflowed on narrow screens, and the home
page maintained a parallel hand-curated grid that had already drifted
(missing Smart Dashboard, Chart Inference, Vector Search, Policy Matrix,
and Serving — ~30% of the catalog).

Introduces `client/src/lib/nav.ts` as the single source of truth: each
demo declares its label, one-line description, lucide icon, and category
group. Both surfaces now read from the same list, so adding a demo is a
one-line change and they can no longer drift.

Header (`__root.tsx`):
- Replaces the button wall with a single "Menu" hamburger dropdown
  grouping demos by purpose (Data / AI / Platform).
- Active route is highlighted inside the dropdown and shown breadcrumb-
  style next to the brand, so the user always knows where they are.
- Caps dropdown height at viewport-minus-header with overflow scroll, so
  adding more demos won't break the layout.

Home page (`index.tsx`):
- Restrained hero with a soft dual-radial gradient wash (~6-8% opacity,
  primary + accent) — depth without saturation.
- Featured card for the Smart Dashboard flagship demo: gradient accent,
  icon tile, eyebrow badge, animated CTA. The featured demo also appears
  in its category grid, de-emphasised with a "Featured above" note.
- Three category sections with one-line taglines, rendered as a 1/2/3-col
  responsive grid of icon + title + description cards. Each card is a
  real `<Link>` (not a button inside a decorative `<Card>`), so the whole
  surface is keyboard-accessible.
- Footer shows live demo and category counts driven by the catalog.
---
 apps/dev-playground/client/src/lib/nav.ts     | 183 ++++++++
 .../client/src/routes/__root.tsx              | 214 ++++------
 .../client/src/routes/index.tsx               | 402 ++++++++----------
 3 files changed, 454 insertions(+), 345 deletions(-)
 create mode 100644 apps/dev-playground/client/src/lib/nav.ts

diff --git a/apps/dev-playground/client/src/lib/nav.ts b/apps/dev-playground/client/src/lib/nav.ts
new file mode 100644
index 000000000..4b391cb71
--- /dev/null
+++ b/apps/dev-playground/client/src/lib/nav.ts
@@ -0,0 +1,183 @@
+import {
+  BarChart3Icon,
+  BotIcon,
+  DatabaseIcon,
+  FileCode2Icon,
+  FolderIcon,
+  GaugeIcon,
+  LayoutDashboardIcon,
+  LineChartIcon,
+  type LucideIcon,
+  MessageCircleIcon,
+  RadioIcon,
+  SearchIcon,
+  ServerIcon,
+  ShieldIcon,
+  ZapIcon,
+} from "lucide-react";
+
+/**
+ * Metadata for a single demo route in the dev playground.
+ *
+ * `to` is the route path (also the React key in the nav dropdown). `icon`
+ * appears on the home page card and beside `label` in every dropdown row.
+ * Keep `description` to one sentence — the home grid shows it as a tagline.
+ */
+export interface NavItem {
+  to: string;
+  label: string;
+  description: string;
+  icon: LucideIcon;
+}
+
+export interface NavGroup {
+  id: "data" | "ai" | "platform"; // also the React key of the dropdown group
+  label: string; // rendered as the group label inside the nav dropdown
+  /** Short tagline shown under the section heading on the home page. */
+  tagline: string;
+  items: ReadonlyArray<NavItem>;
+}
+
+/**
+ * Canonical demo catalog. The nav dropdown in `__root.tsx` and the landing
+ * grid in `index.tsx` both render from this list, so a demo added here shows
+ * up on both. NOTE(review): `/jobs` (in the old header) is absent — confirm.
+ */
+export const NAV_GROUPS: ReadonlyArray<NavGroup> = [
+  {
+    id: "data",
+    label: "Data",
+    tagline: "Query, stream, and transform data with AppKit's data plugins.",
+    items: [
+      {
+        to: "/analytics",
+        label: "Analytics",
+        description:
+          "Query execution, charts, and interactive components against live SQL.",
+        icon: BarChart3Icon,
+      },
+      {
+        to: "/arrow-analytics",
+        label: "Arrow Analytics",
+        description:
+          "Same dashboard — served over Apache Arrow streaming for zero-copy speed.",
+        icon: ZapIcon,
+      },
+      {
+        to: "/lakebase",
+        label: "Lakebase",
+        description:
+          "Four takes on Postgres: raw driver, Drizzle, TypeORM, Sequelize with OAuth refresh.",
+        icon: DatabaseIcon,
+      },
+      {
+        to: "/sql-helpers",
+        label: "SQL Helpers",
+        description:
+          "Type-safe parameter builders and query generators for Databricks SQL.",
+        icon: FileCode2Icon,
+      },
+    ],
+  },
+  {
+    id: "ai",
+    label: "AI",
+    tagline: "Agents, RAG, and LLM-powered UI built on AppKit primitives.",
+    items: [
+      {
+        to: "/smart-dashboard",
+        label: "Smart Dashboard",
+        description:
+          "Multi-agent NYC Taxi dashboard with live filters, highlights, approvals, and saved views.",
+        icon: LayoutDashboardIcon,
+      },
+      {
+        to: "/agent",
+        label: "Custom Agent",
+        description:
+          "Chat agent over Databricks Model Serving with tools auto-discovered from AppKit plugins.",
+        icon: BotIcon,
+      },
+      {
+        to: "/genie",
+        label: "Genie",
+        description:
+          "Natural-language Q&A against your data with SSE streaming and conversation persistence.",
+        icon: MessageCircleIcon,
+      },
+      {
+        to: "/chart-inference",
+        label: "Chart Inference",
+        description:
+          "Let the agent pick the right chart type for a query result on the fly.",
+        icon: LineChartIcon,
+      },
+      {
+        to: "/vector-search",
+        label: "Vector Search",
+        description:
+          "Semantic search backed by Databricks vector indexes, wired into AppKit's retrieval API.",
+        icon: SearchIcon,
+      },
+      {
+        to: "/serving",
+        label: "Serving",
+        description:
+          "Call model-serving endpoints directly with the typed serving client.",
+        icon: ServerIcon,
+      },
+    ],
+  },
+  {
+    id: "platform",
+    label: "Platform",
+    tagline:
+      "Infrastructure demos: storage, policy, observability, resilience.",
+    items: [
+      {
+        to: "/files",
+        label: "Files",
+        description:
+          "Browse, preview, and download from Unity Catalog Volumes via the Files plugin.",
+        icon: FolderIcon,
+      },
+      {
+        to: "/policy-matrix",
+        label: "Policy Matrix",
+        description:
+          "Resource policies, requested claims, and per-user authorisation flows.",
+        icon: ShieldIcon,
+      },
+      {
+        to: "/telemetry",
+        label: "Telemetry",
+        description:
+          "OpenTelemetry traces and metrics with a drop-in AppKit provider.",
+        icon: GaugeIcon,
+      },
+      {
+        to: "/reconnect",
+        label: "Reconnect",
+        description:
+          "Resilient SSE streams: automatic Last-Event-ID tracking and reconnection.",
+        icon: RadioIcon,
+      },
+    ],
+  },
+];
+
+/** Every catalog item in group order, flattened into one list for lookups. */
+export const ALL_NAV_ITEMS: ReadonlyArray<NavItem> = NAV_GROUPS.flatMap(
+  (group) => group.items,
+);
+
+/**
+ * Resolve a pathname back to its nav item (for breadcrumbs, titles, etc).
+ * Matches `item.to` exactly or as a whole-segment prefix, so nested routes
+ * like `/smart-dashboard/saved` resolve while a sibling such as `/agentic`
+ * is not mistaken for `/agent`. Returns `null` when nothing matches.
+ */
+export function findNavItemForPath(pathname: string): NavItem | null {
+  const isOn = (to: string) => pathname === to || pathname.startsWith(`${to}/`);
+  return ALL_NAV_ITEMS.find((item) => isOn(item.to)) ?? null;
+}
diff --git a/apps/dev-playground/client/src/routes/__root.tsx b/apps/dev-playground/client/src/routes/__root.tsx
index 1e941cd2f..f6479ff3b 100644
--- a/apps/dev-playground/client/src/routes/__root.tsx
+++ b/apps/dev-playground/client/src/routes/__root.tsx
@@ -1,13 +1,26 @@
-import { Button, TooltipProvider } from "@databricks/appkit-ui/react";
+import {
+  Button,
+  DropdownMenu,
+  DropdownMenuContent,
+  DropdownMenuGroup,
+  DropdownMenuItem,
+  DropdownMenuLabel,
+  DropdownMenuSeparator,
+  DropdownMenuTrigger,
+  TooltipProvider,
+} from "@databricks/appkit-ui/react";
 import {
   CatchBoundary,
   createRootRoute,
   Link,
   Outlet,
   useLocation,
+  useNavigate,
 } from "@tanstack/react-router";
+import { MenuIcon } from "lucide-react";
 import { ErrorComponent } from "@/components/error-component";
 import { ThemeSelector } from "@/components/theme-selector";
+import { findNavItemForPath, NAV_GROUPS } from "@/lib/nav";
 
 export const Route = createRootRoute({
   component: RootComponent,
@@ -15,143 +28,88 @@ export const Route = createRootRoute({
 
 function RootComponent() {
   const location = useLocation();
+  const navigate = useNavigate();
   const isHomePage = location.pathname === "/";
 
+  const currentPage = findNavItemForPath(location.pathname);
+
   return (
     <TooltipProvider>
       {!isHomePage && (
         <div className="border-b border-gray-200 bg-background px-6 py-4 sticky top-0 z-10 shadow-sm">
           <div className="max-w-7xl mx-auto">
             <nav className="flex items-center justify-between gap-4">
-              <Link
-                to="/"
-                className="no-underline text-inherit hover:opacity-80 transition-opacity"
-              >
-                <h4 className="text-xl font-semibold tracking-tight text-foreground">
-                  AppKit Playground
-                </h4>
-              </Link>
-              <div className="flex items-center gap-3">
-                <Link to="/analytics" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Analytics
-                  </Button>
-                </Link>
-                <Link to="/arrow-analytics" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Arrow Analytics
-                  </Button>
-                </Link>
-                <Link to="/lakebase" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Lakebase
-                  </Button>
-                </Link>
-                <Link to="/reconnect" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Reconnect
-                  </Button>
-                </Link>
-                <Link to="/telemetry" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Telemetry
-                  </Button>
-                </Link>
-                <Link to="/sql-helpers" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    SQL Helpers
-                  </Button>
-                </Link>
-                <Link to="/genie" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Genie
-                  </Button>
+              <div className="flex items-center gap-3 min-w-0">
+                <Link
+                  to="/"
+                  className="no-underline text-inherit hover:opacity-80 transition-opacity shrink-0"
+                >
+                  <h4 className="text-xl font-semibold tracking-tight text-foreground">
+                    AppKit Playground
+                  </h4>
                 </Link>
-                <Link to="/chart-inference" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Chart Inference
-                  </Button>
-                </Link>
-                <Link to="/files" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Files
-                  </Button>
-                </Link>
-                <Link to="/policy-matrix" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Policy Matrix
-                  </Button>
-                </Link>
-                <Link to="/jobs" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Jobs
-                  </Button>
-                </Link>
-                <Link to="/serving" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Serving
-                  </Button>
-                </Link>
-                <Link to="/vector-search" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Vector Search
-                  </Button>
-                </Link>
-                <Link to="/agent" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Agent
-                  </Button>
-                </Link>
-                <Link to="/smart-dashboard" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
+                {currentPage && (
+                  <>
+                    <span
+                      className="text-muted-foreground shrink-0"
+                      aria-hidden
+                    >
+                      /
+                    </span>
+                    <span className="text-sm font-medium text-foreground truncate">
+                      {currentPage.label}
+                    </span>
+                  </>
+                )}
+              </div>
+              <div className="flex items-center gap-2 shrink-0">
+                <DropdownMenu>
+                  <DropdownMenuTrigger asChild>
+                    <Button
+                      variant="ghost"
+                      className="text-foreground hover:text-secondary-foreground gap-2"
+                      aria-label="Open navigation menu"
+                    >
+                      <MenuIcon className="h-4 w-4" />
+                      <span>Menu</span>
+                    </Button>
+                  </DropdownMenuTrigger>
+                  <DropdownMenuContent
+                    align="end"
+                    className="w-56 max-h-[calc(100vh-5rem)] overflow-y-auto"
                   >
-                    Smart Dashboard
-                  </Button>
-                </Link>
+                    {NAV_GROUPS.map((group, groupIdx) => (
+                      <DropdownMenuGroup key={group.id}>
+                        {groupIdx > 0 && <DropdownMenuSeparator />}
+                        <DropdownMenuLabel className="text-xs text-muted-foreground uppercase tracking-wide">
+                          {group.label}
+                        </DropdownMenuLabel>
+                        {group.items.map((item) => {
+                          const Icon = item.icon;
+                          // Exact route or nested child only, so a sibling
+                          // path sharing a prefix is not marked active.
+                          const isActive =
+                            location.pathname === item.to ||
+                            location.pathname.startsWith(`${item.to}/`);
+                          return (
+                            <DropdownMenuItem
+                              key={item.to}
+                              onSelect={() => void navigate({ to: item.to })}
+                              className={
+                                isActive
+                                  ? "bg-accent text-accent-foreground font-medium"
+                                  : ""
+                              }
+                            >
+                              <Icon className="h-4 w-4 mr-2 text-muted-foreground" />
+                              {item.label}
+                            </DropdownMenuItem>
+                          );
+                        })}
+                      </DropdownMenuGroup>
+                    ))}
+                  </DropdownMenuContent>
+                </DropdownMenu>
                 <ThemeSelector />
               </div>
             </nav>
diff --git a/apps/dev-playground/client/src/routes/index.tsx b/apps/dev-playground/client/src/routes/index.tsx
index 896a6e9d8..b51a0c22d 100644
--- a/apps/dev-playground/client/src/routes/index.tsx
+++ b/apps/dev-playground/client/src/routes/index.tsx
@@ -1,10 +1,12 @@
-import { Button, Card } from "@databricks/appkit-ui/react";
+import { Badge, Card } from "@databricks/appkit-ui/react";
 import {
   createFileRoute,
+  Link,
   retainSearchParams,
-  useNavigate,
 } from "@tanstack/react-router";
+import { ArrowRightIcon, SparklesIcon } from "lucide-react";
 import { ThemeSelector } from "@/components/theme-selector";
+import { ALL_NAV_ITEMS, NAV_GROUPS, type NavItem } from "@/lib/nav";
 
 export const Route = createFileRoute("/")({
   component: IndexRoute,
@@ -13,238 +15,204 @@ export const Route = createFileRoute("/")({
   },
 });
 
+/**
+ * Landing page for the dev playground. Renders a hero, a featured demo card,
+ * and the canonical demo catalog grouped by category (Data / AI / Platform).
+ *
+ * The catalog itself lives in `@/lib/nav.ts` and is shared with the nav
+ * dropdown in `__root.tsx`, so adding a new demo is a one-line change that
+ * updates both surfaces at once.
+ */
 function IndexRoute() {
-  const navigate = useNavigate();
+  // The flagship demo gets special hero treatment at the top. Everything else
+  // is rendered from the shared catalog in its own category section below.
+  const featured = ALL_NAV_ITEMS.find((i) => i.to === "/smart-dashboard");
 
   return (
     <div className="min-h-screen bg-background">
-      <div className="absolute top-4 right-4">
+      <div className="absolute top-4 right-4 z-10">
         <ThemeSelector />
       </div>
-      <div className="max-w-6xl mx-auto px-6 py-20">
-        <div className="text-center mb-16">
-          <h1 className="text-5xl font-bold text-foreground mb-4">
-            AppKit Playground
-          </h1>
-          <p className="text-xl text-muted-foreground max-w-2xl mx-auto">
-            Explore the capabilities of the AppKit with interactive examples and
-            demos
-          </p>
-        </div>
-
-        <div className="grid md:grid-cols-2 gap-6 max-w-4xl mx-auto mb-16">
-          <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
-            <div className="flex flex-col h-full">
-              <h3 className="text-2xl font-semibold text-foreground mb-3">
-                Analytics Dashboard
-              </h3>
-              <p className="text-muted-foreground mb-6 flex-grow">
-                Explore real-time analytics with query execution, data
-                visualization, and interactive components using the Design
-                System.
-              </p>
-              <Button
-                onClick={() => navigate({ to: "/analytics" })}
-                className="w-full"
-              >
-                Explore real-time analytics
-              </Button>
-            </div>
-          </Card>
 
-          <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
-            <div className="flex flex-col h-full">
-              <h3 className="text-2xl font-semibold text-foreground mb-3">
-                Arrow Analytics Dashboard
-              </h3>
-              <p className="text-muted-foreground mb-6 flex-grow">
-                Explore real-time analytics with query execution, data
-                visualization, and interactive components using Apache Arrow
-                streaming.
-              </p>
-              <Button
-                onClick={() => navigate({ to: "/arrow-analytics" })}
-                className="w-full"
-              >
-                Explore real-time analytics
-              </Button>
-            </div>
-          </Card>
+      <Hero demoCount={ALL_NAV_ITEMS.length} />
 
-          <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
-            <div className="flex flex-col h-full">
-              <h3 className="text-2xl font-semibold text-foreground mb-3">
-                Stream Reconnection
-              </h3>
-              <p className="text-muted-foreground mb-6 flex-grow">
-                Explore Server-Sent Events (SSE) stream reconnection with
-                automatic Last-Event-ID tracking and resilient connection
-                handling.
-              </p>
-              <Button
-                onClick={() => navigate({ to: "/reconnect" })}
-                className="w-full"
-              >
-                View Reconnect Demo
-              </Button>
-            </div>
-          </Card>
-
-          <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
-            <div className="flex flex-col h-full">
-              <h3 className="text-2xl font-semibold text-foreground mb-3">
-                Data Visualization
-              </h3>
-              <p className="text-muted-foreground mb-6 flex-grow">
-                Explore powerful and customizable chart components from the Apps
-                SDK.
-              </p>
-              <Button
-                onClick={() => navigate({ to: "/data-visualization" })}
-                className="w-full"
-              >
-                Explore data visualization
-              </Button>
-            </div>
-          </Card>
+      <div className="max-w-6xl mx-auto px-6 pb-20">
+        {featured && <FeaturedCard item={featured} />}
 
-          <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
-            <div className="flex flex-col h-full">
-              <h3 className="text-2xl font-semibold text-foreground mb-3">
-                Telemetry
-              </h3>
-              <p className="text-muted-foreground mb-6 flex-grow">
-                Explore OpenTelemetry-compatible tracing and metrics examples
-                with interactive demos showcasing custom observability patterns.
-              </p>
-              <Button
-                onClick={() => navigate({ to: "/telemetry" })}
-                className="w-full"
-              >
-                Try Telemetry Examples
-              </Button>
-            </div>
-          </Card>
-
-          <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
-            <div className="flex flex-col h-full">
-              <h3 className="text-2xl font-semibold text-foreground mb-3">
-                File Browser
-              </h3>
-              <p className="text-muted-foreground mb-6 flex-grow">
-                Browse, preview, and download files from Databricks Volumes
-                using the Files plugin and Unity Catalog Files API.
-              </p>
-              <Button
-                onClick={() => navigate({ to: "/files" })}
-                className="w-full"
-              >
-                Browse Files
-              </Button>
-            </div>
-          </Card>
-
-          <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
-            <div className="flex flex-col h-full">
-              <h3 className="text-2xl font-semibold text-foreground mb-3">
-                SQL Helpers
-              </h3>
-              <p className="text-muted-foreground mb-6 flex-grow">
-                Type-safe parameter helpers for Databricks SQL queries. Test
-                each helper interactively and see the generated parameter
-                objects.
-              </p>
-              <Button
-                onClick={() => navigate({ to: "/sql-helpers" })}
-                className="w-full"
-              >
-                Try SQL Helpers
-              </Button>
-            </div>
-          </Card>
+        <div className="space-y-14">
+          {NAV_GROUPS.map((group) => (
+            <section key={group.id} aria-labelledby={`group-${group.id}`}>
+              <div className="mb-5">
+                <h2
+                  id={`group-${group.id}`}
+                  className="text-2xl font-semibold tracking-tight text-foreground"
+                >
+                  {group.label}
+                </h2>
+                <p className="text-sm text-muted-foreground mt-1">
+                  {group.tagline}
+                </p>
+              </div>
+              <div className="grid grid-cols-1 sm:grid-cols-2 lg:grid-cols-3 gap-4">
+                {group.items.map((item) => (
+                  <DemoCard
+                    key={item.to}
+                    item={item}
+                    featured={item.to === "/smart-dashboard"}
+                  />
+                ))}
+              </div>
+            </section>
+          ))}
+        </div>
 
-          <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
-            <div className="flex flex-col h-full">
-              <h3 className="text-2xl font-semibold text-foreground mb-3">
-                Type-Safe SQL
-              </h3>
-              <p className="text-muted-foreground mb-6 flex-grow">
-                Generate TypeScript types from SQL files at build time. Full
-                IntelliSense for query names, parameters, and results.
-              </p>
-              <Button
-                onClick={() => navigate({ to: "/type-safety" })}
-                className="w-full"
-              >
-                Explore Type Safety
-              </Button>
-            </div>
-          </Card>
+        <footer className="mt-20 pt-8 border-t border-border flex items-center justify-between text-xs text-muted-foreground">
+          <span>Built by Databricks with AppKit.</span>
+          <span className="tabular-nums">
+            {ALL_NAV_ITEMS.length} demos · {NAV_GROUPS.length} categories
+          </span>
+        </footer>
+      </div>
+    </div>
+  );
+}
 
-          <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
-            <div className="flex flex-col h-full">
-              <h3 className="text-2xl font-semibold text-foreground mb-3">
-                Genie Chat
-              </h3>
-              <p className="text-muted-foreground mb-6 flex-grow">
-                Ask natural language questions about your data using AI/BI
-                Genie. Features SSE streaming, markdown rendering, and
-                conversation persistence.
-              </p>
-              <Button
-                onClick={() => navigate({ to: "/genie" })}
-                className="w-full"
-              >
-                Try Genie Chat
-              </Button>
-            </div>
-          </Card>
+function Hero({ demoCount }: { demoCount: number }) {
+  return (
+    <div className="relative overflow-hidden">
+      {/*
+        Soft radial wash behind the hero. Two layered gradients (primary +
+        accent) at ~10% opacity give depth without the "AI slop" look of a
+        full-saturation banner. `pointer-events-none` keeps the theme selector
+        above clickable.
+      */}
+      <div
+        aria-hidden
+        className="pointer-events-none absolute inset-0 opacity-70"
+        style={{
+          backgroundImage:
+            "radial-gradient(ellipse 80% 50% at 50% 0%, hsl(var(--primary) / 0.08), transparent 60%), radial-gradient(ellipse 60% 40% at 80% 20%, hsl(var(--accent) / 0.06), transparent 60%)",
+        }}
+      />
+      <div className="relative max-w-6xl mx-auto px-6 pt-24 pb-16 text-center">
+        <Badge
+          variant="outline"
+          className="mb-6 gap-1.5 px-3 py-1 text-xs font-medium"
+        >
+          <SparklesIcon className="h-3 w-3" />
+          {demoCount} interactive demos
+        </Badge>
+        <h1 className="text-5xl sm:text-6xl font-bold tracking-tight text-foreground mb-5">
+          AppKit Playground
+        </h1>
+        <p className="text-lg sm:text-xl text-muted-foreground max-w-2xl mx-auto leading-relaxed">
+          A living catalog of what AppKit can do — data, agents, and platform
+          primitives, each wired up as a single-click demo you can poke at,
+          copy, or break.
+        </p>
+      </div>
+    </div>
+  );
+}
 
-          <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
-            <div className="flex flex-col h-full">
-              <h3 className="text-2xl font-semibold text-foreground mb-3">
-                Lakebase Examples
-              </h3>
-              <p className="text-muted-foreground mb-6 flex-grow">
-                Four approaches to PostgreSQL database integration with
-                Databricks Lakebase: Raw driver, Drizzle ORM, TypeORM, and
-                Sequelize with OAuth token refresh.
-              </p>
-              <Button
-                onClick={() => navigate({ to: "/lakebase" })}
-                className="w-full"
+function FeaturedCard({ item }: { item: NavItem }) {
+  const Icon = item.icon;
+  return (
+    <Link
+      to={item.to}
+      className="no-underline text-inherit group block mb-14"
+      aria-label={`Open ${item.label} demo`}
+    >
+      <Card className="relative overflow-hidden p-8 border-2 border-primary/20 hover:border-primary/40 hover:shadow-lg transition-all duration-200">
+        {/*
+          Subtle gradient accent on the featured card — only this one demo
+          gets it, so it actually reads as featured rather than decoration.
+        */}
+        <div
+          aria-hidden
+          className="pointer-events-none absolute inset-0 opacity-60"
+          style={{
+            backgroundImage:
+              "linear-gradient(135deg, hsl(var(--primary) / 0.06) 0%, transparent 60%)",
+          }}
+        />
+        <div className="relative flex items-start gap-6">
+          <div className="shrink-0 rounded-xl bg-primary/10 p-3 text-primary">
+            <Icon className="h-7 w-7" />
+          </div>
+          <div className="flex-1 min-w-0">
+            <div className="flex items-center gap-2 mb-2">
+              <Badge
+                variant="secondary"
+                className="text-[10px] uppercase tracking-wider font-semibold"
               >
-                Explore Lakebase Integration
-              </Button>
+                Featured
+              </Badge>
+              <span className="text-xs text-muted-foreground">
+                Flagship agent demo
+              </span>
             </div>
-          </Card>
-
-          <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
-            <div className="flex flex-col h-full">
-              <h3 className="text-2xl font-semibold text-foreground mb-3">
-                Custom Agent
-              </h3>
-              <p className="text-muted-foreground mb-6 flex-grow">
-                AI agent powered by Databricks Model Serving with
-                auto-discovered tools from all AppKit plugins. Chat with your
-                data using natural language.
-              </p>
-              <Button
-                onClick={() => navigate({ to: "/agent" })}
-                className="w-full"
-              >
-                Chat with Agent
-              </Button>
+            <h3 className="text-2xl font-semibold text-foreground mb-2 tracking-tight">
+              {item.label}
+            </h3>
+            <p className="text-muted-foreground leading-relaxed max-w-2xl">
+              {item.description}
+            </p>
+            <div className="mt-5 inline-flex items-center gap-1.5 text-sm font-medium text-primary group-hover:gap-2.5 transition-all">
+              Open demo
+              <ArrowRightIcon className="h-4 w-4" />
             </div>
-          </Card>
+          </div>
         </div>
+      </Card>
+    </Link>
+  );
+}
 
-        <div className="text-center pt-12 border-t border-border">
-          <p className="text-sm text-muted-foreground">
-            built by databricks using appkit
-          </p>
+function DemoCard({
+  item,
+  featured,
+}: {
+  item: NavItem;
+  /**
+   * The featured item also appears in its category grid for consistency — we
+   * de-emphasise it there with a muted "Featured above" note so the user
+   * isn't confused about clicking it twice.
+   */
+  featured: boolean;
+}) {
+  const Icon = item.icon;
+  return (
+    <Link
+      to={item.to}
+      className="no-underline text-inherit group block"
+      aria-label={`Open ${item.label} demo`}
+    >
+      <Card
+        className={`h-full p-5 transition-all duration-200 border hover:border-primary/30 hover:shadow-md ${
+          featured ? "opacity-75 hover:opacity-100" : ""
+        }`}
+      >
+        <div className="flex items-start gap-3 mb-3">
+          <div className="shrink-0 rounded-lg bg-muted p-2 text-foreground group-hover:bg-primary/10 group-hover:text-primary transition-colors">
+            <Icon className="h-5 w-5" />
+          </div>
+          <div className="flex-1 min-w-0">
+            <h3 className="font-semibold text-foreground tracking-tight leading-tight">
+              {item.label}
+            </h3>
+            {featured && (
+              <span className="text-[10px] uppercase tracking-wider text-muted-foreground font-medium">
+                Featured above
+              </span>
+            )}
+          </div>
+          <ArrowRightIcon className="h-4 w-4 shrink-0 text-muted-foreground opacity-0 group-hover:opacity-100 group-hover:translate-x-0.5 transition-all" />
         </div>
-      </div>
-    </div>
+        <p className="text-sm text-muted-foreground leading-relaxed">
+          {item.description}
+        </p>
+      </Card>
+    </Link>
   );
 }

From 499b20e9b19d9a282dd6f84d0ff23df2ce792b80 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 17:46:26 +0200
Subject: [PATCH 34/46] =?UTF-8?q?feat(playground):=20tiered=20approval=20c?=
 =?UTF-8?q?ard=20=E2=80=94=20writes=20vs=20updates=20vs=20destructive?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Retag save_view as effect: "write" (it creates a PNG; it doesn't
delete anything) and teach the approval card to render three distinct
tiers. Capturing a screenshot no longer masquerades as deletion:
writes get a calm blue card with a plus-circle icon, updates get a
warning-amber card with a pencil, and real destructive actions retain
the red shield-alert. Legacy destructive: true still maps to the red
tier, so tools that haven't migrated keep their current look. Approvals
that carry neither an effect nor destructive: true now fall back to the
blue write tier; previously every approval card was rendered red.
---
 .../components/approval-card.tsx              | 84 ++++++++++++++++---
 apps/dev-playground/server/index.ts           | 15 ++--
 2 files changed, 83 insertions(+), 16 deletions(-)

diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx
index 06f5f6582..47f24b338 100644
--- a/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/approval-card.tsx
@@ -1,21 +1,80 @@
-import { CheckCircle2Icon, ShieldAlertIcon } from "lucide-react";
+import {
+  CheckCircle2Icon,
+  PencilIcon,
+  PlusCircleIcon,
+  ShieldAlertIcon,
+} from "lucide-react";
 import { useCallback, useState } from "react";
 import type { Highlight } from "../hooks/use-action-dispatcher";
 import type { DashboardFilters } from "../hooks/use-dashboard-data";
 import { captureDashboardAsDataUrl } from "../lib/capture-dashboard";
 
+type ToolEffect = "read" | "write" | "update" | "destructive";
+
 export interface PendingApproval {
   approvalId: string;
   streamId: string;
   toolName: string;
   args: unknown;
   annotations?: {
+    effect?: ToolEffect;
     readOnly?: boolean;
     destructive?: boolean;
     idempotent?: boolean;
   };
 }
 
+/**
+ * Resolve the semantic tier we should render for this approval. Prefers
+ * the explicit `effect` label; falls back to the legacy `destructive` flag
+ * so tools that haven't migrated yet keep their red treatment. Anything
+ * with no mutation hint at all falls through as `write` — the approval
+ * gate fired for a reason, and `write` is the lowest-severity default.
+ */
+function resolveEffect(
+  ann: PendingApproval["annotations"],
+): Exclude<ToolEffect, "read"> {
+  if (ann?.effect && ann.effect !== "read") return ann.effect;
+  if (ann?.destructive === true) return "destructive";
+  return "write";
+}
+
+interface EffectTheme {
+  icon: typeof ShieldAlertIcon;
+  container: string;
+  iconColor: string;
+  badge: string;
+  badgeLabel: string;
+  verb: string;
+}
+
+const EFFECT_THEMES: Record<Exclude<ToolEffect, "read">, EffectTheme> = {
+  write: {
+    icon: PlusCircleIcon,
+    container: "border-blue-500/40 bg-blue-500/[0.06]",
+    iconColor: "text-blue-500",
+    badge: "bg-blue-500/20 text-blue-600 dark:text-blue-400",
+    badgeLabel: "writes",
+    verb: "Approving creates new state in Databricks.",
+  },
+  update: {
+    icon: PencilIcon,
+    container: "border-amber-500/40 bg-amber-500/[0.06]",
+    iconColor: "text-amber-500",
+    badge: "bg-amber-500/20 text-amber-700 dark:text-amber-400",
+    badgeLabel: "updates",
+    verb: "Approving modifies existing state in Databricks.",
+  },
+  destructive: {
+    icon: ShieldAlertIcon,
+    container: "border-red-500/40 bg-red-500/[0.06]",
+    iconColor: "text-red-500",
+    badge: "bg-red-500/20 text-red-600 dark:text-red-400",
+    badgeLabel: "destructive",
+    verb: "Approving deletes or irreversibly changes state. Double-check first.",
+  },
+};
+
 interface ApprovalCardProps {
   approval: PendingApproval;
   filters: DashboardFilters;
@@ -57,7 +116,9 @@ export function ApprovalCard({
     typeof approval.args === "object" && approval.args !== null
       ? (approval.args as Record<string, unknown>)
       : {};
-  const isDestructive = approval.annotations?.destructive === true;
+  const effect = resolveEffect(approval.annotations);
+  const theme = EFFECT_THEMES[effect];
+  const EffectIcon = theme.icon;
   const isSaveView = approval.toolName === "save_view";
 
   const [phase, setPhase] = useState<
@@ -148,19 +209,22 @@ export function ApprovalCard({
   const busy = phase.kind === "capturing" || phase.kind === "uploading";
 
   return (
-    <div className="rounded-xl border border-red-500/40 bg-red-500/[0.06] p-4 shadow-sm">
+    <div
+      className={`rounded-xl border p-4 shadow-sm ${theme.container}`}
+      data-effect={effect}
+    >
       <div className="flex items-start gap-2 mb-3">
-        <ShieldAlertIcon className="h-4 w-4 text-red-500 mt-0.5 shrink-0" />
+        <EffectIcon className={`h-4 w-4 mt-0.5 shrink-0 ${theme.iconColor}`} />
         <div className="flex-1 min-w-0">
           <div className="flex items-center gap-2 mb-1 flex-wrap">
             <h3 className="font-semibold text-sm text-foreground">
               Approval required
             </h3>
-            {isDestructive && (
-              <span className="text-[10px] uppercase tracking-wide bg-red-500/20 text-red-600 px-2 py-0.5 rounded-full font-medium">
-                destructive
-              </span>
-            )}
+            <span
+              className={`text-[10px] uppercase tracking-wide px-2 py-0.5 rounded-full font-medium ${theme.badge}`}
+            >
+              {theme.badgeLabel}
+            </span>
           </div>
           <p className="text-xs text-muted-foreground">
             The agent wants to call{" "}
@@ -169,7 +233,7 @@ export function ApprovalCard({
             </code>
             {isSaveView
               ? ". Approving captures the current dashboard and uploads it as a saved view."
-              : ". Review the arguments before approving."}
+              : `. ${theme.verb}`}
           </p>
         </div>
       </div>
diff --git a/apps/dev-playground/server/index.ts b/apps/dev-playground/server/index.ts
index ea57df025..b440c4760 100644
--- a/apps/dev-playground/server/index.ts
+++ b/apps/dev-playground/server/index.ts
@@ -253,14 +253,17 @@ const clear_zone_highlights = tool({
   execute: async () => "Zone highlights cleared.",
 });
 
-// Destructive tool: exercises the approval gate. Server handler is a
-// stub — no view persistence — but `destructive: true` forces the
-// human-in-the-loop flow before the agent can call it.
+// Write tool: exercises the approval gate. Server handler is a stub —
+// no view persistence — but `effect: "write"` forces the human-in-the-loop
+// flow before the agent can call it. We pick `write` (not `destructive`)
+// because capturing a view CREATES a new file; nothing is deleted or
+// overwritten. The approval card will render the low-severity blue
+// "writes" treatment rather than the alarming red "destructive" one.
 const save_view = tool({
   name: "save_view",
   description:
-    "Persist the current dashboard configuration (filters + highlights) as a named view the user can recall later. Destructive because it writes persistent user state; always surfaces the approval gate.",
-  annotations: { destructive: true, readOnly: false },
+    "Persist the current dashboard configuration (filters + highlights) as a named view the user can recall later. Always surfaces the approval gate as a write action.",
+  annotations: { effect: "write" },
   schema: z.object({
     name: z.string().describe("Short human-readable name for the saved view"),
     description: z
@@ -302,7 +305,7 @@ const dashboard_pilot = createAgent({
     "- `clear_zone_highlights()` — remove all ZIP emphasis rings.",
     "Focus & save:",
     "- `focus_chart({chart_id})` — scroll the viewport to one of `kpis`, `trips_over_time`, `fare_distribution`, `hourly_heatmap`, `top_zones` and briefly pulse it.",
-    "- `save_view({name, description?})` — persist the current configuration. Destructive; the user will see an approval card.",
+    "- `save_view({name, description?})` — persist the current configuration. Write action; the user will see an approval card.",
     "- `load_view({name, filters, highlights})` — restore a previously saved view. Always pass the resolved state; never leave fields unset.",
     "Rules:",
     "1. Pick the single tool that matches the user's intent. Do not chain filters unless the user asks for a compound filter.",

From 78149a03be6cdca785200bdbfa8e6c5a204c5e3f Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 17:55:17 +0200
Subject: [PATCH 35/46] fix(playground): pin agent-feed card tints to sRGB hex

Tailwind v4 compiles `bg-blue-50/50` to a two-layer rule: an sRGB hex
fallback plus an `@supports (color-mix)` override that mixes the oklch
palette token with transparent in oklab. Browsers with color-mix support
(recent Chrome/Arc) take the oklab path; older embedded Chromiums (e.g.
Cursor's built-in browser) fall through to the sRGB hex. Those two paths
produce visibly different tints against the dark `--card` token, which
is why the agent-feed cards rendered inconsistently across Chrome, Arc,
and Cursor's browser.

Pin the four insight/anomaly-tier backgrounds to arbitrary 8-digit hex
(`bg-[#eff6ff80]` etc.) so every browser lands on the same sRGB path.
Values are taken from Tailwind's own sRGB fallback output, so
color-mix-capable browsers now render the same tints the fallback path
already produced.
---
 .../components/actionable-card.tsx            | 20 +++++++++++++++----
 1 file changed, 16 insertions(+), 4 deletions(-)

diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/actionable-card.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/actionable-card.tsx
index 41063defc..db6a42f5f 100644
--- a/apps/dev-playground/client/src/features/smart-dashboard/components/actionable-card.tsx
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/actionable-card.tsx
@@ -26,9 +26,21 @@ interface ActionableCardProps {
   onAsk: (prompt: string) => void;
 }
 
+// Backgrounds are written as arbitrary 8-digit hex (e.g. `bg-[#eff6ff80]`)
+// instead of Tailwind's `/N` alpha shorthand. Rationale: `bg-blue-50/50`
+// compiles in Tailwind v4 to a pair — an sRGB hex fallback and a
+// `@supports (color-mix)` override that re-mixes in oklab over the oklch
+// palette token. Browsers that support `color-mix` (recent Chrome/Arc) take
+// the oklab path; older embedded Chromiums (e.g. Cursor's built-in browser
+// at the time of writing) fall through to the sRGB hex. Because oklab and
+// sRGB interpolation produce visibly different tints — especially against
+// the dark `--card` token — the same card ends up looking different in each
+// browser. Pinning the colour to a literal hex (no `/N`, no @supports
+// override) keeps all browsers on the same sRGB path and therefore the same
+// visual result.
 const INSIGHT_STYLES = {
   border: "border-blue-200 dark:border-blue-900",
-  bg: "bg-blue-50/50 dark:bg-blue-950/30",
+  bg: "bg-[#eff6ff80] dark:bg-[#1624564d]",
   icon: "text-blue-500",
 };
 
@@ -38,21 +50,21 @@ const ANOMALY_STYLES: Record<
 > = {
   low: {
     border: "border-yellow-200 dark:border-yellow-900",
-    bg: "bg-yellow-50/50 dark:bg-yellow-950/30",
+    bg: "bg-[#fefce880] dark:bg-[#4320044d]",
     icon: "text-yellow-500",
     badge:
       "bg-yellow-100 text-yellow-700 dark:bg-yellow-900/50 dark:text-yellow-400",
   },
   medium: {
     border: "border-orange-200 dark:border-orange-900",
-    bg: "bg-orange-50/50 dark:bg-orange-950/30",
+    bg: "bg-[#fff7ed80] dark:bg-[#4413064d]",
     icon: "text-orange-500",
     badge:
       "bg-orange-100 text-orange-700 dark:bg-orange-900/50 dark:text-orange-400",
   },
   high: {
     border: "border-red-200 dark:border-red-900",
-    bg: "bg-red-50/50 dark:bg-red-950/30",
+    bg: "bg-[#fef2f280] dark:bg-[#4608094d]",
     icon: "text-red-500",
     badge: "bg-red-100 text-red-700 dark:bg-red-900/50 dark:text-red-400",
   },

From 8b2ee5553c1ad68a37d0f14d804ec35fee7aa2a2 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Fri, 24 Apr 2026 18:09:55 +0200
Subject: [PATCH 36/46] fix(playground): gate Tailwind dark: variant on the
 theme class
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

appkit-ui's globals.css already defines dark-theme tokens via two paths
— an explicit `.dark` class on <html>, and `@media (prefers-color-scheme:
dark)` guarded by `:root:not(.light)` so an explicit `.light` class
wins. Tailwind v4's default `dark:` variant, however, is purely media
driven. That mismatch shows up when the user forces light via the
playground's theme selector while their OS is in dark mode: the
bootstrap script sets `<html class="light">`, --card/--background
correctly resolve to light, but every `dark:*` utility keeps firing
under the media query — cards end up painted with dark-mode
backgrounds layered under light-mode chrome.

Declare a playground-local `@custom-variant dark` that mirrors the
token logic exactly: fire when the element is (or descends from)
`.dark`, or when `prefers-color-scheme: dark` matches and the element
neither is nor descends from `.light`. This rebinds every `dark:*`
utility to respect the theme selector's forced choice, keeping the rest
of appkit-ui's consumers — which don't ship the bootstrap script — on
the existing media-only behaviour.
---
 apps/dev-playground/client/src/index.css | 39 ++++++++++++++++++++++++
 1 file changed, 39 insertions(+)

diff --git a/apps/dev-playground/client/src/index.css b/apps/dev-playground/client/src/index.css
index 5dcc4cf86..b5389ab8c 100644
--- a/apps/dev-playground/client/src/index.css
+++ b/apps/dev-playground/client/src/index.css
@@ -1 +1,40 @@
 @import "@databricks/appkit-ui/styles.css";
+
+/**
+ * Realign Tailwind v4's `dark:` variant with appkit-ui's theme tokens.
+ *
+ * `packages/appkit-ui/.../globals.css` defines two paths into dark theme:
+ *   - An explicit `.dark` class on <html> (wins unconditionally).
+ *   - `@media (prefers-color-scheme: dark)` on `:root:not(.light)` — i.e.
+ *     the media query is ignored when the user has explicitly opted into
+ *     light via the `.light` class.
+ *
+ * Tailwind v4's default `dark:` variant, however, is purely media-query
+ * driven. That mismatch produces a split-personality theme in exactly one
+ * scenario, which is the one we hit: OS set to dark, user forces light
+ * via the theme selector (bootstrap script in index.html sets
+ * `<html class="light">`). `--card`, `--background`, etc. correctly
+ * resolve to light, but every `dark:*` utility keeps firing under the
+ * media query — cards end up with dark-mode backgrounds layered under
+ * light-mode text and chrome.
+ *
+ * This `@custom-variant dark` rebinds the variant to mirror the token
+ * logic exactly:
+ *   - Element is (or descends from) `.dark`      → dark utilities fire.
+ *   - `prefers-color-scheme: dark` AND no `.light` ancestor → also fire.
+ *   - Everything else                            → no-op.
+ *
+ * Scoped to the playground because the bootstrap script in index.html is
+ * what makes the `.light` / `.dark` classes meaningful here; other
+ * appkit-ui consumers may rely on the current media-only behaviour.
+ */
+@custom-variant dark {
+  &:where(.dark, .dark *) {
+    @slot;
+  }
+  @media (prefers-color-scheme: dark) {
+    &:where(:not(.light):not(.light *)) {
+      @slot;
+    }
+  }
+}

From fb49ee59462f3b692c02118e23e6e638407f8cf7 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Mon, 27 Apr 2026 10:54:59 +0200
Subject: [PATCH 37/46] fix(playground): stop streaming chat bubbles from
 pulsing
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The streaming-message bubble in the smart-dashboard chat drawer used
`animate-pulse` while tokens arrived. The constant fade in/out reads
as visual noise when the agent is mid-stream — especially with longer
replies where it pulses for many seconds. Drop the animation; the
ellipsis placeholder still communicates the loading state for empty
streaming bubbles.
---
 .../src/features/smart-dashboard/components/chat-drawer.tsx     | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/apps/dev-playground/client/src/features/smart-dashboard/components/chat-drawer.tsx b/apps/dev-playground/client/src/features/smart-dashboard/components/chat-drawer.tsx
index 4c5196489..559f5950d 100644
--- a/apps/dev-playground/client/src/features/smart-dashboard/components/chat-drawer.tsx
+++ b/apps/dev-playground/client/src/features/smart-dashboard/components/chat-drawer.tsx
@@ -239,7 +239,7 @@ function MessageBubble({ message }: { message: ChatMessage }) {
           isUser
             ? "bg-primary text-primary-foreground rounded-br-sm"
             : "bg-muted text-foreground rounded-bl-sm"
-        } ${message.streaming ? "animate-pulse" : ""}`}
+        }`}
       >
         {message.content || (message.streaming ? "…" : "")}
       </div>

From b8be1476b41be8b8d138fb5c8f01b4f9eee4fd2b Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Mon, 27 Apr 2026 15:27:52 +0200
Subject: [PATCH 38/46] chore(playground): migrate dev-playground server to
 onPluginsReady
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

`createApp({ plugins: [server({ autoStart: false }), ...] }).then((appkit) =>
appkit.server.extend(...).start())` is gone — `createApp` now orchestrates
server start itself, with the post-setup hook surfaced as the
`onPluginsReady` config callback.

Drop `autoStart: false`, hoist the `extend` block from the trailing
`.then` chain into `onPluginsReady`, and terminate the now otherwise
unobserved `createApp(...)` promise with `.catch(console.error)` so a
startup rejection is logged instead of going unhandled.

Tracks #280 / #291 (autoStart removal + on-plugins-ready codemod).
---
 apps/dev-playground/server/index.ts | 13 ++++++-------
 1 file changed, 6 insertions(+), 7 deletions(-)

diff --git a/apps/dev-playground/server/index.ts b/apps/dev-playground/server/index.ts
index b440c4760..c3ac957c1 100644
--- a/apps/dev-playground/server/index.ts
+++ b/apps/dev-playground/server/index.ts
@@ -330,7 +330,7 @@ const dashboard_pilot = createAgent({
 
 createApp({
   plugins: [
-    server({ autoStart: false }),
+    server(),
     reconnect(),
     telemetryExamples(),
     analytics({}),
@@ -385,9 +385,8 @@ createApp({
     // }),
   ],
   ...(process.env.APPKIT_E2E_TEST && { client: createMockClient() }),
-}).then((appkit) => {
-  appkit.server
-    .extend((app) => {
+  async onPluginsReady(appkit) {
+    appkit.server.extend((app) => {
       app.get("/sp", (_req, res) => {
         appkit.analytics
           .query("SELECT * FROM samples.nyctaxi.trips;")
@@ -681,9 +680,9 @@ createApp({
           res.status(404).json({ error: msg });
         }
       });
-    })
-    .start();
-});
+    });
+  },
+}).catch(console.error);
 
 /**
  * Heuristic match for Databricks Files API's "directory not found" error.

From 137d12a274a53013999bcb44bcb8c11b361992cf Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Wed, 29 Apr 2026 18:52:35 +0200
Subject: [PATCH 39/46] feat(template): scaffold a working starter agent
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Selecting `agents` in `databricks apps init` previously produced an
app that booted, logged "No agents registered.", and rendered no UI for
the plugin. Fixes that by scaffolding two starter agents (one markdown,
one code-defined) and a chat surface, gated on `{{if .plugins.agents}}`.

Added:
- template/config/agents/assistant/agent.md — markdown agent, default,
  no tools. Demonstrates the declarative form.
- template/server/agents/helper.ts — code-defined agent via
  createAgent({...}) with two inline tool({...}) definitions:
  current_time (returns ISO timestamp) and count_words. Tools are pure
  JS so the demo works regardless of which other plugins were selected
  at scaffold time.
- template/client/src/pages/agents/AgentChat.tsx — minimal SSE consumer
  for /api/agents/chat with an agent picker, streaming text bubbles,
  and inline tool-call rows. Hand-rolled because @databricks/appkit-ui
  doesn't yet ship a generic agent chat primitive — replace with one
  when it lands.

Modified:
- template/server/server.ts: when {{if .plugins.agents}}, imports the
  helper agent and wires it as agents({ agents: { helper } }) instead
  of bare agents(). The markdown 'assistant' loads automatically from
  config/agents/.
- template/client/src/App.tsx: conditional NavLink + route entry,
  mirroring the analytics/files/etc. blocks.

End-to-end shape after init with --features agents:
- GET /api/agents/info returns { agents: ['assistant', 'helper'],
  defaultAgent: 'assistant' }
- /agents page renders chat with picker
- 'what time is it?' to helper triggers a current_time tool round-trip
- 'count words in: the quick brown fox' triggers count_words → 4

The serving-endpoint resource (DATABRICKS_SERVING_ENDPOINT_NAME) is
already declared in template/appkit.plugins.json from PR 4, so the CLI
prompts for an endpoint when agents is selected.
---
 template/client/src/App.tsx                   |  11 +
 .../client/src/pages/agents/AgentChat.tsx     | 269 ++++++++++++++++++
 template/config/agents/assistant/agent.md     |  17 ++
 template/server/agents/helper.ts              |  44 +++
 template/server/server.ts                     |   7 +
 5 files changed, 348 insertions(+)
 create mode 100644 template/client/src/pages/agents/AgentChat.tsx
 create mode 100644 template/config/agents/assistant/agent.md
 create mode 100644 template/server/agents/helper.ts

diff --git a/template/client/src/App.tsx b/template/client/src/App.tsx
index 5510bb805..4b86eb557 100644
--- a/template/client/src/App.tsx
+++ b/template/client/src/App.tsx
@@ -5,6 +5,9 @@ import {
   CardHeader,
   CardTitle,
 } from '@databricks/appkit-ui/react';
+{{- if .plugins.agents}}
+import { AgentChat } from './pages/agents/AgentChat';
+{{- end}}
 {{- if .plugins.analytics}}
 import { AnalyticsPage } from './pages/analytics/AnalyticsPage';
 {{- end}}
@@ -43,6 +46,11 @@ function Layout() {
           <NavLink to="/" end className={navLinkClass}>
             Home
           </NavLink>
+{{- if .plugins.agents}}
+          <NavLink to="/agents" className={navLinkClass}>
+            Agents
+          </NavLink>
+{{- end}}
 {{- if .plugins.analytics}}
           <NavLink to="/analytics" className={navLinkClass}>
             Analytics
@@ -93,6 +101,9 @@ const router = createBrowserRouter([
     element: <Layout />,
     children: [
       { path: '/', element: <HomePage /> },
+{{- if .plugins.agents}}
+      { path: '/agents', element: <AgentChat /> },
+{{- end}}
 {{- if .plugins.analytics}}
       { path: '/analytics', element: <AnalyticsPage /> },
 {{- end}}
diff --git a/template/client/src/pages/agents/AgentChat.tsx b/template/client/src/pages/agents/AgentChat.tsx
new file mode 100644
index 000000000..40cfbea78
--- /dev/null
+++ b/template/client/src/pages/agents/AgentChat.tsx
@@ -0,0 +1,269 @@
+{{if .plugins.agents -}}
+import { useEffect, useRef, useState } from 'react';
+import {
+  Button,
+  Card,
+  CardContent,
+  Input,
+} from '@databricks/appkit-ui/react';
+
+interface Message {
+  id: string;
+  role: 'user' | 'assistant' | 'tool';
+  content: string;
+  toolName?: string;
+}
+
+interface AgentInfo {
+  agents: string[];
+  defaultAgent: string | null;
+}
+
+/**
+ * Minimal chat surface for the `agents` plugin.
+ *
+ * - Lists registered agents from `GET /api/agents/info` and lets the user
+ *   pick one (markdown `assistant` from `config/agents/assistant/agent.md`
+ *   and code-defined `helper` from `server/agents/helper.ts`).
+ * - Sends turns to `POST /api/agents/chat` and consumes the SSE stream
+ *   the agents plugin emits (Responses-API shape).
+ * - Renders streaming assistant text incrementally and surfaces tool
+ *   calls as separate inline rows.
+ *
+ * Replace this with `<GenieChat>`-style components when AppKit ships a
+ * first-class agent chat primitive in `@databricks/appkit-ui/react`.
+ */
+export function AgentChat() {
+  const [agents, setAgents] = useState<string[]>([]);
+  const [selectedAgent, setSelectedAgent] = useState<string | null>(null);
+  const [threadId, setThreadId] = useState<string | null>(null);
+  const [messages, setMessages] = useState<Message[]>([]);
+  const [input, setInput] = useState('');
+  const [streaming, setStreaming] = useState(false);
+  const [error, setError] = useState<string | null>(null);
+  const scrollRef = useRef<HTMLDivElement | null>(null);
+
+  useEffect(() => {
+    fetch('/api/agents/info')
+      .then((res) => {
+        if (!res.ok) throw new Error(`agents info failed: ${res.statusText}`);
+        return res.json() as Promise<AgentInfo>;
+      })
+      .then((info) => {
+        setAgents(info.agents);
+        setSelectedAgent(info.defaultAgent ?? info.agents[0] ?? null);
+      })
+      .catch((err) =>
+        setError(err instanceof Error ? err.message : 'Failed to load agents'),
+      );
+  }, []);
+
+  useEffect(() => {
+    scrollRef.current?.scrollTo({ top: scrollRef.current.scrollHeight });
+  }, [messages]); // re-run on every transcript change so the view follows new rows and streamed deltas
+
+  const send = async (e: React.FormEvent) => { // form submit: post one turn and stream the SSE reply into state
+    e.preventDefault();
+    const message = input.trim();
+    if (!message || streaming || !selectedAgent) return; // nothing to send, a turn is in flight, or no agent yet
+
+    setError(null);
+    setInput('');
+    setStreaming(true);
+
+    const userMsg: Message = {
+      id: `u-${Date.now()}`,
+      role: 'user',
+      content: message,
+    };
+    const assistantId = `a-${Date.now()}`; // id of the empty placeholder bubble that deltas are appended to
+    setMessages((prev) => [
+      ...prev,
+      userMsg,
+      { id: assistantId, role: 'assistant', content: '' },
+    ]);
+
+    try {
+      const res = await fetch('/api/agents/chat', {
+        method: 'POST',
+        headers: { 'Content-Type': 'application/json' },
+        body: JSON.stringify({
+          message,
+          agent: selectedAgent,
+          threadId: threadId ?? undefined, // undefined is dropped by JSON.stringify, so the first turn sends no threadId
+        }),
+      });
+      if (!res.ok || !res.body) {
+        throw new Error(`chat failed: ${res.status} ${res.statusText}`);
+      }
+
+      const reader = res.body.getReader();
+      const decoder = new TextDecoder();
+      let buf = ''; // undelivered tail of the stream; may end mid-event
+
+      while (true) {
+        const { done, value } = await reader.read();
+        if (done) break; // anything still in buf without a trailing blank line is discarded
+        buf += decoder.decode(value, { stream: true });
+
+        // Events are split on '\n\n' only (no '\r\n' handling). Drain whole events from buf.
+        let idx;
+        while ((idx = buf.indexOf('\n\n')) !== -1) {
+          const raw = buf.slice(0, idx);
+          buf = buf.slice(idx + 2);
+          const dataLine = raw
+            .split('\n')
+            .find((l) => l.startsWith('data:')); // only the first data: line of an event is read
+          if (!dataLine) continue;
+          const json = dataLine.slice(5).trim();
+          if (!json) continue;
+          try {
+            handleEvent(JSON.parse(json), assistantId);
+          } catch {
+            // Skip this event: swallows JSON.parse failures and anything handleEvent throws.
+          }
+        }
+      }
+    } catch (err) {
+      setError(err instanceof Error ? err.message : 'Chat error');
+    } finally {
+      setStreaming(false);
+    }
+  };
+
+  function handleEvent(ev: unknown, assistantId: string) { // apply one parsed SSE payload to component state
+    if (!ev || typeof ev !== 'object') return; // non-object payloads are ignored
+    const e = ev as Record<string, unknown>;
+
+    if (e.type === 'appkit.metadata') {
+      const data = e.data as { threadId?: string } | undefined;
+      if (data?.threadId) setThreadId(data.threadId); // kept so the next send() posts it as threadId
+      return;
+    }
+
+    if (e.type === 'response.output_text.delta') {
+      const delta = (e.delta as string | undefined) ?? '';
+      setMessages((prev) =>
+        prev.map((m) =>
+          m.id === assistantId ? { ...m, content: m.content + delta } : m, // append to this turn's placeholder bubble
+        ),
+      );
+      return;
+    }
+
+    if (e.type === 'response.output_item.added') {
+      const item = e.item as
+        | { type: string; name?: string; arguments?: string }
+        | undefined;
+      if (item?.type === 'function_call' && item.name) { // other item types add no row
+        setMessages((prev) => [
+          ...prev,
+          {
+            id: `t-${Date.now()}-${Math.random()}`,
+            role: 'tool',
+            toolName: item.name,
+            content: item.arguments ?? '',
+          },
+        ]);
+      }
+    }
+  } // any other event type falls through with no state change
+
+  return (
+    <div className="space-y-6 w-full max-w-4xl mx-auto">
+      <div className="flex items-end justify-between gap-4">
+        <div>
+          <h2 className="text-2xl font-bold text-foreground">Agents</h2>
+          <p className="text-sm text-muted-foreground mt-1">
+            Chat with a registered agent. Markdown agents come from
+            <code className="mx-1">config/agents/</code>; code-defined
+            agents are wired in <code className="mx-1">server/server.ts</code>.
+          </p>
+        </div>
+        {agents.length > 0 && (
+          <div className="flex gap-2">
+            {agents.map((name) => (
+              <Button
+                key={name}
+                variant={selectedAgent === name ? 'default' : 'outline'}
+                size="sm"
+                onClick={() => {
+                  setSelectedAgent(name);
+                  setThreadId(null);
+                  setMessages([]);
+                }}
+              >
+                {name}
+              </Button>
+            ))}
+          </div>
+        )}
+      </div>
+
+      <Card className="h-[600px] flex flex-col">
+        <CardContent className="flex-1 overflow-y-auto p-4 space-y-3" ref={scrollRef}>
+          {messages.length === 0 && (
+            <p className="text-sm text-muted-foreground text-center mt-8">
+              Start the conversation. Try asking <code>helper</code> "what
+              time is it?" or "count the words in: the quick brown fox".
+            </p>
+          )}
+          {messages.map((m) => {
+            if (m.role === 'tool') {
+              return (
+                <div
+                  key={m.id}
+                  className="text-xs font-mono text-muted-foreground border-l-2 border-primary/50 pl-3"
+                >
+                  <span className="font-semibold">tool · {m.toolName}</span>
+                  {m.content ? <span className="ml-2">{m.content}</span> : null}
+                </div>
+              );
+            }
+            return (
+              <div
+                key={m.id}
+                className={`p-3 rounded-md ${
+                  m.role === 'user'
+                    ? 'bg-primary/10 ml-12'
+                    : 'bg-muted mr-12'
+                }`}
+              >
+                <div className="text-xs text-muted-foreground mb-1">
+                  {m.role}
+                </div>
+                <div className="whitespace-pre-wrap text-sm">
+                  {m.content || (streaming ? '…' : '')}
+                </div>
+              </div>
+            );
+          })}
+        </CardContent>
+
+        <form onSubmit={send} className="p-3 border-t flex gap-2">
+          <Input
+            value={input}
+            onChange={(e) => setInput(e.target.value)}
+            placeholder={
+              selectedAgent
+                ? `Message ${selectedAgent}…`
+                : 'Loading agents…'
+            }
+            disabled={!selectedAgent || streaming}
+          />
+          <Button
+            type="submit"
+            disabled={!input.trim() || !selectedAgent || streaming}
+          >
+            {streaming ? 'Sending…' : 'Send'}
+          </Button>
+        </form>
+      </Card>
+
+      {error && (
+        <div className="text-sm text-destructive">Error: {error}</div>
+      )}
+    </div>
+  );
+}
+{{- end}}
diff --git a/template/config/agents/assistant/agent.md b/template/config/agents/assistant/agent.md
new file mode 100644
index 000000000..65a5d5f40
--- /dev/null
+++ b/template/config/agents/assistant/agent.md
@@ -0,0 +1,17 @@
+{{if .plugins.agents -}}
+---
+default: true
+---
+
+You are a helpful assistant for this Databricks application.
+
+Greet the user briefly when the conversation starts. Answer questions
+about how to use this app, what it can do, and how the code is laid out.
+Keep replies short and direct. If the user asks something you don't know,
+say so plainly.
+
+You don't have any tools beyond plain conversation. If the user asks for
+a calculation or a side-effect (e.g. "what time is it?", "count the
+words in this sentence"), tell them the `helper` agent can do that and
+they can switch agents from the chat picker.
+{{- end}}
diff --git a/template/server/agents/helper.ts b/template/server/agents/helper.ts
new file mode 100644
index 000000000..005fdbcdf
--- /dev/null
+++ b/template/server/agents/helper.ts
@@ -0,0 +1,44 @@
+{{if .plugins.agents -}}
+import { createAgent, tool } from '@databricks/appkit';
+import { z } from 'zod';
+
+/**
+ * Code-defined agent: showcases the imperative `createAgent({...})` form
+ * with inline `tool({...})` definitions.
+ *
+ * Tools here are intentionally dependency-free (no SQL warehouse, no
+ * volumes, no external APIs) so this template demos the tool-calling
+ * round-trip even when no other plugin is selected at scaffold time.
+ *
+ * The companion markdown agent at `config/agents/assistant/agent.md`
+ * shows the declarative form for prose-only agents.
+ */
+export const helper = createAgent({
+  name: 'helper',
+  instructions: [
+    'You are a tool-using helper agent.',
+    'When the user asks about the time, call `current_time`.',
+    'When the user asks to count words in a string, call `count_words`.',
+    'For anything else, answer briefly in plain text.',
+  ].join(' '),
+  tools: {
+    current_time: tool({
+      description: 'Returns the current server time as an ISO 8601 timestamp.',
+      schema: z.object({}),
+      annotations: { effect: 'read' },
+      execute: () => ({ now: new Date().toISOString() }),
+    }),
+    count_words: tool({
+      description: 'Counts the words in a string. Words are runs of non-whitespace.',
+      schema: z.object({
+        text: z.string().describe('The text to count words in.'),
+      }),
+      annotations: { effect: 'read' },
+      execute: ({ text }) => ({
+        text,
+        word_count: text.trim().split(/\s+/).filter(Boolean).length,
+      }),
+    }),
+  },
+});
+{{- end}}
diff --git a/template/server/server.ts b/template/server/server.ts
index b33bb94d8..47f8f9c1c 100644
--- a/template/server/server.ts
+++ b/template/server/server.ts
@@ -15,11 +15,18 @@ import { {{$betaImports}} } from '@databricks/appkit/beta';
 {{- if .plugins.lakebase}}
 import { setupSampleLakebaseRoutes } from './routes/lakebase/todo-routes';
 {{- end}}
+{{- if .plugins.agents}}
+import { helper } from './agents/helper';
+{{- end}}
 
 createApp({
   plugins: [
 {{- range $name, $_ := .plugins}}
+{{- if eq $name "agents"}}
+    agents({ agents: { helper } }),
+{{- else}}
     {{$name}}(),
+{{- end}}
 {{- end}}
   ],
 {{- if .plugins.lakebase}}

From cefe28d06eb5870b858a529bb3bcacdd9c4f60de Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Mon, 4 May 2026 13:05:09 +0200
Subject: [PATCH 40/46] fix(playground, template): import agents from
 @databricks/appkit/beta

agents, createAgent, fromPlugin, tool and all agent-related exports
are now under the beta subpath. Update the dev-playground server and
the template helper to import from @databricks/appkit/beta.
---
 apps/dev-playground/server/index.ts | 5 +----
 template/server/agents/helper.ts    | 2 +-
 2 files changed, 2 insertions(+), 5 deletions(-)

diff --git a/apps/dev-playground/server/index.ts b/apps/dev-playground/server/index.ts
index c3ac957c1..d4b7bb7a7 100644
--- a/apps/dev-playground/server/index.ts
+++ b/apps/dev-playground/server/index.ts
@@ -1,19 +1,16 @@
 import "reflect-metadata";
 import {
-  agents,
   analytics,
-  createAgent,
   createApp,
   type FilePolicy,
   files,
-  fromPlugin,
   genie,
   PolicyDeniedError,
   server,
   serving,
-  tool,
   WRITE_ACTIONS,
 } from "@databricks/appkit";
+import { agents, createAgent, fromPlugin, tool } from "@databricks/appkit/beta";
 import { WorkspaceClient } from "@databricks/sdk-experimental";
 import { z } from "zod";
 import { lakebaseExamples } from "./lakebase-examples-plugin";
diff --git a/template/server/agents/helper.ts b/template/server/agents/helper.ts
index 005fdbcdf..aa3303b41 100644
--- a/template/server/agents/helper.ts
+++ b/template/server/agents/helper.ts
@@ -1,5 +1,5 @@
 {{if .plugins.agents -}}
-import { createAgent, tool } from '@databricks/appkit';
+import { createAgent, tool } from '@databricks/appkit/beta';
 import { z } from 'zod';
 
 /**

From c43aacfb2a330e82b8ab54c3bcb09610eeb07c9a Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Mon, 4 May 2026 18:47:21 +0200
Subject: [PATCH 41/46] docs: beta agents banner, template stability, and
 unified typedoc entry

- Document agents as beta in docs and set stability in app template manifest
- Point Docusaurus Typedoc at typedoc.entry.ts so stable + beta APIs publish
  together (fixes agent symbol pages being dropped from index-only builds)
- Regenerate api/appkit index and sidebar; knip-ignore docs-only entry file

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 .../appkit/Interface.AgentsPluginConfig.md    |  4 +-
 .../Interface.AutoInheritToolsConfig.md       | 30 +++++++++
 .../api/appkit/Interface.BasePluginConfig.md  |  2 +-
 .../appkit/Interface.LakebasePoolConfig.md    |  2 +-
 .../api/appkit/Interface.RegisteredAgent.md   | 67 +++++++++++++++++++
 .../api/appkit/Interface.ToolAnnotations.md   | 55 +++++++++++++++
 .../api/appkit/TypeAlias.ResolvedToolEntry.md | 28 ++++++++
 docs/docs/api/appkit/index.md                 |  8 ++-
 docs/docs/api/appkit/typedoc-sidebar.ts       | 20 ++++++
 docs/docs/plugins/agents.md                   |  6 ++
 docs/docusaurus.config.ts                     |  2 +-
 knip.json                                     |  1 +
 packages/appkit/src/typedoc.entry.ts          |  9 +++
 template/appkit.plugins.json                  |  3 +-
 14 files changed, 230 insertions(+), 7 deletions(-)
 create mode 100644 docs/docs/api/appkit/Interface.AutoInheritToolsConfig.md
 create mode 100644 docs/docs/api/appkit/Interface.RegisteredAgent.md
 create mode 100644 docs/docs/api/appkit/Interface.ToolAnnotations.md
 create mode 100644 docs/docs/api/appkit/TypeAlias.ResolvedToolEntry.md
 create mode 100644 packages/appkit/src/typedoc.entry.ts

diff --git a/docs/docs/api/appkit/Interface.AgentsPluginConfig.md b/docs/docs/api/appkit/Interface.AgentsPluginConfig.md
index e4d30fb22..916266d79 100644
--- a/docs/docs/api/appkit/Interface.AgentsPluginConfig.md
+++ b/docs/docs/api/appkit/Interface.AgentsPluginConfig.md
@@ -60,7 +60,9 @@ Milliseconds to wait before auto-denying. Default: 60_000.
 ### autoInheritTools?
 
 ```ts
-optional autoInheritTools: boolean | AutoInheritToolsConfig;
+optional autoInheritTools: 
+  | boolean
+  | AutoInheritToolsConfig;
 ```
 
 Whether to auto-inherit every ToolProvider plugin's toolkit. Accepts a boolean shorthand.
diff --git a/docs/docs/api/appkit/Interface.AutoInheritToolsConfig.md b/docs/docs/api/appkit/Interface.AutoInheritToolsConfig.md
new file mode 100644
index 000000000..4e42b68ce
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.AutoInheritToolsConfig.md
@@ -0,0 +1,30 @@
+# Interface: AutoInheritToolsConfig
+
+Auto-inherit configuration. When enabled for a given agent origin, agents
+with no explicit `tools:` declaration receive every registered ToolProvider
+plugin tool whose author marked `autoInheritable: true`. Tools without that
+flag — destructive, state-mutating, or privilege-sensitive — never spread
+automatically and must be wired via `tools:`, `toolkits:`, or `fromPlugin`.
+
+Defaults are `false` for both origins (safe-by-default): developers must
+consciously opt an origin in to any auto-inherit behaviour.
+
+## Properties
+
+### code?
+
+```ts
+optional code: boolean;
+```
+
+Default for code-defined agents (via `agents: { foo: createAgent(...) }`). Default: `false`.
+
+***
+
+### file?
+
+```ts
+optional file: boolean;
+```
+
+Default for agents loaded from markdown files. Default: `false`.
diff --git a/docs/docs/api/appkit/Interface.BasePluginConfig.md b/docs/docs/api/appkit/Interface.BasePluginConfig.md
index 653df68ce..797c2c7d5 100644
--- a/docs/docs/api/appkit/Interface.BasePluginConfig.md
+++ b/docs/docs/api/appkit/Interface.BasePluginConfig.md
@@ -4,8 +4,8 @@ Base configuration interface for AppKit plugins
 
 ## Extended by
 
-- [`AgentsPluginConfig`](Interface.AgentsPluginConfig.md)
 - [`IJobsConfig`](Interface.IJobsConfig.md)
+- [`AgentsPluginConfig`](Interface.AgentsPluginConfig.md)
 
 ## Indexable
 
diff --git a/docs/docs/api/appkit/Interface.LakebasePoolConfig.md b/docs/docs/api/appkit/Interface.LakebasePoolConfig.md
index 3f40f3021..e75c457b4 100644
--- a/docs/docs/api/appkit/Interface.LakebasePoolConfig.md
+++ b/docs/docs/api/appkit/Interface.LakebasePoolConfig.md
@@ -76,7 +76,7 @@ const pool = createLakebasePool({
 ### sslMode?
 
 ```ts
-optional sslMode: "require" | "disable" | "prefer";
+optional sslMode: "disable" | "require" | "prefer";
 ```
 
 SSL mode for the connection (convenience helper)
diff --git a/docs/docs/api/appkit/Interface.RegisteredAgent.md b/docs/docs/api/appkit/Interface.RegisteredAgent.md
new file mode 100644
index 000000000..ead127e6e
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.RegisteredAgent.md
@@ -0,0 +1,67 @@
+# Interface: RegisteredAgent
+
+## Properties
+
+### adapter
+
+```ts
+adapter: AgentAdapter;
+```
+
+***
+
+### baseSystemPrompt?
+
+```ts
+optional baseSystemPrompt: BaseSystemPromptOption;
+```
+
+***
+
+### ephemeral?
+
+```ts
+optional ephemeral: boolean;
+```
+
+Mirrors `AgentDefinition.ephemeral` — skip thread persistence.
+
+***
+
+### instructions
+
+```ts
+instructions: string;
+```
+
+***
+
+### maxSteps?
+
+```ts
+optional maxSteps: number;
+```
+
+***
+
+### maxTokens?
+
+```ts
+optional maxTokens: number;
+```
+
+***
+
+### name
+
+```ts
+name: string;
+```
+
+***
+
+### toolIndex
+
+```ts
+toolIndex: Map<string, ResolvedToolEntry>;
+```
diff --git a/docs/docs/api/appkit/Interface.ToolAnnotations.md b/docs/docs/api/appkit/Interface.ToolAnnotations.md
new file mode 100644
index 000000000..39fbecff6
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.ToolAnnotations.md
@@ -0,0 +1,55 @@
+# Interface: ToolAnnotations
+
+## Properties
+
+### ~~destructive?~~
+
+```ts
+optional destructive: boolean;
+```
+
+#### Deprecated
+
+Prefer [effect](#effect) with value `"destructive"`. Retained
+so existing annotations continue to force the approval gate, and so
+MCP-style consumers that only read `destructive` still see the hint.
+
+***
+
+### effect?
+
+```ts
+optional effect: ToolEffect;
+```
+
+Preferred semantic label. When set, drives both the approval gate (fires
+for `write`/`update`/`destructive`) and the approval-card styling.
+
+***
+
+### idempotent?
+
+```ts
+optional idempotent: boolean;
+```
+
+***
+
+### ~~readOnly?~~
+
+```ts
+optional readOnly: boolean;
+```
+
+#### Deprecated
+
+Prefer [effect](#effect). Retained for backward compatibility
+with tools authored against the original flags and for MCP interop.
+
+***
+
+### requiresUserContext?
+
+```ts
+optional requiresUserContext: boolean;
+```
diff --git a/docs/docs/api/appkit/TypeAlias.ResolvedToolEntry.md b/docs/docs/api/appkit/TypeAlias.ResolvedToolEntry.md
new file mode 100644
index 000000000..e97b3ef97
--- /dev/null
+++ b/docs/docs/api/appkit/TypeAlias.ResolvedToolEntry.md
@@ -0,0 +1,28 @@
+# Type Alias: ResolvedToolEntry
+
+```ts
+type ResolvedToolEntry = 
+  | {
+  def: AgentToolDefinition;
+  localName: string;
+  pluginName: string;
+  source: "toolkit";
+}
+  | {
+  def: AgentToolDefinition;
+  functionTool: FunctionTool;
+  source: "function";
+}
+  | {
+  def: AgentToolDefinition;
+  mcpToolName: string;
+  source: "mcp";
+}
+  | {
+  agentName: string;
+  def: AgentToolDefinition;
+  source: "subagent";
+};
+```
+
+Internal tool-index entry after a tool record has been resolved to a dispatchable form.
diff --git a/docs/docs/api/appkit/index.md b/docs/docs/api/appkit/index.md
index 5b273e690..0470b6d2b 100644
--- a/docs/docs/api/appkit/index.md
+++ b/docs/docs/api/appkit/index.md
@@ -1,7 +1,7 @@
 # @databricks/appkit
 
-Core library for building Databricks applications with type-safe SQL queries,
-plugin architecture, and React integration.
+Documentation merge entry for Typedoc — combines the stable `@databricks/appkit`
+surface with `@databricks/appkit/beta`. Not meant for application imports.
 
 ## Enumerations
 
@@ -37,6 +37,7 @@ plugin architecture, and React integration.
 | [AgentRunContext](Interface.AgentRunContext.md) | - |
 | [AgentsPluginConfig](Interface.AgentsPluginConfig.md) | Base configuration interface for AppKit plugins |
 | [AgentToolDefinition](Interface.AgentToolDefinition.md) | - |
+| [AutoInheritToolsConfig](Interface.AutoInheritToolsConfig.md) | Auto-inherit configuration. When enabled for a given agent origin, agents with no explicit `tools:` declaration receive every registered ToolProvider plugin tool whose author marked `autoInheritable: true`. Tools without that flag — destructive, state-mutating, or privilege-sensitive — never spread automatically and must be wired via `tools:`, `toolkits:`, or `fromPlugin`. |
 | [BasePluginConfig](Interface.BasePluginConfig.md) | Base configuration interface for AppKit plugins |
 | [CacheConfig](Interface.CacheConfig.md) | Configuration for the CacheInterceptor. Controls TTL, size limits, storage backend, and probabilistic cleanup. |
 | [DatabaseCredential](Interface.DatabaseCredential.md) | Database credentials with OAuth token for Postgres connection |
@@ -55,6 +56,7 @@ plugin architecture, and React integration.
 | [Message](Interface.Message.md) | - |
 | [PluginManifest](Interface.PluginManifest.md) | Plugin manifest that declares metadata and resource requirements. Attached to plugin classes as a static property. Extends the shared PluginManifest with strict resource types. |
 | [PromptContext](Interface.PromptContext.md) | Context passed to `baseSystemPrompt` callbacks. |
+| [RegisteredAgent](Interface.RegisteredAgent.md) | - |
 | [RequestedClaims](Interface.RequestedClaims.md) | Optional claims for fine-grained Unity Catalog table permissions When specified, the returned token will be scoped to only the requested tables |
 | [RequestedResource](Interface.RequestedResource.md) | Resource to request permissions for in Unity Catalog |
 | [ResourceEntry](Interface.ResourceEntry.md) | Internal representation of a resource in the registry. Extends ResourceRequirement with resolution state and plugin ownership. |
@@ -68,6 +70,7 @@ plugin architecture, and React integration.
 | [TelemetryConfig](Interface.TelemetryConfig.md) | OpenTelemetry configuration for AppKit applications |
 | [Thread](Interface.Thread.md) | - |
 | [ThreadStore](Interface.ThreadStore.md) | - |
+| [ToolAnnotations](Interface.ToolAnnotations.md) | - |
 | [ToolConfig](Interface.ToolConfig.md) | - |
 | [ToolkitEntry](Interface.ToolkitEntry.md) | A tool reference produced by a plugin's `.toolkit()` call. The agents plugin recognizes the `__toolkitRef` brand and dispatches tool invocations through `PluginContext.executeTool(req, pluginName, localName, ...)`, preserving OBO (asUser) and telemetry spans. |
 | [ToolkitOptions](Interface.ToolkitOptions.md) | - |
@@ -91,6 +94,7 @@ plugin architecture, and React integration.
 | [JobHandle](TypeAlias.JobHandle.md) | Job handle returned by `appkit.jobs("etl")`. Supports OBO access via `.asUser(req)`. |
 | [JobsExport](TypeAlias.JobsExport.md) | Public API shape of the jobs plugin. Callable to select a job by key. |
 | [PluginData](TypeAlias.PluginData.md) | Tuple of plugin class, config, and name. Created by `toPlugin()` and passed to `createApp()`. |
+| [ResolvedToolEntry](TypeAlias.ResolvedToolEntry.md) | Internal tool-index entry after a tool record has been resolved to a dispatchable form. |
 | [ResourcePermission](TypeAlias.ResourcePermission.md) | Union of all possible permission levels across all resource types. |
 | [ServingFactory](TypeAlias.ServingFactory.md) | Factory function returned by `AppKit.serving`. |
 | [ToPlugin](TypeAlias.ToPlugin.md) | Factory function type returned by `toPlugin()`. Accepts optional config and returns a PluginData tuple. |
diff --git a/docs/docs/api/appkit/typedoc-sidebar.ts b/docs/docs/api/appkit/typedoc-sidebar.ts
index 8b7090851..297aca334 100644
--- a/docs/docs/api/appkit/typedoc-sidebar.ts
+++ b/docs/docs/api/appkit/typedoc-sidebar.ts
@@ -117,6 +117,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Interface.AgentToolDefinition",
           label: "AgentToolDefinition"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.AutoInheritToolsConfig",
+          label: "AutoInheritToolsConfig"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.BasePluginConfig",
@@ -207,6 +212,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Interface.PromptContext",
           label: "PromptContext"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.RegisteredAgent",
+          label: "RegisteredAgent"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.RequestedClaims",
@@ -272,6 +282,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Interface.ThreadStore",
           label: "ThreadStore"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.ToolAnnotations",
+          label: "ToolAnnotations"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.ToolConfig",
@@ -368,6 +383,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/TypeAlias.PluginData",
           label: "PluginData"
         },
+        {
+          type: "doc",
+          id: "api/appkit/TypeAlias.ResolvedToolEntry",
+          label: "ResolvedToolEntry"
+        },
         {
           type: "doc",
           id: "api/appkit/TypeAlias.ResourcePermission",
diff --git a/docs/docs/plugins/agents.md b/docs/docs/plugins/agents.md
index d06befacc..432117049 100644
--- a/docs/docs/plugins/agents.md
+++ b/docs/docs/plugins/agents.md
@@ -1,5 +1,11 @@
 # Agents
 
+<!-- AUTO-GENERATED: stability-banner-start -->
+:::warning Beta plugin
+This plugin is currently **beta**. APIs may change between minor releases. Import from `@databricks/appkit/beta`. See [Plugin Stability Tiers](./stability.md).
+:::
+<!-- AUTO-GENERATED: stability-banner-end -->
+
 The `agents` plugin turns a Databricks AppKit app into an AI-agent host. It loads agent definitions from markdown on disk (one folder per agent: `config/agents/<id>/agent.md`), from TypeScript (`createAgent(def)`), or both, and exposes them at `POST /invocations` alongside routes for chat, thread management, and cancellation.
 
 This page covers the full lifecycle. For the hand-written primitives (`tool()`, `mcpServer()`), see [tools](./server.md).
diff --git a/docs/docusaurus.config.ts b/docs/docusaurus.config.ts
index 2e9461773..a4386ab8c 100644
--- a/docs/docusaurus.config.ts
+++ b/docs/docusaurus.config.ts
@@ -119,7 +119,7 @@ const config: Config = {
       "docusaurus-plugin-typedoc",
       {
         id: "appkit",
-        entryPoints: ["../packages/appkit/src/index.ts"],
+        entryPoints: ["../packages/appkit/src/typedoc.entry.ts"],
         tsconfig: "../packages/appkit/tsconfig.json",
         out: "docs/api/appkit",
         gitRevision: "main",
diff --git a/knip.json b/knip.json
index 0a2351b79..dbd7eee89 100644
--- a/knip.json
+++ b/knip.json
@@ -24,6 +24,7 @@
     "packages/appkit/src/core/agent/from-plugin.ts",
     "packages/appkit/src/core/agent/load-agents.ts",
     "packages/appkit/src/connectors/mcp/index.ts",
+    "packages/appkit/src/typedoc.entry.ts",
     "template/**",
     "tools/**",
     "docs/**",
diff --git a/packages/appkit/src/typedoc.entry.ts b/packages/appkit/src/typedoc.entry.ts
new file mode 100644
index 000000000..295ed192f
--- /dev/null
+++ b/packages/appkit/src/typedoc.entry.ts
@@ -0,0 +1,9 @@
+/**
+ * Documentation merge entry for Typedoc — combines the stable `@databricks/appkit`
+ * surface with `@databricks/appkit/beta`. Not meant for application imports.
+ *
+ * @packageDocumentation
+ */
+
+export * from "./beta";
+export * from "./index";
diff --git a/template/appkit.plugins.json b/template/appkit.plugins.json
index 87e4304ac..131ccbbf8 100644
--- a/template/appkit.plugins.json
+++ b/template/appkit.plugins.json
@@ -24,7 +24,8 @@
             }
           }
         ]
-      }
+      },
+      "stability": "beta"
     },
     "analytics": {
       "name": "analytics",

From b8db81bcf9b20ac932e444588021b4b13709bc5e Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Mon, 4 May 2026 19:52:12 +0200
Subject: [PATCH 42/46] chore: remove plans scratch docs from agents stack
 branch

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 plans/agent-folder-layout.md  |  35 ----
 plans/smart-dashboard-demo.md | 365 ----------------------------------
 2 files changed, 400 deletions(-)
 delete mode 100644 plans/agent-folder-layout.md
 delete mode 100644 plans/smart-dashboard-demo.md

diff --git a/plans/agent-folder-layout.md b/plans/agent-folder-layout.md
deleted file mode 100644
index 8c530a5fe..000000000
--- a/plans/agent-folder-layout.md
+++ /dev/null
@@ -1,35 +0,0 @@
-# Folder-based markdown agents (`<id>/agent.md`)
-
-## Locked decisions
-
-| Topic | Choice |
-|--------|--------|
-| Top-level `*.md` | **Removed** — folder layout only (**breaking**). Startup lists orphan files and tells you to use `<stem>/agent.md`. |
-| Entry file | **`agent.md` only** — no `index.md` alias in v1. |
-| Subdir without entry | **Throw** — every directory under `config/agents` (except reserved names) must contain `agent.md`. |
-| `skills/` at repo root under `agents/` | **Ignored** — reserved for future per-agent skills; not loaded as an agent package in v1. |
-| `agents:` frontmatter | Unchanged — array of **agent ids** (folder names). |
-
-## Goal
-
-Support one **directory per agent** with a fixed entry file (`agent.md`), so each agent can later grow **skills** and other assets without flattening everything into one markdown file.
-
-## Loader behavior (`loadAgentsFromDir`)
-
-1. `readdirSync(dir, { withFileTypes: true })`.
-2. **Reject** any top-level `*.md` with an error that suggests `mv X.md X/agent.md`-style migration.
-3. For each subdirectory whose name is not reserved (`skills`), require `<id>/agent.md`; register agent **`id`** from that file.
-4. Two-pass resolution for `agents:` references (unchanged semantics).
-5. **`default: true`** — deterministic: sort agent ids, first `default: true` wins.
-
-Single-file **`loadAgentFromFile`** keeps rejecting non-empty `agents:`. Paths ending in `/agent.md` derive the logical agent id from the **parent directory name** (see `agentIdFromMarkdownPath`).
-
-## Acceptance criteria
-
-- Loading `config/agents` with only `assistant/agent.md` yields `defs.assistant`.
-- Flat `assistant.md` alone does **not** register — covered by loader tests and docs.
-- Reference apps use `<id>/agent.md` under `config/agents`.
-
-## Git stack
-
-Loader + unit tests belong on **`agent/v2/4-agents-plugin`**. Docs and app migrations typically land on **`agent/v2/6-apps-docs`** after rebasing onto the updated stack; **`git push --force-with-lease`** stacked branches **4 → 5 → 6** when coordinating PRs.
diff --git a/plans/smart-dashboard-demo.md b/plans/smart-dashboard-demo.md
deleted file mode 100644
index 5a7be794e..000000000
--- a/plans/smart-dashboard-demo.md
+++ /dev/null
@@ -1,365 +0,0 @@
-# Plan: Smart-Dashboard demo route (retires `agent-app`)
-
-## Goal
-
-Replace `apps/agent-app` with a **new `/smart-dashboard` route inside
-`dev-playground`** that doubles as the integration test for every feature
-in the agents-plugin v2 stack. An analytics dashboard (NYC Taxi data)
-where multiple agents help the user interpret, filter, and highlight data
-in real time, plus a hidden-by-default **Stream Inspector** for observability
-of the SSE pipeline.
-
-The route is **the demo** that makes branches 4/5/6 reviewable end-to-end:
-fold-based markdown agents, `createAgent`, `fromPlugin`, sub-agent
-delegation, human-in-the-loop approval, MCP host policy, DOS limits,
-ephemeral agents — all exercised by one app.
-
-## Locked decisions
-
-| Topic | Choice |
-|---|---|
-| Location | `apps/dev-playground/client/src/routes/smart-dashboard/` + server wiring in `apps/dev-playground/server/index.ts`. **No new app.** |
-| Fate of `agent-app` | **Delete.** Replaced by this route as the sole end-to-end demo. |
-| Domain / data | NYC Taxi samples (`samples.nyctaxi.trips`). Directly reusable from the `p3ju` prototype. |
-| Agent ↔ UI protocol | **SSE tool-call args as action payload.** Agent `tool.execute` is a stub returning confirmation text; the UI reads `function_call` items from the SSE stream and mutates client state. No new primitive. |
-| Interaction level | (c) emitted actions — agent can apply filters, highlight time ranges, focus charts, save views. No server-side dashboard mutation. |
-| Agents (3 + dispatcher) | `query` (markdown dispatcher), `sql_analyst` (code, `fromPlugin(analytics)` + `save_view`), `dashboard_pilot` (code, UI action tools), `insights` + `anomaly` (ephemeral markdown, auto-fire on KPI load) |
-| Sub-agent definition style | **Code** for `sql_analyst` / `dashboard_pilot`. Markdown narrative is already covered by the three markdown agents; code demonstrates the `createAgent` + `fromPlugin` + inline `tool()` engineer path that dev-playground currently doesn't exercise. |
-| Approval flow | `save_view({ name, description? })` annotated `destructive: true`. Fires the HITL card. Server handler is a stub. |
-| Stream inspector | Slide-in right drawer, toggled by ⌘K or a small floating icon. Shows filtered SSE event timeline with args + expandable JSON. **Demo-scoped** — lives under the route directory, not promoted to `appkit-ui`. |
-| Merge strategy | **Into `agent/v2/6-apps-docs`** as the "integration test" payoff of the stack. Not a follow-up PR. |
-| Dev-playground character | Accept that it grows from "feature grab-bag" into "feature grab-bag + one flagship demo route." The route lives in its own subdirectory and doesn't leak into other routes. |
-
-## Non-goals (this iteration)
-
-- Real Databricks AI/BI dashboard embedding.
-- Server-side dashboard state (named views shared across users).
-- WebSocket / bidirectional agent ↔ UI channel. SSE-only.
-- Agents reading dashboard state via tool calls. State flows to the agent
-  via system-prompt context injection only (static).
-- Promoting the stream inspector into `appkit-ui`. Follow-up if the demo lands.
-- MCP hosted tools in this route. The v2 stack already has MCP coverage
-  elsewhere; not worth the extra env-var setup for this demo.
-
-## What exists today (prototype to port)
-
-Source: `/Users/mario.cadenas/.cursor/worktrees/app-kit/p3ju/apps/smart-dashboard/`
-
-- **Server** (`server.ts`, 97 lines) — `query` agent code-defined with
-  `apply_filter` + `highlight_period` tools + `fromPlugin(analytics)`.
-- **Markdown agents** (`config/agents/`) — `anomaly.md` and `insights.md`,
-  ephemeral, `maxSteps: 1`, return JSON.
-- **SQL queries** (`config/queries/`) — `dashboard_kpis.sql`,
-  `dashboard_trips_over_time.sql`, `dashboard_fare_distribution.sql`,
-  `dashboard_top_zone.sql`.
-- **Client** (`src/`, 16 files, 1,544 lines) — `App.tsx`, component set
-  (active-filters, agent-sidebar, anomaly-card, fare-chart, insight-card,
-  kpi-cards, query-section, trip-chart), hooks (`use-agent-stream`,
-  `use-action-dispatcher`, `use-chart-colors`, `use-dashboard-data`).
-
-**~80% copy-forward.** The 20% new is stream inspector, multi-agent
-delegation, dashboard-context injection, `focus_chart`, approval card,
-polish.
-
-## What this plan adds
-
-### 1. Stream Inspector (NEW)
-
-Hidden-by-default right-edge drawer showing the SSE timeline of the latest
-run. Reviewers see tool-calls, message deltas, sub-agent invocations, and
-approval gates inline — the "inside the black box" view.
-
-- **Trigger:** ⌘K (macOS) / Ctrl+K, or a small debug icon in the bottom-right.
-- **Layout:** 420px right drawer, backdrop-blur, slides in.
-- **Content per event:** timestamp (ms relative to stream start), event
-  type, tool name + args table when it's a function call, collapsible
-  full-JSON view.
-- **Filter chips:** `all` / `tool calls` / `messages` / `approvals` / `sub-agents`.
-- **Implementation:** extend `use-agent-stream` to push every event into a
-  module-level store; new `<StreamInspector>` component consumes it.
-- **Scope:** session-only. No persistence, no export.
-
-### 2. Approval-gate demo path
-
-One destructive tool so HITL fires visibly:
-
-- `save_view({ name, description? })` annotated
-  `{ destructive: true, readOnly: false }`.
-- Prompt it with *"save this as 'High-fare Friday 2016'"*.
-- UI renders a rich `<ApprovalCard>` with the view name, description,
-  current filters + highlights summary, annotations chip.
-- Approve → tool returns success, agent confirms. Deny → agent receives
-  the denial string, apologises, replans.
-
-Handler is a stub (console.log + return).
-
-### 3. Dashboard context injection (static)
-
-Every chat message gets a prefix block describing what the user is looking
-at: active filters, highlight ranges, current timerange.
-
-- `buildDashboardContext(filters, highlights): string` utility.
-- `use-agent-stream.send(message, { contextPrefix })` signature extension.
-- `<QuerySection>` composes the prefix before each send.
-
-Pure UX change. No new AppKit primitive.
-
-### 4. Multi-agent delegation (upgrades the `query` agent)
-
-Prototype's `query` is a flat agent with four tools. Upgrade:
-
-- `query` (markdown dispatcher) — decides which specialist to call, never
-  calls tools directly.
-- `sql_analyst` (code) — tools: `...fromPlugin(analytics)`, `save_view`.
-- `dashboard_pilot` (code) — tools: `apply_filter`, `highlight_period`,
-  `focus_chart`.
-
-Dispatcher exposes `agent-sql_analyst` and `agent-dashboard_pilot` as
-sub-agent tools. Default agent: `query`.
-
-This demonstrates:
-- Sub-agent delegation (`agents:` in def)
-- `fromPlugin` + inline `tool()` in code (`sql_analyst`)
-- Tool-only sub-agent with no plugin deps (`dashboard_pilot`)
-- The flat-vs-delegated trade-off (risk: extra round-trip latency — see Risks)
-
-### 5. New UI action tool: `focus_chart({ chart_id })`
-
-Scrolls to the named chart and pulses it. Chart IDs:
-`trips_over_time`, `fare_distribution`, `kpis`.
-
-- `tool()` handler returns a confirmation string.
-- Client `useFocusRegistry` hook: chart components register refs by id.
-- `use-action-dispatcher` listens for `focus_chart` function_call events
-  and triggers the pulse animation.
-
-Zero server logic. Pure action-dispatch demo.
-
-### 6. Polish
-
-- `<ApprovalCard>` renders annotations prominently (red badge for
-  `destructive: true`) plus filter/highlight context.
-- KPI cards use shimmer loading instead of `isLoading` text.
-- Error toasts when SQL fails / agent errors / model endpoint 4xx/5xx.
-- Keyboard: ⌘K (inspector), ⌘L (focus chat input), `Esc` (close drawer).
-- Top-of-route hero: "Smart Dashboard — NYC Taxi analytics, powered by
-  3 AI agents" with tiny indicators for each agent's state.
-
-## Architecture notes
-
-### The agent → UI action pattern
-
-The prototype's core insight: **the agent's tool-call JSON is the action
-payload.** No new AppKit primitive.
-
-```
-Agent emits:   tool_call { name: "apply_filter", args: { field: "date", ... } }
-              ↓ (via SSE response.output_item.added)
-Client reads:  SSEEvent { item: { type: "function_call", name, arguments } }
-Client applies: setFilters(deriveFiltersFromArgs(args))
-Server tool:   execute() returns confirmation text for the LLM log
-```
-
-Benefits preserved:
-- Agent control flow: LLM sees confirmation, plans next step.
-- Client latency: UI updates as tokens stream.
-- Security: no new attack surface; existing SSE pipeline already authed.
-- Observability: stream inspector sees every action inline with everything else.
-
-### Dashboard state flow
-
-```
-User action ─→ useState (filters, highlights) ─→ useDashboardData() ─→ SQL
-                              ↑                                           ↓
-                              └──── tool_call dispatch ←──── SSE ←──── agent
-                                                                          ↑
-                              buildDashboardContext() ─────→ send() ──────┘
-```
-
-One-way reactive loop. Simple, testable.
-
-### File layout (target)
-
-```
-apps/dev-playground/
-  config/
-    agents/
-      query/agent.md              # dispatcher (NEW)
-      insights/agent.md           # ported from prototype
-      anomaly/agent.md            # ported from prototype
-      assistant/agent.md          # existing — unchanged
-      autocomplete/agent.md       # existing — unchanged
-    queries/                      # NEW if not present; check
-      dashboard_kpis.sql
-      dashboard_trips_over_time.sql
-      dashboard_fare_distribution.sql
-      dashboard_top_zone.sql
-  server/
-    index.ts                      # add sql_analyst + dashboard_pilot,
-                                  # wire apply_filter, highlight_period,
-                                  # focus_chart, save_view
-  client/
-    src/
-      routes/
-        smart-dashboard.route.tsx # NEW route entry (registers under /smart-dashboard)
-        smart-dashboard/          # NEW subdirectory
-          components/
-            active-filters.tsx    # ported
-            agent-sidebar.tsx     # ported + inspector toggle
-            approval-card.tsx     # NEW
-            anomaly-card.tsx      # ported
-            fare-chart.tsx        # ported
-            insight-card.tsx      # ported
-            kpi-cards.tsx         # ported + shimmer
-            query-section.tsx     # ported + dashboard-context injection
-            stream-inspector.tsx  # NEW
-            trip-chart.tsx        # ported + focus-pulse
-          hooks/
-            use-action-dispatcher.ts  # ported + focus_chart + save_view
-            use-agent-stream.ts       # ported + context-prefix + inspector feed
-            use-chart-colors.ts       # ported
-            use-dashboard-data.ts     # ported
-            use-focus-registry.ts     # NEW
-            use-stream-inspector.ts   # NEW
-          lib/
-            dashboard-context.ts      # NEW (buildDashboardContext)
-```
-
-## Implementation stages
-
-Each stage independently shippable. Stop at Stage 2 for MVP demo; go
-through Stage 5 for wow.
-
-### Stage 0 — Port prototype + retire agent-app (2h)
-
-- [ ] Port `config/queries/*.sql` into `apps/dev-playground/config/queries/`
-- [ ] Port `config/agents/anomaly.md` + `insights.md` into folder layout:
-      `config/agents/anomaly/agent.md`, `config/agents/insights/agent.md`
-- [ ] Port 16 client files into `client/src/routes/smart-dashboard/`
-- [ ] Register the route in TanStack Router (`smart-dashboard.route.tsx`)
-- [ ] Add `query` markdown agent + `sql_analyst`/`dashboard_pilot` code
-      agents to `server/index.ts`, including the ambient tools
-- [ ] Delete `apps/agent-app/`
-- [ ] Grep repo for `agent-app` references (docs, template, scripts,
-      `docs/docs/plugins/agents.md`, tests)
-- [ ] Verify `pnpm --filter=dev-playground dev` boots, `/smart-dashboard`
-      renders the dashboard, KPIs load, default chat works
-
-### Stage 1 — Dispatcher + sub-agents (3h)
-
-- [ ] Split the flat `query` agent into `query` dispatcher + `sql_analyst`
-      + `dashboard_pilot`
-- [ ] Dispatcher prompt: "decide which specialist to call; do not call
-      tools directly"
-- [ ] `query.md` has `agents: [sql_analyst, dashboard_pilot]` frontmatter
-- [ ] Benchmark TTFT against the flat agent — if p90 > 3s, revert to flat
-      and use delegation only for pilot commands
-
-### Stage 2 — Destructive action + approval card (3h)
-
-- [ ] Implement `save_view({ name, description? })` tool with
-      `annotations: { destructive: true }`
-- [ ] Build `<ApprovalCard>`: name/description fields visible, filters +
-      highlights context block, red destructive chip, approve/deny
-- [ ] Wire to `POST /api/agent/approve`
-- [ ] Deny path: confirm agent receives denial string and gracefully
-      replans
-
-### Stage 3 — Dashboard context injection + `focus_chart` (2h)
-
-- [ ] `lib/dashboard-context.ts` — `buildDashboardContext(filters, highlights)`
-- [ ] `use-agent-stream.send` accepts `{ contextPrefix }`
-- [ ] `<QuerySection>` composes prefix before every send
-- [ ] `focus_chart` tool + `use-focus-registry` hook
-- [ ] Chart components register refs, pulse animation on focus
-
-### Stage 4 — Stream Inspector (4h)
-
-- [ ] `use-stream-inspector` — module-level event store, ⌘K toggle, clear-on-new-run
-- [ ] `use-agent-stream` pushes every SSE event into the store
-- [ ] `<StreamInspector>` component — drawer, filter chips, event timeline,
-      expandable JSON, per-event timestamp relative to stream start
-- [ ] Focus trap, `Esc` to close, restore focus on close
-- [ ] Floating debug icon in bottom-right (discoverability alongside ⌘K)
-
-### Stage 5 — Polish (2h)
-
-- [ ] KPI shimmer loading
-- [ ] Error toasts for SQL failures, agent errors
-- [ ] Keyboard shortcuts: ⌘K, ⌘L, `Esc`
-- [ ] Route-level README: `client/src/routes/smart-dashboard/README.md` —
-      architecture, demo script, known limitations
-- [ ] `docs/docs/plugins/agents.md` — add a "See it all together" pointer
-
-### Stage 6 — Demo script + rehearsal (1h)
-
-- [ ] `DEMO.md` at repo root or route directory — step-by-step, 15 min,
-      one block per feature
-- [ ] Dry-run with someone who hasn't seen it; flag rough edges
-
-**Total: ~17h focused.** Realistic wall-clock: ~2.5 days.
-
-## Acceptance criteria
-
-- [ ] `pnpm --filter=dev-playground dev` boots and `/smart-dashboard` renders
-- [ ] "show me fares above $50" → filter applied, charts update
-- [ ] "highlight November 2016" → trip chart gets a shaded band
-- [ ] "focus on the fare distribution" → fare chart scrolls into view + pulses
-- [ ] "save this as 'high-fare-fridays'" → approval card appears; deny → apology; approve → view logged
-- [ ] Default page load: insights + anomalies populate within ~5s of KPI data
-- [ ] ⌘K opens stream inspector; filter chips work; tool-call events show args + result
-- [ ] Delegation: "compare Dec vs Nov fares" routes to `sql_analyst`;
-      "highlight peak hours" routes to `dashboard_pilot`
-- [ ] `apps/agent-app/` deleted; `rg "agent-app"` across repo returns only
-      historical CHANGELOG entries
-- [ ] `pnpm --filter=appkit test` still passes (no regressions in the v2 stack)
-
-## Git
-
-- Branch: **`agent/v2/6-apps-docs`** (this stack's tip).
-- Ideally one commit per stage, for reviewable chunks.
-- Rebase 5→4 shouldn't be needed; this is additive on top of the stack.
-- After the stack merges, the work stays as-is on `main`.
-
-## Risk
-
-- **Prototype drift.** Built against AppKit 0.24.0 vendored tgz; current
-  stack is also 0.24.0 but we've refactored internals (MCP connector move,
-  helper extractions). Risk: minor import/type tweaks on port. Mitigation:
-  Stage 0 is port-and-boot first, nothing added until green.
-
-- **Stream inspector scope creep.** Easy to make a week of work. Mitigation:
-  v1 is "dump JSON events with filter chips." No search, no diff, no export.
-
-- **Delegation latency.** Dispatcher → sub-agent is 2 model round-trips. May
-  feel laggier than prototype's flat agent. Mitigation: benchmark in Stage 1;
-  fall back to flat if p90 TTFT > 3s.
-
-- **Dev-playground bloat.** Adding ~1,500 client lines in a subdirectory.
-  Mitigation: everything lives under `routes/smart-dashboard/`; other routes
-  unaffected; playground's other routes unchanged.
-
-- **v2 stack size.** Branch 6 gets bigger. Acceptable trade-off for having
-  a single end-to-end integration demo that reviewers can run and every
-  feature is visible.
-
-## Next step
-
-Stage 0 port + boot verification. One commit on `agent/v2/6-apps-docs`:
-
-```
-feat(dev-playground): port Smart Dashboard as /smart-dashboard route; retire agent-app
-
-Ports the p3ju Smart Dashboard prototype into apps/dev-playground as a new
-route. Migrates markdown agents to folder layout. Deletes apps/agent-app
-(superseded by this demo).
-
-Verifies that the route boots, KPIs load from samples.nyctaxi.trips, and
-the flat `query` agent answers and applies filters.
-
-Stages 1-6 (delegation, approval, context injection, stream inspector,
-polish, demo script) land as follow-up commits on the same branch.
-```
-
-If approved, I run Stage 0, report the diff size and any porting surprises,
-then proceed stage by stage.

From 4dbe99eb13a3c902e22a0702939add94e4b6e6d6 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Tue, 5 May 2026 12:40:36 +0200
Subject: [PATCH 43/46] chore(appkit): Biome format load-agents imports

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 packages/appkit/src/core/agent/load-agents.ts            | 2 +-
 packages/appkit/src/core/agent/tests/load-agents.test.ts | 9 ++++++---
 2 files changed, 7 insertions(+), 4 deletions(-)

diff --git a/packages/appkit/src/core/agent/load-agents.ts b/packages/appkit/src/core/agent/load-agents.ts
index e557a1ebb..9011b7761 100644
--- a/packages/appkit/src/core/agent/load-agents.ts
+++ b/packages/appkit/src/core/agent/load-agents.ts
@@ -2,7 +2,6 @@ import fs from "node:fs";
 import path from "node:path";
 import yaml from "js-yaml";
 import type { AgentAdapter } from "shared";
-import { createLogger } from "../../logging/logger";
 import type {
   AgentDefinition,
   AgentTool,
@@ -11,6 +10,7 @@ import type {
   ToolkitOptions,
 } from "../../core/agent/types";
 import { isToolkitEntry } from "../../core/agent/types";
+import { createLogger } from "../../logging/logger";
 
 const logger = createLogger("agents:loader");
 
diff --git a/packages/appkit/src/core/agent/tests/load-agents.test.ts b/packages/appkit/src/core/agent/tests/load-agents.test.ts
index 8176cef13..aa87a841a 100644
--- a/packages/appkit/src/core/agent/tests/load-agents.test.ts
+++ b/packages/appkit/src/core/agent/tests/load-agents.test.ts
@@ -4,15 +4,18 @@ import path from "node:path";
 import { afterEach, beforeEach, describe, expect, test } from "vitest";
 import { z } from "zod";
 import { buildToolkitEntries } from "../../../core/agent/build-toolkit";
+import {
+  defineTool,
+  type ToolRegistry,
+} from "../../../core/agent/tools/define-tool";
+import { tool } from "../../../core/agent/tools/tool";
+import type { AgentDefinition } from "../../../core/agent/types";
 import {
   agentIdFromMarkdownPath,
   loadAgentFromFile,
   loadAgentsFromDir,
   parseFrontmatter,
 } from "../load-agents";
-import { defineTool, type ToolRegistry } from "../../../core/agent/tools/define-tool";
-import { tool } from "../../../core/agent/tools/tool";
-import type { AgentDefinition } from "../../../core/agent/types";
 
 let workDir: string;
 

From db77efac6b6f68202c9b7b0fb0bf9a15d259368f Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Thu, 7 May 2026 11:32:44 +0200
Subject: [PATCH 44/46] chore(appkit): regenerate typedoc and sync lockfile
 after rebase

The Typedoc reference grew when the unified entry (typedoc.entry.ts)
started exposing the tool-authoring primitives (defineTool,
AppKitMcpClient, DatabricksAdapter, parseTextToolCalls, ToolEntry,
ToolRegistry, etc.) that beta.ts now re-exports. Regenerating brings
docs/docs/api/ back in sync so the docs:build CI gate passes.

pnpm-lock.yaml gains the get-port@7.2.0 entry that was added to
@databricks/appkit on main and merged into v4 during the stack rebase.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 docs/docs/api/appkit/Class.AppKitMcpClient.md | 154 ++++++++++++++++++
 .../api/appkit/Class.DatabricksAdapter.md     | 152 +++++++++++++++++
 docs/docs/api/appkit/Function.defineTool.md   |  27 +++
 .../appkit/Function.executeFromRegistry.md    |  27 +++
 .../Function.functionToolToDefinition.md      |  15 ++
 .../api/appkit/Function.parseTextToolCalls.md |  27 +++
 .../api/appkit/Function.resolveHostedTools.md |  15 ++
 .../api/appkit/Function.toolsFromRegistry.md  |  21 +++
 .../api/appkit/Interface.AgentRunContext.md   |   2 +
 .../api/appkit/Interface.BasePluginConfig.md  |   2 +-
 .../docs/api/appkit/Interface.FunctionTool.md |   2 +-
 docs/docs/api/appkit/Interface.ToolEntry.md   |  71 ++++++++
 .../docs/api/appkit/Interface.ToolkitEntry.md |   2 +-
 .../docs/api/appkit/TypeAlias.ToolRegistry.md |   5 +
 docs/docs/api/appkit/index.md                 |  10 ++
 docs/docs/api/appkit/typedoc-sidebar.ts       |  50 ++++++
 pnpm-lock.yaml                                |   9 +
 17 files changed, 588 insertions(+), 3 deletions(-)
 create mode 100644 docs/docs/api/appkit/Class.AppKitMcpClient.md
 create mode 100644 docs/docs/api/appkit/Class.DatabricksAdapter.md
 create mode 100644 docs/docs/api/appkit/Function.defineTool.md
 create mode 100644 docs/docs/api/appkit/Function.executeFromRegistry.md
 create mode 100644 docs/docs/api/appkit/Function.functionToolToDefinition.md
 create mode 100644 docs/docs/api/appkit/Function.parseTextToolCalls.md
 create mode 100644 docs/docs/api/appkit/Function.resolveHostedTools.md
 create mode 100644 docs/docs/api/appkit/Function.toolsFromRegistry.md
 create mode 100644 docs/docs/api/appkit/Interface.ToolEntry.md
 create mode 100644 docs/docs/api/appkit/TypeAlias.ToolRegistry.md

diff --git a/docs/docs/api/appkit/Class.AppKitMcpClient.md b/docs/docs/api/appkit/Class.AppKitMcpClient.md
new file mode 100644
index 000000000..ba33f56aa
--- /dev/null
+++ b/docs/docs/api/appkit/Class.AppKitMcpClient.md
@@ -0,0 +1,154 @@
+# Class: AppKitMcpClient
+
+Lightweight MCP client for Databricks-hosted MCP servers.
+
+Uses raw fetch() with JSON-RPC 2.0 over HTTP — no @modelcontextprotocol/sdk
+or LangChain dependency. Supports the Streamable HTTP transport only
+(POST with JSON-RPC request, single JSON-RPC response). Implements exactly
+four methods: `initialize`, `notifications/initialized`, `tools/list`,
+`tools/call`. No prompts/resources/completion/sampling.
+
+All outbound URLs are gated by an McpHostPolicy: unallowlisted hosts
+are rejected before the first byte is sent, and workspace credentials are
+only forwarded to the same-origin workspace. See `mcp-host-policy.ts`.
+
+Rationale for hand-rolling JSON-RPC instead of `@modelcontextprotocol/sdk`:
+see the file-level comment at the top of this module.
+
+## Constructors
+
+### Constructor
+
+```ts
+new AppKitMcpClient(
+   workspaceHost: string, 
+   authenticate: () => Promise<Record<string, string>>, 
+   policy: McpHostPolicy, 
+   options: {
+  dnsLookup?: DnsLookup;
+  fetchImpl?: (input: string | URL | Request, init?: RequestInit) => Promise<Response>;
+}): AppKitMcpClient;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `workspaceHost` | `string` |
+| `authenticate` | () => `Promise`\<`Record`\<`string`, `string`\>\> |
+| `policy` | `McpHostPolicy` |
+| `options` | \{ `dnsLookup?`: `DnsLookup`; `fetchImpl?`: (`input`: `string` \| `URL` \| `Request`, `init?`: `RequestInit`) => `Promise`\<`Response`\>; \} |
+| `options.dnsLookup?` | `DnsLookup` |
+| `options.fetchImpl?` | (`input`: `string` \| `URL` \| `Request`, `init?`: `RequestInit`) => `Promise`\<`Response`\> |
+
+#### Returns
+
+`AppKitMcpClient`
+
+## Methods
+
+### callTool()
+
+```ts
+callTool(
+   qualifiedName: string, 
+   args: unknown, 
+   authHeaders?: Record<string, string>, 
+callerSignal?: AbortSignal): Promise<string>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `qualifiedName` | `string` |
+| `args` | `unknown` |
+| `authHeaders?` | `Record`\<`string`, `string`\> |
+| `callerSignal?` | `AbortSignal` |
+
+#### Returns
+
+`Promise`\<`string`\>
+
+***
+
+### canForwardWorkspaceAuth()
+
+```ts
+canForwardWorkspaceAuth(serverName: string): boolean;
+```
+
+Whether the named MCP server may receive workspace-scoped auth headers
+(e.g., an OBO bearer token from an end-user request). Callers should gate
+auth-forwarding decisions on this to prevent credential exfiltration to
+non-workspace hosts.
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `serverName` | `string` |
+
+#### Returns
+
+`boolean`
+
+***
+
+### close()
+
+```ts
+close(): Promise<void>;
+```
+
+#### Returns
+
+`Promise`\<`void`\>
+
+***
+
+### connect()
+
+```ts
+connect(endpoint: McpEndpointConfig): Promise<void>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `endpoint` | `McpEndpointConfig` |
+
+#### Returns
+
+`Promise`\<`void`\>
+
+***
+
+### connectAll()
+
+```ts
+connectAll(endpoints: McpEndpointConfig[]): Promise<void>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `endpoints` | `McpEndpointConfig`[] |
+
+#### Returns
+
+`Promise`\<`void`\>
+
+***
+
+### getAllToolDefinitions()
+
+```ts
+getAllToolDefinitions(): AgentToolDefinition[];
+```
+
+#### Returns
+
+[`AgentToolDefinition`](Interface.AgentToolDefinition.md)[]
diff --git a/docs/docs/api/appkit/Class.DatabricksAdapter.md b/docs/docs/api/appkit/Class.DatabricksAdapter.md
new file mode 100644
index 000000000..ba4a8a187
--- /dev/null
+++ b/docs/docs/api/appkit/Class.DatabricksAdapter.md
@@ -0,0 +1,152 @@
+# Class: DatabricksAdapter
+
+Adapter that talks directly to the Databricks Model Serving `/invocations` endpoint.
+
+No dependency on the Vercel AI SDK or LangChain. Uses raw `fetch()` to POST
+OpenAI-compatible payloads and parses the SSE stream itself. Calls
+`authenticate()` per-request so tokens are always fresh.
+
+Handles both structured `tool_calls` responses and text-based tool call
+fallback parsing for models that output tool calls as text.
+
+## Examples
+
+```ts
+import { createApp, createAgent, agents } from "@databricks/appkit";
+import { DatabricksAdapter } from "@databricks/appkit/beta";
+import { WorkspaceClient } from "@databricks/sdk-experimental";
+
+const adapter = await DatabricksAdapter.fromServingEndpoint({
+  workspaceClient: new WorkspaceClient({}),
+  endpointName: "my-endpoint",
+});
+
+await createApp({
+  plugins: [
+    agents({
+      agents: {
+        assistant: createAgent({
+          instructions: "You are a helpful assistant.",
+          model: adapter,
+        }),
+      },
+    }),
+  ],
+});
+```
+
+```ts
+const adapter = new DatabricksAdapter({
+  endpointUrl: "https://host/serving-endpoints/my-endpoint/invocations",
+  authenticate: async () => ({ Authorization: `Bearer ${token}` }),
+});
+```
+
+## Implements
+
+- [`AgentAdapter`](Interface.AgentAdapter.md)
+
+## Constructors
+
+### Constructor
+
+```ts
+new DatabricksAdapter(options: DatabricksAdapterOptions): DatabricksAdapter;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `options` | `DatabricksAdapterOptions` |
+
+#### Returns
+
+`DatabricksAdapter`
+
+## Methods
+
+### run()
+
+```ts
+run(input: AgentInput, context: AgentRunContext): AsyncGenerator<AgentEvent, void, unknown>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `input` | [`AgentInput`](Interface.AgentInput.md) |
+| `context` | [`AgentRunContext`](Interface.AgentRunContext.md) |
+
+#### Returns
+
+`AsyncGenerator`\<[`AgentEvent`](TypeAlias.AgentEvent.md), `void`, `unknown`\>
+
+#### Implementation of
+
+[`AgentAdapter`](Interface.AgentAdapter.md).[`run`](Interface.AgentAdapter.md#run)
+
+***
+
+### fromModelServing()
+
+```ts
+static fromModelServing(endpointName?: string, options?: ModelServingOptions): Promise<DatabricksAdapter>;
+```
+
+Creates a DatabricksAdapter from a Model Serving endpoint name.
+Auto-creates a WorkspaceClient internally. Reads the endpoint name
+from the argument or the `DATABRICKS_SERVING_ENDPOINT_NAME` env var.
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `endpointName?` | `string` |
+| `options?` | `ModelServingOptions` |
+
+#### Returns
+
+`Promise`\<`DatabricksAdapter`\>
+
+#### Example
+
+```ts
+// Reads endpoint from DATABRICKS_SERVING_ENDPOINT_NAME env var
+const adapter = await DatabricksAdapter.fromModelServing();
+
+// Explicit endpoint
+const adapter = await DatabricksAdapter.fromModelServing("my-endpoint");
+
+// With options
+const adapter = await DatabricksAdapter.fromModelServing("my-endpoint", {
+  maxSteps: 5,
+  maxTokens: 2048,
+});
+```
+
+***
+
+### fromServingEndpoint()
+
+```ts
+static fromServingEndpoint(options: ServingEndpointOptions): Promise<DatabricksAdapter>;
+```
+
+Creates a DatabricksAdapter for a Databricks Model Serving endpoint.
+
+Routes through the shared `connectors/serving/stream` helper, which
+delegates to the SDK's `apiClient.request({ raw: true })`. That gives the
+adapter centralised URL encoding + authentication with the rest of the
+serving surface — no bespoke `fetch()` + `authenticate()` plumbing.
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `options` | `ServingEndpointOptions` |
+
+#### Returns
+
+`Promise`\<`DatabricksAdapter`\>
diff --git a/docs/docs/api/appkit/Function.defineTool.md b/docs/docs/api/appkit/Function.defineTool.md
new file mode 100644
index 000000000..93069623f
--- /dev/null
+++ b/docs/docs/api/appkit/Function.defineTool.md
@@ -0,0 +1,27 @@
+# Function: defineTool()
+
+```ts
+function defineTool<S>(config: ToolEntry<S>): ToolEntry<S>;
+```
+
+Defines a single tool entry for a plugin's internal registry.
+
+The generic `S` flows from `schema` through to the `handler` callback so
+`args` is fully typed from the Zod schema. Names are assigned by the
+registry key, so they are not repeated inside the entry.
+
+## Type Parameters
+
+| Type Parameter |
+| ------ |
+| `S` *extends* `ZodType`\<`unknown`, `unknown`, `$ZodTypeInternals`\<`unknown`, `unknown`\>\> |
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `config` | [`ToolEntry`](Interface.ToolEntry.md)\<`S`\> |
+
+## Returns
+
+[`ToolEntry`](Interface.ToolEntry.md)\<`S`\>
diff --git a/docs/docs/api/appkit/Function.executeFromRegistry.md b/docs/docs/api/appkit/Function.executeFromRegistry.md
new file mode 100644
index 000000000..762aad5df
--- /dev/null
+++ b/docs/docs/api/appkit/Function.executeFromRegistry.md
@@ -0,0 +1,27 @@
+# Function: executeFromRegistry()
+
+```ts
+function executeFromRegistry(
+   registry: ToolRegistry, 
+   name: string, 
+   args: unknown, 
+signal?: AbortSignal): Promise<unknown>;
+```
+
+Validates tool-call arguments against the entry's schema and invokes its
+handler. On validation failure, returns an LLM-friendly error string
+(matching the behavior of `tool()`) rather than throwing, so the model
+can self-correct on its next turn.
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `registry` | [`ToolRegistry`](TypeAlias.ToolRegistry.md) |
+| `name` | `string` |
+| `args` | `unknown` |
+| `signal?` | `AbortSignal` |
+
+## Returns
+
+`Promise`\<`unknown`\>
diff --git a/docs/docs/api/appkit/Function.functionToolToDefinition.md b/docs/docs/api/appkit/Function.functionToolToDefinition.md
new file mode 100644
index 000000000..71ac617aa
--- /dev/null
+++ b/docs/docs/api/appkit/Function.functionToolToDefinition.md
@@ -0,0 +1,15 @@
+# Function: functionToolToDefinition()
+
+```ts
+function functionToolToDefinition(tool: FunctionTool): AgentToolDefinition;
+```
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `tool` | [`FunctionTool`](Interface.FunctionTool.md) |
+
+## Returns
+
+[`AgentToolDefinition`](Interface.AgentToolDefinition.md)
diff --git a/docs/docs/api/appkit/Function.parseTextToolCalls.md b/docs/docs/api/appkit/Function.parseTextToolCalls.md
new file mode 100644
index 000000000..ed701952c
--- /dev/null
+++ b/docs/docs/api/appkit/Function.parseTextToolCalls.md
@@ -0,0 +1,27 @@
+# Function: parseTextToolCalls()
+
+```ts
+function parseTextToolCalls(text: string): {
+  args: unknown;
+  name: string;
+}[];
+```
+
+Parses text-based tool calls from model output.
+
+Handles two formats:
+1. Llama native: `[{"name": "tool_name", "parameters": {"arg": "val"}}]`
+2. Python-style: `[tool_name(arg1='val1', arg2='val2')]`
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `text` | `string` |
+
+## Returns
+
+\{
+  `args`: `unknown`;
+  `name`: `string`;
+\}[]
diff --git a/docs/docs/api/appkit/Function.resolveHostedTools.md b/docs/docs/api/appkit/Function.resolveHostedTools.md
new file mode 100644
index 000000000..b846410cd
--- /dev/null
+++ b/docs/docs/api/appkit/Function.resolveHostedTools.md
@@ -0,0 +1,15 @@
+# Function: resolveHostedTools()
+
+```ts
+function resolveHostedTools(tools: HostedTool[]): McpEndpointConfig[];
+```
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `tools` | [`HostedTool`](TypeAlias.HostedTool.md)[] |
+
+## Returns
+
+`McpEndpointConfig`[]
diff --git a/docs/docs/api/appkit/Function.toolsFromRegistry.md b/docs/docs/api/appkit/Function.toolsFromRegistry.md
new file mode 100644
index 000000000..ea47da132
--- /dev/null
+++ b/docs/docs/api/appkit/Function.toolsFromRegistry.md
@@ -0,0 +1,21 @@
+# Function: toolsFromRegistry()
+
+```ts
+function toolsFromRegistry(registry: ToolRegistry): AgentToolDefinition[];
+```
+
+Produces the `AgentToolDefinition[]` a ToolProvider exposes to the LLM,
+deriving `parameters` JSON Schema from each entry's Zod schema.
+
+Tool names come from registry keys (supports dotted names like
+`uploads.list` for dynamic plugins).
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `registry` | [`ToolRegistry`](TypeAlias.ToolRegistry.md) |
+
+## Returns
+
+[`AgentToolDefinition`](Interface.AgentToolDefinition.md)[]
diff --git a/docs/docs/api/appkit/Interface.AgentRunContext.md b/docs/docs/api/appkit/Interface.AgentRunContext.md
index c9bfcb79f..4dfbea18d 100644
--- a/docs/docs/api/appkit/Interface.AgentRunContext.md
+++ b/docs/docs/api/appkit/Interface.AgentRunContext.md
@@ -8,6 +8,8 @@
 executeTool: (name: string, args: unknown) => Promise<unknown>;
 ```
 
+Tool implementations should sanitize failure text — errors become `tool_result.error` and can flow back into the LLM transcript.
+
 #### Parameters
 
 | Parameter | Type |
diff --git a/docs/docs/api/appkit/Interface.BasePluginConfig.md b/docs/docs/api/appkit/Interface.BasePluginConfig.md
index 797c2c7d5..653df68ce 100644
--- a/docs/docs/api/appkit/Interface.BasePluginConfig.md
+++ b/docs/docs/api/appkit/Interface.BasePluginConfig.md
@@ -4,8 +4,8 @@ Base configuration interface for AppKit plugins
 
 ## Extended by
 
-- [`IJobsConfig`](Interface.IJobsConfig.md)
 - [`AgentsPluginConfig`](Interface.AgentsPluginConfig.md)
+- [`IJobsConfig`](Interface.IJobsConfig.md)
 
 ## Indexable
 
diff --git a/docs/docs/api/appkit/Interface.FunctionTool.md b/docs/docs/api/appkit/Interface.FunctionTool.md
index 499503060..ca1e82b18 100644
--- a/docs/docs/api/appkit/Interface.FunctionTool.md
+++ b/docs/docs/api/appkit/Interface.FunctionTool.md
@@ -12,7 +12,7 @@ Behavioural hints that drive the agents plugin's approval gate and the
 client's approval-card styling. Prefer setting `effect` (one of
 `"read" | "write" | "update" | "destructive"`) — any mutating value
 forces HITL approval before `execute()` runs. Legacy `destructive: true`
-is still honoured. Must be preserved through functionToolToDefinition so the plugin sees them when building agent
+is still honoured. Must be preserved through [functionToolToDefinition](Function.functionToolToDefinition.md) so the plugin sees them when building agent
 tool indexes.
 
 ***
diff --git a/docs/docs/api/appkit/Interface.ToolEntry.md b/docs/docs/api/appkit/Interface.ToolEntry.md
new file mode 100644
index 000000000..755e1dbce
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.ToolEntry.md
@@ -0,0 +1,71 @@
+# Interface: ToolEntry\<S\>
+
+Single-tool entry for a plugin's internal tool registry.
+
+Plugins collect these into a `Record<string, ToolEntry>` keyed by the tool's
+public name and dispatch via `executeFromRegistry`.
+
+## Type Parameters
+
+| Type Parameter | Default type |
+| ------ | ------ |
+| `S` *extends* `z.ZodType` | `z.ZodType` |
+
+## Properties
+
+### annotations?
+
+```ts
+optional annotations: ToolAnnotations;
+```
+
+***
+
+### autoInheritable?
+
+```ts
+optional autoInheritable: boolean;
+```
+
+Whether this tool is eligible for auto-inheritance into markdown or
+code-defined agents that enable `autoInheritTools`. Defaults to `false`
+(safe-by-default) — plugin authors must explicitly opt a tool in if they
+consider it safe enough to appear in every agent's tool record without an
+explicit `tools:` declaration. Destructive or privilege-sensitive tools
+should leave this unset so that they only reach agents that wire them
+explicitly (via `tools:`, `toolkits:`, or `fromPlugin({ only: [...] })`).
+
+***
+
+### description
+
+```ts
+description: string;
+```
+
+***
+
+### handler()
+
+```ts
+handler: (args: output<S>, signal?: AbortSignal) => unknown;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `args` | `output`\<`S`\> |
+| `signal?` | `AbortSignal` |
+
+#### Returns
+
+`unknown`
+
+***
+
+### schema
+
+```ts
+schema: S;
+```
diff --git a/docs/docs/api/appkit/Interface.ToolkitEntry.md b/docs/docs/api/appkit/Interface.ToolkitEntry.md
index 626cc8981..3eec2be25 100644
--- a/docs/docs/api/appkit/Interface.ToolkitEntry.md
+++ b/docs/docs/api/appkit/Interface.ToolkitEntry.md
@@ -30,7 +30,7 @@ optional autoInheritable: boolean;
 ```
 
 Whether this tool is eligible for `autoInheritTools` spreading. Mirrors
-ToolEntry.autoInheritable from the source registry so the agents
+[ToolEntry.autoInheritable](Interface.ToolEntry.md#autoinheritable) from the source registry so the agents
 plugin can filter auto-inherited tools without re-walking the provider's
 internal registry.
 
diff --git a/docs/docs/api/appkit/TypeAlias.ToolRegistry.md b/docs/docs/api/appkit/TypeAlias.ToolRegistry.md
new file mode 100644
index 000000000..dcee758a0
--- /dev/null
+++ b/docs/docs/api/appkit/TypeAlias.ToolRegistry.md
@@ -0,0 +1,5 @@
+# Type Alias: ToolRegistry
+
+```ts
+type ToolRegistry = Record<string, ToolEntry>;
+```
diff --git a/docs/docs/api/appkit/index.md b/docs/docs/api/appkit/index.md
index 0470b6d2b..aa2c3b2d6 100644
--- a/docs/docs/api/appkit/index.md
+++ b/docs/docs/api/appkit/index.md
@@ -15,9 +15,11 @@ surface with `@databricks/appkit/beta`. Not meant for application imports.
 | Class | Description |
 | ------ | ------ |
 | [AppKitError](Class.AppKitError.md) | Base error class for all AppKit errors. Provides a consistent structure for error handling across the framework. |
+| [AppKitMcpClient](Class.AppKitMcpClient.md) | Lightweight MCP client for Databricks-hosted MCP servers. |
 | [AuthenticationError](Class.AuthenticationError.md) | Error thrown when authentication fails. Use for missing tokens, invalid credentials, or authorization failures. |
 | [ConfigurationError](Class.ConfigurationError.md) | Error thrown when configuration is missing or invalid. Use for missing environment variables, invalid settings, or setup issues. |
 | [ConnectionError](Class.ConnectionError.md) | Error thrown when a connection or network operation fails. Use for database pool errors, API failures, timeouts, etc. |
+| [DatabricksAdapter](Class.DatabricksAdapter.md) | Adapter that talks directly to the Databricks Model Serving `/invocations` endpoint. |
 | [ExecutionError](Class.ExecutionError.md) | Error thrown when an operation execution fails. Use for statement failures, canceled operations, or unexpected states. |
 | [InitializationError](Class.InitializationError.md) | Error thrown when a service or component is not properly initialized. Use when accessing services before they are ready. |
 | [Plugin](Class.Plugin.md) | Base abstract class for creating AppKit plugins. |
@@ -72,6 +74,7 @@ surface with `@databricks/appkit/beta`. Not meant for application imports.
 | [ThreadStore](Interface.ThreadStore.md) | - |
 | [ToolAnnotations](Interface.ToolAnnotations.md) | - |
 | [ToolConfig](Interface.ToolConfig.md) | - |
+| [ToolEntry](Interface.ToolEntry.md) | Single-tool entry for a plugin's internal tool registry. |
 | [ToolkitEntry](Interface.ToolkitEntry.md) | A tool reference produced by a plugin's `.toolkit()` call. The agents plugin recognizes the `__toolkitRef` brand and dispatches tool invocations through `PluginContext.executeTool(req, pluginName, localName, ...)`, preserving OBO (asUser) and telemetry spans. |
 | [ToolkitOptions](Interface.ToolkitOptions.md) | - |
 | [ToolProvider](Interface.ToolProvider.md) | - |
@@ -97,6 +100,7 @@ surface with `@databricks/appkit/beta`. Not meant for application imports.
 | [ResolvedToolEntry](TypeAlias.ResolvedToolEntry.md) | Internal tool-index entry after a tool record has been resolved to a dispatchable form. |
 | [ResourcePermission](TypeAlias.ResourcePermission.md) | Union of all possible permission levels across all resource types. |
 | [ServingFactory](TypeAlias.ServingFactory.md) | Factory function returned by `AppKit.serving`. |
+| [ToolRegistry](TypeAlias.ToolRegistry.md) | - |
 | [ToPlugin](TypeAlias.ToPlugin.md) | Factory function type returned by `toPlugin()`. Accepts optional config and returns a PluginData tuple. |
 
 ## Variables
@@ -118,9 +122,12 @@ surface with `@databricks/appkit/beta`. Not meant for application imports.
 | [createAgent](Function.createAgent.md) | Pure factory for agent definitions. Returns the passed-in definition after cycle-detecting the sub-agent graph. Accepts the full `AgentDefinition` shape and is safe to call at module top-level. |
 | [createApp](Function.createApp.md) | Bootstraps AppKit with the provided configuration. |
 | [createLakebasePool](Function.createLakebasePool.md) | Create a Lakebase pool with appkit's logger integration. Telemetry automatically uses appkit's OpenTelemetry configuration via global registry. |
+| [defineTool](Function.defineTool.md) | Defines a single tool entry for a plugin's internal registry. |
+| [executeFromRegistry](Function.executeFromRegistry.md) | Validates tool-call arguments against the entry's schema and invokes its handler. On validation failure, returns an LLM-friendly error string (matching the behavior of `tool()`) rather than throwing, so the model can self-correct on its next turn. |
 | [extractServingEndpoints](Function.extractServingEndpoints.md) | Extract serving endpoint config from a server file by AST-parsing it. Looks for `serving({ endpoints: { alias: { env: "..." }, ... } })` calls and extracts the endpoint alias names and their environment variable mappings. |
 | [findServerFile](Function.findServerFile.md) | Find the server entry file by checking candidate paths in order. |
 | [fromPlugin](Function.fromPlugin.md) | Reference a plugin's tools inside an `AgentDefinition.tools` record without naming the plugin instance. The returned spread-friendly object carries a symbol-keyed marker that the agents plugin resolves against registered `ToolProvider`s at setup time. |
+| [functionToolToDefinition](Function.functionToolToDefinition.md) | - |
 | [generateDatabaseCredential](Function.generateDatabaseCredential.md) | Generate OAuth credentials for Postgres database connection using the proper Postgres API. |
 | [getExecutionContext](Function.getExecutionContext.md) | Get the current execution context. |
 | [getLakebaseOrmConfig](Function.getLakebaseOrmConfig.md) | Get Lakebase connection configuration for ORMs that don't accept pg.Pool directly. |
@@ -137,5 +144,8 @@ surface with `@databricks/appkit/beta`. Not meant for application imports.
 | [loadAgentFromFile](Function.loadAgentFromFile.md) | Loads a single markdown agent file and resolves its frontmatter against registered plugin toolkits + ambient tool library. |
 | [loadAgentsFromDir](Function.loadAgentsFromDir.md) | Scans a directory for one subdirectory per agent, each containing `agent.md` (frontmatter + body). Produces an `AgentDefinition` record keyed by agent id (folder name). Throws on frontmatter errors or unresolved references. Returns an empty map if the directory does not exist. |
 | [mcpServer](Function.mcpServer.md) | Factory for declaring a custom MCP server tool. |
+| [parseTextToolCalls](Function.parseTextToolCalls.md) | Parses text-based tool calls from model output. |
+| [resolveHostedTools](Function.resolveHostedTools.md) | - |
 | [runAgent](Function.runAgent.md) | Standalone agent execution without `createApp`. Resolves the adapter, binds inline tools, and drives the adapter's `run()` loop to completion. |
 | [tool](Function.tool.md) | Factory for defining function tools with Zod schemas. |
+| [toolsFromRegistry](Function.toolsFromRegistry.md) | Produces the `AgentToolDefinition[]` a ToolProvider exposes to the LLM, deriving `parameters` JSON Schema from each entry's Zod schema. |
diff --git a/docs/docs/api/appkit/typedoc-sidebar.ts b/docs/docs/api/appkit/typedoc-sidebar.ts
index 297aca334..7a7f1a7cc 100644
--- a/docs/docs/api/appkit/typedoc-sidebar.ts
+++ b/docs/docs/api/appkit/typedoc-sidebar.ts
@@ -26,6 +26,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Class.AppKitError",
           label: "AppKitError"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Class.AppKitMcpClient",
+          label: "AppKitMcpClient"
+        },
         {
           type: "doc",
           id: "api/appkit/Class.AuthenticationError",
@@ -41,6 +46,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Class.ConnectionError",
           label: "ConnectionError"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Class.DatabricksAdapter",
+          label: "DatabricksAdapter"
+        },
         {
           type: "doc",
           id: "api/appkit/Class.ExecutionError",
@@ -292,6 +302,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Interface.ToolConfig",
           label: "ToolConfig"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.ToolEntry",
+          label: "ToolEntry"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.ToolkitEntry",
@@ -398,6 +413,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/TypeAlias.ServingFactory",
           label: "ServingFactory"
         },
+        {
+          type: "doc",
+          id: "api/appkit/TypeAlias.ToolRegistry",
+          label: "ToolRegistry"
+        },
         {
           type: "doc",
           id: "api/appkit/TypeAlias.ToPlugin",
@@ -465,6 +485,16 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Function.createLakebasePool",
           label: "createLakebasePool"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Function.defineTool",
+          label: "defineTool"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.executeFromRegistry",
+          label: "executeFromRegistry"
+        },
         {
           type: "doc",
           id: "api/appkit/Function.extractServingEndpoints",
@@ -480,6 +510,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Function.fromPlugin",
           label: "fromPlugin"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Function.functionToolToDefinition",
+          label: "functionToolToDefinition"
+        },
         {
           type: "doc",
           id: "api/appkit/Function.generateDatabaseCredential",
@@ -560,6 +595,16 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Function.mcpServer",
           label: "mcpServer"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Function.parseTextToolCalls",
+          label: "parseTextToolCalls"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.resolveHostedTools",
+          label: "resolveHostedTools"
+        },
         {
           type: "doc",
           id: "api/appkit/Function.runAgent",
@@ -569,6 +614,11 @@ const typedocSidebar: SidebarsConfig = {
           type: "doc",
           id: "api/appkit/Function.tool",
           label: "tool"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.toolsFromRegistry",
+          label: "toolsFromRegistry"
         }
       ]
     }
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index 937ec4fc4..ad89c6b48 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -305,6 +305,9 @@ importers:
       express:
         specifier: 4.22.0
         version: 4.22.0
+      get-port:
+        specifier: 7.2.0
+        version: 7.2.0
       js-yaml:
         specifier: ^4.1.1
         version: 4.1.1
@@ -7291,6 +7294,10 @@ packages:
   get-own-enumerable-property-symbols@3.0.2:
     resolution: {integrity: sha512-I0UBV/XOz1XkIJHEUDMZAbzCThU/H8DxmSfmdGcKPnVhu2VfFqr34jr9777IyaTYvxjedWhqVIilEDsCdP5G6g==}
 
+  get-port@7.2.0:
+    resolution: {integrity: sha512-afP4W205ONCuMoPBqcR6PSXnzX35KTcJygfJfcp+QY+uwm3p20p1YczWXhlICIzGMCxYBQcySEcOgsJcrkyobg==}
+    engines: {node: '>=16'}
+
   get-proto@1.0.1:
     resolution: {integrity: sha512-sTSfBjoXBp89JvIKIefqw7U2CCebsc74kiY6awiGogKtoSGbgjYE/G/+l9sF3MWFPNc9IcoOC4ODfKHfxFmp0g==}
     engines: {node: '>= 0.4'}
@@ -19879,6 +19886,8 @@ snapshots:
 
   get-own-enumerable-property-symbols@3.0.2: {}
 
+  get-port@7.2.0: {}
+
   get-proto@1.0.1:
     dependencies:
       dunder-proto: 1.0.1

From cc8d3ab337739377ad0273444cb83c382b4f7639 Mon Sep 17 00:00:00 2001
From: Hubert Zub <hubert.zub@databricks.com>
Date: Wed, 6 May 2026 12:42:51 +0200
Subject: [PATCH 45/46] feat(appkit): add Vercel AI SDK UI Message Stream
 protocol to agents plugin

Adds a parallel wire protocol selectable via Accept header content
negotiation. The MIME constant lives in shared/chat-protocol so server
and any workspace client share one literal. Wire-format helpers
(detectChatProtocol, extractVercelAIUserText) move out of agents.ts
into a sibling protocol.ts module next to schemas/translator.

Signed-off-by: Hubert Zub <hubert.zub@databricks.com>
---
 apps/dev-playground/client/package-lock.json  | 157 ++++-
 apps/dev-playground/client/package.json       |   6 +-
 .../client/src/lib/vercel-ai-agent-chat.ts    |  45 ++
 .../client/src/routes/agent.route.tsx         | 538 +++++++++---------
 apps/dev-playground/package.json              |   3 +-
 packages/appkit/src/plugins/agents/agents.ts  | 125 +++-
 .../src/plugins/agents/event-translator.ts    |   5 +-
 .../src/plugins/agents/http-tool-executor.ts  |  20 +-
 .../appkit/src/plugins/agents/protocol.ts     |  47 ++
 packages/appkit/src/plugins/agents/schemas.ts |  27 +
 ...el-ai-ui-message-stream-translator.test.ts | 256 +++++++++
 .../appkit/src/plugins/agents/translator.ts   |  27 +
 .../vercel-ai-ui-message-stream-translator.ts | 257 +++++++++
 .../appkit/src/registry/types.generated.ts    |  16 +-
 packages/shared/src/chat-protocol.ts          |   8 +
 packages/shared/src/index.ts                  |   1 +
 pnpm-lock.yaml                                |   5 +-
 17 files changed, 1234 insertions(+), 309 deletions(-)
 create mode 100644 apps/dev-playground/client/src/lib/vercel-ai-agent-chat.ts
 create mode 100644 packages/appkit/src/plugins/agents/protocol.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/vercel-ai-ui-message-stream-translator.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/translator.ts
 create mode 100644 packages/appkit/src/plugins/agents/vercel-ai-ui-message-stream-translator.ts
 create mode 100644 packages/shared/src/chat-protocol.ts

diff --git a/apps/dev-playground/client/package-lock.json b/apps/dev-playground/client/package-lock.json
index 7a34b5b28..80876cdcc 100644
--- a/apps/dev-playground/client/package-lock.json
+++ b/apps/dev-playground/client/package-lock.json
@@ -8,6 +8,7 @@
       "name": "client",
       "version": "0.0.0",
       "dependencies": {
+        "@ai-sdk/react": "4.0.0-beta.76",
         "@radix-ui/react-dropdown-menu": "2.1.16",
         "@radix-ui/react-select": "2.2.6",
         "@radix-ui/react-slot": "1.2.3",
@@ -16,13 +17,14 @@
         "@tanstack/react-router-devtools": "1.133.22",
         "@tanstack/react-table": "8.21.3",
         "@tanstack/router-plugin": "1.133.22",
+        "ai": "7.0.0-beta.76",
         "class-variance-authority": "0.7.1",
         "clsx": "2.1.1",
         "html2canvas": "1.4.1",
         "html2canvas-pro": "2.0.2",
         "lucide-react": "0.546.0",
-        "react": "19.2.0",
-        "react-dom": "19.2.0",
+        "react": "19.2.5",
+        "react-dom": "19.2.5",
         "recharts": "3.4.1",
         "tailwind-merge": "3.3.1",
         "tailwindcss-animate": "1.0.7",
@@ -74,6 +76,70 @@
     "../../../packages/appkit-ui/dist": {
       "extraneous": true
     },
+    "node_modules/@ai-sdk/gateway": {
+      "version": "4.0.0-beta.43",
+      "resolved": "https://npm-proxy.dev.databricks.com/@ai-sdk/gateway/-/gateway-4.0.0-beta.43.tgz",
+      "integrity": "sha512-EGQe4If6jt1ZhENmwZn8UAeHbEc7DRiK7ff7dwgfNthwso2hdzLbgXzuTO+W/op+oDFQK1pKiAz5RrPsVQWiew==",
+      "license": "Apache-2.0",
+      "dependencies": {
+        "@ai-sdk/provider": "4.0.0-beta.10",
+        "@ai-sdk/provider-utils": "5.0.0-beta.16",
+        "@vercel/oidc": "3.2.0"
+      },
+      "engines": {
+        "node": ">=18"
+      },
+      "peerDependencies": {
+        "zod": "^3.25.76 || ^4.1.8"
+      }
+    },
+    "node_modules/@ai-sdk/provider": {
+      "version": "4.0.0-beta.10",
+      "resolved": "https://npm-proxy.dev.databricks.com/@ai-sdk/provider/-/provider-4.0.0-beta.10.tgz",
+      "integrity": "sha512-E2O/LCWjqOxAUfpykQR4xLmcGXySIu6L+wYJjav2xiHu38otPq0qIexgH9ZKulBvBWkrtJ3fxz0kzHDlCBkwng==",
+      "license": "Apache-2.0",
+      "dependencies": {
+        "json-schema": "^0.4.0"
+      },
+      "engines": {
+        "node": ">=18"
+      }
+    },
+    "node_modules/@ai-sdk/provider-utils": {
+      "version": "5.0.0-beta.16",
+      "resolved": "https://npm-proxy.dev.databricks.com/@ai-sdk/provider-utils/-/provider-utils-5.0.0-beta.16.tgz",
+      "integrity": "sha512-CyMV5go6libw5WaZ4m7nO0uRLTENxbIODiDrTXJNwxYIBR8p5aCGaxt9oj3prbvNkTt0Srh/Gyw+n2pR9hQ5Pg==",
+      "license": "Apache-2.0",
+      "dependencies": {
+        "@ai-sdk/provider": "4.0.0-beta.10",
+        "@standard-schema/spec": "^1.1.0",
+        "eventsource-parser": "^3.0.6"
+      },
+      "engines": {
+        "node": ">=18"
+      },
+      "peerDependencies": {
+        "zod": "^3.25.76 || ^4.1.8"
+      }
+    },
+    "node_modules/@ai-sdk/react": {
+      "version": "4.0.0-beta.76",
+      "resolved": "https://npm-proxy.dev.databricks.com/@ai-sdk/react/-/react-4.0.0-beta.76.tgz",
+      "integrity": "sha512-M5CMl+wlIZexdN+gJG06WPW6F88JFFzjwC1dEyeVNLztxDnZn8VpJy6WDNEo3QgUWjinWJCOnLDLP9qPBzTSSA==",
+      "license": "Apache-2.0",
+      "dependencies": {
+        "@ai-sdk/provider-utils": "5.0.0-beta.16",
+        "ai": "7.0.0-beta.76",
+        "swr": "^2.2.5",
+        "throttleit": "2.1.0"
+      },
+      "engines": {
+        "node": ">=18"
+      },
+      "peerDependencies": {
+        "react": "^18 || ~19.0.1 || ~19.1.2 || ^19.2.1"
+      }
+    },
     "node_modules/@alloc/quick-lru": {
       "version": "5.2.0",
       "resolved": "https://registry.npmjs.org/@alloc/quick-lru/-/quick-lru-5.2.0.tgz",
@@ -2314,9 +2380,9 @@
       "license": "MIT"
     },
     "node_modules/@standard-schema/spec": {
-      "version": "1.0.0",
-      "resolved": "https://registry.npmjs.org/@standard-schema/spec/-/spec-1.0.0.tgz",
-      "integrity": "sha512-m2bOd0f2RT9k8QJx1JN85cZYyH1RqFBdlwtkSlf4tBDYLCiiZnv1fIIwacK6cqwXavOydf0NPToMQgpKq+dVlA==",
+      "version": "1.1.0",
+      "resolved": "https://npm-proxy.dev.databricks.com/@standard-schema/spec/-/spec-1.1.0.tgz",
+      "integrity": "sha512-l2aFy5jALhniG5HgqrD6jXLi/rUWrKvqN/qJx6yoJsgKhblVd+iqqU4RCXavm/jPityDo5TCvKMnpjKnOriy0w==",
       "license": "MIT"
     },
     "node_modules/@standard-schema/utils": {
@@ -3375,6 +3441,15 @@
       "dev": true,
       "license": "ISC"
     },
+    "node_modules/@vercel/oidc": {
+      "version": "3.2.0",
+      "resolved": "https://npm-proxy.dev.databricks.com/@vercel/oidc/-/oidc-3.2.0.tgz",
+      "integrity": "sha512-UycprH3T6n3jH0k44NHMa7pnFHGu/N05MjojYr+Mc6I7obkoLIJujSWwin1pCvdy/eOxrI/l3uDLQsmcrOb4ug==",
+      "license": "Apache-2.0",
+      "engines": {
+        "node": ">= 20"
+      }
+    },
     "node_modules/@vitejs/plugin-react": {
       "version": "5.0.4",
       "resolved": "https://registry.npmjs.org/@vitejs/plugin-react/-/plugin-react-5.0.4.tgz",
@@ -3418,6 +3493,23 @@
         "acorn": "^6.0.0 || ^7.0.0 || ^8.0.0"
       }
     },
+    "node_modules/ai": {
+      "version": "7.0.0-beta.76",
+      "resolved": "https://npm-proxy.dev.databricks.com/ai/-/ai-7.0.0-beta.76.tgz",
+      "integrity": "sha512-yJMCqsnfUi8jnFOvxmXhjMZd0YVSCLk1E5PZpqmGWynvo3uADt1XADYYYRcj0I9Q2wsL4HbCLAKe01I8aswzJg==",
+      "license": "Apache-2.0",
+      "dependencies": {
+        "@ai-sdk/gateway": "4.0.0-beta.43",
+        "@ai-sdk/provider": "4.0.0-beta.10",
+        "@ai-sdk/provider-utils": "5.0.0-beta.16"
+      },
+      "engines": {
+        "node": ">=18"
+      },
+      "peerDependencies": {
+        "zod": "^3.25.76 || ^4.1.8"
+      }
+    },
     "node_modules/ajv": {
       "version": "6.12.6",
       "resolved": "https://registry.npmjs.org/ajv/-/ajv-6.12.6.tgz",
@@ -4097,7 +4189,6 @@
       "version": "2.0.3",
       "resolved": "https://registry.npmjs.org/dequal/-/dequal-2.0.3.tgz",
       "integrity": "sha512-0je+qPKHEMohvfRTCEo3CrPG6cAzAYgmzKyxRiYSSDkS6eGJdyVJm7WaYA5ECaAD9wLB2T4EEeymA5aFVcYXCA==",
-      "dev": true,
       "license": "MIT",
       "engines": {
         "node": ">=6"
@@ -4431,6 +4522,15 @@
       "integrity": "sha512-GWkBvjiSZK87ELrYOSESUYeVIc9mvLLf/nXalMOS5dYrgZq9o5OVkbZAVM06CVxYsCwH9BDZFPlQTlPA1j4ahA==",
       "license": "MIT"
     },
+    "node_modules/eventsource-parser": {
+      "version": "3.0.8",
+      "resolved": "https://npm-proxy.dev.databricks.com/eventsource-parser/-/eventsource-parser-3.0.8.tgz",
+      "integrity": "sha512-70QWGkr4snxr0OXLRWsFLeRBIRPuQOvt4s8QYjmUlmlkyTZkRqS7EDVRZtzU3TiyDbXSzaOeF0XUKy8PchzukQ==",
+      "license": "MIT",
+      "engines": {
+        "node": ">=18.0.0"
+      }
+    },
     "node_modules/fast-deep-equal": {
       "version": "3.1.3",
       "resolved": "https://registry.npmjs.org/fast-deep-equal/-/fast-deep-equal-3.1.3.tgz",
@@ -4929,6 +5029,12 @@
       "dev": true,
       "license": "MIT"
     },
+    "node_modules/json-schema": {
+      "version": "0.4.0",
+      "resolved": "https://npm-proxy.dev.databricks.com/json-schema/-/json-schema-0.4.0.tgz",
+      "integrity": "sha512-es94M3nTIfsEPisRafak+HDLfHXnKBhV3vU5eqPcS3flIWqcxJWgXHXiey3YrpaNsanY5ei1VoYEbOzijuq9BA==",
+      "license": "(AFL-2.1 OR BSD-3-Clause)"
+    },
     "node_modules/json-schema-traverse": {
       "version": "0.4.1",
       "resolved": "https://registry.npmjs.org/json-schema-traverse/-/json-schema-traverse-0.4.1.tgz",
@@ -5717,24 +5823,24 @@
       "license": "MIT"
     },
     "node_modules/react": {
-      "version": "19.2.0",
-      "resolved": "https://registry.npmjs.org/react/-/react-19.2.0.tgz",
-      "integrity": "sha512-tmbWg6W31tQLeB5cdIBOicJDJRR2KzXsV7uSK9iNfLWQ5bIZfxuPEHp7M8wiHyHnn0DD1i7w3Zmin0FtkrwoCQ==",
+      "version": "19.2.5",
+      "resolved": "https://npm-proxy.dev.databricks.com/react/-/react-19.2.5.tgz",
+      "integrity": "sha512-llUJLzz1zTUBrskt2pwZgLq59AemifIftw4aB7JxOqf1HY2FDaGDxgwpAPVzHU1kdWabH7FauP4i1oEeer2WCA==",
       "license": "MIT",
       "engines": {
         "node": ">=0.10.0"
       }
     },
     "node_modules/react-dom": {
-      "version": "19.2.0",
-      "resolved": "https://registry.npmjs.org/react-dom/-/react-dom-19.2.0.tgz",
-      "integrity": "sha512-UlbRu4cAiGaIewkPyiRGJk0imDN2T3JjieT6spoL2UeSf5od4n5LB/mQ4ejmxhCFT1tYe8IvaFulzynWovsEFQ==",
+      "version": "19.2.5",
+      "resolved": "https://npm-proxy.dev.databricks.com/react-dom/-/react-dom-19.2.5.tgz",
+      "integrity": "sha512-J5bAZz+DXMMwW/wV3xzKke59Af6CHY7G4uYLN1OvBcKEsWOs4pQExj86BBKamxl/Ik5bx9whOrvBlSDfWzgSag==",
       "license": "MIT",
       "dependencies": {
         "scheduler": "^0.27.0"
       },
       "peerDependencies": {
-        "react": "^19.2.0"
+        "react": "^19.2.5"
       }
     },
     "node_modules/react-is": {
@@ -6222,6 +6328,19 @@
         "node": ">=8"
       }
     },
+    "node_modules/swr": {
+      "version": "2.4.1",
+      "resolved": "https://npm-proxy.dev.databricks.com/swr/-/swr-2.4.1.tgz",
+      "integrity": "sha512-2CC6CiKQtEwaEeNiqWTAw9PGykW8SR5zZX8MZk6TeAvEAnVS7Visz8WzphqgtQ8v2xz/4Q5K+j+SeMaKXeeQIA==",
+      "license": "MIT",
+      "dependencies": {
+        "dequal": "^2.0.3",
+        "use-sync-external-store": "^1.6.0"
+      },
+      "peerDependencies": {
+        "react": "^16.11.0 || ^17.0.0 || ^18.0.0 || ^19.0.0"
+      }
+    },
     "node_modules/tailwind-merge": {
       "version": "3.3.1",
       "resolved": "https://registry.npmjs.org/tailwind-merge/-/tailwind-merge-3.3.1.tgz",
@@ -6270,6 +6389,18 @@
         "utrie": "^1.0.2"
       }
     },
+    "node_modules/throttleit": {
+      "version": "2.1.0",
+      "resolved": "https://npm-proxy.dev.databricks.com/throttleit/-/throttleit-2.1.0.tgz",
+      "integrity": "sha512-nt6AMGKW1p/70DF/hGBdJB57B8Tspmbp5gfJ8ilhLnt7kkr2ye7hzD6NVG8GGErk2HWF34igrL2CXmNIkzKqKw==",
+      "license": "MIT",
+      "engines": {
+        "node": ">=18"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/sindresorhus"
+      }
+    },
     "node_modules/tiny-invariant": {
       "version": "1.3.3",
       "resolved": "https://registry.npmjs.org/tiny-invariant/-/tiny-invariant-1.3.3.tgz",
diff --git a/apps/dev-playground/client/package.json b/apps/dev-playground/client/package.json
index e69a49a3c..e302a32af 100644
--- a/apps/dev-playground/client/package.json
+++ b/apps/dev-playground/client/package.json
@@ -10,6 +10,8 @@
     "preview": "vite preview"
   },
   "dependencies": {
+    "@ai-sdk/react": "4.0.0-beta.76",
+    "ai": "7.0.0-beta.76",
     "@radix-ui/react-dropdown-menu": "2.1.16",
     "@radix-ui/react-select": "2.2.6",
     "@radix-ui/react-slot": "1.2.3",
@@ -23,8 +25,8 @@
     "html2canvas": "1.4.1",
     "html2canvas-pro": "2.0.2",
     "lucide-react": "0.546.0",
-    "react": "19.2.0",
-    "react-dom": "19.2.0",
+    "react": "19.2.5",
+    "react-dom": "19.2.5",
     "recharts": "3.4.1",
     "tailwind-merge": "3.3.1",
     "tailwindcss-animate": "1.0.7",
diff --git a/apps/dev-playground/client/src/lib/vercel-ai-agent-chat.ts b/apps/dev-playground/client/src/lib/vercel-ai-agent-chat.ts
new file mode 100644
index 000000000..66618378f
--- /dev/null
+++ b/apps/dev-playground/client/src/lib/vercel-ai-agent-chat.ts
@@ -0,0 +1,45 @@
+import type { UIMessage } from "ai";
+
+/**
+ * Custom data parts emitted by AppKit's Vercel AI SDK UI Message Stream
+ * branch (server: `VercelAIUIMessageStreamTranslator`).
+ *
+ * AppKit-only payloads — these only exist because of the Vercel AI SDK
+ * `useChat` integration and are not part of the SDK protocol itself.
+ */
+export interface VercelAIAgentDataParts {
+  /**
+   * A destructive tool call is paused on the server-side approval gate.
+   * The client renders an approval card and POSTs the user's decision to
+   * `/api/agents/approve`. The approval gate auto-denies on timeout.
+   */
+  "approval-pending": {
+    approvalId: string;
+    streamId: string;
+    toolName: string;
+    args: unknown;
+    annotations?: {
+      effect?: "read" | "write" | "update" | "destructive";
+      readOnly?: boolean;
+      destructive?: boolean;
+      idempotent?: boolean;
+    };
+  };
+}
+
+/**
+ * Strongly-typed UIMessage for the AppKit agent chat. Used as the type
+ * parameter to `useChat<VercelAIAgentUIMessage>()` so message metadata,
+ * data-part dispatch, and `onData` callbacks are all type-checked.
+ */
+export type VercelAIAgentUIMessage = UIMessage<unknown, VercelAIAgentDataParts>;
+
+/**
+ * MIME type advertised on the `Accept` header to opt the agents plugin's
+ * `POST /chat` route into the Vercel AI SDK UI Message Stream protocol.
+ * Mirrored on the server as `VERCEL_AI_UI_MESSAGE_STREAM_MIME` (in
+ * `shared/chat-protocol`). Duplicated here because the dev-playground
+ * client is npm-managed and cannot pull workspace-only deps.
+ */
+export const VERCEL_AI_UI_MESSAGE_STREAM_ACCEPT =
+  "application/vnd.ai-sdk.ui-message-stream";
diff --git a/apps/dev-playground/client/src/routes/agent.route.tsx b/apps/dev-playground/client/src/routes/agent.route.tsx
index 6762a1a38..4a0dd39c8 100644
--- a/apps/dev-playground/client/src/routes/agent.route.tsx
+++ b/apps/dev-playground/client/src/routes/agent.route.tsx
@@ -1,54 +1,30 @@
+import { useChat } from "@ai-sdk/react";
 import { getPluginClientConfig } from "@databricks/appkit-ui/js";
 import { Button } from "@databricks/appkit-ui/react";
 import { createFileRoute } from "@tanstack/react-router";
-import { useCallback, useEffect, useRef, useState } from "react";
+import { DefaultChatTransport } from "ai";
+import { useCallback, useEffect, useMemo, useRef, useState } from "react";
+import {
+  VERCEL_AI_UI_MESSAGE_STREAM_ACCEPT,
+  type VercelAIAgentDataParts,
+  type VercelAIAgentUIMessage,
+} from "../lib/vercel-ai-agent-chat";
 
 export const Route = createFileRoute("/agent")({
   component: AgentRoute,
 });
 
-interface SSEEvent {
-  type: string;
-  delta?: string;
-  item_id?: string;
-  item?: {
-    type?: string;
-    id?: string;
-    call_id?: string;
-    name?: string;
-    arguments?: string;
-    output?: string;
-    status?: string;
-  };
-  content?: string;
-  data?: Record<string, unknown>;
-  error?: string;
-  sequence_number?: number;
-  output_index?: number;
-  approval_id?: string;
-  stream_id?: string;
-  tool_name?: string;
-  args?: unknown;
-  annotations?: {
-    readOnly?: boolean;
-    destructive?: boolean;
-    idempotent?: boolean;
-  };
-}
+type ApprovalPendingPayload = VercelAIAgentDataParts["approval-pending"];
 
-interface ChatMessage {
-  id: number;
-  role: "user" | "assistant";
-  content: string;
-}
-
-interface PendingApproval {
-  approvalId: string;
-  streamId: string;
-  toolName: string;
-  args: unknown;
-}
+type PendingApproval = ApprovalPendingPayload;
 
+/**
+ * Inline-suggestion autocomplete still uses the legacy Responses-API SSE
+ * shape on `/api/agents/chat`. The autocomplete agent runs as a one-shot
+ * stateless completion (its `agent.md` flags `ephemeral: true`), so it
+ * doesn't share the chat thread with the conversational `useChat` flow
+ * and there's nothing to gain from migrating it here.
+ */
 function useAutocomplete(enabled: boolean) {
   const [suggestion, setSuggestion] = useState("");
   const [isLoading, setIsLoading] = useState(false);
@@ -136,16 +112,88 @@ function useAutocomplete(enabled: boolean) {
   };
 }
 
+/**
+ * Flatten a message to the plain text shown in its chat bubble. A streamed
+ * reply normally arrives as a single `TextUIPart`, but when the agent loop
+ * resumes text after a tool call the message holds several text parts;
+ * they are concatenated in order with no separator. Non-text parts are
+ * ignored, so a message without any text part yields "".
+ */
+function messageBodyText(message: VercelAIAgentUIMessage): string {
+  return message.parts.reduce(
+    (joined, piece) =>
+      piece.type === "text" ? joined + piece.text : joined,
+    "",
+  );
+}
+
 function AgentRoute() {
-  const [messages, setMessages] = useState<ChatMessage[]>([]);
-  const [events, setEvents] = useState<AgentEvent[]>([]);
-  const [input, setInput] = useState("");
-  const [isLoading, setIsLoading] = useState(false);
-  const [threadId, setThreadId] = useState<string | null>(null);
   const [pendingApprovals, setPendingApprovals] = useState<PendingApproval[]>(
     [],
   );
 
+  const messagesEndRef = useRef<HTMLDivElement>(null);
+  const inputRef = useRef<HTMLTextAreaElement>(null);
+  const [input, setInput] = useState("");
+
+  const agentConfig = getPluginClientConfig<{
+    agents?: string[];
+    defaultAgent?: string;
+  }>("agents");
+  const hasAutocomplete = (agentConfig.agents ?? []).includes("autocomplete");
+
+  const transport = useMemo(
+    () =>
+      new DefaultChatTransport<VercelAIAgentUIMessage>({
+        api: "/api/agents/chat",
+        headers: {
+          Accept: VERCEL_AI_UI_MESSAGE_STREAM_ACCEPT,
+        },
+      }),
+    [],
+  );
+
+  // We deliberately do NOT pass `id` to useChat. The hook auto-mints one
+  // through the AI SDK's own `generateId` (which doesn't depend on the
+  // browser's `crypto.randomUUID`, so it survives environments where the
+  // global is shimmed or stripped) and exposes it on the return value.
+  // The chat id is sent to the server as the request body `id` and the
+  // agents plugin maps it 1:1 to its `threadId`.
+  const {
+    id: chatId,
+    messages,
+    sendMessage,
+    status,
+    error,
+    stop,
+  } = useChat<VercelAIAgentUIMessage>({
+    transport,
+    onData: (part) => {
+      if (part.type === "data-approval-pending") {
+        const payload = part.data as ApprovalPendingPayload;
+        setPendingApprovals((prev) =>
+          prev.some((p) => p.approvalId === payload.approvalId)
+            ? prev
+            : [...prev, payload],
+        );
+      }
+    },
+  });
+
+  const isLoading = status === "submitted" || status === "streaming";
+
+  // `useChat` creates the assistant `UIMessage` stub the moment the server
+  // emits its `start` chunk — well before any text-delta arrives. We want
+  // to show "Thinking..." until the assistant has produced visible text
+  // (either rendered tokens or a fully-materialised message). Tool-only
+  // turns therefore keep the indicator up until the model speaks.
+  const lastMessage = messages[messages.length - 1];
+  const lastAssistantHasText =
+    lastMessage?.role === "assistant" &&
+    messageBodyText(lastMessage).length > 0;
+  const showThinking =
+    isLoading && pendingApprovals.length === 0 && !lastAssistantHasText;
+
   const decideApproval = useCallback(
     async (approvalId: string, decision: "approve" | "deny") => {
       const approval = pendingApprovals.find(
@@ -170,15 +218,6 @@ function AgentRoute() {
     },
     [pendingApprovals],
   );
-  const messagesEndRef = useRef<HTMLDivElement>(null);
-  const inputRef = useRef<HTMLTextAreaElement>(null);
-  const msgIdCounter = useRef(0);
-
-  const agentConfig = getPluginClientConfig<{
-    agents?: string[];
-    defaultAgent?: string;
-  }>("agents");
-  const hasAutocomplete = (agentConfig.agents ?? []).includes("autocomplete");
 
   const {
     suggestion,
@@ -192,125 +231,13 @@ function AgentRoute() {
     messagesEndRef.current?.scrollIntoView({ behavior: "smooth" });
   }, [messages]);
 
-  const sendMessage = useCallback(async () => {
-    if (!input.trim() || isLoading) return;
-
+  const submit = useCallback(() => {
+    const text = input.trim();
+    if (!text || isLoading) return;
     clearSuggestion();
-    const userMessage = input.trim();
     setInput("");
-    setMessages((prev) => [
-      ...prev,
-      { id: ++msgIdCounter.current, role: "user", content: userMessage },
-    ]);
-    setEvents([]);
-    setIsLoading(true);
-
-    try {
-      const response = await fetch("/api/agents/chat", {
-        method: "POST",
-        headers: { "Content-Type": "application/json" },
-        body: JSON.stringify({
-          message: userMessage,
-          ...(threadId && { threadId }),
-        }),
-      });
-
-      if (!response.ok) {
-        const error = await response.json();
-        setMessages((prev) => [
-          ...prev,
-          {
-            id: ++msgIdCounter.current,
-            role: "assistant",
-            content: `Error: ${error.error}`,
-          },
-        ]);
-        return;
-      }
-
-      const reader = response.body?.getReader();
-      if (!reader) return;
-
-      const decoder = new TextDecoder();
-      let assistantContent = "";
-      let buffer = "";
-
-      while (true) {
-        const { done, value } = await reader.read();
-        if (done) break;
-
-        buffer += decoder.decode(value, { stream: true });
-        const lines = buffer.split("\n");
-        buffer = lines.pop() ?? "";
-
-        for (const line of lines) {
-          if (!line.startsWith("data: ")) continue;
-          const data = line.slice(6).trim();
-          if (!data || data === "[DONE]") continue;
-
-          try {
-            const event: SSEEvent = JSON.parse(data);
-            if (!event.type) continue;
-            setEvents((prev) => [...prev, event]);
-
-            if (
-              event.type === "appkit.approval_pending" &&
-              event.approval_id &&
-              event.stream_id &&
-              event.tool_name
-            ) {
-              setPendingApprovals((prev) => [
-                ...prev,
-                {
-                  approvalId: event.approval_id as string,
-                  streamId: event.stream_id as string,
-                  toolName: event.tool_name as string,
-                  args: event.args,
-                },
-              ]);
-            }
-            if (event.type === "appkit.metadata" && event.data?.threadId) {
-              setThreadId(event.data.threadId as string);
-            }
-
-            if (event.type === "response.output_text.delta" && event.delta) {
-              assistantContent += event.delta;
-              setMessages((prev) => {
-                const updated = [...prev];
-                const last = updated[updated.length - 1];
-                if (last?.role === "assistant") {
-                  updated[updated.length - 1] = {
-                    ...last,
-                    content: assistantContent,
-                  };
-                } else {
-                  updated.push({
-                    id: ++msgIdCounter.current,
-                    role: "assistant",
-                    content: assistantContent,
-                  });
-                }
-                return updated;
-              });
-            }
-          } catch {
-            // skip malformed events
-          }
-        }
-      }
-    } catch (err) {
-      setMessages((prev) => [
-        ...prev,
-        {
-          id: ++msgIdCounter.current,
-          role: "assistant",
-          content: `Error: ${err instanceof Error ? err.message : "Unknown error"}`,
-        },
-      ]);
-    } finally {
-      setIsLoading(false);
-    }
-  }, [input, isLoading, threadId, clearSuggestion]);
+    sendMessage({ text });
+  }, [input, isLoading, clearSuggestion, sendMessage]);
 
   const handleInputChange = (value: string) => {
     setInput(value);
@@ -333,11 +260,9 @@ function AgentRoute() {
             <h1 className="text-3xl font-bold mb-2">Agent Chat</h1>
             <p className="text-base text-muted-foreground">
               AI agent with auto-discovered tools from all AppKit plugins.
-              {threadId && (
-                <span className="ml-2 text-xs font-mono opacity-60">
-                  Thread: {threadId.slice(0, 8)}...
-                </span>
-              )}
+              <span className="ml-2 text-xs font-mono opacity-60">
+                Chat: {chatId.slice(0, 8)}...
+              </span>
             </p>
           </div>
           {hasAutocomplete && (
@@ -363,22 +288,28 @@ function AgentRoute() {
                 </div>
               )}
 
-              {messages.map((msg) => (
-                <div
-                  key={msg.id}
-                  className={`flex ${msg.role === "user" ? "justify-end" : "justify-start"}`}
-                >
+              {messages.map((msg) => {
+                const body = messageBodyText(msg);
+                if (!body) return null;
+                return (
                   <div
-                    className={`max-w-[85%] rounded-lg px-4 py-2 ${
-                      msg.role === "user"
-                        ? "bg-primary text-primary-foreground"
-                        : "bg-muted"
+                    key={msg.id}
+                    className={`flex ${
+                      msg.role === "user" ? "justify-end" : "justify-start"
                     }`}
                   >
-                    <p className="whitespace-pre-wrap text-sm">{msg.content}</p>
+                    <div
+                      className={`max-w-[85%] rounded-lg px-4 py-2 ${
+                        msg.role === "user"
+                          ? "bg-primary text-primary-foreground"
+                          : "bg-muted"
+                      }`}
+                    >
+                      <p className="whitespace-pre-wrap text-sm">{body}</p>
+                    </div>
                   </div>
-                </div>
-              ))}
+                );
+              })}
 
               {pendingApprovals.map((approval) => (
                 <div key={approval.approvalId} className="flex justify-start">
@@ -419,17 +350,23 @@ function AgentRoute() {
                 </div>
               ))}
 
-              {isLoading &&
-                pendingApprovals.length === 0 &&
-                messages[messages.length - 1]?.role === "user" && (
-                  <div className="flex justify-start">
-                    <div className="bg-muted rounded-lg px-4 py-2">
-                      <p className="text-sm text-muted-foreground animate-pulse">
-                        Thinking...
-                      </p>
-                    </div>
+              {showThinking && (
+                <div className="flex justify-start">
+                  <div className="bg-muted rounded-lg px-4 py-2">
+                    <p className="text-sm text-muted-foreground animate-pulse">
+                      Thinking...
+                    </p>
                   </div>
-                )}
+                </div>
+              )}
+
+              {error && (
+                <div className="flex justify-start">
+                  <div className="max-w-[85%] rounded-lg border border-red-500/60 bg-red-500/10 px-4 py-2">
+                    <p className="text-sm">Error: {error.message}</p>
+                  </div>
+                </div>
+              )}
 
               <div ref={messagesEndRef} />
             </div>
@@ -454,7 +391,7 @@ function AgentRoute() {
               <form
                 onSubmit={(e) => {
                   e.preventDefault();
-                  sendMessage();
+                  submit();
                 }}
                 className="flex gap-2"
               >
@@ -482,7 +419,7 @@ function AgentRoute() {
                       }
                       if (e.key === "Enter" && !e.shiftKey && !suggestion) {
                         e.preventDefault();
-                        sendMessage();
+                        submit();
                       }
                     }}
                     placeholder="Ask a question..."
@@ -491,77 +428,146 @@ function AgentRoute() {
                     className="w-full rounded-md border border-input bg-transparent px-3 py-2 text-sm ring-offset-background placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring disabled:opacity-50 resize-none"
                   />
                 </div>
-                <Button
-                  type="submit"
-                  disabled={isLoading || !input.trim()}
-                  className="self-end"
-                >
-                  Send
-                </Button>
+                {isLoading ? (
+                  <Button
+                    type="button"
+                    variant="outline"
+                    onClick={stop}
+                    className="self-end"
+                  >
+                    Stop
+                  </Button>
+                ) : (
+                  <Button
+                    type="submit"
+                    disabled={!input.trim()}
+                    className="self-end"
+                  >
+                    Send
+                  </Button>
+                )}
               </form>
             </div>
           </div>
 
-          <div className="w-80 shrink-0 flex flex-col border rounded-lg bg-card">
-            <div className="px-3 py-2 border-b">
-              <h3 className="text-sm font-semibold text-muted-foreground">
-                Event Stream
-              </h3>
-            </div>
-            <div className="flex-1 overflow-y-auto p-3 space-y-1">
-              {events.length === 0 && (
-                <p className="text-xs text-muted-foreground/50 text-center py-8">
-                  Events will appear here
-                </p>
-              )}
-              {events.map((event, i) => {
-                let detail: string;
-                switch (event.type) {
-                  case "response.output_text.delta":
-                    detail = event.delta?.slice(0, 60) ?? "";
-                    break;
-                  case "response.output_item.added":
-                  case "response.output_item.done":
-                    detail =
-                      event.item?.type === "function_call"
-                        ? `${event.item.name}(${(event.item.arguments ?? "").slice(0, 40)})`
-                        : event.item?.type === "function_call_output"
-                          ? (event.item.output?.slice(0, 60) ?? "")
-                          : (event.item?.status ?? event.item?.type ?? "");
-                    break;
-                  case "response.completed":
-                    detail = "done";
-                    break;
-                  case "error":
-                    detail = event.error ?? "unknown";
-                    break;
-                  case "appkit.metadata":
-                    detail = JSON.stringify(event.data).slice(0, 60);
-                    break;
-                  case "appkit.thinking":
-                    detail = event.content?.slice(0, 60) ?? "";
-                    break;
-                  default:
-                    detail = JSON.stringify(event).slice(0, 60);
-                }
-                return (
-                  <div
-                    key={`${event.type}-${i}`}
-                    className="font-mono text-xs text-muted-foreground"
-                  >
-                    <span className="inline-block w-24 text-right mr-2 opacity-50">
-                      {event.type
-                        .replace("response.", "")
-                        .replace("appkit.", "")}
-                    </span>
-                    <span className="opacity-80 break-all">{detail}</span>
-                  </div>
-                );
-              })}
-            </div>
-          </div>
+          <EventStreamPanel messages={messages} approvals={pendingApprovals} />
         </div>
       </div>
     </div>
   );
 }
+
+interface EventStreamRow {
+  /** Stable React key. */
+  key: string;
+  /** Short label rendered in the left column. */
+  label: string;
+  /** Free-form right-column detail. */
+  detail: string;
+}
+
+/**
+ * Right-hand debug panel. Renders one terse row per recognised message part
+ * (text, reasoning, dynamic-tool, step-start, data-*); other part types are
+ * skipped. Payload excerpts are capped at 80 chars. Approval prompts arrive
+ * via `onData`, not as message parts, so they are appended from `approvals`.
+ */
+function EventStreamPanel({
+  messages,
+  approvals,
+}: {
+  messages: VercelAIAgentUIMessage[];
+  approvals: PendingApproval[];
+}) {
+  const rows: EventStreamRow[] = [];
+
+  for (const message of messages) {
+    let partIndex = 0;
+    for (const part of message.parts) {
+      const key = `${message.id}:${partIndex++}`;
+      if (part.type === "text") {
+        rows.push({
+          key,
+          label: message.role === "user" ? "user" : "text",
+          detail: part.text.slice(0, 80),
+        });
+      } else if (part.type === "reasoning") {
+        rows.push({
+          key,
+          label: "reasoning",
+          detail: part.text.slice(0, 80),
+        });
+      } else if (part.type === "dynamic-tool") {
+        const detail =
+          part.state === "output-available"
+            ? safeStringify(part.output).slice(0, 80)
+            : part.state === "output-error"
+              ? `error: ${part.errorText}`.slice(0, 80)
+              : safeStringify(part.input).slice(0, 80);
+        rows.push({
+          key,
+          label: `tool:${part.toolName}`,
+          detail: `${part.state} ${detail}`,
+        });
+      } else if (part.type === "step-start") {
+        rows.push({ key, label: "step", detail: "start" });
+      } else if (
+        typeof part.type === "string" &&
+        part.type.startsWith("data-")
+      ) {
+        const data = (part as { data?: unknown }).data;
+        rows.push({
+          key,
+          label: part.type.replace(/^data-/, "data:"),
+          detail: safeStringify(data).slice(0, 80),
+        });
+      }
+    }
+  }
+
+  for (const approval of approvals) {
+    rows.push({
+      key: `pending:${approval.approvalId}`,
+      label: "approval",
+      detail: `pending: ${approval.toolName}`,
+    });
+  }
+
+  return (
+    <div className="w-80 shrink-0 flex flex-col border rounded-lg bg-card">
+      <div className="px-3 py-2 border-b">
+        <h3 className="text-sm font-semibold text-muted-foreground">
+          Event Stream
+        </h3>
+      </div>
+      <div className="flex-1 overflow-y-auto p-3 space-y-1">
+        {rows.length === 0 && (
+          <p className="text-xs text-muted-foreground/50 text-center py-8">
+            Events will appear here
+          </p>
+        )}
+        {rows.map((row) => (
+          <div
+            key={row.key}
+            className="font-mono text-xs text-muted-foreground"
+          >
+            <span className="inline-block w-24 text-right mr-2 opacity-50">
+              {row.label}
+            </span>
+            <span className="opacity-80 break-all">{row.detail}</span>
+          </div>
+        ))}
+      </div>
+    </div>
+  );
+}
+
+// Strings pass through; undefined → ""; JSON failures fall back to String().
+function safeStringify(value: unknown): string {
+  if (typeof value === "string" || value === undefined) return value ?? "";
+  try {
+    return JSON.stringify(value) ?? "";
+  } catch {
+    return String(value);
+  }
+}
diff --git a/apps/dev-playground/package.json b/apps/dev-playground/package.json
index add84abe9..d9e2fbf10 100644
--- a/apps/dev-playground/package.json
+++ b/apps/dev-playground/package.json
@@ -31,7 +31,8 @@
     "drizzle-orm": "0.45.1",
     "reflect-metadata": "0.2.2",
     "sequelize": "6.37.7",
-    "typeorm": "0.3.28"
+    "typeorm": "0.3.28",
+    "zod": "^4.1.13"
   },
   "devDependencies": {
     "@playwright/test": "1.58.1",
diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index 80cda55e4..3d05f4738 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -48,14 +48,18 @@ import {
 } from "./http-tool-executor";
 import manifest from "./manifest.json";
 import { composePromptForAgent, normalizeAutoInherit } from "./prompt";
+import { detectChatProtocol, extractVercelAIUserText } from "./protocol";
 import { printRegistry } from "./registry-printer";
 import {
   approvalRequestSchema,
   chatRequestSchema,
   invocationsRequestSchema,
+  vercelAIChatRequestSchema,
 } from "./schemas";
 import { InMemoryThreadStore } from "./thread-store";
 import { ToolApprovalGate } from "./tool-approval-gate";
+import type { AgentEventStreamTranslator } from "./translator";
+import { VercelAIUIMessageStreamTranslator } from "./vercel-ai-ui-message-stream-translator";
 
 const logger = createLogger("agents");
 
@@ -665,6 +669,18 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
   }
 
   private async _handleChat(req: express.Request, res: express.Response) {
+    // Content-negotiate the wire protocol. Default is the Responses-API SSE
+    // shape used by AppKit's existing UI; clients sending the Vercel AI SDK
+    // vendor MIME (emitted by `@ai-sdk/react`'s `useChat` via our
+    // configured `Accept` header) get the UI Message Stream protocol
+    // instead. The two protocols share the same engine — only the request
+    // body shape and the on-the-wire translator differ.
+    const protocol = detectChatProtocol(req);
+
+    if (protocol === "vercel-ai-ui-message-stream") {
+      return this._handleVercelAIChat(req, res);
+    }
+
     const parsed = chatRequestSchema.safeParse(req.body);
     if (!parsed.success) {
       res.status(400).json({
@@ -718,6 +734,97 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     return this._streamAgent(req, res, registered, thread, userId);
   }
 
+  /**
+   * Vercel AI SDK UI Message Stream branch of `_handleChat`, taken when
+   * `detectChatProtocol(req)` selects that protocol. The request body
+   * is the shape `@ai-sdk/react`'s `DefaultChatTransport` produces:
+   * `{ id, messages, trigger?, ... }`.
+   *
+   * The chat `id` is looked up as an AppKit `threadId`; when no such thread
+   * exists for the user a fresh one is created. Only the last entry of
+   * `messages` is read, and only its text parts form the user turn.
+   */
+  private async _handleVercelAIChat(
+    req: express.Request,
+    res: express.Response,
+  ) {
+    const parsed = vercelAIChatRequestSchema.safeParse(req.body);
+    if (!parsed.success) {
+      res.status(400).json({
+        error: "Invalid request",
+        details: parsed.error.flatten().fieldErrors,
+      });
+      return;
+    }
+    const { id: chatId, messages: uiMessages, agent: agentName } = parsed.data;
+
+    const lastMessage = uiMessages.at(-1);
+    if (!lastMessage || lastMessage.role !== "user") {
+      res.status(400).json({
+        error:
+          "Vercel AI SDK chat request must end with a user message; got role " +
+          (lastMessage?.role ?? "<empty>"),
+      });
+      return;
+    }
+
+    const userText = extractVercelAIUserText(lastMessage.parts);
+    if (!userText) {
+      res.status(400).json({
+        error: "Last user message has no text content",
+      });
+      return;
+    }
+
+    const registered = this.resolveAgent(agentName);
+    if (!registered) {
+      res.status(400).json({
+        error: agentName
+          ? `Agent "${agentName}" not found`
+          : "No agent registered",
+      });
+      return;
+    }
+
+    const userId = this.resolveUserId(req);
+
+    const limits = this.resolvedLimits;
+    if (this.countUserStreams(userId) >= limits.maxConcurrentStreamsPerUser) {
+      res.setHeader("Retry-After", "5");
+      res.status(429).json({
+        error: `Too many concurrent streams for this user (limit ${limits.maxConcurrentStreamsPerUser}). Wait for an existing stream to complete before starting another.`,
+      });
+      return;
+    }
+
+    // The chat id is tried as the thread id: if the store has a thread
+    // under `chatId` for this user, the turn is appended to it.
+    // NOTE(review): the fallback below creates a thread with a
+    // store-allocated id, so unless that id is fed back as the chat id,
+    // the next request's `get(chatId)` presumably misses again and each
+    // turn starts a new thread — confirm against the thread-store.
+    let thread = await this.threadStore.get(chatId, userId);
+    if (!thread) {
+      // The thread-store API allocates ids itself; we cannot force it to
+      // mint a thread under `chatId`. Best-effort: create a fresh thread
+      // for the user. The chat id will still be the stable client-side
+      // handle the UI uses.
+      thread = await this.threadStore.create(userId);
+    }
+
+    const userMessage: Message = {
+      id: randomUUID(),
+      role: "user",
+      content: userText,
+      createdAt: new Date(),
+    };
+    await this.threadStore.addMessage(thread.id, userId, userMessage);
+
+    return this._streamAgent(req, res, registered, thread, userId, {
+      translatorFactory: () => new VercelAIUIMessageStreamTranslator(),
+    });
+  }
+
   private async _handleInvocations(
     req: express.Request,
     res: express.Response,
@@ -766,12 +873,20 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     return this._streamAgent(req, res, registered, thread, userId);
   }
 
-  private async _streamAgent(
+  private async _streamAgent<T = ResponseStreamEvent>(
     req: express.Request,
     res: express.Response,
     registered: RegisteredAgent,
     thread: Thread,
     userId: string,
+    options?: {
+      /**
+       * Wire-protocol translator factory. Defaults to the legacy
+       * Responses-API SSE translator. The Vercel AI SDK UI Message Stream
+       * branch passes its own factory.
+       */
+      translatorFactory?: () => AgentEventStreamTranslator<T>;
+    },
   ): Promise<void> {
     const abortController = new AbortController();
     const signal = abortController.signal;
@@ -780,8 +895,10 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
 
     const tools = Array.from(registered.toolIndex.values()).map((e) => e.def);
     const limits = this.resolvedLimits;
-    const outboundEvents = new EventChannel<ResponseStreamEvent>();
-    const translator = new AgentEventTranslator();
+    const outboundEvents = new EventChannel<T>();
+    const translator: AgentEventStreamTranslator<T> = options?.translatorFactory
+      ? options.translatorFactory()
+      : (new AgentEventTranslator() as unknown as AgentEventStreamTranslator<T>);
     // Per-run tool-call budget shared across the top-level adapter and any
     // sub-agents it delegates to. Counted pre-dispatch so a prompt-injected
     // agent cannot drain the budget silently via denied calls.
@@ -912,7 +1029,7 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
       outboundEvents.close();
     })();
 
-    await this.executeStream<ResponseStreamEvent>(
+    await this.executeStream<T>(
       res,
       async function* () {
         try {
diff --git a/packages/appkit/src/plugins/agents/event-translator.ts b/packages/appkit/src/plugins/agents/event-translator.ts
index 54d749fb0..e4e877c4e 100644
--- a/packages/appkit/src/plugins/agents/event-translator.ts
+++ b/packages/appkit/src/plugins/agents/event-translator.ts
@@ -6,6 +6,7 @@ import type {
   ResponseOutputMessage,
   ResponseStreamEvent,
 } from "shared";
+import type { AgentEventStreamTranslator } from "./translator";
 
 /**
  * Translates internal `AgentEvent` stream into Responses API SSE events.
@@ -23,7 +24,9 @@ import type {
  * added, so subsequent text resumes as a new message item at a strictly
  * later index.
  */
-export class AgentEventTranslator {
+export class AgentEventTranslator
+  implements AgentEventStreamTranslator<ResponseStreamEvent>
+{
   private seqNum = 0;
   private nextOutputIndex = 0;
   private currentMessage: {
diff --git a/packages/appkit/src/plugins/agents/http-tool-executor.ts b/packages/appkit/src/plugins/agents/http-tool-executor.ts
index 5217ab414..e596ff1d0 100644
--- a/packages/appkit/src/plugins/agents/http-tool-executor.ts
+++ b/packages/appkit/src/plugins/agents/http-tool-executor.ts
@@ -8,8 +8,8 @@ import { dispatchToolCall } from "../../core/agent/tool-dispatch";
 import type { ResolvedToolEntry } from "../../core/agent/types";
 import type { PluginContext } from "../../core/plugin-context";
 import type { EventChannel } from "./event-channel";
-import type { AgentEventTranslator } from "./event-translator";
 import type { ToolApprovalGate } from "./tool-approval-gate";
+import type { AgentEventStreamTranslator } from "./translator";
 
 /**
  * Decision returned by the approval check. `null` means "no gate fires"
@@ -52,15 +52,19 @@ export interface ToolBudget {
   limit: number;
 }
 
-interface HttpToolExecutorDeps {
+interface HttpToolExecutorDeps<T> {
   toolIndex: Map<string, ResolvedToolEntry>;
   /** Approval policy as resolved from `agents({ approval: ... })`. */
   approvalPolicy: { requireForDestructive: boolean; timeoutMs: number };
   approvalGate: ToolApprovalGate;
-  /** Translator used to emit `approval_pending` to the SSE stream. */
-  translator: AgentEventTranslator;
-  /** Channel the SSE stream drains. Approval events are pushed here. */
-  outboundEvents: EventChannel<ResponseStreamEvent>;
+  /**
+   * Translator used to emit `approval_pending` to the outbound stream.
+   * Generic in `T` so the same executor works for the legacy
+   * Responses-API SSE wire format and the Vercel AI UI Message Stream.
+   */
+  translator: AgentEventStreamTranslator<T>;
+  /** Channel the outbound stream drains. Approval events are pushed here. */
+  outboundEvents: EventChannel<T>;
   /** Aborted on budget exhaustion to unwind the adapter promptly. */
   abortController: AbortController;
   /**
@@ -99,8 +103,8 @@ interface HttpToolExecutorDeps {
  * the top-level cap — the parent already incremented when it dispatched
  * the `agent-<key>` call.
  */
-export class HttpToolExecutor implements ToolExecutor {
-  constructor(private deps: HttpToolExecutorDeps) {}
+export class HttpToolExecutor<T = ResponseStreamEvent> implements ToolExecutor {
+  constructor(private deps: HttpToolExecutorDeps<T>) {}
 
   async execute(
     name: string,
diff --git a/packages/appkit/src/plugins/agents/protocol.ts b/packages/appkit/src/plugins/agents/protocol.ts
new file mode 100644
index 000000000..5e874bd2b
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/protocol.ts
@@ -0,0 +1,47 @@
+import type express from "express";
+import { VERCEL_AI_UI_MESSAGE_STREAM_MIME } from "shared";
+
+type ChatProtocol = "responses-api" | "vercel-ai-ui-message-stream";
+
+/**
+ * Choose the wire protocol for a chat request. Returns the Vercel AI UI
+ * Message Stream when the lower-cased `Accept` header contains its vendor
+ * MIME or the trimmed `x-appkit-protocol` header names it (an opt-in for
+ * callers without Accept control); otherwise `"responses-api"`.
+ */
+export function detectChatProtocol(req: express.Request): ChatProtocol {
+  const vercel: ChatProtocol = "vercel-ai-ui-message-stream";
+
+  const acceptHeader = req.headers.accept ?? "";
+  const viaAccept = acceptHeader
+    .toLowerCase()
+    .includes(VERCEL_AI_UI_MESSAGE_STREAM_MIME);
+  if (viaAccept) return vercel;
+
+  const override = req.headers["x-appkit-protocol"];
+  const viaHeader = typeof override === "string" && override.trim() === vercel;
+  return viaHeader ? vercel : "responses-api";
+}
+
+/**
+ * Extract user text from a Vercel AI SDK `UIMessage.parts` array. The SDK
+ * supports many part types (text, file, reasoning, tool-* …); for the
+ * purposes of seeding the agent's user turn we only care about text
+ * parts. File and tool-call parts in the inbound message are ignored
+ * because the agent loop runs server-side and does not need the client's
+ * locally-rendered tool history.
+ */
+export function extractVercelAIUserText(parts: unknown[]): string {
+  // A usable part is a non-null object shaped `{ type: "text", text: string }`.
+  const isTextPart = (p: unknown): p is { type: "text"; text: string } =>
+    typeof p === "object" &&
+    p !== null &&
+    (p as { type?: unknown }).type === "text" &&
+    typeof (p as { text?: unknown }).text === "string";
+  // Concatenate in input order with no separator; other parts are skipped.
+  let joined = "";
+  for (const p of parts) {
+    if (isTextPart(p)) joined += p.text;
+  }
+  return joined;
+}
diff --git a/packages/appkit/src/plugins/agents/schemas.ts b/packages/appkit/src/plugins/agents/schemas.ts
index cea6c6d64..0b70ad047 100644
--- a/packages/appkit/src/plugins/agents/schemas.ts
+++ b/packages/appkit/src/plugins/agents/schemas.ts
@@ -67,3 +67,30 @@ export const approvalRequestSchema = z.object({
   approvalId: z.string().min(1, "approvalId is required"),
   decision: z.enum(["approve", "deny"]),
 });
+
+// Vercel AI SDK `DefaultChatTransport` request shape (from `@ai-sdk/react`).
+// Mirrors the body produced by useChat's default transport. Selected at
+// runtime when the request advertises `Accept: application/vnd.ai-sdk.ui-message-stream`.
+//
+// `id` carries the chat id. `parts` entries are validated only as `unknown`
+// (no `any` leaks into the inferred type); consumers must narrow each part.
+export const vercelAIChatRequestSchema = z.object({
+  id: z.string().min(1, "id is required"),
+  messages: z
+    .array(
+      z.object({
+        id: z.string(),
+        role: z.enum(["user", "assistant", "system"]),
+        parts: z.array(z.unknown()),
+        metadata: z.unknown().optional(),
+      }),
+    )
+    .min(1, "messages must not be empty")
+    .max(
+      MAX_INVOCATIONS_INPUT_ITEMS,
+      `messages exceeds the ${MAX_INVOCATIONS_INPUT_ITEMS}-item limit`,
+    ),
+  trigger: z.enum(["submit-message", "regenerate-message"]).optional(),
+  messageId: z.string().optional(),
+  agent: z.string().optional(),
+});
diff --git a/packages/appkit/src/plugins/agents/tests/vercel-ai-ui-message-stream-translator.test.ts b/packages/appkit/src/plugins/agents/tests/vercel-ai-ui-message-stream-translator.test.ts
new file mode 100644
index 000000000..1cfbd2b14
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/vercel-ai-ui-message-stream-translator.test.ts
@@ -0,0 +1,256 @@
+import { describe, expect, test } from "vitest";
+import {
+  type VercelAIUIMessageChunk,
+  VercelAIUIMessageStreamTranslator,
+} from "../vercel-ai-ui-message-stream-translator";
+
+/**
+ * Rewrites random ids in translator output so assertions can use fixed
+ * values: a non-empty `start.messageId` becomes "msg_1"; each distinct text
+ * or reasoning span id becomes `<kind>_<n>`, numbered per kind in first-seen
+ * order, so deltas can still be matched to their start/end chunks.
+ */
+function normalize(chunks: VercelAIUIMessageChunk[]): VercelAIUIMessageChunk[] {
+  const seen = new Map<string, string>();
+  const counts: Record<string, number> = {};
+  const slot = (kind: string, id: string): string => {
+    const key = `${kind}:${id}`;
+    if (!seen.has(key)) {
+      counts[kind] = (counts[kind] ?? 0) + 1;
+      seen.set(key, `${kind}_${counts[kind]}`);
+    }
+    return seen.get(key) as string;
+  };
+  return chunks.map((c) => {
+    switch (c.type) {
+      case "start":
+        return { ...c, messageId: c.messageId ? "msg_1" : c.messageId };
+      case "text-start":
+      case "text-delta":
+      case "text-end":
+        return { ...c, id: slot("text", c.id) };
+      case "reasoning-start":
+      case "reasoning-delta":
+      case "reasoning-end":
+        return { ...c, id: slot("reasoning", c.id) };
+      default:
+        return c;
+    }
+  });
+}
+
+describe("VercelAIUIMessageStreamTranslator", () => {
+  test("emits exactly one start chunk on the first event", () => {
+    const t = new VercelAIUIMessageStreamTranslator();
+    const a = t.translate({ type: "message_delta", content: "hello" });
+    const b = t.translate({ type: "message_delta", content: " world" });
+    const startChunks = [...a, ...b].filter((c) => c.type === "start");
+    expect(startChunks).toHaveLength(1);
+    expect(startChunks[0]).toMatchObject({ type: "start" });
+    expect((startChunks[0] as { messageId?: string }).messageId).toMatch(
+      /^msg_/,
+    );
+  });
+
+  test("opens text span lazily and reuses the same id across deltas", () => {
+    const t = new VercelAIUIMessageStreamTranslator();
+    const out = normalize([
+      ...t.translate({ type: "message_delta", content: "he" }),
+      ...t.translate({ type: "message_delta", content: "llo" }),
+      ...t.finalize(),
+    ]);
+
+    expect(out).toEqual([
+      { type: "start", messageId: "msg_1" },
+      { type: "text-start", id: "text_1" },
+      { type: "text-delta", id: "text_1", delta: "he" },
+      { type: "text-delta", id: "text_1", delta: "llo" },
+      { type: "text-end", id: "text_1" },
+      { type: "finish" },
+    ]);
+  });
+
+  test("closes open text-span before a tool-call", () => {
+    const t = new VercelAIUIMessageStreamTranslator();
+    const out = normalize([
+      ...t.translate({ type: "message_delta", content: "thinking..." }),
+      ...t.translate({
+        type: "tool_call",
+        callId: "call_1",
+        name: "search",
+        args: { q: "x" },
+      }),
+      ...t.translate({
+        type: "tool_result",
+        callId: "call_1",
+        result: { hits: 3 },
+      }),
+      ...t.translate({ type: "message_delta", content: "done" }),
+      ...t.finalize(),
+    ]);
+
+    expect(out).toEqual([
+      { type: "start", messageId: "msg_1" },
+      { type: "text-start", id: "text_1" },
+      { type: "text-delta", id: "text_1", delta: "thinking..." },
+      { type: "text-end", id: "text_1" },
+      {
+        type: "tool-input-available",
+        toolCallId: "call_1",
+        toolName: "search",
+        input: { q: "x" },
+      },
+      {
+        type: "tool-output-available",
+        toolCallId: "call_1",
+        output: { hits: 3 },
+      },
+      { type: "text-start", id: "text_2" },
+      { type: "text-delta", id: "text_2", delta: "done" },
+      { type: "text-end", id: "text_2" },
+      { type: "finish" },
+    ]);
+  });
+
+  test("emits tool-output-error when tool_result carries an error", () => {
+    const t = new VercelAIUIMessageStreamTranslator();
+    const out = normalize([
+      ...t.translate({
+        type: "tool_call",
+        callId: "call_1",
+        name: "search",
+        args: {},
+      }),
+      ...t.translate({
+        type: "tool_result",
+        callId: "call_1",
+        result: undefined,
+        error: "Tool blew up",
+      }),
+      ...t.finalize(),
+    ]);
+
+    expect(out).toContainEqual({
+      type: "tool-output-error",
+      toolCallId: "call_1",
+      errorText: "Tool blew up",
+    });
+    expect(out.some((c) => c.type === "tool-output-available")).toBe(false);
+  });
+
+  test("forwards approval_pending as a data-approval-pending part keyed by approvalId", () => {
+    const t = new VercelAIUIMessageStreamTranslator();
+    t.translate({ type: "message_delta", content: "pre" });
+    const chunks = t.translate({
+      type: "approval_pending",
+      approvalId: "appr_1",
+      streamId: "stream_1",
+      toolName: "delete_view",
+      args: { id: 42 },
+      annotations: { effect: "destructive" },
+    });
+
+    const dataPart = chunks.find(
+      (c) => c.type === "data-approval-pending",
+    ) as Extract<VercelAIUIMessageChunk, { type: `data-${string}` }>;
+
+    expect(dataPart).toBeDefined();
+    expect(dataPart.id).toBe("appr_1");
+    expect(dataPart.data).toEqual({
+      approvalId: "appr_1",
+      streamId: "stream_1",
+      toolName: "delete_view",
+      args: { id: 42 },
+      annotations: { effect: "destructive" },
+    });
+    // Approval is concurrent with an open text span — must NOT close it.
+    expect(chunks.some((c) => c.type === "text-end")).toBe(false);
+  });
+
+  test("opens reasoning lazily, closes before a text-delta", () => {
+    const t = new VercelAIUIMessageStreamTranslator();
+    const out = normalize([
+      ...t.translate({ type: "thinking", content: "let me see..." }),
+      ...t.translate({ type: "message_delta", content: "result" }),
+      ...t.finalize(),
+    ]);
+
+    expect(out).toEqual([
+      { type: "start", messageId: "msg_1" },
+      { type: "reasoning-start", id: "reasoning_1" },
+      {
+        type: "reasoning-delta",
+        id: "reasoning_1",
+        delta: "let me see...",
+      },
+      { type: "reasoning-end", id: "reasoning_1" },
+      { type: "text-start", id: "text_1" },
+      { type: "text-delta", id: "text_1", delta: "result" },
+      { type: "text-end", id: "text_1" },
+      { type: "finish" },
+    ]);
+  });
+
+  test("metadata events become message-metadata chunks", () => {
+    const t = new VercelAIUIMessageStreamTranslator();
+    const out = t.translate({
+      type: "metadata",
+      data: { threadId: "thread_42" },
+    });
+    expect(out).toContainEqual({
+      type: "message-metadata",
+      messageMetadata: { threadId: "thread_42" },
+    });
+  });
+
+  test("status: error closes spans and emits error+finish", () => {
+    const t = new VercelAIUIMessageStreamTranslator();
+    const out = normalize([
+      ...t.translate({ type: "message_delta", content: "halfway" }),
+      ...t.translate({
+        type: "status",
+        status: "error",
+        error: "boom",
+      }),
+    ]);
+
+    expect(out).toEqual([
+      { type: "start", messageId: "msg_1" },
+      { type: "text-start", id: "text_1" },
+      { type: "text-delta", id: "text_1", delta: "halfway" },
+      { type: "text-end", id: "text_1" },
+      { type: "error", errorText: "boom" },
+      { type: "finish" },
+    ]);
+  });
+
+  test("status: complete is treated as a terminator equivalent to finalize", () => {
+    const t = new VercelAIUIMessageStreamTranslator();
+    const out = normalize([
+      ...t.translate({ type: "message_delta", content: "ok" }),
+      ...t.translate({ type: "status", status: "complete" }),
+      ...t.finalize(),
+    ]);
+
+    expect(out.filter((c) => c.type === "finish")).toHaveLength(1);
+    expect(out.filter((c) => c.type === "text-end")).toHaveLength(1);
+  });
+
+  test("finalize is idempotent", () => {
+    const t = new VercelAIUIMessageStreamTranslator();
+    t.translate({ type: "message_delta", content: "hi" });
+    const first = t.finalize();
+    const second = t.finalize();
+
+    expect(first.filter((c) => c.type === "finish")).toHaveLength(1);
+    expect(second).toEqual([]);
+  });
+
+  test("status: running is silently dropped (no chunks)", () => {
+    const t = new VercelAIUIMessageStreamTranslator();
+    const out = t.translate({ type: "status", status: "running" });
+    // start is emitted because every translate() call may emit start; but
+    // no other content chunks should appear.
+    expect(out.filter((c) => c.type !== "start")).toEqual([]);
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/translator.ts b/packages/appkit/src/plugins/agents/translator.ts
new file mode 100644
index 000000000..671700d83
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/translator.ts
@@ -0,0 +1,27 @@
+import type { AgentEvent } from "shared";
+
+/**
+ * Stream-protocol-agnostic translator: converts AppKit's internal
+ * {@link AgentEvent} stream into a wire-specific event/chunk type `T`.
+ *
+ * One instance per streaming request — implementations are stateful (e.g.
+ * lazy text-message open/close, sequence numbers). Translators are
+ * exclusively output-side: they never decide what to invoke or how to call
+ * the model, only how to encode the agent's already-produced events.
+ *
+ * Concrete implementations:
+ * - `AgentEventTranslator` — Responses-API SSE wire format (legacy default).
+ * - `VercelAIUIMessageStreamTranslator` — Vercel AI SDK
+ *   {@link https://ai-sdk.dev/docs/ai-sdk-ui/stream-protocols UI Message Stream}
+ *   chunks consumed by `@ai-sdk/react`'s `useChat`.
+ */
+export interface AgentEventStreamTranslator<T> {
+  /** Translate a single internal event into zero or more wire chunks. */
+  translate(event: AgentEvent): T[];
+  /**
+   * Emit any terminal chunks (e.g. closing an open text item, a `finish`
+   * marker). Idempotent — safe to call multiple times; only the first call
+   * yields output.
+   */
+  finalize(): T[];
+}
diff --git a/packages/appkit/src/plugins/agents/vercel-ai-ui-message-stream-translator.ts b/packages/appkit/src/plugins/agents/vercel-ai-ui-message-stream-translator.ts
new file mode 100644
index 000000000..b1061e628
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/vercel-ai-ui-message-stream-translator.ts
@@ -0,0 +1,257 @@
+import { randomUUID } from "node:crypto";
+import type { AgentEvent } from "shared";
+import type { AgentEventStreamTranslator } from "./translator";
+
+/**
+ * Vercel AI SDK UI Message Stream wire chunks consumed by `@ai-sdk/react`'s
+ * `useChat`. We declare the subset we emit locally rather than importing
+ * from `ai` because that package is an optional peer dependency of AppKit.
+ *
+ * See {@link https://ai-sdk.dev/docs/ai-sdk-ui/stream-protocols} for the
+ * authoritative protocol definition.
+ */
+export type VercelAIUIMessageChunk =
+  | { type: "start"; messageId?: string }
+  | { type: "text-start"; id: string }
+  | { type: "text-delta"; id: string; delta: string }
+  | { type: "text-end"; id: string }
+  | { type: "reasoning-start"; id: string }
+  | { type: "reasoning-delta"; id: string; delta: string }
+  | { type: "reasoning-end"; id: string }
+  | {
+      type: "tool-input-available";
+      toolCallId: string;
+      toolName: string;
+      input: unknown;
+    }
+  | {
+      type: "tool-output-available";
+      toolCallId: string;
+      output: unknown;
+    }
+  | {
+      type: "tool-output-error";
+      toolCallId: string;
+      errorText: string;
+    }
+  | { type: "error"; errorText: string }
+  | {
+      type: "message-metadata";
+      messageMetadata: Record<string, unknown>;
+    }
+  | {
+      // Custom data part. The AppKit chat UI uses `data-approval-pending`
+      // to render the destructive-tool approval card. The `id` makes the
+      // part idempotent on the client (re-renders don't duplicate cards).
+      type: `data-${string}`;
+      id?: string;
+      data: unknown;
+      transient?: boolean;
+    }
+  | { type: "finish" };
+
+/**
+ * Translates AppKit's internal {@link AgentEvent} stream into Vercel AI SDK
+ * UI Message Stream chunks consumed by `@ai-sdk/react`'s `useChat`.
+ *
+ * Stateful: one instance per streaming request. Manages lazy lifecycle for
+ * the two streamable item kinds the protocol defines:
+ *
+ * - **text**: opened on the first `message_delta`, closed (`text-end`)
+ *   before a `thinking`, tool-call, tool-result or terminal status event
+ *   and by `finalize()`; `metadata` / `approval_pending` leave it open.
+ *   Each open span carries a stable `id` so deltas correlate client-side.
+ * - **reasoning**: the mirror image for `thinking` events (text closes it).
+ *
+ * `start` is emitted exactly once, by the first `translate()` (or
+ * `finalize()`) call, so the client can establish the message id up front.
+ *
+ * Approval gates ride as a `data-approval-pending` data part keyed by
+ * `approvalId` — the client matches the matching `POST /approve` decision
+ * back via the existing `streamId`/`approvalId` pair.
+ */
+export class VercelAIUIMessageStreamTranslator
+  implements AgentEventStreamTranslator<VercelAIUIMessageChunk>
+{
+  private startEmitted = false;
+  private currentTextId: string | null = null;
+  private currentReasoningId: string | null = null;
+  private finalized = false;
+
+  translate(event: AgentEvent): VercelAIUIMessageChunk[] {
+    const out: VercelAIUIMessageChunk[] = [];
+    this.maybeEmitStart(out);
+
+    switch (event.type) {
+      case "message_delta":
+        this.closeReasoning(out);
+        this.openTextIfNeeded(out);
+        out.push({
+          type: "text-delta",
+          id: this.currentTextId as string,
+          delta: event.content,
+        });
+        return out;
+
+      case "message":
+        // Adapter delivered a fully-materialised message in one shot. The
+        // content is emitted as a single delta into the open text span (or
+        // a freshly opened one) and the span is then closed.
+        // NOTE(review): if an adapter sends `message` after streaming the
+        // same text as `message_delta`s, the text is emitted twice — confirm.
+        this.closeReasoning(out);
+        this.openTextIfNeeded(out);
+        out.push({
+          type: "text-delta",
+          id: this.currentTextId as string,
+          delta: event.content,
+        });
+        this.closeText(out);
+        return out;
+
+      case "thinking":
+        this.closeText(out);
+        this.openReasoningIfNeeded(out);
+        out.push({
+          type: "reasoning-delta",
+          id: this.currentReasoningId as string,
+          delta: event.content,
+        });
+        return out;
+
+      case "tool_call":
+        this.closeText(out);
+        this.closeReasoning(out);
+        out.push({
+          type: "tool-input-available",
+          toolCallId: event.callId,
+          toolName: event.name,
+          input: event.args,
+        });
+        return out;
+
+      case "tool_result":
+        this.closeText(out);
+        this.closeReasoning(out);
+        if (event.error !== undefined) {
+          out.push({
+            type: "tool-output-error",
+            toolCallId: event.callId,
+            errorText: event.error,
+          });
+        } else {
+          out.push({
+            type: "tool-output-available",
+            toolCallId: event.callId,
+            output: event.result,
+          });
+        }
+        return out;
+
+      case "metadata":
+        // AppKit-internal `metadata` events surface things like the
+        // server-allocated thread id. Forward as `message-metadata` so the
+        // client gets it without bespoke wire shapes.
+        out.push({
+          type: "message-metadata",
+          messageMetadata: event.data,
+        });
+        return out;
+
+      case "approval_pending":
+        // Custom data part — does NOT close the open text/reasoning span,
+        // because the agent loop is paused on the approval gate and may
+        // resume the same span once the user decides.
+        out.push({
+          type: "data-approval-pending",
+          id: event.approvalId,
+          data: {
+            approvalId: event.approvalId,
+            streamId: event.streamId,
+            toolName: event.toolName,
+            args: event.args,
+            annotations: event.annotations,
+          },
+        });
+        return out;
+
+      case "status":
+        return this.handleStatus(event.status, event.error, out);
+    }
+  }
+
+  finalize(): VercelAIUIMessageChunk[] {
+    if (this.finalized) return [];
+    this.finalized = true;
+
+    const out: VercelAIUIMessageChunk[] = [];
+    this.maybeEmitStart(out);
+    this.closeText(out);
+    this.closeReasoning(out);
+    out.push({ type: "finish" });
+    return out;
+  }
+
+  private maybeEmitStart(out: VercelAIUIMessageChunk[]): void {
+    if (this.startEmitted) return;
+    this.startEmitted = true;
+    out.push({ type: "start", messageId: `msg_${randomUUID()}` });
+  }
+
+  private openTextIfNeeded(out: VercelAIUIMessageChunk[]): void {
+    if (this.currentTextId) return;
+    this.currentTextId = `text_${randomUUID()}`;
+    out.push({ type: "text-start", id: this.currentTextId });
+  }
+
+  private closeText(out: VercelAIUIMessageChunk[]): void {
+    if (!this.currentTextId) return;
+    out.push({ type: "text-end", id: this.currentTextId });
+    this.currentTextId = null;
+  }
+
+  private openReasoningIfNeeded(out: VercelAIUIMessageChunk[]): void {
+    if (this.currentReasoningId) return;
+    this.currentReasoningId = `reasoning_${randomUUID()}`;
+    out.push({ type: "reasoning-start", id: this.currentReasoningId });
+  }
+
+  private closeReasoning(out: VercelAIUIMessageChunk[]): void {
+    if (!this.currentReasoningId) return;
+    out.push({ type: "reasoning-end", id: this.currentReasoningId });
+    this.currentReasoningId = null;
+  }
+
+  private handleStatus(
+    status: string,
+    error: string | undefined,
+    out: VercelAIUIMessageChunk[],
+  ): VercelAIUIMessageChunk[] {
+    if (status === "error") {
+      // Spans are closed first so `error` never lands inside an open span.
+      this.closeText(out);
+      this.closeReasoning(out);
+      out.push({ type: "error", errorText: error ?? "Unknown error" });
+      // Pair `error` with `finish` so the client transitions out of
+      // streaming state rather than waiting indefinitely for more chunks.
+      // With both spans already closed, `finalize()` adds only `finish`,
+      // and nothing at all if the stream was finalized earlier.
+      out.push(...this.finalize());
+      return out;
+    }
+
+    if (status === "complete") {
+      // `complete` is the canonical happy-path terminator. Delegate to
+      // `finalize()` so the close-text + close-reasoning + finish ordering
+      // is shared with explicit caller-driven finalization. `finalize()`
+      // returns nothing when the stream is already finalized, and its
+      // `start` check is a no-op here because `translate()` has already
+      // emitted `start` before dispatching to this handler, so the chunks
+      // appended are exactly the span closers followed by `finish`.
+      out.push(...this.finalize());
+      return out;
+    }
+
+    return out;
+  }
+}
diff --git a/packages/appkit/src/registry/types.generated.ts b/packages/appkit/src/registry/types.generated.ts
index 7e38af9bd..348e74550 100644
--- a/packages/appkit/src/registry/types.generated.ts
+++ b/packages/appkit/src/registry/types.generated.ts
@@ -52,11 +52,7 @@ export type DatabasePermission = "CAN_CONNECT_AND_CREATE";
 export type PostgresPermission = "CAN_CONNECT_AND_CREATE";
 
 /** Permissions for GENIE_SPACE resources */
-export type GenieSpacePermission =
-  | "CAN_VIEW"
-  | "CAN_RUN"
-  | "CAN_EDIT"
-  | "CAN_MANAGE";
+export type GenieSpacePermission = "CAN_VIEW" | "CAN_RUN" | "CAN_EDIT" | "CAN_MANAGE";
 
 /** Permissions for EXPERIMENT resources */
 export type ExperimentPermission = "CAN_READ" | "CAN_EDIT" | "CAN_MANAGE";
@@ -81,10 +77,7 @@ export type ResourcePermission =
   | AppPermission;
 
 /** Permission hierarchy per resource type (weakest to strongest). Schema enum order. */
-export const PERMISSION_HIERARCHY_BY_TYPE: Record<
-  ResourceType,
-  readonly ResourcePermission[]
-> = {
+export const PERMISSION_HIERARCHY_BY_TYPE: Record<ResourceType, readonly ResourcePermission[]> = {
   [ResourceType.SECRET]: ["READ", "WRITE", "MANAGE"],
   [ResourceType.JOB]: ["CAN_VIEW", "CAN_MANAGE_RUN", "CAN_MANAGE"],
   [ResourceType.SQL_WAREHOUSE]: ["CAN_USE", "CAN_MANAGE"],
@@ -101,7 +94,4 @@ export const PERMISSION_HIERARCHY_BY_TYPE: Record<
 } as const;
 
 /** Set of valid permissions per type (for validation). */
-export const PERMISSIONS_BY_TYPE: Record<
-  ResourceType,
-  readonly ResourcePermission[]
-> = PERMISSION_HIERARCHY_BY_TYPE;
+export const PERMISSIONS_BY_TYPE: Record<ResourceType, readonly ResourcePermission[]> = PERMISSION_HIERARCHY_BY_TYPE;
diff --git a/packages/shared/src/chat-protocol.ts b/packages/shared/src/chat-protocol.ts
new file mode 100644
index 000000000..b1c9e5863
--- /dev/null
+++ b/packages/shared/src/chat-protocol.ts
@@ -0,0 +1,8 @@
+/**
+ * Vendor MIME type advertised by the Vercel AI SDK chat client so the
+ * server selects the UI Message Stream wire protocol. Shared between the
+ * agents plugin server and any client that wants to opt into the
+ * protocol via an `Accept` header.
+ */
+export const VERCEL_AI_UI_MESSAGE_STREAM_MIME =
+  "application/vnd.ai-sdk.ui-message-stream";
diff --git a/packages/shared/src/index.ts b/packages/shared/src/index.ts
index 9829729a7..a906fa491 100644
--- a/packages/shared/src/index.ts
+++ b/packages/shared/src/index.ts
@@ -1,5 +1,6 @@
 export * from "./agent";
 export * from "./cache";
+export * from "./chat-protocol";
 export * from "./execute";
 export * from "./genie";
 export * from "./plugin";
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index ad89c6b48..8c6a34ddf 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -147,6 +147,9 @@ importers:
       typeorm:
         specifier: 0.3.28
         version: 0.3.28(pg@8.18.0)
+      zod:
+        specifier: ^4.1.13
+        version: 4.1.13
     devDependencies:
       '@playwright/test':
         specifier: 1.58.1
@@ -5514,7 +5517,7 @@ packages:
   basic-ftp@5.0.5:
     resolution: {integrity: sha512-4Bcg1P8xhUuqcii/S0Z9wiHIrQVPMermM1any+MX5GeGD7faD3/msQUDGLol9wOcz4/jbg/WJnGqoJF6LiBdtg==}
     engines: {node: '>=10.0.0'}
-    deprecated: Security vulnerability fixed in 5.2.0, please upgrade
+    deprecated: Security vulnerability fixed in 5.2.1, please upgrade
 
   batch@0.6.1:
     resolution: {integrity: sha512-x+VAiMRL6UPkx+kudNvxTl6hB2XNNCG2r+7wixVfIYwu/2HKRXimwQyaumLjMveWvT2Hkd/cAJw+QBMfJ/EKVw==}

From beb7a439d3433be345c3a7e11b932ca1c6b6dc60 Mon Sep 17 00:00:00 2001
From: Hubert Zub <hubert.zub@databricks.com>
Date: Thu, 7 May 2026 09:24:41 +0200
Subject: [PATCH 46/46] feat(appkit-ui): add chat building blocks (provider,
 hooks, headless components)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

New subpath export @databricks/appkit-ui/react/chat with three layers:

- lib/ — pure utilities (transport, fetch error handlers, oauth helpers,
  Vercel AI SDK MIME re-export from shared, message conversion).
- hooks/ — data hooks (useChat, useChatHistory, useChatData,
  useScrollToBottom). Trivial context-reading wrappers (useChatSession,
  useChatConfig) are intentionally NOT exported — consumers call
  useChatContext directly.
- headless/ — render-prop components (Conversation, ChatInput,
  ChatHistoryList).

Errors live in their own module (errors.ts) so types.ts stays types-only.
The default prepareSendMessagesRequest body shape matches AppKit's
agents plugin ({ id, messages, trigger }); consumers targeting other
servers pass their own.

Signed-off-by: Hubert Zub <hubert.zub@databricks.com>
---
 apps/dev-playground/client/package-lock.json  |    1 +
 apps/dev-playground/client/package.json       |    1 +
 .../client/src/routes/agent.route.tsx         |  707 +++++------
 apps/dev-playground/server/index.ts           |    2 +-
 knip.json                                     |    8 +-
 packages/appkit-ui/package.json               |   28 +-
 packages/appkit-ui/src/react/chat/context.ts  |   25 +
 packages/appkit-ui/src/react/chat/errors.ts   |   86 ++
 .../src/react/chat/headless/chat-input.tsx    |   80 ++
 .../src/react/chat/headless/conversation.tsx  |   61 +
 .../src/react/chat/headless/history-list.tsx  |   25 +
 .../src/react/chat/headless/index.ts          |    3 +
 .../appkit-ui/src/react/chat/hooks/index.ts   |    4 +
 .../src/react/chat/hooks/use-chat-data.ts     |   84 ++
 .../src/react/chat/hooks/use-chat.ts          |  294 +++++
 .../src/react/chat/hooks/use-history.ts       |  105 ++
 .../react/chat/hooks/use-scroll-to-bottom.ts  |   63 +
 packages/appkit-ui/src/react/chat/index.ts    |   11 +
 .../appkit-ui/src/react/chat/lib/messages.ts  |   25 +
 .../appkit-ui/src/react/chat/lib/oauth.ts     |   32 +
 .../appkit-ui/src/react/chat/lib/protocol.ts  |    1 +
 .../appkit-ui/src/react/chat/lib/transport.ts |   43 +
 .../appkit-ui/src/react/chat/lib/utils.ts     |   56 +
 .../appkit-ui/src/react/chat/provider.tsx     |   87 ++
 packages/appkit-ui/src/react/chat/types.ts    |   86 ++
 packages/appkit-ui/tsdown.config.ts           |    1 +
 pnpm-lock.yaml                                | 1053 +++++++++--------
 27 files changed, 2116 insertions(+), 856 deletions(-)
 create mode 100644 packages/appkit-ui/src/react/chat/context.ts
 create mode 100644 packages/appkit-ui/src/react/chat/errors.ts
 create mode 100644 packages/appkit-ui/src/react/chat/headless/chat-input.tsx
 create mode 100644 packages/appkit-ui/src/react/chat/headless/conversation.tsx
 create mode 100644 packages/appkit-ui/src/react/chat/headless/history-list.tsx
 create mode 100644 packages/appkit-ui/src/react/chat/headless/index.ts
 create mode 100644 packages/appkit-ui/src/react/chat/hooks/index.ts
 create mode 100644 packages/appkit-ui/src/react/chat/hooks/use-chat-data.ts
 create mode 100644 packages/appkit-ui/src/react/chat/hooks/use-chat.ts
 create mode 100644 packages/appkit-ui/src/react/chat/hooks/use-history.ts
 create mode 100644 packages/appkit-ui/src/react/chat/hooks/use-scroll-to-bottom.ts
 create mode 100644 packages/appkit-ui/src/react/chat/index.ts
 create mode 100644 packages/appkit-ui/src/react/chat/lib/messages.ts
 create mode 100644 packages/appkit-ui/src/react/chat/lib/oauth.ts
 create mode 100644 packages/appkit-ui/src/react/chat/lib/protocol.ts
 create mode 100644 packages/appkit-ui/src/react/chat/lib/transport.ts
 create mode 100644 packages/appkit-ui/src/react/chat/lib/utils.ts
 create mode 100644 packages/appkit-ui/src/react/chat/provider.tsx
 create mode 100644 packages/appkit-ui/src/react/chat/types.ts

diff --git a/apps/dev-playground/client/package-lock.json b/apps/dev-playground/client/package-lock.json
index 80876cdcc..d741b3cad 100644
--- a/apps/dev-playground/client/package-lock.json
+++ b/apps/dev-playground/client/package-lock.json
@@ -26,6 +26,7 @@
         "react": "19.2.5",
         "react-dom": "19.2.5",
         "recharts": "3.4.1",
+        "swr": "2.4.1",
         "tailwind-merge": "3.3.1",
         "tailwindcss-animate": "1.0.7",
         "tw-animate-css": "1.4.0"
diff --git a/apps/dev-playground/client/package.json b/apps/dev-playground/client/package.json
index e302a32af..249ca306e 100644
--- a/apps/dev-playground/client/package.json
+++ b/apps/dev-playground/client/package.json
@@ -28,6 +28,7 @@
     "react": "19.2.5",
     "react-dom": "19.2.5",
     "recharts": "3.4.1",
+    "swr": "2.4.1",
     "tailwind-merge": "3.3.1",
     "tailwindcss-animate": "1.0.7",
     "tw-animate-css": "1.4.0"
diff --git a/apps/dev-playground/client/src/routes/agent.route.tsx b/apps/dev-playground/client/src/routes/agent.route.tsx
index 4a0dd39c8..a627c2481 100644
--- a/apps/dev-playground/client/src/routes/agent.route.tsx
+++ b/apps/dev-playground/client/src/routes/agent.route.tsx
@@ -1,9 +1,14 @@
-import { useChat } from "@ai-sdk/react";
 import { getPluginClientConfig } from "@databricks/appkit-ui/js";
 import { Button } from "@databricks/appkit-ui/react";
+import {
+  ChatInput,
+  ChatProvider,
+  Conversation,
+  generateUUID,
+} from "@databricks/appkit-ui/react/chat";
 import { createFileRoute } from "@tanstack/react-router";
-import { DefaultChatTransport } from "ai";
-import { useCallback, useEffect, useMemo, useRef, useState } from "react";
+import type { UIMessageChunk } from "ai";
+import { useCallback, useRef, useState } from "react";
 import {
   VERCEL_AI_UI_MESSAGE_STREAM_ACCEPT,
   type VercelAIAgentDataParts,
@@ -15,15 +20,14 @@ export const Route = createFileRoute("/agent")({
 });
 
 type ApprovalPendingPayload = VercelAIAgentDataParts["approval-pending"];
-
 type PendingApproval = ApprovalPendingPayload;
 
 /**
  * Inline-suggestion autocomplete still uses the legacy Responses-API SSE
  * shape on `/api/agents/chat`. The autocomplete agent runs as a one-shot
  * stateless completion (its `agent.md` flags `ephemeral: true`), so it
- * doesn't share the chat thread with the conversational `useChat` flow
- * and there's nothing to gain from migrating it here.
+ * doesn't share the chat thread with the conversational chat flow and
+ * there's nothing to gain from migrating it to the chat building blocks.
  */
 function useAutocomplete(enabled: boolean) {
   const [suggestion, setSuggestion] = useState("");
@@ -113,7 +117,7 @@ function useAutocomplete(enabled: boolean) {
 }
 
 /**
- * Concatenate all `text` parts of a message — `useChat` keeps text
+ * Concatenate all `text` parts of a message — the AI SDK keeps text
  * streamed across multiple `text-delta` chunks as a single `TextUIPart`,
  * but if the agent loop reopens text after a tool call, the message
  * carries multiple text parts. For chat-bubble rendering we want them
@@ -128,13 +132,38 @@ function messageBodyText(message: VercelAIAgentUIMessage): string {
 }
 
 function AgentRoute() {
+  // The dev-playground server doesn't expose `/config` or `/session`
+  // endpoints, so we hand-roll the provider state. `apiBase` is unused
+  // for the chat call itself (overridden via `api` on the conversation)
+  // and only feeds the disabled history/feedback paths.
+  return (
+    <ChatProvider
+      apiBase="/api/agents"
+      features={{ chatHistory: false, feedback: false }}
+      session={{ user: null }}
+    >
+      <AgentRouteInner />
+    </ChatProvider>
+  );
+}
+
+function AgentRouteInner() {
+  // Stable chat id seeded once per route mount. The agents plugin
+  // maps it 1:1 to its `threadId`, so a remount = a fresh thread.
+  const [chatId] = useState(() => generateUUID());
   const [pendingApprovals, setPendingApprovals] = useState<PendingApproval[]>(
     [],
   );
-
-  const messagesEndRef = useRef<HTMLDivElement>(null);
+  // Chronological log of every UIMessageChunk received over the stream.
+  // Fed by `onStreamPart` so it matches the raw-SSE fidelity of the
+  // pre-AI-SDK implementation (one row per chunk, not per message-part).
+  // We stamp each entry with a monotonic id so React keys stay stable
+  // without leaking through the chunk shape itself.
+  const [streamLog, setStreamLog] = useState<
+    Array<{ id: number; chunk: UIMessageChunk }>
+  >([]);
+  const nextChunkIdRef = useRef(0);
   const inputRef = useRef<HTMLTextAreaElement>(null);
-  const [input, setInput] = useState("");
 
   const agentConfig = getPluginClientConfig<{
     agents?: string[];
@@ -142,57 +171,12 @@ function AgentRoute() {
   }>("agents");
   const hasAutocomplete = (agentConfig.agents ?? []).includes("autocomplete");
 
-  const transport = useMemo(
-    () =>
-      new DefaultChatTransport<VercelAIAgentUIMessage>({
-        api: "/api/agents/chat",
-        headers: {
-          Accept: VERCEL_AI_UI_MESSAGE_STREAM_ACCEPT,
-        },
-      }),
-    [],
-  );
-
-  // We deliberately do NOT pass `id` to useChat. The hook auto-mints one
-  // through the AI SDK's own `generateId` (which doesn't depend on the
-  // browser's `crypto.randomUUID`, so it survives environments where the
-  // global is shimmed or stripped) and exposes it on the return value.
-  // The chat id is sent to the server as the request body `id` and the
-  // agents plugin maps it 1:1 to its `threadId`.
   const {
-    id: chatId,
-    messages,
-    sendMessage,
-    status,
-    error,
-    stop,
-  } = useChat<VercelAIAgentUIMessage>({
-    transport,
-    onData: (part) => {
-      if (part.type === "data-approval-pending") {
-        const payload = part.data as ApprovalPendingPayload;
-        setPendingApprovals((prev) =>
-          prev.some((p) => p.approvalId === payload.approvalId)
-            ? prev
-            : [...prev, payload],
-        );
-      }
-    },
-  });
-
-  const isLoading = status === "submitted" || status === "streaming";
-
-  // `useChat` creates the assistant `UIMessage` stub the moment the server
-  // emits its `start` chunk — well before any text-delta arrives. We want
-  // to show "Thinking..." until the assistant has produced visible text
-  // (either rendered tokens or a fully-materialised message). Tool-only
-  // turns therefore keep the indicator up until the model speaks.
-  const lastMessage = messages[messages.length - 1];
-  const lastAssistantHasText =
-    lastMessage?.role === "assistant" &&
-    messageBodyText(lastMessage).length > 0;
-  const showThinking =
-    isLoading && pendingApprovals.length === 0 && !lastAssistantHasText;
+    suggestion,
+    isLoading: isAutocompleting,
+    requestSuggestion,
+    clear: clearSuggestion,
+  } = useAutocomplete(hasAutocomplete);
 
   const decideApproval = useCallback(
     async (approvalId: string, decision: "approve" | "deny") => {
@@ -219,39 +203,6 @@ function AgentRoute() {
     [pendingApprovals],
   );
 
-  const {
-    suggestion,
-    isLoading: isAutocompleting,
-    requestSuggestion,
-    clear: clearSuggestion,
-  } = useAutocomplete(hasAutocomplete);
-
-  // biome-ignore lint/correctness/useExhaustiveDependencies: scroll on new messages
-  useEffect(() => {
-    messagesEndRef.current?.scrollIntoView({ behavior: "smooth" });
-  }, [messages]);
-
-  const submit = useCallback(() => {
-    const text = input.trim();
-    if (!text || isLoading) return;
-    clearSuggestion();
-    setInput("");
-    sendMessage({ text });
-  }, [input, isLoading, clearSuggestion, sendMessage]);
-
-  const handleInputChange = (value: string) => {
-    setInput(value);
-    requestSuggestion(value);
-  };
-
-  const acceptSuggestion = () => {
-    if (!suggestion) return;
-    const newValue = input + suggestion;
-    setInput(newValue);
-    clearSuggestion();
-    inputRef.current?.focus();
-  };
-
   return (
     <div className="min-h-screen bg-background">
       <div className="max-w-7xl mx-auto px-6 py-12">
@@ -259,7 +210,7 @@ function AgentRoute() {
           <div>
             <h1 className="text-3xl font-bold mb-2">Agent Chat</h1>
             <p className="text-base text-muted-foreground">
-              AI agent with auto-discovered tools from all AppKit plugins.
+              AI agent with auto-discovered tools from all plugins.
               <span className="ml-2 text-xs font-mono opacity-60">
                 Chat: {chatId.slice(0, 8)}...
               </span>
@@ -272,296 +223,352 @@ function AgentRoute() {
           )}
         </div>
 
-        <div className="flex gap-6 h-[700px]">
-          <div className="flex-1 flex flex-col border rounded-lg bg-card min-w-0">
-            <div className="flex-1 overflow-y-auto p-4 space-y-4">
-              {messages.length === 0 && (
-                <div className="text-center text-muted-foreground py-20">
-                  <p className="text-lg">
-                    Send a message to start a conversation
-                  </p>
-                  <p className="text-sm mt-2">
-                    The agent can use analytics, files, genie, and lakebase
-                    tools.
-                    {hasAutocomplete && " Start typing for inline suggestions."}
-                  </p>
-                </div>
-              )}
-
-              {messages.map((msg) => {
-                const body = messageBodyText(msg);
-                if (!body) return null;
-                return (
+        <Conversation<VercelAIAgentUIMessage>
+          id={chatId}
+          api="/api/agents/chat"
+          headers={{ Accept: VERCEL_AI_UI_MESSAGE_STREAM_ACCEPT }}
+          onData={(part) => {
+            if (part.type === "data-approval-pending") {
+              const payload = part.data as ApprovalPendingPayload;
+              setPendingApprovals((prev) =>
+                prev.some((p) => p.approvalId === payload.approvalId)
+                  ? prev
+                  : [...prev, payload],
+              );
+            }
+          }}
+          onStreamPart={(chunk) =>
+            setStreamLog((prev) => [
+              ...prev,
+              { id: nextChunkIdRef.current++, chunk },
+            ])
+          }
+        >
+          {({ messages, status, error, sendMessage, stop, containerRef }) => {
+            const isLoading = status === "submitted" || status === "streaming";
+            // The AI SDK creates the assistant `UIMessage` stub the moment
+            // the server emits its `start` chunk — well before any
+            // text-delta arrives. Show "Thinking..." until the assistant
+            // has produced visible text. Tool-only turns therefore keep
+            // the indicator up until the model speaks.
+            const lastMessage = messages[messages.length - 1];
+            const lastAssistantHasText =
+              lastMessage?.role === "assistant" &&
+              messageBodyText(lastMessage).length > 0;
+            const showThinking =
+              isLoading &&
+              pendingApprovals.length === 0 &&
+              !lastAssistantHasText;
+
+            return (
+              <div className="flex gap-6 h-[700px]">
+                <div className="flex-1 flex flex-col border rounded-lg bg-card min-w-0">
                   <div
-                    key={msg.id}
-                    className={`flex ${
-                      msg.role === "user" ? "justify-end" : "justify-start"
-                    }`}
+                    ref={containerRef}
+                    className="flex-1 overflow-y-auto p-4 space-y-4"
                   >
-                    <div
-                      className={`max-w-[85%] rounded-lg px-4 py-2 ${
-                        msg.role === "user"
-                          ? "bg-primary text-primary-foreground"
-                          : "bg-muted"
-                      }`}
-                    >
-                      <p className="whitespace-pre-wrap text-sm">{body}</p>
-                    </div>
-                  </div>
-                );
-              })}
-
-              {pendingApprovals.map((approval) => (
-                <div key={approval.approvalId} className="flex justify-start">
-                  <div className="max-w-[80%] rounded-lg border border-orange-500/60 bg-orange-500/10 px-4 py-3">
-                    <div className="mb-2 flex items-center gap-2">
-                      <span className="rounded bg-orange-600 px-2 py-0.5 text-xs font-semibold uppercase tracking-wide text-white">
-                        Destructive tool — approval required
-                      </span>
-                    </div>
-                    <div className="text-sm">
-                      <strong>{approval.toolName}</strong>
-                      <pre className="mt-1 max-h-52 overflow-auto whitespace-pre-wrap break-words rounded bg-background p-2 text-xs">
-                        {JSON.stringify(approval.args, null, 2)}
-                      </pre>
-                    </div>
-                    <div className="mt-3 flex justify-end gap-2">
-                      <Button
-                        type="button"
-                        variant="outline"
-                        size="sm"
-                        onClick={() =>
-                          decideApproval(approval.approvalId, "deny")
-                        }
-                      >
-                        Deny
-                      </Button>
-                      <Button
-                        type="button"
-                        size="sm"
-                        onClick={() =>
-                          decideApproval(approval.approvalId, "approve")
-                        }
+                    {messages.length === 0 && (
+                      <div className="text-center text-muted-foreground py-20">
+                        <p className="text-lg">
+                          Send a message to start a conversation
+                        </p>
+                        <p className="text-sm mt-2">
+                          The agent can use analytics, files, genie, and
+                          lakebase tools.
+                          {hasAutocomplete &&
+                            " Start typing for inline suggestions."}
+                        </p>
+                      </div>
+                    )}
+
+                    {messages.map((msg) => {
+                      const body = messageBodyText(msg);
+                      if (!body) return null;
+                      return (
+                        <div
+                          key={msg.id}
+                          className={`flex ${
+                            msg.role === "user"
+                              ? "justify-end"
+                              : "justify-start"
+                          }`}
+                        >
+                          <div
+                            className={`max-w-[85%] rounded-lg px-4 py-2 ${
+                              msg.role === "user"
+                                ? "bg-primary text-primary-foreground"
+                                : "bg-muted"
+                            }`}
+                          >
+                            <p className="whitespace-pre-wrap text-sm">
+                              {body}
+                            </p>
+                          </div>
+                        </div>
+                      );
+                    })}
+
+                    {pendingApprovals.map((approval) => (
+                      <div
+                        key={approval.approvalId}
+                        className="flex justify-start"
                       >
-                        Approve
-                      </Button>
-                    </div>
-                  </div>
-                </div>
-              ))}
-
-              {showThinking && (
-                <div className="flex justify-start">
-                  <div className="bg-muted rounded-lg px-4 py-2">
-                    <p className="text-sm text-muted-foreground animate-pulse">
-                      Thinking...
-                    </p>
-                  </div>
-                </div>
-              )}
-
-              {error && (
-                <div className="flex justify-start">
-                  <div className="max-w-[85%] rounded-lg border border-red-500/60 bg-red-500/10 px-4 py-2">
-                    <p className="text-sm">Error: {error.message}</p>
+                        <div className="max-w-[80%] rounded-lg border border-orange-500/60 bg-orange-500/10 px-4 py-3">
+                          <div className="mb-2 flex items-center gap-2">
+                            <span className="rounded bg-orange-600 px-2 py-0.5 text-xs font-semibold uppercase tracking-wide text-white">
+                              Destructive tool — approval required
+                            </span>
+                          </div>
+                          <div className="text-sm">
+                            <strong>{approval.toolName}</strong>
+                            <pre className="mt-1 max-h-52 overflow-auto whitespace-pre-wrap break-words rounded bg-background p-2 text-xs">
+                              {JSON.stringify(approval.args, null, 2)}
+                            </pre>
+                          </div>
+                          <div className="mt-3 flex justify-end gap-2">
+                            <Button
+                              type="button"
+                              variant="outline"
+                              size="sm"
+                              onClick={() =>
+                                decideApproval(approval.approvalId, "deny")
+                              }
+                            >
+                              Deny
+                            </Button>
+                            <Button
+                              type="button"
+                              size="sm"
+                              onClick={() =>
+                                decideApproval(approval.approvalId, "approve")
+                              }
+                            >
+                              Approve
+                            </Button>
+                          </div>
+                        </div>
+                      </div>
+                    ))}
+
+                    {showThinking && (
+                      <div className="flex justify-start">
+                        <div className="bg-muted rounded-lg px-4 py-2">
+                          <p className="text-sm text-muted-foreground animate-pulse">
+                            Thinking...
+                          </p>
+                        </div>
+                      </div>
+                    )}
+
+                    {error && (
+                      <div className="flex justify-start">
+                        <div className="max-w-[85%] rounded-lg border border-red-500/60 bg-red-500/10 px-4 py-2">
+                          <p className="text-sm">Error: {error.message}</p>
+                        </div>
+                      </div>
+                    )}
                   </div>
-                </div>
-              )}
-
-              <div ref={messagesEndRef} />
-            </div>
 
-            <div className="border-t p-4">
-              {hasAutocomplete && (suggestion || isAutocompleting) && (
-                <div className="flex items-center gap-2 mb-2 text-xs text-muted-foreground">
-                  {isAutocompleting && (
-                    <span className="animate-pulse">Thinking...</span>
-                  )}
-                  {suggestion && (
-                    <span>
-                      Press{" "}
-                      <kbd className="px-1.5 py-0.5 rounded bg-muted border text-[10px] font-mono">
-                        Tab
-                      </kbd>{" "}
-                      to accept suggestion
-                    </span>
-                  )}
-                </div>
-              )}
-              <form
-                onSubmit={(e) => {
-                  e.preventDefault();
-                  submit();
-                }}
-                className="flex gap-2"
-              >
-                <div className="flex-1 relative">
-                  <div
-                    aria-hidden
-                    className="absolute inset-0 px-3 py-2 text-sm pointer-events-none whitespace-pre-wrap break-words overflow-hidden"
-                  >
-                    <span className="invisible">{input}</span>
-                    <span className="text-muted-foreground/40">
-                      {suggestion}
-                    </span>
-                  </div>
-                  <textarea
-                    ref={inputRef}
-                    value={input}
-                    onChange={(e) => handleInputChange(e.target.value)}
-                    onKeyDown={(e) => {
-                      if (e.key === "Tab" && suggestion) {
-                        e.preventDefault();
-                        acceptSuggestion();
-                      }
-                      if (e.key === "Escape" && suggestion) {
+                  <div className="border-t p-4">
+                    {hasAutocomplete && (suggestion || isAutocompleting) && (
+                      <div className="flex items-center gap-2 mb-2 text-xs text-muted-foreground">
+                        {isAutocompleting && (
+                          <span className="animate-pulse">Thinking...</span>
+                        )}
+                        {suggestion && (
+                          <span>
+                            Press{" "}
+                            <kbd className="px-1.5 py-0.5 rounded bg-muted border text-[10px] font-mono">
+                              Tab
+                            </kbd>{" "}
+                            to accept suggestion
+                          </span>
+                        )}
+                      </div>
+                    )}
+                    <ChatInput<VercelAIAgentUIMessage>
+                      onSubmit={(message) => {
+                        // Cancel any in-flight or debounced autocomplete
+                        // before the input clears — otherwise the 500ms
+                        // timer scheduled on the last keystroke fires
+                        // post-submit and asks for suggestions on stale
+                        // text (or, after the input clears, on "" — which
+                        // surfaces as a phantom "/chat" request).
                         clearSuggestion();
-                      }
-                      if (e.key === "Enter" && !e.shiftKey && !suggestion) {
-                        e.preventDefault();
-                        submit();
-                      }
-                    }}
-                    placeholder="Ask a question..."
-                    disabled={isLoading}
-                    rows={1}
-                    className="w-full rounded-md border border-input bg-transparent px-3 py-2 text-sm ring-offset-background placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring disabled:opacity-50 resize-none"
-                  />
+                        sendMessage(message);
+                      }}
+                      status={status}
+                      onStop={stop}
+                    >
+                      {({
+                        value,
+                        onChange,
+                        submit,
+                        isStreaming,
+                        canSubmit,
+                        handleKeyDown,
+                      }) => (
+                        <form onSubmit={submit} className="flex gap-2">
+                          <div className="flex-1 relative">
+                            <div
+                              aria-hidden
+                              className="absolute inset-0 px-3 py-2 text-sm pointer-events-none whitespace-pre-wrap break-words overflow-hidden"
+                            >
+                              <span className="invisible">{value}</span>
+                              <span className="text-muted-foreground/40">
+                                {suggestion}
+                              </span>
+                            </div>
+                            <textarea
+                              ref={inputRef}
+                              value={value}
+                              onChange={(e) => {
+                                onChange(e.target.value);
+                                requestSuggestion(e.target.value);
+                              }}
+                              onKeyDown={(e) => {
+                                if (e.key === "Tab" && suggestion) {
+                                  e.preventDefault();
+                                  onChange(value + suggestion);
+                                  clearSuggestion();
+                                  inputRef.current?.focus();
+                                  return;
+                                }
+                                if (e.key === "Escape" && suggestion) {
+                                  clearSuggestion();
+                                  return;
+                                }
+                                // While a suggestion is showing, don't let
+                                // Enter submit — let the Tab path absorb
+                                // it. Otherwise delegate to the headless
+                                // input's default Enter-to-submit handler.
+                                if (suggestion) return;
+                                handleKeyDown(e);
+                              }}
+                              placeholder="Ask a question..."
+                              disabled={isStreaming}
+                              rows={1}
+                              className="w-full rounded-md border border-input bg-transparent px-3 py-2 text-sm ring-offset-background placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring disabled:opacity-50 resize-none"
+                            />
+                          </div>
+                          {isStreaming ? (
+                            <Button
+                              type="button"
+                              variant="outline"
+                              onClick={stop}
+                              className="self-end"
+                            >
+                              Stop
+                            </Button>
+                          ) : (
+                            <Button
+                              type="submit"
+                              disabled={!canSubmit}
+                              className="self-end"
+                            >
+                              Send
+                            </Button>
+                          )}
+                        </form>
+                      )}
+                    </ChatInput>
+                  </div>
                 </div>
-                {isLoading ? (
-                  <Button
-                    type="button"
-                    variant="outline"
-                    onClick={stop}
-                    className="self-end"
-                  >
-                    Stop
-                  </Button>
-                ) : (
-                  <Button
-                    type="submit"
-                    disabled={!input.trim()}
-                    className="self-end"
-                  >
-                    Send
-                  </Button>
-                )}
-              </form>
-            </div>
-          </div>
 
-          <EventStreamPanel messages={messages} approvals={pendingApprovals} />
-        </div>
+                <EventStreamPanel chunks={streamLog} />
+              </div>
+            );
+          }}
+        </Conversation>
       </div>
     </div>
   );
 }
 
-interface EventStreamRow {
-  /** Stable React key. */
-  key: string;
-  /** Short label rendered in the left column. */
-  label: string;
-  /** Free-form right-column detail. */
-  detail: string;
-}
-
 /**
- * Right-hand debug panel. Walks every part of every message and renders a
- * compact, terse log entry per part. Pairs with `pendingApprovals` so the
- * panel surfaces approval prompts (which arrive via `onData`, not as
- * message parts) alongside the message-derived rows.
+ * Right-hand debug panel. Renders one row per `UIMessageChunk` exactly as
+ * it arrived from the transport — `text-delta`s are NOT coalesced, so the
+ * panel doubles as a faithful trace of the wire stream (matching what the
+ * legacy raw-SSE viewer used to show).
  */
 function EventStreamPanel({
-  messages,
-  approvals,
+  chunks,
 }: {
-  messages: VercelAIAgentUIMessage[];
-  approvals: PendingApproval[];
+  chunks: Array<{ id: number; chunk: UIMessageChunk }>;
 }) {
-  const rows: EventStreamRow[] = [];
-
-  for (const message of messages) {
-    let partIndex = 0;
-    for (const part of message.parts) {
-      const key = `${message.id}:${partIndex++}`;
-      if (part.type === "text") {
-        rows.push({
-          key,
-          label: message.role === "user" ? "user" : "text",
-          detail: part.text.slice(0, 80),
-        });
-      } else if (part.type === "reasoning") {
-        rows.push({
-          key,
-          label: "reasoning",
-          detail: part.text.slice(0, 80),
-        });
-      } else if (part.type === "dynamic-tool") {
-        const detail =
-          part.state === "output-available"
-            ? safeStringify(part.output).slice(0, 80)
-            : part.state === "output-error"
-              ? `error: ${part.errorText}`
-              : safeStringify(part.input).slice(0, 80);
-        rows.push({
-          key,
-          label: `tool:${part.toolName}`,
-          detail: `${part.state} ${detail}`,
-        });
-      } else if (part.type === "step-start") {
-        rows.push({ key, label: "step", detail: "start" });
-      } else if (
-        typeof part.type === "string" &&
-        part.type.startsWith("data-")
-      ) {
-        const data = (part as { data?: unknown }).data;
-        rows.push({
-          key,
-          label: part.type.replace(/^data-/, "data:"),
-          detail: safeStringify(data).slice(0, 80),
-        });
-      }
-    }
-  }
-
-  for (const approval of approvals) {
-    rows.push({
-      key: `pending:${approval.approvalId}`,
-      label: "approval",
-      detail: `pending: ${approval.toolName}`,
-    });
-  }
-
   return (
     <div className="w-80 shrink-0 flex flex-col border rounded-lg bg-card">
-      <div className="px-3 py-2 border-b">
+      <div className="px-3 py-2 border-b flex items-center justify-between">
         <h3 className="text-sm font-semibold text-muted-foreground">
           Event Stream
         </h3>
+        <span className="text-[10px] font-mono text-muted-foreground/60">
+          {chunks.length} chunk{chunks.length === 1 ? "" : "s"}
+        </span>
       </div>
       <div className="flex-1 overflow-y-auto p-3 space-y-1">
-        {rows.length === 0 && (
+        {chunks.length === 0 && (
           <p className="text-xs text-muted-foreground/50 text-center py-8">
             Events will appear here
           </p>
         )}
-        {rows.map((row) => (
-          <div
-            key={row.key}
-            className="font-mono text-xs text-muted-foreground"
-          >
-            <span className="inline-block w-24 text-right mr-2 opacity-50">
-              {row.label}
-            </span>
-            <span className="opacity-80 break-all">{row.detail}</span>
-          </div>
-        ))}
+        {chunks.map(({ id, chunk }) => {
+          const { label, detail } = describeChunk(chunk);
+          return (
+            <div key={id} className="font-mono text-xs text-muted-foreground">
+              <span className="inline-block w-24 text-right mr-2 opacity-50">
+                {label}
+              </span>
+              <span className="opacity-80 break-all">{detail}</span>
+            </div>
+          );
+        })}
       </div>
     </div>
   );
 }
 
+/**
+ * Map a `UIMessageChunk` to a (label, detail) row for the debug panel,
+ * keyed on its wire-level `type`. `tool-output-available` chunks carry a
+ * `toolCallId` but no `toolName`, so that id is the label fallback.
+ * See {@link https://ai-sdk.dev/docs/ai-sdk-ui/stream-protocol#ui-message-chunks}.
+ */
+function describeChunk(chunk: UIMessageChunk): {
+  label: string;
+  detail: string;
+} {
+  const c = chunk as Record<string, unknown> & { type: string };
+  if (c.type === "text-delta") {
+    return { label: "text-Δ", detail: String(c.delta ?? "").slice(0, 80) };
+  }
+  if (c.type === "reasoning-delta") {
+    return {
+      label: "reasoning-Δ",
+      detail: String(c.delta ?? "").slice(0, 80),
+    };
+  }
+  if (c.type === "tool-input-available") {
+    return {
+      label: `tool→ ${String(c.toolName ?? "?")}`,
+      detail: safeStringify(c.input).slice(0, 80),
+    };
+  }
+  if (c.type === "tool-output-available") {
+    return {
+      label: `tool← ${String(c.toolName ?? c.toolCallId ?? "?")}`,
+      detail: safeStringify(c.output).slice(0, 80),
+    };
+  }
+  if (c.type.startsWith("data-")) {
+    return {
+      label: c.type.replace(/^data-/, "data:"),
+      detail: safeStringify(c.data).slice(0, 80),
+    };
+  }
+  return { label: c.type, detail: "" };
+}
+
 function safeStringify(value: unknown): string {
   if (typeof value === "string") return value;
   if (value === undefined) return "";
diff --git a/apps/dev-playground/server/index.ts b/apps/dev-playground/server/index.ts
index d4b7bb7a7..7205339ad 100644
--- a/apps/dev-playground/server/index.ts
+++ b/apps/dev-playground/server/index.ts
@@ -6,7 +6,7 @@ import {
   files,
   genie,
   PolicyDeniedError,
-  server,
+  server,
   serving,
   WRITE_ACTIONS,
 } from "@databricks/appkit";
diff --git a/knip.json b/knip.json
index dbd7eee89..c414785b8 100644
--- a/knip.json
+++ b/knip.json
@@ -8,7 +8,13 @@
   ],
   "workspaces": {
     "packages/appkit-ui": {
-      "ignoreDependencies": ["tailwindcss", "tw-animate-css"]
+      "ignoreDependencies": [
+        "@ai-sdk/react",
+        "ai",
+        "swr",
+        "tailwindcss",
+        "tw-animate-css"
+      ]
     }
   },
   "ignore": [
diff --git a/packages/appkit-ui/package.json b/packages/appkit-ui/package.json
index 885c02b17..c1f2cfc1e 100644
--- a/packages/appkit-ui/package.json
+++ b/packages/appkit-ui/package.json
@@ -39,6 +39,10 @@
       "development": "./src/react/beta.ts",
       "default": "./dist/react/beta.js"
     },
+    "./react/chat": {
+      "development": "./src/react/chat/index.ts",
+      "default": "./dist/react/chat/index.js"
+    },
     "./package.json": "./package.json",
     "./styles.css": {
       "development": "./src/react/styles/globals.css",
@@ -103,16 +107,33 @@
     "vaul": "1.1.2"
   },
   "peerDependencies": {
+    "@ai-sdk/react": ">=4.0.0-beta",
+    "ai": ">=7.0.0-beta",
     "react": "^18.0.0 || ^19.0.0",
     "react-dom": "^18.0.0 || ^19.0.0",
-    "recharts": "^2.0.0 || ^3.0.0"
+    "recharts": "^2.0.0 || ^3.0.0",
+    "swr": ">=2.0.0"
+  },
+  "peerDependenciesMeta": {
+    "@ai-sdk/react": {
+      "optional": true
+    },
+    "ai": {
+      "optional": true
+    },
+    "swr": {
+      "optional": true
+    }
   },
   "devDependencies": {
+    "@ai-sdk/react": "4.0.0-beta.76",
     "@types/react": "19.2.2",
     "@types/react-dom": "19.2.2",
-    "react": "19.2.0",
-    "react-dom": "19.2.0",
+    "ai": "7.0.0-beta.76",
+    "react": "19.2.5",
+    "react-dom": "19.2.5",
     "recharts": "2.15.4",
+    "swr": "2.4.1",
     "tailwindcss": "4.1.17",
     "tw-animate-css": "1.4.0"
   },
@@ -122,6 +143,7 @@
       "./js/beta": "./dist/js/beta.js",
       "./react": "./dist/react/index.js",
       "./react/beta": "./dist/react/beta.js",
+      "./react/chat": "./dist/react/chat/index.js",
       "./package.json": "./package.json",
       "./styles.css": "./dist/styles.css"
     }
diff --git a/packages/appkit-ui/src/react/chat/context.ts b/packages/appkit-ui/src/react/chat/context.ts
new file mode 100644
index 000000000..3214372b5
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/context.ts
@@ -0,0 +1,37 @@
+import { createContext, useContext } from "react";
+import type { ChatFeatures, ChatSession } from "./types";
+
+/**
+ * Value shared with every chat hook/component through {@link ChatContext}.
+ * How the value is populated is up to the provider, which is defined
+ * outside this module.
+ */
+export interface ChatContextValue {
+  /** Base the chat hooks hand to `apiUrl()` when building endpoint URLs. */
+  apiBase: string;
+  basePath: string;
+  features: ChatFeatures;
+  /** When `false`, `useChatHistory` skips the history request entirely. */
+  chatHistoryEnabled: boolean;
+  feedbackEnabled: boolean;
+  session: ChatSession | null;
+  isLoading: boolean;
+  /** Called by `useChat` with the chat id when a new chat starts streaming. */
+  onNavigate?: (chatId: string) => void;
+}
+
+/** Holds `undefined` until a provider supplies a {@link ChatContextValue}. */
+export const ChatContext = createContext<ChatContextValue | undefined>(
+  undefined,
+);
+
+/**
+ * Read the nearest {@link ChatContextValue}.
+ *
+ * @throws Error when no provider has supplied a value.
+ */
+export function useChatContext(): ChatContextValue {
+  const value = useContext(ChatContext);
+  if (value) return value;
+  throw new Error("useChatContext must be used within a ChatProvider");
+}
diff --git a/packages/appkit-ui/src/react/chat/errors.ts b/packages/appkit-ui/src/react/chat/errors.ts
new file mode 100644
index 000000000..9528e146b
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/errors.ts
@@ -0,0 +1,106 @@
+type ErrorType =
+  | "bad_request"
+  | "unauthorized"
+  | "forbidden"
+  | "not_found"
+  | "rate_limit"
+  | "offline"
+  | "empty";
+
+type Surface =
+  | "chat"
+  | "auth"
+  | "api"
+  | "database"
+  | "history"
+  | "stream"
+  | "message";
+
+/** `"<type>:<surface>"` code naming what failed and where. */
+export type ChatErrorCode = `${ErrorType}:${Surface}`;
+
+/**
+ * Error carrying a decoded {@link ChatErrorCode}.
+ *
+ * `type` and `surface` are the two halves of the code; `message` and
+ * `statusCode` are derived from it. `cause` is an optional detail string.
+ */
+export class ChatError extends Error {
+  public type: ErrorType;
+  public surface: Surface;
+  public statusCode: number;
+  public cause?: string;
+
+  /**
+   * @param errorCode - Code to decode into `type` and `surface`.
+   * @param cause - Optional detail stored verbatim on the instance.
+   */
+  constructor(errorCode: ChatErrorCode, cause?: string) {
+    // Give `Error` the message up front: engines that build `stack` at
+    // construction time would otherwise record a header with no message.
+    super(getMessageByErrorCode(errorCode));
+    this.name = "ChatError";
+
+    const [type, surface] = errorCode.split(":") as [ErrorType, Surface];
+
+    this.type = type;
+    this.cause = cause;
+    this.surface = surface;
+    this.statusCode = getStatusCodeByType(type);
+  }
+}
+
+/**
+ * Status code for an error type. `offline` maps to 0 and any type without
+ * its own case (currently `empty`) maps to 500.
+ */
+function getStatusCodeByType(type: ErrorType): number {
+  switch (type) {
+    case "bad_request":
+      return 400;
+    case "unauthorized":
+      return 401;
+    case "forbidden":
+      return 403;
+    case "not_found":
+      return 404;
+    case "rate_limit":
+      return 429;
+    case "offline":
+      return 0;
+    default:
+      return 500;
+  }
+}
+
+/**
+ * User-facing message for an error code. Any code containing `database`
+ * gets the database message; codes without a dedicated case get a generic
+ * fallback.
+ */
+export function getMessageByErrorCode(errorCode: ChatErrorCode): string {
+  if (errorCode.includes("database")) {
+    return "An error occurred while executing a database query.";
+  }
+
+  switch (errorCode) {
+    case "bad_request:api":
+      return "The request couldn't be processed. Please check your input and try again.";
+    case "unauthorized:auth":
+      return "You need to sign in before continuing.";
+    case "forbidden:auth":
+      return "Your account does not have access to this feature.";
+    case "rate_limit:chat":
+      return "You have exceeded your maximum number of messages for the day. Please try again later.";
+    case "not_found:chat":
+      return "The requested chat was not found. Please check the chat ID and try again.";
+    case "forbidden:chat":
+      return "This chat belongs to another user. Please check the chat ID and try again.";
+    case "unauthorized:chat":
+      return "You need to sign in to view this chat. Please sign in and try again.";
+    case "offline:chat":
+      return "We're having trouble sending your message. Please check your internet connection and try again.";
+    default:
+      return "Something went wrong. Please try again later.";
+  }
+}
diff --git a/packages/appkit-ui/src/react/chat/headless/chat-input.tsx b/packages/appkit-ui/src/react/chat/headless/chat-input.tsx
new file mode 100644
index 000000000..2607eac1a
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/headless/chat-input.tsx
@@ -0,0 +1,93 @@
+import type { UseChatHelpers } from "@ai-sdk/react";
+import type { ChatStatus, UIMessage } from "ai";
+import {
+  useCallback,
+  useState,
+  type FormEvent,
+  type ReactNode,
+} from "react";
+import type { ChatMessage } from "../types";
+
+/** State and handlers passed to the `ChatInput` render function. */
+export interface ChatInputRenderProps {
+  /** Current draft text. */
+  value: string;
+  onChange: (value: string) => void;
+  /** Sends the trimmed draft; no-op when blank or a request is in flight. */
+  submit: (e?: FormEvent) => void;
+  /** `true` only while `status` is `"streaming"`. */
+  isStreaming: boolean;
+  stop: () => void;
+  /** `true` when the draft is non-blank and no request is in flight. */
+  canSubmit: boolean;
+  /** Submits on Enter; ignores Shift+Enter and IME composition. */
+  handleKeyDown: (
+    e: React.KeyboardEvent<HTMLTextAreaElement | HTMLInputElement>,
+  ) => void;
+}
+
+export interface ChatInputProps<
+  TMessage extends UIMessage = ChatMessage,
+> {
+  onSubmit: UseChatHelpers<TMessage>["sendMessage"];
+  status: ChatStatus;
+  onStop: () => void;
+  children: (props: ChatInputRenderProps) => ReactNode;
+}
+
+/**
+ * Headless chat input: owns the draft text and submit/keyboard logic and
+ * delegates all rendering to `children`.
+ */
+export function ChatInput<
+  TMessage extends UIMessage = ChatMessage,
+>({
+  onSubmit,
+  status,
+  onStop,
+  children,
+}: ChatInputProps<TMessage>) {
+  const [value, setValue] = useState("");
+  const isStreaming = status === "streaming";
+  // "submitted" = request sent, first chunk not yet received. It counts as
+  // busy too; otherwise Enter in that window fires an overlapping request.
+  const isBusy = isStreaming || status === "submitted";
+
+  const submit = useCallback(
+    (e?: FormEvent) => {
+      e?.preventDefault();
+      const trimmed = value.trim();
+      if (!trimmed || isBusy) return;
+
+      // Use the AI SDK's `{ text }` shorthand. Internally this is
+      // promoted to a single `text` part on a `user` message — the
+      // wire shape is identical to manually constructing
+      // `{ role: "user", parts: [{ type: "text", text }] }`.
+      onSubmit({ text: trimmed });
+      setValue("");
+    },
+    [value, onSubmit, isBusy],
+  );
+
+  const handleKeyDown = useCallback(
+    (e: React.KeyboardEvent<HTMLTextAreaElement | HTMLInputElement>) => {
+      if (e.key === "Enter") {
+        if (e.nativeEvent.isComposing) return;
+        if (e.shiftKey) return;
+        e.preventDefault();
+        submit();
+      }
+    },
+    [submit],
+  );
+
+  return children({
+    value,
+    onChange: setValue,
+    submit,
+    isStreaming,
+    stop: onStop,
+    canSubmit: value.trim().length > 0 && !isBusy,
+    handleKeyDown,
+  });
+}
diff --git a/packages/appkit-ui/src/react/chat/headless/conversation.tsx b/packages/appkit-ui/src/react/chat/headless/conversation.tsx
new file mode 100644
index 000000000..5230f98b9
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/headless/conversation.tsx
@@ -0,0 +1,66 @@
+import type { UseChatHelpers } from "@ai-sdk/react";
+import type { UIMessage } from "ai";
+import type { ReactNode } from "react";
+import { type UseChatOptions, useChat } from "../hooks/use-chat";
+import { useScrollToBottom } from "../hooks/use-scroll-to-bottom";
+import type { ChatMessage } from "../types";
+
+/** Chat state, actions and scroll helpers given to the render function. */
+export interface ConversationRenderProps<
+  TMessage extends UIMessage = ChatMessage,
+> {
+  messages: TMessage[];
+  status: UseChatHelpers<TMessage>["status"];
+  error: UseChatHelpers<TMessage>["error"];
+  clearError: UseChatHelpers<TMessage>["clearError"];
+  sendMessage: UseChatHelpers<TMessage>["sendMessage"];
+  setMessages: UseChatHelpers<TMessage>["setMessages"];
+  addToolApprovalResponse: UseChatHelpers<TMessage>["addToolApprovalResponse"];
+  regenerate: UseChatHelpers<TMessage>["regenerate"];
+  stop: () => void;
+  id: string;
+  title: string | undefined;
+  isTitleLoading: boolean;
+  isReadonly: boolean;
+  isAtBottom: boolean;
+  scrollToBottom: (behavior?: ScrollBehavior) => void;
+  containerRef: React.RefObject<HTMLDivElement | null>;
+}
+
+/** `useChat` options plus the render function that receives the chat. */
+export interface ConversationProps<TMessage extends UIMessage = ChatMessage>
+  extends UseChatOptions<TMessage> {
+  children: (props: ConversationRenderProps<TMessage>) => ReactNode;
+}
+
+/**
+ * Headless conversation: runs `useChat` with the given options, wires
+ * `useScrollToBottom` to the message list, and hands both to `children`.
+ */
+export function Conversation<TMessage extends UIMessage = ChatMessage>(
+  props: ConversationProps<TMessage>,
+) {
+  const { children, ...chatOptions } = props;
+  const chat = useChat<TMessage>(chatOptions);
+  const scroll = useScrollToBottom({ trigger: chat.messages });
+
+  const renderProps: ConversationRenderProps<TMessage> = {
+    messages: chat.messages,
+    status: chat.status,
+    error: chat.error,
+    clearError: chat.clearError,
+    sendMessage: chat.sendMessage,
+    setMessages: chat.setMessages,
+    addToolApprovalResponse: chat.addToolApprovalResponse,
+    regenerate: chat.regenerate,
+    stop: chat.stop,
+    id: chat.id,
+    title: chat.title,
+    isTitleLoading: chat.isTitleLoading,
+    isReadonly: chat.isReadonly,
+    isAtBottom: scroll.isAtBottom,
+    scrollToBottom: scroll.scrollToBottom,
+    containerRef: scroll.containerRef,
+  };
+  return children(renderProps);
+}
diff --git a/packages/appkit-ui/src/react/chat/headless/history-list.tsx b/packages/appkit-ui/src/react/chat/headless/history-list.tsx
new file mode 100644
index 000000000..df11c3088
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/headless/history-list.tsx
@@ -0,0 +1,28 @@
+import type { ReactNode } from "react";
+import { useChatHistory } from "../hooks/use-history";
+import type { Chat } from "../types";
+
+/** History state and actions given to the render function. */
+export interface ChatHistoryListRenderProps {
+  chats: Chat[];
+  isLoading: boolean;
+  isValidating: boolean;
+  hasMore: boolean;
+  isEmpty: boolean;
+  loadMore: () => void;
+  deleteChat: (id: string) => Promise<void>;
+  renameChat: (id: string, title: string) => Promise<void>;
+}
+
+export interface ChatHistoryListProps {
+  children: (props: ChatHistoryListRenderProps) => ReactNode;
+}
+
+/**
+ * Headless history list: forwards whatever `useChatHistory` returns to
+ * `children` and renders nothing of its own.
+ */
+export function ChatHistoryList(props: ChatHistoryListProps) {
+  const history = useChatHistory();
+  return props.children(history);
+}
diff --git a/packages/appkit-ui/src/react/chat/headless/index.ts b/packages/appkit-ui/src/react/chat/headless/index.ts
new file mode 100644
index 000000000..7d4367c59
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/headless/index.ts
@@ -0,0 +1,3 @@
+export * from "./chat-input";
+export * from "./conversation";
+export * from "./history-list";
diff --git a/packages/appkit-ui/src/react/chat/hooks/index.ts b/packages/appkit-ui/src/react/chat/hooks/index.ts
new file mode 100644
index 000000000..d6c9cabc8
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/hooks/index.ts
@@ -0,0 +1,4 @@
+export * from "./use-chat";
+export * from "./use-chat-data";
+export * from "./use-history";
+export * from "./use-scroll-to-bottom";
diff --git a/packages/appkit-ui/src/react/chat/hooks/use-chat-data.ts b/packages/appkit-ui/src/react/chat/hooks/use-chat-data.ts
new file mode 100644
index 000000000..f365329d0
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/hooks/use-chat-data.ts
@@ -0,0 +1,93 @@
+import { useMemo } from "react";
+import useSWR from "swr";
+import { useChatContext } from "../context";
+import { convertToChatMessages } from "../lib/messages";
+import { apiUrl } from "../lib/utils";
+import type { Chat, ChatFeedbackMap, ChatMessage } from "../types";
+
+/** Everything loaded for a single chat. */
+interface ChatData {
+  chat: Chat;
+  messages: ChatMessage[];
+  feedback: ChatFeedbackMap;
+}
+
+/** Best-effort feedback lookup: a non-OK response or a throw yields `{}`. */
+async function fetchFeedback(
+  apiBase: string,
+  chatId: string | undefined,
+): Promise<ChatFeedbackMap> {
+  try {
+    const response = await fetch(apiUrl(apiBase, `/feedback/chat/${chatId}`));
+    return response.ok ? await response.json() : {};
+  } catch (error) {
+    console.warn("Failed to fetch feedback:", error);
+    return {};
+  }
+}
+
+/**
+ * Build the SWR fetcher for one `apiBase`. The fetcher takes the chat id
+ * from the last path segment of the SWR key and loads the chat, then its
+ * messages, then its feedback. It resolves to `null` when the chat request
+ * answers 403 or 404.
+ */
+function createFetchChatData(apiBase: string) {
+  return async function fetchChatData(url: string): Promise<ChatData | null> {
+    const chatId = url.split("/").pop();
+
+    const chatResponse = await fetch(apiUrl(apiBase, `/${chatId}`));
+    if (chatResponse.status === 404 || chatResponse.status === 403) {
+      return null;
+    }
+    if (!chatResponse.ok) throw new Error("Failed to load chat");
+    const chat = await chatResponse.json();
+
+    const messagesResponse = await fetch(
+      apiUrl(apiBase, `/messages/${chatId}`),
+    );
+    // A 404 here is treated as "no messages", not as a failure.
+    if (messagesResponse.status === 404) {
+      return { chat, messages: [], feedback: {} };
+    }
+    if (!messagesResponse.ok) throw new Error("Failed to load messages");
+    const messages = convertToChatMessages(await messagesResponse.json());
+
+    const feedback = await fetchFeedback(apiBase, chatId);
+    return { chat, messages, feedback };
+  };
+}
+
+/**
+ * Load a chat with its messages and feedback through SWR.
+ *
+ * @param chatId - Chat to load; nothing is fetched while it is falsy.
+ * @param enabled - Set to `false` to suspend fetching.
+ * @returns `chatData`, `isLoading`, a display-ready `error` string (or
+ *   `null`), and SWR's `mutate`.
+ */
+export function useChatData(chatId: string | undefined, enabled = true) {
+  const { apiBase } = useChatContext();
+  const fetchFn = useMemo(() => createFetchChatData(apiBase), [apiBase]);
+  const key = chatId && enabled ? `/chat/${chatId}` : null;
+
+  const { data, error, isLoading, mutate } = useSWR<ChatData | null>(
+    key,
+    fetchFn,
+    {
+      revalidateOnFocus: false,
+      revalidateOnReconnect: false,
+      keepPreviousData: true,
+      dedupingInterval: 2000,
+    },
+  );
+
+  let errorMessage: string | null = null;
+  if (error) {
+    errorMessage = "Failed to load chat";
+  } else if (data === null && !isLoading) {
+    errorMessage = "Chat not found or you do not have access";
+  }
+
+  return { chatData: data, isLoading, error: errorMessage, mutate };
+}
diff --git a/packages/appkit-ui/src/react/chat/hooks/use-chat.ts b/packages/appkit-ui/src/react/chat/hooks/use-chat.ts
new file mode 100644
index 000000000..4a29a12aa
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/hooks/use-chat.ts
@@ -0,0 +1,309 @@
+import { type UseChatHelpers, useChat as useAiChat } from "@ai-sdk/react";
+import type {
+  ChatOnDataCallback,
+  HttpChatTransportInitOptions,
+  LanguageModelUsage,
+  PrepareSendMessagesRequest,
+  UIMessage,
+  UIMessageChunk,
+} from "ai";
+import { useCallback, useMemo, useRef, useState } from "react";
+import { useSWRConfig } from "swr";
+import { unstable_serialize } from "swr/infinite";
+import { useChatContext } from "../context";
+import { ChatError } from "../errors";
+import { isCredentialErrorMessage } from "../lib/oauth";
+import { ChatTransport } from "../lib/transport";
+import { apiUrl, fetchWithErrorHandlers, generateUUID } from "../lib/utils";
+import type {
+  ChatFeedbackMap,
+  ChatMessage,
+  ChatVisibilityType,
+} from "../types";
+import { getChatHistoryPaginationKey } from "./use-history";
+
+/** AI SDK chat helpers plus the chat-level metadata this hook tracks. */
+export type UseChatReturn<TMessage extends UIMessage = ChatMessage> =
+  UseChatHelpers<TMessage> & {
+    id: string;
+    title: string | undefined;
+    isTitleLoading: boolean;
+    isReadonly: boolean;
+    feedback: ChatFeedbackMap;
+    visibilityType: ChatVisibilityType;
+    model: string;
+  };
+
+/** Options accepted by {@link useChat}; every field is optional. */
+export interface UseChatOptions<TMessage extends UIMessage = ChatMessage> {
+  id?: string;
+  initialMessages?: TMessage[];
+  model?: string;
+  initialVisibility?: ChatVisibilityType;
+  isReadonly?: boolean;
+  feedback?: ChatFeedbackMap;
+  title?: string;
+  onError?: (error: Error) => void;
+  onTitleGenerated?: (title: string) => void;
+
+  /**
+   * Override the chat endpoint URL. Defaults to `apiUrl(apiBase, "/")`
+   * (i.e. derived from the surrounding `ChatProvider`'s `apiBase`).
+   */
+  api?: string;
+  /**
+   * Extra fetch headers (e.g. `Accept` for content negotiation). Forwarded
+   * verbatim to the underlying transport.
+   */
+  headers?: HttpChatTransportInitOptions<TMessage>["headers"];
+  /**
+   * Replaces the default body builder. When provided, the default
+   * `{ id, messages, trigger }` shape is NOT emitted — the consumer is
+   * fully responsible for the request body.
+   */
+  prepareSendMessagesRequest?: PrepareSendMessagesRequest<TMessage>;
+  /**
+   * Called AFTER the hook's internal `data-usage` / `data-title` handlers
+   * for every received data part. Use this to react to custom data parts
+   * (e.g. tool-approval prompts) without forking the hook.
+   */
+  onData?: ChatOnDataCallback<TMessage>;
+  /**
+   * Called for every raw `UIMessageChunk` arriving from the transport
+   * (text-delta, reasoning-delta, tool-input-available, finish, etc.).
+   * Fires synchronously inside the stream pipeline — unaffected by render
+   * throttling — so it's the right hook for chronological event logging
+   * or debug panels.
+   */
+  onStreamPart?: (part: UIMessageChunk) => void;
+}
+
+/**
+ * Chat hook wrapping the AI SDK's `useChat` with a `ChatTransport`.
+ *
+ * On top of the SDK helpers it tracks a streamed title (`data-title`),
+ * revalidates the chat-history cache at key points of a turn, and calls
+ * `resumeStream()` up to three times when a stream ends without a `finish`
+ * chunk (after a disconnect, an error, or before any chunk arrived).
+ *
+ * @param options - See {@link UseChatOptions}.
+ * @returns The SDK helpers extended with chat-level metadata.
+ */
+export function useChat<TMessage extends UIMessage = ChatMessage>(
+  options: UseChatOptions<TMessage> = {},
+): UseChatReturn<TMessage> {
+  const {
+    id: providedId,
+    initialMessages,
+    model = "chat-model",
+    initialVisibility = "private",
+    isReadonly = false,
+    feedback = {},
+    title: externalTitle,
+    onError: onErrorCb,
+    onTitleGenerated,
+    api: apiOverride,
+    headers,
+    prepareSendMessagesRequest: prepareSendMessagesRequestOverride,
+    onData: onDataOverride,
+    onStreamPart: onStreamPartOverride,
+  } = options;
+
+  const [id] = useState(() => providedId ?? generateUUID());
+  const initialMessagesRef = useRef<TMessage[]>(initialMessages ?? []);
+  const { chatHistoryEnabled, apiBase, onNavigate } = useChatContext();
+
+  const [visibilityType] = useState<ChatVisibilityType>(initialVisibility);
+
+  const { mutate } = useSWRConfig();
+
+  const [_usage, setUsage] = useState<LanguageModelUsage | undefined>();
+  // Most recent chunk seen on the wire. Kept in a ref that the transport
+  // callback writes synchronously: routing it through state forced a
+  // render per chunk and left `onFinish` reading whatever was last
+  // rendered, which can still be `undefined` after a short stream.
+  const lastPartRef = useRef<UIMessageChunk | undefined>(undefined);
+
+  const resumeAttemptCountRef = useRef(0);
+  const maxResumeAttempts = 3;
+
+  // Hold the consumer's onStreamPart in a ref so the transport memo doesn't
+  // need it as a dep — keeping the transport identity stable across renders
+  // even when the caller passes an inline callback.
+  const onStreamPartRef = useRef(onStreamPartOverride);
+  onStreamPartRef.current = onStreamPartOverride;
+
+  const isNewChat = initialMessagesRef.current.length === 0;
+  const didFetchHistoryOnNewChat = useRef(false);
+  const fetchChatHistory = useCallback(() => {
+    mutate(
+      unstable_serialize((pageIndex: number, previousPageData: unknown) =>
+        getChatHistoryPaginationKey(apiBase, pageIndex, previousPageData),
+      ),
+    );
+  }, [mutate, apiBase]);
+
+  const [streamTitle, setStreamTitle] = useState<string | undefined>();
+  const [titlePending, setTitlePending] = useState(false);
+  const displayTitle = externalTitle ?? streamTitle;
+
+  const chatApiUrl = apiOverride ?? apiUrl(apiBase, "/");
+
+  // Default body builder used when the consumer doesn't supply their own
+  // `prepareSendMessagesRequest`. Matches AppKit's agents plugin
+  // `vercelAIChatRequestSchema` shape (`{ id, messages, trigger }`).
+  // Consumers targeting a different server pass `prepareSendMessagesRequest`.
+  const defaultPrepareSendMessagesRequest = useMemo<
+    PrepareSendMessagesRequest<TMessage>
+  >(
+    () =>
+      ({ messages, id: msgId, body, trigger }) => ({
+        body: {
+          id: msgId,
+          messages,
+          trigger,
+          ...body,
+        },
+      }),
+    [],
+  );
+
+  const prepareSendMessagesRequest =
+    prepareSendMessagesRequestOverride ?? defaultPrepareSendMessagesRequest;
+
+  const transport = useMemo(
+    () =>
+      new ChatTransport<TMessage>({
+        api: chatApiUrl,
+        headers,
+        // Pass `fetchWithErrorHandlers` straight through. It forwards `init`
+        // verbatim to `fetch`, so the AbortSignal that `useChat` plumbs in
+        // for its native `stop()` and unmount cleanup is preserved.
+        fetch: fetchWithErrorHandlers,
+        prepareSendMessagesRequest,
+        prepareReconnectToStreamRequest({ id: streamId }) {
+          return {
+            api: apiUrl(apiBase, `/${streamId}/stream`),
+            credentials: "include",
+          };
+        },
+        onStreamPart: (part) => {
+          if (isNewChat && !didFetchHistoryOnNewChat.current) {
+            fetchChatHistory();
+            if (chatHistoryEnabled) {
+              setTitlePending(true);
+            }
+            didFetchHistoryOnNewChat.current = true;
+
+            if (chatHistoryEnabled && onNavigate) {
+              onNavigate(id);
+            }
+          }
+          resumeAttemptCountRef.current = 0;
+          lastPartRef.current = part;
+          onStreamPartRef.current?.(part);
+        },
+      }),
+    [
+      apiBase,
+      chatApiUrl,
+      chatHistoryEnabled,
+      fetchChatHistory,
+      headers,
+      id,
+      isNewChat,
+      onNavigate,
+      prepareSendMessagesRequest,
+    ],
+  );
+
+  const chatResult = useAiChat<TMessage>({
+    id,
+    messages: initialMessagesRef.current,
+    experimental_throttle: 100,
+    generateId: generateUUID,
+    resume: id !== undefined && initialMessagesRef.current.length > 0,
+    transport,
+    onData: (dataPart) => {
+      if (dataPart.type === "data-usage") {
+        setUsage(dataPart.data as LanguageModelUsage);
+      }
+      if (dataPart.type === "data-title") {
+        const title = dataPart.data as string;
+        setStreamTitle(title);
+        setTitlePending(false);
+        fetchChatHistory();
+        onTitleGenerated?.(title);
+      }
+      onDataOverride?.(dataPart);
+    },
+    onFinish: ({
+      isAbort,
+      isDisconnect,
+      isError,
+      messages: finishedMessages,
+    }) => {
+      didFetchHistoryOnNewChat.current = false;
+      setTitlePending(false);
+
+      if (isAbort) {
+        fetchChatHistory();
+        return;
+      }
+
+      const lastMessage = finishedMessages?.[finishedMessages.length - 1];
+      const hasOAuthError = (
+        lastMessage?.parts as
+          | Array<{ type: string; data?: unknown }>
+          | undefined
+      )?.some(
+        (part) =>
+          part.type === "data-error" &&
+          typeof part.data === "string" &&
+          isCredentialErrorMessage(part.data),
+      );
+
+      if (hasOAuthError) {
+        fetchChatHistory();
+        chatResult.clearError();
+        return;
+      }
+
+      const streamIncomplete = lastPartRef.current?.type !== "finish";
+      const shouldResume =
+        streamIncomplete &&
+        (isDisconnect || isError || lastPartRef.current === undefined);
+
+      if (shouldResume && resumeAttemptCountRef.current < maxResumeAttempts) {
+        resumeAttemptCountRef.current++;
+        queueMicrotask(() => {
+          chatResult.resumeStream();
+        });
+      } else {
+        if (resumeAttemptCountRef.current >= maxResumeAttempts) {
+          console.warn("[useChat] Max resume attempts reached");
+        }
+        fetchChatHistory();
+      }
+    },
+    onError: (error) => {
+      if (error instanceof ChatError) {
+        console.warn("[useChat] Chat error:", error.message);
+      } else {
+        console.warn("[useChat] Error during streaming:", error.message);
+      }
+      onErrorCb?.(error);
+    },
+  });
+
+  return {
+    ...chatResult,
+    id,
+    title: displayTitle,
+    isTitleLoading: titlePending && !displayTitle,
+    isReadonly,
+    feedback,
+    visibilityType,
+    model,
+  };
+}
diff --git a/packages/appkit-ui/src/react/chat/hooks/use-history.ts b/packages/appkit-ui/src/react/chat/hooks/use-history.ts
new file mode 100644
index 000000000..a7c297aa4
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/hooks/use-history.ts
@@ -0,0 +1,105 @@
+import { useCallback } from "react";
+import useSWRInfinite from "swr/infinite";
+import { useChatContext } from "../context";
+import { apiUrl, fetcher } from "../lib/utils";
+import type { ChatHistoryPage } from "../types";
+
+const PAGE_SIZE = 20;
+
+/**
+ * `useSWRInfinite` key for the cursor-paginated `/history` endpoint; `null`
+ * once a page reports `hasMore === false` or offers no chat to page from.
+ */
+export function getChatHistoryPaginationKey(
+  apiBase: string,
+  pageIndex: number,
+  previousPageData: unknown,
+) {
+  const prev = previousPageData as ChatHistoryPage | undefined;
+  if (prev && prev.hasMore === false) return null;
+  if (pageIndex === 0) return apiUrl(apiBase, `/history?limit=${PAGE_SIZE}`);
+
+  const lastChat = prev?.chats[prev.chats.length - 1];
+  if (!lastChat) return null;
+  // Percent-encode the cursor so reserved characters cannot split the query.
+  const cursor = encodeURIComponent(lastChat.id);
+  return apiUrl(apiBase, `/history?ending_before=${cursor}&limit=${PAGE_SIZE}`);
+}
+
+export function useChatHistory() {
+  const { chatHistoryEnabled, apiBase } = useChatContext();
+  // Page-by-page history; with the feature off the key is always null.
+  const {
+    data: pages,
+    setSize,
+    isValidating,
+    isLoading,
+    mutate,
+  } = useSWRInfinite<ChatHistoryPage>(
+    chatHistoryEnabled
+      ? (pageIndex: number, previousPageData: unknown) =>
+          getChatHistoryPaginationKey(
+            apiBase,
+            pageIndex,
+            previousPageData,
+          )
+      : () => null,
+    fetcher,
+    { fallbackData: [] },
+  );
+  // Derived views of the pages; isEmpty is also true when zero pages exist.
+  const chats = pages?.flatMap((page) => page.chats) ?? [];
+  const hasMore = pages ? !pages.some((p) => p.hasMore === false) : true;
+  const isEmpty = pages ? pages.every((p) => p.chats.length === 0) : false;
+  // Ask for one more page unless a request is in flight or none remain.
+  const loadMore = useCallback(() => {
+    if (!isValidating && hasMore) {
+      setSize((s) => s + 1);
+    }
+  }, [isValidating, hasMore, setSize]);
+  // DELETE on the server, then filter the chat out of every cached page.
+  const deleteChat = useCallback(
+    async (chatId: string) => {
+      const response = await fetch(apiUrl(apiBase, `/${chatId}`), {
+        method: "DELETE",
+      });
+      if (!response.ok) {
+        throw new Error(`Failed to delete chat: ${response.status}`);
+      }
+      mutate((histories) =>
+        histories?.map((h) => ({
+          ...h,
+          chats: h.chats.filter((c) => c.id !== chatId),
+        })),
+      );
+    },
+    [mutate, apiBase],
+  );
+  // PATCH the new title, then call mutate() bare so SWR refetches the pages.
+  const renameChat = useCallback(
+    async (chatId: string, title: string) => {
+      const response = await fetch(apiUrl(apiBase, `/${chatId}`), {
+        method: "PATCH",
+        headers: { "Content-Type": "application/json" },
+        body: JSON.stringify({ title }),
+      });
+      if (!response.ok) {
+        throw new Error(`Failed to rename chat: ${response.status}`);
+      }
+      mutate();
+    },
+    [mutate, apiBase],
+  );
+
+  return {
+    chats,
+    isLoading,
+    isValidating,
+    hasMore,
+    isEmpty,
+    loadMore,
+    deleteChat,
+    renameChat,
+    mutate,
+  };
+}
diff --git a/packages/appkit-ui/src/react/chat/hooks/use-scroll-to-bottom.ts b/packages/appkit-ui/src/react/chat/hooks/use-scroll-to-bottom.ts
new file mode 100644
index 000000000..49f95356e
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/hooks/use-scroll-to-bottom.ts
@@ -0,0 +1,63 @@
+import { useCallback, useEffect, useRef, useState } from "react";
+
+export interface UseScrollToBottomOptions {
+  /** Pixels from the bottom that still count as "at bottom". Default 50. */
+  threshold?: number;
+  /** Reactive value that triggers an auto-scroll when isAtBottom is true. */
+  trigger?: unknown;
+}
+
+export interface UseScrollToBottomReturn<T extends HTMLElement> {
+  containerRef: React.RefObject<T | null>; // element whose scroll metrics the hook reads
+  endRef: React.RefObject<HTMLDivElement | null>; // created and returned; never read by the hook
+  isAtBottom: boolean; // true while within `threshold` px of the bottom
+  scrollToBottom: (behavior?: ScrollBehavior) => void; // behavior defaults to "smooth"
+}
+
+/**
+ * Chat-style scroll helper. Reports whether the container is within
+ * `threshold` pixels of its bottom and offers an imperative
+ * `scrollToBottom`. A change of `trigger` smooth-scrolls to the bottom only
+ * while the user is already there, so scrolling up is never overridden.
+ */
+export function useScrollToBottom<T extends HTMLElement = HTMLDivElement>({
+  threshold = 50,
+  trigger,
+}: UseScrollToBottomOptions = {}): UseScrollToBottomReturn<T> {
+  const containerRef = useRef<T | null>(null);
+  const endRef = useRef<HTMLDivElement | null>(null);
+  const [isAtBottom, setIsAtBottom] = useState(true);
+
+  // Re-derive the flag from the container's current scroll metrics.
+  const handleScroll = useCallback(() => {
+    const node = containerRef.current;
+    if (!node) return;
+    const gap = node.scrollHeight - node.scrollTop - node.clientHeight;
+    setIsAtBottom(gap < threshold);
+  }, [threshold]);
+
+  // Listen for scrolls and take one measurement right away.
+  useEffect(() => {
+    const node = containerRef.current;
+    if (!node) return;
+    node.addEventListener("scroll", handleScroll, { passive: true });
+    handleScroll();
+    return () => node.removeEventListener("scroll", handleScroll);
+  }, [handleScroll]);
+
+  // Follow new content (signalled by `trigger`) while pinned to the bottom.
+  useEffect(() => {
+    void trigger;
+    const node = containerRef.current;
+    if (!isAtBottom || !node) return;
+    node.scrollTo({ top: node.scrollHeight, behavior: "smooth" });
+  }, [trigger, isAtBottom]);
+
+  // Imperative jump; a no-op until the container ref is attached.
+  const scrollToBottom = useCallback((behavior: ScrollBehavior = "smooth") => {
+    const node = containerRef.current;
+    node?.scrollTo({ top: node.scrollHeight, behavior });
+  }, []);
+
+  return { containerRef, endRef, isAtBottom, scrollToBottom };
+}
diff --git a/packages/appkit-ui/src/react/chat/index.ts b/packages/appkit-ui/src/react/chat/index.ts
new file mode 100644
index 000000000..280e2e071
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/index.ts
@@ -0,0 +1,11 @@
+export * from "./context";
+export * from "./errors";
+export * from "./headless";
+export * from "./hooks";
+export * from "./lib/messages";
+export * from "./lib/oauth";
+export * from "./lib/protocol";
+export * from "./lib/transport";
+export * from "./lib/utils";
+export * from "./provider";
+export * from "./types";
diff --git a/packages/appkit-ui/src/react/chat/lib/messages.ts b/packages/appkit-ui/src/react/chat/lib/messages.ts
new file mode 100644
index 000000000..90d11a09a
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/lib/messages.ts
@@ -0,0 +1,25 @@
+import type { UIMessagePart } from "ai";
+import type {
+  ChatCustomUIDataTypes,
+  ChatMessage,
+  ChatTools,
+  DBMessage,
+} from "../types";
+
+/**
+ * Map `DBMessage` rows (untyped JSON `parts`) onto the typed `ChatMessage`
+ * UI shape. `role` and `parts` are cast, not validated; a string `createdAt`
+ * passes through as-is and a `Date` is converted with `toISOString()`.
+ */
+export function convertToChatMessages(messages: DBMessage[]): ChatMessage[] {
+  return messages.map(({ id, role, parts, createdAt }) => {
+    const created =
+      typeof createdAt === "string" ? createdAt : createdAt.toISOString();
+    return {
+      id,
+      role: role as "user" | "assistant" | "system",
+      parts: parts as UIMessagePart<ChatCustomUIDataTypes, ChatTools>[],
+      metadata: { createdAt: created },
+    };
+  });
+}
diff --git a/packages/appkit-ui/src/react/chat/lib/oauth.ts b/packages/appkit-ui/src/react/chat/lib/oauth.ts
new file mode 100644
index 000000000..a754f1880
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/lib/oauth.ts
@@ -0,0 +1,32 @@
+/**
+ * Detection and parsing helpers for OAuth credential errors thrown when a
+ * tool call requires user authentication that hasn't been completed yet.
+ *
+ * Expected error format:
+ * "Failed request to https://... Error: Credential for user identity('___') is not found
+ * for the connection 'CONNECTION_NAME'. Please login first to the connection by visiting https://LOGIN_URL"
+ */
+
+const CREDENTIAL_ERROR_PATTERN =
+  /Credential for user identity\([^)]*\) is not found for the connection/i;
+const LOGIN_URL_PATTERN =
+  /please login first to the connection by visiting\s+(https?:\/\/[^\s]+)/i;
+const CONNECTION_NAME_PATTERN = /for the connection\s+'([^']+)'/i;
+/** True when the message contains the "Credential … is not found" phrase. */
+export function isCredentialErrorMessage(errorMessage: string): boolean {
+  return CREDENTIAL_ERROR_PATTERN.test(errorMessage);
+}
+
+/** URL after "please login first to the connection by visiting", if any. */
+export function findLoginURLFromCredentialErrorMessage(
+  errorMessage: string,
+): string | undefined {
+  return LOGIN_URL_PATTERN.exec(errorMessage)?.[1];
+}
+
+/** Name quoted in single quotes after "for the connection", if any. */
+export function findConnectionNameFromCredentialErrorMessage(
+  errorMessage: string,
+): string | undefined {
+  return CONNECTION_NAME_PATTERN.exec(errorMessage)?.[1];
+}
diff --git a/packages/appkit-ui/src/react/chat/lib/protocol.ts b/packages/appkit-ui/src/react/chat/lib/protocol.ts
new file mode 100644
index 000000000..ff1ee7d73
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/lib/protocol.ts
@@ -0,0 +1 @@
+export { VERCEL_AI_UI_MESSAGE_STREAM_MIME } from "shared";
diff --git a/packages/appkit-ui/src/react/chat/lib/transport.ts b/packages/appkit-ui/src/react/chat/lib/transport.ts
new file mode 100644
index 000000000..e735d99a0
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/lib/transport.ts
@@ -0,0 +1,43 @@
+import {
+  DefaultChatTransport,
+  type HttpChatTransportInitOptions,
+  type UIMessage,
+  type UIMessageChunk,
+} from "ai";
+
+/**
+ * `DefaultChatTransport` that also reports every parsed `UIMessageChunk` to
+ * an optional `onStreamPart` callback before passing the chunk on unchanged.
+ * This lets a caller such as `useChat` observe the first and latest chunks
+ * of a stream without parsing the response a second time.
+ */
+export class ChatTransport<
+  T extends UIMessage,
+> extends DefaultChatTransport<T> {
+  private onStreamPart: ((part: UIMessageChunk) => void) | undefined;
+
+  constructor(
+    options?: HttpChatTransportInitOptions<T> & {
+      onStreamPart?: (part: UIMessageChunk) => void;
+    },
+  ) {
+    const { onStreamPart, ...transportOptions } = options ?? {};
+    super(transportOptions);
+    this.onStreamPart = onStreamPart;
+  }
+
+  /** Pipes the parent's parsed stream through a pass-through observer. */
+  protected processResponseStream(
+    stream: ReadableStream<Uint8Array<ArrayBufferLike>>,
+  ): ReadableStream<UIMessageChunk> {
+    const notify = this.onStreamPart;
+    const parsed = super.processResponseStream(stream);
+    const observer = new TransformStream<UIMessageChunk, UIMessageChunk>({
+      transform(chunk, controller) {
+        notify?.(chunk);
+        controller.enqueue(chunk);
+      },
+    });
+    return parsed.pipeThrough(observer);
+  }
+}
diff --git a/packages/appkit-ui/src/react/chat/lib/utils.ts b/packages/appkit-ui/src/react/chat/lib/utils.ts
new file mode 100644
index 000000000..3fb92f6d7
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/lib/utils.ts
@@ -0,0 +1,56 @@
+import { ChatError, type ChatErrorCode } from "../errors";
+
+/**
+ * Builds a v4-style UUID string from `Math.random` alone. `crypto.randomUUID`
+ * is deliberately avoided: some deployment targets shim or strip it.
+ */
+export function generateUUID(): string {
+  const toHex = (value: number) => value.toString(16);
+  return "xxxxxxxx-xxxx-4xxx-yxxx-xxxxxxxxxxxx".replace(/[xy]/g, (slot) => {
+    const nibble = Math.floor(Math.random() * 16);
+    return toHex(slot === "y" ? (nibble & 0x3) | 0x8 : nibble);
+  });
+}
+
+/** Join base and path with exactly one "/" ("/" + "/x" is "/x", not "//x"). */
+export function apiUrl(apiBase: string, path: string): string {
+  return `${apiBase.replace(/\/+$/, "")}/${path.replace(/^\/+/, "")}`;
+}
+
+/**
+ * `fetch` wrapper that surfaces failures as `ChatError`s. A non-OK response
+ * has its JSON body read and is rethrown from the body's `code` and
+ * `cause`. If anything throws while `navigator.onLine` is false, the error
+ * is replaced by `ChatError("offline:chat")`; otherwise it is rethrown.
+ */
+export async function fetchWithErrorHandlers(
+  input: RequestInfo | URL,
+  init?: RequestInit,
+) {
+  try {
+    const res = await fetch(input, init);
+    if (res.ok) return res;
+
+    const { code, cause } = await res.json();
+    throw new ChatError(code as ChatErrorCode, cause);
+  } catch (err: unknown) {
+    // Being offline outranks whatever failed above (network or ChatError).
+    const offline = typeof navigator !== "undefined" && !navigator.onLine;
+    throw offline ? new ChatError("offline:chat") : err;
+  }
+}
+
+/**
+ * JSON fetcher passed to SWR. A non-OK response is thrown as a `ChatError`
+ * built from the body's `code`/`cause`; a 204 resolves to an empty page.
+ */
+export const fetcher = async (url: string) => {
+  const res = await fetch(url);
+  if (!res.ok) {
+    const { code, cause } = await res.json();
+    throw new ChatError(code as ChatErrorCode, cause);
+  }
+
+  // 204: skip body parsing and report "no chats, nothing more to load".
+  return res.status === 204 ? { chats: [], hasMore: false } : res.json();
+};
diff --git a/packages/appkit-ui/src/react/chat/provider.tsx b/packages/appkit-ui/src/react/chat/provider.tsx
new file mode 100644
index 000000000..337c423c8
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/provider.tsx
@@ -0,0 +1,87 @@
+import { type ReactNode, useMemo } from "react";
+import useSWR, { SWRConfig } from "swr";
+import { ChatContext, type ChatContextValue } from "./context";
+import type { ChatFeatures, ChatSession } from "./types";
+
+export interface ChatProviderProps {
+  /** Base URL for the chat API (e.g. "/api/chat") */
+  apiBase?: string;
+  /** Base path for client-side routing (e.g. "/chat") */
+  basePath?: string;
+  /** Feature flags — auto-fetched from the /config endpoint when omitted */
+  features?: Partial<ChatFeatures>;
+  /** User session — auto-fetched from the /session endpoint when omitted */
+  session?: ChatSession;
+  /** Called when the library wants to navigate to a chat (e.g. after creating a new one) */
+  onNavigate?: (chatId: string) => void;
+  children: ReactNode;
+}
+
+const jsonFetcher = async (url: string) => {
+  const res = await fetch(url, { credentials: "include" }); // send credentials
+  if (!res.ok) throw new Error(`Fetch failed: ${url}`); // status outside 200-299
+  return res.json();
+};
+
+export function ChatProvider({
+  apiBase = "/api/chat",
+  basePath = "/",
+  features: featuresProp,
+  session: sessionProp,
+  onNavigate,
+  children,
+}: ChatProviderProps) {
+  const shouldFetchConfig = featuresProp === undefined; // null SWR key otherwise
+  const { data: serverConfig, isLoading: configLoading } = useSWR<{
+    features: ChatFeatures;
+  }>(shouldFetchConfig ? `${apiBase}/config` : null, jsonFetcher, {
+    revalidateOnFocus: false,
+    revalidateOnReconnect: false,
+    dedupingInterval: 60000,
+  });
+  // The session is likewise requested only when no `session` prop is passed.
+  const shouldFetchSession = sessionProp === undefined;
+  const { data: serverSession, isLoading: sessionLoading } =
+    useSWR<ChatSession>(
+      shouldFetchSession ? `${apiBase}/session` : null,
+      jsonFetcher,
+      { revalidateOnFocus: false },
+    );
+  // Each flag resolves as: prop, else server config, else a built-in default.
+  const features: ChatFeatures = useMemo(
+    () => ({
+      chatHistory:
+        featuresProp?.chatHistory ??
+        serverConfig?.features?.chatHistory ??
+        true,
+      feedback:
+        featuresProp?.feedback ?? serverConfig?.features?.feedback ?? false,
+    }),
+    [featuresProp, serverConfig],
+  );
+  // Prop wins over the fetched session; null when neither is available.
+  const session = sessionProp ?? serverSession ?? null;
+  const isLoading =
+    (shouldFetchConfig && configLoading) ||
+    (shouldFetchSession && sessionLoading);
+  // Memoized so the context value keeps its identity until an input changes.
+  const value: ChatContextValue = useMemo(
+    () => ({
+      apiBase,
+      basePath,
+      features,
+      chatHistoryEnabled: features.chatHistory,
+      feedbackEnabled: features.feedback,
+      session,
+      isLoading,
+      onNavigate,
+    }),
+    [apiBase, basePath, features, session, isLoading, onNavigate],
+  );
+
+  return (
+    <SWRConfig value={{ dedupingInterval: 2000 }}>
+      <ChatContext.Provider value={value}>{children}</ChatContext.Provider>
+    </SWRConfig>
+  );
+}
diff --git a/packages/appkit-ui/src/react/chat/types.ts b/packages/appkit-ui/src/react/chat/types.ts
new file mode 100644
index 000000000..855fa1299
--- /dev/null
+++ b/packages/appkit-ui/src/react/chat/types.ts
@@ -0,0 +1,86 @@
+import type { LanguageModelUsage, UIMessage } from "ai";
+
+// Custom data types for the AI SDK stream
+
+export type ChatCustomUIDataTypes = {
+  error: string;
+  usage: LanguageModelUsage;
+  traceId: string | null;
+  title: string;
+};
+
+type MessageMetadata = {
+  createdAt: string;
+};
+
+// biome-ignore lint/complexity/noBannedTypes: empty default tool registry — consumers extend this type
+export type ChatTools = {};
+
+export type ChatMessage = UIMessage<MessageMetadata, ChatCustomUIDataTypes>;
+
+// Domain types
+
+export interface ChatAttachment {
+  name: string;
+  url: string;
+  contentType: string;
+}
+
+export type ChatVisibilityType = "private" | "public";
+
+export interface ChatFeedback {
+  messageId: string;
+  feedbackType: "thumbs_up" | "thumbs_down";
+  assessmentId: string | null;
+}
+
+export type ChatFeedbackMap = Record<string, ChatFeedback>;
+
+export interface ChatSession {
+  user: {
+    email: string;
+    name?: string;
+    preferredUsername?: string;
+  } | null;
+}
+
+export interface Chat {
+  id: string;
+  createdAt: Date;
+  title: string;
+  userId: string;
+  visibility: "public" | "private";
+  lastContext: {
+    inputTokens?: {
+      total?: number;
+      noCache?: number;
+      cacheRead?: number;
+      cacheWrite?: number;
+    };
+    outputTokens?: {
+      total?: number;
+      text?: number;
+      reasoning?: number;
+    };
+  } | null;
+}
+
+export interface DBMessage {
+  id: string;
+  chatId: string;
+  role: string; // cast to "user" | "assistant" | "system" by convertToChatMessages
+  parts: unknown; // cast to UIMessagePart[] by convertToChatMessages, not validated
+  attachments: unknown;
+  createdAt: Date; // convertToChatMessages also accepts a string here at runtime
+  traceId: string | null;
+}
+
+export interface ChatFeatures {
+  chatHistory: boolean;
+  feedback: boolean;
+}
+
+export interface ChatHistoryPage {
+  chats: Array<Chat>;
+  hasMore: boolean;
+}
diff --git a/packages/appkit-ui/tsdown.config.ts b/packages/appkit-ui/tsdown.config.ts
index f55a51457..2c9932391 100644
--- a/packages/appkit-ui/tsdown.config.ts
+++ b/packages/appkit-ui/tsdown.config.ts
@@ -9,6 +9,7 @@ export default defineConfig([
       "src/js/beta.ts",
       "src/react/index.ts",
       "src/react/beta.ts",
+      "src/react/chat/index.ts",
     ],
     outDir: "dist",
     platform: "browser",
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index 8c6a34ddf..99883508e 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -31,7 +31,7 @@ importers:
         version: 10.4.1
       '@testing-library/react':
         specifier: 16.3.0
-        version: 16.3.0(@testing-library/dom@10.4.1)(@types/react-dom@19.2.3(@types/react@19.2.7))(@types/react@19.2.7)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 16.3.0(@testing-library/dom@10.4.1)(@types/react-dom@19.2.3(@types/react@19.2.7))(@types/react@19.2.7)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@types/node':
         specifier: 24.7.2
         version: 24.7.2
@@ -365,85 +365,85 @@ importers:
     dependencies:
       '@radix-ui/react-accordion':
         specifier: 1.2.12
-        version: 1.2.12(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.2.12(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-alert-dialog':
         specifier: 1.1.15
-        version: 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-aspect-ratio':
         specifier: 1.1.8
-        version: 1.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-avatar':
         specifier: 1.1.11
-        version: 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-checkbox':
         specifier: 1.3.3
-        version: 1.3.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.3.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-collapsible':
         specifier: 1.1.12
-        version: 1.1.12(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.12(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-context-menu':
         specifier: 2.2.16
-        version: 2.2.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 2.2.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-dialog':
         specifier: 1.1.15
-        version: 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-dropdown-menu':
         specifier: 2.1.16
-        version: 2.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 2.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-hover-card':
         specifier: 1.1.15
-        version: 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-label':
         specifier: 2.1.8
-        version: 2.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 2.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-menubar':
         specifier: 1.1.16
-        version: 1.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-navigation-menu':
         specifier: 1.2.14
-        version: 1.2.14(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.2.14(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-popover':
         specifier: 1.1.15
-        version: 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-progress':
         specifier: 1.1.8
-        version: 1.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-radio-group':
         specifier: 1.3.8
-        version: 1.3.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.3.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-scroll-area':
         specifier: 1.2.10
-        version: 1.2.10(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.2.10(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-select':
         specifier: 2.2.6
-        version: 2.2.6(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 2.2.6(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-separator':
         specifier: 1.1.8
-        version: 1.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-slider':
         specifier: 1.3.6
-        version: 1.3.6(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.3.6(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-slot':
         specifier: 1.2.4
-        version: 1.2.4(@types/react@19.2.2)(react@19.2.0)
+        version: 1.2.4(@types/react@19.2.2)(react@19.2.5)
       '@radix-ui/react-switch':
         specifier: 1.2.6
-        version: 1.2.6(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.2.6(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-tabs':
         specifier: 1.1.13
-        version: 1.1.13(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.13(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-toggle':
         specifier: 1.1.10
-        version: 1.1.10(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.10(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-toggle-group':
         specifier: 1.1.11
-        version: 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@radix-ui/react-tooltip':
         specifier: 1.2.8
-        version: 1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       '@tanstack/react-table':
         specifier: 8.21.3
-        version: 8.21.3(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 8.21.3(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       apache-arrow:
         specifier: 21.1.0
         version: 21.1.0
@@ -455,7 +455,7 @@ importers:
         version: 2.1.1
       cmdk:
         specifier: 1.1.1
-        version: 1.1.1(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.1(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       dompurify:
         specifier: 3.3.3
         version: 3.3.3
@@ -464,59 +464,68 @@ importers:
         version: 6.0.0
       echarts-for-react:
         specifier: 3.0.5
-        version: 3.0.5(echarts@6.0.0)(react@19.2.0)
+        version: 3.0.5(echarts@6.0.0)(react@19.2.5)
       embla-carousel-react:
         specifier: 8.6.0
-        version: 8.6.0(react@19.2.0)
+        version: 8.6.0(react@19.2.5)
       input-otp:
         specifier: 1.4.2
-        version: 1.4.2(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.4.2(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       lucide-react:
         specifier: 0.554.0
-        version: 0.554.0(react@19.2.0)
+        version: 0.554.0(react@19.2.5)
       marked:
         specifier: 17.0.3
         version: 17.0.3
       next-themes:
         specifier: 0.4.6
-        version: 0.4.6(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 0.4.6(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       react-day-picker:
         specifier: 9.12.0
-        version: 9.12.0(react@19.2.0)
+        version: 9.12.0(react@19.2.5)
       react-hook-form:
         specifier: 7.68.0
-        version: 7.68.0(react@19.2.0)
+        version: 7.68.0(react@19.2.5)
       react-resizable-panels:
         specifier: 3.0.6
-        version: 3.0.6(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 3.0.6(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       shared:
         specifier: workspace:*
         version: link:../shared
       sonner:
         specifier: 2.0.7
-        version: 2.0.7(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 2.0.7(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       tailwind-merge:
         specifier: 3.4.0
         version: 3.4.0
       vaul:
         specifier: 1.1.2
-        version: 1.1.2(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 1.1.2(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
     devDependencies:
+      '@ai-sdk/react':
+        specifier: 4.0.0-beta.76
+        version: 4.0.0-beta.76(react@19.2.5)(zod@4.1.13)
       '@types/react':
         specifier: 19.2.2
         version: 19.2.2
       '@types/react-dom':
         specifier: 19.2.2
         version: 19.2.2(@types/react@19.2.2)
+      ai:
+        specifier: 7.0.0-beta.76
+        version: 7.0.0-beta.76(zod@4.1.13)
       react:
-        specifier: 19.2.0
-        version: 19.2.0
+        specifier: 19.2.5
+        version: 19.2.5
       react-dom:
-        specifier: 19.2.0
-        version: 19.2.0(react@19.2.0)
+        specifier: 19.2.5
+        version: 19.2.5(react@19.2.5)
       recharts:
         specifier: 2.15.4
-        version: 2.15.4(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+        version: 2.15.4(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      swr:
+        specifier: 2.4.1
+        version: 2.4.1(react@19.2.5)
       tailwindcss:
         specifier: 4.1.17
         version: 4.1.17
@@ -599,6 +608,12 @@ packages:
       zod:
         optional: true
 
+  '@ai-sdk/react@4.0.0-beta.76':
+    resolution: {integrity: sha512-M5CMl+wlIZexdN+gJG06WPW6F88JFFzjwC1dEyeVNLztxDnZn8VpJy6WDNEo3QgUWjinWJCOnLDLP9qPBzTSSA==}
+    engines: {node: '>=18'}
+    peerDependencies:
+      react: ^18 || ~19.0.1 || ~19.1.2 || ^19.2.1
+
   '@algolia/abtesting@1.12.0':
     resolution: {integrity: sha512-EfW0bfxjPs+C7ANkJDw2TATntfBKsFiy7APh+KO0pQ8A6HYa5I0NjFuCGCXWfzzzLXNZta3QUl3n5Kmm6aJo9Q==}
     engines: {node: '>= 14.0.0'}
@@ -9960,6 +9975,11 @@ packages:
     peerDependencies:
       react: ^19.2.0
 
+  react-dom@19.2.5:
+    resolution: {integrity: sha512-J5bAZz+DXMMwW/wV3xzKke59Af6CHY7G4uYLN1OvBcKEsWOs4pQExj86BBKamxl/Ik5bx9whOrvBlSDfWzgSag==}
+    peerDependencies:
+      react: ^19.2.5
+
   react-fast-compare@3.2.2:
     resolution: {integrity: sha512-nsO+KSNgo1SbJqJEYRE9ERzo7YtYbou/OqjSQKxV7jcKox7+usiUVZOAC+XnDOABXggQTno0Y1CpVnuWEc1boQ==}
 
@@ -10067,6 +10087,10 @@ packages:
     resolution: {integrity: sha512-tmbWg6W31tQLeB5cdIBOicJDJRR2KzXsV7uSK9iNfLWQ5bIZfxuPEHp7M8wiHyHnn0DD1i7w3Zmin0FtkrwoCQ==}
     engines: {node: '>=0.10.0'}
 
+  react@19.2.5:
+    resolution: {integrity: sha512-llUJLzz1zTUBrskt2pwZgLq59AemifIftw4aB7JxOqf1HY2FDaGDxgwpAPVzHU1kdWabH7FauP4i1oEeer2WCA==}
+    engines: {node: '>=0.10.0'}
+
   read-cmd-shim@6.0.0:
     resolution: {integrity: sha512-1zM5HuOfagXCBWMN83fuFI/x+T/UhZ7k+KIzhrHXcQoeX5+7gmaDYjELQHmmzIodumBHeByBJT4QYS7ufAgs7A==}
     engines: {node: ^20.17.0 || >=22.9.0}
@@ -10832,8 +10856,8 @@ packages:
     engines: {node: '>=14.0.0'}
     hasBin: true
 
-  swr@2.3.8:
-    resolution: {integrity: sha512-gaCPRVoMq8WGDcWj9p4YWzCMPHzE0WNl6W8ADIx9c3JBEIdMkJGMzW+uzXvxHMltwcYACr9jP+32H8/hgwMR7w==}
+  swr@2.4.1:
+    resolution: {integrity: sha512-2CC6CiKQtEwaEeNiqWTAw9PGykW8SR5zZX8MZk6TeAvEAnVS7Visz8WzphqgtQ8v2xz/4Q5K+j+SeMaKXeeQIA==}
     peerDependencies:
       react: ^16.11.0 || ^17.0.0 || ^18.0.0 || ^19.0.0
 
@@ -11939,11 +11963,21 @@ snapshots:
       '@ai-sdk/provider-utils': 3.0.19(zod@4.3.6)
       ai: 5.0.113(zod@4.3.6)
       react: 19.2.0
-      swr: 2.3.8(react@19.2.0)
+      swr: 2.4.1(react@19.2.0)
       throttleit: 2.1.0
     optionalDependencies:
       zod: 4.3.6
 
+  '@ai-sdk/react@4.0.0-beta.76(react@19.2.5)(zod@4.1.13)':
+    dependencies:
+      '@ai-sdk/provider-utils': 5.0.0-beta.16(zod@4.1.13)
+      ai: 7.0.0-beta.76(zod@4.1.13)
+      react: 19.2.5
+      swr: 2.4.1(react@19.2.5)
+      throttleit: 2.1.0
+    transitivePeerDependencies:
+      - zod
+
   '@algolia/abtesting@1.12.0':
     dependencies:
       '@algolia/client-common': 5.46.0
@@ -14549,11 +14583,11 @@ snapshots:
       '@floating-ui/core': 1.7.3
       '@floating-ui/utils': 0.2.10
 
-  '@floating-ui/react-dom@2.1.6(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@floating-ui/react-dom@2.1.6(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@floating-ui/dom': 1.7.4
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
 
   '@floating-ui/utils@0.2.10': {}
 
@@ -15828,671 +15862,671 @@ snapshots:
 
   '@radix-ui/primitive@1.1.3': {}
 
-  '@radix-ui/react-accordion@1.2.12(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-accordion@1.2.12(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-collapsible': 1.1.12(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-collapsible': 1.1.12(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-alert-dialog@1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-alert-dialog@1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-dialog': 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-dialog': 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-arrow@1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-arrow@1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-aspect-ratio@1.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-aspect-ratio@1.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-primitive': 2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-primitive': 2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-avatar@1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-avatar@1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-context': 1.1.3(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-is-hydrated': 0.1.0(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-context': 1.1.3(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-is-hydrated': 0.1.0(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-checkbox@1.3.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-checkbox@1.3.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-previous': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-size': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-previous': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-size': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-collapsible@1.1.12(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-collapsible@1.1.12(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-collection@1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-collection@1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-compose-refs@1.1.2(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-compose-refs@1.1.2(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      react: 19.2.0
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-context-menu@2.2.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-context-menu@2.2.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-menu': 2.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-menu': 2.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-context@1.1.2(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-context@1.1.2(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      react: 19.2.0
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-context@1.1.3(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-context@1.1.3(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      react: 19.2.0
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-dialog@1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-dialog@1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-focus-guards': 1.1.3(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-focus-scope': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-portal': 1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-focus-guards': 1.1.3(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-focus-scope': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-portal': 1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
       aria-hidden: 1.2.6
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
-      react-remove-scroll: 2.7.1(@types/react@19.2.2)(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
+      react-remove-scroll: 2.7.1(@types/react@19.2.2)(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-direction@1.1.1(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-direction@1.1.1(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      react: 19.2.0
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-dismissable-layer@1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-dismissable-layer@1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-escape-keydown': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-escape-keydown': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-dropdown-menu@2.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-dropdown-menu@2.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-menu': 2.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-menu': 2.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-focus-guards@1.1.3(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-focus-guards@1.1.3(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      react: 19.2.0
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-focus-scope@1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-focus-scope@1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-hover-card@1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-hover-card@1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-popper': 1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-portal': 1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-popper': 1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-portal': 1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-id@1.1.1(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-id@1.1.1(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
+      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-label@2.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-label@2.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-primitive': 2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-primitive': 2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-menu@2.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-menu@2.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-focus-guards': 1.1.3(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-focus-scope': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-popper': 1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-portal': 1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-roving-focus': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.0)
+      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-focus-guards': 1.1.3(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-focus-scope': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-popper': 1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-portal': 1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-roving-focus': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.5)
       aria-hidden: 1.2.6
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
-      react-remove-scroll: 2.7.1(@types/react@19.2.2)(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
+      react-remove-scroll: 2.7.1(@types/react@19.2.2)(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-menubar@1.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-menubar@1.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-menu': 2.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-roving-focus': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-menu': 2.1.16(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-roving-focus': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-navigation-menu@1.2.14(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-navigation-menu@1.2.14(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-previous': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-visually-hidden': 1.2.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-previous': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-visually-hidden': 1.2.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-popover@1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-popover@1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-focus-guards': 1.1.3(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-focus-scope': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-popper': 1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-portal': 1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-focus-guards': 1.1.3(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-focus-scope': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-popper': 1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-portal': 1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
       aria-hidden: 1.2.6
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
-      react-remove-scroll: 2.7.1(@types/react@19.2.2)(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
+      react-remove-scroll: 2.7.1(@types/react@19.2.2)(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-popper@1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
-    dependencies:
-      '@floating-ui/react-dom': 2.1.6(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-arrow': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-rect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-size': 1.1.1(@types/react@19.2.2)(react@19.2.0)
+  '@radix-ui/react-popper@1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
+    dependencies:
+      '@floating-ui/react-dom': 2.1.6(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-arrow': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-rect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-size': 1.1.1(@types/react@19.2.2)(react@19.2.5)
       '@radix-ui/rect': 1.1.1
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-portal@1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-portal@1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-presence@1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-presence@1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-primitive@2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-primitive@2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-primitive@2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-primitive@2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-slot': 1.2.4(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-slot': 1.2.4(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-progress@1.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-progress@1.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-context': 1.1.3(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-context': 1.1.3(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-radio-group@1.3.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-radio-group@1.3.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-roving-focus': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-previous': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-size': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-roving-focus': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-previous': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-size': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-roving-focus@1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-roving-focus@1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-scroll-area@1.2.10(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-scroll-area@1.2.10(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/number': 1.1.1
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-select@2.2.6(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-select@2.2.6(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/number': 1.1.1
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-focus-guards': 1.1.3(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-focus-scope': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-popper': 1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-portal': 1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-previous': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-visually-hidden': 1.2.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-focus-guards': 1.1.3(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-focus-scope': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-popper': 1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-portal': 1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-previous': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-visually-hidden': 1.2.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       aria-hidden: 1.2.6
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
-      react-remove-scroll: 2.7.1(@types/react@19.2.2)(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
+      react-remove-scroll: 2.7.1(@types/react@19.2.2)(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-separator@1.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-separator@1.1.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-primitive': 2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-primitive': 2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-slider@1.3.6(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-slider@1.3.6(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/number': 1.1.1
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-previous': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-size': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-collection': 1.1.7(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-previous': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-size': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-slot@1.2.3(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-slot@1.2.3(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-slot@1.2.4(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-slot@1.2.4(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-switch@1.2.6(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-switch@1.2.6(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-previous': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-size': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-previous': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-size': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-tabs@1.1.13(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-tabs@1.1.13(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-roving-focus': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-roving-focus': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-toggle-group@1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-toggle-group@1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-roving-focus': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-toggle': 1.1.10(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-direction': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-roving-focus': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-toggle': 1.1.10(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-toggle@1.1.10(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-toggle@1.1.10(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-tooltip@1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-tooltip@1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@radix-ui/primitive': 1.1.3
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-popper': 1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-portal': 1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-visually-hidden': 1.2.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-context': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-dismissable-layer': 1.1.11(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-popper': 1.2.8(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-portal': 1.1.9(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-presence': 1.1.5(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-slot': 1.2.3(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-controllable-state': 1.2.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-visually-hidden': 1.2.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
 
-  '@radix-ui/react-use-callback-ref@1.1.1(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-use-callback-ref@1.1.1(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      react: 19.2.0
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-use-controllable-state@1.2.2(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-use-controllable-state@1.2.2(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-use-effect-event': 0.0.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
+      '@radix-ui/react-use-effect-event': 0.0.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-use-effect-event@0.0.2(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-use-effect-event@0.0.2(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
+      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-use-escape-keydown@1.1.1(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-use-escape-keydown@1.1.1(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
+      '@radix-ui/react-use-callback-ref': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-use-is-hydrated@0.1.0(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-use-is-hydrated@0.1.0(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      react: 19.2.0
-      use-sync-external-store: 1.6.0(react@19.2.0)
+      react: 19.2.5
+      use-sync-external-store: 1.6.0(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-use-layout-effect@1.1.1(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-use-layout-effect@1.1.1(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      react: 19.2.0
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-use-previous@1.1.1(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-use-previous@1.1.1(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      react: 19.2.0
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-use-rect@1.1.1(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-use-rect@1.1.1(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
       '@radix-ui/rect': 1.1.1
-      react: 19.2.0
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-use-size@1.1.1(@types/react@19.2.2)(react@19.2.0)':
+  '@radix-ui/react-use-size@1.1.1(@types/react@19.2.2)(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      react: 19.2.0
+      '@radix-ui/react-use-layout-effect': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      react: 19.2.5
     optionalDependencies:
       '@types/react': 19.2.2
 
-  '@radix-ui/react-visually-hidden@1.2.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@radix-ui/react-visually-hidden@1.2.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
-      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-primitive': 2.1.3(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
       '@types/react-dom': 19.2.2(@types/react@19.2.2)
@@ -16970,11 +17004,11 @@ snapshots:
       postcss: 8.5.6
       tailwindcss: 4.1.18
 
-  '@tanstack/react-table@8.21.3(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@tanstack/react-table@8.21.3(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@tanstack/table-core': 8.21.3
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
 
   '@tanstack/table-core@8.21.3': {}
 
@@ -16989,12 +17023,12 @@ snapshots:
       picocolors: 1.1.1
       pretty-format: 27.5.1
 
-  '@testing-library/react@16.3.0(@testing-library/dom@10.4.1)(@types/react-dom@19.2.3(@types/react@19.2.7))(@types/react@19.2.7)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)':
+  '@testing-library/react@16.3.0(@testing-library/dom@10.4.1)(@types/react-dom@19.2.3(@types/react@19.2.7))(@types/react@19.2.7)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)':
     dependencies:
       '@babel/runtime': 7.28.6
       '@testing-library/dom': 10.4.1
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.7
       '@types/react-dom': 19.2.3(@types/react@19.2.7)
@@ -18411,14 +18445,14 @@ snapshots:
 
   cmd-shim@8.0.0: {}
 
-  cmdk@1.1.1(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0):
+  cmdk@1.1.1(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5):
     dependencies:
-      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-dialog': 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.0)
-      '@radix-ui/react-primitive': 2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-compose-refs': 1.1.2(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-dialog': 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      '@radix-ui/react-id': 1.1.1(@types/react@19.2.2)(react@19.2.5)
+      '@radix-ui/react-primitive': 2.1.4(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     transitivePeerDependencies:
       - '@types/react'
       - '@types/react-dom'
@@ -19256,11 +19290,11 @@ snapshots:
     dependencies:
       safe-buffer: 5.2.1
 
-  echarts-for-react@3.0.5(echarts@6.0.0)(react@19.2.0):
+  echarts-for-react@3.0.5(echarts@6.0.0)(react@19.2.5):
     dependencies:
       echarts: 6.0.0
       fast-deep-equal: 3.1.3
-      react: 19.2.0
+      react: 19.2.5
       size-sensor: 1.0.2
 
   echarts@6.0.0:
@@ -19276,11 +19310,11 @@ snapshots:
 
   electron-to-chromium@1.5.267: {}
 
-  embla-carousel-react@8.6.0(react@19.2.0):
+  embla-carousel-react@8.6.0(react@19.2.5):
     dependencies:
       embla-carousel: 8.6.0
       embla-carousel-reactive-utils: 8.6.0(embla-carousel@8.6.0)
-      react: 19.2.0
+      react: 19.2.5
 
   embla-carousel-reactive-utils@8.6.0(embla-carousel@8.6.0):
     dependencies:
@@ -20621,10 +20655,10 @@ snapshots:
 
   inline-style-parser@0.2.7: {}
 
-  input-otp@1.4.2(react-dom@19.2.0(react@19.2.0))(react@19.2.0):
+  input-otp@1.4.2(react-dom@19.2.5(react@19.2.5))(react@19.2.5):
     dependencies:
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
 
   inquirer@12.11.1(@types/node@24.7.2):
     dependencies:
@@ -21204,9 +21238,9 @@ snapshots:
 
   lru-cache@7.18.3: {}
 
-  lucide-react@0.554.0(react@19.2.0):
+  lucide-react@0.554.0(react@19.2.5):
     dependencies:
-      react: 19.2.0
+      react: 19.2.5
 
   lunr-languages@1.14.0: {}
 
@@ -21971,10 +22005,10 @@ snapshots:
     dependencies:
       type-fest: 2.19.0
 
-  next-themes@0.4.6(react-dom@19.2.0(react@19.2.0))(react@19.2.0):
+  next-themes@0.4.6(react-dom@19.2.5(react@19.2.5))(react@19.2.5):
     dependencies:
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
 
   no-case@3.0.4:
     dependencies:
@@ -23104,12 +23138,12 @@ snapshots:
       minimist: 1.2.8
       strip-json-comments: 2.0.1
 
-  react-day-picker@9.12.0(react@19.2.0):
+  react-day-picker@9.12.0(react@19.2.5):
     dependencies:
       '@date-fns/tz': 1.4.1
       date-fns: 4.1.0
       date-fns-jalali: 4.1.0-0
-      react: 19.2.0
+      react: 19.2.5
 
   react-docgen-typescript@2.4.0(typescript@5.6.3):
     dependencies:
@@ -23120,11 +23154,16 @@ snapshots:
       react: 19.2.0
       scheduler: 0.27.0
 
+  react-dom@19.2.5(react@19.2.5):
+    dependencies:
+      react: 19.2.5
+      scheduler: 0.27.0
+
   react-fast-compare@3.2.2: {}
 
-  react-hook-form@7.68.0(react@19.2.0):
+  react-hook-form@7.68.0(react@19.2.5):
     dependencies:
-      react: 19.2.0
+      react: 19.2.5
 
   react-is@16.13.1: {}
 
@@ -23146,29 +23185,29 @@ snapshots:
 
   react-refresh@0.18.0: {}
 
-  react-remove-scroll-bar@2.3.8(@types/react@19.2.2)(react@19.2.0):
+  react-remove-scroll-bar@2.3.8(@types/react@19.2.2)(react@19.2.5):
     dependencies:
-      react: 19.2.0
-      react-style-singleton: 2.2.3(@types/react@19.2.2)(react@19.2.0)
+      react: 19.2.5
+      react-style-singleton: 2.2.3(@types/react@19.2.2)(react@19.2.5)
       tslib: 2.8.1
     optionalDependencies:
       '@types/react': 19.2.2
 
-  react-remove-scroll@2.7.1(@types/react@19.2.2)(react@19.2.0):
+  react-remove-scroll@2.7.1(@types/react@19.2.2)(react@19.2.5):
     dependencies:
-      react: 19.2.0
-      react-remove-scroll-bar: 2.3.8(@types/react@19.2.2)(react@19.2.0)
-      react-style-singleton: 2.2.3(@types/react@19.2.2)(react@19.2.0)
+      react: 19.2.5
+      react-remove-scroll-bar: 2.3.8(@types/react@19.2.2)(react@19.2.5)
+      react-style-singleton: 2.2.3(@types/react@19.2.2)(react@19.2.5)
       tslib: 2.8.1
-      use-callback-ref: 1.3.3(@types/react@19.2.2)(react@19.2.0)
-      use-sidecar: 1.1.3(@types/react@19.2.2)(react@19.2.0)
+      use-callback-ref: 1.3.3(@types/react@19.2.2)(react@19.2.5)
+      use-sidecar: 1.1.3(@types/react@19.2.2)(react@19.2.5)
     optionalDependencies:
       '@types/react': 19.2.2
 
-  react-resizable-panels@3.0.6(react-dom@19.2.0(react@19.2.0))(react@19.2.0):
+  react-resizable-panels@3.0.6(react-dom@19.2.5(react@19.2.5))(react@19.2.5):
     dependencies:
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
 
   react-router-config@5.1.1(react-router@5.3.4(react@19.2.0))(react@19.2.0):
     dependencies:
@@ -23200,33 +23239,35 @@ snapshots:
       tiny-invariant: 1.3.3
       tiny-warning: 1.0.3
 
-  react-smooth@4.0.4(react-dom@19.2.0(react@19.2.0))(react@19.2.0):
+  react-smooth@4.0.4(react-dom@19.2.5(react@19.2.5))(react@19.2.5):
     dependencies:
       fast-equals: 5.3.3
       prop-types: 15.8.1
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
-      react-transition-group: 4.4.5(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
+      react-transition-group: 4.4.5(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
 
-  react-style-singleton@2.2.3(@types/react@19.2.2)(react@19.2.0):
+  react-style-singleton@2.2.3(@types/react@19.2.2)(react@19.2.5):
     dependencies:
       get-nonce: 1.0.1
-      react: 19.2.0
+      react: 19.2.5
       tslib: 2.8.1
     optionalDependencies:
       '@types/react': 19.2.2
 
-  react-transition-group@4.4.5(react-dom@19.2.0(react@19.2.0))(react@19.2.0):
+  react-transition-group@4.4.5(react-dom@19.2.5(react@19.2.5))(react@19.2.5):
     dependencies:
       '@babel/runtime': 7.28.6
       dom-helpers: 5.2.1
       loose-envify: 1.4.0
       prop-types: 15.8.1
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
 
   react@19.2.0: {}
 
+  react@19.2.5: {}
+
   read-cmd-shim@6.0.0: {}
 
   read-package-json-fast@5.0.0:
@@ -23260,15 +23301,15 @@ snapshots:
     dependencies:
       decimal.js-light: 2.5.1
 
-  recharts@2.15.4(react-dom@19.2.0(react@19.2.0))(react@19.2.0):
+  recharts@2.15.4(react-dom@19.2.5(react@19.2.5))(react@19.2.5):
     dependencies:
       clsx: 2.1.1
       eventemitter3: 4.0.7
       lodash: 4.17.21
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
       react-is: 18.3.1
-      react-smooth: 4.0.4(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
+      react-smooth: 4.0.4(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
       recharts-scale: 0.4.5
       tiny-invariant: 1.3.3
       victory-vendor: 36.9.2
@@ -24007,10 +24048,10 @@ snapshots:
       ip-address: 10.1.0
       smart-buffer: 4.2.0
 
-  sonner@2.0.7(react-dom@19.2.0(react@19.2.0))(react@19.2.0):
+  sonner@2.0.7(react-dom@19.2.5(react@19.2.5))(react@19.2.5):
     dependencies:
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
 
   sort-css-media-queries@2.2.0: {}
 
@@ -24199,12 +24240,18 @@ snapshots:
       csso: 5.0.5
       picocolors: 1.1.1
 
-  swr@2.3.8(react@19.2.0):
+  swr@2.4.1(react@19.2.0):
     dependencies:
       dequal: 2.0.3
       react: 19.2.0
       use-sync-external-store: 1.6.0(react@19.2.0)
 
+  swr@2.4.1(react@19.2.5):
+    dependencies:
+      dequal: 2.0.3
+      react: 19.2.5
+      use-sync-external-store: 1.6.0(react@19.2.5)
+
   symbol-tree@3.2.4: {}
 
   table-layout@4.1.1:
@@ -24711,17 +24758,17 @@ snapshots:
     optionalDependencies:
       file-loader: 6.2.0(webpack@5.103.0)
 
-  use-callback-ref@1.3.3(@types/react@19.2.2)(react@19.2.0):
+  use-callback-ref@1.3.3(@types/react@19.2.2)(react@19.2.5):
     dependencies:
-      react: 19.2.0
+      react: 19.2.5
       tslib: 2.8.1
     optionalDependencies:
       '@types/react': 19.2.2
 
-  use-sidecar@1.1.3(@types/react@19.2.2)(react@19.2.0):
+  use-sidecar@1.1.3(@types/react@19.2.2)(react@19.2.5):
     dependencies:
       detect-node-es: 1.1.0
-      react: 19.2.0
+      react: 19.2.5
       tslib: 2.8.1
     optionalDependencies:
       '@types/react': 19.2.2
@@ -24730,6 +24777,10 @@ snapshots:
     dependencies:
       react: 19.2.0
 
+  use-sync-external-store@1.6.0(react@19.2.5):
+    dependencies:
+      react: 19.2.5
+
   util-deprecate@1.0.2: {}
 
   utila@0.4.0: {}
@@ -24759,11 +24810,11 @@ snapshots:
 
   vary@1.1.2: {}
 
-  vaul@1.1.2(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0):
+  vaul@1.1.2(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5):
     dependencies:
-      '@radix-ui/react-dialog': 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.0(react@19.2.0))(react@19.2.0)
-      react: 19.2.0
-      react-dom: 19.2.0(react@19.2.0)
+      '@radix-ui/react-dialog': 1.1.15(@types/react-dom@19.2.2(@types/react@19.2.2))(@types/react@19.2.2)(react-dom@19.2.5(react@19.2.5))(react@19.2.5)
+      react: 19.2.5
+      react-dom: 19.2.5(react@19.2.5)
     transitivePeerDependencies:
       - '@types/react'
       - '@types/react-dom'