From 5a7a4df431904c810c2007e857ce6ed35a3cb2f3 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Tue, 21 Apr 2026 19:46:14 +0200
Subject: [PATCH 1/6] feat(appkit): tool primitives and ToolProvider surfaces
 on core plugins
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Second layer of the agents feature. Adds the primitives for defining
agent tools and implements them on every core ToolProvider plugin.

### User-facing factories

- `tool(config)` — inline function tools backed by a Zod schema.
  Auto-generates JSON Schema for the LLM via `z.toJSONSchema()` (stripping
  the top-level `$schema` annotation that Gemini rejects), validates
  tool-call arguments at runtime, and returns an LLM-friendly error string
  on validation failure so the model can self-correct.
- `mcpServer(name, url)` — tiny factory for hosted custom MCP server
  configs. Replaces the verbose
  `{ type: "custom_mcp_server", custom_mcp_server: { app_name, app_url } }`
  wrapper.
- `FunctionTool` / `HostedTool` types + `isFunctionTool` / `isHostedTool`
  type guards. `HostedTool` is a union of Genie, VectorSearch, custom
  MCP, and external-connection configs.
- `ToolkitEntry` + `ToolkitOptions` types + `isToolkitEntry` guard.
  `AgentTool = FunctionTool | HostedTool | ToolkitEntry` is the canonical
  union later PRs spread into agent definitions.

### Internal registry + JSON Schema helper

- `defineTool(config)` + `ToolRegistry` — plugin authors' internal shape
  for declaring a keyed set of tools with Zod-typed handlers.
- `toolsFromRegistry()` — produces the `AgentToolDefinition[]` exposed
  via `ToolProvider.getAgentTools()`.
- `executeFromRegistry()` — validates args then dispatches to the
  handler. Returns LLM-friendly errors on bad args.
- `toToolJSONSchema()` — shared helper at
  `packages/appkit/src/plugins/agents/tools/json-schema.ts` that wraps
  `toJSONSchema()` and strips `$schema`. Used by `tool()`,
  `toolsFromRegistry()`, and `buildToolkitEntries()`.
- `buildToolkitEntries(pluginName, registry, opts?)` — converts a
  plugin's internal `ToolRegistry` into a keyed record of `ToolkitEntry`
  markers, honoring `prefix` / `only` / `except` / `rename`.

### MCP client

- `AppKitMcpClient` — minimal JSON-RPC 2.0 client over SSE, zero deps.
  Handles auth refresh, per-server connection pooling, and tool
  definition aggregation.
- `resolveHostedTools()` — maps `HostedTool` configs to Databricks MCP
  endpoint URLs.

### ToolProvider surfaces on core plugins

- **analytics** — `query` tool (Zod-typed, asUser dispatch)
- **files** — per-volume tool family: `${volumeKey}.{list,read,exists,metadata,upload,delete}` (dynamically named from the plugin's volume config)
- **genie** — per-space tool family: `${alias}.{sendMessage,getConversation}` (dynamically named from the plugin's spaces config)
- **lakebase** — `query` tool

Each plugin gains `getAgentTools()` + `executeAgentTool()` satisfying
the `ToolProvider` interface, plus a `.toolkit(opts?)` method that
returns a record of `ToolkitEntry` markers for later spread into agent
definitions.

### Test plan

- 58 new tests across tool primitives + plugin ToolProvider surfaces
- Full appkit vitest suite: 1212 tests passing
- Typecheck clean
- Build clean, publint clean

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 packages/appkit/src/index.ts                  |  24 ++
 .../src/plugins/agents/build-toolkit.ts       |  62 ++++
 .../agents/tests/build-toolkit.test.ts        |  75 +++++
 .../plugins/agents/tests/define-tool.test.ts  | 133 +++++++++
 .../agents/tests/function-tool.test.ts        | 110 +++++++
 .../plugins/agents/tests/hosted-tools.test.ts | 131 +++++++++
 .../agents/tests/mcp-server-helper.test.ts    |  34 +++
 .../src/plugins/agents/tests/tool.test.ts     | 110 +++++++
 .../src/plugins/agents/tools/define-tool.ts   |  84 ++++++
 .../src/plugins/agents/tools/function-tool.ts |  33 +++
 .../src/plugins/agents/tools/hosted-tools.ts  | 102 +++++++
 .../appkit/src/plugins/agents/tools/index.ts  |  20 ++
 .../src/plugins/agents/tools/json-schema.ts   |  22 ++
 .../src/plugins/agents/tools/mcp-client.ts    | 278 ++++++++++++++++++
 .../appkit/src/plugins/agents/tools/tool.ts   |  53 ++++
 packages/appkit/src/plugins/agents/types.ts   |  47 +++
 .../appkit/src/plugins/analytics/analytics.ts |  50 +++-
 .../plugins/analytics/tests/analytics.test.ts |  18 ++
 packages/appkit/src/plugins/files/plugin.ts   | 108 ++++++-
 .../src/plugins/files/tests/plugin.test.ts    |  56 ++++
 packages/appkit/src/plugins/genie/genie.ts    |  81 ++++-
 .../src/plugins/genie/tests/genie.test.ts     |  24 ++
 .../appkit/src/plugins/lakebase/lakebase.ts   |  54 +++-
 23 files changed, 1703 insertions(+), 6 deletions(-)
 create mode 100644 packages/appkit/src/plugins/agents/build-toolkit.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/build-toolkit.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/define-tool.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/function-tool.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/hosted-tools.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/mcp-server-helper.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/tool.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tools/define-tool.ts
 create mode 100644 packages/appkit/src/plugins/agents/tools/function-tool.ts
 create mode 100644 packages/appkit/src/plugins/agents/tools/hosted-tools.ts
 create mode 100644 packages/appkit/src/plugins/agents/tools/index.ts
 create mode 100644 packages/appkit/src/plugins/agents/tools/json-schema.ts
 create mode 100644 packages/appkit/src/plugins/agents/tools/mcp-client.ts
 create mode 100644 packages/appkit/src/plugins/agents/tools/tool.ts
 create mode 100644 packages/appkit/src/plugins/agents/types.ts

diff --git a/packages/appkit/src/index.ts b/packages/appkit/src/index.ts
index 955bfde6..8d236780 100644
--- a/packages/appkit/src/index.ts
+++ b/packages/appkit/src/index.ts
@@ -7,11 +7,20 @@
 
 // Types from shared
 export type {
+  AgentAdapter,
+  AgentEvent,
+  AgentInput,
+  AgentRunContext,
+  AgentToolDefinition,
   BasePluginConfig,
   CacheConfig,
   IAppRouter,
+  Message,
   PluginData,
   StreamExecutionSettings,
+  Thread,
+  ThreadStore,
+  ToolProvider,
 } from "shared";
 export { isSQLTypeMarker, sql } from "shared";
 export { CacheManager } from "./cache";
@@ -54,6 +63,21 @@ export {
   toPlugin,
 } from "./plugin";
 export { analytics, files, genie, lakebase, server, serving } from "./plugins";
+export {
+  type AgentTool,
+  isToolkitEntry,
+  type ToolkitEntry,
+  type ToolkitOptions,
+} from "./plugins/agents/types";
+export {
+  type FunctionTool,
+  type HostedTool,
+  isFunctionTool,
+  isHostedTool,
+  mcpServer,
+  type ToolConfig,
+  tool,
+} from "./plugins/agents/tools";
 export type {
   EndpointConfig,
   ServingEndpointEntry,
diff --git a/packages/appkit/src/plugins/agents/build-toolkit.ts b/packages/appkit/src/plugins/agents/build-toolkit.ts
new file mode 100644
index 00000000..540fec25
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/build-toolkit.ts
@@ -0,0 +1,62 @@
+import type { AgentToolDefinition } from "shared";
+import type { ToolRegistry } from "./tools/define-tool";
+import { toToolJSONSchema } from "./tools/json-schema";
+import type { ToolkitEntry, ToolkitOptions } from "./types";
+
+/**
+ * Converts a plugin's internal `ToolRegistry` into a keyed record of
+ * `ToolkitEntry` markers suitable for spreading into an `AgentDefinition.tools`
+ * record.
+ *
+ * The `opts` record controls shape and filtering:
+ * - `prefix` — overrides the default `${pluginName}.` prefix; `""` drops it.
+ * - `only` — allowlist of local (unprefixed) registry keys to include.
+ * - `except` — denylist of local (unprefixed) registry keys.
+ * - `rename` — local name → full output key; replaces the prefixed key.
+ *
+ * Each entry carries `pluginName` + `localName` so the agents plugin can
+ * dispatch back through `PluginContext.executeTool` for OBO + telemetry.
+ */
+export function buildToolkitEntries(
+  pluginName: string,
+  registry: ToolRegistry,
+  opts: ToolkitOptions = {},
+): Record<string, ToolkitEntry> {
+  const prefix = opts.prefix ?? `${pluginName}.`;
+  const only = opts.only ? new Set(opts.only) : null;
+  const except = opts.except ? new Set(opts.except) : null;
+  const rename = opts.rename ?? {};
+
+  const out: Record<string, ToolkitEntry> = {};
+
+  for (const [localName, entry] of Object.entries(registry)) {
+    if (only && !only.has(localName)) continue;
+    if (except?.has(localName)) continue;
+
+    const keyAfterPrefix = `${prefix}${localName}`;
+    const key = rename[localName] ?? keyAfterPrefix;
+
+    const parameters = toToolJSONSchema(
+      entry.schema,
+    ) as unknown as AgentToolDefinition["parameters"];
+
+    const def: AgentToolDefinition = {
+      name: key,
+      description: entry.description,
+      parameters,
+    };
+    if (entry.annotations) {
+      def.annotations = entry.annotations;
+    }
+
+    out[key] = {
+      __toolkitRef: true,
+      pluginName,
+      localName,
+      def,
+      annotations: entry.annotations,
+    };
+  }
+
+  return out;
+}
diff --git a/packages/appkit/src/plugins/agents/tests/build-toolkit.test.ts b/packages/appkit/src/plugins/agents/tests/build-toolkit.test.ts
new file mode 100644
index 00000000..b1b6a60c
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/build-toolkit.test.ts
@@ -0,0 +1,75 @@
+import { describe, expect, test } from "vitest";
+import { z } from "zod";
+import { buildToolkitEntries } from "../build-toolkit";
+import { defineTool, type ToolRegistry } from "../tools/define-tool";
+import { isToolkitEntry } from "../types";
+
+const registry: ToolRegistry = {
+  query: defineTool({
+    description: "Run a query",
+    schema: z.object({ sql: z.string() }),
+    handler: () => "ok",
+  }),
+  history: defineTool({
+    description: "Get query history",
+    schema: z.object({}),
+    handler: () => [],
+  }),
+};
+
+describe("buildToolkitEntries", () => {
+  test("produces ToolkitEntry per registry item with default dotted prefix", () => {
+    const entries = buildToolkitEntries("analytics", registry);
+    expect(Object.keys(entries).sort()).toEqual([
+      "analytics.history",
+      "analytics.query",
+    ]);
+    for (const entry of Object.values(entries)) {
+      expect(isToolkitEntry(entry)).toBe(true);
+      expect(entry.pluginName).toBe("analytics");
+    }
+  });
+
+  test("respects prefix option (empty drops the namespace)", () => {
+    const entries = buildToolkitEntries("analytics", registry, { prefix: "" });
+    expect(Object.keys(entries).sort()).toEqual(["history", "query"]);
+  });
+
+  test("respects custom prefix", () => {
+    const entries = buildToolkitEntries("analytics", registry, {
+      prefix: "db.",
+    });
+    expect(Object.keys(entries).sort()).toEqual(["db.history", "db.query"]);
+  });
+
+  test("only filter keeps the listed local names", () => {
+    const entries = buildToolkitEntries("analytics", registry, {
+      only: ["query"],
+    });
+    expect(Object.keys(entries)).toEqual(["analytics.query"]);
+  });
+
+  test("except filter drops the listed local names", () => {
+    const entries = buildToolkitEntries("analytics", registry, {
+      except: ["history"],
+    });
+    expect(Object.keys(entries)).toEqual(["analytics.query"]);
+  });
+
+  test("rename remaps specific local names (overrides the prefix key)", () => {
+    const entries = buildToolkitEntries("analytics", registry, {
+      rename: { query: "sql" },
+    });
+    expect(Object.keys(entries).sort()).toEqual(["analytics.history", "sql"]);
+  });
+
+  test("exposes the original plugin+local name so dispatch can route", () => {
+    const entries = buildToolkitEntries("analytics", registry, {
+      prefix: "db.",
+    });
+    const qEntry = entries["db.query"];
+    expect(qEntry.pluginName).toBe("analytics");
+    expect(qEntry.localName).toBe("query");
+    expect(qEntry.def.name).toBe("db.query");
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/define-tool.test.ts b/packages/appkit/src/plugins/agents/tests/define-tool.test.ts
new file mode 100644
index 00000000..ef61e8c4
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/define-tool.test.ts
@@ -0,0 +1,133 @@
+import { describe, expect, test, vi } from "vitest";
+import { z } from "zod";
+import {
+  defineTool,
+  executeFromRegistry,
+  type ToolRegistry,
+  toolsFromRegistry,
+} from "../tools/define-tool";
+
+describe("defineTool()", () => {
+  test("returns an entry matching the input config", () => {
+    const entry = defineTool({
+      description: "echo",
+      schema: z.object({ msg: z.string() }),
+      annotations: { readOnly: true },
+      handler: ({ msg }) => msg,
+    });
+
+    expect(entry.description).toBe("echo");
+    expect(entry.annotations).toEqual({ readOnly: true });
+    expect(typeof entry.handler).toBe("function");
+  });
+});
+
+describe("executeFromRegistry", () => {
+  const registry: ToolRegistry = {
+    echo: defineTool({
+      description: "echo",
+      schema: z.object({ msg: z.string() }),
+      handler: ({ msg }) => `got ${msg}`,
+    }),
+  };
+
+  test("validates args and calls handler on success", async () => {
+    const result = await executeFromRegistry(registry, "echo", { msg: "hi" });
+    expect(result).toBe("got hi");
+  });
+
+  test("returns formatted error string on validation failure", async () => {
+    const result = await executeFromRegistry(registry, "echo", {});
+    expect(typeof result).toBe("string");
+    expect(result).toContain("Invalid arguments for echo");
+    expect(result).toContain("msg");
+  });
+
+  test("throws for unknown tool names", async () => {
+    await expect(executeFromRegistry(registry, "missing", {})).rejects.toThrow(
+      /Unknown tool: missing/,
+    );
+  });
+
+  test("forwards AbortSignal to the handler", async () => {
+    const handler = vi.fn(async (_args: { x: string }, signal?: AbortSignal) =>
+      signal?.aborted ? "aborted" : "ok",
+    );
+    const reg: ToolRegistry = {
+      t: defineTool({
+        description: "t",
+        schema: z.object({ x: z.string() }),
+        handler,
+      }),
+    };
+
+    const controller = new AbortController();
+    controller.abort();
+    await executeFromRegistry(reg, "t", { x: "hi" }, controller.signal);
+
+    expect(handler).toHaveBeenCalledTimes(1);
+    expect(handler.mock.calls[0][1]).toBe(controller.signal);
+  });
+});
+
+describe("toolsFromRegistry", () => {
+  test("produces AgentToolDefinition[] with JSON Schema parameters", () => {
+    const registry: ToolRegistry = {
+      query: defineTool({
+        description: "Execute a SQL query",
+        schema: z.object({
+          query: z.string().describe("SQL query"),
+        }),
+        annotations: { readOnly: true, requiresUserContext: true },
+        handler: () => "ok",
+      }),
+    };
+
+    const defs = toolsFromRegistry(registry);
+    expect(defs).toHaveLength(1);
+    expect(defs[0].name).toBe("query");
+    expect(defs[0].description).toBe("Execute a SQL query");
+    expect(defs[0].parameters).toMatchObject({
+      type: "object",
+      properties: {
+        query: { type: "string", description: "SQL query" },
+      },
+      required: ["query"],
+    });
+    expect(defs[0].annotations).toEqual({
+      readOnly: true,
+      requiresUserContext: true,
+    });
+  });
+
+  test("preserves dotted names like uploads.list from the registry keys", () => {
+    const registry: ToolRegistry = {
+      "uploads.list": defineTool({
+        description: "list uploads",
+        schema: z.object({}),
+        handler: () => [],
+      }),
+      "documents.list": defineTool({
+        description: "list documents",
+        schema: z.object({}),
+        handler: () => [],
+      }),
+    };
+
+    const names = toolsFromRegistry(registry).map((d) => d.name);
+    expect(names).toContain("uploads.list");
+    expect(names).toContain("documents.list");
+  });
+
+  test("omits annotations when none are provided", () => {
+    const registry: ToolRegistry = {
+      plain: defineTool({
+        description: "plain",
+        schema: z.object({}),
+        handler: () => "ok",
+      }),
+    };
+    const [def] = toolsFromRegistry(registry);
+    expect(def.annotations).toBeUndefined();
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/function-tool.test.ts b/packages/appkit/src/plugins/agents/tests/function-tool.test.ts
new file mode 100644
index 00000000..8e668d69
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/function-tool.test.ts
@@ -0,0 +1,110 @@
+import { describe, expect, test } from "vitest";
+import {
+  functionToolToDefinition,
+  isFunctionTool,
+} from "../tools/function-tool";
+
+describe("isFunctionTool", () => {
+  test("returns true for valid FunctionTool", () => {
+    expect(
+      isFunctionTool({
+        type: "function",
+        name: "greet",
+        execute: async () => "hello",
+      }),
+    ).toBe(true);
+  });
+
+  test("returns true for minimal FunctionTool", () => {
+    expect(
+      isFunctionTool({
+        type: "function",
+        name: "x",
+        execute: () => "y",
+      }),
+    ).toBe(true);
+  });
+
+  test("returns false for null", () => {
+    expect(isFunctionTool(null)).toBe(false);
+  });
+
+  test("returns false for non-object", () => {
+    expect(isFunctionTool("function")).toBe(false);
+  });
+
+  test("returns false for wrong type", () => {
+    expect(
+      isFunctionTool({
+        type: "genie-space",
+        name: "x",
+        execute: () => "y",
+      }),
+    ).toBe(false);
+  });
+
+  test("returns false when execute is missing", () => {
+    expect(isFunctionTool({ type: "function", name: "x" })).toBe(false);
+  });
+
+  test("returns false when name is missing", () => {
+    expect(isFunctionTool({ type: "function", execute: () => "y" })).toBe(
+      false,
+    );
+  });
+});
+
+describe("functionToolToDefinition", () => {
+  test("converts a FunctionTool with all fields", () => {
+    const def = functionToolToDefinition({
+      type: "function",
+      name: "getWeather",
+      description: "Get current weather",
+      parameters: {
+        type: "object",
+        properties: { city: { type: "string" } },
+        required: ["city"],
+      },
+      execute: async () => "sunny",
+    });
+
+    expect(def.name).toBe("getWeather");
+    expect(def.description).toBe("Get current weather");
+    expect(def.parameters).toEqual({
+      type: "object",
+      properties: { city: { type: "string" } },
+      required: ["city"],
+    });
+  });
+
+  test("uses name as fallback description", () => {
+    const def = functionToolToDefinition({
+      type: "function",
+      name: "myTool",
+      execute: async () => "result",
+    });
+
+    expect(def.description).toBe("myTool");
+  });
+
+  test("uses empty object schema when parameters are null", () => {
+    const def = functionToolToDefinition({
+      type: "function",
+      name: "noParams",
+      parameters: null,
+      execute: async () => "ok",
+    });
+
+    expect(def.parameters).toEqual({ type: "object", properties: {} });
+  });
+
+  test("uses empty object schema when parameters are omitted", () => {
+    const def = functionToolToDefinition({
+      type: "function",
+      name: "noParams",
+      execute: async () => "ok",
+    });
+
+    expect(def.parameters).toEqual({ type: "object", properties: {} });
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/hosted-tools.test.ts b/packages/appkit/src/plugins/agents/tests/hosted-tools.test.ts
new file mode 100644
index 00000000..d62b266b
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/hosted-tools.test.ts
@@ -0,0 +1,131 @@
+import { describe, expect, test } from "vitest";
+import { isHostedTool, resolveHostedTools } from "../tools/hosted-tools";
+
+describe("isHostedTool", () => {
+  test("returns true for genie-space", () => {
+    expect(
+      isHostedTool({ type: "genie-space", genie_space: { id: "abc" } }),
+    ).toBe(true);
+  });
+
+  test("returns true for vector_search_index", () => {
+    expect(
+      isHostedTool({
+        type: "vector_search_index",
+        vector_search_index: { name: "cat.schema.idx" },
+      }),
+    ).toBe(true);
+  });
+
+  test("returns true for custom_mcp_server", () => {
+    expect(
+      isHostedTool({
+        type: "custom_mcp_server",
+        custom_mcp_server: { app_name: "my-app", app_url: "my-app-url" },
+      }),
+    ).toBe(true);
+  });
+
+  test("returns true for external_mcp_server", () => {
+    expect(
+      isHostedTool({
+        type: "external_mcp_server",
+        external_mcp_server: { connection_name: "conn1" },
+      }),
+    ).toBe(true);
+  });
+
+  test("returns false for FunctionTool", () => {
+    expect(
+      isHostedTool({ type: "function", name: "x", execute: () => "y" }),
+    ).toBe(false);
+  });
+
+  test("returns false for null", () => {
+    expect(isHostedTool(null)).toBe(false);
+  });
+
+  test("returns false for unknown type", () => {
+    expect(isHostedTool({ type: "unknown" })).toBe(false);
+  });
+
+  test("returns false for non-object", () => {
+    expect(isHostedTool(42)).toBe(false);
+  });
+});
+
+describe("resolveHostedTools", () => {
+  test("resolves genie-space to correct MCP endpoint", () => {
+    const configs = resolveHostedTools([
+      { type: "genie-space", genie_space: { id: "space123" } },
+    ]);
+
+    expect(configs).toHaveLength(1);
+    expect(configs[0].name).toBe("genie-space123");
+    expect(configs[0].url).toBe("/api/2.0/mcp/genie/space123");
+  });
+
+  test("resolves vector_search_index with 3-part name", () => {
+    const configs = resolveHostedTools([
+      {
+        type: "vector_search_index",
+        vector_search_index: { name: "catalog.schema.my_index" },
+      },
+    ]);
+
+    expect(configs).toHaveLength(1);
+    expect(configs[0].name).toBe("vs-catalog-schema-my_index");
+    expect(configs[0].url).toBe(
+      "/api/2.0/mcp/vector-search/catalog/schema/my_index",
+    );
+  });
+
+  test("throws for invalid vector_search_index name", () => {
+    expect(() =>
+      resolveHostedTools([
+        {
+          type: "vector_search_index",
+          vector_search_index: { name: "bad.name" },
+        },
+      ]),
+    ).toThrow("3-part dotted");
+  });
+
+  test("resolves custom_mcp_server", () => {
+    const configs = resolveHostedTools([
+      {
+        type: "custom_mcp_server",
+        custom_mcp_server: { app_name: "my-app", app_url: "my-app-endpoint" },
+      },
+    ]);
+
+    expect(configs[0].name).toBe("my-app");
+    expect(configs[0].url).toBe("my-app-endpoint");
+  });
+
+  test("resolves external_mcp_server", () => {
+    const configs = resolveHostedTools([
+      {
+        type: "external_mcp_server",
+        external_mcp_server: { connection_name: "conn1" },
+      },
+    ]);
+
+    expect(configs[0].name).toBe("conn1");
+    expect(configs[0].url).toBe("/api/2.0/mcp/external/conn1");
+  });
+
+  test("resolves multiple tools preserving order", () => {
+    const configs = resolveHostedTools([
+      { type: "genie-space", genie_space: { id: "g1" } },
+      {
+        type: "external_mcp_server",
+        external_mcp_server: { connection_name: "e1" },
+      },
+    ]);
+
+    expect(configs).toHaveLength(2);
+    expect(configs[0].name).toBe("genie-g1");
+    expect(configs[1].name).toBe("e1");
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/mcp-server-helper.test.ts b/packages/appkit/src/plugins/agents/tests/mcp-server-helper.test.ts
new file mode 100644
index 00000000..96ad8e38
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/mcp-server-helper.test.ts
@@ -0,0 +1,34 @@
+import { describe, expect, test } from "vitest";
+import {
+  isHostedTool,
+  mcpServer,
+  resolveHostedTools,
+} from "../tools/hosted-tools";
+
+describe("mcpServer()", () => {
+  test("returns a CustomMcpServerTool with correct shape", () => {
+    const result = mcpServer("my-app", "https://example.com/mcp");
+
+    expect(result).toEqual({
+      type: "custom_mcp_server",
+      custom_mcp_server: {
+        app_name: "my-app",
+        app_url: "https://example.com/mcp",
+      },
+    });
+  });
+
+  test("isHostedTool recognizes mcpServer() output", () => {
+    expect(isHostedTool(mcpServer("x", "y"))).toBe(true);
+  });
+
+  test("resolveHostedTools resolves mcpServer() output to an endpoint config", () => {
+    const configs = resolveHostedTools([
+      mcpServer("vector-search", "https://host/mcp/vs"),
+    ]);
+
+    expect(configs).toHaveLength(1);
+    expect(configs[0].name).toBe("vector-search");
+    expect(configs[0].url).toBe("https://host/mcp/vs");
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/tool.test.ts b/packages/appkit/src/plugins/agents/tests/tool.test.ts
new file mode 100644
index 00000000..3d47f3a9
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/tool.test.ts
@@ -0,0 +1,110 @@
+import { describe, expect, test } from "vitest";
+import { z } from "zod";
+import { formatZodError, tool } from "../tools/tool";
+
+describe("tool()", () => {
+  test("produces a FunctionTool with JSON Schema parameters from the Zod schema", () => {
+    const weather = tool({
+      name: "get_weather",
+      description: "Get the current weather for a city",
+      schema: z.object({
+        city: z.string().describe("City name"),
+      }),
+      execute: async ({ city }) => `Sunny in ${city}`,
+    });
+
+    expect(weather.type).toBe("function");
+    expect(weather.name).toBe("get_weather");
+    expect(weather.description).toBe("Get the current weather for a city");
+    expect(weather.parameters).toMatchObject({
+      type: "object",
+      properties: {
+        city: { type: "string", description: "City name" },
+      },
+      required: ["city"],
+    });
+  });
+
+  test("execute receives typed args on valid input", async () => {
+    const echo = tool({
+      name: "echo",
+      schema: z.object({ message: z.string() }),
+      execute: async ({ message }) => {
+        const _typed: string = message;
+        return `got ${_typed}`;
+      },
+    });
+
+    const result = await echo.execute({ message: "hi" });
+    expect(result).toBe("got hi");
+  });
+
+  test("returns formatted error string (does not throw) when args are invalid", async () => {
+    const weather = tool({
+      name: "get_weather",
+      schema: z.object({ city: z.string() }),
+      execute: async ({ city }) => `Sunny in ${city}`,
+    });
+
+    const result = await weather.execute({});
+    expect(typeof result).toBe("string");
+    expect(result).toContain("Invalid arguments for get_weather");
+    expect(result).toContain("city");
+  });
+
+  test("joins multiple validation errors with '; '", async () => {
+    const t = tool({
+      name: "multi",
+      schema: z.object({ a: z.string(), b: z.number() }),
+      execute: async () => "ok",
+    });
+
+    const result = await t.execute({});
+    expect(result).toContain("a:");
+    expect(result).toContain("b:");
+    expect(result).toContain(";");
+  });
+
+  test("optional fields validate when absent", async () => {
+    const t = tool({
+      name: "opt",
+      schema: z.object({ note: z.string().optional() }),
+      execute: async ({ note }) => note ?? "(no note)",
+    });
+
+    expect(await t.execute({})).toBe("(no note)");
+    expect(await t.execute({ note: "hello" })).toBe("hello");
+  });
+
+  test("description falls back to the tool name when omitted", () => {
+    const t = tool({
+      name: "my_tool",
+      schema: z.object({}),
+      execute: async () => "ok",
+    });
+
+    expect(t.description).toBe("my_tool");
+    expect(t.parameters).toBeDefined();
+  });
+});
+
+describe("formatZodError", () => {
+  test("formats a single issue with the tool name", () => {
+    const schema = z.object({ city: z.string() });
+    const result = schema.safeParse({});
+    if (result.success) throw new Error("expected failure");
+
+    const msg = formatZodError(result.error, "get_weather");
+    expect(msg).toMatch(/^Invalid arguments for get_weather: /);
+    expect(msg).toContain("city:");
+  });
+
+  test("joins multiple issues with '; '", () => {
+    const schema = z.object({ a: z.string(), b: z.number() });
+    const result = schema.safeParse({});
+    if (result.success) throw new Error("expected failure");
+
+    const msg = formatZodError(result.error, "t");
+    expect(msg.split(";").length).toBeGreaterThanOrEqual(2);
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tools/define-tool.ts b/packages/appkit/src/plugins/agents/tools/define-tool.ts
new file mode 100644
index 00000000..bcefceef
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tools/define-tool.ts
@@ -0,0 +1,84 @@
+import type { AgentToolDefinition, ToolAnnotations } from "shared";
+import type { z } from "zod";
+import { toToolJSONSchema } from "./json-schema";
+import { formatZodError } from "./tool";
+
+/**
+ * Single-tool entry for a plugin's internal tool registry.
+ *
+ * Plugins collect these into a `Record<string, ToolEntry>` keyed by the tool's
+ * public name and dispatch via `executeFromRegistry`.
+ */
+export interface ToolEntry<S extends z.ZodType = z.ZodType> {
+  description: string;
+  schema: S;
+  annotations?: ToolAnnotations;
+  handler: (
+    args: z.infer<S>,
+    signal?: AbortSignal,
+  ) => unknown | Promise<unknown>;
+}
+
+export type ToolRegistry = Record<string, ToolEntry>;
+
+/**
+ * Defines a single tool entry for a plugin's internal registry.
+ *
+ * The generic `S` flows from `schema` through to the `handler` callback so
+ * `args` is fully typed from the Zod schema. Names are assigned by the
+ * registry key, so they are not repeated inside the entry.
+ */
+export function defineTool<S extends z.ZodType>(
+  config: ToolEntry<S>,
+): ToolEntry<S> {
+  return config;
+}
+
+/**
+ * Validates `args` against the named entry's schema, then invokes its handler.
+ * Invalid args return an LLM-friendly error string (as `tool()` does) instead
+ * of throwing, so the model can self-correct on its next turn. Throws
+ * `Unknown tool: <name>` when `name` is not an own key of `registry`.
+ */
+export async function executeFromRegistry(
+  registry: ToolRegistry,
+  name: string,
+  args: unknown,
+  signal?: AbortSignal,
+): Promise<unknown> {
+  // Own-property check: inherited keys (e.g. "toString") are not tools.
+  const known = Object.prototype.hasOwnProperty.call(registry, name);
+  const entry = known ? registry[name] : undefined;
+  if (!entry) throw new Error(`Unknown tool: ${name}`);
+  const parsed = entry.schema.safeParse(args);
+  if (!parsed.success) {
+    return formatZodError(parsed.error, name);
+  }
+  return entry.handler(parsed.data, signal);
+}
+
+/**
+ * Produces the `AgentToolDefinition[]` a ToolProvider exposes to the LLM,
+ * deriving `parameters` JSON Schema from each entry's Zod schema.
+ *
+ * Tool names come from registry keys (supports dotted names like
+ * `uploads.list` for dynamic plugins).
+ */
+export function toolsFromRegistry(
+  registry: ToolRegistry,
+): AgentToolDefinition[] {
+  return Object.entries(registry).map(([name, entry]) => {
+    const parameters = toToolJSONSchema(
+      entry.schema,
+    ) as unknown as AgentToolDefinition["parameters"];
+    const def: AgentToolDefinition = {
+      name,
+      description: entry.description,
+      parameters,
+    };
+    if (entry.annotations) {
+      def.annotations = entry.annotations;
+    }
+    return def;
+  });
+}
diff --git a/packages/appkit/src/plugins/agents/tools/function-tool.ts b/packages/appkit/src/plugins/agents/tools/function-tool.ts
new file mode 100644
index 00000000..8ce634e0
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tools/function-tool.ts
@@ -0,0 +1,33 @@
+import type { AgentToolDefinition } from "shared";
+
+export interface FunctionTool {
+  type: "function"; // discriminant; isFunctionTool() requires exactly this value
+  name: string;
+  description?: string | null; // functionToolToDefinition() falls back to `name`
+  parameters?: Record<string, unknown> | null; // absent -> empty object schema there
+  strict?: boolean | null; // NOTE(review): not read in this file — confirm consumer
+  execute: (args: Record<string, unknown>) => Promise<string> | string;
+}
+
+/** Type guard for `FunctionTool`; checks only `type`, `name` and `execute`. */
+export function isFunctionTool(value: unknown): value is FunctionTool {
+  // `typeof null` is "object", hence the explicit null test.
+  if (value === null || typeof value !== "object") return false;
+  const candidate = value as Record<string, unknown>;
+  if (candidate.type !== "function") return false;
+  if (typeof candidate.name !== "string") return false;
+  return typeof candidate.execute === "function";
+}
+
+/** Converts a `FunctionTool` into its LLM definition; a missing description
+ * falls back to the name and missing parameters to an empty object schema. */
+export function functionToolToDefinition(
+  tool: FunctionTool,
+): AgentToolDefinition {
+  const declared = tool.parameters as AgentToolDefinition["parameters"];
+  return {
+    name: tool.name,
+    description: tool.description ?? tool.name,
+    parameters: declared ?? { type: "object", properties: {} },
+  };
+}
diff --git a/packages/appkit/src/plugins/agents/tools/hosted-tools.ts b/packages/appkit/src/plugins/agents/tools/hosted-tools.ts
new file mode 100644
index 00000000..bce70c4f
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tools/hosted-tools.ts
@@ -0,0 +1,102 @@
+export interface GenieTool {
+  type: "genie-space"; // NOTE(review): hyphenated, unlike the snake_case siblings — confirm
+  genie_space: { id: string }; // resolved to /api/2.0/mcp/genie/<id>
+}
+
+export interface VectorSearchIndexTool {
+  type: "vector_search_index";
+  vector_search_index: { name: string }; // must be `catalog.schema.index`
+}
+
+export interface CustomMcpServerTool {
+  type: "custom_mcp_server";
+  custom_mcp_server: { app_name: string; app_url: string }; // app_url is used as-is
+}
+
+export interface ExternalMcpServerTool {
+  type: "external_mcp_server";
+  external_mcp_server: { connection_name: string }; // -> /api/2.0/mcp/external/<name>
+}
+
+export type HostedTool =
+  | GenieTool
+  | VectorSearchIndexTool
+  | CustomMcpServerTool
+  | ExternalMcpServerTool;
+
+const HOSTED_TOOL_TYPES: ReadonlySet<string> = new Set([
+  "genie-space",
+  "vector_search_index",
+  "custom_mcp_server",
+  "external_mcp_server",
+]);
+
+export function isHostedTool(value: unknown): value is HostedTool {
+  if (value === null || typeof value !== "object") return false;
+  const { type } = value as Record<string, unknown>; // only `type` is inspected
+  return typeof type === "string" && HOSTED_TOOL_TYPES.has(type);
+}
+
+export interface McpEndpointConfig {
+  name: string; // connection key; also the <server> part of `mcp.<server>.<tool>`
+  /** Absolute URL or path relative to workspace host */
+  url: string;
+}
+
+/**
+ * Resolves a HostedTool into an MCP endpoint, percent-encoding identifiers
+ * used as URL path segments. Throws on a malformed vector search index name.
+ */
+function resolveHostedTool(tool: HostedTool): McpEndpointConfig {
+  switch (tool.type) {
+    case "genie-space":
+      return {
+        name: `genie-${tool.genie_space.id}`,
+        url: `/api/2.0/mcp/genie/${encodeURIComponent(tool.genie_space.id)}`,
+      };
+    case "vector_search_index": {
+      const parts = tool.vector_search_index.name.split(".");
+      if (parts.length !== 3 || parts.includes("")) { // "a..b" has 3 parts, one empty
+        throw new Error(
+          `vector_search_index name must be 3-part dotted (catalog.schema.index), got: ${tool.vector_search_index.name}`,
+        );
+      }
+      return {
+        name: `vs-${parts.join("-")}`,
+        url: `/api/2.0/mcp/vector-search/${parts.map((p) => encodeURIComponent(p)).join("/")}`,
+      };
+    }
+    case "custom_mcp_server":
+      return {
+        name: tool.custom_mcp_server.app_name,
+        url: tool.custom_mcp_server.app_url,
+      };
+    case "external_mcp_server":
+      return {
+        name: tool.external_mcp_server.connection_name,
+        url: `/api/2.0/mcp/external/${encodeURIComponent(tool.external_mcp_server.connection_name)}`,
+      };
+  }
+}
+
+export function resolveHostedTools(tools: HostedTool[]): McpEndpointConfig[] {
+  return tools.map((hosted) => resolveHostedTool(hosted)); // one endpoint per tool, same order
+}
+
+/**
+ * Shorthand for a custom MCP server tool config.
+ *
+ * `mcpServer(name, url)` builds the same object as writing
+ * `{ type: "custom_mcp_server", custom_mcp_server: { app_name, app_url } }`
+ * by hand, with `name` as `app_name` and `url` as `app_url`:
+ * ```ts
+ * mcpServer("my-app", "https://my-app.databricksapps.com/mcp")
+ * ```
+ */
+export function mcpServer(name: string, url: string): CustomMcpServerTool {
+  const server: CustomMcpServerTool["custom_mcp_server"] = {
+    app_name: name,
+    app_url: url,
+  };
+  return { type: "custom_mcp_server", custom_mcp_server: server };
+}
diff --git a/packages/appkit/src/plugins/agents/tools/index.ts b/packages/appkit/src/plugins/agents/tools/index.ts
new file mode 100644
index 00000000..7b779d1c
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tools/index.ts
@@ -0,0 +1,20 @@
+export {
+  defineTool,
+  executeFromRegistry,
+  type ToolEntry,
+  type ToolRegistry,
+  toolsFromRegistry,
+} from "./define-tool";
+export {
+  type FunctionTool,
+  functionToolToDefinition,
+  isFunctionTool,
+} from "./function-tool";
+export {
+  type HostedTool,
+  isHostedTool,
+  mcpServer,
+  resolveHostedTools,
+} from "./hosted-tools";
+export { AppKitMcpClient } from "./mcp-client";
+export { type ToolConfig, tool } from "./tool";
diff --git a/packages/appkit/src/plugins/agents/tools/json-schema.ts b/packages/appkit/src/plugins/agents/tools/json-schema.ts
new file mode 100644
index 00000000..805fd48f
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tools/json-schema.ts
@@ -0,0 +1,22 @@
+import { toJSONSchema, type z } from "zod";
+
+/**
+ * Produces the JSON Schema placed in an LLM tool definition's `parameters`
+ * field from a Zod schema.
+ *
+ * This is `zod`'s `toJSONSchema()` minus the top-level `$schema` key that
+ * Zod v4 adds by default (e.g. `"https://json-schema.org/draft/..."`). The
+ * Databricks Mosaic serving endpoint forwards tool schemas to Google's Gemini
+ * `function_declarations` format, which rejects unrecognized top-level keys
+ * such as `$schema` with a 400
+ * `Invalid JSON payload received. Unknown name "$schema"` error. Other LLM
+ * providers either ignore the key or also reject it, so removing it is safe
+ * across backends.
+ */
+export function toToolJSONSchema(
+  schema: z.ZodType,
+): Record<string, unknown> {
+  const jsonSchema = { ...(toJSONSchema(schema) as Record<string, unknown>) };
+  delete jsonSchema.$schema;
+  return jsonSchema;
+}
diff --git a/packages/appkit/src/plugins/agents/tools/mcp-client.ts b/packages/appkit/src/plugins/agents/tools/mcp-client.ts
new file mode 100644
index 00000000..bd96d348
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tools/mcp-client.ts
@@ -0,0 +1,278 @@
+import type { AgentToolDefinition } from "shared";
+import { createLogger } from "../../../logging/logger";
+import type { McpEndpointConfig } from "./hosted-tools";
+
+const logger = createLogger("agent:mcp");
+
+interface JsonRpcRequest {
+  jsonrpc: "2.0";
+  id: number; // sendRpc() assigns ++requestId, so ids are unique per client
+  method: string;
+  params?: Record<string, unknown>; // left out of the request when not provided
+}
+
+interface JsonRpcResponse {
+  jsonrpc: "2.0";
+  id: number;
+  result?: unknown;
+  error?: { code: number; message: string; data?: unknown }; // sendRpc() throws on this
+}
+
+interface McpToolSchema {
+  name: string;
+  description?: string; // getAllToolDefinitions() falls back to the tool name
+  inputSchema?: Record<string, unknown>; // exposed as the tool's `parameters`
+}
+
+interface McpToolCallResult {
+  content: Array<{ type: string; text?: string }>; // callTool() reads only "text" items
+  isError?: boolean; // when true, callTool() throws with the joined text
+}
+
+interface McpServerConnection {
+  config: McpEndpointConfig;
+  resolvedUrl: string; // output of resolveUrl() at connect time
+  tools: Map<string, McpToolSchema>; // keyed by tool name, from `tools/list`
+}
+
+/**
+ * Lightweight MCP client for Databricks-hosted MCP servers.
+ *
+ * Uses raw fetch() with JSON-RPC 2.0 over HTTP — no @modelcontextprotocol/sdk
+ * or LangChain dependency. Each request is one POST; the reply is read from
+ * either a JSON body or the last `data:` line of a `text/event-stream` body.
+ */
+export class AppKitMcpClient {
+  private connections = new Map<string, McpServerConnection>();
+  private sessionIds = new Map<string, string>();
+  private requestId = 0;
+  private closed = false;
+
+  constructor(
+    private workspaceHost: string,
+    private authenticate: () => Promise<Record<string, string>>,
+  ) {}
+
+  /** Connects to all endpoints concurrently; failures are logged, not thrown. */
+  async connectAll(endpoints: McpEndpointConfig[]): Promise<void> {
+    const outcomes = await Promise.allSettled(
+      endpoints.map((ep) => this.connect(ep)),
+    );
+    outcomes.forEach((outcome, i) => {
+      if (outcome.status !== "rejected") return;
+      logger.error(
+        "Failed to connect MCP server %s: %O",
+        endpoints[i].name,
+        outcome.reason,
+      );
+    });
+  }
+
+  /** Absolute URLs pass through; relative ones join the host with one "/". */
+  private resolveUrl(endpoint: McpEndpointConfig): string {
+    if (/^https?:\/\//i.test(endpoint.url)) return endpoint.url;
+    const host = this.workspaceHost.replace(/\/+$/, "");
+    return `${host}/${endpoint.url.replace(/^\/+/, "")}`;
+  }
+
+  /**
+   * Runs the MCP handshake with one endpoint (`initialize`, then the
+   * `notifications/initialized` notification), fetches `tools/list`, and
+   * registers the connection under `endpoint.name`. Throws if a request fails.
+   */
+  async connect(endpoint: McpEndpointConfig): Promise<void> {
+    const url = this.resolveUrl(endpoint);
+    logger.info("Connecting to MCP server: %s at %s", endpoint.name, url);
+
+    const { sessionId } = await this.sendRpc(url, "initialize", {
+      protocolVersion: "2025-03-26",
+      capabilities: {},
+      clientInfo: { name: "appkit-agent", version: "0.1.0" },
+    });
+    // Track only the session issued by THIS handshake: on a reconnect a stale
+    // id from the previous session must not be replayed to the server.
+    if (sessionId) {
+      this.sessionIds.set(endpoint.name, sessionId);
+    } else {
+      this.sessionIds.delete(endpoint.name);
+    }
+
+    await this.sendNotification(url, "notifications/initialized", sessionId);
+
+    const listed = await this.sendRpc(url, "tools/list", {}, { sessionId });
+    const toolList =
+      (listed.result as { tools?: McpToolSchema[] } | undefined)?.tools ?? [];
+    const tools = new Map(toolList.map((t) => [t.name, t] as const));
+
+    this.connections.set(endpoint.name, {
+      config: endpoint,
+      resolvedUrl: url,
+      tools,
+    });
+    logger.info(
+      "Connected to MCP server %s: %d tools available",
+      endpoint.name,
+      tools.size,
+    );
+  }
+
+  /** Exposes all connected servers' tools, named `mcp.<server>.<tool>`. */
+  getAllToolDefinitions(): AgentToolDefinition[] {
+    const defs: AgentToolDefinition[] = [];
+    for (const [serverName, { tools }] of this.connections) {
+      for (const [toolName, { description, inputSchema }] of tools) {
+        defs.push({
+          name: `mcp.${serverName}.${toolName}`,
+          description: description ?? toolName,
+          parameters: (inputSchema as AgentToolDefinition["parameters"]) ?? {
+            type: "object",
+            properties: {},
+          },
+        });
+      }
+    }
+    return defs;
+  }
+
+  /**
+   * Calls `mcp.<server>.<tool>` and returns its text content joined by "\n".
+   *
+   * @param authHeaders Sent instead of the headers from `authenticate()`.
+   * @throws On a malformed name, an unconnected server, an RPC failure, a
+   *   result without a `content` array, or a result flagged `isError`.
+   */
+  async callTool(
+    qualifiedName: string,
+    args: unknown,
+    authHeaders?: Record<string, string>,
+  ): Promise<string> {
+    const parts = qualifiedName.split(".");
+    if (parts.length < 3 || parts[0] !== "mcp") {
+      throw new Error(`Invalid MCP tool name: ${qualifiedName}`);
+    }
+    // Server names may contain dots (e.g. a custom MCP app name), so match the
+    // advertised tools first; splitting on "." is only the fallback.
+    const owner = [...this.connections].find(
+      ([server, { tools }]) =>
+        qualifiedName.startsWith(`mcp.${server}.`) &&
+        tools.has(qualifiedName.slice(`mcp.${server}.`.length)),
+    );
+    const serverName = owner?.[0] ?? parts[1];
+    const conn = this.connections.get(serverName);
+    if (!conn) throw new Error(`MCP server not connected: ${serverName}`);
+    const toolName = qualifiedName.slice(`mcp.${serverName}.`.length);
+    const sessionId = this.sessionIds.get(serverName);
+    const { result } = await this.sendRpc(
+      conn.resolvedUrl,
+      "tools/call",
+      { name: toolName, arguments: args },
+      { authOverride: authHeaders, sessionId },
+    );
+    const { content, isError } = (result ?? {}) as Partial<McpToolCallResult>;
+    if (!Array.isArray(content)) {
+      throw new Error(`MCP tool ${qualifiedName} returned no content`);
+    }
+    const text = content
+      .flatMap((part) => (part.type === "text" ? [part.text] : []))
+      .join("\n");
+    if (isError) throw new Error(text || "MCP tool call failed");
+    return text;
+  }
+
+  async close(): Promise<void> {
+    this.closed = true;
+    this.connections.clear();
+    this.sessionIds.clear(); // session ids are per connection; drop them too
+  }
+
+  /**
+   * POSTs one JSON-RPC request and returns its `result` together with the
+   * `mcp-session-id` response header, if any.
+   *
+   * @param options.authOverride Headers sent instead of `authenticate()`'s.
+   * @throws If the client is closed, the HTTP status is not ok, an SSE body
+   *   has no `data:` line, or the reply carries a JSON-RPC `error`.
+   */
+  private async sendRpc(
+    url: string,
+    method: string,
+    params?: Record<string, unknown>,
+    options?: { authOverride?: Record<string, string>; sessionId?: string },
+  ): Promise<{ result: unknown; sessionId?: string }> {
+    if (this.closed) throw new Error("MCP client is closed");
+    const request: JsonRpcRequest = {
+      jsonrpc: "2.0",
+      id: ++this.requestId,
+      method,
+      ...(params && { params }),
+    };
+    const authHeaders = options?.authOverride ?? (await this.authenticate());
+    const headers: Record<string, string> = {
+      "Content-Type": "application/json",
+      Accept: "application/json, text/event-stream",
+      ...authHeaders,
+      ...(options?.sessionId ? { "Mcp-Session-Id": options.sessionId } : {}),
+    };
+
+    const response = await fetch(url, {
+      method: "POST",
+      headers,
+      body: JSON.stringify(request),
+      signal: AbortSignal.timeout(30_000),
+    });
+    if (!response.ok) {
+      throw new Error(
+        `MCP request to ${method} failed: ${response.status} ${response.statusText}`,
+      );
+    }
+
+    let json: JsonRpcResponse;
+    const contentType = response.headers.get("content-type") ?? "";
+    if (contentType.includes("text/event-stream")) {
+      // SSE allows CRLF line endings and makes the space after "data:"
+      // optional, so both spellings are accepted.
+      const lastData = (await response.text())
+        .split(/\r?\n/)
+        .filter((line) => line.startsWith("data:"))
+        .map((line) => line.slice(5).replace(/^ /, ""))
+        .pop();
+      if (!lastData) {
+        throw new Error(`MCP SSE response for ${method} contained no data`);
+      }
+      json = JSON.parse(lastData) as JsonRpcResponse;
+    } else {
+      json = (await response.json()) as JsonRpcResponse;
+    }
+    if (json.error) {
+      throw new Error(`MCP error (${json.error.code}): ${json.error.message}`);
+    }
+    const sid = response.headers.get("mcp-session-id") ?? undefined;
+    return { result: json.result, sessionId: sid };
+  }
+
+  /**
+   * POSTs a JSON-RPC notification (no `id`, so no reply is parsed). Does
+   * nothing once the client is closed; a non-ok status is logged, not thrown.
+   */
+  private async sendNotification(
+    url: string,
+    method: string,
+    sessionId?: string,
+  ): Promise<void> {
+    if (this.closed) return;
+    const response = await fetch(url, {
+      method: "POST",
+      headers: {
+        "Content-Type": "application/json",
+        Accept: "application/json, text/event-stream",
+        ...(await this.authenticate()),
+        ...(sessionId ? { "Mcp-Session-Id": sessionId } : {}),
+      },
+      body: JSON.stringify({ jsonrpc: "2.0", method }),
+      signal: AbortSignal.timeout(30_000),
+    });
+    if (!response.ok) {
+      logger.error("MCP notification %s failed: %d", method, response.status);
+    }
+  }
+}
diff --git a/packages/appkit/src/plugins/agents/tools/tool.ts b/packages/appkit/src/plugins/agents/tools/tool.ts
new file mode 100644
index 00000000..b5d4db65
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tools/tool.ts
@@ -0,0 +1,53 @@
+import type { z } from "zod";
+import type { FunctionTool } from "./function-tool";
+import { toToolJSONSchema } from "./json-schema";
+
+export interface ToolConfig<S extends z.ZodType> {
+  name: string;
+  description?: string; // tool() falls back to `name`
+  schema: S; // source of both the JSON Schema and the runtime validation
+  execute: (args: z.infer<S>) => Promise<string> | string;
+}
+
+/**
+ * Creates a `FunctionTool` from a Zod-typed config.
+ *
+ * - `parameters` is the JSON Schema derived from `config.schema`.
+ * - `description` defaults to the tool name.
+ * - `execute` receives arguments typed by the schema. They are validated at
+ *   call time first; invalid arguments produce a formatted error string for
+ *   the LLM instead of an exception, so the model can self-correct on its
+ *   next turn.
+ */
+export function tool<S extends z.ZodType>(config: ToolConfig<S>): FunctionTool {
+  // Derived once, when the tool is defined; only validation runs per call.
+  const parameters = toToolJSONSchema(config.schema);
+
+  return {
+    type: "function",
+    name: config.name,
+    description: config.description ?? config.name,
+    parameters,
+    execute: async (args: Record<string, unknown>) => {
+      const outcome = config.schema.safeParse(args);
+      if (outcome.success) {
+        return config.execute(outcome.data as z.infer<S>);
+      }
+      // Returned, not thrown: the LLM reads the message and can retry.
+      return formatZodError(outcome.error, config.name);
+    },
+  };
+}
+
+/**
+ * Renders a Zod error as one LLM-readable line: `Invalid arguments for
+ * <tool>: <field>: <message>; ...`. Issues with an empty path use `(root)`.
+ */
+export function formatZodError(error: z.ZodError, toolName: string): string {
+  const rendered: string[] = [];
+  for (const { path, message } of error.issues) {
+    const field = path.length === 0 ? "(root)" : path.join(".");
+    rendered.push(`${field}: ${message}`);
+  }
+  return `Invalid arguments for ${toolName}: ${rendered.join("; ")}`;
+}
diff --git a/packages/appkit/src/plugins/agents/types.ts b/packages/appkit/src/plugins/agents/types.ts
new file mode 100644
index 00000000..861be26d
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/types.ts
@@ -0,0 +1,47 @@
+import type { AgentToolDefinition, ToolAnnotations } from "shared";
+import type { FunctionTool } from "./tools/function-tool";
+import type { HostedTool } from "./tools/hosted-tools";
+
+/**
+ * A tool reference produced by a plugin's `.toolkit()` call. The agents plugin
+ * recognizes the `__toolkitRef` brand and dispatches tool invocations through
+ * `PluginContext.executeTool(req, pluginName, localName, ...)`, preserving
+ * OBO (asUser) and telemetry spans.
+ */
+export interface ToolkitEntry {
+  readonly __toolkitRef: true; // brand checked by isToolkitEntry()
+  pluginName: string;
+  localName: string; // tool name without the toolkit prefix (e.g. "query")
+  def: AgentToolDefinition;
+  annotations?: ToolAnnotations;
+}
+
+/**
+ * Any tool an agent can invoke: inline function tools (`tool()`), hosted MCP
+ * tools (`mcpServer()` / raw hosted), or toolkit references from plugins
+ * (`analytics().toolkit()`).
+ */
+export type AgentTool = FunctionTool | HostedTool | ToolkitEntry;
+
+export interface ToolkitOptions {
+  /** Key prefix to prepend to each tool's local name. Defaults to `${pluginName}.`. */
+  prefix?: string;
+  /** Only include tools whose local name matches one of these. */
+  only?: string[];
+  /** Exclude tools whose local name matches one of these. */
+  except?: string[];
+  /** Remap specific local names to different keys (applied after prefix). */
+  rename?: Record<string, string>;
+}
+
+/**
+ * Type guard for `ToolkitEntry`.
+ *
+ * True only for a non-null object whose `__toolkitRef` is exactly `true`;
+ * used to tell toolkit references from inline tools in a mixed `tools` record.
+ */
+export function isToolkitEntry(value: unknown): value is ToolkitEntry {
+  if (value === null || typeof value !== "object") return false;
+  const { __toolkitRef: brand } = value as { __toolkitRef?: unknown };
+  return brand === true;
+}
diff --git a/packages/appkit/src/plugins/analytics/analytics.ts b/packages/appkit/src/plugins/analytics/analytics.ts
index a9c688da..26f326cc 100644
--- a/packages/appkit/src/plugins/analytics/analytics.ts
+++ b/packages/appkit/src/plugins/analytics/analytics.ts
@@ -1,16 +1,25 @@
 import type { WorkspaceClient } from "@databricks/sdk-experimental";
 import type express from "express";
 import type {
+  AgentToolDefinition,
   IAppRouter,
   PluginExecuteConfig,
   SQLTypeMarker,
   StreamExecutionSettings,
+  ToolProvider,
 } from "shared";
+import { z } from "zod";
 import { SQLWarehouseConnector } from "../../connectors";
 import { getWarehouseId, getWorkspaceClient } from "../../context";
 import { createLogger } from "../../logging/logger";
 import { Plugin, toPlugin } from "../../plugin";
 import type { PluginManifest } from "../../registry";
+import { buildToolkitEntries } from "../agents/build-toolkit";
+import {
+  defineTool,
+  executeFromRegistry,
+  toolsFromRegistry,
+} from "../agents/tools/define-tool";
 import { queryDefaults } from "./defaults";
 import manifest from "./manifest.json";
 import { QueryProcessor } from "./query";
@@ -22,7 +31,7 @@ import type {
 
 const logger = createLogger("analytics");
 
-export class AnalyticsPlugin extends Plugin {
+export class AnalyticsPlugin extends Plugin implements ToolProvider {
   /** Plugin manifest declaring metadata and resource requirements */
   static manifest = manifest as PluginManifest<"analytics">;
 
@@ -262,6 +271,45 @@ export class AnalyticsPlugin extends Plugin {
     this.streamManager.abortAll();
   }
 
+  private tools = {
+    query: defineTool({
+      description:
+        "Execute a SQL query against the Databricks SQL warehouse. Returns the query results as JSON.",
+      schema: z.object({
+        query: z.string().describe("The SQL query to execute"),
+      }),
+      annotations: {
+        readOnly: true, // NOTE(review): SQL text is forwarded unchanged — confirm query() cannot write
+        requiresUserContext: true,
+      },
+      handler: (args, signal) =>
+        this.query(args.query, undefined, undefined, signal),
+    }),
+  };
+
+  getAgentTools(): AgentToolDefinition[] {
+    return toolsFromRegistry(this.tools); // one definition per registry key
+  }
+
+  async executeAgentTool(
+    name: string,
+    args: unknown,
+    signal?: AbortSignal,
+  ): Promise<unknown> {
+    return executeFromRegistry(this.tools, name, args, signal); // bad args -> error string; unknown name throws
+  }
+
+  /**
+   * Returns the plugin's tools as a keyed record of `ToolkitEntry` markers.
+   * Called by the agents plugin (via `resolveToolkitFromProvider`) to spread
+   * a filtered, renamed view of the plugin's tools into an agent's tool
+   * index. Most callers should go through `fromPlugin(analytics, opts)` at
+   * module scope instead of reaching for this directly.
+   */
+  toolkit(opts?: import("../agents/types").ToolkitOptions) {
+    return buildToolkitEntries(this.name, this.tools, opts); // keys default to "<plugin name>.<tool>"
+  }
+
   /**
    * Returns the public exports for the analytics plugin.
    * Note: `asUser()` is automatically added by AppKit.
diff --git a/packages/appkit/src/plugins/analytics/tests/analytics.test.ts b/packages/appkit/src/plugins/analytics/tests/analytics.test.ts
index 9a30440e..29157fff 100644
--- a/packages/appkit/src/plugins/analytics/tests/analytics.test.ts
+++ b/packages/appkit/src/plugins/analytics/tests/analytics.test.ts
@@ -608,4 +608,22 @@ describe("Analytics Plugin", () => {
       });
     });
   });
+
+  describe("toolkit()", () => {
+    test("produces ToolkitEntry records keyed by the plugin name", () => {
+      const plugin = new AnalyticsPlugin({ name: "analytics" });
+      const entries = plugin.toolkit(); // no options: default "<plugin name>." prefix
+      expect(Object.keys(entries)).toContain("analytics.query");
+      const entry = entries["analytics.query"];
+      expect(entry.__toolkitRef).toBe(true);
+      expect(entry.pluginName).toBe("analytics");
+      expect(entry.localName).toBe("query");
+    });
+
+    test("respects prefix and only options", () => {
+      const plugin = new AnalyticsPlugin({ name: "analytics" });
+      const entries = plugin.toolkit({ prefix: "", only: ["query"] }); // empty prefix -> bare local names
+      expect(Object.keys(entries)).toEqual(["query"]);
+    });
+  });
 });
diff --git a/packages/appkit/src/plugins/files/plugin.ts b/packages/appkit/src/plugins/files/plugin.ts
index 9344af85..cb588352 100644
--- a/packages/appkit/src/plugins/files/plugin.ts
+++ b/packages/appkit/src/plugins/files/plugin.ts
@@ -2,7 +2,13 @@ import { STATUS_CODES } from "node:http";
 import { Readable } from "node:stream";
 import { ApiError } from "@databricks/sdk-experimental";
 import type express from "express";
-import type { IAppRouter, PluginExecutionSettings } from "shared";
+import type {
+  AgentToolDefinition,
+  IAppRouter,
+  PluginExecutionSettings,
+  ToolProvider,
+} from "shared";
+import { z } from "zod";
 import {
   contentTypeFromPath,
   FilesConnector,
@@ -15,6 +21,13 @@ import { createLogger } from "../../logging/logger";
 import { Plugin, toPlugin } from "../../plugin";
 import type { PluginManifest, ResourceRequirement } from "../../registry";
 import { ResourceType } from "../../registry";
+import { buildToolkitEntries } from "../agents/build-toolkit";
+import {
+  defineTool,
+  executeFromRegistry,
+  type ToolRegistry,
+  toolsFromRegistry,
+} from "../agents/tools/define-tool";
 import {
   FILES_DOWNLOAD_DEFAULTS,
   FILES_MAX_UPLOAD_SIZE,
@@ -34,7 +47,7 @@ import type {
 
 const logger = createLogger("files");
 
-export class FilesPlugin extends Plugin {
+export class FilesPlugin extends Plugin implements ToolProvider {
   name = "files";
 
   /** Plugin manifest declaring metadata and resource requirements. */
@@ -45,6 +58,7 @@ export class FilesPlugin extends Plugin {
   private volumeConnectors: Record<string, FilesConnector> = {};
   private volumeConfigs: Record<string, VolumeConfig> = {};
   private volumeKeys: string[] = [];
+  private tools: ToolRegistry = {};
 
   /**
    * Scans `process.env` for `DATABRICKS_VOLUME_*` keys and merges them with
@@ -148,6 +162,79 @@ export class FilesPlugin extends Plugin {
         customContentTypes: mergedConfig.customContentTypes,
       });
     }
+
+    for (const volumeKey of this.volumeKeys) {
+      Object.assign(this.tools, this._defineVolumeTools(volumeKey));
+    }
+  }
+
+  /**
+   * Creates the agent tools for one volume, each keyed `${volumeKey}.${method}`
+   * (list, read, exists, metadata, upload, delete) and bound to that volume.
+   */
+  private _defineVolumeTools(volumeKey: string): ToolRegistry {
+    const volume = () => this.createVolumeAPI(volumeKey);
+    const registry: ToolRegistry = {};
+    registry[`${volumeKey}.list`] = defineTool({
+      description: `List files and directories in the "${volumeKey}" volume`,
+      schema: z.object({
+        path: z
+          .string()
+          .optional()
+          .describe("Directory path to list (optional, defaults to root)"),
+      }),
+      annotations: { readOnly: true, requiresUserContext: true },
+      handler: ({ path }) => volume().list(path),
+    });
+    registry[`${volumeKey}.read`] = defineTool({
+      description: `Read a text file from the "${volumeKey}" volume`,
+      schema: z.object({
+        path: z.string().describe("File path to read"),
+      }),
+      annotations: { readOnly: true, requiresUserContext: true },
+      handler: ({ path }) => volume().read(path),
+    });
+    registry[`${volumeKey}.exists`] = defineTool({
+      description: `Check if a file or directory exists in the "${volumeKey}" volume`,
+      schema: z.object({
+        path: z.string().describe("Path to check"),
+      }),
+      annotations: { readOnly: true, requiresUserContext: true },
+      handler: ({ path }) => volume().exists(path),
+    });
+    registry[`${volumeKey}.metadata`] = defineTool({
+      description: `Get metadata (size, type, last modified) for a file in the "${volumeKey}" volume`,
+      schema: z.object({
+        path: z.string().describe("File path"),
+      }),
+      annotations: { readOnly: true, requiresUserContext: true },
+      handler: ({ path }) => volume().metadata(path),
+    });
+    registry[`${volumeKey}.upload`] = defineTool({
+      description: `Upload a text file to the "${volumeKey}" volume`,
+      schema: z.object({
+        path: z.string().describe("Destination file path"),
+        contents: z.string().describe("File contents as a string"),
+        overwrite: z
+          .boolean()
+          .optional()
+          .describe("Whether to overwrite existing file"),
+      }),
+      annotations: { destructive: true, requiresUserContext: true },
+      handler: ({ path, contents, overwrite }) => {
+        const options = { overwrite };
+        return volume().upload(path, contents, options);
+      },
+    });
+    registry[`${volumeKey}.delete`] = defineTool({
+      description: `Delete a file from the "${volumeKey}" volume`,
+      schema: z.object({
+        path: z.string().describe("File path to delete"),
+      }),
+      annotations: { destructive: true, requiresUserContext: true },
+      handler: ({ path }) => volume().delete(path),
+    });
+    return registry;
+  }
 
   /**
@@ -950,6 +1037,23 @@ export class FilesPlugin extends Plugin {
    * appKit.files("uploads").list()
    * ```
    */
+
+  getAgentTools(): AgentToolDefinition[] { // NOTE(review): the JSDoc ending just above appears to belong to exports(); these methods now sit between them
+    return toolsFromRegistry(this.tools); // one definition per `${volumeKey}.${method}` key
+  }
+
+  async executeAgentTool(
+    name: string,
+    args: unknown,
+    signal?: AbortSignal,
+  ): Promise<unknown> {
+    return executeFromRegistry(this.tools, name, args, signal); // bad args -> error string; unknown name throws
+  }
+
+  toolkit(opts?: import("../agents/types").ToolkitOptions) {
+    return buildToolkitEntries(this.name, this.tools, opts); // ToolkitEntry view of the per-volume registry
+  }
+
   exports(): FilesExport {
     const resolveVolume = (volumeKey: string): VolumeHandle => {
       if (!this.volumeKeys.includes(volumeKey)) {
diff --git a/packages/appkit/src/plugins/files/tests/plugin.test.ts b/packages/appkit/src/plugins/files/tests/plugin.test.ts
index 99e08b8c..17591a45 100644
--- a/packages/appkit/src/plugins/files/tests/plugin.test.ts
+++ b/packages/appkit/src/plugins/files/tests/plugin.test.ts
@@ -204,6 +204,62 @@ describe("FilesPlugin", () => {
     });
   });
 
+  describe("getAgentTools / executeAgentTool", () => {
+    test("produces independent tool entries per volume", () => {
+      const plugin = new FilesPlugin(VOLUMES_CONFIG);
+      const tools = plugin.getAgentTools();
+      const names = tools.map((t) => t.name);
+
+      expect(names).toContain("uploads.list");
+      expect(names).toContain("uploads.read");
+      expect(names).toContain("uploads.exists");
+      expect(names).toContain("uploads.metadata");
+      expect(names).toContain("uploads.upload");
+      expect(names).toContain("uploads.delete");
+
+      expect(names).toContain("exports.list");
+      expect(names).toContain("exports.read");
+      expect(names).toContain("exports.delete");
+
+      expect(tools).toHaveLength(12); // 6 tools per volume × presumably 2 volumes in VOLUMES_CONFIG
+    });
+
+    test("dispatches to the correct volume API based on the tool name", async () => {
+      const plugin = new FilesPlugin(VOLUMES_CONFIG);
+      const asyncIterable = (items: { path: string }[]) => ({
+        [Symbol.asyncIterator]: async function* () {
+          for (const item of items) yield item;
+        },
+      });
+      mockClient.files.listDirectoryContents.mockReturnValueOnce(
+        asyncIterable([{ path: "uploads-file" }]),
+      );
+      mockClient.files.listDirectoryContents.mockReturnValueOnce(
+        asyncIterable([{ path: "exports-file" }]),
+      );
+
+      const uploadsResult = (await plugin.executeAgentTool(
+        "uploads.list",
+        {},
+      )) as { path: string }[];
+      const exportsResult = (await plugin.executeAgentTool(
+        "exports.list",
+        {},
+      )) as { path: string }[];
+
+      expect(uploadsResult[0].path).toBe("uploads-file");
+      expect(exportsResult[0].path).toBe("exports-file");
+    });
+
+    test("returns LLM-friendly error string for invalid tool args", async () => {
+      const plugin = new FilesPlugin(VOLUMES_CONFIG);
+      const result = await plugin.executeAgentTool("uploads.read", {}); // `path` is required by the read schema
+      expect(typeof result).toBe("string");
+      expect(result).toContain("Invalid arguments for uploads.read");
+      expect(result).toContain("path");
+    });
+  });
+
   describe("exports()", () => {
     test("returns a callable function with a .volume alias", () => {
       const plugin = new FilesPlugin(VOLUMES_CONFIG);
diff --git a/packages/appkit/src/plugins/genie/genie.ts b/packages/appkit/src/plugins/genie/genie.ts
index 712aadbf..0c251994 100644
--- a/packages/appkit/src/plugins/genie/genie.ts
+++ b/packages/appkit/src/plugins/genie/genie.ts
@@ -1,11 +1,24 @@
 import { randomUUID } from "node:crypto";
 import type express from "express";
-import type { IAppRouter, StreamExecutionSettings } from "shared";
+import type {
+  AgentToolDefinition,
+  IAppRouter,
+  StreamExecutionSettings,
+  ToolProvider,
+} from "shared";
+import { z } from "zod";
 import { GenieConnector } from "../../connectors";
 import { getWorkspaceClient } from "../../context";
 import { createLogger } from "../../logging";
 import { Plugin, toPlugin } from "../../plugin";
 import type { PluginManifest } from "../../registry";
+import { buildToolkitEntries } from "../agents/build-toolkit";
+import {
+  defineTool,
+  executeFromRegistry,
+  type ToolRegistry,
+  toolsFromRegistry,
+} from "../agents/tools/define-tool";
 import { genieStreamDefaults } from "./defaults";
 import manifest from "./manifest.json";
 import type {
@@ -17,7 +30,7 @@ import type {
 
 const logger = createLogger("genie");
 
-export class GeniePlugin extends Plugin {
+export class GeniePlugin extends Plugin implements ToolProvider {
   static manifest = manifest as PluginManifest<"genie">;
 
   protected static description =
@@ -25,6 +38,7 @@ export class GeniePlugin extends Plugin {
   protected declare config: IGenieConfig;
 
   private readonly genieConnector: GenieConnector;
+  private tools: ToolRegistry = {};
 
   constructor(config: IGenieConfig) {
     super(config);
@@ -36,6 +50,53 @@ export class GeniePlugin extends Plugin {
       timeout: this.config.timeout,
       maxMessages: 200,
     });
+
+    for (const alias of Object.keys(this.config.spaces ?? {})) {
+      Object.assign(this.tools, this._defineSpaceTools(alias));
+    }
+  }
+
+  /**
+   * Produces the two agent tools exposed for one Genie space alias:
+   * `${alias}.sendMessage` and `${alias}.getConversation`.
+   */
+  private _defineSpaceTools(alias: string): ToolRegistry {
+    const sendMessage = defineTool({
+      description: `Send a natural language question to the Genie space "${alias}" and get data analysis results`,
+      schema: z.object({
+        content: z.string().describe("The natural language question to ask"),
+        conversationId: z
+          .string()
+          .optional()
+          .describe(
+            "Optional conversation ID to continue an existing conversation",
+          ),
+      }),
+      annotations: { requiresUserContext: true },
+      // Drain the stream so the caller receives every event in one array.
+      handler: async ({ content, conversationId }) => {
+        const collected: GenieStreamEvent[] = [];
+        const stream = this.sendMessage(alias, content, conversationId);
+        for await (const streamEvent of stream) {
+          collected.push(streamEvent);
+        }
+        return collected;
+      },
+    });
+
+    const getConversation = defineTool({
+      description: `Retrieve the conversation history from the Genie space "${alias}"`,
+      schema: z.object({
+        conversationId: z.string().describe("The conversation ID to retrieve"),
+      }),
+      annotations: { readOnly: true, requiresUserContext: true },
+      handler: ({ conversationId }) =>
+        this.getConversation(alias, conversationId),
+    });
+    return {
+      [`${alias}.sendMessage`]: sendMessage,
+      [`${alias}.getConversation`]: getConversation,
+    };
   }
 
   private defaultSpaces(): Record<string, string> {
@@ -287,6 +348,22 @@ export class GeniePlugin extends Plugin {
     this.streamManager.abortAll();
   }
 
+  getAgentTools(): AgentToolDefinition[] {
+    return toolsFromRegistry(this.tools); // registry -> tool definitions
+  }
+  /** Runs the named tool through the registry helper, forwarding `signal`. */
+  async executeAgentTool(
+    name: string,
+    args: unknown,
+    signal?: AbortSignal,
+  ): Promise<unknown> {
+    return executeFromRegistry(this.tools, name, args, signal);
+  }
+  /** Builds toolkit entries from `this.name`, the registry and `opts`. */
+  toolkit(opts?: import("../agents/types").ToolkitOptions) {
+    return buildToolkitEntries(this.name, this.tools, opts);
+  }
+
   exports() {
     return {
       sendMessage: this.sendMessage,
diff --git a/packages/appkit/src/plugins/genie/tests/genie.test.ts b/packages/appkit/src/plugins/genie/tests/genie.test.ts
index 3cf0784d..672e6242 100644
--- a/packages/appkit/src/plugins/genie/tests/genie.test.ts
+++ b/packages/appkit/src/plugins/genie/tests/genie.test.ts
@@ -187,6 +187,30 @@ describe("Genie Plugin", () => {
     });
   });
 
+  describe("getAgentTools / executeAgentTool", () => {
+    test("produces independent tool entries per configured space", () => {
+      const tools = new GeniePlugin(config).getAgentTools();
+      const toolNames = tools.map((definition) => definition.name);
+      const expected = [
+        "myspace.sendMessage",
+        "myspace.getConversation",
+        "salesbot.sendMessage",
+        "salesbot.getConversation",
+      ];
+      for (const name of expected) expect(toolNames).toContain(name);
+      expect(toolNames).toHaveLength(expected.length);
+    });
+
+    test("returns LLM-friendly error string for invalid tool args", async () => {
+      // `conversationId` is deliberately omitted from the arguments.
+      const genie = new GeniePlugin(config);
+      const reply = await genie.executeAgentTool("myspace.getConversation", {});
+      expect(typeof reply).toBe("string");
+      expect(reply).toContain("Invalid arguments for myspace.getConversation");
+      expect(reply).toContain("conversationId");
+    });
+  });
+
   describe("space alias resolution", () => {
     test("should return 404 for unknown alias", async () => {
       const plugin = new GeniePlugin(config);
diff --git a/packages/appkit/src/plugins/lakebase/lakebase.ts b/packages/appkit/src/plugins/lakebase/lakebase.ts
index 3071d539..f1866d39 100644
--- a/packages/appkit/src/plugins/lakebase/lakebase.ts
+++ b/packages/appkit/src/plugins/lakebase/lakebase.ts
@@ -1,4 +1,6 @@
 import type { Pool, QueryResult, QueryResultRow } from "pg";
+import type { AgentToolDefinition, ToolProvider } from "shared";
+import { z } from "zod";
 import {
   createLakebasePool,
   getLakebaseOrmConfig,
@@ -8,6 +10,12 @@ import {
 import { createLogger } from "../../logging/logger";
 import { Plugin, toPlugin } from "../../plugin";
 import type { PluginManifest } from "../../registry";
+import { buildToolkitEntries } from "../agents/build-toolkit";
+import {
+  defineTool,
+  executeFromRegistry,
+  toolsFromRegistry,
+} from "../agents/tools/define-tool";
 import manifest from "./manifest.json";
 import type { ILakebaseConfig } from "./types";
 
@@ -30,7 +38,7 @@ const logger = createLogger("lakebase");
  * const result = await AppKit.lakebase.query("SELECT * FROM users WHERE id = $1", [userId]);
  * ```
  */
-class LakebasePlugin extends Plugin {
+class LakebasePlugin extends Plugin implements ToolProvider {
   /** Plugin manifest declaring metadata and resource requirements */
   static manifest = manifest as PluginManifest<"lakebase">;
 
@@ -102,6 +110,50 @@ class LakebasePlugin extends Plugin {
    * - `getOrmConfig()` — Returns a config object compatible with Drizzle, TypeORM, Sequelize, etc.
    * - `getPgConfig()` — Returns a `pg.PoolConfig` object for manual pool construction
    */
+
+  // NOTE(review): the JSDoc directly above this block describes `exports()`;
+  // these members were inserted between that comment and its method.
+  // Agent tool registry: one `query` tool that runs caller-supplied SQL.
+  private tools = {
+    query: defineTool({
+      description:
+        "Execute a parameterized SQL query against the Lakebase PostgreSQL database. Use $1, $2, etc. as placeholders and pass values separately.",
+      schema: z.object({
+        text: z
+          .string()
+          .describe(
+            "SQL query string with $1, $2, ... placeholders for parameters",
+          ),
+        values: z
+          .array(z.unknown())
+          .optional()
+          .describe("Parameter values corresponding to placeholders"),
+      }),
+      // The SQL text is passed through unrestricted (UPDATE/DELETE/DROP too).
+      annotations: { readOnly: false, destructive: true, idempotent: false },
+      handler: async (args) => {
+        const result = await this.query(args.text, args.values);
+        return result.rows;
+      },
+    }),
+  };
+
+  getAgentTools(): AgentToolDefinition[] {
+    return toolsFromRegistry(this.tools); // registry -> tool definitions
+  }
+  /** Runs the named tool through the registry helper, forwarding `signal`. */
+  async executeAgentTool(
+    name: string,
+    args: unknown,
+    signal?: AbortSignal,
+  ): Promise<unknown> {
+    return executeFromRegistry(this.tools, name, args, signal);
+  }
+  /** Builds toolkit entries from `this.name`, the registry and `opts`. */
+  toolkit(opts?: import("../agents/types").ToolkitOptions) {
+    return buildToolkitEntries(this.name, this.tools, opts);
+  }
+
   exports() {
     return {
       // biome-ignore lint/style/noNonNullAssertion: pool is guaranteed non-null after setup(), which AppKit always awaits before exposing the plugin API

From e26795bdc134ff0e910e3c76f708c7e2cd3aac6b Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Tue, 21 Apr 2026 19:48:00 +0200
Subject: [PATCH 2/6] =?UTF-8?q?feat(appkit):=20plugin=20infrastructure=20?=
 =?UTF-8?q?=E2=80=94=20attachContext=20lifecycle=20+=20PluginContext=20med?=
 =?UTF-8?q?iator?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Third layer: the substrate every downstream PR relies on. No user-
facing API changes here; the surface for this PR is the mediator
pattern, lifecycle semantics, and factory stamping.

### Split Plugin construction from context binding

`Plugin` constructors become pure — no `CacheManager.getInstanceSync()`,
no `TelemetryManager.getProvider()`, no `PluginContext` wiring inside
`constructor()`. That work moves to a new lifecycle method:

```ts
interface BasePlugin {
  attachContext?(deps: {
    context?: unknown;
    telemetryConfig?: TelemetryOptions;
  }): void;
}
```

`createApp` calls `attachContext()` on each plugin immediately after its
constructor returns and before its `setup()` is invoked. This lets
factories return `PluginData` tuples at module scope without pulling core
services into the import graph — a prerequisite for later PRs that
construct agent definitions before `createApp`.

### PluginContext mediator

`packages/appkit/src/core/plugin-context.ts` — new class that mediates
all inter-plugin communication:

- **Route buffering**: `addRoute()` / `addMiddleware()` buffer until
  the server plugin calls `registerAsRouteTarget()`, then flush via
  `addExtension()`. Eliminates plugin-ordering fragility.
- **ToolProvider registry**: `registerToolProvider(name, plugin)` +
  live `getToolProviders()`. Typed discovery of tool-exposing plugins.
- **User-scoped tool execution**: `executeTool(req, pluginName,
  toolName, args, signal?)` resolves the provider, wraps in
  `asUser(req)` for OBO, opens a telemetry span, hands the tool a 30s
  timeout signal (combined with the caller's), dispatches, returns.
- **Lifecycle hooks**: `onLifecycle('setup:complete' | 'server:ready'
  | 'shutdown', cb)` + `emitLifecycle(event)`. Callback errors don't
  block siblings.

### `toPlugin` stamps `pluginName`

`packages/appkit/src/plugin/to-plugin.ts` — the factory now attaches a
read-only `pluginName` property to the returned function. Later PRs'
`fromPlugin(factory)` reads it to identify which plugin a factory
refers to without needing to construct an instance. `NamedPluginFactory`
type exported for consumers who want to type-constrain factories.

### Server plugin defers start to `setup:complete`

`ServerPlugin.setup()` no longer calls `extendRoutes()` synchronously.
It subscribes to the `setup:complete` lifecycle event via
`PluginContext` and starts the HTTP server there. This ensures that
any deferred-phase plugin (agents plugin in a later PR) has had a
chance to register routes via `PluginContext.addRoute()` before the
server binds. Removes the `plugins` field from `ServerConfig` (routes
are now discovered via the context, not a config snapshot).

### Test plan

- 25 new PluginContext tests (route buffering, tool provider registry,
  executeTool paths, lifecycle hooks, plugin metadata)
- Updated AppKit lifecycle tests to inject `context` instead of
  `plugins`
- Full appkit vitest suite: 1237 tests passing
- Typecheck clean across all 8 workspace projects

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 packages/appkit/src/core/appkit.ts            |  27 +-
 packages/appkit/src/core/plugin-context.ts    | 287 ++++++++++++++++
 .../appkit/src/core/tests/databricks.test.ts  |  15 +-
 .../src/core/tests/plugin-context.test.ts     | 325 ++++++++++++++++++
 packages/appkit/src/plugin/index.ts           |   2 +-
 packages/appkit/src/plugin/plugin.ts          |  56 ++-
 packages/appkit/src/plugin/to-plugin.ts       |  32 +-
 packages/appkit/src/plugins/server/index.ts   |  41 ++-
 .../src/plugins/server/tests/server.test.ts   |  42 ++-
 packages/appkit/src/plugins/server/types.ts   |   2 -
 packages/shared/src/plugin.ts                 |   9 +
 11 files changed, 799 insertions(+), 39 deletions(-)
 create mode 100644 packages/appkit/src/core/plugin-context.ts
 create mode 100644 packages/appkit/src/core/tests/plugin-context.test.ts

diff --git a/packages/appkit/src/core/appkit.ts b/packages/appkit/src/core/appkit.ts
index a2cba994..a0c2e566 100644
--- a/packages/appkit/src/core/appkit.ts
+++ b/packages/appkit/src/core/appkit.ts
@@ -13,14 +13,18 @@ import { ServiceContext } from "../context";
 import { ResourceRegistry, ResourceType } from "../registry";
 import type { TelemetryConfig } from "../telemetry";
 import { TelemetryManager } from "../telemetry";
+import { isToolProvider, PluginContext } from "./plugin-context";
 
 export class AppKit<TPlugins extends InputPluginMap> {
   #pluginInstances: Record<string, BasePlugin> = {};
   #setupPromises: Promise<void>[] = [];
+  #context: PluginContext;
 
   private constructor(config: { plugins: TPlugins }) {
     const { plugins, ...globalConfig } = config;
 
+    this.#context = new PluginContext();
+
     const pluginEntries = Object.entries(plugins);
 
     const corePlugins = pluginEntries.filter(([_, p]) => {
@@ -35,20 +39,24 @@ export class AppKit<TPlugins extends InputPluginMap> {
 
     for (const [name, pluginData] of corePlugins) {
       if (pluginData) {
-        this.createAndRegisterPlugin(globalConfig, name, pluginData);
+        this.createAndRegisterPlugin(globalConfig, name, pluginData, {
+          context: this.#context,
+        });
       }
     }
 
     for (const [name, pluginData] of normalPlugins) {
       if (pluginData) {
-        this.createAndRegisterPlugin(globalConfig, name, pluginData);
+        this.createAndRegisterPlugin(globalConfig, name, pluginData, {
+          context: this.#context,
+        });
       }
     }
 
     for (const [name, pluginData] of deferredPlugins) {
       if (pluginData) {
         this.createAndRegisterPlugin(globalConfig, name, pluginData, {
-          plugins: this.#pluginInstances,
+          context: this.#context,
         });
       }
     }
@@ -70,8 +78,20 @@ export class AppKit<TPlugins extends InputPluginMap> {
     };
     const pluginInstance = new Plugin(baseConfig);
 
+    if (typeof pluginInstance.attachContext === "function") {
+      pluginInstance.attachContext({
+        context: this.#context,
+        telemetryConfig: baseConfig.telemetry,
+      });
+    }
+
     this.#pluginInstances[name] = pluginInstance;
 
+    this.#context.registerPlugin(name, pluginInstance);
+    if (isToolProvider(pluginInstance)) {
+      this.#context.registerToolProvider(name, pluginInstance);
+    }
+
     this.#setupPromises.push(pluginInstance.setup());
 
     const self = this;
@@ -199,6 +219,7 @@ export class AppKit<TPlugins extends InputPluginMap> {
     const instance = new AppKit(mergedConfig);
 
     await Promise.all(instance.#setupPromises);
+    await instance.#context.emitLifecycle("setup:complete");
 
     return instance as unknown as PluginMap<T>;
   }
diff --git a/packages/appkit/src/core/plugin-context.ts b/packages/appkit/src/core/plugin-context.ts
new file mode 100644
index 00000000..c2801585
--- /dev/null
+++ b/packages/appkit/src/core/plugin-context.ts
@@ -0,0 +1,287 @@
+import type express from "express";
+import type { BasePlugin, ToolProvider } from "shared";
+import { createLogger } from "../logging/logger";
+import { TelemetryManager } from "../telemetry";
+
+const logger = createLogger("plugin-context");
+
+interface BufferedRoute {
+  method: string; // Express verb name, or "use" for middleware entries
+  path: string;
+  handlers: express.RequestHandler[];
+}
+/** Shape accepted by `registerAsRouteTarget`; receives app-mutating callbacks. */
+interface RouteTarget {
+  addExtension(fn: (app: express.Application) => void): void;
+}
+/** A registered tool-providing plugin together with its registry name. */
+interface ToolProviderEntry {
+  plugin: BasePlugin & ToolProvider;
+  name: string;
+}
+/** Events that can be subscribed to via `PluginContext.onLifecycle`. */
+type LifecycleEvent = "setup:complete" | "server:ready" | "shutdown";
+
+/**
+ * Mediator for inter-plugin communication.
+ *
+ * Created by AppKit core and passed to every plugin. Plugins request
+ * capabilities from the context instead of holding direct references
+ * to sibling plugin instances.
+ *
+ * Capabilities:
+ * - Route mounting with buffering (order-independent)
+ * - Typed ToolProvider registry (live, not snapshot-based)
+ * - User-scoped tool execution with automatic telemetry
+ * - Lifecycle hooks for plugin coordination
+ */
+export class PluginContext {
+  private routeBuffer: BufferedRoute[] = [];
+  private routeTarget: RouteTarget | null = null;
+  private toolProviders = new Map<string, ToolProviderEntry>();
+  private plugins = new Map<string, BasePlugin>();
+  private lifecycleHooks = new Map<
+    LifecycleEvent,
+    Set<() => void | Promise<void>>
+  >();
+  private telemetry = TelemetryManager.getProvider("plugin-context");
+
+  /**
+   * Register a route on the root Express application.
+   *
+   * If a route target (server plugin) has registered, the route is applied
+   * immediately. Otherwise it is buffered and flushed when a route target
+   * becomes available.
+   */
+  addRoute(
+    method: string,
+    path: string,
+    ...handlers: express.RequestHandler[]
+  ): void {
+    if (this.routeTarget) {
+      this.applyRoute({ method, path, handlers });
+    } else {
+      this.routeBuffer.push({ method, path, handlers });
+    }
+  }
+
+  /**
+   * Register middleware on the root Express application.
+   *
+   * Same buffering semantics as `addRoute`.
+   */
+  addMiddleware(path: string, ...handlers: express.RequestHandler[]): void {
+    if (this.routeTarget) {
+      this.applyMiddleware(path, handlers);
+    } else {
+      this.routeBuffer.push({ method: "use", path, handlers });
+    }
+  }
+
+  /**
+   * Called by the server plugin to opt in as the route target.
+   * Flushes all buffered routes via the server's `addExtension`.
+   */
+  registerAsRouteTarget(target: RouteTarget): void {
+    this.routeTarget = target;
+
+    for (const route of this.routeBuffer) {
+      if (route.method === "use") {
+        this.applyMiddleware(route.path, route.handlers);
+      } else {
+        this.applyRoute(route);
+      }
+    }
+    this.routeBuffer = [];
+  }
+
+  /**
+   * Register a plugin that implements the ToolProvider interface.
+   * Called by AppKit core after constructing each plugin.
+   */
+  registerToolProvider(name: string, plugin: BasePlugin & ToolProvider): void {
+    this.toolProviders.set(name, { plugin, name });
+  }
+
+  /**
+   * Register a plugin instance.
+   * Called by AppKit core after constructing each plugin.
+   */
+  registerPlugin(name: string, instance: BasePlugin): void {
+    this.plugins.set(name, instance);
+  }
+
+  /**
+   * Returns all registered plugin instances keyed by name.
+   * Used by the server plugin for route injection, client config,
+   * and shutdown coordination.
+   */
+  getPlugins(): Map<string, BasePlugin> {
+    return this.plugins;
+  }
+
+  /**
+   * Returns all registered ToolProvider plugins.
+   * Always returns the current set — not a frozen snapshot.
+   */
+  getToolProviders(): Array<{ name: string; provider: ToolProvider }> {
+    return Array.from(this.toolProviders.values()).map((entry) => ({
+      name: entry.name,
+      provider: entry.plugin,
+    }));
+  }
+
+  /**
+   * Execute a tool on a ToolProvider plugin with automatic user scoping
+   * and telemetry.
+   *
+   * The context:
+   * 1. Resolves the plugin by name
+   * 2. Calls `asUser(req)` for user-scoped execution
+   * 3. Wraps the call in a telemetry span with a 30s timeout
+   */
+  async executeTool(
+    req: express.Request,
+    pluginName: string,
+    toolName: string,
+    args: unknown,
+    signal?: AbortSignal,
+  ): Promise<unknown> {
+    const entry = this.toolProviders.get(pluginName);
+    if (!entry) {
+      throw new Error(
+        `PluginContext: unknown plugin "${pluginName}". Available: ${Array.from(this.toolProviders.keys()).join(", ")}`,
+      );
+    }
+
+    const tracer = this.telemetry.getTracer();
+    const operationName = `executeTool:${pluginName}.${toolName}`;
+
+    return tracer.startActiveSpan(operationName, async (span) => {
+      const timeout = 30_000;
+      const timeoutSignal = AbortSignal.timeout(timeout);
+      const combinedSignal = signal
+        ? AbortSignal.any([signal, timeoutSignal])
+        : timeoutSignal;
+
+      try {
+        const userPlugin = (entry.plugin as any).asUser(req);
+        const result = await (userPlugin as ToolProvider).executeAgentTool(
+          toolName,
+          args,
+          combinedSignal,
+        );
+        span.setStatus({ code: 0 });
+        return result;
+      } catch (error) {
+        span.setStatus({
+          code: 2,
+          message:
+            error instanceof Error ? error.message : "Tool execution failed",
+        });
+        span.recordException(
+          error instanceof Error ? error : new Error(String(error)),
+        );
+        throw error;
+      } finally {
+        span.end();
+      }
+    });
+  }
+
+  /**
+   * Register a lifecycle hook callback.
+   */
+  onLifecycle(event: LifecycleEvent, fn: () => void | Promise<void>): void {
+    let hooks = this.lifecycleHooks.get(event);
+    if (!hooks) {
+      hooks = new Set();
+      this.lifecycleHooks.set(event, hooks);
+    }
+    hooks.add(fn);
+  }
+
+  /**
+   * Emit a lifecycle event, calling all registered callbacks in order.
+   * Errors in individual callbacks are logged but do not prevent
+   * other callbacks from running. On `setup:complete` it also warns when
+   * routes are still buffered because no route target ever registered.
+   * @internal Called by AppKit core only.
+   */
+  async emitLifecycle(event: LifecycleEvent): Promise<void> {
+    // This check must precede the no-hooks early return below: when nothing
+    // subscribed to `setup:complete` (for example, no server plugin), the
+    // warning about unapplied routes is exactly what the operator needs.
+    const pending = this.routeBuffer.length;
+    if (event === "setup:complete" && pending > 0 && !this.routeTarget) {
+      logger.warn(
+        "%d buffered routes were never applied — no server plugin registered as route target",
+        pending,
+      );
+    }
+
+    const hooks = this.lifecycleHooks.get(event);
+    if (!hooks) return;
+
+    for (const fn of hooks) {
+      try {
+        await fn();
+      } catch (error) {
+        logger.error("Lifecycle hook '%s' failed: %O", event, error);
+      }
+    }
+  }
+
+  /**
+   * Returns all registered plugin names.
+   */
+  getPluginNames(): string[] {
+    return Array.from(this.plugins.keys());
+  }
+
+  /**
+   * Check if a plugin with the given name is registered.
+   */
+  hasPlugin(name: string): boolean {
+    return this.plugins.has(name);
+  }
+
+  private applyRoute(route: BufferedRoute): void {
+    if (!this.routeTarget) return;
+    this.routeTarget.addExtension((app) => {
+      const method = route.method.toLowerCase() as keyof express.Application;
+      if (typeof app[method] === "function") {
+        (app[method] as (...a: unknown[]) => void)(
+          route.path,
+          ...route.handlers,
+        );
+      }
+    });
+  }
+
+  private applyMiddleware(
+    path: string,
+    handlers: express.RequestHandler[],
+  ): void {
+    if (!this.routeTarget) return;
+    this.routeTarget.addExtension((app) => {
+      app.use(path, ...handlers);
+    });
+  }
+}
+
+/**
+ * Runtime guard for the ToolProvider contract: accepts any non-null object
+ * whose `getAgentTools` and `executeAgentTool` members are both functions.
+ */
+export function isToolProvider(
+  plugin: unknown,
+): plugin is BasePlugin & ToolProvider {
+  if (plugin === null || typeof plugin !== "object") return false;
+  const { getAgentTools, executeAgentTool } = plugin as {
+    getAgentTools?: unknown;
+    executeAgentTool?: unknown;
+  };
+  const callable = (member: unknown) => typeof member === "function";
+  return callable(getAgentTools) && callable(executeAgentTool);
+}
diff --git a/packages/appkit/src/core/tests/databricks.test.ts b/packages/appkit/src/core/tests/databricks.test.ts
index c05345a6..9d3fe5f8 100644
--- a/packages/appkit/src/core/tests/databricks.test.ts
+++ b/packages/appkit/src/core/tests/databricks.test.ts
@@ -109,11 +109,11 @@ class DeferredTestPlugin implements BasePlugin {
   name = "deferredTest";
   setupCalled = false;
   injectedConfig: any;
-  injectedPlugins: any;
+  injectedContext: any;
 
   constructor(config: any) {
     this.injectedConfig = config;
-    this.injectedPlugins = config.plugins;
+    this.injectedContext = config.context;
   }
 
   async setup() {
@@ -130,7 +130,7 @@ class DeferredTestPlugin implements BasePlugin {
     return {
       setupCalled: this.setupCalled,
       injectedConfig: this.injectedConfig,
-      injectedPlugins: this.injectedPlugins,
+      injectedContext: this.injectedContext,
     };
   }
 }
@@ -276,7 +276,7 @@ describe("AppKit", () => {
       expect(setupOrder).toEqual(["core", "normal", "deferred"]);
     });
 
-    test("should provide plugin instances to deferred plugins", async () => {
+    test("should provide PluginContext to deferred plugins", async () => {
       const pluginData = [
         { plugin: CoreTestPlugin, config: {}, name: "coreTest" },
         { plugin: DeferredTestPlugin, config: {}, name: "deferredTest" },
@@ -284,10 +284,9 @@ describe("AppKit", () => {
 
       const instance = (await createApp({ plugins: pluginData })) as any;
 
-      // Deferred plugins receive plugin instances (not SDKs) for internal use
-      expect(instance.deferredTest.injectedPlugins).toBeDefined();
-      expect(instance.deferredTest.injectedPlugins.coreTest).toBeInstanceOf(
-        CoreTestPlugin,
+      expect(instance.deferredTest.injectedContext).toBeDefined();
+      expect(instance.deferredTest.injectedContext.hasPlugin("coreTest")).toBe(
+        true,
       );
     });
 
diff --git a/packages/appkit/src/core/tests/plugin-context.test.ts b/packages/appkit/src/core/tests/plugin-context.test.ts
new file mode 100644
index 00000000..276c5502
--- /dev/null
+++ b/packages/appkit/src/core/tests/plugin-context.test.ts
@@ -0,0 +1,325 @@
+import type { AgentToolDefinition } from "shared";
+import { beforeEach, describe, expect, test, vi } from "vitest";
+import { isToolProvider, PluginContext } from "../plugin-context";
+// Telemetry stub: `startActiveSpan` calls `fn` right away with a fake span.
+vi.mock("../../telemetry", () => ({
+  TelemetryManager: {
+    getProvider: () => ({
+      getTracer: () => ({
+        startActiveSpan: (_name: string, fn: (span: any) => any) => {
+          const span = {
+            setStatus: vi.fn(),
+            recordException: vi.fn(),
+            end: vi.fn(),
+          };
+          return fn(span);
+        },
+      }),
+    }),
+  },
+}));
+// Logger stub: every level is replaced by a `vi.fn()` spy.
+vi.mock("../../logging/logger", () => ({
+  createLogger: () => ({
+    info: vi.fn(),
+    warn: vi.fn(),
+    error: vi.fn(),
+    debug: vi.fn(),
+  }),
+}));
+
+/** Plugin stub built from vi.fn() spies; `asUser()` returns the stub itself. */
+function createMockToolProvider(tools: AgentToolDefinition[] = []) {
+  return {
+    name: "mock-plugin",
+    setup: vi.fn().mockResolvedValue(undefined),
+    injectRoutes: vi.fn(),
+    getEndpoints: vi.fn().mockReturnValue({}),
+    getAgentTools: vi.fn().mockReturnValue(tools),
+    executeAgentTool: vi.fn().mockResolvedValue("tool-result"),
+    asUser: vi.fn().mockReturnThis(),
+  } as any;
+}
+
+describe("PluginContext", () => {
+  let ctx: PluginContext;
+
+  beforeEach(() => {
+    ctx = new PluginContext();
+  });
+
+  describe("route buffering", () => {
+    test("addRoute buffers when no route target exists", () => {
+      const addExtension = vi.fn();
+      ctx.addRoute("post", "/invocations", vi.fn());
+      // Flushed exactly once; a second registration finds the buffer drained.
+      ctx.registerAsRouteTarget({ addExtension });
+      ctx.registerAsRouteTarget({ addExtension });
+      expect(addExtension).toHaveBeenCalledTimes(1);
+    });
+
+    test("registerAsRouteTarget flushes buffered routes via addExtension", () => {
+      const handler = vi.fn();
+      ctx.addRoute("post", "/invocations", handler);
+
+      const addExtension = vi.fn();
+      ctx.registerAsRouteTarget({ addExtension });
+
+      expect(addExtension).toHaveBeenCalledTimes(1);
+      const extensionFn = addExtension.mock.calls[0][0];
+
+      const mockApp = { post: vi.fn() };
+      extensionFn(mockApp);
+      expect(mockApp.post).toHaveBeenCalledWith("/invocations", handler);
+    });
+
+    test("addRoute called after registerAsRouteTarget applies immediately", () => {
+      const addExtension = vi.fn();
+      ctx.registerAsRouteTarget({ addExtension });
+
+      const handler = vi.fn();
+      ctx.addRoute("get", "/health", handler);
+
+      expect(addExtension).toHaveBeenCalledTimes(1);
+      const extensionFn = addExtension.mock.calls[0][0];
+
+      const mockApp = { get: vi.fn() };
+      extensionFn(mockApp);
+      expect(mockApp.get).toHaveBeenCalledWith("/health", handler);
+    });
+
+    test("addRoute supports middleware chains", () => {
+      const auth = vi.fn();
+      const handler = vi.fn();
+
+      const addExtension = vi.fn();
+      ctx.registerAsRouteTarget({ addExtension });
+
+      ctx.addRoute("post", "/api", auth, handler);
+
+      const extensionFn = addExtension.mock.calls[0][0];
+      const mockApp = { post: vi.fn() };
+      extensionFn(mockApp);
+      expect(mockApp.post).toHaveBeenCalledWith("/api", auth, handler);
+    });
+
+    test("addMiddleware buffers and applies via use()", () => {
+      const handler = vi.fn();
+      ctx.addMiddleware("/api", handler);
+
+      const addExtension = vi.fn();
+      ctx.registerAsRouteTarget({ addExtension });
+
+      expect(addExtension).toHaveBeenCalledTimes(1);
+      const extensionFn = addExtension.mock.calls[0][0];
+
+      const mockApp = { use: vi.fn() };
+      extensionFn(mockApp);
+      expect(mockApp.use).toHaveBeenCalledWith("/api", handler);
+    });
+
+    test("multiple buffered routes are all applied on registration", () => {
+      const h1 = vi.fn();
+      const h2 = vi.fn();
+      ctx.addRoute("post", "/a", h1);
+      ctx.addRoute("get", "/b", h2);
+
+      const addExtension = vi.fn();
+      ctx.registerAsRouteTarget({ addExtension });
+
+      expect(addExtension).toHaveBeenCalledTimes(2);
+    });
+  });
+
+  describe("ToolProvider registry", () => {
+    test("registerToolProvider makes provider visible via getToolProviders", () => {
+      const provider = createMockToolProvider([
+        {
+          name: "query",
+          description: "Run query",
+          parameters: { type: "object" },
+        },
+      ]);
+
+      ctx.registerToolProvider("analytics", provider);
+
+      const providers = ctx.getToolProviders();
+      expect(providers).toHaveLength(1);
+      expect(providers[0].name).toBe("analytics");
+      expect(providers[0].provider.getAgentTools()).toHaveLength(1);
+    });
+
+    test("getToolProviders returns all registered providers", () => {
+      ctx.registerToolProvider("analytics", createMockToolProvider());
+      ctx.registerToolProvider("files", createMockToolProvider());
+      ctx.registerToolProvider("genie", createMockToolProvider());
+
+      expect(ctx.getToolProviders()).toHaveLength(3);
+    });
+
+    test("getToolProviders returns current set, not snapshot", () => {
+      const before = ctx.getToolProviders();
+      expect(before).toHaveLength(0);
+
+      ctx.registerToolProvider("analytics", createMockToolProvider());
+
+      const after = ctx.getToolProviders();
+      expect(after).toHaveLength(1);
+    });
+  });
+
+  describe("executeTool", () => {
+    test("calls asUser(req).executeAgentTool on the correct plugin", async () => {
+      const provider = createMockToolProvider();
+      ctx.registerToolProvider("analytics", provider);
+
+      const mockReq = { headers: {} } as any;
+      await ctx.executeTool(mockReq, "analytics", "query", { sql: "SELECT 1" });
+
+      expect(provider.asUser).toHaveBeenCalledWith(mockReq);
+      expect(provider.executeAgentTool).toHaveBeenCalledWith(
+        "query",
+        { sql: "SELECT 1" },
+        expect.any(Object),
+      );
+    });
+
+    test("throws for unknown plugin name", async () => {
+      const mockReq = { headers: {} } as any;
+
+      await expect(
+        ctx.executeTool(mockReq, "nonexistent", "query", {}),
+      ).rejects.toThrow('unknown plugin "nonexistent"');
+    });
+
+    test("propagates tool execution errors", async () => {
+      const provider = createMockToolProvider();
+      (provider.executeAgentTool as any).mockRejectedValue(
+        new Error("Query failed"),
+      );
+      ctx.registerToolProvider("analytics", provider);
+
+      const mockReq = { headers: {} } as any;
+
+      await expect(
+        ctx.executeTool(mockReq, "analytics", "query", {}),
+      ).rejects.toThrow("Query failed");
+    });
+
+    test("passes abort signal to executeAgentTool", async () => {
+      const provider = createMockToolProvider();
+      ctx.registerToolProvider("analytics", provider);
+
+      const controller = new AbortController();
+      const req = { headers: {} } as any;
+      await ctx.executeTool(req, "analytics", "query", {}, controller.signal);
+
+      // The forwarded signal must be linked to the caller's, not merely present
+      // (a timeout signal is always passed, so `toBeDefined` proves nothing).
+      const forwarded = (provider.executeAgentTool as any).mock.calls[0][2];
+      expect(forwarded).toBeInstanceOf(AbortSignal);
+      expect(forwarded.aborted).toBe(false);
+      controller.abort();
+      expect(forwarded.aborted).toBe(true);
+    });
+  });
+
+  describe("lifecycle hooks", () => {
+    test("onLifecycle registers callback, emitLifecycle invokes it", async () => {
+      const fn = vi.fn();
+      ctx.onLifecycle("setup:complete", fn);
+
+      await ctx.emitLifecycle("setup:complete");
+
+      expect(fn).toHaveBeenCalledTimes(1);
+    });
+
+    test("multiple callbacks for the same event all fire", async () => {
+      const fn1 = vi.fn();
+      const fn2 = vi.fn();
+      ctx.onLifecycle("setup:complete", fn1);
+      ctx.onLifecycle("setup:complete", fn2);
+
+      await ctx.emitLifecycle("setup:complete");
+
+      expect(fn1).toHaveBeenCalledTimes(1);
+      expect(fn2).toHaveBeenCalledTimes(1);
+    });
+
+    test("callback error does not prevent other callbacks from running", async () => {
+      const fn1 = vi.fn().mockRejectedValue(new Error("fail"));
+      const fn2 = vi.fn();
+      ctx.onLifecycle("shutdown", fn1);
+      ctx.onLifecycle("shutdown", fn2);
+
+      await ctx.emitLifecycle("shutdown");
+
+      expect(fn1).toHaveBeenCalled();
+      expect(fn2).toHaveBeenCalled();
+    });
+
+    test("emitLifecycle with no registered hooks does nothing", async () => {
+      await expect(ctx.emitLifecycle("server:ready")).resolves.toBeUndefined();
+    });
+  });
+
+  describe("plugin metadata", () => {
+    const stubPlugin = { name: "stub" } as any;
+
+    test("getPluginNames returns all registered names", () => {
+      ctx.registerPlugin("analytics", stubPlugin);
+      ctx.registerPlugin("server", stubPlugin);
+      ctx.registerPlugin("agent", stubPlugin);
+
+      const names = ctx.getPluginNames();
+      expect(names).toContain("analytics");
+      expect(names).toContain("server");
+      expect(names).toContain("agent");
+      expect(names).toHaveLength(3);
+    });
+
+    test("hasPlugin returns true for registered plugins", () => {
+      ctx.registerPlugin("analytics", stubPlugin);
+
+      expect(ctx.hasPlugin("analytics")).toBe(true);
+      expect(ctx.hasPlugin("nonexistent")).toBe(false);
+    });
+
+    test("getPlugins returns all registered instances", () => {
+      const p1 = { name: "analytics" } as any;
+      const p2 = { name: "server" } as any;
+      ctx.registerPlugin("analytics", p1);
+      ctx.registerPlugin("server", p2);
+
+      const plugins = ctx.getPlugins();
+      expect(plugins.size).toBe(2);
+      expect(plugins.get("analytics")).toBe(p1);
+      expect(plugins.get("server")).toBe(p2);
+    });
+  });
+});
+
+describe("isToolProvider", () => {
+  test("returns true for objects with getAgentTools and executeAgentTool", () => {
+    expect(isToolProvider(createMockToolProvider())).toBe(true);
+  });
+
+  test("returns false for null", () => {
+    expect(isToolProvider(null)).toBe(false);
+  });
+
+  test("returns false for objects missing executeAgentTool", () => {
+    const listerOnly = { getAgentTools: vi.fn() };
+    expect(isToolProvider(listerOnly)).toBe(false);
+  });
+
+  test("returns false for objects missing getAgentTools", () => {
+    const executorOnly = { executeAgentTool: vi.fn() };
+    expect(isToolProvider(executorOnly)).toBe(false);
+  });
+
+  test("returns false for non-objects", () => {
+    const verdicts = ["string", 42, undefined].map((v) => isToolProvider(v));
+    expect(verdicts).toEqual([false, false, false]);
+  });
+});
diff --git a/packages/appkit/src/plugin/index.ts b/packages/appkit/src/plugin/index.ts
index 93765219..46a4eb94 100644
--- a/packages/appkit/src/plugin/index.ts
+++ b/packages/appkit/src/plugin/index.ts
@@ -1,4 +1,4 @@
 export type { ToPlugin } from "shared";
 export type { ExecutionResult } from "./execution-result";
 export { Plugin } from "./plugin";
-export { toPlugin } from "./to-plugin";
+export { type NamedPluginFactory, toPlugin } from "./to-plugin";
diff --git a/packages/appkit/src/plugin/plugin.ts b/packages/appkit/src/plugin/plugin.ts
index 5173cb61..4c9a0e64 100644
--- a/packages/appkit/src/plugin/plugin.ts
+++ b/packages/appkit/src/plugin/plugin.ts
@@ -19,6 +19,7 @@ import {
   ServiceContext,
   type UserContext,
 } from "../context";
+import type { PluginContext } from "../core/plugin-context";
 import { AppKitError, AuthenticationError } from "../errors";
 import { createLogger } from "../logging/logger";
 import { StreamManager } from "../stream";
@@ -163,11 +164,12 @@ export abstract class Plugin<
 > implements BasePlugin
 {
   protected isReady = false;
-  protected cache: CacheManager;
+  protected cache!: CacheManager;
   protected app: AppManager;
   protected devFileReader: DevFileReader;
   protected streamManager: StreamManager;
-  protected telemetry: ITelemetry;
+  protected telemetry!: ITelemetry;
+  protected context?: PluginContext;
 
   /** Registered endpoints for this plugin */
   private registeredEndpoints: PluginEndpointMap = {};
@@ -193,12 +195,58 @@ export abstract class Plugin<
       config.name ??
       (this.constructor as { manifest?: { name: string } }).manifest?.name ??
       "plugin";
-    this.telemetry = TelemetryManager.getProvider(this.name, config.telemetry);
     this.streamManager = new StreamManager();
-    this.cache = CacheManager.getInstanceSync();
     this.app = new AppManager();
     this.devFileReader = DevFileReader.getInstance();
+    this.context = (config as Record<string, unknown>).context as
+      | PluginContext
+      | undefined;
+
+    // Eagerly bind telemetry + cache if the core services have already been
+    // initialized (normal createApp path, or tests that mock CacheManager).
+    // If they haven't, we leave these undefined and rely on `attachContext`
+    // being called later — this lets factories eagerly construct plugin
+    // instances at module top-level before `createApp` has run.
+    this.tryAttachContext();
+  }
+
+  private tryAttachContext(): void {
+    let cache: CacheManager;
+    try {
+      cache = CacheManager.getInstanceSync();
+    } catch {
+      return; // core services not ready; attachContext() binds them later
+    }
+    this.cache = cache;
+    const { name, config } = this;
+    this.telemetry = TelemetryManager.getProvider(name, config.telemetry);
+    this.isReady = true;
+  }
 
+  /**
+   * Binds runtime dependencies (telemetry provider, cache, plugin context) to
+   * this plugin. Called by `AppKit._createApp` after construction and before
+   * `setup()`. Idempotent: safe to call if the constructor already bound them
+   * eagerly. Kept separate so factories can eagerly construct plugin instances
+   * without running this before `TelemetryManager.initialize()` /
+   * `CacheManager.getInstance()` have run.
+   */
+  attachContext(
+    deps: {
+      context?: unknown;
+      telemetryConfig?: BasePluginConfig["telemetry"];
+    } = {},
+  ): void {
+    if (!this.cache) {
+      this.cache = CacheManager.getInstanceSync();
+    }
+    this.telemetry = TelemetryManager.getProvider(
+      this.name,
+      deps.telemetryConfig ?? this.config.telemetry,
+    );
+    if (deps.context !== undefined) {
+      this.context = deps.context as PluginContext;
+    }
     this.isReady = true;
   }
 
diff --git a/packages/appkit/src/plugin/to-plugin.ts b/packages/appkit/src/plugin/to-plugin.ts
index 77725027..c882f300 100644
--- a/packages/appkit/src/plugin/to-plugin.ts
+++ b/packages/appkit/src/plugin/to-plugin.ts
@@ -1,19 +1,41 @@
 import type { PluginConstructor, PluginData, ToPlugin } from "shared";
 
 /**
- * Wraps a plugin class so it can be passed to createApp with optional config.
- * Infers config type from the constructor and plugin name from the static `name` property.
+ * Factory function produced by {@link toPlugin}. Carries a static
+ * `pluginName` field so tooling (e.g. `fromPlugin`) can identify which
+ * plugin a factory references without constructing an instance.
+ */
+export type NamedPluginFactory<Name extends string = string> = {
+  readonly pluginName: Name;
+};
+
+/**
+ * Wraps a plugin class so it can be passed to `createApp` with optional
+ * config. Infers the config type from the constructor and the plugin name
+ * from the static `manifest.name` property, and stamps `pluginName` onto
+ * the returned factory function so `fromPlugin` can identify the plugin
+ * without needing to construct it.
  *
  * @internal
  */
 export function toPlugin<T extends PluginConstructor>(
   plugin: T,
-): ToPlugin<T, ConstructorParameters<T>[0], T["manifest"]["name"]> {
+): ToPlugin<T, ConstructorParameters<T>[0], T["manifest"]["name"]> &
+  NamedPluginFactory<T["manifest"]["name"]> {
   type Config = ConstructorParameters<T>[0];
   type Name = T["manifest"]["name"];
-  return (config: Config = {} as Config): PluginData<T, Config, Name> => ({
+  const pluginName = plugin.manifest.name as Name;
+  const factory = (
+    config: Config = {} as Config,
+  ): PluginData<T, Config, Name> => ({
     plugin: plugin as T,
     config: config as Config,
-    name: plugin.manifest.name as Name,
+    name: pluginName,
+  });
+  Object.defineProperty(factory, "pluginName", {
+    value: pluginName,
+    writable: false,
+    enumerable: true,
   });
+  return factory as ToPlugin<T, Config, Name> & NamedPluginFactory<Name>;
 }
diff --git a/packages/appkit/src/plugins/server/index.ts b/packages/appkit/src/plugins/server/index.ts
index e7b9b31a..4c911b10 100644
--- a/packages/appkit/src/plugins/server/index.ts
+++ b/packages/appkit/src/plugins/server/index.ts
@@ -59,17 +59,34 @@ export class ServerPlugin extends Plugin {
     this.serverApplication = express();
     this.server = null;
     this.serverExtensions = [];
+  }
+
+  attachContext(deps: Parameters<Plugin["attachContext"]>[0] = {}): void {
+    super.attachContext(deps);
     this.telemetry.registerInstrumentations([
       instrumentations.http,
       instrumentations.express,
     ]);
+    this.context?.registerAsRouteTarget(this);
   }
 
   /** Setup the server plugin. */
   async setup() {
-    if (this.shouldAutoStart()) {
-      await this.start();
+    if (!this.shouldAutoStart()) return;
+    if (this.context) {
+      // Defer the actual listen+extendRoutes to the `setup:complete` lifecycle
+      // hook. That way every plugin (including other deferred-phase plugins
+      // like `agents`) is already registered in PluginContext by the time
+      // extendRoutes() iterates. Otherwise plugins declared after server()
+      // in the plugin array would be silently dropped from /api/* mounts.
+      this.context.onLifecycle("setup:complete", async () => {
+        await this.start();
+      });
+      return;
     }
+    // No plugin context (e.g. tests constructing ServerPlugin directly) —
+    // start immediately.
+    await this.start();
   }
 
   /** Get the server configuration. */
@@ -179,6 +196,16 @@ export class ServerPlugin extends Plugin {
     return this;
   }
 
+  /**
+   * Register a server extension from another plugin during setup.
+   * Unlike extend(), this does not guard on autoStart — it's designed
+   * for internal plugin-to-plugin coordination where extensions are
+   * registered before the server starts listening.
+   */
+  addExtension(fn: (app: express.Application) => void) {
+    this.serverExtensions.push(fn);
+  }
+
   /**
    * Setup the routes with the plugins.
    *
@@ -193,14 +220,15 @@ export class ServerPlugin extends Plugin {
     const endpoints: PluginEndpoints = {};
     const pluginConfigs: PluginClientConfigs = {};
 
-    if (!this.config.plugins) return { endpoints, pluginConfigs };
+    const plugins = this.context?.getPlugins();
+    if (!plugins || plugins.size === 0) return { endpoints, pluginConfigs };
 
     this.serverApplication.get("/health", (_, res) => {
       res.status(200).json({ status: "ok" });
     });
     this.registerEndpoint("health", "/health");
 
-    for (const plugin of Object.values(this.config.plugins)) {
+    for (const plugin of plugins.values()) {
       if (EXCLUDED_PLUGINS.includes(plugin.name)) continue;
 
       if (plugin?.injectRoutes && typeof plugin.injectRoutes === "function") {
@@ -349,8 +377,9 @@ export class ServerPlugin extends Plugin {
     }
 
     // 1. abort active operations from plugins
-    if (this.config.plugins) {
-      for (const plugin of Object.values(this.config.plugins)) {
+    const shutdownPlugins = this.context?.getPlugins();
+    if (shutdownPlugins) {
+      for (const plugin of shutdownPlugins.values()) {
         if (plugin.abortActiveOperations) {
           try {
             plugin.abortActiveOperations();
diff --git a/packages/appkit/src/plugins/server/tests/server.test.ts b/packages/appkit/src/plugins/server/tests/server.test.ts
index 22f18129..52d15845 100644
--- a/packages/appkit/src/plugins/server/tests/server.test.ts
+++ b/packages/appkit/src/plugins/server/tests/server.test.ts
@@ -1,4 +1,6 @@
+import type { BasePlugin } from "shared";
 import { afterEach, beforeEach, describe, expect, test, vi } from "vitest";
+import { PluginContext } from "../../../core/plugin-context";
 
 // Use vi.hoisted for mocks that need to be available before module loading
 const {
@@ -171,6 +173,14 @@ import { RemoteTunnelController } from "../remote-tunnel/remote-tunnel-controlle
 import { StaticServer } from "../static-server";
 import { ViteDevServer } from "../vite-dev-server";
 
+function createContextWithPlugins(plugins: Record<string, any>): PluginContext {
+  const context = new PluginContext();
+  Object.entries(plugins).forEach(([pluginName, stub]) => {
+    context.registerPlugin(pluginName, stub as BasePlugin);
+  });
+  return context;
+}
+
 describe("ServerPlugin", () => {
   let originalEnv: NodeJS.ProcessEnv;
 
@@ -340,7 +350,7 @@ describe("ServerPlugin", () => {
       process.env.NODE_ENV = "production";
 
       const injectRoutes = vi.fn();
-      const plugins: any = {
+      const testPlugins: any = {
         "test-plugin": {
           name: "test-plugin",
           injectRoutes,
@@ -348,7 +358,10 @@ describe("ServerPlugin", () => {
         },
       };
 
-      const plugin = new ServerPlugin({ autoStart: false, plugins });
+      const plugin = new ServerPlugin({
+        autoStart: false,
+        context: createContextWithPlugins(testPlugins),
+      } as any);
       await plugin.start();
 
       const routerFn = (express as any).Router as ReturnType<typeof vi.fn>;
@@ -386,7 +399,10 @@ describe("ServerPlugin", () => {
         },
       };
 
-      const plugin = new ServerPlugin({ autoStart: false, plugins });
+      const plugin = new ServerPlugin({
+        autoStart: false,
+        context: createContextWithPlugins(plugins),
+      } as any);
       await plugin.start();
 
       expect(plugins["plugin-a"].clientConfig).toHaveBeenCalled();
@@ -413,7 +429,10 @@ describe("ServerPlugin", () => {
         },
       };
 
-      const plugin = new ServerPlugin({ autoStart: false, plugins });
+      const plugin = new ServerPlugin({
+        autoStart: false,
+        context: createContextWithPlugins(plugins),
+      } as any);
       await plugin.start();
 
       expect(plugins["plugin-null"].clientConfig).toHaveBeenCalled();
@@ -444,7 +463,10 @@ describe("ServerPlugin", () => {
         },
       };
 
-      const plugin = new ServerPlugin({ autoStart: false, plugins });
+      const plugin = new ServerPlugin({
+        autoStart: false,
+        context: createContextWithPlugins(plugins),
+      } as any);
       await expect(plugin.start()).resolves.toBeDefined();
       expect(mockLoggerError).toHaveBeenCalledWith(
         "Plugin '%s' clientConfig() failed, skipping its config: %O",
@@ -608,19 +630,19 @@ describe("ServerPlugin", () => {
 
       const plugin = new ServerPlugin({
         autoStart: false,
-        plugins: {
+        context: createContextWithPlugins({
           ok: {
             name: "ok",
             abortActiveOperations: vi.fn(),
-          } as any,
+          },
           bad: {
             name: "bad",
             abortActiveOperations: vi.fn(() => {
               throw new Error("boom");
             }),
-          } as any,
-        },
-      });
+          },
+        }),
+      } as any);
 
       // pretend started
       (plugin as any).server = mockHttpServer;
diff --git a/packages/appkit/src/plugins/server/types.ts b/packages/appkit/src/plugins/server/types.ts
index e187cacc..84a2327e 100644
--- a/packages/appkit/src/plugins/server/types.ts
+++ b/packages/appkit/src/plugins/server/types.ts
@@ -1,9 +1,7 @@
 import type { BasePluginConfig } from "shared";
-import type { Plugin } from "../../plugin";
 
 export interface ServerConfig extends BasePluginConfig {
   port?: number;
-  plugins?: Record<string, Plugin>;
   staticPath?: string;
   autoStart?: boolean;
   host?: string;
diff --git a/packages/shared/src/plugin.ts b/packages/shared/src/plugin.ts
index 9fa8066c..651840c7 100644
--- a/packages/shared/src/plugin.ts
+++ b/packages/shared/src/plugin.ts
@@ -26,6 +26,15 @@ export interface BasePlugin {
   exports?(): unknown;
 
   clientConfig?(): Record<string, unknown>;
+
+  /**
+   * Binds runtime dependencies (telemetry, cache, plugin context) after the
+   * plugin has been constructed. Called by the AppKit core before `setup()`.
+   */
+  attachContext?(deps: {
+    context?: unknown;
+    telemetryConfig?: TelemetryOptions;
+  }): void;
 }
 
 /** Base configuration interface for AppKit plugins */

From cb7fe2be3f0322fc88d89400b758638480a57fab Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Tue, 21 Apr 2026 19:51:21 +0200
Subject: [PATCH 3/6] feat(appkit): agents() plugin, createAgent(def), and
 markdown-driven agents
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The main product layer. Turns an AppKit app into an AI-agent host with
markdown-driven agent discovery, code-defined agents, sub-agents, and
a standalone run-without-HTTP executor.

### `createAgent(def)` — pure factory

`packages/appkit/src/core/create-agent-def.ts`. Returns the passed-in
definition after cycle-detecting the sub-agent graph. No adapter
construction, no side effects — safe at module top-level. The returned
`AgentDefinition` is plain data, consumable by either `agents({ agents
})` or `runAgent(def, input)`.

### `agents()` plugin

`packages/appkit/src/plugins/agents/agents.ts`. `AgentsPlugin` class:

- Loads markdown agents from `config/agents/*.md` (configurable dir)
  via real YAML frontmatter parsing (`js-yaml`). Frontmatter schema:
  `endpoint`, `model`, `toolkits`, `tools`, `default`, `maxSteps`,
  `maxTokens`, `baseSystemPrompt`. Unknown keys logged, invalid YAML
  throws at boot.
- Merges code-defined agents passed via `agents({ agents: { name: def
  } })`. Code wins on key collision.
- For each agent, builds a per-agent tool index from:
  1. Sub-agents (`agents: {...}`) — synthesized as `agent-<key>`
     tools on the parent.
  2. Explicit tool record entries — `ToolkitEntry`s, inline
     `FunctionTool`s, or `HostedTool`s.
  3. Auto-inherit (if nothing explicit) — pulls every registered
     `ToolProvider` plugin's tools. Asymmetric default: markdown
     agents inherit (`file: true`), code-defined agents don't (`code:
     false`).
- Mounts `POST /invocations` (OpenAI Responses compatible) + `POST
  /chat`, `POST /cancel`, `GET /threads/:id`, `DELETE /threads/:id`,
  `GET /info`.
- SSE streaming via `executeStream`. Tool calls dispatch through
  `PluginContext.executeTool(req, pluginName, localName, args, signal)`
  for OBO, telemetry, and timeout.
- Exposes `appkit.agent.{register, list, get, reload, getDefault,
  getThreads}` runtime helpers.

### `runAgent(def, input)` — standalone executor

`packages/appkit/src/core/run-agent.ts`. Runs an `AgentDefinition`
without `createApp` or HTTP. Drives the adapter's event stream to
completion, executing inline tools + sub-agents along the way.
Aggregates events into `{ text, events }`. Useful for tests, CLI
scripts, and offline pipelines. Hosted/MCP tools and plugin toolkits
require the agents plugin and throw clear errors with guidance.

### Event translation and thread storage

- `AgentEventTranslator` — stateful converter from internal
  `AgentEvent`s to OpenAI Responses API `ResponseStreamEvent`s with
  sequence numbers and output indices.
- `InMemoryThreadStore` — per-user conversation persistence. Nested
  `Map<userId, Map<threadId, Thread>>`. Implements `ThreadStore` from
  shared types.
- `buildBaseSystemPrompt` + `composeSystemPrompt` — formats the
  AppKit base prompt (with plugin names and tool names) and layers
  the agent's instructions on top.

### Frontmatter loader

`load-agents.ts` — reads `*.md` files, parses YAML frontmatter with
`js-yaml`, resolves `toolkits: [...]` entries against the plugin
provider index at load time, wraps ambient tools (from `agents({
tools: {...} })`) for `tools: [...]` frontmatter references.

### Plumbing

- Adds `js-yaml` + `@types/js-yaml` deps.
- Manifest mounts routes at `/api/agent/*` (singular — matches
  `appkit.agent.*` runtime handle).
- Exports from the main barrel: `agents`, `createAgent`, `runAgent`,
  `AgentDefinition`, `AgentsPluginConfig`, `AgentTool`, `ToolkitEntry`,
  `ToolkitOptions`, `BaseSystemPromptOption`, `PromptContext`,
  `isToolkitEntry`, `loadAgentFromFile`, `loadAgentsFromDir`.

### Test plan

- 60 new tests: agents plugin lifecycle, markdown loading, code-agent
  registration, auto-inherit asymmetry, sub-agent tool synthesis,
  cycle detection, event translator, thread store, system prompt
  composition, standalone `runAgent`.
- Full appkit vitest suite: 1297 tests passing.
- Typecheck clean across all 8 workspace projects.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 packages/appkit/package.json                  |   2 +
 packages/appkit/src/core/create-agent-def.ts  |  53 +
 packages/appkit/src/core/run-agent.ts         | 226 ++++
 packages/appkit/src/index.ts                  |  15 +-
 packages/appkit/src/plugins/agents/agents.ts  | 991 ++++++++++++++++++
 .../appkit/src/plugins/agents/defaults.ts     |  12 +
 .../src/plugins/agents/event-translator.ts    | 230 ++++
 packages/appkit/src/plugins/agents/index.ts   |  22 +
 .../appkit/src/plugins/agents/load-agents.ts  | 252 +++++
 .../appkit/src/plugins/agents/manifest.json   |  10 +
 packages/appkit/src/plugins/agents/schemas.ts |  19 +
 .../src/plugins/agents/system-prompt.ts       |  40 +
 .../agents/tests/agents-plugin.test.ts        | 289 +++++
 .../plugins/agents/tests/create-agent.test.ts |  75 ++
 .../agents/tests/event-translator.test.ts     | 204 ++++
 .../plugins/agents/tests/load-agents.test.ts  | 150 +++
 .../plugins/agents/tests/run-agent.test.ts    | 120 +++
 .../agents/tests/system-prompt.test.ts        |  45 +
 .../plugins/agents/tests/thread-store.test.ts | 138 +++
 .../appkit/src/plugins/agents/thread-store.ts |  59 ++
 packages/appkit/src/plugins/agents/types.ts   | 112 +-
 pnpm-lock.yaml                                |  11 +
 22 files changed, 3071 insertions(+), 4 deletions(-)
 create mode 100644 packages/appkit/src/core/create-agent-def.ts
 create mode 100644 packages/appkit/src/core/run-agent.ts
 create mode 100644 packages/appkit/src/plugins/agents/agents.ts
 create mode 100644 packages/appkit/src/plugins/agents/defaults.ts
 create mode 100644 packages/appkit/src/plugins/agents/event-translator.ts
 create mode 100644 packages/appkit/src/plugins/agents/index.ts
 create mode 100644 packages/appkit/src/plugins/agents/load-agents.ts
 create mode 100644 packages/appkit/src/plugins/agents/manifest.json
 create mode 100644 packages/appkit/src/plugins/agents/schemas.ts
 create mode 100644 packages/appkit/src/plugins/agents/system-prompt.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/create-agent.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/event-translator.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/load-agents.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/run-agent.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/system-prompt.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/thread-store.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/thread-store.ts

diff --git a/packages/appkit/package.json b/packages/appkit/package.json
index 27a14e66..49d6c516 100644
--- a/packages/appkit/package.json
+++ b/packages/appkit/package.json
@@ -83,6 +83,7 @@
     "@types/semver": "7.7.1",
     "dotenv": "16.6.1",
     "express": "4.22.0",
+    "js-yaml": "^4.1.1",
     "obug": "2.1.1",
     "pg": "8.18.0",
     "picocolors": "1.1.1",
@@ -108,6 +109,7 @@
     "@ai-sdk/openai": "4.0.0-beta.27",
     "@langchain/core": "^1.1.39",
     "@types/express": "4.17.25",
+    "@types/js-yaml": "^4.0.9",
     "@types/json-schema": "7.0.15",
     "@types/pg": "8.16.0",
     "@types/ws": "8.18.1",
diff --git a/packages/appkit/src/core/create-agent-def.ts b/packages/appkit/src/core/create-agent-def.ts
new file mode 100644
index 00000000..3e93371d
--- /dev/null
+++ b/packages/appkit/src/core/create-agent-def.ts
@@ -0,0 +1,53 @@
+import { ConfigurationError } from "../errors";
+import type { AgentDefinition } from "../plugins/agents/types";
+
+/**
+ * Pure factory for agent definitions. Validates that the `agents: { ... }`
+ * sub-agent graph has no cycles, then returns the same object it was given
+ * (no copy, no adapter construction), so it is safe at module top-level.
+ *
+ * Register the result with `agents({ agents: { name: def } })` or run it
+ * standalone via `runAgent(def, input)`.
+ *
+ * @throws ConfigurationError if any definition is reachable from itself.
+ * @example
+ * ```ts
+ * const support = createAgent({
+ *   instructions: "You help customers.",
+ *   model: "databricks-claude-sonnet-4-5",
+ *   tools: {
+ *     get_weather: tool({ ... }),
+ *   },
+ * });
+ * ```
+ */
+export function createAgent(def: AgentDefinition): AgentDefinition {
+  detectCycles(def);
+  return def;
+}
+
+/**
+ * Depth-first walk over the `agents: { ... }` sub-agent graph. Throws a
+ * `ConfigurationError` naming the offending key path when a definition is
+ * reachable from itself.
+ */
+function detectCycles(def: AgentDefinition): void {
+  // false = on the current DFS stack, true = fully explored.
+  const finished = new Map<AgentDefinition, boolean>();
+
+  const visit = (node: AgentDefinition, trail: string[]): void => {
+    const state = finished.get(node);
+    if (state === true) return;
+    if (state === false) {
+      throw new ConfigurationError(
+        `Agent sub-agent cycle detected: ${trail.join(" -> ")}`,
+      );
+    }
+    finished.set(node, false);
+    const children = Object.entries(node.agents ?? {});
+    children.forEach(([key, sub]) => visit(sub, trail.concat(key)));
+    finished.set(node, true);
+  };
+
+  visit(def, [def.name ?? "(root)"]);
+}
diff --git a/packages/appkit/src/core/run-agent.ts b/packages/appkit/src/core/run-agent.ts
new file mode 100644
index 00000000..e83c2c9c
--- /dev/null
+++ b/packages/appkit/src/core/run-agent.ts
@@ -0,0 +1,226 @@
+import { randomUUID } from "node:crypto";
+import type {
+  AgentAdapter,
+  AgentEvent,
+  AgentToolDefinition,
+  Message,
+} from "shared";
+import {
+  type FunctionTool,
+  functionToolToDefinition,
+  isFunctionTool,
+} from "../plugins/agents/tools/function-tool";
+import { isHostedTool } from "../plugins/agents/tools/hosted-tools";
+import type {
+  AgentDefinition,
+  AgentTool,
+  ToolkitEntry,
+} from "../plugins/agents/types";
+import { isToolkitEntry } from "../plugins/agents/types";
+
+export interface RunAgentInput {
+  /** Seed messages for the run. Either a single user string or a full message list. */
+  messages: string | Message[];
+  /** Abort signal for cancellation. */
+  signal?: AbortSignal;
+}
+
+export interface RunAgentResult {
+  /** Concatenated `message_delta` text; a full `message` event replaces it. */
+  text: string;
+  /** Events consumed from the adapter, in order, up to completion or abort. */
+  events: AgentEvent[];
+}
+
+/**
+ * Standalone agent execution without `createApp`. Resolves the adapter, binds
+ * inline tools, and consumes the adapter's `run()` stream until it ends or
+ * `input.signal` is observed aborted.
+ *
+ * Limitations vs. running through the agents() plugin:
+ * - No OBO: there is no HTTP request to derive a user identity from.
+ * - Toolkit (`ToolkitEntry`) and hosted tools are advertised to the adapter
+ *   but cannot run here: invoking one throws from `executeTool` at call
+ *   time, not when `runAgent` starts.
+ * - Sub-agents (`agents: { ... }`) become `agent-<key>` tools executed as
+ *   nested `runAgent` calls sharing only the abort signal (fresh `threadId`).
+ */
+export async function runAgent(
+  def: AgentDefinition,
+  input: RunAgentInput,
+): Promise<RunAgentResult> {
+  const adapter = await resolveAdapter(def);
+  const messages = normalizeMessages(input.messages, def.instructions);
+  const toolIndex = buildStandaloneToolIndex(def);
+  const tools = Array.from(toolIndex.values()).map((e) => e.def);
+
+  const signal = input.signal;
+  // Only function tools and sub-agents are executable; other kinds throw.
+  const executeTool = async (name: string, args: unknown): Promise<unknown> => {
+    const entry = toolIndex.get(name);
+    if (!entry) throw new Error(`Unknown tool: ${name}`);
+    if (entry.kind === "function") {
+      return entry.tool.execute(args as Record<string, unknown>);
+    }
+    if (entry.kind === "subagent") {
+      const subInput: RunAgentInput = {
+        messages:
+          typeof args === "object" &&
+          args !== null &&
+          typeof (args as { input?: unknown }).input === "string"
+            ? (args as { input: string }).input
+            : JSON.stringify(args),
+        signal,
+      };
+      const res = await runAgent(entry.agentDef, subInput);
+      return res.text;
+    }
+    throw new Error(
+      `runAgent: tool "${name}" is a ${entry.kind} tool. ` +
+        "Plugin toolkits and MCP tools are only usable via createApp({ plugins: [..., agents(...)] }).",
+    );
+  };
+
+  const events: AgentEvent[] = [];
+  let text = "";
+
+  const stream = adapter.run(
+    {
+      messages,
+      tools,
+      threadId: randomUUID(),
+      signal,
+    },
+    { executeTool, signal },
+  );
+  // `message_delta` appends; a full `message` replaces the accumulated text.
+  for await (const event of stream) {
+    if (signal?.aborted) break;
+    events.push(event);
+    if (event.type === "message_delta") {
+      text += event.content;
+    } else if (event.type === "message") {
+      text = event.content;
+    }
+  }
+
+  return { text, events };
+}
+
+async function resolveAdapter(def: AgentDefinition): Promise<AgentAdapter> {
+  const requested = def.model;
+  // Anything truthy that is not a string is awaited and used as the adapter.
+  if (requested && typeof requested !== "string") {
+    return await requested;
+  }
+  // Falsy model -> no-argument call; non-empty string -> passed through.
+  const { DatabricksAdapter } = await import("../agents/databricks");
+  return requested
+    ? DatabricksAdapter.fromModelServing(requested)
+    : DatabricksAdapter.fromModelServing();
+}
+
+/**
+ * Prepends a system message carrying `instructions` to the caller's input;
+ * a bare string input is wrapped as a single user message.
+ */
+function normalizeMessages(
+  input: string | Message[],
+  instructions: string,
+): Message[] {
+  const head: Message = {
+    id: "system",
+    role: "system",
+    content: instructions,
+    createdAt: new Date(),
+  };
+  if (typeof input !== "string") return [head, ...input];
+  const userTurn: Message = {
+    id: randomUUID(),
+    role: "user",
+    content: input,
+    createdAt: new Date(),
+  };
+  return [head, userTurn];
+}
+
+type StandaloneEntry =
+  | {
+      kind: "function";
+      def: AgentToolDefinition;
+      tool: FunctionTool;
+    }
+  | {
+      kind: "subagent";
+      def: AgentToolDefinition;
+      agentDef: AgentDefinition;
+    }
+  | {
+      kind: "toolkit";
+      def: AgentToolDefinition;
+      entry: ToolkitEntry;
+    }
+  | {
+      kind: "hosted";
+      def: AgentToolDefinition;
+    };
+
+function buildStandaloneToolIndex(
+  def: AgentDefinition,
+): Map<string, StandaloneEntry> {
+  const index = new Map<string, StandaloneEntry>();
+  // Explicit tools are indexed under their record key.
+  for (const [key, tool] of Object.entries(def.tools ?? {})) {
+    index.set(key, classifyTool(key, tool));
+  }
+  // Sub-agents register last as `agent-<key>` and win on a name collision.
+  for (const [childKey, child] of Object.entries(def.agents ?? {})) {
+    const toolName = `agent-${childKey}`;
+    index.set(toolName, {
+      kind: "subagent",
+      agentDef: { ...child, name: child.name ?? childKey },
+      def: {
+        name: toolName,
+        description:
+          child.instructions.slice(0, 120) ||
+          `Delegate to the ${childKey} sub-agent`,
+        parameters: {
+          type: "object",
+          properties: {
+            input: {
+              type: "string",
+              description: "Message to send to the sub-agent.",
+            },
+          },
+          required: ["input"],
+        },
+      },
+    });
+  }
+
+  return index;
+}
+
+function classifyTool(key: string, tool: AgentTool): StandaloneEntry {
+  // Guards are checked in this fixed order; the first match wins.
+  if (isToolkitEntry(tool)) {
+    const def = { ...tool.def, name: key };
+    return { kind: "toolkit", def, entry: tool };
+  }
+  if (isFunctionTool(tool)) {
+    const def = { ...functionToolToDefinition(tool), name: key };
+    return { kind: "function", tool, def };
+  }
+  if (!isHostedTool(tool)) {
+    throw new Error(`runAgent: unrecognized tool shape at key "${key}"`);
+  }
+  // Hosted tools get a placeholder definition with an empty parameter schema.
+  return {
+    kind: "hosted",
+    def: {
+      name: key,
+      description: `Hosted tool: ${tool.type}`,
+      parameters: { type: "object", properties: {} },
+    },
+  };
+}
diff --git a/packages/appkit/src/index.ts b/packages/appkit/src/index.ts
index 8d236780..dbefe3e5 100644
--- a/packages/appkit/src/index.ts
+++ b/packages/appkit/src/index.ts
@@ -43,6 +43,12 @@ export {
 } from "./connectors/lakebase";
 export { getExecutionContext } from "./context";
 export { createApp } from "./core";
+export { createAgent } from "./core/create-agent-def";
+export {
+  type RunAgentInput,
+  type RunAgentResult,
+  runAgent,
+} from "./core/run-agent";
 // Errors
 export {
   AppKitError,
@@ -64,11 +70,18 @@ export {
 } from "./plugin";
 export { analytics, files, genie, lakebase, server, serving } from "./plugins";
 export {
+  type AgentDefinition,
+  type AgentsPluginConfig,
   type AgentTool,
+  agents,
+  type BaseSystemPromptOption,
   isToolkitEntry,
+  loadAgentFromFile,
+  loadAgentsFromDir,
+  type PromptContext,
   type ToolkitEntry,
   type ToolkitOptions,
-} from "./plugins/agents/types";
+} from "./plugins/agents";
 export {
   type FunctionTool,
   type HostedTool,
diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
new file mode 100644
index 00000000..03b9257c
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -0,0 +1,991 @@
+import { randomUUID } from "node:crypto";
+import path from "node:path";
+import type express from "express";
+import pc from "picocolors";
+import type {
+  AgentAdapter,
+  AgentEvent,
+  AgentRunContext,
+  AgentToolDefinition,
+  IAppRouter,
+  Message,
+  PluginPhase,
+  ResponseStreamEvent,
+  Thread,
+  ToolProvider,
+} from "shared";
+import { createLogger } from "../../logging/logger";
+import { Plugin, toPlugin } from "../../plugin";
+import type { PluginManifest } from "../../registry";
+import { agentStreamDefaults } from "./defaults";
+import { AgentEventTranslator } from "./event-translator";
+import { loadAgentsFromDir } from "./load-agents";
+import manifest from "./manifest.json";
+import { chatRequestSchema, invocationsRequestSchema } from "./schemas";
+import { buildBaseSystemPrompt, composeSystemPrompt } from "./system-prompt";
+import { InMemoryThreadStore } from "./thread-store";
+import {
+  AppKitMcpClient,
+  type FunctionTool,
+  functionToolToDefinition,
+  isFunctionTool,
+  isHostedTool,
+  resolveHostedTools,
+} from "./tools";
+import type {
+  AgentDefinition,
+  AgentsPluginConfig,
+  BaseSystemPromptOption,
+  PromptContext,
+  RegisteredAgent,
+  ResolvedToolEntry,
+} from "./types";
+import { isToolkitEntry } from "./types";
+
+const logger = createLogger("agents");
+
+const DEFAULT_AGENTS_DIR = "./config/agents";
+
+/**
+ * Records where an agent definition came from while the registry is built:
+ * `"file"` for definitions loaded from the agents directory, `"code"` for
+ * definitions supplied through plugin config or registered at runtime.
+ *
+ * The value is tracked alongside the AgentDefinition (it is not stored on it)
+ * and selects which side of the asymmetric `autoInheritTools` default applies.
+ */
+interface AgentSource {
+  origin: "file" | "code";
+}
+
+export class AgentsPlugin extends Plugin implements ToolProvider {
+  static manifest = manifest as PluginManifest;
+  static phase: PluginPhase = "deferred";
+
+  protected declare config: AgentsPluginConfig;
+
+  private agents = new Map<string, RegisteredAgent>();
+  private defaultAgentName: string | null = null;
+  private activeStreams = new Map<string, AbortController>();
+  private mcpClient: AppKitMcpClient | null = null;
+  private threadStore;
+
+  /**
+   * Stores the plugin config and selects the thread store: the one supplied
+   * via `config.threadStore`, or a new `InMemoryThreadStore` when none is set.
+   */
+  constructor(config: AgentsPluginConfig) {
+    super(config);
+    this.config = config;
+    this.threadStore = config.threadStore ?? new InMemoryThreadStore();
+  }
+
+  /**
+   * Plugin setup hook: loads all agents, mounts the `/invocations` route and
+   * prints the resulting registry to the console. Agent loading errors
+   * propagate to the caller.
+   */
+  async setup() {
+    await this.loadAgents();
+    this.mountInvocationsRoute();
+    this.printRegistry();
+  }
+
+  /**
+   * Rebuilds the agent registry from the configured directory and
+   * `config.agents`.
+   *
+   * The new registry is built into fresh state while the previous registry,
+   * default agent and MCP client are kept aside. If loading fails, the
+   * previous state is restored and the error is rethrown, so a broken agent
+   * definition cannot leave the plugin with an empty or half-populated
+   * registry. The previous MCP client is closed only after the new registry
+   * loaded successfully.
+   *
+   * Agents added at runtime through `exports().register` are not part of
+   * `config.agents` and are therefore not carried over by a reload.
+   *
+   * @throws Whatever `loadAgents` throws; the previous registry stays active.
+   */
+  async reload(): Promise<void> {
+    const previous = {
+      agents: this.agents,
+      defaultAgentName: this.defaultAgentName,
+      mcpClient: this.mcpClient,
+    };
+
+    // loadAgents() writes into this.agents / this.mcpClient, so point them at
+    // fresh state while it runs instead of destroying the live registry.
+    this.agents = new Map<string, RegisteredAgent>();
+    this.defaultAgentName = null;
+    this.mcpClient = null;
+
+    try {
+      await this.loadAgents();
+    } catch (err) {
+      // The assertion undoes the compiler's narrowing to `null` from the
+      // assignment above; loadAgents() may have created a client by now.
+      const partialClient = this.mcpClient as AppKitMcpClient | null;
+      this.agents = previous.agents;
+      this.defaultAgentName = previous.defaultAgentName;
+      this.mcpClient = previous.mcpClient;
+      if (partialClient) {
+        try {
+          await partialClient.close();
+        } catch (closeErr) {
+          logger.warn(
+            "Failed to close MCP client after aborted reload: %O",
+            closeErr,
+          );
+        }
+      }
+      throw err;
+    }
+
+    if (previous.mcpClient) {
+      await previous.mcpClient.close();
+    }
+  }
+
+  /**
+   * Populates the registry from markdown files and `config.agents`.
+   *
+   * File definitions are merged first and code definitions second, so a code
+   * definition replaces a file definition of the same name (a warning is
+   * logged for each such clash). The first successfully registered agent
+   * becomes the default unless `config.defaultAgent` or the file-declared
+   * default overrides it.
+   *
+   * @throws If any agent fails to build, or `config.defaultAgent` names an
+   *   agent that is not registered.
+   */
+  private async loadAgents() {
+    const fromFiles = await this.loadFileDefinitions();
+    const fileDefs = fromFiles.defs;
+    const fileDefault = fromFiles.defaultAgent;
+    const codeDefs = this.config.agents ?? {};
+
+    for (const name of Object.keys(fileDefs)) {
+      if (!codeDefs[name]) continue;
+      logger.warn(
+        "Agent '%s' defined in both code and a markdown file. Code definition takes precedence.",
+        name,
+      );
+    }
+
+    // Files go in first so that code definitions overwrite them by name.
+    const merged: Record<string, { def: AgentDefinition; src: AgentSource }> =
+      {};
+    for (const [name, def] of Object.entries(fileDefs)) {
+      merged[name] = { def, src: { origin: "file" } };
+    }
+    for (const [name, def] of Object.entries(codeDefs)) {
+      merged[name] = { def, src: { origin: "code" } };
+    }
+
+    const pending = Object.entries(merged);
+    if (pending.length === 0) {
+      logger.info(
+        "No agents registered (no files in %s, no code-defined agents)",
+        this.resolvedAgentsDir() ?? "<disabled>",
+      );
+      return;
+    }
+
+    for (const [name, { def, src }] of pending) {
+      let registered: RegisteredAgent;
+      try {
+        registered = await this.buildRegisteredAgent(name, def, src);
+      } catch (err) {
+        const reason = err instanceof Error ? err.message : String(err);
+        throw new Error(
+          `Failed to register agent '${name}' (${src.origin}): ${reason}`,
+          { cause: err instanceof Error ? err : undefined },
+        );
+      }
+      this.agents.set(name, registered);
+      if (!this.defaultAgentName) this.defaultAgentName = name;
+    }
+
+    const configuredDefault = this.config.defaultAgent;
+    if (configuredDefault) {
+      if (!this.agents.has(configuredDefault)) {
+        const available = Array.from(this.agents.keys()).join(", ");
+        throw new Error(
+          `defaultAgent '${configuredDefault}' is not registered. Available: ${available}`,
+        );
+      }
+      this.defaultAgentName = configuredDefault;
+      return;
+    }
+
+    if (fileDefault && this.agents.has(fileDefault)) {
+      this.defaultAgentName = fileDefault;
+    }
+  }
+
+  /**
+   * Absolute path of the agents directory, or `null` when file loading is
+   * disabled with `dir: false`. Relative paths are resolved against the
+   * current working directory; the default is `./config/agents`.
+   */
+  private resolvedAgentsDir(): string | null {
+    const configured = this.config.dir;
+    if (configured === false) return null;
+
+    const dir = configured ?? DEFAULT_AGENTS_DIR;
+    if (path.isAbsolute(dir)) return dir;
+    return path.resolve(process.cwd(), dir);
+  }
+
+  /**
+   * Loads agent definitions from the agents directory.
+   *
+   * @returns The definitions keyed by agent name plus the default agent
+   *   reported by the loader; an empty result when file loading is disabled.
+   */
+  private async loadFileDefinitions(): Promise<{
+    defs: Record<string, AgentDefinition>;
+    defaultAgent: string | null;
+  }> {
+    const dir = this.resolvedAgentsDir();
+    if (!dir) {
+      return { defs: {}, defaultAgent: null };
+    }
+
+    return await loadAgentsFromDir(dir, {
+      defaultModel: this.config.defaultModel,
+      availableTools: this.config.tools ?? {},
+      plugins: this.pluginProviderIndex(),
+    });
+  }
+
+  /**
+   * Collects, per plugin name, the `toolkit()` factory of every registered
+   * tool provider that has one. The markdown loader receives this map as its
+   * `plugins` option. Returns an empty map when no plugin context is attached.
+   */
+  private pluginProviderIndex(): Map<
+    string,
+    { toolkit: (opts?: unknown) => Record<string, unknown> }
+  > {
+    const byPlugin = new Map();
+    if (!this.context) return byPlugin;
+
+    for (const registration of this.context.getToolProviders()) {
+      const candidate = registration.provider as ToolProvider & {
+        toolkit?: (opts?: unknown) => Record<string, unknown>;
+      };
+      if (typeof candidate.toolkit !== "function") continue;
+
+      // Bind so the factory keeps its provider as `this` when called later.
+      byPlugin.set(registration.name, {
+        toolkit: candidate.toolkit.bind(candidate),
+      });
+    }
+    return byPlugin;
+  }
+
+  /**
+   * Resolves the adapter and the tool index for one definition and bundles
+   * them with the definition's prompt and limit settings.
+   *
+   * The adapter is resolved before the tool index is built; the two steps run
+   * sequentially.
+   */
+  private async buildRegisteredAgent(
+    name: string,
+    def: AgentDefinition,
+    src: AgentSource,
+  ): Promise<RegisteredAgent> {
+    const { instructions, baseSystemPrompt, maxSteps, maxTokens } = def;
+
+    const adapter = await this.resolveAdapter(def, name);
+    const toolIndex = await this.buildToolIndex(name, def, src);
+
+    return {
+      name,
+      instructions,
+      adapter,
+      toolIndex,
+      baseSystemPrompt,
+      maxSteps,
+      maxTokens,
+    };
+  }
+
+  /**
+   * Resolves the adapter for an agent from `def.model`, falling back to
+   * `config.defaultModel`.
+   *
+   * - adapter (or promise of one): awaited and returned as is;
+   * - non-empty string: passed to `DatabricksAdapter.fromModelServing`;
+   * - nothing configured: `DatabricksAdapter.fromModelServing()` without
+   *   arguments, with failures rewrapped in an agent-specific error.
+   *
+   * @throws If no model is configured and the argument-less default fails.
+   */
+  private async resolveAdapter(
+    def: AgentDefinition,
+    name: string,
+  ): Promise<AgentAdapter> {
+    const source = def.model ?? this.config.defaultModel;
+
+    if (source && typeof source !== "string") {
+      return await source;
+    }
+
+    // Loaded lazily so the Databricks adapter is only imported when needed.
+    const { DatabricksAdapter } = await import("../../agents/databricks");
+
+    if (source) {
+      return DatabricksAdapter.fromModelServing(source);
+    }
+
+    try {
+      return await DatabricksAdapter.fromModelServing();
+    } catch (err) {
+      throw new Error(
+        `Agent '${name}' has no model configured and no DATABRICKS_AGENT_ENDPOINT default available`,
+        { cause: err instanceof Error ? err : undefined },
+      );
+    }
+  }
+
+  /**
+   * Builds the per-agent dispatch index that maps tool names to how each tool
+   * is executed.
+   *
+   * Entries are added in this order, later entries replacing earlier ones of
+   * the same name:
+   * 1. auto-inherited plugin tools, only when the definition declares neither
+   *    tools nor sub-agents and `autoInheritTools` allows it for this origin;
+   * 2. sub-agents, exposed as `agent-<key>` tools taking a string `input`;
+   * 3. explicitly declared toolkit entries and function tools;
+   * 4. tools of declared hosted tools, connected through the MCP client.
+   *
+   * @throws If a declared tool matches none of the known tool shapes.
+   */
+  private async buildToolIndex(
+    agentName: string,
+    def: AgentDefinition,
+    src: AgentSource,
+  ): Promise<Map<string, ResolvedToolEntry>> {
+    const index = new Map<string, ResolvedToolEntry>();
+    const declaredTools = Object.entries(def.tools ?? {});
+    const declaredSubAgents = Object.entries(def.agents ?? {});
+
+    if (declaredTools.length === 0 && declaredSubAgents.length === 0) {
+      const policy = normalizeAutoInherit(this.config.autoInheritTools);
+      const inherit = src.origin === "file" ? policy.file : policy.code;
+      if (inherit) {
+        await this.applyAutoInherit(agentName, index);
+      }
+    }
+
+    // Sub-agents become `agent-<key>` tools.
+    for (const [childKey, childDef] of declaredSubAgents) {
+      const toolName = `agent-${childKey}`;
+      // The first 120 characters of the child's instructions double as the
+      // tool description; an empty string falls back to a generic sentence.
+      const summary = childDef.instructions.slice(0, 120);
+      index.set(toolName, {
+        source: "subagent",
+        agentName: childDef.name ?? childKey,
+        def: {
+          name: toolName,
+          description: summary || `Delegate to the ${childKey} sub-agent`,
+          parameters: {
+            type: "object",
+            properties: {
+              input: {
+                type: "string",
+                description: "Message to send to the sub-agent.",
+              },
+            },
+            required: ["input"],
+          },
+        },
+      });
+    }
+
+    // Explicit tools; hosted tools are gathered and connected in one batch.
+    const hosted: import("./tools/hosted-tools").HostedTool[] = [];
+    for (const [key, tool] of declaredTools) {
+      if (isToolkitEntry(tool)) {
+        index.set(key, {
+          source: "toolkit",
+          pluginName: tool.pluginName,
+          localName: tool.localName,
+          def: { ...tool.def, name: key },
+        });
+      } else if (isFunctionTool(tool)) {
+        index.set(key, {
+          source: "function",
+          functionTool: tool,
+          def: { ...functionToolToDefinition(tool), name: key },
+        });
+      } else if (isHostedTool(tool)) {
+        hosted.push(tool);
+      } else {
+        throw new Error(
+          `Agent '${agentName}' tool '${key}' has an unrecognized shape`,
+        );
+      }
+    }
+
+    if (hosted.length > 0) {
+      await this.connectHostedTools(hosted, index);
+    }
+
+    return index;
+  }
+
+  /**
+   * Adds the tools of every other registered tool provider to `index`.
+   *
+   * Providers with a `toolkit()` method contribute its toolkit entries under
+   * the keys the toolkit returns. Providers without one contribute their
+   * `getAgentTools()` definitions under `<plugin>.<tool>` names. The agents
+   * plugin itself is skipped. Does nothing without a plugin context.
+   *
+   * @param agentName - Used only for the summary log line.
+   * @param index - Tool index to fill in place.
+   */
+  private async applyAutoInherit(
+    agentName: string,
+    index: Map<string, ResolvedToolEntry>,
+  ): Promise<void> {
+    if (!this.context) return;
+
+    for (const registration of this.context.getToolProviders()) {
+      const pluginName = registration.name;
+      if (pluginName === this.name) continue;
+
+      const provider = registration.provider;
+      const candidate = provider as ToolProvider & {
+        toolkit?: (opts?: unknown) => Record<string, unknown>;
+      };
+
+      if (typeof candidate.toolkit !== "function") {
+        // Fallback: providers without a toolkit() still expose getAgentTools();
+        // dispatch goes through PluginContext.executeTool by plugin name.
+        for (const tool of provider.getAgentTools()) {
+          const qualifiedName = `${pluginName}.${tool.name}`;
+          index.set(qualifiedName, {
+            source: "toolkit",
+            pluginName,
+            localName: tool.name,
+            def: { ...tool, name: qualifiedName },
+          });
+        }
+        continue;
+      }
+
+      const toolkit = candidate.toolkit() as Record<string, unknown>;
+      for (const [key, maybeEntry] of Object.entries(toolkit)) {
+        if (!isToolkitEntry(maybeEntry)) continue;
+        index.set(key, {
+          source: "toolkit",
+          pluginName: maybeEntry.pluginName,
+          localName: maybeEntry.localName,
+          def: { ...maybeEntry.def, name: key },
+        });
+      }
+    }
+
+    const inheritedCount = index.size;
+    if (inheritedCount > 0) {
+      logger.info(
+        "[agent %s] auto-inherited %d tools",
+        agentName,
+        inheritedCount,
+      );
+    }
+  }
+
+  /**
+   * Connects the given hosted tools through the shared MCP client and adds the
+   * client's tool definitions to `index` with source `"mcp"`.
+   *
+   * Host and auth headers come from the workspace client when it can be
+   * resolved; otherwise from the `DATABRICKS_HOST` / `DATABRICKS_TOKEN`
+   * environment variables. Without a host the hosted tools are skipped with a
+   * warning instead of failing the agent.
+   *
+   * NOTE(review): the MCP client is shared across agents and the loop below
+   * indexes `getAllToolDefinitions()`. If that returns every tool the client
+   * has connected so far, an agent also receives hosted tools declared by
+   * agents built before it — confirm against AppKitMcpClient.
+   *
+   * @param hostedTools - Hosted tool configs declared by one agent.
+   * @param index - Tool index to fill in place.
+   */
+  private async connectHostedTools(
+    hostedTools: import("./tools/hosted-tools").HostedTool[],
+    index: Map<string, ResolvedToolEntry>,
+  ): Promise<void> {
+    let host: string | undefined;
+    let authenticate: () => Promise<Record<string, string>>;
+
+    try {
+      const { getWorkspaceClient } = await import("../../context");
+      const wsClient = getWorkspaceClient();
+      await wsClient.config.ensureResolved();
+      host = wsClient.config.host;
+      authenticate = async () => {
+        const headers = new Headers();
+        await wsClient.config.authenticate(headers);
+        return Object.fromEntries(headers.entries());
+      };
+    } catch {
+      // Deliberate best-effort: any failure above (including a failing
+      // ensureResolved) is discarded and the environment is used instead.
+      host = process.env.DATABRICKS_HOST;
+      authenticate = async (): Promise<Record<string, string>> => {
+        const token = process.env.DATABRICKS_TOKEN;
+        return token ? { Authorization: `Bearer ${token}` } : {};
+      };
+    }
+
+    if (!host) {
+      logger.warn(
+        "No Databricks host available — skipping %d hosted tool(s)",
+        hostedTools.length,
+      );
+      return;
+    }
+
+    // The client is created once and reused by every agent until reload() or
+    // shutdown() closes it.
+    if (!this.mcpClient) {
+      this.mcpClient = new AppKitMcpClient(host, authenticate);
+    }
+
+    const endpoints = resolveHostedTools(hostedTools);
+    await this.mcpClient.connectAll(endpoints);
+
+    for (const def of this.mcpClient.getAllToolDefinitions()) {
+      index.set(def.name, {
+        source: "mcp",
+        mcpToolName: def.name,
+        def,
+      });
+    }
+  }
+
+  // ----------------- ToolProvider (no tools of our own) --------------------
+
+  /**
+   * ToolProvider contract: the agents plugin contributes no tools of its own,
+   * so the list is always empty.
+   */
+  getAgentTools(): AgentToolDefinition[] {
+    return [];
+  }
+
+  /**
+   * ToolProvider contract: always rejects, because this plugin exposes no
+   * tools (see the empty list returned by `getAgentTools`).
+   *
+   * @throws Always.
+   */
+  async executeAgentTool(): Promise<unknown> {
+    throw new Error("AgentsPlugin does not expose executeAgentTool directly");
+  }
+
+  // ----------------- Route mounting and handlers ---------------------------
+
+  /**
+   * Mounts `POST /invocations` on the plugin context and routes it to
+   * `_handleInvocations`. Does nothing when no context is attached.
+   *
+   * The handler's promise is caught explicitly: the route callback is
+   * synchronous, so a rejection (for example from the thread store) would
+   * otherwise surface as an unhandled rejection and leave the request hanging.
+   */
+  private mountInvocationsRoute() {
+    if (!this.context) return;
+    this.context.addRoute(
+      "post",
+      "/invocations",
+      (req: express.Request, res: express.Response) => {
+        this._handleInvocations(req, res).catch((err: unknown) => {
+          logger.error("Unhandled /invocations error: %O", err);
+          if (!res.headersSent) {
+            res.status(500).json({ error: "Internal server error" });
+          } else if (!res.writableEnded) {
+            // Streaming already started; the only option left is to close it.
+            res.end();
+          }
+        });
+      },
+    );
+  }
+
+  /**
+   * Registers the plugin's HTTP routes on `router`:
+   *
+   * - `POST /chat` — send a message to an agent and stream the reply;
+   * - `POST /cancel` — abort an active stream by id;
+   * - `GET /threads` — list the caller's threads;
+   * - `GET /threads/:threadId` — fetch one thread;
+   * - `DELETE /threads/:threadId` — delete one thread;
+   * - `GET /info` — registered agent names and the default agent.
+   */
+  injectRoutes(router: IAppRouter) {
+    this.route(router, {
+      name: "chat",
+      method: "post",
+      path: "/chat",
+      handler: async (req, res) => this._handleChat(req, res),
+    });
+    this.route(router, {
+      name: "cancel",
+      method: "post",
+      path: "/cancel",
+      handler: async (req, res) => this._handleCancel(req, res),
+    });
+    this.route(router, {
+      name: "threads",
+      method: "get",
+      path: "/threads",
+      handler: async (req, res) => this._handleListThreads(req, res),
+    });
+    this.route(router, {
+      name: "thread",
+      method: "get",
+      path: "/threads/:threadId",
+      handler: async (req, res) => this._handleGetThread(req, res),
+    });
+    this.route(router, {
+      name: "deleteThread",
+      method: "delete",
+      path: "/threads/:threadId",
+      handler: async (req, res) => this._handleDeleteThread(req, res),
+    });
+    // Same payload as clientConfig(), read at request time.
+    this.route(router, {
+      name: "info",
+      method: "get",
+      path: "/info",
+      handler: async (_req, res) => {
+        res.json({
+          agents: Array.from(this.agents.keys()),
+          defaultAgent: this.defaultAgentName,
+        });
+      },
+    });
+  }
+
+  /**
+   * Client-facing configuration: the registered agent names and the name of
+   * the current default agent (or `null`).
+   */
+  clientConfig(): Record<string, unknown> {
+    const agentNames = [...this.agents.keys()];
+    return { agents: agentNames, defaultAgent: this.defaultAgentName };
+  }
+
+  /**
+   * `POST /chat`: validates the body, resolves the agent and thread, stores
+   * the user message and streams the agent's reply.
+   *
+   * Responds 400 for an invalid body or an unknown / missing agent and 404
+   * when `threadId` is given but no such thread exists for the user. Without
+   * a `threadId` a new thread is created.
+   */
+  private async _handleChat(req: express.Request, res: express.Response) {
+    const parsed = chatRequestSchema.safeParse(req.body);
+    if (!parsed.success) {
+      const details = parsed.error.flatten().fieldErrors;
+      res.status(400).json({ error: "Invalid request", details });
+      return;
+    }
+    const { message, threadId, agent: agentName } = parsed.data;
+
+    const registered = this.resolveAgent(agentName);
+    if (!registered) {
+      const error = agentName
+        ? `Agent "${agentName}" not found`
+        : "No agent registered";
+      res.status(400).json({ error });
+      return;
+    }
+
+    const userId = this.resolveUserId(req);
+    const existing = threadId
+      ? await this.threadStore.get(threadId, userId)
+      : null;
+    if (threadId && !existing) {
+      res.status(404).json({ error: `Thread ${threadId} not found` });
+      return;
+    }
+    const thread = existing ?? (await this.threadStore.create(userId));
+
+    const userMessage: Message = {
+      id: randomUUID(),
+      role: "user",
+      content: message,
+      createdAt: new Date(),
+    };
+    await this.threadStore.addMessage(thread.id, userId, userMessage);
+
+    return this._streamAgent(req, res, registered, thread, userId);
+  }
+
+  /**
+   * `POST /invocations`: runs the default agent on a fresh thread.
+   *
+   * `input` is either a single string (stored as one user message) or a list
+   * of items, each stored as one message. An item's role defaults to `"user"`;
+   * string content is stored verbatim and any other content is JSON-encoded.
+   * Items whose content is missing, `null` or an empty string are skipped.
+   *
+   * Responds 400 for an invalid body or when no agent is registered.
+   */
+  private async _handleInvocations(
+    req: express.Request,
+    res: express.Response,
+  ) {
+    const parsed = invocationsRequestSchema.safeParse(req.body);
+    if (!parsed.success) {
+      res.status(400).json({
+        error: "Invalid request",
+        details: parsed.error.flatten().fieldErrors,
+      });
+      return;
+    }
+    const { input } = parsed.data;
+    const registered = this.resolveAgent();
+    if (!registered) {
+      res.status(400).json({ error: "No agent registered" });
+      return;
+    }
+    const userId = this.resolveUserId(req);
+    const thread = await this.threadStore.create(userId);
+
+    if (typeof input === "string") {
+      await this.threadStore.addMessage(thread.id, userId, {
+        id: randomUUID(),
+        role: "user",
+        content: input,
+        createdAt: new Date(),
+      });
+    } else {
+      for (const item of input) {
+        // Absent content has nothing to persist. It must be filtered before
+        // encoding: JSON.stringify("") yields the two-character string `""`,
+        // which is truthy and would be stored as a bogus message.
+        if (item.content === undefined || item.content === null) continue;
+
+        const role = (item.role ?? "user") as Message["role"];
+        const content =
+          typeof item.content === "string"
+            ? item.content
+            : JSON.stringify(item.content);
+        if (!content) continue;
+        await this.threadStore.addMessage(thread.id, userId, {
+          id: randomUUID(),
+          role,
+          content,
+          createdAt: new Date(),
+        });
+      }
+    }
+
+    return this._streamAgent(req, res, registered, thread, userId);
+  }
+
+  /**
+   * Runs `registered` against `thread` and streams the translated events to
+   * `res` via `executeStream`.
+   *
+   * A fresh AbortController is registered in `activeStreams` under a random
+   * request id (also used as the stream id) so the cancel route can abort the
+   * run. The system prompt is composed per request and prepended to the
+   * thread's messages. Accumulated `message_delta` text is stored as one
+   * assistant message once the adapter stream ends.
+   *
+   * @param req - Originating request; forwarded to plugin tools and used to
+   *   read the `x-forwarded-access-token` header for MCP calls.
+   * @param res - Response the stream is written to.
+   * @param registered - Agent to run.
+   * @param thread - Thread whose messages form the conversation.
+   * @param userId - Owner of the thread, used when storing the reply.
+   */
+  private async _streamAgent(
+    req: express.Request,
+    res: express.Response,
+    registered: RegisteredAgent,
+    thread: Thread,
+    userId: string,
+  ): Promise<void> {
+    const abortController = new AbortController();
+    const signal = abortController.signal;
+    const requestId = randomUUID();
+    // NOTE(review): the entry is removed only in the generator's `finally`
+    // below; if executeStream never starts the generator it would stay
+    // registered — confirm executeStream always iterates.
+    this.activeStreams.set(requestId, abortController);
+
+    const tools = Array.from(registered.toolIndex.values()).map((e) => e.def);
+    // The generator below is a `function*`, which has its own `this`.
+    const self = this;
+
+    // Dispatches one tool call by the source recorded in the tool index.
+    const executeTool = async (
+      name: string,
+      args: unknown,
+    ): Promise<unknown> => {
+      const entry = registered.toolIndex.get(name);
+      if (!entry) throw new Error(`Unknown tool: ${name}`);
+
+      let result: unknown;
+      if (entry.source === "toolkit") {
+        if (!self.context) {
+          throw new Error(
+            "Plugin tool execution requires PluginContext; this should never happen through createApp",
+          );
+        }
+        result = await self.context.executeTool(
+          req,
+          entry.pluginName,
+          entry.localName,
+          args,
+          signal,
+        );
+      } else if (entry.source === "function") {
+        result = await entry.functionTool.execute(
+          args as Record<string, unknown>,
+        );
+      } else if (entry.source === "mcp") {
+        if (!self.mcpClient) throw new Error("MCP client not connected");
+        // Forward the caller's token when the request carries one; otherwise
+        // no per-call auth override is passed.
+        const oboToken = req.headers["x-forwarded-access-token"];
+        const mcpAuth =
+          typeof oboToken === "string"
+            ? { Authorization: `Bearer ${oboToken}` }
+            : undefined;
+        result = await self.mcpClient.callTool(
+          entry.mcpToolName,
+          args,
+          mcpAuth,
+        );
+      } else if (entry.source === "subagent") {
+        const childAgent = self.agents.get(entry.agentName);
+        if (!childAgent)
+          throw new Error(`Sub-agent not found: ${entry.agentName}`);
+        result = await self.runSubAgent(req, childAgent, args, signal);
+      }
+
+      // An `undefined` result (including a tool that returns nothing) is
+      // reported to the model as a failure string rather than thrown.
+      if (result === undefined) {
+        return `Error: Tool "${name}" execution failed`;
+      }
+      // Results longer than MAX characters once serialized are replaced by a
+      // truncated string with a trailing notice; shorter results are returned
+      // unchanged (not serialized).
+      // NOTE(review): JSON.stringify returns undefined for functions/symbols
+      // and throws on cycles/BigInt; `.length` below would then fail.
+      const MAX = 50_000;
+      const serialized =
+        typeof result === "string" ? result : JSON.stringify(result);
+      if (serialized.length > MAX) {
+        return `${serialized.slice(0, MAX)}\n\n[Result truncated: ${serialized.length} chars exceeds ${MAX} limit]`;
+      }
+      return result;
+    };
+
+    await this.executeStream<ResponseStreamEvent>(
+      res,
+      async function* () {
+        const translator = new AgentEventTranslator();
+        try {
+          // First event tells the client which thread this run belongs to.
+          for (const evt of translator.translate({
+            type: "metadata",
+            data: { threadId: thread.id },
+          })) {
+            yield evt;
+          }
+
+          // Plugin names passed to the prompt exclude this plugin and "server".
+          const pluginNames = self.context
+            ? self.context
+                .getPluginNames()
+                .filter((n) => n !== self.name && n !== "server")
+            : [];
+          const fullPrompt = composePromptForAgent(
+            registered,
+            self.config.baseSystemPrompt,
+            {
+              agentName: registered.name,
+              pluginNames,
+              toolNames: tools.map((t) => t.name),
+            },
+          );
+
+          // The system message is built per request and is not persisted.
+          const messagesWithSystem: Message[] = [
+            {
+              id: "system",
+              role: "system",
+              content: fullPrompt,
+              createdAt: new Date(),
+            },
+            ...thread.messages,
+          ];
+
+          const stream = registered.adapter.run(
+            {
+              messages: messagesWithSystem,
+              tools,
+              threadId: thread.id,
+              signal,
+            },
+            { executeTool, signal },
+          );
+
+          let fullContent = "";
+          for await (const event of stream) {
+            if (signal.aborted) break;
+            if (event.type === "message_delta") {
+              fullContent += event.content;
+            }
+            for (const translated of translator.translate(event)) {
+              yield translated;
+            }
+          }
+
+          // Also reached after an abort `break`, so a partial reply produced
+          // before cancellation is still stored.
+          if (fullContent) {
+            await self.threadStore.addMessage(thread.id, userId, {
+              id: randomUUID(),
+              role: "assistant",
+              content: fullContent,
+              createdAt: new Date(),
+            });
+          }
+
+          for (const evt of translator.finalize()) yield evt;
+        } catch (error) {
+          // Errors raised after an abort are treated as part of cancellation.
+          if (signal.aborted) return;
+          logger.error("Agent chat error: %O", error);
+          throw error;
+        } finally {
+          self.activeStreams.delete(requestId);
+        }
+      },
+      {
+        ...agentStreamDefaults,
+        stream: { ...agentStreamDefaults.stream, streamId: requestId },
+      },
+    );
+  }
+
+  /**
+   * Runs a sub-agent in response to an `agent-<key>` tool call and returns its
+   * text output as the tool result for the parent adapter.
+   *
+   * The child gets a fresh two-message conversation (system prompt plus the
+   * `input` argument) and a throwaway thread id; nothing is written to the
+   * thread store. Tool calls made by the child are dispatched against the
+   * child's own tool index, including further sub-agents.
+   *
+   * @param req - Originating request; forwarded to plugin tools and used to
+   *   read the `x-forwarded-access-token` header for MCP calls.
+   * @param child - Registered agent to run.
+   * @param args - Raw tool-call arguments. A string `input` property is used
+   *   verbatim; anything else is JSON-encoded.
+   * @param signal - Abort signal shared with the parent run.
+   * @param depth - Nesting level of this call (0 for a direct child of the
+   *   top-level agent). External callers can omit it.
+   * @returns The child's text: `message_delta` events are appended, and a
+   *   `message` event replaces whatever was accumulated so far.
+   * @throws If nesting exceeds the depth limit, or a tool or sub-agent named
+   *   by the child cannot be resolved.
+   */
+  private async runSubAgent(
+    req: express.Request,
+    child: RegisteredAgent,
+    args: unknown,
+    signal: AbortSignal,
+    depth = 0,
+  ): Promise<string> {
+    // Agents may reference each other (A → B → A); without a cap such a cycle
+    // recurses until the request times out.
+    const maxSubAgentDepth = 8;
+    if (depth >= maxSubAgentDepth) {
+      throw new Error(
+        `Sub-agent nesting limit (${maxSubAgentDepth}) exceeded at '${child.name}'`,
+      );
+    }
+
+    // JSON.stringify(undefined) returns undefined at runtime; fall back to an
+    // empty string so the user message always carries string content.
+    const input =
+      typeof args === "object" &&
+      args !== null &&
+      typeof (args as { input?: unknown }).input === "string"
+        ? (args as { input: string }).input
+        : (JSON.stringify(args) ?? "");
+    const childTools = Array.from(child.toolIndex.values()).map((e) => e.def);
+
+    const childExecute = async (
+      name: string,
+      childArgs: unknown,
+    ): Promise<unknown> => {
+      const entry = child.toolIndex.get(name);
+      if (!entry) throw new Error(`Unknown tool in sub-agent: ${name}`);
+      if (entry.source === "toolkit" && this.context) {
+        return this.context.executeTool(
+          req,
+          entry.pluginName,
+          entry.localName,
+          childArgs,
+          signal,
+        );
+      }
+      if (entry.source === "function") {
+        return entry.functionTool.execute(childArgs as Record<string, unknown>);
+      }
+      if (entry.source === "subagent") {
+        const grandchild = this.agents.get(entry.agentName);
+        if (!grandchild)
+          throw new Error(`Sub-agent not found: ${entry.agentName}`);
+        return this.runSubAgent(req, grandchild, childArgs, signal, depth + 1);
+      }
+      if (entry.source === "mcp" && this.mcpClient) {
+        const oboToken = req.headers["x-forwarded-access-token"];
+        const mcpAuth =
+          typeof oboToken === "string"
+            ? { Authorization: `Bearer ${oboToken}` }
+            : undefined;
+        return this.mcpClient.callTool(entry.mcpToolName, childArgs, mcpAuth);
+      }
+      // Also reached for toolkit/mcp entries when the context or MCP client
+      // is missing.
+      throw new Error(`Unsupported sub-agent tool source: ${entry.source}`);
+    };
+
+    const runContext: AgentRunContext = { executeTool: childExecute, signal };
+
+    const pluginNames = this.context
+      ? this.context
+          .getPluginNames()
+          .filter((n) => n !== this.name && n !== "server")
+      : [];
+    const systemPrompt = composePromptForAgent(
+      child,
+      this.config.baseSystemPrompt,
+      {
+        agentName: child.name,
+        pluginNames,
+        toolNames: childTools.map((t) => t.name),
+      },
+    );
+
+    const messages: Message[] = [
+      {
+        id: "system",
+        role: "system",
+        content: systemPrompt,
+        createdAt: new Date(),
+      },
+      {
+        id: randomUUID(),
+        role: "user",
+        content: input,
+        createdAt: new Date(),
+      },
+    ];
+
+    let output = "";
+    for await (const event of child.adapter.run(
+      { messages, tools: childTools, threadId: randomUUID(), signal },
+      runContext,
+    )) {
+      // Same cancellation check as the top-level stream loop.
+      if (signal.aborted) break;
+      if (event.type === "message_delta") output += event.content;
+      else if (event.type === "message") output = event.content;
+    }
+    return output;
+  }
+
+  /**
+   * `POST /cancel`: aborts the active stream identified by `streamId`.
+   *
+   * Responds 400 when the body is missing or `streamId` is not a non-empty
+   * string. Cancelling an unknown or already finished stream is not an error:
+   * the response is `{ cancelled: true }` either way.
+   */
+  private async _handleCancel(req: express.Request, res: express.Response) {
+    // The body is untrusted and may be undefined when no JSON was sent, so
+    // read the field defensively instead of destructuring a cast.
+    const body: unknown = req.body;
+    const streamId =
+      typeof body === "object" && body !== null
+        ? (body as { streamId?: unknown }).streamId
+        : undefined;
+    if (typeof streamId !== "string" || streamId.length === 0) {
+      res.status(400).json({ error: "streamId is required" });
+      return;
+    }
+    const controller = this.activeStreams.get(streamId);
+    if (controller) {
+      controller.abort("Cancelled by user");
+      this.activeStreams.delete(streamId);
+    }
+    res.json({ cancelled: true });
+  }
+
+  /** `GET /threads`: responds with the requesting user's threads. */
+  private async _handleListThreads(
+    req: express.Request,
+    res: express.Response,
+  ) {
+    const threads = await this.threadStore.list(this.resolveUserId(req));
+    res.json({ threads });
+  }
+
+  /**
+   * `GET /threads/:threadId`: responds with the thread, or 404 when the store
+   * has no such thread for the requesting user.
+   */
+  private async _handleGetThread(req: express.Request, res: express.Response) {
+    const owner = this.resolveUserId(req);
+    const found = await this.threadStore.get(req.params.threadId, owner);
+    if (found) {
+      res.json(found);
+      return;
+    }
+    res.status(404).json({ error: "Thread not found" });
+  }
+
+  /**
+   * `DELETE /threads/:threadId`: deletes the thread for the requesting user,
+   * or responds 404 when the store reports nothing was deleted.
+   */
+  private async _handleDeleteThread(
+    req: express.Request,
+    res: express.Response,
+  ) {
+    const owner = this.resolveUserId(req);
+    const removed = await this.threadStore.delete(req.params.threadId, owner);
+    if (removed) {
+      res.json({ deleted: true });
+      return;
+    }
+    res.status(404).json({ error: "Thread not found" });
+  }
+
+  /**
+   * Looks up an agent by name. Without a name the default agent is used, and
+   * without a default the first registered agent.
+   *
+   * @returns The agent, or `null` when the requested (or default) name is not
+   *   registered or the registry is empty.
+   */
+  private resolveAgent(name?: string): RegisteredAgent | null {
+    const key = name || this.defaultAgentName;
+    if (key) {
+      return this.agents.get(key) ?? null;
+    }
+
+    for (const agent of this.agents.values()) {
+      return agent;
+    }
+    return null;
+  }
+
+  /**
+   * Prints a table of registered agents with their tool counts to the
+   * console; the default agent is marked with a green dot. Prints nothing
+   * when the registry is empty.
+   */
+  private printRegistry(): void {
+    const total = this.agents.size;
+    if (total === 0) return;
+
+    const rule = `  ${pc.dim("─".repeat(60))}`;
+
+    console.log("");
+    console.log(`  ${pc.bold("Agents")} ${pc.dim(`(${total})`)}`);
+    console.log(rule);
+    this.agents.forEach((reg, name) => {
+      const isDefault = name === this.defaultAgentName;
+      const marker = isDefault ? pc.green("●") : " ";
+      const label = pc.bold(name.padEnd(24));
+      const count = pc.dim(`${reg.toolIndex.size} tools`);
+      console.log(`  ${marker} ${label} ${count}`);
+    });
+    console.log(rule);
+    console.log("");
+  }
+
+  /** Closes the MCP client, if one was created, and forgets it. */
+  async shutdown(): Promise<void> {
+    const client = this.mcpClient;
+    if (!client) return;
+
+    await client.close();
+    this.mcpClient = null;
+  }
+
+  /**
+   * Runtime API of the plugin.
+   *
+   * - `register` — build and add a code-defined agent (replaces an agent of
+   *   the same name);
+   * - `list` — names of all registered agents;
+   * - `get` — the registered agent for a name, or `null`;
+   * - `reload` — rebuild the registry from the directory and config;
+   * - `getDefault` — name of the default agent, or `null`;
+   * - `getThreads` — threads stored for a user id.
+   */
+  exports() {
+    return {
+      register: (name: string, def: AgentDefinition) =>
+        this.registerCodeAgent(name, def),
+      list: () => Array.from(this.agents.keys()),
+      get: (name: string) => this.agents.get(name) ?? null,
+      reload: () => this.reload(),
+      getDefault: () => this.defaultAgentName,
+      getThreads: (userId: string) => this.threadStore.list(userId),
+    };
+  }
+
+  /**
+   * Builds `def` as a code-origin agent and stores it under `name`, replacing
+   * any agent already registered with that name. It becomes the default agent
+   * only when no default is set yet.
+   */
+  private async registerCodeAgent(
+    name: string,
+    def: AgentDefinition,
+  ): Promise<void> {
+    const source: AgentSource = { origin: "code" };
+    const built = await this.buildRegisteredAgent(name, def, source);
+
+    this.agents.set(name, built);
+    if (!this.defaultAgentName) {
+      this.defaultAgentName = name;
+    }
+  }
+}
+
+/**
+ * Expands the `autoInheritTools` option into explicit per-origin flags.
+ *
+ * A boolean applies to both origins. For an object (or when the option is
+ * omitted) each missing flag takes its default: file agents inherit, code
+ * agents do not.
+ */
+function normalizeAutoInherit(value: AgentsPluginConfig["autoInheritTools"]): {
+  file: boolean;
+  code: boolean;
+} {
+  if (typeof value === "boolean") {
+    return { file: value, code: value };
+  }
+  return { file: value?.file ?? true, code: value?.code ?? false };
+}
+
+/**
+ * Builds the full system prompt for an agent.
+ *
+ * The agent's own `baseSystemPrompt` wins over the plugin-level option
+ * whenever it is not `undefined`. The selected option is interpreted as:
+ * `false` → no base prompt; string → used verbatim; function → called with
+ * `ctx`; anything else → the built-in base prompt for `ctx.pluginNames`.
+ * The base prompt is then combined with the agent's instructions.
+ */
+function composePromptForAgent(
+  registered: RegisteredAgent,
+  pluginLevel: BaseSystemPromptOption | undefined,
+  ctx: PromptContext,
+): string {
+  const option =
+    registered.baseSystemPrompt === undefined
+      ? pluginLevel
+      : registered.baseSystemPrompt;
+
+  let base: string;
+  switch (typeof option) {
+    case "string":
+      base = option;
+      break;
+    case "function":
+      base = option(ctx);
+      break;
+    default:
+      base = option === false ? "" : buildBaseSystemPrompt(ctx.pluginNames);
+  }
+
+  return composeSystemPrompt(base, registered.instructions);
+}
+
+/**
+ * Plugin factory for the agents plugin. Reads agent definitions from
+ * `./config/agents` by default (relative to the working directory), merges
+ * them with agents declared in plugin config, resolves toolkits/tools from
+ * registered plugins, exposes the `appkit.agents.*` runtime API and mounts
+ * `/invocations` in addition to the plugin's chat, cancel, thread and info
+ * routes.
+ *
+ * @example
+ * ```ts
+ * import { agents, analytics, createApp, server } from "@databricks/appkit";
+ *
+ * await createApp({
+ *   plugins: [server(), analytics(), agents()],
+ * });
+ * ```
+ */
+export const agents = toPlugin(AgentsPlugin);
diff --git a/packages/appkit/src/plugins/agents/defaults.ts b/packages/appkit/src/plugins/agents/defaults.ts
new file mode 100644
index 00000000..4da11bef
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/defaults.ts
@@ -0,0 +1,12 @@
+import type { StreamExecutionSettings } from "shared";
+
+/**
+ * Default execution settings for agent streams: caching and retries are
+ * disabled, and callers add the per-request `streamId` to the `stream` part.
+ */
+export const agentStreamDefaults: StreamExecutionSettings = {
+  default: {
+    cache: { enabled: false },
+    retry: { enabled: false },
+    // NOTE(review): presumably milliseconds (5 minutes) — confirm against
+    // StreamExecutionSettings.
+    timeout: 300_000,
+  },
+  stream: {
+    bufferSize: 200,
+  },
+};
diff --git a/packages/appkit/src/plugins/agents/event-translator.ts b/packages/appkit/src/plugins/agents/event-translator.ts
new file mode 100644
index 00000000..314f8066
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/event-translator.ts
@@ -0,0 +1,230 @@
+import { randomUUID } from "node:crypto";
+import type {
+  AgentEvent,
+  ResponseFunctionCallOutput,
+  ResponseFunctionToolCall,
+  ResponseOutputMessage,
+  ResponseStreamEvent,
+} from "shared";
+
+/**
+ * Translates internal AgentEvent stream into Responses API SSE events.
+ *
+ * Stateful: one instance per streaming request. Tracks sequence numbers,
+ * output indices, and message accumulation state. The assistant message
+ * uses output index 0; each tool call and tool result takes the next index.
+ * After `response.completed` or `response.failed`, `finalize()` is a no-op.
+ */
+export class AgentEventTranslator {
+  private seqNum = 0;
+  private outputIndex = 0;
+  private messageId: string | null = null;
+  private messageText = "";
+  /** True when the current `messageText` was already sent in a `done` item. */
+  private messageDone = false;
+  private finalized = false;
+
+  /** Maps one agent event to zero or more Responses API stream events. */
+  translate(event: AgentEvent): ResponseStreamEvent[] {
+    switch (event.type) {
+      case "message_delta":
+        return this.handleMessageDelta(event.content);
+      case "message":
+        return this.handleFullMessage(event.content);
+      case "tool_call":
+        return this.handleToolCall(event.callId, event.name, event.args);
+      case "tool_result":
+        return this.handleToolResult(event.callId, event.result, event.error);
+      case "thinking":
+        return [
+          {
+            type: "appkit.thinking",
+            content: event.content,
+            sequence_number: this.seqNum++,
+          },
+        ];
+      case "metadata":
+        return [
+          {
+            type: "appkit.metadata",
+            data: event.data,
+            sequence_number: this.seqNum++,
+          },
+        ];
+      case "status":
+        return this.handleStatus(event.status, event.error);
+    }
+  }
+
+  /**
+   * Ends the stream: `response.output_item.done` for a message whose text was
+   * not yet sent in a `done` item, then `response.completed`. Returns `[]`
+   * when a terminal event was already produced.
+   */
+  finalize(): ResponseStreamEvent[] {
+    if (this.finalized) return [];
+    this.finalized = true;
+
+    const events: ResponseStreamEvent[] = [];
+    if (this.messageId && !this.messageDone) {
+      const doneItem: ResponseOutputMessage = {
+        type: "message",
+        id: this.messageId,
+        status: "completed",
+        role: "assistant",
+        content: [{ type: "output_text", text: this.messageText }],
+      };
+      events.push(...this.itemEvents(doneItem, 0, false));
+    }
+    events.push({
+      type: "response.completed",
+      sequence_number: this.seqNum++,
+      response: {},
+    });
+    return events;
+  }
+
+  /** Appends streamed text, announcing the message item on the first delta. */
+  private handleMessageDelta(content: string): ResponseStreamEvent[] {
+    const events: ResponseStreamEvent[] = [];
+    this.messageText += content;
+    this.messageDone = false; // new text must be flushed by a later `done`
+
+    if (!this.messageId) {
+      this.messageId = `msg_${randomUUID()}`;
+      const item: ResponseOutputMessage = {
+        type: "message",
+        id: this.messageId,
+        status: "in_progress",
+        role: "assistant",
+        content: [],
+      };
+      events.push({
+        type: "response.output_item.added",
+        output_index: 0,
+        item,
+        sequence_number: this.seqNum++,
+      });
+    }
+
+    events.push({
+      type: "response.output_text.delta",
+      item_id: this.messageId,
+      output_index: 0,
+      content_index: 0,
+      delta: content,
+      sequence_number: this.seqNum++,
+    });
+
+    return events;
+  }
+
+  /**
+   * Replaces the accumulated text with a complete message and emits its
+   * `done` item; `added` is emitted only if the item was not announced yet.
+   */
+  private handleFullMessage(content: string): ResponseStreamEvent[] {
+    const announce = this.messageId === null;
+    const id = this.messageId ?? `msg_${randomUUID()}`;
+    this.messageId = id;
+    this.messageText = content;
+    this.messageDone = true;
+    const item: ResponseOutputMessage = {
+      type: "message",
+      id,
+      status: "completed",
+      role: "assistant",
+      content: [{ type: "output_text", text: content }],
+    };
+    return this.itemEvents(item, 0, announce);
+  }
+
+  /** Emits a completed `function_call` item at the next output index. */
+  private handleToolCall(
+    callId: string,
+    name: string,
+    args: unknown,
+  ): ResponseStreamEvent[] {
+    this.outputIndex++;
+    const item: ResponseFunctionToolCall = {
+      type: "function_call",
+      id: `fc_${randomUUID()}`,
+      call_id: callId,
+      name,
+      arguments: AgentEventTranslator.serialize(args, "{}"),
+    };
+    return this.itemEvents(item, this.outputIndex);
+  }
+
+  /** Emits a `function_call_output` item; `error`, when set, is the output. */
+  private handleToolResult(
+    callId: string,
+    result: unknown,
+    error?: string,
+  ): ResponseStreamEvent[] {
+    this.outputIndex++;
+    const item: ResponseFunctionCallOutput = {
+      type: "function_call_output",
+      id: `fc_output_${randomUUID()}`,
+      call_id: callId,
+      output: error ?? AgentEventTranslator.serialize(result, "null"),
+    };
+    return this.itemEvents(item, this.outputIndex);
+  }
+
+  /**
+   * `error` emits `error` + `response.failed` and marks the stream terminated
+   * (so no `response.completed` follows); `complete` finalizes the stream.
+   */
+  private handleStatus(status: string, error?: string): ResponseStreamEvent[] {
+    if (status === "error") {
+      this.finalized = true;
+      return [
+        {
+          type: "error",
+          error: error ?? "Unknown error",
+          sequence_number: this.seqNum++,
+        },
+        {
+          type: "response.failed",
+          sequence_number: this.seqNum++,
+        },
+      ];
+    }
+    return status === "complete" ? this.finalize() : [];
+  }
+
+  /** Builds `output_item.added` (if `announce`) + `output_item.done` for `item`. */
+  private itemEvents(
+    item:
+      | ResponseOutputMessage
+      | ResponseFunctionToolCall
+      | ResponseFunctionCallOutput,
+    outputIndex: number,
+    announce = true,
+  ): ResponseStreamEvent[] {
+    const events: ResponseStreamEvent[] = [];
+    if (announce) {
+      events.push({
+        type: "response.output_item.added",
+        output_index: outputIndex,
+        item,
+        sequence_number: this.seqNum++,
+      });
+    }
+    events.push({
+      type: "response.output_item.done",
+      output_index: outputIndex,
+      item,
+      sequence_number: this.seqNum++,
+    });
+    return events;
+  }
+
+  /** Stringifies a tool payload; `fallback` is used when JSON yields nothing. */
+  private static serialize(value: unknown, fallback: string): string {
+    if (typeof value === "string") return value;
+    // JSON.stringify returns undefined for undefined, functions and symbols.
+    return (JSON.stringify(value) as string | undefined) ?? fallback;
+  }
+}
diff --git a/packages/appkit/src/plugins/agents/index.ts b/packages/appkit/src/plugins/agents/index.ts
new file mode 100644
index 00000000..1adc41c1
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/index.ts
@@ -0,0 +1,22 @@
+export { AgentsPlugin, agents } from "./agents";
+export { buildToolkitEntries } from "./build-toolkit";
+export {
+  type LoadContext,
+  type LoadResult,
+  loadAgentFromFile,
+  loadAgentsFromDir,
+  parseFrontmatter,
+} from "./load-agents";
+export {
+  type AgentDefinition,
+  type AgentsPluginConfig,
+  type AgentTool,
+  type AutoInheritToolsConfig,
+  type BaseSystemPromptOption,
+  isToolkitEntry,
+  type PromptContext,
+  type RegisteredAgent,
+  type ResolvedToolEntry,
+  type ToolkitEntry,
+  type ToolkitOptions,
+} from "./types";
diff --git a/packages/appkit/src/plugins/agents/load-agents.ts b/packages/appkit/src/plugins/agents/load-agents.ts
new file mode 100644
index 00000000..d10321c6
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/load-agents.ts
@@ -0,0 +1,252 @@
+import fs from "node:fs";
+import path from "node:path";
+import yaml from "js-yaml";
+import type { AgentAdapter } from "shared";
+import { createLogger } from "../../logging/logger";
+import type {
+  AgentDefinition,
+  AgentTool,
+  BaseSystemPromptOption,
+  ToolkitEntry,
+  ToolkitOptions,
+} from "./types";
+import { isToolkitEntry } from "./types";
+
+const logger = createLogger("agents:loader");
+
+interface ToolkitProvider { // the only plugin capability the loader relies on
+  toolkit: (opts?: ToolkitOptions) => Record<string, unknown>; // values are checked with isToolkitEntry before use
+}
+
+export interface LoadContext {
+  /** Fallback model used when the frontmatter sets neither `model` nor `endpoint`. */
+  defaultModel?: AgentAdapter | Promise<AgentAdapter> | string;
+  /** Ambient tool library referenced by frontmatter `tools: [key1, key2]`. */
+  availableTools?: Record<string, AgentTool>;
+  /** Registered plugin toolkits referenced by frontmatter `toolkits: [...]`, keyed by plugin name. */
+  plugins?: Map<string, ToolkitProvider>;
+}
+
+export interface LoadResult {
+  /** Agent definitions keyed by file-stem name. */
+  defs: Record<string, AgentDefinition>;
+  /** Name (file stem) of the first file with `default: true` frontmatter, or `null`. */
+  defaultAgent: string | null;
+}
+
+interface Frontmatter { // recognized frontmatter keys; every key is optional
+  endpoint?: string; // used as the model when `model` is absent
+  model?: string; // takes precedence over `endpoint`
+  toolkits?: ToolkitSpec[]; // plugin toolkits to pull tools from
+  tools?: string[]; // keys looked up in LoadContext.availableTools
+  maxSteps?: number; // copied to the definition only when it is a number
+  maxTokens?: number; // copied to the definition only when it is a number
+  default?: boolean; // `true` marks the file as a default-agent candidate
+  baseSystemPrompt?: false | string; // only `false` or a string is honored
+}
+
+type ToolkitSpec = string | { [pluginName: string]: ToolkitOptions | string[] }; // "plugin", { plugin: [toolNames] } or { plugin: options }
+
+const ALLOWED_KEYS = new Set([ // frontmatter keys that do not trigger the "unknown key" warning
+  "endpoint",
+  "model",
+  "toolkits",
+  "tools",
+  "maxSteps",
+  "maxTokens",
+  "default",
+  "baseSystemPrompt",
+]);
+
+/**
+ * Reads a single markdown agent file and builds its definition, resolving
+ * the frontmatter against registered plugin toolkits + ambient tool library.
+ * The agent is named after the file stem.
+ */
+export async function loadAgentFromFile(
+  filePath: string,
+  ctx: LoadContext,
+): Promise<AgentDefinition> {
+  const source = fs.readFileSync(filePath, "utf-8");
+  return buildDefinition(path.basename(filePath, ".md"), source, filePath, ctx);
+}
+
+/**
+ * Scans a directory for `*.md` files and produces an `AgentDefinition` record
+ * keyed by file-stem. Throws on frontmatter errors or unresolved references.
+ * Returns an empty map if the directory does not exist.
+ *
+ * Files are visited in sorted name order because directory listing order is
+ * not guaranteed; this keeps the "first `default: true` file" deterministic.
+ */
+export async function loadAgentsFromDir(
+  dir: string,
+  ctx: LoadContext,
+): Promise<LoadResult> {
+  if (!fs.existsSync(dir)) {
+    return { defs: {}, defaultAgent: null };
+  }
+  const files = fs
+    .readdirSync(dir)
+    .filter((f) => f.endsWith(".md"))
+    .sort();
+  const defs: Record<string, AgentDefinition> = {};
+  let defaultAgent: string | null = null;
+
+  for (const file of files) {
+    const fullPath = path.join(dir, file);
+    const raw = fs.readFileSync(fullPath, "utf-8");
+    const name = path.basename(file, ".md");
+    defs[name] = buildDefinition(name, raw, fullPath, ctx);
+    const { data } = parseFrontmatter(raw, fullPath);
+    if (data?.default === true && !defaultAgent) defaultAgent = name;
+  }
+  // No flagged file: plugin's defaultAgent resolution handles "first registered".
+  return { defs, defaultAgent };
+}
+
+/**
+ * Exposed for tests. Parses `--- yaml ---\nbody` and validates frontmatter keys.
+ * An empty block (`---` directly followed by `---`) yields `data: {}`; input
+ * without a block yields `data: null`. Unknown keys are only logged.
+ */
+export function parseFrontmatter(
+  raw: string,
+  sourcePath?: string,
+): { data: Frontmatter | null; content: string } {
+  const match = raw.match(/^---\r?\n(?:([\s\S]*?)\r?\n)?---\r?\n?([\s\S]*)$/);
+  if (!match) {
+    return { data: null, content: raw.trim() };
+  }
+  const src = sourcePath ? ` (${sourcePath})` : "";
+  const content = match[2].trim();
+  let parsed: unknown;
+  try {
+    parsed = yaml.load(match[1] ?? "");
+  } catch (err) {
+    throw new Error(
+      `Invalid YAML frontmatter${src}: ${err instanceof Error ? err.message : String(err)}`,
+    );
+  }
+  if (parsed === null || parsed === undefined) {
+    return { data: {}, content };
+  }
+  if (typeof parsed !== "object" || Array.isArray(parsed)) {
+    throw new Error(`Frontmatter must be a YAML object${src}`);
+  }
+  const data = parsed as Record<string, unknown>;
+  const where = sourcePath ?? "<inline>";
+  for (const key of Object.keys(data)) {
+    if (ALLOWED_KEYS.has(key)) continue;
+    logger.warn("Ignoring unknown frontmatter key '%s' in %s", key, where);
+  }
+  return { data: data as Frontmatter, content };
+}
+
+/**
+ * Converts one markdown source into an `AgentDefinition`: the body becomes
+ * `instructions`, the frontmatter supplies model, tools and limits.
+ */
+function buildDefinition(
+  name: string,
+  raw: string,
+  filePath: string,
+  ctx: LoadContext,
+): AgentDefinition {
+  const parsed = parseFrontmatter(raw, filePath);
+  const meta: Frontmatter = parsed.data ?? {};
+  const resolvedTools = resolveFrontmatterTools(name, meta, filePath, ctx);
+  const { baseSystemPrompt: rawBase, maxSteps, maxTokens } = meta;
+
+  // Only `false` or a string is accepted; anything else means "not set".
+  const keepBase = rawBase === false || typeof rawBase === "string";
+  return {
+    name,
+    instructions: parsed.content,
+    model: meta.model ?? meta.endpoint ?? ctx.defaultModel,
+    tools: Object.keys(resolvedTools).length === 0 ? undefined : resolvedTools,
+    maxSteps: typeof maxSteps === "number" ? maxSteps : undefined,
+    maxTokens: typeof maxTokens === "number" ? maxTokens : undefined,
+    baseSystemPrompt: keepBase ? rawBase : undefined,
+  };
+}
+
+/**
+ * Resolves frontmatter `toolkits` (plugin toolkits) and `tools` (keys of
+ * `ctx.availableTools`) into one record. Throws when a field is not a list
+ * (a scalar would be iterated per character) or a reference is unknown.
+ */
+function resolveFrontmatterTools(
+  agentName: string,
+  fm: Frontmatter,
+  filePath: string,
+  ctx: LoadContext,
+): Record<string, AgentTool> {
+  const out: Record<string, AgentTool> = {};
+  const pluginIdx = ctx.plugins ?? new Map<string, ToolkitProvider>();
+  const where = `Agent '${agentName}' (${filePath})`;
+  for (const field of ["toolkits", "tools"] as const) {
+    if (fm[field] != null && !Array.isArray(fm[field])) {
+      throw new Error(`${where} frontmatter '${field}' must be a list`);
+    }
+  }
+  for (const spec of fm.toolkits ?? []) {
+    const [pluginName, opts] = parseToolkitSpec(spec, filePath, agentName);
+    const provider = pluginIdx.get(pluginName);
+    if (!provider) {
+      throw new Error(
+        `${where} references toolkit '${pluginName}', but plugin '${pluginName}' is not registered. Available: ${pluginIdx.size > 0 ? Array.from(pluginIdx.keys()).join(", ") : "<none>"}`,
+      );
+    }
+    for (const [key, entry] of Object.entries(provider.toolkit(opts))) {
+      if (!isToolkitEntry(entry)) {
+        throw new Error(
+          `Plugin '${pluginName}'.toolkit() returned a value at key '${key}' that is not a ToolkitEntry`,
+        );
+      }
+      out[key] = entry as ToolkitEntry;
+    }
+  }
+  for (const key of fm.tools ?? []) {
+    const tool = ctx.availableTools?.[key];
+    if (!tool) {
+      throw new Error(
+        `${where} references tool '${key}', which is not in the agents() plugin's tools field. Available: ${ctx.availableTools ? Object.keys(ctx.availableTools).join(", ") : "<none>"}`,
+      );
+    }
+    out[key] = tool;
+  }
+  return out;
+}
+
+/**
+ * Normalizes one `toolkits` entry to `[pluginName, options]`. A bare string
+ * has no options, `{ plugin: [names] }` becomes `{ only: names }`, and
+ * `{ plugin: {...} }` passes the object through. Anything else throws.
+ */
+function parseToolkitSpec(
+  spec: ToolkitSpec,
+  filePath: string,
+  agentName: string,
+): [string, ToolkitOptions | undefined] {
+  if (typeof spec === "string") return [spec, undefined];
+  if (spec === null || typeof spec !== "object") {
+    throw new Error(
+      `Agent '${agentName}' (${filePath}) has invalid toolkit entry: ${JSON.stringify(spec)}`,
+    );
+  }
+  const names = Object.keys(spec);
+  if (names.length !== 1) {
+    throw new Error(
+      `Agent '${agentName}' (${filePath}) toolkit entry must have exactly one key, got: ${names.join(", ")}`,
+    );
+  }
+  const [pluginName] = names;
+  const options = spec[pluginName];
+  if (Array.isArray(options)) return [pluginName, { only: options }];
+  if (options !== null && typeof options === "object") {
+    return [pluginName, options as ToolkitOptions];
+  }
+  throw new Error(
+    `Agent '${agentName}' (${filePath}) toolkit '${pluginName}' options must be an array of tool names or an options object`,
+  );
+}
diff --git a/packages/appkit/src/plugins/agents/manifest.json b/packages/appkit/src/plugins/agents/manifest.json
new file mode 100644
index 00000000..0cdf2170
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/manifest.json
@@ -0,0 +1,10 @@
+{
+  "$schema": "https://databricks.github.io/appkit/schemas/plugin-manifest.schema.json",
+  "name": "agent",
+  "displayName": "Agents Plugin",
+  "description": "AI agents driven by markdown configs or code, with auto-tool-discovery from registered plugins",
+  "resources": {
+    "required": [],
+    "optional": []
+  }
+}
diff --git a/packages/appkit/src/plugins/agents/schemas.ts b/packages/appkit/src/plugins/agents/schemas.ts
new file mode 100644
index 00000000..84ab3b88
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/schemas.ts
@@ -0,0 +1,19 @@
+import { z } from "zod";
+
+export const chatRequestSchema = z.object({ // presumably the chat request body — confirm at the route that uses it
+  message: z.string().min(1, "message must not be empty"), // required, non-empty
+  threadId: z.string().optional(),
+  agent: z.string().optional(),
+});
+
+const messageItemSchema = z.object({ // one entry of an array-form `input`; every field is optional
+  role: z.enum(["user", "assistant", "system"]).optional(),
+  content: z.union([z.string(), z.array(z.any())]).optional(), // plain text or an unvalidated array of parts
+  type: z.string().optional(),
+});
+
+export const invocationsRequestSchema = z.object({ // presumably the `/invocations` request body — confirm at the route
+  input: z.union([z.string().min(1), z.array(messageItemSchema).min(1)]), // non-empty string or non-empty item list
+  stream: z.boolean().optional().default(true), // omitted `stream` parses as true
+  model: z.string().optional(),
+});
diff --git a/packages/appkit/src/plugins/agents/system-prompt.ts b/packages/appkit/src/plugins/agents/system-prompt.ts
new file mode 100644
index 00000000..634f49c5
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/system-prompt.ts
@@ -0,0 +1,40 @@
+/**
+ * Produces the shared AppKit base prompt: an intro line, the list of active
+ * plugins (omitted when there are none) and a fixed set of guidelines.
+ *
+ * Tool descriptions are intentionally absent — they reach the LLM through
+ * the structured `tools` API parameter instead.
+ *
+ * @param pluginNames - Names of the active plugins, listed verbatim.
+ * @returns The prompt as newline-joined text.
+ */
+export function buildBaseSystemPrompt(pluginNames: string[]): string {
+  const intro = "You are an AI assistant running on Databricks AppKit.";
+
+  const activePlugins =
+    pluginNames.length > 0
+      ? ["", `Active plugins: ${pluginNames.join(", ")}`]
+      : [];
+  const guidelines = [
+    "",
+    "Guidelines:",
+    "- Use Databricks SQL syntax when writing queries",
+    "- When results are large, summarize key findings rather than dumping raw data",
+    "- If a tool call fails, explain the error clearly to the user",
+    "- When browsing files, verify the path exists before reading",
+  ];
+
+  return [intro, ...activePlugins, ...guidelines].join("\n");
+}
+
+/**
+ * Compose the full system prompt from the base prompt and an optional
+ * per-agent user prompt. Empty parts are skipped, so a disabled base prompt
+ * ("") does not leave blank lines in front of the agent prompt.
+ */
+export function composeSystemPrompt(
+  basePrompt: string,
+  agentPrompt?: string,
+): string {
+  return [basePrompt, agentPrompt].filter(Boolean).join("\n\n");
+}
diff --git a/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts b/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
new file mode 100644
index 00000000..8116551e
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
@@ -0,0 +1,289 @@
+import fs from "node:fs";
+import os from "node:os";
+import path from "node:path";
+import type {
+  AgentAdapter,
+  AgentInput,
+  AgentRunContext,
+  AgentToolDefinition,
+  ToolProvider,
+} from "shared";
+import { afterEach, beforeEach, describe, expect, test, vi } from "vitest";
+import { z } from "zod";
+import { CacheManager } from "../../../cache";
+// Import the class directly so we can construct it without a createApp
+import { AgentsPlugin } from "../agents";
+import { buildToolkitEntries } from "../build-toolkit";
+import { defineTool, type ToolRegistry } from "../tools/define-tool";
+import type { AgentsPluginConfig, ToolkitEntry } from "../types";
+import { isToolkitEntry } from "../types";
+
+interface FakeContext { // hand-rolled stand-in for the context object attached to the plugin in these tests
+  providers: Array<{ name: string; provider: ToolProvider }>;
+  getToolProviders(): Array<{ name: string; provider: ToolProvider }>;
+  getPluginNames(): string[];
+  addRoute(): void;
+  executeTool: (
+    req: unknown,
+    pluginName: string,
+    localName: string,
+    args: unknown,
+  ) => Promise<unknown>;
+}
+
+/** Builds a `FakeContext` over `providers`; `executeTool` echoes its inputs. */
+function fakeContext(
+  providers: Array<{ name: string; provider: ToolProvider }>,
+): FakeContext {
+  const context: FakeContext = {
+    providers,
+    getToolProviders: () => providers,
+    getPluginNames: () => providers.map(({ name }) => name),
+    addRoute: vi.fn(),
+    executeTool: vi.fn(async (_req, pluginName, localName, args) => {
+      return { plugin: pluginName, tool: localName, args };
+    }),
+  };
+  return context;
+}
+
+function stubAdapter(): AgentAdapter { // minimal adapter for tests that never inspect model output
+  return {
+    async *run(_input: AgentInput, _ctx: AgentRunContext) { // both arguments are ignored
+      yield { type: "message_delta", content: "" }; // a single empty delta, then the generator ends
+    },
+  };
+}
+
+/** Fake plugin exposing `registry` through ToolProvider and `toolkit()`. */
+function makeToolProvider(
+  pluginName: string,
+  registry: ToolRegistry,
+): ToolProvider & {
+  toolkit: (opts?: unknown) => Record<string, ToolkitEntry>;
+} {
+  return {
+    getAgentTools(): AgentToolDefinition[] {
+      const defs: AgentToolDefinition[] = [];
+      for (const [name, { description }] of Object.entries(registry)) {
+        const parameters = { type: "object" as const, properties: {} };
+        defs.push({ name, description, parameters });
+      }
+      return defs;
+    },
+    executeAgentTool: async (name, args) => ({ callFrom: pluginName, name, args }),
+    toolkit: (opts) => buildToolkitEntries(pluginName, registry, opts as never),
+  };
+}
+
+let tmpDir: string; // per-test scratch directory for markdown agent files
+
+beforeEach(async () => {
+  tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), "agents-plugin-"));
+  const storage = { // stub storage object handed to CacheManager below
+    get: vi.fn(),
+    set: vi.fn(),
+    delete: vi.fn(),
+    keys: vi.fn(),
+    healthCheck: vi.fn(async () => true),
+    close: vi.fn(async () => {}),
+  };
+  // biome-ignore lint/suspicious/noExplicitAny: test-only CacheManager wiring
+  await CacheManager.getInstance({ storage: storage as any });
+});
+
+afterEach(() => {
+  fs.rmSync(tmpDir, { recursive: true, force: true }); // remove the scratch directory and everything in it
+});
+
+function instantiate(config: AgentsPluginConfig, ctx?: FakeContext) { // constructs the plugin directly, without createApp
+  const plugin = new AgentsPlugin({ ...config, name: "agent" }); // the name is always set to "agent"
+  plugin.attachContext({ context: ctx as unknown as object }); // ctx may be undefined; the cast erases the fake's type
+  return plugin;
+}
+
+describe("AgentsPlugin", () => {
+  test("registers code-defined agents and exposes them via exports", async () => {
+    const plugin = instantiate({
+      dir: false, // presumably turns off markdown directory loading — only the code agent is listed below
+      agents: {
+        support: {
+          instructions: "You help customers.",
+          model: stubAdapter(),
+        },
+      },
+    });
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      list: () => string[];
+      getDefault: () => string | null;
+    };
+    expect(api.list()).toEqual(["support"]);
+    expect(api.getDefault()).toBe("support"); // the only registered agent is reported as default
+  });
+
+  test("loads markdown agents from a directory", async () => {
+    fs.writeFileSync(
+      path.join(tmpDir, "assistant.md"),
+      "---\ndefault: true\n---\nYou are helpful.", // frontmatter flags this file as the default agent
+      "utf-8",
+    );
+    const plugin = instantiate({
+      dir: tmpDir,
+      defaultModel: stubAdapter(),
+    });
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      list: () => string[];
+      getDefault: () => string | null;
+    };
+    expect(api.list()).toEqual(["assistant"]); // agent name is the file stem
+    expect(api.getDefault()).toBe("assistant");
+  });
+
+  test("code definitions override markdown on key collision", async () => {
+    fs.writeFileSync(
+      path.join(tmpDir, "support.md"),
+      "---\n---\nFrom markdown.",
+      "utf-8",
+    );
+    const plugin = instantiate({
+      dir: tmpDir,
+      defaultModel: stubAdapter(),
+      agents: {
+        support: {
+          instructions: "From code",
+          model: stubAdapter(),
+        },
+      },
+    });
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      get: (name: string) => { instructions: string } | null;
+    };
+    expect(api.get("support")?.instructions).toBe("From code");
+  });
+
+  test("auto-inherit default is asymmetric (file yes, code no)", async () => {
+    const registry: ToolRegistry = {
+      query: defineTool({
+        description: "q",
+        schema: z.object({ sql: z.string() }),
+        handler: () => "ok",
+      }),
+    };
+    const provider = makeToolProvider("analytics", registry);
+    const ctx = fakeContext([{ name: "analytics", provider }]);
+
+    fs.writeFileSync(
+      path.join(tmpDir, "assistant.md"),
+      "---\n---\nYou are helpful.",
+      "utf-8",
+    );
+
+    const plugin = instantiate(
+      {
+        dir: tmpDir,
+        defaultModel: stubAdapter(),
+        agents: {
+          manual: {
+            instructions: "Manual agent",
+            model: stubAdapter(),
+          },
+        },
+      },
+      ctx,
+    );
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+    };
+    const fileAgent = api.get("assistant");
+    const codeAgent = api.get("manual");
+
+    expect(fileAgent?.toolIndex.size).toBeGreaterThan(0); // inherited analytics.query
+    expect(codeAgent?.toolIndex.size).toBe(0); // code opted out by default
+  });
+
+  test("file-loaded agent respects explicit toolkits (skips auto-inherit)", async () => {
+    const registry: ToolRegistry = {
+      query: defineTool({
+        description: "q",
+        schema: z.object({ sql: z.string() }),
+        handler: () => "ok",
+      }),
+    };
+    const registry2: ToolRegistry = {
+      list: defineTool({
+        description: "l",
+        schema: z.object({}),
+        handler: () => [],
+      }),
+    };
+    const ctx = fakeContext([
+      { name: "analytics", provider: makeToolProvider("analytics", registry) },
+      { name: "files", provider: makeToolProvider("files", registry2) },
+    ]);
+
+    fs.writeFileSync(
+      path.join(tmpDir, "analyst.md"),
+      "---\ntoolkits: [analytics]\n---\nAnalyst.", // explicit toolkit list naming only `analytics`
+      "utf-8",
+    );
+
+    const plugin = instantiate(
+      { dir: tmpDir, defaultModel: stubAdapter() },
+      ctx,
+    );
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+    };
+    const agent = api.get("analyst");
+    const toolNames = Array.from(agent?.toolIndex.keys() ?? []);
+    expect(toolNames.some((n) => n.startsWith("analytics."))).toBe(true);
+    expect(toolNames.some((n) => n.startsWith("files."))).toBe(false); // `files` was registered but not requested
+  });
+
+  test("registers sub-agents as agent-<key> tools", async () => {
+    const plugin = instantiate({
+      dir: false,
+      agents: {
+        supervisor: {
+          instructions: "Supervise",
+          model: stubAdapter(),
+          agents: {
+            worker: {
+              instructions: "Work",
+              model: stubAdapter(),
+            },
+          },
+        },
+      },
+    });
+    await plugin.setup();
+
+    const api = plugin.exports() as {
+      get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+    };
+    const sup = api.get("supervisor");
+    expect(sup?.toolIndex.has("agent-worker")).toBe(true); // sub-agent key "worker" shows up as tool "agent-worker"
+  });
+
+  test("isToolkitEntry type guard recognizes toolkit entries", () => {
+    const entry: ToolkitEntry = {
+      __toolkitRef: true,
+      pluginName: "x",
+      localName: "y",
+      def: { name: "x.y", description: "", parameters: { type: "object" } },
+    };
+    expect(isToolkitEntry(entry)).toBe(true);
+    expect(isToolkitEntry({ foo: 1 })).toBe(false);
+    expect(isToolkitEntry(null)).toBe(false);
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/create-agent.test.ts b/packages/appkit/src/plugins/agents/tests/create-agent.test.ts
new file mode 100644
index 00000000..3822897f
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/create-agent.test.ts
@@ -0,0 +1,75 @@
+import { describe, expect, test } from "vitest";
+import { z } from "zod";
+import { createAgent } from "../../../core/create-agent-def";
+import { tool } from "../tools/tool";
+import type { AgentDefinition } from "../types";
+
+describe("createAgent", () => {
+  test("returns the definition unchanged for a simple agent", () => {
+    const def: AgentDefinition = {
+      name: "support",
+      instructions: "You help customers.",
+      model: "endpoint-x",
+    };
+    const result = createAgent(def);
+    expect(result).toBe(def); // same object identity, not a copy
+  });
+
+  test("accepts tools as a keyed record", () => {
+    const get_weather = tool({
+      name: "get_weather",
+      description: "Get the weather",
+      schema: z.object({ city: z.string() }),
+      execute: async ({ city }) => `Sunny in ${city}`,
+    });
+
+    const def = createAgent({
+      instructions: "...",
+      tools: { get_weather },
+    });
+
+    expect(def.tools?.get_weather).toBe(get_weather);
+  });
+
+  test("accepts sub-agents in a keyed record", () => {
+    const researcher = createAgent({ instructions: "Research." });
+    const supervisor = createAgent({
+      instructions: "Supervise.",
+      agents: { researcher },
+    });
+    expect(supervisor.agents?.researcher).toBe(researcher);
+  });
+
+  test("throws on a direct self-cycle", () => {
+    const a: AgentDefinition = { instructions: "a" };
+    // biome-ignore lint/suspicious/noExplicitAny: intentional cycle setup for test
+    (a as any).agents = { self: a };
+    expect(() => createAgent(a)).toThrow(/cycle/i);
+  });
+
+  test("throws on an indirect cycle", () => {
+    const a: AgentDefinition = { instructions: "a" };
+    const b: AgentDefinition = { instructions: "b" };
+    a.agents = { b }; // a -> b
+    b.agents = { a }; // b -> a closes the loop
+    expect(() => createAgent(a)).toThrow(/cycle/i);
+  });
+
+  test("accepts a DAG of sub-agents without throwing", () => {
+    const leaf: AgentDefinition = { instructions: "leaf" }; // shared by both branches below
+    const branchA: AgentDefinition = {
+      instructions: "a",
+      agents: { leaf },
+    };
+    const branchB: AgentDefinition = {
+      instructions: "b",
+      agents: { leaf },
+    };
+    const root = createAgent({
+      instructions: "root",
+      agents: { branchA, branchB },
+    });
+    expect(root.agents?.branchA.agents?.leaf).toBe(leaf);
+    expect(root.agents?.branchB.agents?.leaf).toBe(leaf);
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/event-translator.test.ts b/packages/appkit/src/plugins/agents/tests/event-translator.test.ts
new file mode 100644
index 00000000..eda72ebb
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/event-translator.test.ts
@@ -0,0 +1,204 @@
+import { describe, expect, test } from "vitest";
+import { AgentEventTranslator } from "../event-translator";
+
+describe("AgentEventTranslator", () => {
+  test("translates message_delta to output_item.added + output_text.delta on first delta", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "message_delta",
+      content: "Hello",
+    });
+
+    expect(events).toHaveLength(2);
+    expect(events[0].type).toBe("response.output_item.added");
+    expect(events[1].type).toBe("response.output_text.delta");
+
+    if (events[1].type === "response.output_text.delta") {
+      expect(events[1].delta).toBe("Hello");
+    }
+  });
+
+  test("subsequent message_delta only produces output_text.delta", () => {
+    const translator = new AgentEventTranslator();
+    translator.translate({ type: "message_delta", content: "Hello" });
+    const events = translator.translate({
+      type: "message_delta",
+      content: " world",
+    });
+
+    expect(events).toHaveLength(1);
+    expect(events[0].type).toBe("response.output_text.delta");
+  });
+
+  test("sequence_number is monotonically increasing", () => {
+    const translator = new AgentEventTranslator();
+    const e1 = translator.translate({ type: "message_delta", content: "a" });
+    const e2 = translator.translate({ type: "message_delta", content: "b" });
+    const e3 = translator.finalize();
+
+    const allSeqs = [...e1, ...e2, ...e3].map((e) =>
+      "sequence_number" in e ? e.sequence_number : -1,
+    );
+
+    for (let i = 1; i < allSeqs.length; i++) {
+      expect(allSeqs[i]).toBeGreaterThan(allSeqs[i - 1]);
+    }
+  });
+
+  test("translates tool_call to paired output_item.added + output_item.done", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "tool_call",
+      callId: "call_1",
+      name: "analytics.query",
+      args: { sql: "SELECT 1" },
+    });
+
+    expect(events).toHaveLength(2);
+    expect(events[0].type).toBe("response.output_item.added");
+    expect(events[1].type).toBe("response.output_item.done");
+
+    if (events[0].type === "response.output_item.added") {
+      expect(events[0].item.type).toBe("function_call");
+      if (events[0].item.type === "function_call") {
+        expect(events[0].item.name).toBe("analytics.query");
+        expect(events[0].item.call_id).toBe("call_1");
+      }
+    }
+  });
+
+  test("translates tool_result to paired output_item events", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "tool_result",
+      callId: "call_1",
+      result: { rows: 42 },
+    });
+
+    expect(events).toHaveLength(2);
+    expect(events[0].type).toBe("response.output_item.added");
+
+    if (events[0].type === "response.output_item.added") {
+      expect(events[0].item.type).toBe("function_call_output");
+    }
+  });
+
+  test("translates tool_result error", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "tool_result",
+      callId: "call_1",
+      result: null,
+      error: "Query failed",
+    });
+
+    // Assert unconditionally: a type-guarded `if` would let this test pass
+    // without checking anything if the translator emitted another event shape.
+    expect(events[0]).toMatchObject({
+      type: "response.output_item.added",
+      item: { type: "function_call_output", output: "Query failed" },
+    });
+  });
+
+  test("translates thinking to appkit.thinking extension event", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "thinking",
+      content: "Let me think about this...",
+    });
+
+    expect(events).toHaveLength(1);
+    expect(events[0].type).toBe("appkit.thinking");
+    if (events[0].type === "appkit.thinking") {
+      expect(events[0].content).toBe("Let me think about this...");
+    }
+  });
+
+  test("translates metadata to appkit.metadata extension event", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "metadata",
+      data: { threadId: "t-123" },
+    });
+
+    expect(events).toHaveLength(1);
+    expect(events[0].type).toBe("appkit.metadata");
+    if (events[0].type === "appkit.metadata") {
+      expect(events[0].data.threadId).toBe("t-123");
+    }
+  });
+
+  test("status:complete triggers finalize with response.completed", () => {
+    const translator = new AgentEventTranslator();
+    translator.translate({ type: "message_delta", content: "Hi" });
+    const events = translator.translate({ type: "status", status: "complete" });
+
+    const types = events.map((e) => e.type);
+    expect(types).toContain("response.output_item.done");
+    expect(types).toContain("response.completed");
+  });
+
+  test("status:error emits error + response.failed", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.translate({
+      type: "status",
+      status: "error",
+      error: "Something broke",
+    });
+
+    expect(events).toHaveLength(2);
+    expect(events[0].type).toBe("error");
+    expect(events[1].type).toBe("response.failed");
+
+    if (events[0].type === "error") {
+      expect(events[0].error).toBe("Something broke");
+    }
+  });
+
+  test("finalize produces response.completed", () => {
+    const translator = new AgentEventTranslator();
+    const events = translator.finalize();
+
+    expect(events.some((e) => e.type === "response.completed")).toBe(true);
+  });
+
+  test("finalize with accumulated message text produces output_item.done", () => {
+    const translator = new AgentEventTranslator();
+    translator.translate({ type: "message_delta", content: "Hello " });
+    translator.translate({ type: "message_delta", content: "world" });
+    const events = translator.finalize();
+
+    const doneEvent = events.find(
+      (e) => e.type === "response.output_item.done",
+    );
+    expect(doneEvent).toBeDefined();
+    if (
+      doneEvent?.type === "response.output_item.done" &&
+      doneEvent.item.type === "message"
+    ) {
+      expect(doneEvent.item.content[0].text).toBe("Hello world");
+    }
+  });
+
+  test("output_index increments for tool calls", () => {
+    const translator = new AgentEventTranslator();
+    const e1 = translator.translate({
+      type: "tool_call",
+      callId: "c1",
+      name: "tool1",
+      args: {},
+    });
+    const e2 = translator.translate({
+      type: "tool_result",
+      callId: "c1",
+      result: "ok",
+    });
+
+    // Pin the event types first so the index comparison can never be skipped.
+    expect(e1[0].type).toBe("response.output_item.added");
+    expect(e2[0].type).toBe("response.output_item.added");
+    const outputIndex = (e: (typeof e1)[number]) =>
+      "output_index" in e ? e.output_index : Number.NaN;
+    expect(outputIndex(e2[0])).toBeGreaterThan(outputIndex(e1[0]));
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/load-agents.test.ts b/packages/appkit/src/plugins/agents/tests/load-agents.test.ts
new file mode 100644
index 00000000..5a7b1253
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/load-agents.test.ts
@@ -0,0 +1,150 @@
+import fs from "node:fs";
+import os from "node:os";
+import path from "node:path";
+import { afterEach, beforeEach, describe, expect, test } from "vitest";
+import { z } from "zod";
+import { buildToolkitEntries } from "../build-toolkit";
+import {
+  loadAgentFromFile,
+  loadAgentsFromDir,
+  parseFrontmatter,
+} from "../load-agents";
+import { defineTool, type ToolRegistry } from "../tools/define-tool";
+import { tool } from "../tools/tool";
+
+let workDir: string;
+
+beforeEach(() => {
+  workDir = fs.mkdtempSync(path.join(os.tmpdir(), "agents-test-"));
+});
+
+afterEach(() => {
+  fs.rmSync(workDir, { recursive: true, force: true });
+});
+
+function write(name: string, content: string) {
+  fs.writeFileSync(path.join(workDir, name), content, "utf-8");
+  return path.join(workDir, name);
+}
+
+describe("parseFrontmatter", () => {
+  test("parses a simple object", () => {
+    const { data, content } = parseFrontmatter(
+      "---\nendpoint: foo\ndefault: true\n---\nHello body",
+    );
+    expect(data).toEqual({ endpoint: "foo", default: true });
+    expect(content).toBe("Hello body");
+  });
+
+  test("parses nested arrays", () => {
+    const { data } = parseFrontmatter(
+      "---\ntoolkits:\n  - analytics\n  - files: [uploads.list]\n---\nbody",
+    );
+    expect(data?.toolkits).toEqual(["analytics", { files: ["uploads.list"] }]);
+  });
+
+  test("returns null data when no frontmatter", () => {
+    const { data, content } = parseFrontmatter("No frontmatter here");
+    expect(data).toBeNull();
+    expect(content).toBe("No frontmatter here");
+  });
+
+  test("throws on invalid YAML", () => {
+    expect(() => parseFrontmatter("---\nkey: : : bad\n---\n")).toThrow(/YAML/);
+  });
+});
+
+describe("loadAgentFromFile", () => {
+  test("returns AgentDefinition with body as instructions", async () => {
+    const p = write(
+      "assistant.md",
+      "---\nendpoint: e-1\n---\nYou are helpful.",
+    );
+    const def = await loadAgentFromFile(p, {});
+    expect(def.name).toBe("assistant");
+    expect(def.instructions).toBe("You are helpful.");
+    expect(def.model).toBe("e-1");
+  });
+});
+
+describe("loadAgentsFromDir", () => {
+  test("returns empty map when dir doesn't exist", async () => {
+    const res = await loadAgentsFromDir("/nonexistent-for-tests", {});
+    expect(res.defs).toEqual({});
+    expect(res.defaultAgent).toBeNull();
+  });
+
+  test("loads all .md files keyed by file-stem", async () => {
+    write("support.md", "---\nendpoint: e-1\n---\nSupport prompt.");
+    write("sales.md", "---\nendpoint: e-2\n---\nSales prompt.");
+    const res = await loadAgentsFromDir(workDir, {});
+    expect(Object.keys(res.defs).sort()).toEqual(["sales", "support"]);
+  });
+
+  test("picks up default: true from frontmatter", async () => {
+    write("one.md", "---\nendpoint: a\n---\nOne.");
+    write("two.md", "---\nendpoint: b\ndefault: true\n---\nTwo.");
+    const res = await loadAgentsFromDir(workDir, {});
+    expect(res.defaultAgent).toBe("two");
+  });
+
+  test("throws when frontmatter references an unregistered plugin", async () => {
+    write(
+      "broken.md",
+      "---\nendpoint: e\ntoolkits: [missing]\n---\nBroken agent.",
+    );
+    await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
+      /references toolkit 'missing'/,
+    );
+  });
+
+  test("throws when frontmatter references an unknown ambient tool", async () => {
+    write("broken.md", "---\nendpoint: e\ntools: [unknown_tool]\n---\nBroken.");
+    await expect(loadAgentsFromDir(workDir, {})).rejects.toThrow(
+      /references tool 'unknown_tool'/,
+    );
+  });
+
+  test("resolves toolkits + ambient tools when provided", async () => {
+    const registry: ToolRegistry = {
+      query: defineTool({
+        description: "q",
+        schema: z.object({ sql: z.string() }),
+        handler: () => "ok",
+      }),
+    };
+    const plugins = new Map<
+      string,
+      { toolkit: (opts?: unknown) => Record<string, unknown> }
+    >([
+      [
+        "analytics",
+        {
+          toolkit: (opts) =>
+            buildToolkitEntries("analytics", registry, opts as never),
+        },
+      ],
+    ]);
+
+    const weather = tool({
+      name: "get_weather",
+      description: "Weather",
+      schema: z.object({ city: z.string() }),
+      execute: async () => "sunny",
+    });
+
+    write(
+      "analyst.md",
+      "---\nendpoint: e\ntoolkits:\n  - analytics\ntools:\n  - get_weather\n---\nBody.",
+    );
+    const res = await loadAgentsFromDir(workDir, {
+      plugins,
+      availableTools: { get_weather: weather },
+    });
+    expect(res.defs.analyst.tools).toBeDefined();
+    expect(Object.keys(res.defs.analyst.tools ?? {}).sort()).toEqual([
+      "analytics.query",
+      "get_weather",
+    ]);
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/run-agent.test.ts b/packages/appkit/src/plugins/agents/tests/run-agent.test.ts
new file mode 100644
index 00000000..1a974811
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/run-agent.test.ts
@@ -0,0 +1,120 @@
+import type {
+  AgentAdapter,
+  AgentEvent,
+  AgentInput,
+  AgentRunContext,
+} from "shared";
+import { describe, expect, test, vi } from "vitest";
+import { z } from "zod";
+import { createAgent } from "../../../core/create-agent-def";
+import { runAgent } from "../../../core/run-agent";
+import { tool } from "../tools/tool";
+import type { ToolkitEntry } from "../types";
+
+function scriptedAdapter(events: AgentEvent[]): AgentAdapter {
+  return {
+    async *run(_input: AgentInput, _context: AgentRunContext) {
+      for (const event of events) {
+        yield event;
+      }
+    },
+  };
+}
+
+describe("runAgent", () => {
+  test("drives the adapter and returns aggregated text", async () => {
+    const events: AgentEvent[] = [
+      { type: "message_delta", content: "Hello " },
+      { type: "message_delta", content: "world" },
+      { type: "status", status: "complete" },
+    ];
+    const def = createAgent({
+      instructions: "Say hello",
+      model: scriptedAdapter(events),
+    });
+
+    const result = await runAgent(def, { messages: "hi" });
+    expect(result.text).toBe("Hello world");
+    expect(result.events).toHaveLength(3);
+  });
+
+  test("prefers terminal 'message' event over deltas when present", async () => {
+    const events: AgentEvent[] = [
+      { type: "message_delta", content: "partial" },
+      { type: "message", content: "final answer" },
+    ];
+    const def = createAgent({
+      instructions: "x",
+      model: scriptedAdapter(events),
+    });
+    const result = await runAgent(def, { messages: "hi" });
+    expect(result.text).toBe("final answer");
+  });
+
+  test("invokes inline tools via executeTool callback", async () => {
+    const weatherFn = vi.fn(async () => "Sunny in NYC");
+    const weather = tool({
+      name: "get_weather",
+      description: "Weather",
+      schema: z.object({ city: z.string() }),
+      execute: weatherFn,
+    });
+
+    let capturedCtx: AgentRunContext | null = null;
+    const adapter: AgentAdapter = {
+      async *run(_input, context) {
+        capturedCtx = context;
+        yield { type: "message_delta", content: "" };
+      },
+    };
+
+    const def = createAgent({
+      instructions: "x",
+      model: adapter,
+      tools: { get_weather: weather },
+    });
+
+    await runAgent(def, { messages: "hi" });
+    expect(capturedCtx).not.toBeNull();
+    // biome-ignore lint/style/noNonNullAssertion: asserted above
+    const result = await capturedCtx!.executeTool("get_weather", {
+      city: "NYC",
+    });
+    expect(result).toBe("Sunny in NYC");
+    expect(weatherFn).toHaveBeenCalledWith({ city: "NYC" });
+  });
+
+  test("throws a clear error when a ToolkitEntry is invoked", async () => {
+    const toolkitEntry: ToolkitEntry = {
+      __toolkitRef: true,
+      pluginName: "analytics",
+      localName: "query",
+      def: {
+        name: "analytics.query",
+        description: "SQL",
+        parameters: { type: "object", properties: {} },
+      },
+    };
+
+    let capturedCtx: AgentRunContext | null = null;
+    const adapter: AgentAdapter = {
+      async *run(_input, context) {
+        capturedCtx = context;
+        yield { type: "message_delta", content: "" };
+      },
+    };
+
+    const def = createAgent({
+      instructions: "x",
+      model: adapter,
+      tools: { "analytics.query": toolkitEntry },
+    });
+
+    await runAgent(def, { messages: "hi" });
+    expect(capturedCtx).not.toBeNull();
+    await expect(
+      // biome-ignore lint/style/noNonNullAssertion: asserted above
+      capturedCtx!.executeTool("analytics.query", {}),
+    ).rejects.toThrow(/only usable via createApp/);
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/system-prompt.test.ts b/packages/appkit/src/plugins/agents/tests/system-prompt.test.ts
new file mode 100644
index 00000000..83bf8e19
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/system-prompt.test.ts
@@ -0,0 +1,45 @@
+import { describe, expect, test } from "vitest";
+import { buildBaseSystemPrompt, composeSystemPrompt } from "../system-prompt";
+
+describe("buildBaseSystemPrompt", () => {
+  test("includes plugin names", () => {
+    const prompt = buildBaseSystemPrompt(["analytics", "files", "genie"]);
+    expect(prompt).toContain("Active plugins: analytics, files, genie");
+  });
+
+  test("includes guidelines", () => {
+    const prompt = buildBaseSystemPrompt([]);
+    expect(prompt).toContain("Guidelines:");
+    expect(prompt).toContain("Databricks SQL");
+    expect(prompt).toContain("summarize key findings");
+  });
+
+  test("works with no plugins", () => {
+    const prompt = buildBaseSystemPrompt([]);
+    expect(prompt).toContain("AI assistant running on Databricks AppKit");
+    expect(prompt).not.toContain("Active plugins:");
+  });
+
+  test("does NOT include individual tool names", () => {
+    const prompt = buildBaseSystemPrompt(["analytics"]);
+    expect(prompt).not.toContain("analytics.query");
+    expect(prompt).not.toContain("Available tools:");
+  });
+});
+
+describe("composeSystemPrompt", () => {
+  test("concatenates base + agent prompt with double newline", () => {
+    const composed = composeSystemPrompt("Base prompt.", "Agent prompt.");
+    expect(composed).toBe("Base prompt.\n\nAgent prompt.");
+  });
+
+  test("returns base prompt alone when no agent prompt", () => {
+    const composed = composeSystemPrompt("Base prompt.");
+    expect(composed).toBe("Base prompt.");
+  });
+
+  test("returns base prompt when agent prompt is empty string", () => {
+    const composed = composeSystemPrompt("Base prompt.", "");
+    expect(composed).toBe("Base prompt.");
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/thread-store.test.ts b/packages/appkit/src/plugins/agents/tests/thread-store.test.ts
new file mode 100644
index 00000000..ed4f70ba
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/thread-store.test.ts
@@ -0,0 +1,138 @@
+import { describe, expect, test } from "vitest";
+import { InMemoryThreadStore } from "../thread-store";
+
+describe("InMemoryThreadStore", () => {
+  test("create() returns a new thread with the given userId", async () => {
+    const store = new InMemoryThreadStore();
+    const thread = await store.create("user-1");
+
+    expect(thread.id).toBeDefined();
+    expect(thread.userId).toBe("user-1");
+    expect(thread.messages).toEqual([]);
+    expect(thread.createdAt).toBeInstanceOf(Date);
+    expect(thread.updatedAt).toBeInstanceOf(Date);
+  });
+
+  test("get() returns the thread for the correct user", async () => {
+    const store = new InMemoryThreadStore();
+    const thread = await store.create("user-1");
+
+    const retrieved = await store.get(thread.id, "user-1");
+    expect(retrieved).toEqual(thread);
+  });
+
+  test("get() returns null for wrong user", async () => {
+    const store = new InMemoryThreadStore();
+    const thread = await store.create("user-1");
+
+    const retrieved = await store.get(thread.id, "user-2");
+    expect(retrieved).toBeNull();
+  });
+
+  test("get() returns null for non-existent thread", async () => {
+    const store = new InMemoryThreadStore();
+    const retrieved = await store.get("non-existent", "user-1");
+    expect(retrieved).toBeNull();
+  });
+
+  test("list() returns threads sorted by updatedAt desc", async () => {
+    const store = new InMemoryThreadStore();
+    const t1 = await store.create("user-1");
+    const t2 = await store.create("user-1");
+
+    // Touch the thread inserted last, after a delay so its timestamp is newer:
+    // insertion order is [t1, t2], so only a desc sort can put t2 first.
+    await new Promise((r) => setTimeout(r, 5));
+    await store.addMessage(t2.id, "user-1", {
+      id: "msg-1",
+      role: "user",
+      content: "hello",
+      createdAt: new Date(),
+    });
+
+    const threads = await store.list("user-1");
+    expect(threads.map((t) => t.id)).toEqual([t2.id, t1.id]);
+  });
+
+  test("list() returns empty for unknown user", async () => {
+    const store = new InMemoryThreadStore();
+    await store.create("user-1");
+
+    const threads = await store.list("user-2");
+    expect(threads).toEqual([]);
+  });
+
+  test("addMessage() appends to thread and updates timestamp", async () => {
+    const store = new InMemoryThreadStore();
+    const thread = await store.create("user-1");
+    const originalUpdatedAt = thread.updatedAt;
+
+    // Small delay so the refreshed timestamp is strictly later than creation
+    await new Promise((r) => setTimeout(r, 5));
+
+    await store.addMessage(thread.id, "user-1", {
+      id: "msg-1",
+      role: "user",
+      content: "hello",
+      createdAt: new Date(),
+    });
+
+    const updated = await store.get(thread.id, "user-1");
+    expect(updated?.messages).toHaveLength(1);
+    expect(updated?.messages[0].content).toBe("hello");
+    expect(updated?.updatedAt.getTime()).toBeGreaterThan(
+      originalUpdatedAt.getTime(),
+    );
+  });
+
+  test("addMessage() throws for non-existent thread", async () => {
+    const store = new InMemoryThreadStore();
+
+    await expect(
+      store.addMessage("non-existent", "user-1", {
+        id: "msg-1",
+        role: "user",
+        content: "hello",
+        createdAt: new Date(),
+      }),
+    ).rejects.toThrow("Thread non-existent not found");
+  });
+
+  test("delete() removes a thread and returns true", async () => {
+    const store = new InMemoryThreadStore();
+    const thread = await store.create("user-1");
+
+    const deleted = await store.delete(thread.id, "user-1");
+    expect(deleted).toBe(true);
+
+    const retrieved = await store.get(thread.id, "user-1");
+    expect(retrieved).toBeNull();
+  });
+
+  test("delete() returns false for non-existent thread", async () => {
+    const store = new InMemoryThreadStore();
+    const deleted = await store.delete("non-existent", "user-1");
+    expect(deleted).toBe(false);
+  });
+
+  test("delete() returns false for wrong user", async () => {
+    const store = new InMemoryThreadStore();
+    const thread = await store.create("user-1");
+
+    const deleted = await store.delete(thread.id, "user-2");
+    expect(deleted).toBe(false);
+  });
+
+  test("threads are isolated per user", async () => {
+    const store = new InMemoryThreadStore();
+    await store.create("user-1");
+    await store.create("user-1");
+    await store.create("user-2");
+
+    const user1Threads = await store.list("user-1");
+    const user2Threads = await store.list("user-2");
+
+    expect(user1Threads).toHaveLength(2);
+    expect(user2Threads).toHaveLength(1);
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/thread-store.ts b/packages/appkit/src/plugins/agents/thread-store.ts
new file mode 100644
index 00000000..f3ca0599
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/thread-store.ts
@@ -0,0 +1,74 @@
+import { randomUUID } from "node:crypto";
+import type { Message, Thread, ThreadStore } from "shared";
+
+/**
+ * In-memory thread store backed by a nested Map.
+ *
+ * Outer key: userId, inner key: threadId.
+ * Suitable for development and single-instance deployments.
+ *
+ * Only `create()` allocates a per-user bucket. Lookups, appends, and deletes
+ * never create one, so probing with unknown user IDs cannot grow the outer
+ * map, and a bucket is dropped once its last thread is deleted.
+ */
+export class InMemoryThreadStore implements ThreadStore {
+  private readonly store = new Map<string, Map<string, Thread>>();
+
+  /** Creates an empty thread owned by `userId`, stores it, and returns it. */
+  async create(userId: string): Promise<Thread> {
+    const now = new Date();
+    const thread: Thread = {
+      id: randomUUID(),
+      userId,
+      messages: [],
+      createdAt: now,
+      updatedAt: now,
+    };
+    let threads = this.store.get(userId);
+    if (!threads) {
+      threads = new Map();
+      this.store.set(userId, threads);
+    }
+    threads.set(thread.id, thread);
+    return thread;
+  }
+
+  /** Returns the thread, or `null` when `userId` has no thread with that id. */
+  async get(threadId: string, userId: string): Promise<Thread | null> {
+    return this.store.get(userId)?.get(threadId) ?? null;
+  }
+
+  /** Returns the user's threads, most recently updated first. */
+  async list(userId: string): Promise<Thread[]> {
+    const threads = this.store.get(userId);
+    if (!threads) return [];
+    return Array.from(threads.values()).sort(
+      (a, b) => b.updatedAt.getTime() - a.updatedAt.getTime(),
+    );
+  }
+
+  /**
+   * Appends `message` to the thread and refreshes its `updatedAt`.
+   *
+   * @throws Error when `userId` has no thread with that id.
+   */
+  async addMessage(
+    threadId: string,
+    userId: string,
+    message: Message,
+  ): Promise<void> {
+    const thread = this.store.get(userId)?.get(threadId);
+    if (!thread) throw new Error(`Thread ${threadId} not found`);
+    thread.messages.push(message);
+    thread.updatedAt = new Date();
+  }
+
+  /** Deletes the thread; returns `false` when `userId` has no such thread. */
+  async delete(threadId: string, userId: string): Promise<boolean> {
+    const threads = this.store.get(userId);
+    if (!threads || !threads.delete(threadId)) return false;
+    // Drop the emptied bucket so the outer map only tracks users with threads.
+    if (threads.size === 0) this.store.delete(userId);
+    return true;
+  }
+}
diff --git a/packages/appkit/src/plugins/agents/types.ts b/packages/appkit/src/plugins/agents/types.ts
index 861be26d..4963a52a 100644
--- a/packages/appkit/src/plugins/agents/types.ts
+++ b/packages/appkit/src/plugins/agents/types.ts
@@ -1,4 +1,10 @@
-import type { AgentToolDefinition, ToolAnnotations } from "shared";
+import type {
+  AgentAdapter,
+  AgentToolDefinition,
+  BasePluginConfig,
+  ThreadStore,
+  ToolAnnotations,
+} from "shared";
 import type { FunctionTool } from "./tools/function-tool";
 import type { HostedTool } from "./tools/hosted-tools";
 
@@ -35,8 +41,108 @@ export interface ToolkitOptions {
 }
 
 /**
- * Type guard for `ToolkitEntry` — used to differentiate toolkit references
- * from inline tools in a mixed `tools` record.
+ * Context passed to `baseSystemPrompt` callbacks.
+ */
+export interface PromptContext {
+  agentName: string;
+  pluginNames: string[];
+  toolNames: string[];
+}
+
+export type BaseSystemPromptOption =
+  | false
+  | string
+  | ((ctx: PromptContext) => string);
+
+export interface AgentDefinition {
+  /** Filled in from the enclosing key when used in `agents: { foo: def }`. */
+  name?: string;
+  /** System prompt body. For markdown-loaded agents this is the file body. */
+  instructions: string;
+  /**
+   * Model adapter (or endpoint-name string sugar for
+   * `DatabricksAdapter.fromServingEndpoint({ endpointName })`). Optional —
+   * falls back to the plugin's `defaultModel`.
+   */
+  model?: AgentAdapter | Promise<AgentAdapter> | string;
+  /** Per-agent tool record. Key is the LLM-visible tool-call name. */
+  tools?: Record<string, AgentTool>;
+  /** Sub-agents, exposed as `agent-<key>` tools on this agent. */
+  agents?: Record<string, AgentDefinition>;
+  /** Override the plugin's baseSystemPrompt for this agent only. */
+  baseSystemPrompt?: BaseSystemPromptOption;
+  maxSteps?: number;
+  maxTokens?: number;
+}
+
+/**
+ * Asymmetric auto-inherit configuration. `true` on either side means "spread
+ * every registered ToolProvider plugin's toolkit() output into this agent's
+ * tool record when it declares no explicit tools/toolkits".
+ */
+export interface AutoInheritToolsConfig {
+  /** Default for agents loaded from markdown files. Default: `true`. */
+  file?: boolean;
+  /** Default for code-defined agents (via `agents: { foo: createAgent(...) }`). Default: `false`. */
+  code?: boolean;
+}
+
+export interface AgentsPluginConfig extends BasePluginConfig {
+  /** Directory to scan for markdown agent files. Default `./config/agents`. Set to `false` to disable. */
+  dir?: string | false;
+  /** Code-defined agents, merged with file-loaded ones (code wins on key collision). */
+  agents?: Record<string, AgentDefinition>;
+  /** Agent used when clients don't specify one. Defaults to the first-registered agent or the file with `default: true` frontmatter. */
+  defaultAgent?: string;
+  /** Default model for agents that don't specify their own (in code or frontmatter). */
+  defaultModel?: AgentAdapter | Promise<AgentAdapter> | string;
+  /** Ambient tool library. Keys may be referenced by markdown frontmatter via `tools: [key1, key2]`. */
+  tools?: Record<string, AgentTool>;
+  /** Whether to auto-inherit every ToolProvider plugin's toolkit. Accepts a boolean shorthand. */
+  autoInheritTools?: boolean | AutoInheritToolsConfig;
+  /** Persistent thread store. Default: in-memory. */
+  threadStore?: ThreadStore;
+  /** Customize or disable the AppKit base system prompt. */
+  baseSystemPrompt?: BaseSystemPromptOption;
+}
+
+/** Internal tool-index entry after a tool record has been resolved to a dispatchable form. */
+export type ResolvedToolEntry =
+  | {
+      source: "toolkit";
+      pluginName: string;
+      localName: string;
+      def: AgentToolDefinition;
+    }
+  | {
+      source: "function";
+      functionTool: FunctionTool;
+      def: AgentToolDefinition;
+    }
+  | {
+      source: "mcp";
+      mcpToolName: string;
+      def: AgentToolDefinition;
+    }
+  | {
+      source: "subagent";
+      agentName: string;
+      def: AgentToolDefinition;
+    };
+
+export interface RegisteredAgent {
+  name: string;
+  instructions: string;
+  adapter: AgentAdapter;
+  toolIndex: Map<string, ResolvedToolEntry>;
+  baseSystemPrompt?: BaseSystemPromptOption;
+  maxSteps?: number;
+  maxTokens?: number;
+}
+
+/**
+ * Type guard for `ToolkitEntry` — used by the agents plugin to differentiate
+ * toolkit references from inline tools in a mixed `tools` record.
  */
 export function isToolkitEntry(value: unknown): value is ToolkitEntry {
   return (
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index 16079b1d..307f44cf 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -305,6 +305,9 @@ importers:
       express:
         specifier: 4.22.0
         version: 4.22.0
+      js-yaml:
+        specifier: ^4.1.1
+        version: 4.1.1
       obug:
         specifier: 2.1.1
         version: 2.1.1
@@ -339,6 +342,9 @@ importers:
       '@types/express':
         specifier: 4.17.25
         version: 4.17.25
+      '@types/js-yaml':
+        specifier: ^4.0.9
+        version: 4.0.9
       '@types/json-schema':
         specifier: 7.0.15
         version: 7.0.15
@@ -4989,6 +4995,9 @@ packages:
   '@types/istanbul-reports@3.0.4':
     resolution: {integrity: sha512-pk2B1NWalF9toCRu6gjBzR69syFjP4Od8WRAX+0mmf9lAjCRicLOWc+ZrxZHx/0XRjotgkF9t6iaMJ+aXcOdZQ==}
 
+  '@types/js-yaml@4.0.9':
+    resolution: {integrity: sha512-k4MGaQl5TGo/iipqb2UDG2UwjXziSWkh0uysQelTlJpX1qGlpUZYm8PnO4DxG1qBomtJUdYJ6qR6xdIah10JLg==}
+
   '@types/jsesc@2.5.1':
     resolution: {integrity: sha512-9VN+6yxLOPLOav+7PwjZbxiID2bVaeq0ED4qSQmdQTdjnXJSaCVKTR58t15oqH1H5t8Ng2ZX1SabJVoN9Q34bw==}
 
@@ -17421,6 +17430,8 @@ snapshots:
     dependencies:
       '@types/istanbul-lib-report': 3.0.3
 
+  '@types/js-yaml@4.0.9': {}
+
   '@types/jsesc@2.5.1': {}
 
   '@types/json-schema@7.0.15': {}

From 29e35345a212cb2350768a16447155bab301cbf4 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Tue, 21 Apr 2026 19:52:50 +0200
Subject: [PATCH 4/6] feat(appkit): fromPlugin() DX, runAgent plugins arg,
 shared toolkit-resolver
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

DX centerpiece. Introduces the symbol-marker pattern that collapses
plugin tool references in code-defined agents from a three-touch dance
to a single line, and extracts the shared resolver that the agents
plugin, auto-inherit, and standalone runAgent all now go through.

### `fromPlugin(factory, opts?)` — the marker

`packages/appkit/src/plugins/agents/from-plugin.ts`. Returns a spread-
friendly `{ [Symbol()]: FromPluginMarker }` record. The symbol key is
freshly generated per call, so multiple spreads of the same plugin
coexist safely. The marker's brand is a globally-interned
`Symbol.for("@databricks/appkit.fromPluginMarker")` — stable across
module boundaries.

### `resolveToolkitFromProvider(pluginName, provider, opts?)`

`packages/appkit/src/plugins/agents/toolkit-resolver.ts`. Single source
of truth for "turn a ToolProvider into a keyed record of `ToolkitEntry`
markers". Prefers `provider.toolkit(opts)` when available (core plugins
implement it), falls back to walking `getAgentTools()` and synthesizing
namespaced keys (`${pluginName}.${localName}`) for third-party
providers, honoring `only` / `except` / `rename` / `prefix` the same
way.

Used by three call sites, previously all copy-pasted:
1. `AgentsPlugin.buildToolIndex` — fromPlugin marker resolution pass
2. `AgentsPlugin.applyAutoInherit` — markdown auto-inherit path
3. `runAgent` — standalone-mode plugin tool dispatch

### `AgentsPlugin.buildToolIndex` — symbol-key resolution pass

Before the existing string-key iteration, `buildToolIndex` now walks
`Object.getOwnPropertySymbols(def.tools)`. For each `FromPluginMarker`,
it looks up the plugin by name in `PluginContext.getToolProviders()`,
calls `resolveToolkitFromProvider`, and merges the resulting entries
into the per-agent index. Missing plugins throw at setup time with a
clear `Available: ...` listing — wiring errors surface on boot, not
mid-request.

`hasExplicitTools` now counts symbol keys too, so a
`tools: { ...fromPlugin(x) }` record correctly disables auto-inherit
on code-defined agents.

### Type plumbing

- `AgentTools` type: `{ [key: string]: AgentTool } & { [key: symbol]:
  FromPluginMarker }`. Preserves string-key autocomplete while
  accepting marker spreads under strict TS.
- `AgentDefinition.tools` switched to `AgentTools`.

### `runAgent` gains `plugins?: PluginData[]`

`packages/appkit/src/core/run-agent.ts`. When an agent def contains
`fromPlugin` markers, the caller passes plugins via
`RunAgentInput.plugins`. `runAgent` constructs each referenced plugin
once per call (instances are cached by plugin name) and dispatches tool
calls via `provider.executeAgentTool()`. Tools run as the service
principal (no OBO — there's no HTTP request). If a def contains markers
but the referenced plugin is missing from `plugins`, it throws with an
`Available: …` listing.

### Exports

`fromPlugin`, `FromPluginMarker`, `isFromPluginMarker`, `AgentTools`
added to the main barrel.

### Test plan

- 14 new tests: marker shape, symbol uniqueness, type guard,
  factory-without-pluginName error, fromPlugin marker resolution in
  AgentsPlugin, fallback to getAgentTools for providers without
  .toolkit(), symbol-only tools disables auto-inherit, runAgent
  standalone marker resolution via `plugins` arg, guidance error when
  missing.
- Full appkit vitest suite: 1311 tests passing.
- Typecheck clean.

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 packages/appkit/src/core/run-agent.ts         | 145 +++++++++++-
 packages/appkit/src/index.ts                  |   4 +
 packages/appkit/src/plugins/agents/agents.ts  |  91 +++++---
 .../appkit/src/plugins/agents/from-plugin.ts  |  97 +++++++++
 packages/appkit/src/plugins/agents/index.ts   |   8 +
 .../agents/tests/agents-plugin.test.ts        | 206 ++++++++++++++++++
 .../plugins/agents/tests/from-plugin.test.ts  |  80 +++++++
 .../plugins/agents/tests/run-agent.test.ts    |  96 ++++++++
 .../src/plugins/agents/toolkit-resolver.ts    |  62 ++++++
 packages/appkit/src/plugins/agents/types.ts   |  13 +-
 10 files changed, 765 insertions(+), 37 deletions(-)
 create mode 100644 packages/appkit/src/plugins/agents/from-plugin.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/from-plugin.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/toolkit-resolver.ts

diff --git a/packages/appkit/src/core/run-agent.ts b/packages/appkit/src/core/run-agent.ts
index e83c2c9c..6bbed55f 100644
--- a/packages/appkit/src/core/run-agent.ts
+++ b/packages/appkit/src/core/run-agent.ts
@@ -4,7 +4,12 @@ import type {
   AgentEvent,
   AgentToolDefinition,
   Message,
+  PluginConstructor,
+  PluginData,
+  ToolProvider,
 } from "shared";
+import { isFromPluginMarker } from "../plugins/agents/from-plugin";
+import { resolveToolkitFromProvider } from "../plugins/agents/toolkit-resolver";
 import {
   type FunctionTool,
   functionToolToDefinition,
@@ -23,6 +28,14 @@ export interface RunAgentInput {
   messages: string | Message[];
   /** Abort signal for cancellation. */
   signal?: AbortSignal;
+  /**
+   * Optional plugin list used to resolve `fromPlugin` markers in `def.tools`.
+   * Required when the def contains any `...fromPlugin(factory)` spreads;
+   * ignored otherwise. `runAgent` constructs a fresh instance per plugin
+   * and dispatches tool calls against it as the service principal (no
+   * OBO — there is no HTTP request in standalone mode).
+   */
+  plugins?: PluginData<PluginConstructor, unknown, string>[];
 }
 
 export interface RunAgentResult {
@@ -39,11 +52,12 @@ export interface RunAgentResult {
  * Limitations vs. running through the agents() plugin:
  * - No OBO: there is no HTTP request, so plugin tools run as the service
  *   principal (when they work at all).
- * - Plugin tools (`ToolkitEntry`) are not supported — they require a live
- *   `PluginContext` that only exists when registered in a `createApp`
- *   instance. This function throws a clear error if encountered.
+ * - Hosted tools (MCP) are not supported — they require a live MCP client
+ *   that only exists inside the agents plugin.
  * - Sub-agents (`agents: { ... }` on the def) are executed as nested
  *   `runAgent` calls with no shared thread state.
+ * - Plugin tools must be declared with `fromPlugin` markers and resolved via
+ *   `RunAgentInput.plugins`; raw `ToolkitEntry` spreads cannot be dispatched.
  */
 export async function runAgent(
   def: AgentDefinition,
@@ -51,7 +65,7 @@ export async function runAgent(
 ): Promise<RunAgentResult> {
   const adapter = await resolveAdapter(def);
   const messages = normalizeMessages(input.messages, def.instructions);
-  const toolIndex = buildStandaloneToolIndex(def);
+  const toolIndex = buildStandaloneToolIndex(def, input.plugins ?? []);
   const tools = Array.from(toolIndex.values()).map((e) => e.def);
 
   const signal = input.signal;
@@ -62,6 +76,13 @@ export async function runAgent(
     if (entry.kind === "function") {
       return entry.tool.execute(args as Record<string, unknown>);
     }
+    if (entry.kind === "toolkit") {
+      return entry.provider.executeAgentTool(
+        entry.localName,
+        args as Record<string, unknown>,
+        signal,
+      );
+    }
     if (entry.kind === "subagent") {
       const subInput: RunAgentInput = {
         messages:
@@ -71,13 +92,14 @@ export async function runAgent(
             ? (args as { input: string }).input
             : JSON.stringify(args),
         signal,
+        plugins: input.plugins,
       };
       const res = await runAgent(entry.agentDef, subInput);
       return res.text;
     }
     throw new Error(
       `runAgent: tool "${name}" is a ${entry.kind} tool. ` +
-        "Plugin toolkits and MCP tools are only usable via createApp({ plugins: [..., agents(...)] }).",
+        "Hosted/MCP tools are only usable via createApp({ plugins: [..., agents(...)] }).",
     );
   };
 
@@ -158,20 +180,61 @@ type StandaloneEntry =
   | {
       kind: "toolkit";
       def: AgentToolDefinition;
-      entry: ToolkitEntry;
+      provider: ToolProvider;
+      pluginName: string;
+      localName: string;
     }
   | {
       kind: "hosted";
       def: AgentToolDefinition;
     };
 
+/**
+ * Resolves `def.tools` (string-keyed entries + symbol-keyed `fromPlugin`
+ * markers) and `def.agents` (sub-agents) into a flat dispatch index.
+ * Symbol-keyed markers are resolved against `plugins`; missing references
+ * throw with an `Available: …` listing.
+ */
 function buildStandaloneToolIndex(
   def: AgentDefinition,
+  plugins: PluginData<PluginConstructor, unknown, string>[],
 ): Map<string, StandaloneEntry> {
   const index = new Map<string, StandaloneEntry>();
+  const tools = def.tools;
 
-  for (const [key, tool] of Object.entries(def.tools ?? {})) {
-    index.set(key, classifyTool(key, tool));
+  const symbolKeys = tools ? Object.getOwnPropertySymbols(tools) : [];
+  if (symbolKeys.length > 0) {
+    const providerCache = new Map<string, ToolProvider>();
+    for (const sym of symbolKeys) {
+      const marker = (tools as Record<symbol, unknown>)[sym];
+      if (!isFromPluginMarker(marker)) continue;
+
+      const provider = resolveStandaloneProvider(
+        marker.pluginName,
+        plugins,
+        providerCache,
+      );
+      const entries = resolveToolkitFromProvider(
+        marker.pluginName,
+        provider,
+        marker.opts,
+      );
+      for (const [key, entry] of Object.entries(entries)) {
+        index.set(key, {
+          kind: "toolkit",
+          provider,
+          pluginName: entry.pluginName,
+          localName: entry.localName,
+          def: { ...entry.def, name: key },
+        });
+      }
+    }
+  }
+
+  if (tools) {
+    for (const [key, tool] of Object.entries(tools)) {
+      index.set(key, classifyTool(key, tool));
+    }
   }
 
   for (const [childKey, child] of Object.entries(def.agents ?? {})) {
@@ -203,7 +266,7 @@ function buildStandaloneToolIndex(
 
 function classifyTool(key: string, tool: AgentTool): StandaloneEntry {
   if (isToolkitEntry(tool)) {
-    return { kind: "toolkit", def: { ...tool.def, name: key }, entry: tool };
+    return toolkitEntryToStandalone(key, tool);
   }
   if (isFunctionTool(tool)) {
     return {
@@ -224,3 +287,67 @@ function classifyTool(key: string, tool: AgentTool): StandaloneEntry {
   }
   throw new Error(`runAgent: unrecognized tool shape at key "${key}"`);
 }
+
+/**
+ * Maps a string-keyed `ToolkitEntry` (for example from a module-scope
+ * `.toolkit()` spread) to a non-dispatchable `hosted` entry: no provider
+ * instance is attached, so `runAgent` rejects calls to it. The description
+ * gains a hint pointing at `fromPlugin(factory)` + `plugins: [...]`.
+ */
+function toolkitEntryToStandalone(
+  key: string,
+  entry: ToolkitEntry,
+): StandaloneEntry {
+  const def: AgentToolDefinition = { ...entry.def, name: key };
+  // Parenthesized so trim() covers the whole string, not only the last literal.
+  const description = (
+    `${def.description ?? ""} ` +
+    `[runAgent: this ToolkitEntry refers to plugin '${entry.pluginName}' but ` +
+    "runAgent cannot dispatch it without the plugin instance. Pass the " +
+    "plugin via plugins: [...] and use fromPlugin(factory) instead of " +
+    ".toolkit() spreads.]"
+  ).trim();
+  return {
+    kind: "hosted",
+    def: { ...def, description },
+  };
+}
+
+function resolveStandaloneProvider(
+  pluginName: string,
+  plugins: PluginData<PluginConstructor, unknown, string>[],
+  cache: Map<string, ToolProvider>,
+): ToolProvider {
+  const cached = cache.get(pluginName);
+  if (cached) return cached;
+
+  const match = plugins.find((p) => p.name === pluginName);
+  if (!match) {
+    const available = plugins.map((p) => p.name).join(", ") || "(none)";
+    throw new Error(
+      `runAgent: agent references plugin '${pluginName}' via fromPlugin(), but ` +
+        "that plugin is missing from RunAgentInput.plugins. " +
+        `Available: ${available}.`,
+    );
+  }
+
+  const instance = new match.plugin({
+    ...(match.config ?? {}),
+    name: pluginName,
+  });
+  const provider = instance as unknown as ToolProvider;
+  if (
+    typeof (provider as { getAgentTools?: unknown }).getAgentTools !==
+      "function" ||
+    typeof (provider as { executeAgentTool?: unknown }).executeAgentTool !==
+      "function"
+  ) {
+    throw new Error(
+      `runAgent: plugin '${pluginName}' is not a ToolProvider ` +
+        "(missing getAgentTools/executeAgentTool). Only ToolProvider plugins " +
+        "are supported via fromPlugin() in runAgent.",
+    );
+  }
+  cache.set(pluginName, provider);
+  return provider;
+}
diff --git a/packages/appkit/src/index.ts b/packages/appkit/src/index.ts
index dbefe3e5..6e643cc8 100644
--- a/packages/appkit/src/index.ts
+++ b/packages/appkit/src/index.ts
@@ -73,8 +73,12 @@ export {
   type AgentDefinition,
   type AgentsPluginConfig,
   type AgentTool,
+  type AgentTools,
   agents,
   type BaseSystemPromptOption,
+  type FromPluginMarker,
+  fromPlugin,
+  isFromPluginMarker,
   isToolkitEntry,
   loadAgentFromFile,
   loadAgentsFromDir,
diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index 03b9257c..c8758ac8 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -19,11 +19,13 @@ import { Plugin, toPlugin } from "../../plugin";
 import type { PluginManifest } from "../../registry";
 import { agentStreamDefaults } from "./defaults";
 import { AgentEventTranslator } from "./event-translator";
+import { isFromPluginMarker } from "./from-plugin";
 import { loadAgentsFromDir } from "./load-agents";
 import manifest from "./manifest.json";
 import { chatRequestSchema, invocationsRequestSchema } from "./schemas";
 import { buildBaseSystemPrompt, composeSystemPrompt } from "./system-prompt";
 import { InMemoryThreadStore } from "./thread-store";
+import { resolveToolkitFromProvider } from "./toolkit-resolver";
 import {
   AppKitMcpClient,
   type FunctionTool,
@@ -253,7 +255,11 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     src: AgentSource,
   ): Promise<Map<string, ResolvedToolEntry>> {
     const index = new Map<string, ResolvedToolEntry>();
-    const hasExplicitTools = def.tools && Object.keys(def.tools).length > 0;
+    const toolsRecord = def.tools ?? {};
+    const hasExplicitTools =
+      def.tools !== undefined &&
+      (Object.keys(toolsRecord).length > 0 ||
+        Object.getOwnPropertySymbols(toolsRecord).length > 0);
     const hasExplicitSubAgents =
       def.agents && Object.keys(def.agents).length > 0;
 
@@ -292,9 +298,13 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
       });
     }
 
-    // 2. Explicit tools (toolkit entries, function tools, hosted tools)
+    // 2. fromPlugin markers — resolve against registered ToolProviders first so
+    //    explicit string-keyed tools can still overwrite on the same key.
+    this.resolveFromPluginMarkers(agentName, toolsRecord, index);
+
+    // 3. Explicit tools (toolkit entries, function tools, hosted tools)
     const hostedToCollect: import("./tools/hosted-tools").HostedTool[] = [];
-    for (const [key, tool] of Object.entries(def.tools ?? {})) {
+    for (const [key, tool] of Object.entries(toolsRecord)) {
       if (isToolkitEntry(tool)) {
         index.set(key, {
           source: "toolkit",
@@ -338,31 +348,13 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
       provider,
     } of this.context.getToolProviders()) {
       if (pluginName === this.name) continue;
-      const withToolkit = provider as ToolProvider & {
-        toolkit?: (opts?: unknown) => Record<string, unknown>;
-      };
-      if (typeof withToolkit.toolkit === "function") {
-        const entries = withToolkit.toolkit() as Record<string, unknown>;
-        for (const [key, maybeEntry] of Object.entries(entries)) {
-          if (!isToolkitEntry(maybeEntry)) continue;
-          index.set(key, {
-            source: "toolkit",
-            pluginName: maybeEntry.pluginName,
-            localName: maybeEntry.localName,
-            def: { ...maybeEntry.def, name: key },
-          });
-        }
-        continue;
-      }
-      // Fallback: providers without a toolkit() still expose getAgentTools();
-      // dispatch goes through PluginContext.executeTool by plugin name.
-      for (const tool of provider.getAgentTools()) {
-        const qualifiedName = `${pluginName}.${tool.name}`;
-        index.set(qualifiedName, {
+      const entries = resolveToolkitFromProvider(pluginName, provider);
+      for (const [key, entry] of Object.entries(entries)) {
+        index.set(key, {
           source: "toolkit",
-          pluginName,
-          localName: tool.name,
-          def: { ...tool, name: qualifiedName },
+          pluginName: entry.pluginName,
+          localName: entry.localName,
+          def: { ...entry.def, name: key },
         });
       }
     }
@@ -376,6 +368,51 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     }
   }
 
+  /**
+   * Walks the symbol-keyed `fromPlugin` markers in an agent's `tools` record
+   * and resolves each one against a registered `ToolProvider`. Throws with a
+   * helpful `Available: …` listing if a referenced plugin isn't registered.
+   */
+  private resolveFromPluginMarkers(
+    agentName: string,
+    toolsRecord: Record<string | symbol, unknown>,
+    index: Map<string, ResolvedToolEntry>,
+  ): void {
+    const symbolKeys = Object.getOwnPropertySymbols(toolsRecord);
+    if (symbolKeys.length === 0) return;
+
+    const providers = this.context?.getToolProviders() ?? [];
+
+    for (const sym of symbolKeys) {
+      const marker = (toolsRecord as Record<symbol, unknown>)[sym];
+      if (!isFromPluginMarker(marker)) continue;
+
+      const providerEntry = providers.find((p) => p.name === marker.pluginName);
+      if (!providerEntry) {
+        const available = providers.map((p) => p.name).join(", ") || "(none)";
+        throw new Error(
+          `Agent '${agentName}' references plugin '${marker.pluginName}' via ` +
+            `fromPlugin(), but that plugin is not registered in createApp. ` +
+            `Available: ${available}.`,
+        );
+      }
+
+      const entries = resolveToolkitFromProvider(
+        marker.pluginName,
+        providerEntry.provider,
+        marker.opts,
+      );
+      for (const [key, entry] of Object.entries(entries)) {
+        index.set(key, {
+          source: "toolkit",
+          pluginName: entry.pluginName,
+          localName: entry.localName,
+          def: { ...entry.def, name: key },
+        });
+      }
+    }
+  }
+
   private async connectHostedTools(
     hostedTools: import("./tools/hosted-tools").HostedTool[],
     index: Map<string, ResolvedToolEntry>,
diff --git a/packages/appkit/src/plugins/agents/from-plugin.ts b/packages/appkit/src/plugins/agents/from-plugin.ts
new file mode 100644
index 00000000..b1128594
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/from-plugin.ts
@@ -0,0 +1,97 @@
+import type { NamedPluginFactory } from "../../plugin/to-plugin";
+import type { ToolkitOptions } from "./types";
+
+/**
+ * Symbol brand for the `fromPlugin` marker. Using a globally-interned symbol
+ * (`Symbol.for`) keeps the brand stable across module boundaries / bundle
+ * duplicates so `isFromPluginMarker` stays reliable.
+ */
+export const FROM_PLUGIN_MARKER = Symbol.for(
+  "@databricks/appkit.fromPluginMarker",
+);
+
+/**
+ * A lazy reference to a plugin's tools, produced by {@link fromPlugin} and
+ * resolved to concrete `ToolkitEntry`s at `AgentsPlugin.setup()` time.
+ *
+ * The marker is spread under a unique symbol key so multiple calls to
+ * `fromPlugin` (even for the same plugin) coexist in an `AgentDefinition.tools`
+ * record without colliding.
+ */
+export interface FromPluginMarker {
+  readonly [FROM_PLUGIN_MARKER]: true;
+  readonly pluginName: string;
+  readonly opts: ToolkitOptions | undefined;
+}
+
+/**
+ * Record shape returned by {@link fromPlugin} — a single symbol-keyed entry
+ * suitable for spreading into `AgentDefinition.tools`.
+ */
+export type FromPluginSpread = { readonly [key: symbol]: FromPluginMarker };
+
+/**
+ * Reference a plugin's tools inside an `AgentDefinition.tools` record without
+ * naming the plugin instance. The returned spread-friendly object carries a
+ * symbol-keyed marker that the agents plugin resolves against registered
+ * `ToolProvider`s at setup time.
+ *
+ * The factory argument must come from `toPlugin` (or any function that
+ * carries a `pluginName` field). `fromPlugin` reads `factory.pluginName`
+ * synchronously — it does not construct an instance.
+ *
+ * If the referenced plugin is also registered in `createApp({ plugins })`, the
+ * same runtime instance is used for dispatch. If the plugin is missing,
+ * `AgentsPlugin.setup()` throws with a clear `Available: …` listing.
+ *
+ * @example
+ * ```ts
+ * import { analytics, createAgent, files, fromPlugin, tool } from "@databricks/appkit";
+ *
+ * const support = createAgent({
+ *   instructions: "You help customers.",
+ *   tools: {
+ *     ...fromPlugin(analytics),
+ *     ...fromPlugin(files, { only: ["uploads.read"] }),
+ *     get_weather: tool({ ... }),
+ *   },
+ * });
+ * ```
+ *
+ * @param factory A plugin factory produced by `toPlugin`. Must expose a
+ *   `pluginName` field.
+ * @param opts Optional toolkit scoping — `prefix`, `only`, `except`, `rename`.
+ *   Same shape as the `.toolkit()` method.
+ */
+export function fromPlugin<F extends NamedPluginFactory>(
+  factory: F,
+  opts?: ToolkitOptions,
+): FromPluginSpread {
+  if (
+    !factory ||
+    typeof factory.pluginName !== "string" ||
+    !factory.pluginName
+  ) {
+    throw new Error(
+      "fromPlugin(): factory is missing pluginName. Pass a factory created by toPlugin().",
+    );
+  }
+  const pluginName = factory.pluginName;
+  const marker: FromPluginMarker = {
+    [FROM_PLUGIN_MARKER]: true,
+    pluginName,
+    opts,
+  };
+  return { [Symbol(`fromPlugin:${pluginName}`)]: marker };
+}
+
+/**
+ * Type guard for {@link FromPluginMarker}.
+ */
+export function isFromPluginMarker(value: unknown): value is FromPluginMarker {
+  return (
+    typeof value === "object" &&
+    value !== null &&
+    (value as Record<symbol, unknown>)[FROM_PLUGIN_MARKER] === true
+  );
+}
diff --git a/packages/appkit/src/plugins/agents/index.ts b/packages/appkit/src/plugins/agents/index.ts
index 1adc41c1..7adc49ff 100644
--- a/packages/appkit/src/plugins/agents/index.ts
+++ b/packages/appkit/src/plugins/agents/index.ts
@@ -1,5 +1,12 @@
 export { AgentsPlugin, agents } from "./agents";
 export { buildToolkitEntries } from "./build-toolkit";
+export {
+  FROM_PLUGIN_MARKER,
+  type FromPluginMarker,
+  type FromPluginSpread,
+  fromPlugin,
+  isFromPluginMarker,
+} from "./from-plugin";
 export {
   type LoadContext,
   type LoadResult,
@@ -11,6 +18,7 @@ export {
   type AgentDefinition,
   type AgentsPluginConfig,
   type AgentTool,
+  type AgentTools,
   type AutoInheritToolsConfig,
   type BaseSystemPromptOption,
   isToolkitEntry,
diff --git a/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts b/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
index 8116551e..b2152b61 100644
--- a/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
+++ b/packages/appkit/src/plugins/agents/tests/agents-plugin.test.ts
@@ -14,10 +14,18 @@ import { CacheManager } from "../../../cache";
 // Import the class directly so we can construct it without a createApp
 import { AgentsPlugin } from "../agents";
 import { buildToolkitEntries } from "../build-toolkit";
+import { fromPlugin } from "../from-plugin";
 import { defineTool, type ToolRegistry } from "../tools/define-tool";
+import { tool } from "../tools/tool";
 import type { AgentsPluginConfig, ToolkitEntry } from "../types";
 import { isToolkitEntry } from "../types";
 
+function namedFactory(name: string) {
+  const f = () => ({ name });
+  Object.defineProperty(f, "pluginName", { value: name, enumerable: true });
+  return f as typeof f & { readonly pluginName: string };
+}
+
 interface FakeContext {
   providers: Array<{ name: string; provider: ToolProvider }>;
   getToolProviders(): Array<{ name: string; provider: ToolProvider }>;
@@ -286,4 +294,202 @@ describe("AgentsPlugin", () => {
     expect(isToolkitEntry({ foo: 1 })).toBe(false);
     expect(isToolkitEntry(null)).toBe(false);
   });
+
+  describe("fromPlugin markers", () => {
+    test("spreading fromPlugin registers all tools from the referenced plugin", async () => {
+      const registry: ToolRegistry = {
+        query: defineTool({
+          description: "q",
+          schema: z.object({ sql: z.string() }),
+          handler: () => "ok",
+        }),
+      };
+      const ctx = fakeContext([
+        {
+          name: "analytics",
+          provider: makeToolProvider("analytics", registry),
+        },
+      ]);
+
+      const plugin = instantiate(
+        {
+          dir: false,
+          agents: {
+            support: {
+              instructions: "...",
+              model: stubAdapter(),
+              tools: { ...fromPlugin(namedFactory("analytics")) },
+            },
+          },
+        },
+        ctx,
+      );
+      await plugin.setup();
+
+      const api = plugin.exports() as {
+        get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+      };
+      const agent = api.get("support");
+      expect(agent?.toolIndex.has("analytics.query")).toBe(true);
+    });
+
+    test("mixed inline + fromPlugin tools coexist", async () => {
+      const registry: ToolRegistry = {
+        query: defineTool({
+          description: "q",
+          schema: z.object({ sql: z.string() }),
+          handler: () => "ok",
+        }),
+      };
+      const ctx = fakeContext([
+        {
+          name: "analytics",
+          provider: makeToolProvider("analytics", registry),
+        },
+      ]);
+
+      const plugin = instantiate(
+        {
+          dir: false,
+          agents: {
+            support: {
+              instructions: "...",
+              model: stubAdapter(),
+              tools: {
+                ...fromPlugin(namedFactory("analytics")),
+                get_weather: tool({
+                  name: "get_weather",
+                  description: "Weather",
+                  schema: z.object({ city: z.string() }),
+                  execute: async ({ city }) => `Sunny in ${city}`,
+                }),
+              },
+            },
+          },
+        },
+        ctx,
+      );
+      await plugin.setup();
+
+      const api = plugin.exports() as {
+        get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+      };
+      const agent = api.get("support");
+      expect(agent?.toolIndex.has("analytics.query")).toBe(true);
+      expect(agent?.toolIndex.has("get_weather")).toBe(true);
+    });
+
+    test("missing plugin throws at setup with Available: listing", async () => {
+      const ctx = fakeContext([
+        {
+          name: "files",
+          provider: makeToolProvider("files", {}),
+        },
+      ]);
+
+      const plugin = instantiate(
+        {
+          dir: false,
+          agents: {
+            support: {
+              instructions: "...",
+              model: stubAdapter(),
+              tools: { ...fromPlugin(namedFactory("analytics")) },
+            },
+          },
+        },
+        ctx,
+      );
+      await expect(plugin.setup()).rejects.toThrow(/analytics/);
+      await expect(plugin.setup()).rejects.toThrow(/Available:/);
+      await expect(plugin.setup()).rejects.toThrow(/files/);
+    });
+
+    test("symbol-only tools record disables auto-inherit", async () => {
+      const analyticsReg: ToolRegistry = {
+        query: defineTool({
+          description: "q",
+          schema: z.object({ sql: z.string() }),
+          handler: () => "ok",
+        }),
+      };
+      const filesReg: ToolRegistry = {
+        list: defineTool({
+          description: "l",
+          schema: z.object({}),
+          handler: () => [],
+        }),
+      };
+      const ctx = fakeContext([
+        {
+          name: "analytics",
+          provider: makeToolProvider("analytics", analyticsReg),
+        },
+        {
+          name: "files",
+          provider: makeToolProvider("files", filesReg),
+        },
+      ]);
+
+      const plugin = instantiate(
+        {
+          dir: false,
+          autoInheritTools: { code: true },
+          agents: {
+            support: {
+              instructions: "...",
+              model: stubAdapter(),
+              tools: { ...fromPlugin(namedFactory("analytics")) },
+            },
+          },
+        },
+        ctx,
+      );
+      await plugin.setup();
+
+      const api = plugin.exports() as {
+        get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+      };
+      const agent = api.get("support");
+      const toolNames = Array.from(agent?.toolIndex.keys() ?? []);
+      expect(toolNames.some((n) => n.startsWith("analytics."))).toBe(true);
+      expect(toolNames.some((n) => n.startsWith("files."))).toBe(false);
+    });
+
+    test("falls back to getAgentTools() for providers without toolkit()", async () => {
+      // Provider lacks .toolkit() — only getAgentTools/executeAgentTool.
+      const bareProvider: ToolProvider = {
+        getAgentTools: () => [
+          {
+            name: "ping",
+            description: "ping",
+            parameters: { type: "object", properties: {} },
+          },
+        ],
+        executeAgentTool: vi.fn(async () => "pong"),
+      };
+      const ctx = fakeContext([{ name: "bare", provider: bareProvider }]);
+
+      const plugin = instantiate(
+        {
+          dir: false,
+          agents: {
+            support: {
+              instructions: "...",
+              model: stubAdapter(),
+              tools: { ...fromPlugin(namedFactory("bare")) },
+            },
+          },
+        },
+        ctx,
+      );
+      await plugin.setup();
+
+      const api = plugin.exports() as {
+        get: (name: string) => { toolIndex: Map<string, unknown> } | null;
+      };
+      const agent = api.get("support");
+      expect(agent?.toolIndex.has("bare.ping")).toBe(true);
+    });
+  });
 });
diff --git a/packages/appkit/src/plugins/agents/tests/from-plugin.test.ts b/packages/appkit/src/plugins/agents/tests/from-plugin.test.ts
new file mode 100644
index 00000000..cd8a12b4
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/from-plugin.test.ts
@@ -0,0 +1,80 @@
+import { describe, expect, test } from "vitest";
+import {
+  FROM_PLUGIN_MARKER,
+  fromPlugin,
+  isFromPluginMarker,
+} from "../from-plugin";
+
+function fakeFactory(name: string) {
+  const f = () => ({ name });
+  Object.defineProperty(f, "pluginName", { value: name, enumerable: true });
+  return f as typeof f & { readonly pluginName: string };
+}
+
+describe("fromPlugin", () => {
+  test("returns a spread-friendly object with a single symbol-keyed marker", () => {
+    const spread = fromPlugin(fakeFactory("analytics"));
+
+    expect(Object.keys(spread)).toHaveLength(0);
+    const syms = Object.getOwnPropertySymbols(spread);
+    expect(syms).toHaveLength(1);
+
+    const marker = (spread as Record<symbol, unknown>)[syms[0]!];
+    expect(isFromPluginMarker(marker)).toBe(true);
+    expect((marker as { pluginName: string }).pluginName).toBe("analytics");
+  });
+
+  test("multiple calls produce distinct symbol keys (spreads coexist)", () => {
+    const spread = {
+      ...fromPlugin(fakeFactory("analytics")),
+      ...fromPlugin(fakeFactory("analytics")),
+      ...fromPlugin(fakeFactory("files")),
+    };
+
+    const syms = Object.getOwnPropertySymbols(spread);
+    expect(syms).toHaveLength(3);
+  });
+
+  test("passes opts through to the marker", () => {
+    const spread = fromPlugin(fakeFactory("analytics"), {
+      only: ["query"],
+      prefix: "q_",
+    });
+    const sym = Object.getOwnPropertySymbols(spread)[0]!;
+    const marker = (spread as Record<symbol, unknown>)[sym] as {
+      opts: { only: string[]; prefix: string };
+    };
+    expect(marker.opts.only).toEqual(["query"]);
+    expect(marker.opts.prefix).toBe("q_");
+  });
+
+  test("throws when factory has no pluginName", () => {
+    const missing = () => ({ name: "nope" });
+    expect(() =>
+      fromPlugin(missing as unknown as { readonly pluginName: string }),
+    ).toThrow(/missing pluginName/);
+  });
+
+  test("FROM_PLUGIN_MARKER is a globally-interned symbol", () => {
+    expect(FROM_PLUGIN_MARKER).toBe(
+      Symbol.for("@databricks/appkit.fromPluginMarker"),
+    );
+  });
+});
+
+describe("isFromPluginMarker", () => {
+  test("returns true for real markers", () => {
+    const spread = fromPlugin(fakeFactory("analytics"));
+    const sym = Object.getOwnPropertySymbols(spread)[0]!;
+    expect(isFromPluginMarker((spread as Record<symbol, unknown>)[sym])).toBe(
+      true,
+    );
+  });
+
+  test("returns false for objects without the brand", () => {
+    expect(isFromPluginMarker({ pluginName: "x" })).toBe(false);
+    expect(isFromPluginMarker(null)).toBe(false);
+    expect(isFromPluginMarker(undefined)).toBe(false);
+    expect(isFromPluginMarker("string")).toBe(false);
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/run-agent.test.ts b/packages/appkit/src/plugins/agents/tests/run-agent.test.ts
index 1a974811..da626f49 100644
--- a/packages/appkit/src/plugins/agents/tests/run-agent.test.ts
+++ b/packages/appkit/src/plugins/agents/tests/run-agent.test.ts
@@ -3,11 +3,16 @@ import type {
   AgentEvent,
   AgentInput,
   AgentRunContext,
+  AgentToolDefinition,
+  PluginConstructor,
+  PluginData,
+  ToolProvider,
 } from "shared";
 import { describe, expect, test, vi } from "vitest";
 import { z } from "zod";
 import { createAgent } from "../../../core/create-agent-def";
 import { runAgent } from "../../../core/run-agent";
+import { fromPlugin } from "../from-plugin";
 import { tool } from "../tools/tool";
 import type { ToolkitEntry } from "../types";
 
@@ -84,6 +89,97 @@ describe("runAgent", () => {
     expect(weatherFn).toHaveBeenCalledWith({ city: "NYC" });
   });
 
+  test("resolves fromPlugin markers against RunAgentInput.plugins", async () => {
+    const pingExec = vi.fn(async () => "pong");
+    class FakePlugin implements ToolProvider {
+      static manifest = { name: "ping" };
+      static DEFAULT_CONFIG = {};
+      name = "ping";
+      constructor(public config: unknown) {}
+      async setup() {}
+      injectRoutes() {}
+      getEndpoints() {
+        return {};
+      }
+      getAgentTools(): AgentToolDefinition[] {
+        return [
+          {
+            name: "ping",
+            description: "ping",
+            parameters: { type: "object", properties: {} },
+          },
+        ];
+      }
+      executeAgentTool = pingExec;
+    }
+
+    const factory = () => ({
+      plugin: FakePlugin as unknown as PluginConstructor,
+      config: {},
+      name: "ping" as const,
+    });
+    Object.defineProperty(factory, "pluginName", {
+      value: "ping",
+      enumerable: true,
+    });
+
+    let capturedCtx: AgentRunContext | null = null;
+    const adapter: AgentAdapter = {
+      async *run(_input, context) {
+        capturedCtx = context;
+        yield { type: "message_delta", content: "" };
+      },
+    };
+
+    const def = createAgent({
+      instructions: "x",
+      model: adapter,
+      tools: {
+        ...fromPlugin(factory as unknown as { readonly pluginName: string }),
+      },
+    });
+
+    const pluginData = factory() as PluginData<
+      PluginConstructor,
+      unknown,
+      string
+    >;
+
+    await runAgent(def, { messages: "hi", plugins: [pluginData] });
+    expect(capturedCtx).not.toBeNull();
+    // biome-ignore lint/style/noNonNullAssertion: asserted above
+    const result = await capturedCtx!.executeTool("ping.ping", {});
+    expect(result).toBe("pong");
+    expect(pingExec).toHaveBeenCalled();
+  });
+
+  test("throws with guidance when fromPlugin marker has no matching plugin", async () => {
+    const factory = () => ({ name: "absent" as const });
+    Object.defineProperty(factory, "pluginName", {
+      value: "absent",
+      enumerable: true,
+    });
+
+    const adapter: AgentAdapter = {
+      async *run(_input, _context) {
+        yield { type: "message_delta", content: "" };
+      },
+    };
+
+    const def = createAgent({
+      instructions: "x",
+      model: adapter,
+      tools: {
+        ...fromPlugin(factory as unknown as { readonly pluginName: string }),
+      },
+    });
+
+    await expect(runAgent(def, { messages: "hi" })).rejects.toThrow(/absent/);
+    await expect(runAgent(def, { messages: "hi" })).rejects.toThrow(
+      /Available:/,
+    );
+  });
+
   test("throws a clear error when a ToolkitEntry is invoked", async () => {
     const toolkitEntry: ToolkitEntry = {
       __toolkitRef: true,
diff --git a/packages/appkit/src/plugins/agents/toolkit-resolver.ts b/packages/appkit/src/plugins/agents/toolkit-resolver.ts
new file mode 100644
index 00000000..8ec8cf1f
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/toolkit-resolver.ts
@@ -0,0 +1,62 @@
+import type { ToolProvider } from "shared";
+import type { ToolkitEntry, ToolkitOptions } from "./types";
+
+/**
+ * Internal interface: a `ToolProvider` that optionally exposes a typed
+ * `.toolkit(opts)` method. Core plugins (analytics, files, genie, lakebase)
+ * implement this; third-party `ToolProvider`s may not.
+ */
+type MaybeToolkitProvider = ToolProvider & {
+  toolkit?: (opts?: ToolkitOptions) => Record<string, ToolkitEntry>;
+};
+
+/**
+ * Resolve a plugin's tools into a keyed record of {@link ToolkitEntry} markers
+ * ready to be merged into an agent's tool index.
+ *
+ * Preferred path: call the plugin's own `.toolkit(opts)` method, which
+ * typically delegates to `buildToolkitEntries` with full `ToolkitOptions`
+ * support (prefix, only, except, rename).
+ *
+ * Fallback path: when the plugin doesn't expose `.toolkit()` (e.g. a
+ * third-party `ToolProvider` built with plain `toPlugin`), walk
+ * `getAgentTools()`, honor `only` / `except`, and key each tool as
+ * `${prefix}${name}` (default prefix `${pluginName}.`) or its `rename` value.
+ *
+ * This helper is the single source of truth for "turn a provider into a
+ * toolkit entry record" and is used by `AgentsPlugin.buildToolIndex`
+ * (both the `fromPlugin` resolution pass and auto-inherit) and by the
+ * standalone `runAgent` executor.
+ */
+export function resolveToolkitFromProvider(
+  pluginName: string,
+  provider: ToolProvider,
+  opts?: ToolkitOptions,
+): Record<string, ToolkitEntry> {
+  const withToolkit = provider as MaybeToolkitProvider;
+  if (typeof withToolkit.toolkit === "function") {
+    return withToolkit.toolkit(opts);
+  }
+
+  const only = opts?.only ? new Set(opts.only) : null;
+  const except = opts?.except ? new Set(opts.except) : null;
+  // Map lookups ignore Object.prototype members (e.g. a tool named `toString`).
+  const rename = new Map(Object.entries(opts?.rename ?? {}));
+  const prefix = opts?.prefix ?? `${pluginName}.`;
+
+  const out: Record<string, ToolkitEntry> = {};
+  for (const tool of provider.getAgentTools()) {
+    if (only && !only.has(tool.name)) continue;
+    if (except?.has(tool.name)) continue;
+
+    // An explicit rename wins and is used verbatim; otherwise apply the prefix.
+    const key = rename.get(tool.name) ?? `${prefix}${tool.name}`;
+    out[key] = {
+      __toolkitRef: true,
+      pluginName,
+      localName: tool.name,
+      def: { ...tool, name: key },
+    };
+  }
+  return out;
+}
diff --git a/packages/appkit/src/plugins/agents/types.ts b/packages/appkit/src/plugins/agents/types.ts
index 4963a52a..37c322e6 100644
--- a/packages/appkit/src/plugins/agents/types.ts
+++ b/packages/appkit/src/plugins/agents/types.ts
@@ -5,6 +5,7 @@ import type {
   ThreadStore,
   ToolAnnotations,
 } from "shared";
+import type { FromPluginMarker } from "./from-plugin";
 import type { FunctionTool } from "./tools/function-tool";
 import type { HostedTool } from "./tools/hosted-tools";
 
@@ -54,6 +55,16 @@ export type BaseSystemPromptOption =
   | string
   | ((ctx: PromptContext) => string);
 
+/**
+ * Per-agent tool record. String keys map to inline tools, toolkit entries,
+ * hosted tools, etc. Symbol keys hold `FromPluginMarker` references produced
+ * by `fromPlugin(factory)` spreads — resolved against `ToolProvider` plugins
+ * at `AgentsPlugin.setup()` time (or `RunAgentInput.plugins` in `runAgent`).
+ */
+export type AgentTools = { [key: string]: AgentTool } & {
+  [key: symbol]: FromPluginMarker;
+};
+
 export interface AgentDefinition {
   /** Filled in from the enclosing key when used in `agents: { foo: def }`. */
   name?: string;
@@ -66,7 +77,7 @@ export interface AgentDefinition {
    */
   model?: AgentAdapter | Promise<AgentAdapter> | string;
   /** Per-agent tool record. Key is the LLM-visible tool-call name. */
-  tools?: Record<string, AgentTool>;
+  tools?: AgentTools;
   /** Sub-agents, exposed as `agent-<key>` tools on this agent. */
   agents?: Record<string, AgentDefinition>;
   /** Override the plugin's baseSystemPrompt for this agent only. */

From 4a441d2259caa82ad665eb57cc6f75a2f2b41617 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Tue, 21 Apr 2026 19:58:04 +0200
Subject: [PATCH 5/6] feat(appkit): reference agent-app, dev-playground chat
 UI, docs, and template
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Final layer of the agents feature stack. Everything needed to
exercise, demonstrate, and learn the feature.

### Reference application: agent-app

`apps/agent-app/` — a standalone app purpose-built around the agents
feature. Ships with:

- `server.ts` — full example of code-defined agents via `fromPlugin`:
  ```ts
  const support = createAgent({
    instructions: "…",
    tools: {
      ...fromPlugin(analytics),
      ...fromPlugin(files),
      get_weather,
      "mcp.vector-search": mcpServer("vector-search", "https://…"),
    },
  });

  await createApp({
    plugins: [server({ port }), analytics(), files(), agents({ agents: { support } })],
  });
  ```
- `config/agents/assistant.md` — markdown-driven agent alongside the
  code-defined one, showing the asymmetric auto-inherit default.
- Vite + React 19 + TailwindCSS frontend with a chat UI.
- Databricks deployment config (`databricks.yml`, `app.yaml`) and
  deploy scripts.

### dev-playground chat UI + demo agent

`apps/dev-playground/client/src/routes/agent.route.tsx` — chat UI with
inline autocomplete (hits the `autocomplete` markdown agent) and a
full threaded conversation panel (hits the default agent).

`apps/dev-playground/server/index.ts` — adds a code-defined `helper`
agent using `fromPlugin(analytics)` alongside the markdown-driven
`autocomplete` agent in `config/agents/`. Exercises the mixed-style
setup (markdown + code) against the same plugin list.

`apps/dev-playground/config/agents/*.md` — the two markdown agents
(`assistant`, `autocomplete`), each defined with valid YAML frontmatter.

### Docs

`docs/docs/plugins/agents.md` — progressive five-level guide:

1. Drop a markdown file → it just works.
2. Scope tools via `toolkits:` / `tools:` frontmatter.
3. Code-defined agents with `fromPlugin()`.
4. Sub-agents.
5. Standalone `runAgent()` (no `createApp` or HTTP).

Plus a configuration reference, runtime API reference, and frontmatter
schema table.

`docs/docs/api/appkit/` — regenerated typedoc for the new public
surface (fromPlugin, runAgent, AgentDefinition, AgentsPluginConfig,
ToolkitEntry, ToolkitOptions, all adapter types, and the agents
plugin factory).

### Template

`template/appkit.plugins.json` — adds the `agent` plugin entry so
`npx @databricks/appkit init --features agent` scaffolds the plugin
correctly.

### Test plan

- Full appkit vitest suite: 1311 tests passing
- Typecheck clean across all 8 workspace projects
- `pnpm docs:build` clean (no broken links)
- `pnpm --filter=@databricks/appkit build:package` clean, publint
  clean

Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 apps/agent-app/.env.example                   |  11 +
 apps/agent-app/.gitignore                     |   3 +
 apps/agent-app/app.yaml                       |   8 +
 apps/agent-app/config/agents/assistant.md     |  12 +
 apps/agent-app/databricks.yml                 |  50 ++
 apps/agent-app/index.html                     |  12 +
 apps/agent-app/package.json                   |  40 ++
 apps/agent-app/postcss.config.js              |   6 +
 apps/agent-app/server.ts                      |  75 +++
 apps/agent-app/src/App.css                    | 362 ++++++++++++++
 apps/agent-app/src/App.tsx                    | 292 +++++++++++
 .../src/components/theme-selector.tsx         | 135 +++++
 apps/agent-app/src/index.css                  |   1 +
 apps/agent-app/src/main.tsx                   |  15 +
 apps/agent-app/tailwind.config.ts             |  11 +
 apps/agent-app/tsconfig.app.json              |  24 +
 apps/agent-app/tsconfig.json                  |   7 +
 apps/agent-app/tsconfig.node.json             |  22 +
 apps/agent-app/vite.config.ts                 |  31 ++
 .../client/src/routes/__root.tsx              |  12 +-
 .../client/src/routes/agent.route.tsx         | 466 ++++++++++++++++++
 .../client/src/routes/index.tsx               |  11 +-
 .../dev-playground/config/agents/assistant.md |   6 +
 .../config/agents/autocomplete.md             |   6 +
 apps/dev-playground/server/index.ts           |  38 +-
 docs/docs/api/appkit/Class.Plugin.md          |  44 ++
 docs/docs/api/appkit/Function.createAgent.md  |  35 ++
 docs/docs/api/appkit/Function.fromPlugin.md   |  50 ++
 .../api/appkit/Function.isFromPluginMarker.md |  17 +
 .../api/appkit/Function.isFunctionTool.md     |  15 +
 docs/docs/api/appkit/Function.isHostedTool.md |  15 +
 .../api/appkit/Function.isToolkitEntry.md     |  18 +
 .../api/appkit/Function.loadAgentFromFile.md  |  19 +
 .../api/appkit/Function.loadAgentsFromDir.md  |  20 +
 docs/docs/api/appkit/Function.mcpServer.md    |  26 +
 docs/docs/api/appkit/Function.runAgent.md     |  29 ++
 docs/docs/api/appkit/Function.tool.md         |  29 ++
 .../docs/api/appkit/Interface.AgentAdapter.md |  20 +
 .../api/appkit/Interface.AgentDefinition.md   |  82 +++
 docs/docs/api/appkit/Interface.AgentInput.md  |  33 ++
 .../api/appkit/Interface.AgentRunContext.md   |  28 ++
 .../appkit/Interface.AgentToolDefinition.md   |  33 ++
 .../appkit/Interface.AgentsPluginConfig.md    | 132 +++++
 .../api/appkit/Interface.BasePluginConfig.md  |   4 +
 .../api/appkit/Interface.FromPluginMarker.md  |  32 ++
 .../docs/api/appkit/Interface.FunctionTool.md |  59 +++
 docs/docs/api/appkit/Interface.Message.md     |  49 ++
 .../api/appkit/Interface.PromptContext.md     |  27 +
 .../api/appkit/Interface.RunAgentInput.md     |  35 ++
 .../api/appkit/Interface.RunAgentResult.md    |  21 +
 docs/docs/api/appkit/Interface.Thread.md      |  41 ++
 docs/docs/api/appkit/Interface.ThreadStore.md |  98 ++++
 docs/docs/api/appkit/Interface.ToolConfig.md  |  49 ++
 .../docs/api/appkit/Interface.ToolProvider.md |  36 ++
 .../docs/api/appkit/Interface.ToolkitEntry.md |  46 ++
 .../api/appkit/Interface.ToolkitOptions.md    |  41 ++
 docs/docs/api/appkit/TypeAlias.AgentEvent.md  |  38 ++
 docs/docs/api/appkit/TypeAlias.AgentTool.md   |  12 +
 docs/docs/api/appkit/TypeAlias.AgentTools.md  |  14 +
 .../TypeAlias.BaseSystemPromptOption.md       |   8 +
 docs/docs/api/appkit/TypeAlias.HostedTool.md  |   9 +
 docs/docs/api/appkit/Variable.agents.md       |  19 +
 docs/docs/api/appkit/index.md                 |  35 ++
 docs/docs/api/appkit/typedoc-sidebar.ts       | 175 +++++++
 docs/docs/plugins/agents.md                   | 237 +++++++++
 pnpm-lock.yaml                                | 336 +++++++++++--
 template/appkit.plugins.json                  |  10 +
 67 files changed, 3673 insertions(+), 59 deletions(-)
 create mode 100644 apps/agent-app/.env.example
 create mode 100644 apps/agent-app/.gitignore
 create mode 100644 apps/agent-app/app.yaml
 create mode 100644 apps/agent-app/config/agents/assistant.md
 create mode 100644 apps/agent-app/databricks.yml
 create mode 100644 apps/agent-app/index.html
 create mode 100644 apps/agent-app/package.json
 create mode 100644 apps/agent-app/postcss.config.js
 create mode 100644 apps/agent-app/server.ts
 create mode 100644 apps/agent-app/src/App.css
 create mode 100644 apps/agent-app/src/App.tsx
 create mode 100644 apps/agent-app/src/components/theme-selector.tsx
 create mode 100644 apps/agent-app/src/index.css
 create mode 100644 apps/agent-app/src/main.tsx
 create mode 100644 apps/agent-app/tailwind.config.ts
 create mode 100644 apps/agent-app/tsconfig.app.json
 create mode 100644 apps/agent-app/tsconfig.json
 create mode 100644 apps/agent-app/tsconfig.node.json
 create mode 100644 apps/agent-app/vite.config.ts
 create mode 100644 apps/dev-playground/client/src/routes/agent.route.tsx
 create mode 100644 apps/dev-playground/config/agents/assistant.md
 create mode 100644 apps/dev-playground/config/agents/autocomplete.md
 create mode 100644 docs/docs/api/appkit/Function.createAgent.md
 create mode 100644 docs/docs/api/appkit/Function.fromPlugin.md
 create mode 100644 docs/docs/api/appkit/Function.isFromPluginMarker.md
 create mode 100644 docs/docs/api/appkit/Function.isFunctionTool.md
 create mode 100644 docs/docs/api/appkit/Function.isHostedTool.md
 create mode 100644 docs/docs/api/appkit/Function.isToolkitEntry.md
 create mode 100644 docs/docs/api/appkit/Function.loadAgentFromFile.md
 create mode 100644 docs/docs/api/appkit/Function.loadAgentsFromDir.md
 create mode 100644 docs/docs/api/appkit/Function.mcpServer.md
 create mode 100644 docs/docs/api/appkit/Function.runAgent.md
 create mode 100644 docs/docs/api/appkit/Function.tool.md
 create mode 100644 docs/docs/api/appkit/Interface.AgentAdapter.md
 create mode 100644 docs/docs/api/appkit/Interface.AgentDefinition.md
 create mode 100644 docs/docs/api/appkit/Interface.AgentInput.md
 create mode 100644 docs/docs/api/appkit/Interface.AgentRunContext.md
 create mode 100644 docs/docs/api/appkit/Interface.AgentToolDefinition.md
 create mode 100644 docs/docs/api/appkit/Interface.AgentsPluginConfig.md
 create mode 100644 docs/docs/api/appkit/Interface.FromPluginMarker.md
 create mode 100644 docs/docs/api/appkit/Interface.FunctionTool.md
 create mode 100644 docs/docs/api/appkit/Interface.Message.md
 create mode 100644 docs/docs/api/appkit/Interface.PromptContext.md
 create mode 100644 docs/docs/api/appkit/Interface.RunAgentInput.md
 create mode 100644 docs/docs/api/appkit/Interface.RunAgentResult.md
 create mode 100644 docs/docs/api/appkit/Interface.Thread.md
 create mode 100644 docs/docs/api/appkit/Interface.ThreadStore.md
 create mode 100644 docs/docs/api/appkit/Interface.ToolConfig.md
 create mode 100644 docs/docs/api/appkit/Interface.ToolProvider.md
 create mode 100644 docs/docs/api/appkit/Interface.ToolkitEntry.md
 create mode 100644 docs/docs/api/appkit/Interface.ToolkitOptions.md
 create mode 100644 docs/docs/api/appkit/TypeAlias.AgentEvent.md
 create mode 100644 docs/docs/api/appkit/TypeAlias.AgentTool.md
 create mode 100644 docs/docs/api/appkit/TypeAlias.AgentTools.md
 create mode 100644 docs/docs/api/appkit/TypeAlias.BaseSystemPromptOption.md
 create mode 100644 docs/docs/api/appkit/TypeAlias.HostedTool.md
 create mode 100644 docs/docs/api/appkit/Variable.agents.md
 create mode 100644 docs/docs/plugins/agents.md

diff --git a/apps/agent-app/.env.example b/apps/agent-app/.env.example
new file mode 100644
index 00000000..c062af54
--- /dev/null
+++ b/apps/agent-app/.env.example
@@ -0,0 +1,11 @@
+# Databricks workspace (auto-injected by platform on deploy)
+DATABRICKS_HOST=https://e2-dogfood.staging.cloud.databricks.com
+
+# Agent LLM endpoint
+DATABRICKS_AGENT_ENDPOINT=databricks-claude-sonnet-4-5
+
+# Analytics plugin — SQL warehouse ID
+DATABRICKS_WAREHOUSE_ID=dd43ee29fedd958d
+
+# Files plugin — Volume path
+DATABRICKS_VOLUME_FILES=/Volumes/main/mario/mario-vol
diff --git a/apps/agent-app/.gitignore b/apps/agent-app/.gitignore
new file mode 100644
index 00000000..9c97bbd4
--- /dev/null
+++ b/apps/agent-app/.gitignore
@@ -0,0 +1,3 @@
+node_modules
+dist
+.env
diff --git a/apps/agent-app/app.yaml b/apps/agent-app/app.yaml
new file mode 100644
index 00000000..215b89ec
--- /dev/null
+++ b/apps/agent-app/app.yaml
@@ -0,0 +1,8 @@
+command: ['node', '--import', 'tsx', 'server.ts']
+env:
+  - name: DATABRICKS_WAREHOUSE_ID
+    valueFrom: sql-warehouse
+  - name: DATABRICKS_AGENT_ENDPOINT
+    valueFrom: serving-endpoint
+  - name: DATABRICKS_VOLUME_FILES
+    valueFrom: volume
diff --git a/apps/agent-app/config/agents/assistant.md b/apps/agent-app/config/agents/assistant.md
new file mode 100644
index 00000000..bd6e9b7e
--- /dev/null
+++ b/apps/agent-app/config/agents/assistant.md
@@ -0,0 +1,12 @@
+---
+endpoint: databricks-claude-sonnet-4-5
+default: true
+---
+
+You are a helpful data assistant running on Databricks.
+
+Use the available tools to query data, browse files, and help users with their analysis.
+
+When using `analytics.query`, write Databricks SQL. When results are large, summarize the key findings rather than dumping raw data.
+
+You also have access to additional tools from MCP servers — use them when relevant.
diff --git a/apps/agent-app/databricks.yml b/apps/agent-app/databricks.yml
new file mode 100644
index 00000000..3ed6e50a
--- /dev/null
+++ b/apps/agent-app/databricks.yml
@@ -0,0 +1,50 @@
+bundle:
+  name: appkit-agent-app
+
+variables:
+  sql_warehouse_id:
+    description: SQL Warehouse ID for analytics queries
+  serving_endpoint_name:
+    description: Model Serving endpoint name for the agent LLM
+  volume_full_name:
+    description: "UC Volume full name (e.g. catalog.schema.volume_name)"
+
+resources:
+  apps:
+    agent_app:
+      name: "appkit-agent-app"
+      description: "AppKit agent with auto-discovered tools from analytics, files, and genie plugins"
+      source_code_path: ./
+
+      user_api_scopes:
+        - sql
+        - files.files
+        - dashboards.genie
+
+      resources:
+        - name: sql-warehouse
+          sql_warehouse:
+            id: ${var.sql_warehouse_id}
+            permission: CAN_USE
+
+        - name: serving-endpoint
+          serving_endpoint:
+            name: ${var.serving_endpoint_name}
+            permission: CAN_QUERY
+
+        - name: volume
+          uc_securable:
+            securable_type: VOLUME
+            securable_full_name: ${var.volume_full_name}
+            permission: WRITE_VOLUME
+
+targets:
+  dogfood:
+    default: true
+    workspace:
+      host: https://e2-dogfood.staging.cloud.databricks.com
+
+    variables:
+      sql_warehouse_id: dd43ee29fedd958d
+      serving_endpoint_name: databricks-claude-sonnet-4-5
+      volume_full_name: main.mario.mario-vol
diff --git a/apps/agent-app/index.html b/apps/agent-app/index.html
new file mode 100644
index 00000000..80e54faf
--- /dev/null
+++ b/apps/agent-app/index.html
@@ -0,0 +1,12 @@
+<!doctype html>
+<html lang="en">
+  <head>
+    <meta charset="UTF-8" />
+    <meta name="viewport" content="width=device-width, initial-scale=1.0" />
+    <title>AppKit Agent</title>
+  </head>
+  <body>
+    <div id="root"></div>
+    <script type="module" src="/src/main.tsx"></script>
+  </body>
+</html>
diff --git a/apps/agent-app/package.json b/apps/agent-app/package.json
new file mode 100644
index 00000000..ed159ca8
--- /dev/null
+++ b/apps/agent-app/package.json
@@ -0,0 +1,40 @@
+{
+  "name": "agent-app",
+  "private": true,
+  "version": "0.0.0",
+  "type": "module",
+  "scripts": {
+    "dev": "NODE_ENV=development tsx watch server.ts",
+    "build": "tsc -b && vite build",
+    "preview": "vite preview"
+  },
+  "dependencies": {
+    "@databricks/appkit": "workspace:*",
+    "@databricks/appkit-ui": "workspace:*",
+    "@databricks/sdk-experimental": "^0.16.0",
+    "dotenv": "^16.6.1",
+    "lucide-react": "^0.511.0",
+    "react": "19.2.0",
+    "react-dom": "19.2.0",
+    "marked": "^15.0.0",
+    "zod": "^4.0.0"
+  },
+  "devDependencies": {
+    "@tailwindcss/postcss": "4.1.17",
+    "@types/node": "24.10.1",
+    "@types/react": "19.2.7",
+    "@types/react-dom": "19.2.3",
+    "@vitejs/plugin-react": "5.1.1",
+    "autoprefixer": "10.4.21",
+    "postcss": "8.5.6",
+    "tailwindcss": "4.1.17",
+    "tailwindcss-animate": "1.0.7",
+    "tw-animate-css": "1.4.0",
+    "tsx": "4.20.6",
+    "typescript": "5.9.3",
+    "vite": "npm:rolldown-vite@7.1.14"
+  },
+  "overrides": {
+    "vite": "npm:rolldown-vite@7.1.14"
+  }
+}
diff --git a/apps/agent-app/postcss.config.js b/apps/agent-app/postcss.config.js
new file mode 100644
index 00000000..f69c5d41
--- /dev/null
+++ b/apps/agent-app/postcss.config.js
@@ -0,0 +1,6 @@
+export default {
+  plugins: {
+    "@tailwindcss/postcss": {},
+    autoprefixer: {},
+  },
+};
diff --git a/apps/agent-app/server.ts b/apps/agent-app/server.ts
new file mode 100644
index 00000000..29756079
--- /dev/null
+++ b/apps/agent-app/server.ts
@@ -0,0 +1,75 @@
+import {
+  agents,
+  analytics,
+  createAgent,
+  createApp,
+  files,
+  fromPlugin,
+  mcpServer,
+  server,
+  tool,
+} from "@databricks/appkit";
+import { z } from "zod";
+
+const port = Number(process.env.DATABRICKS_APP_PORT) || 8003;
+
+// Shared tool available to any agent that declares `tools: [get_weather]` in
+// its markdown frontmatter.
+const get_weather = tool({
+  name: "get_weather",
+  description: "Get the current weather for a city",
+  schema: z.object({
+    city: z.string().describe("City name"),
+  }),
+  execute: async ({ city }) => `The weather in ${city} is sunny, 22°C`,
+});
+
+// Code-defined agent. Overrides config/agents/support.md if a file with that
+// name exists. Tools here are explicit; defaults are strict (no auto-inherit
+// for code-defined agents), so we pull analytics + files in via fromPlugin.
+const support = createAgent({
+  instructions:
+    "You help customers with data analysis, file browsing, and general questions. " +
+    "Use the available tools as needed and summarize results concisely.",
+  tools: {
+    ...fromPlugin(analytics),
+    ...fromPlugin(files),
+    get_weather,
+    "mcp.vector-search": mcpServer(
+      "vector-search",
+      "https://e2-dogfood.staging.cloud.databricks.com/api/2.0/mcp/vector-search/main/default",
+    ),
+    "mcp.uc-greet": mcpServer(
+      "uc-greet",
+      "https://e2-dogfood.staging.cloud.databricks.com/api/2.0/mcp/functions/main/mario/greet",
+    ),
+    "mcp.mario-hello": mcpServer(
+      "mario-mcp-hello",
+      "https://mario-mcp-hello-6051921418418893.staging.aws.databricksapps.com/mcp",
+    ),
+  },
+});
+
+const appkit = await createApp({
+  plugins: [
+    server({ port }),
+    analytics(),
+    files(),
+    agents({
+      // Ambient tool library referenced by markdown frontmatter `tools: [...]`.
+      tools: { get_weather },
+      // Code-defined agents are merged with markdown agents; code wins on key
+      // collision. Markdown agents still auto-inherit analytics+files tools
+      // unless their frontmatter says otherwise.
+      agents: { support },
+    }),
+  ],
+});
+
+const registry = appkit.agent as {
+  list: () => string[];
+  getDefault: () => string | null;
+};
+console.log(
+  `Agent app running on port ${port}. Agents: ${registry.list().join(", ")}. Default: ${registry.getDefault() ?? "(none)"}.`,
+);
diff --git a/apps/agent-app/src/App.css b/apps/agent-app/src/App.css
new file mode 100644
index 00000000..1928960d
--- /dev/null
+++ b/apps/agent-app/src/App.css
@@ -0,0 +1,362 @@
+:root {
+  --bg: #fafafa;
+  --card: #ffffff;
+  --border: #e5e5e5;
+  --text: #171717;
+  --text-muted: #737373;
+  --text-faint: #a3a3a3;
+  --primary: #2563eb;
+  --primary-fg: #ffffff;
+  --muted: #f5f5f5;
+  --ring: #93c5fd;
+  --radius: 10px;
+  --font: system-ui, -apple-system, sans-serif;
+  --mono: "SF Mono", "Cascadia Code", "Fira Code", monospace;
+}
+
+:root.dark {
+  --bg: #0a0a0a;
+  --card: #171717;
+  --border: #262626;
+  --text: #fafafa;
+  --text-muted: #a3a3a3;
+  --text-faint: #525252;
+  --primary: #3b82f6;
+  --primary-fg: #ffffff;
+  --muted: #262626;
+  --ring: #1d4ed8;
+}
+
+* {
+  margin: 0;
+  padding: 0;
+  box-sizing: border-box;
+}
+
+body {
+  font-family: var(--font);
+  background: var(--bg);
+  color: var(--text);
+  -webkit-font-smoothing: antialiased;
+}
+
+.app {
+  min-height: 100vh;
+}
+
+.container {
+  max-width: 1100px;
+  margin: 0 auto;
+  padding: 2.5rem 1.5rem;
+}
+
+.header {
+  margin-bottom: 1.5rem;
+  display: flex;
+  align-items: flex-start;
+  justify-content: space-between;
+}
+
+.header h1 {
+  font-size: 1.75rem;
+  font-weight: 700;
+  letter-spacing: -0.025em;
+}
+
+.subtitle {
+  color: var(--text-muted);
+  font-size: 0.875rem;
+  margin-top: 0.25rem;
+}
+
+.thread-id {
+  font-family: var(--mono);
+  font-size: 0.75rem;
+  opacity: 0.6;
+}
+
+.main-layout {
+  display: flex;
+  gap: 1.25rem;
+  height: 700px;
+}
+
+.chat-panel {
+  flex: 1;
+  display: flex;
+  flex-direction: column;
+  border: 1px solid var(--border);
+  border-radius: var(--radius);
+  background: var(--card);
+  min-width: 0;
+  overflow: hidden;
+}
+
+.messages {
+  flex: 1;
+  overflow-y: auto;
+  padding: 1.25rem;
+  display: flex;
+  flex-direction: column;
+  gap: 1rem;
+}
+
+.empty-state {
+  text-align: center;
+  padding: 5rem 1rem;
+  color: var(--text-muted);
+}
+
+.empty-title {
+  font-size: 1.1rem;
+  font-weight: 500;
+}
+
+.empty-sub {
+  font-size: 0.85rem;
+  margin-top: 0.5rem;
+  color: var(--text-faint);
+}
+
+.message-row {
+  display: flex;
+}
+
+.message-row.user {
+  justify-content: flex-end;
+}
+
+.message-row.assistant {
+  justify-content: flex-start;
+}
+
+.bubble {
+  max-width: 80%;
+  padding: 0.625rem 0.875rem;
+  border-radius: var(--radius);
+  font-size: 0.875rem;
+  line-height: 1.5;
+  word-break: break-word;
+}
+
+.bubble.user {
+  white-space: pre-wrap;
+  background: var(--primary);
+  color: var(--primary-fg);
+  border-bottom-right-radius: 3px;
+}
+
+.bubble.assistant {
+  background: var(--muted);
+  color: var(--text);
+  border-bottom-left-radius: 3px;
+}
+
+.bubble.thinking {
+  color: var(--text-muted);
+  animation: pulse 1.5s ease-in-out infinite;
+}
+
+.bubble.assistant > * + * {
+  margin-top: 0.5em;
+}
+
+.bubble.assistant p {
+  margin: 0;
+}
+
+.bubble.assistant p + p {
+  margin-top: 0.4em;
+}
+
+.bubble.assistant code {
+  font-family: var(--mono);
+  font-size: 0.8em;
+  background: color-mix(in srgb, var(--text) 8%, transparent);
+  padding: 0.15em 0.35em;
+  border-radius: 4px;
+}
+
+.bubble.assistant pre {
+  margin: 0.5em 0;
+  padding: 0.75em;
+  border-radius: 6px;
+  background: color-mix(in srgb, var(--text) 6%, transparent);
+  overflow-x: auto;
+}
+
+.bubble.assistant pre code {
+  background: none;
+  padding: 0;
+  font-size: 0.8em;
+}
+
+.bubble.assistant ul,
+.bubble.assistant ol {
+  margin: 0.4em 0;
+  padding-left: 1.5em;
+}
+
+.bubble.assistant li {
+  margin: 0.15em 0;
+}
+
+.bubble.assistant h1,
+.bubble.assistant h2,
+.bubble.assistant h3 {
+  font-weight: 600;
+}
+
+.bubble.assistant h1 {
+  font-size: 1.1em;
+}
+.bubble.assistant h2 {
+  font-size: 1em;
+}
+.bubble.assistant h3 {
+  font-size: 0.95em;
+}
+
+.bubble.assistant blockquote {
+  margin: 0.4em 0;
+  padding-left: 0.75em;
+  border-left: 3px solid var(--border);
+  color: var(--text-muted);
+}
+
+.bubble.assistant table {
+  border-collapse: collapse;
+  margin: 0.5em 0;
+  font-size: 0.85em;
+}
+
+.bubble.assistant th,
+.bubble.assistant td {
+  border: 1px solid var(--border);
+  padding: 0.35em 0.6em;
+}
+
+.bubble.assistant th {
+  background: color-mix(in srgb, var(--text) 4%, transparent);
+  font-weight: 600;
+}
+
+@keyframes pulse {
+  0%,
+  100% {
+    opacity: 1;
+  }
+  50% {
+    opacity: 0.5;
+  }
+}
+
+.input-bar {
+  display: flex;
+  gap: 0.5rem;
+  padding: 0.875rem 1rem;
+  border-top: 1px solid var(--border);
+}
+
+.input-bar textarea {
+  flex: 1;
+  padding: 0.5rem 0.75rem;
+  border: 1px solid var(--border);
+  border-radius: 8px;
+  background: var(--bg);
+  color: var(--text);
+  font-family: var(--font);
+  font-size: 0.875rem;
+  resize: none;
+  outline: none;
+  transition: border-color 0.15s;
+}
+
+.input-bar textarea:focus {
+  border-color: var(--ring);
+  box-shadow: 0 0 0 2px color-mix(in srgb, var(--ring) 25%, transparent);
+}
+
+.input-bar textarea:disabled {
+  opacity: 0.5;
+}
+
+.input-bar button {
+  padding: 0.5rem 1rem;
+  border: none;
+  border-radius: 8px;
+  background: var(--primary);
+  color: var(--primary-fg);
+  font-family: var(--font);
+  font-size: 0.875rem;
+  font-weight: 500;
+  cursor: pointer;
+  transition: opacity 0.15s;
+  align-self: flex-end;
+}
+
+.input-bar button:hover:not(:disabled) {
+  opacity: 0.9;
+}
+
+.input-bar button:disabled {
+  opacity: 0.4;
+  cursor: not-allowed;
+}
+
+.event-panel {
+  width: 300px;
+  flex-shrink: 0;
+  display: flex;
+  flex-direction: column;
+  border: 1px solid var(--border);
+  border-radius: var(--radius);
+  background: var(--card);
+  overflow: hidden;
+}
+
+.event-header {
+  padding: 0.625rem 0.875rem;
+  border-bottom: 1px solid var(--border);
+  font-size: 0.8rem;
+  font-weight: 600;
+  color: var(--text-muted);
+  text-transform: uppercase;
+  letter-spacing: 0.05em;
+}
+
+.event-list {
+  flex: 1;
+  overflow-y: auto;
+  padding: 0.75rem;
+  display: flex;
+  flex-direction: column;
+  gap: 0.25rem;
+}
+
+.event-empty {
+  text-align: center;
+  padding: 2.5rem 0;
+  font-size: 0.75rem;
+  color: var(--text-faint);
+}
+
+.event-row {
+  font-family: var(--mono);
+  font-size: 0.7rem;
+  line-height: 1.4;
+  display: flex;
+  gap: 0.5rem;
+}
+
+.event-type {
+  flex-shrink: 0;
+  width: 90px;
+  text-align: right;
+  color: var(--text-faint);
+}
+
+.event-detail {
+  color: var(--text-muted);
+  word-break: break-all;
+}
diff --git a/apps/agent-app/src/App.tsx b/apps/agent-app/src/App.tsx
new file mode 100644
index 00000000..5c54997a
--- /dev/null
+++ b/apps/agent-app/src/App.tsx
@@ -0,0 +1,292 @@
+import { TooltipProvider } from "@databricks/appkit-ui/react";
+import { useCallback, useEffect, useRef, useState } from "react";
+import "./App.css";
+import { ThemeSelector } from "./components/theme-selector";
+
+interface SSEEvent {
+  type: string;
+  delta?: string;
+  item_id?: string;
+  item?: {
+    type?: string;
+    id?: string;
+    call_id?: string;
+    name?: string;
+    arguments?: string;
+    output?: string;
+    status?: string;
+  };
+  content?: string;
+  data?: Record<string, unknown>;
+  error?: string;
+  sequence_number?: number;
+  output_index?: number;
+}
+
+interface ChatMessage {
+  id: number;
+  role: "user" | "assistant";
+  content: string;
+}
+
+export default function App() {
+  const [messages, setMessages] = useState<ChatMessage[]>([]);
+  const [events, setEvents] = useState<SSEEvent[]>([]);
+  const [input, setInput] = useState("");
+  const [isLoading, setIsLoading] = useState(false);
+  const [threadId, setThreadId] = useState<string | null>(null);
+  const messagesEndRef = useRef<HTMLDivElement>(null);
+  const idRef = useRef(0);
+
+  const [toolCount, setToolCount] = useState(0);
+
+  useEffect(() => {
+    const timer = setTimeout(() => {
+      fetch("/api/agent/info")
+        .then((r) => r.json())
+        .then((data) => setToolCount(data.toolCount ?? 0))
+        .catch(() => {});
+    }, 500);
+    return () => clearTimeout(timer);
+  }, []);
+
+  // biome-ignore lint/correctness/useExhaustiveDependencies: scroll on new messages
+  useEffect(() => {
+    messagesEndRef.current?.scrollIntoView({ behavior: "smooth" });
+  }, [messages]);
+
+  const sendMessage = useCallback(async () => {
+    if (!input.trim() || isLoading) return;
+
+    const text = input.trim();
+    setInput("");
+    setMessages((prev) => [
+      ...prev,
+      { id: ++idRef.current, role: "user", content: text },
+    ]);
+    setEvents([]);
+    setIsLoading(true);
+
+    try {
+      const res = await fetch("/api/agent/chat", {
+        method: "POST",
+        headers: { "Content-Type": "application/json" },
+        body: JSON.stringify({
+          message: text,
+          ...(threadId && { threadId }),
+        }),
+      });
+
+      if (!res.ok) {
+        const err = await res.json().catch(() => null); // body may not be JSON
+        setMessages((prev) => [
+          ...prev,
+          {
+            id: ++idRef.current,
+            role: "assistant",
+            content: `Error: ${err?.error ?? `HTTP ${res.status}`}`,
+          },
+        ]);
+        return;
+      }
+
+      const reader = res.body?.getReader();
+      if (!reader) return;
+
+      const decoder = new TextDecoder();
+      let content = "";
+      let buffer = "";
+
+      while (true) {
+        const { done, value } = await reader.read();
+        if (done) break;
+        buffer += decoder.decode(value, { stream: true });
+        const lines = buffer.split("\n");
+        buffer = lines.pop() ?? "";
+
+        for (const line of lines) {
+          if (!line.startsWith("data: ")) continue;
+          const data = line.slice(6).trim();
+          if (!data || data === "[DONE]") continue;
+          try {
+            const event: SSEEvent = JSON.parse(data);
+            if (!event.type) continue;
+            setEvents((prev) => [...prev, event]);
+
+            if (event.type === "appkit.metadata" && event.data?.threadId) {
+              setThreadId(event.data.threadId as string);
+            }
+            if (event.type === "response.output_text.delta" && event.delta) {
+              content += event.delta;
+              setMessages((prev) => {
+                const updated = [...prev];
+                const last = updated[updated.length - 1];
+                if (last?.role === "assistant") {
+                  updated[updated.length - 1] = { ...last, content };
+                } else {
+                  updated.push({
+                    id: ++idRef.current,
+                    role: "assistant",
+                    content,
+                  });
+                }
+                return updated;
+              });
+            }
+          } catch {
+            /* skip */
+          }
+        }
+      }
+    } catch (err) {
+      setMessages((prev) => [
+        ...prev,
+        {
+          id: ++idRef.current,
+          role: "assistant",
+          content: `Error: ${err instanceof Error ? err.message : "Unknown error"}`,
+        },
+      ]);
+    } finally {
+      setIsLoading(false);
+    }
+  }, [input, isLoading, threadId]);
+
+  return (
+    <TooltipProvider>
+      <div className="app">
+        <div className="container">
+          <header className="header">
+            <div>
+              <h1>Agent Chat</h1>
+              <p className="subtitle">
+                AI agent with {toolCount} auto-discovered tools
+                {threadId && (
+                  <span className="thread-id">
+                    {" "}
+                    · Thread {threadId.slice(0, 8)}
+                  </span>
+                )}
+              </p>
+            </div>
+            <ThemeSelector />
+          </header>
+
+          <div className="main-layout">
+            <div className="chat-panel">
+              <div className="messages">
+                {messages.length === 0 && (
+                  <div className="empty-state">
+                    <p className="empty-title">
+                      Send a message to start a conversation
+                    </p>
+                    <p className="empty-sub">
+                      The agent can query data, browse files, and more
+                    </p>
+                  </div>
+                )}
+
+                {messages.map((msg) => (
+                  <div
+                    key={msg.id}
+                    className={`message-row ${msg.role === "user" ? "user" : "assistant"}`}
+                  >
+                    <div className={`bubble ${msg.role}`}>
+                      <p className="whitespace-pre-wrap">{msg.content}</p>
+                    </div>
+                  </div>
+                ))}
+
+                {isLoading &&
+                  messages[messages.length - 1]?.role === "user" && (
+                    <div className="message-row assistant">
+                      <div className="bubble assistant thinking">
+                        Thinking...
+                      </div>
+                    </div>
+                  )}
+
+                <div ref={messagesEndRef} />
+              </div>
+
+              <form
+                className="input-bar"
+                onSubmit={(e) => {
+                  e.preventDefault();
+                  sendMessage();
+                }}
+              >
+                <textarea
+                  value={input}
+                  onChange={(e) => setInput(e.target.value)}
+                  onKeyDown={(e) => {
+                    if (e.key === "Enter" && !e.shiftKey) {
+                      e.preventDefault();
+                      sendMessage();
+                    }
+                  }}
+                  placeholder="Ask a question..."
+                  disabled={isLoading}
+                  rows={1}
+                />
+                <button type="submit" disabled={isLoading || !input.trim()}>
+                  Send
+                </button>
+              </form>
+            </div>
+
+            <div className="event-panel">
+              <div className="event-header">Event Stream</div>
+              <div className="event-list">
+                {events.length === 0 && (
+                  <p className="event-empty">Events will appear here</p>
+                )}
+                {events.map((event, i) => {
+                  let detail: string;
+                  switch (event.type) {
+                    case "response.output_text.delta":
+                      detail = event.delta?.slice(0, 60) ?? "";
+                      break;
+                    case "response.output_item.added":
+                    case "response.output_item.done":
+                      detail =
+                        event.item?.type === "function_call"
+                          ? `${event.item.name}(${(event.item.arguments ?? "").slice(0, 40)})`
+                          : event.item?.type === "function_call_output"
+                            ? (event.item.output?.slice(0, 60) ?? "")
+                            : (event.item?.status ?? event.item?.type ?? "");
+                      break;
+                    case "response.completed":
+                      detail = "done";
+                      break;
+                    case "error":
+                      detail = event.error ?? "unknown";
+                      break;
+                    case "appkit.metadata":
+                      detail = JSON.stringify(event.data).slice(0, 60);
+                      break;
+                    case "appkit.thinking":
+                      detail = event.content?.slice(0, 60) ?? "";
+                      break;
+                    default:
+                      detail = JSON.stringify(event).slice(0, 60);
+                  }
+                  return (
+                    <div key={`${event.type}-${i}`} className="event-row">
+                      <span className="event-type">
+                        {event.type
+                          .replace("response.", "")
+                          .replace("appkit.", "")}
+                      </span>
+                      <span className="event-detail">{detail}</span>
+                    </div>
+                  );
+                })}
+              </div>
+            </div>
+          </div>
+        </div>
+      </div>
+    </TooltipProvider>
+  );
+}
diff --git a/apps/agent-app/src/components/theme-selector.tsx b/apps/agent-app/src/components/theme-selector.tsx
new file mode 100644
index 00000000..18bb4f14
--- /dev/null
+++ b/apps/agent-app/src/components/theme-selector.tsx
@@ -0,0 +1,135 @@
+import {
+  Button,
+  DropdownMenu,
+  DropdownMenuContent,
+  DropdownMenuItem,
+  DropdownMenuTrigger,
+} from "@databricks/appkit-ui/react";
+import { MonitorIcon, MoonIcon, SunIcon } from "lucide-react";
+import { useEffect, useState } from "react";
+
+type Theme = "light" | "dark" | "system";
+
+const THEME_STORAGE_KEY = "agent-app-theme";
+
+function getSystemTheme(): "light" | "dark" {
+  // No browser `window` means no media query to consult; default to light.
+  if (typeof window === "undefined") return "light";
+  const prefersDark = window.matchMedia("(prefers-color-scheme: dark)");
+  return prefersDark.matches ? "dark" : "light";
+}
+
+function getStoredTheme(): Theme {
+  if (typeof window === "undefined") return "system";
+  const stored = localStorage.getItem(THEME_STORAGE_KEY); // may be any string
+  return stored === "light" || stored === "dark" ? stored : "system";
+}
+
+function applyTheme(theme: Theme) {
+  // Swaps the "light"/"dark" class on the document root to match `theme`.
+  // Nothing to style when there is no browser `window`.
+  if (typeof window === "undefined") return;
+
+  // Theme classes live on <html>; clear both so only one remains afterwards.
+  const { classList } = document.documentElement;
+  classList.remove("light", "dark");
+
+  // "system" is resolved through getSystemTheme() at the time of the call.
+  const resolved = theme === "system" ? getSystemTheme() : theme;
+  classList.add(resolved);
+}
+
+export function ThemeSelector() {
+  const [theme, setTheme] = useState<Theme>(() => getStoredTheme());
+  const [mounted, setMounted] = useState(false);
+  const [systemTheme, setSystemTheme] = useState<"light" | "dark">(() =>
+    getSystemTheme(),
+  );
+
+  useEffect(() => {
+    setMounted(true);
+    applyTheme(theme);
+  }, [theme]);
+
+  useEffect(() => {
+    const mediaQuery = window.matchMedia("(prefers-color-scheme: dark)");
+    const handleChange = (e: MediaQueryListEvent | MediaQueryList) => {
+      const isDark = e.matches;
+      setSystemTheme(isDark ? "dark" : "light");
+      if (theme === "system") {
+        applyTheme("system");
+      }
+    };
+
+    handleChange(mediaQuery);
+
+    if (mediaQuery.addEventListener) {
+      mediaQuery.addEventListener("change", handleChange);
+      return () => mediaQuery.removeEventListener("change", handleChange);
+    } else {
+      mediaQuery.addListener(handleChange);
+      return () => mediaQuery.removeListener(handleChange);
+    }
+  }, [theme]);
+
+  const handleThemeChange = (newTheme: Theme) => {
+    setTheme(newTheme);
+    localStorage.setItem(THEME_STORAGE_KEY, newTheme);
+    applyTheme(newTheme);
+  };
+
+  const effectiveTheme = theme === "system" ? systemTheme : theme;
+
+  if (!mounted) {
+    return (
+      <Button variant="ghost" size="icon" className="h-9 w-9">
+        <SunIcon className="h-4 w-4" />
+      </Button>
+    );
+  }
+
+  return (
+    <DropdownMenu>
+      <DropdownMenuTrigger asChild>
+        <Button
+          variant="ghost"
+          size="icon"
+          className="h-9 w-9 text-foreground hover:text-secondary-foreground"
+          aria-label="Toggle theme"
+        >
+          {effectiveTheme === "dark" ? (
+            <MoonIcon className="h-4 w-4" />
+          ) : (
+            <SunIcon className="h-4 w-4" />
+          )}
+        </Button>
+      </DropdownMenuTrigger>
+      <DropdownMenuContent align="end">
+        <DropdownMenuItem
+          onClick={() => handleThemeChange("light")}
+          className="cursor-pointer"
+        >
+          <SunIcon className="mr-2 h-4 w-4" />
+          <span>Light</span>
+          {theme === "light" && <span className="ml-auto text-xs">✓</span>}
+        </DropdownMenuItem>
+        <DropdownMenuItem
+          onClick={() => handleThemeChange("dark")}
+          className="cursor-pointer"
+        >
+          <MoonIcon className="mr-2 h-4 w-4" />
+          <span>Dark</span>
+          {theme === "dark" && <span className="ml-auto text-xs">✓</span>}
+        </DropdownMenuItem>
+        <DropdownMenuItem
+          onClick={() => handleThemeChange("system")}
+          className="cursor-pointer"
+        >
+          <MonitorIcon className="mr-2 h-4 w-4" />
+          <span>System</span>
+          {theme === "system" && <span className="ml-auto text-xs">✓</span>}
+        </DropdownMenuItem>
+      </DropdownMenuContent>
+    </DropdownMenu>
+  );
+}
diff --git a/apps/agent-app/src/index.css b/apps/agent-app/src/index.css
new file mode 100644
index 00000000..5dcc4cf8
--- /dev/null
+++ b/apps/agent-app/src/index.css
@@ -0,0 +1 @@
+@import "@databricks/appkit-ui/styles.css";
diff --git a/apps/agent-app/src/main.tsx b/apps/agent-app/src/main.tsx
new file mode 100644
index 00000000..98b62364
--- /dev/null
+++ b/apps/agent-app/src/main.tsx
@@ -0,0 +1,15 @@
+import { StrictMode } from "react";
+import { createRoot } from "react-dom/client";
+import App from "./App.tsx";
+import "./index.css";
+
+const rootElement = document.getElementById("root");
+if (!rootElement) {
+  throw new Error("Root element not found");
+}
+
+createRoot(rootElement).render(
+  <StrictMode>
+    <App />
+  </StrictMode>,
+);
diff --git a/apps/agent-app/tailwind.config.ts b/apps/agent-app/tailwind.config.ts
new file mode 100644
index 00000000..fad89bf6
--- /dev/null
+++ b/apps/agent-app/tailwind.config.ts
@@ -0,0 +1,11 @@
+import path from "node:path";
+import type { Config } from "tailwindcss";
+
+export default {
+  darkMode: "class", // ThemeSelector toggles light/dark classes on <html>
+  content: [
+    path.resolve(__dirname, "./index.html"),
+    path.resolve(__dirname, "./src/**/*.{js,ts,jsx,tsx}"),
+  ],
+  plugins: [require("tailwindcss-animate")],
+} satisfies Config;
diff --git a/apps/agent-app/tsconfig.app.json b/apps/agent-app/tsconfig.app.json
new file mode 100644
index 00000000..2877c218
--- /dev/null
+++ b/apps/agent-app/tsconfig.app.json
@@ -0,0 +1,24 @@
+{
+  "compilerOptions": {
+    "tsBuildInfoFile": "./node_modules/.tmp/tsconfig.app.tsbuildinfo",
+    "target": "ES2022",
+    "useDefineForClassFields": true,
+    "lib": ["ES2022", "DOM", "DOM.Iterable"],
+    "module": "ESNext",
+    "types": ["vite/client"],
+    "skipLibCheck": true,
+    "moduleResolution": "bundler",
+    "allowImportingTsExtensions": true,
+    "verbatimModuleSyntax": true,
+    "moduleDetection": "force",
+    "noEmit": true,
+    "jsx": "react-jsx",
+    "strict": true,
+    "noUnusedLocals": true,
+    "noUnusedParameters": true,
+    "erasableSyntaxOnly": true,
+    "noFallthroughCasesInSwitch": true,
+    "noUncheckedSideEffectImports": true
+  },
+  "include": ["src"]
+}
diff --git a/apps/agent-app/tsconfig.json b/apps/agent-app/tsconfig.json
new file mode 100644
index 00000000..1ffef600
--- /dev/null
+++ b/apps/agent-app/tsconfig.json
@@ -0,0 +1,7 @@
+{
+  "files": [],
+  "references": [
+    { "path": "./tsconfig.app.json" },
+    { "path": "./tsconfig.node.json" }
+  ]
+}
diff --git a/apps/agent-app/tsconfig.node.json b/apps/agent-app/tsconfig.node.json
new file mode 100644
index 00000000..35bcd118
--- /dev/null
+++ b/apps/agent-app/tsconfig.node.json
@@ -0,0 +1,22 @@
+{
+  "compilerOptions": {
+    "tsBuildInfoFile": "./node_modules/.tmp/tsconfig.node.tsbuildinfo",
+    "target": "ES2023",
+    "lib": ["ES2023"],
+    "module": "ESNext",
+    "types": ["node"],
+    "skipLibCheck": true,
+    "moduleResolution": "bundler",
+    "allowImportingTsExtensions": true,
+    "verbatimModuleSyntax": true,
+    "moduleDetection": "force",
+    "noEmit": true,
+    "strict": true,
+    "noUnusedLocals": true,
+    "noUnusedParameters": true,
+    "erasableSyntaxOnly": true,
+    "noFallthroughCasesInSwitch": true,
+    "noUncheckedSideEffectImports": true
+  },
+  "include": ["vite.config.ts"]
+}
diff --git a/apps/agent-app/vite.config.ts b/apps/agent-app/vite.config.ts
new file mode 100644
index 00000000..bd1cea62
--- /dev/null
+++ b/apps/agent-app/vite.config.ts
@@ -0,0 +1,31 @@
+import path from "node:path";
+import react from "@vitejs/plugin-react";
+import { defineConfig } from "vite";
+
+export default defineConfig({
+  plugins: [react()],
+  optimizeDeps: {
+    include: [
+      "react",
+      "react-dom",
+      "react/jsx-dev-runtime",
+      "react/jsx-runtime",
+    ],
+    exclude: ["@databricks/appkit-ui", "@databricks/appkit"],
+  },
+  server: {
+    hmr: {
+      port: 24679,
+    },
+  },
+  resolve: {
+    dedupe: ["react", "react-dom"],
+    preserveSymlinks: true,
+    alias: {
+      "@databricks/appkit-ui": path.resolve(
+        __dirname,
+        "../../packages/appkit-ui/dist",
+      ),
+    },
+  },
+});
diff --git a/apps/dev-playground/client/src/routes/__root.tsx b/apps/dev-playground/client/src/routes/__root.tsx
index bc7f1e34..0cfee693 100644
--- a/apps/dev-playground/client/src/routes/__root.tsx
+++ b/apps/dev-playground/client/src/routes/__root.tsx
@@ -104,20 +104,12 @@ function RootComponent() {
                     Files
                   </Button>
                 </Link>
-                <Link to="/serving" className="no-underline">
+                <Link to="/agent" className="no-underline">
                   <Button
                     variant="ghost"
                     className="text-foreground hover:text-secondary-foreground"
                   >
-                    Serving
-                  </Button>
-                </Link>
-                <Link to="/vector-search" className="no-underline">
-                  <Button
-                    variant="ghost"
-                    className="text-foreground hover:text-secondary-foreground"
-                  >
-                    Vector Search
+                    Agent
                   </Button>
                 </Link>
                 <ThemeSelector />
diff --git a/apps/dev-playground/client/src/routes/agent.route.tsx b/apps/dev-playground/client/src/routes/agent.route.tsx
new file mode 100644
index 00000000..613d4d1f
--- /dev/null
+++ b/apps/dev-playground/client/src/routes/agent.route.tsx
@@ -0,0 +1,466 @@
+import { getPluginClientConfig } from "@databricks/appkit-ui/js";
+import { Button } from "@databricks/appkit-ui/react";
+import { createFileRoute } from "@tanstack/react-router";
+import { useCallback, useEffect, useRef, useState } from "react";
+
+export const Route = createFileRoute("/agent")({
+  component: AgentRoute,
+});
+
+interface SSEEvent {
+  type: string;
+  delta?: string;
+  item_id?: string;
+  item?: {
+    type?: string;
+    id?: string;
+    call_id?: string;
+    name?: string;
+    arguments?: string;
+    output?: string;
+    status?: string;
+  };
+  content?: string;
+  data?: Record<string, unknown>;
+  error?: string;
+  sequence_number?: number;
+  output_index?: number;
+}
+
+interface ChatMessage {
+  id: number;
+  role: "user" | "assistant";
+  content: string;
+}
+
+// Debounced inline-completion hook backed by the "autocomplete" agent stream.
+function useAutocomplete(enabled: boolean) {
+  const [suggestion, setSuggestion] = useState("");
+  const [isLoading, setIsLoading] = useState(false);
+  const abortRef = useRef<AbortController | null>(null);
+  const timerRef = useRef<ReturnType<typeof setTimeout> | null>(null);
+
+  const requestSuggestion = useCallback(
+    (text: string) => {
+      setSuggestion("");
+
+      if (timerRef.current) clearTimeout(timerRef.current);
+      if (abortRef.current) abortRef.current.abort();
+
+      if (!text.trim() || text.length < 3 || !enabled) return;
+
+      timerRef.current = setTimeout(async () => {
+        const controller = new AbortController();
+        abortRef.current = controller;
+        setIsLoading(true);
+
+        try {
+          const response = await fetch("/api/agent/chat", {
+            method: "POST",
+            headers: { "Content-Type": "application/json" },
+            body: JSON.stringify({ message: text, agent: "autocomplete" }),
+            signal: controller.signal,
+          });
+
+          if (!response.ok || !response.body) return;
+
+          const reader = response.body.getReader();
+          const decoder = new TextDecoder();
+          let result = "";
+          let buffer = "";
+
+          while (true) {
+            const { done, value } = await reader.read();
+            if (done) break;
+            buffer += decoder.decode(value, { stream: true });
+            const lines = buffer.split("\n");
+            buffer = lines.pop() ?? ""; // keep the trailing partial line
+
+            for (const line of lines) {
+              if (!line.startsWith("data: ")) continue;
+              const data = line.slice(6).trim();
+              if (!data || data === "[DONE]") continue;
+              try {
+                const event = JSON.parse(data);
+                if (
+                  event.type === "response.output_text.delta" &&
+                  event.delta
+                ) {
+                  result += event.delta;
+                  setSuggestion(result);
+                }
+              } catch {
+                /* skip */
+              }
+            }
+          }
+        } catch {
+          /* aborted or failed */
+        } finally {
+          setIsLoading(false);
+        }
+      }, 500); // debounce delay in ms
+    },
+    [enabled],
+  );
+
+  const clear = useCallback(() => {
+    setSuggestion("");
+    if (timerRef.current) clearTimeout(timerRef.current);
+    if (abortRef.current) abortRef.current.abort();
+  }, []);
+
+  useEffect(() => clear, [clear]); // cancel pending timer/request on unmount
+
+  return {
+    suggestion,
+    isLoading: isLoading && !suggestion,
+    requestSuggestion,
+    clear,
+  };
+}
+
+function AgentRoute() {
+  const [messages, setMessages] = useState<ChatMessage[]>([]);
+  const [events, setEvents] = useState<SSEEvent[]>([]);
+  const [input, setInput] = useState("");
+  const [isLoading, setIsLoading] = useState(false);
+  const [threadId, setThreadId] = useState<string | null>(null);
+  const messagesEndRef = useRef<HTMLDivElement>(null);
+  const inputRef = useRef<HTMLTextAreaElement>(null);
+  const msgIdCounter = useRef(0);
+
+  const agentConfig = getPluginClientConfig<{
+    agents?: string[];
+    defaultAgent?: string;
+  }>("agent");
+  const hasAutocomplete = (agentConfig.agents ?? []).includes("autocomplete");
+
+  const {
+    suggestion,
+    isLoading: isAutocompleting,
+    requestSuggestion,
+    clear: clearSuggestion,
+  } = useAutocomplete(hasAutocomplete);
+
+  // biome-ignore lint/correctness/useExhaustiveDependencies: scroll on new messages
+  useEffect(() => {
+    messagesEndRef.current?.scrollIntoView({ behavior: "smooth" });
+  }, [messages]);
+
+  const sendMessage = useCallback(async () => {
+    if (!input.trim() || isLoading) return;
+
+    clearSuggestion();
+    const userMessage = input.trim();
+    setInput("");
+    setMessages((prev) => [
+      ...prev,
+      { id: ++msgIdCounter.current, role: "user", content: userMessage },
+    ]);
+    setEvents([]);
+    setIsLoading(true);
+
+    try {
+      const response = await fetch("/api/agent/chat", {
+        method: "POST",
+        headers: { "Content-Type": "application/json" },
+        body: JSON.stringify({
+          message: userMessage,
+          ...(threadId && { threadId }),
+        }),
+      });
+
+      if (!response.ok) {
+        const error = await response.json().catch(() => null); // non-JSON safe
+        setMessages((prev) => [
+          ...prev,
+          {
+            id: ++msgIdCounter.current,
+            role: "assistant",
+            content: `Error: ${error?.error ?? `HTTP ${response.status}`}`,
+          },
+        ]);
+        return;
+      }
+
+      const reader = response.body?.getReader();
+      if (!reader) return;
+
+      const decoder = new TextDecoder();
+      let assistantContent = "";
+      let buffer = "";
+
+      while (true) {
+        const { done, value } = await reader.read();
+        if (done) break;
+
+        buffer += decoder.decode(value, { stream: true });
+        const lines = buffer.split("\n");
+        buffer = lines.pop() ?? "";
+
+        for (const line of lines) {
+          if (!line.startsWith("data: ")) continue;
+          const data = line.slice(6).trim();
+          if (!data || data === "[DONE]") continue;
+
+          try {
+            const event: SSEEvent = JSON.parse(data);
+            if (!event.type) continue;
+            setEvents((prev) => [...prev, event]);
+
+            if (event.type === "appkit.metadata" && event.data?.threadId) {
+              setThreadId(event.data.threadId as string);
+            }
+
+            if (event.type === "response.output_text.delta" && event.delta) {
+              assistantContent += event.delta;
+              setMessages((prev) => {
+                const updated = [...prev];
+                const last = updated[updated.length - 1];
+                if (last?.role === "assistant") {
+                  updated[updated.length - 1] = {
+                    ...last,
+                    content: assistantContent,
+                  };
+                } else {
+                  updated.push({
+                    id: ++msgIdCounter.current,
+                    role: "assistant",
+                    content: assistantContent,
+                  });
+                }
+                return updated;
+              });
+            }
+          } catch {
+            // skip malformed events
+          }
+        }
+      }
+    } catch (err) {
+      setMessages((prev) => [
+        ...prev,
+        {
+          id: ++msgIdCounter.current,
+          role: "assistant",
+          content: `Error: ${err instanceof Error ? err.message : "Unknown error"}`,
+        },
+      ]);
+    } finally {
+      setIsLoading(false);
+    }
+  }, [input, isLoading, threadId, clearSuggestion]);
+
+  const handleInputChange = (value: string) => {
+    setInput(value);
+    requestSuggestion(value);
+  };
+
+  const acceptSuggestion = () => {
+    if (!suggestion) return;
+    const newValue = input + suggestion;
+    setInput(newValue);
+    clearSuggestion();
+    inputRef.current?.focus();
+  };
+
+  return (
+    <div className="min-h-screen bg-background">
+      <div className="max-w-7xl mx-auto px-6 py-12">
+        <div className="mb-8 flex items-end justify-between">
+          <div>
+            <h1 className="text-3xl font-bold mb-2">Agent Chat</h1>
+            <p className="text-base text-muted-foreground">
+              AI agent with auto-discovered tools from all AppKit plugins.
+              {threadId && (
+                <span className="ml-2 text-xs font-mono opacity-60">
+                  Thread: {threadId.slice(0, 8)}...
+                </span>
+              )}
+            </p>
+          </div>
+          {hasAutocomplete && (
+            <span className="text-xs text-muted-foreground bg-muted px-2 py-1 rounded">
+              Autocomplete enabled
+            </span>
+          )}
+        </div>
+
+        <div className="flex gap-6 h-[700px]">
+          <div className="flex-1 flex flex-col border rounded-lg bg-card min-w-0">
+            <div className="flex-1 overflow-y-auto p-4 space-y-4">
+              {messages.length === 0 && (
+                <div className="text-center text-muted-foreground py-20">
+                  <p className="text-lg">
+                    Send a message to start a conversation
+                  </p>
+                  <p className="text-sm mt-2">
+                    The agent can use analytics, files, genie, and lakebase
+                    tools.
+                    {hasAutocomplete && " Start typing for inline suggestions."}
+                  </p>
+                </div>
+              )}
+
+              {messages.map((msg) => (
+                <div
+                  key={msg.id}
+                  className={`flex ${msg.role === "user" ? "justify-end" : "justify-start"}`}
+                >
+                  <div
+                    className={`max-w-[85%] rounded-lg px-4 py-2 ${
+                      msg.role === "user"
+                        ? "bg-primary text-primary-foreground"
+                        : "bg-muted"
+                    }`}
+                  >
+                    <p className="whitespace-pre-wrap text-sm">{msg.content}</p>
+                  </div>
+                </div>
+              ))}
+
+              {isLoading && messages[messages.length - 1]?.role === "user" && (
+                <div className="flex justify-start">
+                  <div className="bg-muted rounded-lg px-4 py-2">
+                    <p className="text-sm text-muted-foreground animate-pulse">
+                      Thinking...
+                    </p>
+                  </div>
+                </div>
+              )}
+
+              <div ref={messagesEndRef} />
+            </div>
+
+            <div className="border-t p-4">
+              {hasAutocomplete && (suggestion || isAutocompleting) && (
+                <div className="flex items-center gap-2 mb-2 text-xs text-muted-foreground">
+                  {isAutocompleting && (
+                    <span className="animate-pulse">Thinking...</span>
+                  )}
+                  {suggestion && (
+                    <span>
+                      Press{" "}
+                      <kbd className="px-1.5 py-0.5 rounded bg-muted border text-[10px] font-mono">
+                        Tab
+                      </kbd>{" "}
+                      to accept suggestion
+                    </span>
+                  )}
+                </div>
+              )}
+              <form
+                onSubmit={(e) => {
+                  e.preventDefault();
+                  sendMessage();
+                }}
+                className="flex gap-2"
+              >
+                <div className="flex-1 relative">
+                  <div
+                    aria-hidden
+                    className="absolute inset-0 px-3 py-2 text-sm pointer-events-none whitespace-pre-wrap break-words overflow-hidden"
+                  >
+                    <span className="invisible">{input}</span>
+                    <span className="text-muted-foreground/40">
+                      {suggestion}
+                    </span>
+                  </div>
+                  <textarea
+                    ref={inputRef}
+                    value={input}
+                    onChange={(e) => handleInputChange(e.target.value)}
+                    onKeyDown={(e) => {
+                      if (e.key === "Tab" && suggestion) {
+                        e.preventDefault();
+                        acceptSuggestion();
+                      }
+                      if (e.key === "Escape" && suggestion) {
+                        clearSuggestion();
+                      }
+                      if (e.key === "Enter" && !e.shiftKey && !suggestion) {
+                        e.preventDefault();
+                        sendMessage();
+                      }
+                    }}
+                    placeholder="Ask a question..."
+                    disabled={isLoading}
+                    rows={1}
+                    className="w-full rounded-md border border-input bg-transparent px-3 py-2 text-sm ring-offset-background placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring disabled:opacity-50 resize-none"
+                  />
+                </div>
+                <Button
+                  type="submit"
+                  disabled={isLoading || !input.trim()}
+                  className="self-end"
+                >
+                  Send
+                </Button>
+              </form>
+            </div>
+          </div>
+
+          <div className="w-80 shrink-0 flex flex-col border rounded-lg bg-card">
+            <div className="px-3 py-2 border-b">
+              <h3 className="text-sm font-semibold text-muted-foreground">
+                Event Stream
+              </h3>
+            </div>
+            <div className="flex-1 overflow-y-auto p-3 space-y-1">
+              {events.length === 0 && (
+                <p className="text-xs text-muted-foreground/50 text-center py-8">
+                  Events will appear here
+                </p>
+              )}
+              {events.map((event, i) => {
+                let detail: string;
+                switch (event.type) {
+                  case "response.output_text.delta":
+                    detail = event.delta?.slice(0, 60) ?? "";
+                    break;
+                  case "response.output_item.added":
+                  case "response.output_item.done":
+                    detail =
+                      event.item?.type === "function_call"
+                        ? `${event.item.name}(${(event.item.arguments ?? "").slice(0, 40)})`
+                        : event.item?.type === "function_call_output"
+                          ? (event.item.output?.slice(0, 60) ?? "")
+                          : (event.item?.status ?? event.item?.type ?? "");
+                    break;
+                  case "response.completed":
+                    detail = "done";
+                    break;
+                  case "error":
+                    detail = event.error ?? "unknown";
+                    break;
+                  case "appkit.metadata":
+                    detail = JSON.stringify(event.data).slice(0, 60);
+                    break;
+                  case "appkit.thinking":
+                    detail = event.content?.slice(0, 60) ?? "";
+                    break;
+                  default:
+                    detail = JSON.stringify(event).slice(0, 60);
+                }
+                return (
+                  <div
+                    key={`${event.type}-${i}`}
+                    className="font-mono text-xs text-muted-foreground"
+                  >
+                    <span className="inline-block w-24 text-right mr-2 opacity-50">
+                      {event.type
+                        .replace("response.", "")
+                        .replace("appkit.", "")}
+                    </span>
+                    <span className="opacity-80 break-all">{detail}</span>
+                  </div>
+                );
+              })}
+            </div>
+          </div>
+        </div>
+      </div>
+    </div>
+  );
+}
diff --git a/apps/dev-playground/client/src/routes/index.tsx b/apps/dev-playground/client/src/routes/index.tsx
index 934b1467..896a6e9d 100644
--- a/apps/dev-playground/client/src/routes/index.tsx
+++ b/apps/dev-playground/client/src/routes/index.tsx
@@ -222,17 +222,18 @@ function IndexRoute() {
           <Card className="p-6 hover:shadow-lg transition-shadow cursor-pointer">
             <div className="flex flex-col h-full">
               <h3 className="text-2xl font-semibold text-foreground mb-3">
-                Model Serving
+                Custom Agent
               </h3>
               <p className="text-muted-foreground mb-6 flex-grow">
-                Chat with a Databricks Model Serving endpoint using streaming
-                completions with real-time SSE responses.
+                AI agent powered by Databricks Model Serving with
+                auto-discovered tools from all AppKit plugins. Chat with your
+                data using natural language.
               </p>
               <Button
-                onClick={() => navigate({ to: "/serving" })}
+                onClick={() => navigate({ to: "/agent" })}
                 className="w-full"
               >
-                Try Model Serving
+                Chat with Agent
               </Button>
             </div>
           </Card>
diff --git a/apps/dev-playground/config/agents/assistant.md b/apps/dev-playground/config/agents/assistant.md
new file mode 100644
index 00000000..ea99d47b
--- /dev/null
+++ b/apps/dev-playground/config/agents/assistant.md
@@ -0,0 +1,6 @@
+---
+endpoint: databricks-claude-sonnet-4-5
+default: true
+---
+
+You are a helpful data assistant. Use the available tools to query data and help users with their analysis.
diff --git a/apps/dev-playground/config/agents/autocomplete.md b/apps/dev-playground/config/agents/autocomplete.md
new file mode 100644
index 00000000..fafe3330
--- /dev/null
+++ b/apps/dev-playground/config/agents/autocomplete.md
@@ -0,0 +1,6 @@
+---
+endpoint: databricks-gemini-3-1-flash-lite
+maxSteps: 1
+---
+
+You are an autocomplete engine. The user will give you the beginning of a sentence or paragraph. Continue the text naturally, as if you are the same author. Do NOT repeat the input. Only output the continuation. Do NOT use tools. Do NOT explain. Just write the next words.
diff --git a/apps/dev-playground/server/index.ts b/apps/dev-playground/server/index.ts
index 913f547c..b782dcbb 100644
--- a/apps/dev-playground/server/index.ts
+++ b/apps/dev-playground/server/index.ts
@@ -1,15 +1,17 @@
 import "reflect-metadata";
 import {
+  agents,
   analytics,
+  createAgent,
   createApp,
   files,
+  fromPlugin,
   genie,
   server,
-  serving,
+  tool,
 } from "@databricks/appkit";
 import { WorkspaceClient } from "@databricks/sdk-experimental";
-// TODO: re-enable once vector-search is exported from @databricks/appkit
-// import { vectorSearch } from "@databricks/appkit";
+import { z } from "zod";
 import { lakebaseExamples } from "./lakebase-examples-plugin";
 import { reconnect } from "./reconnect-plugin";
 import { telemetryExamples } from "./telemetry-example-plugin";
@@ -24,6 +26,23 @@ function createMockClient() {
   return client;
 }
 
+// Code-defined demo agent: fromPlugin(analytics) tools plus a canned inline
+// get_weather tool(), shown alongside the markdown agents in config/agents/.
+const helper = createAgent({
+  instructions:
+    "You are a demo helper. Use analytics tools to answer data questions, " +
+    "or get_weather for light small-talk.",
+  tools: {
+    ...fromPlugin(analytics),
+    get_weather: tool({
+      name: "get_weather",
+      description: "Get the current weather for a city",
+      schema: z.object({ city: z.string().describe("City name") }),
+      execute: async ({ city }) => `The weather in ${city} is sunny, 22°C`,
+    }),
+  },
+});
+
 createApp({
   plugins: [
     server({ autoStart: false }),
@@ -35,18 +54,7 @@ createApp({
     }),
     lakebaseExamples(),
     files(),
-    serving(),
-    // TODO: re-enable once vector-search is exported from @databricks/appkit
-    // vectorSearch({
-    //   indexes: {
-    //     demo: {
-    //       indexName:
-    //         process.env.DATABRICKS_VS_INDEX_NAME ?? "catalog.schema.index",
-    //       columns: ["id", "text", "title"],
-    //       queryType: "hybrid",
-    //     },
-    //   },
-    // }),
+    agents({ agents: { helper } }),
   ],
   ...(process.env.APPKIT_E2E_TEST && { client: createMockClient() }),
 }).then((appkit) => {
diff --git a/docs/docs/api/appkit/Class.Plugin.md b/docs/docs/api/appkit/Class.Plugin.md
index 06e558dc..34034537 100644
--- a/docs/docs/api/appkit/Class.Plugin.md
+++ b/docs/docs/api/appkit/Class.Plugin.md
@@ -136,6 +136,14 @@ protected config: TConfig;
 
 ***
 
+### context?
+
+```ts
+protected optional context: PluginContext;
+```
+
+***
+
 ### devFileReader
 
 ```ts
@@ -244,6 +252,42 @@ AuthenticationError if user token is not available in request headers (productio
 
 ***
 
+### attachContext()
+
+```ts
+attachContext(deps: {
+  context?: unknown;
+  telemetryConfig?: TelemetryOptions;
+}): void;
+```
+
+Binds runtime dependencies (telemetry provider, cache, plugin context) to
+this plugin. Called by `AppKit._createApp` after construction and before
+`setup()`. Idempotent: safe to call if the constructor already bound them
+eagerly. Kept separate from construction so factories can create plugin
+instances eagerly, deferring this binding until after
+`TelemetryManager.initialize()` / `CacheManager.getInstance()` have run.
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `deps` | \{ `context?`: `unknown`; `telemetryConfig?`: `TelemetryOptions`; \} |
+| `deps.context?` | `unknown` |
+| `deps.telemetryConfig?` | `TelemetryOptions` |
+
+#### Returns
+
+`void`
+
+#### Implementation of
+
+```ts
+BasePlugin.attachContext
+```
+
+***
+
 ### clientConfig()
 
 ```ts
diff --git a/docs/docs/api/appkit/Function.createAgent.md b/docs/docs/api/appkit/Function.createAgent.md
new file mode 100644
index 00000000..61064e51
--- /dev/null
+++ b/docs/docs/api/appkit/Function.createAgent.md
@@ -0,0 +1,35 @@
+# Function: createAgent()
+
+```ts
+function createAgent(def: AgentDefinition): AgentDefinition;
+```
+
+Pure factory for agent definitions. Returns the passed-in definition after
+cycle-detecting the sub-agent graph. Accepts the full `AgentDefinition` shape
+and is safe to call at module top-level.
+
+The returned value is a plain `AgentDefinition` — no adapter construction,
+no side effects. Register it with `agents({ agents: { name: def } })` or run
+it standalone via `runAgent(def, input)`.
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `def` | [`AgentDefinition`](Interface.AgentDefinition.md) |
+
+## Returns
+
+[`AgentDefinition`](Interface.AgentDefinition.md)
+
+## Example
+
+```ts
+const support = createAgent({
+  instructions: "You help customers.",
+  model: "databricks-claude-sonnet-4-5",
+  tools: {
+    get_weather: tool({ ... }),
+  },
+});
+```
diff --git a/docs/docs/api/appkit/Function.fromPlugin.md b/docs/docs/api/appkit/Function.fromPlugin.md
new file mode 100644
index 00000000..5262ef54
--- /dev/null
+++ b/docs/docs/api/appkit/Function.fromPlugin.md
@@ -0,0 +1,50 @@
+# Function: fromPlugin()
+
+```ts
+function fromPlugin<F>(factory: F, opts?: ToolkitOptions): FromPluginSpread;
+```
+
+Reference a plugin's tools inside an `AgentDefinition.tools` record without
+naming the plugin instance. The returned spread-friendly object carries a
+symbol-keyed marker that the agents plugin resolves against registered
+`ToolProvider`s at setup time.
+
+The factory argument must come from `toPlugin` (or any function that
+carries a `pluginName` field). `fromPlugin` reads `factory.pluginName`
+synchronously — it does not construct an instance.
+
+If the referenced plugin is also registered in `createApp({ plugins })`, the
+same runtime instance is used for dispatch. If the plugin is missing,
+`AgentsPlugin.setup()` throws with a clear `Available: …` listing.
+
+## Type Parameters
+
+| Type Parameter |
+| ------ |
+| `F` *extends* `NamedPluginFactory` |
+
+## Parameters
+
+| Parameter | Type | Description |
+| ------ | ------ | ------ |
+| `factory` | `F` | A plugin factory produced by `toPlugin`. Must expose a `pluginName` field. |
+| `opts?` | [`ToolkitOptions`](Interface.ToolkitOptions.md) | Optional toolkit scoping — `prefix`, `only`, `except`, `rename`. Same shape as the `.toolkit()` method. |
+
+## Returns
+
+`FromPluginSpread`
+
+## Example
+
+```ts
+import { analytics, createAgent, files, fromPlugin, tool } from "@databricks/appkit";
+
+const support = createAgent({
+  instructions: "You help customers.",
+  tools: {
+    ...fromPlugin(analytics),
+    ...fromPlugin(files, { only: ["uploads.read"] }),
+    get_weather: tool({ ... }),
+  },
+});
+```
diff --git a/docs/docs/api/appkit/Function.isFromPluginMarker.md b/docs/docs/api/appkit/Function.isFromPluginMarker.md
new file mode 100644
index 00000000..2ba9c752
--- /dev/null
+++ b/docs/docs/api/appkit/Function.isFromPluginMarker.md
@@ -0,0 +1,17 @@
+# Function: isFromPluginMarker()
+
+```ts
+function isFromPluginMarker(value: unknown): value is FromPluginMarker;
+```
+
+Type guard for [FromPluginMarker](Interface.FromPluginMarker.md).
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `value` | `unknown` |
+
+## Returns
+
+`value is FromPluginMarker`
diff --git a/docs/docs/api/appkit/Function.isFunctionTool.md b/docs/docs/api/appkit/Function.isFunctionTool.md
new file mode 100644
index 00000000..ebd84ee4
--- /dev/null
+++ b/docs/docs/api/appkit/Function.isFunctionTool.md
@@ -0,0 +1,15 @@
+# Function: isFunctionTool()
+
+```ts
+function isFunctionTool(value: unknown): value is FunctionTool;
+```
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `value` | `unknown` |
+
+## Returns
+
+`value is FunctionTool`
diff --git a/docs/docs/api/appkit/Function.isHostedTool.md b/docs/docs/api/appkit/Function.isHostedTool.md
new file mode 100644
index 00000000..73be7e16
--- /dev/null
+++ b/docs/docs/api/appkit/Function.isHostedTool.md
@@ -0,0 +1,15 @@
+# Function: isHostedTool()
+
+```ts
+function isHostedTool(value: unknown): value is HostedTool;
+```
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `value` | `unknown` |
+
+## Returns
+
+`value is HostedTool`
diff --git a/docs/docs/api/appkit/Function.isToolkitEntry.md b/docs/docs/api/appkit/Function.isToolkitEntry.md
new file mode 100644
index 00000000..892907a4
--- /dev/null
+++ b/docs/docs/api/appkit/Function.isToolkitEntry.md
@@ -0,0 +1,18 @@
+# Function: isToolkitEntry()
+
+```ts
+function isToolkitEntry(value: unknown): value is ToolkitEntry;
+```
+
+Type guard for `ToolkitEntry` — used by the agents plugin to differentiate
+toolkit references from inline tools in a mixed `tools` record.
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `value` | `unknown` |
+
+## Returns
+
+`value is ToolkitEntry`
diff --git a/docs/docs/api/appkit/Function.loadAgentFromFile.md b/docs/docs/api/appkit/Function.loadAgentFromFile.md
new file mode 100644
index 00000000..3eab5346
--- /dev/null
+++ b/docs/docs/api/appkit/Function.loadAgentFromFile.md
@@ -0,0 +1,19 @@
+# Function: loadAgentFromFile()
+
+```ts
+function loadAgentFromFile(filePath: string, ctx: LoadContext): Promise<AgentDefinition>;
+```
+
+Loads a single markdown agent file and resolves its frontmatter against
+registered plugin toolkits and the ambient tool library.
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `filePath` | `string` |
+| `ctx` | `LoadContext` |
+
+## Returns
+
+`Promise`\<[`AgentDefinition`](Interface.AgentDefinition.md)\>
diff --git a/docs/docs/api/appkit/Function.loadAgentsFromDir.md b/docs/docs/api/appkit/Function.loadAgentsFromDir.md
new file mode 100644
index 00000000..86665e17
--- /dev/null
+++ b/docs/docs/api/appkit/Function.loadAgentsFromDir.md
@@ -0,0 +1,20 @@
+# Function: loadAgentsFromDir()
+
+```ts
+function loadAgentsFromDir(dir: string, ctx: LoadContext): Promise<LoadResult>;
+```
+
+Scans a directory for `*.md` files and produces an `AgentDefinition` record
+keyed by file-stem. Throws on frontmatter errors or unresolved references.
+Returns an empty map if the directory does not exist.
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `dir` | `string` |
+| `ctx` | `LoadContext` |
+
+## Returns
+
+`Promise`\<`LoadResult`\>
diff --git a/docs/docs/api/appkit/Function.mcpServer.md b/docs/docs/api/appkit/Function.mcpServer.md
new file mode 100644
index 00000000..cafd4657
--- /dev/null
+++ b/docs/docs/api/appkit/Function.mcpServer.md
@@ -0,0 +1,26 @@
+# Function: mcpServer()
+
+```ts
+function mcpServer(name: string, url: string): CustomMcpServerTool;
+```
+
+Factory for declaring a custom MCP server tool.
+
+Replaces the verbose `{ type: "custom_mcp_server", custom_mcp_server: { app_name, app_url } }`
+wrapper with a concise positional call.
+
+Example:
+```ts
+mcpServer("my-app", "https://my-app.databricksapps.com/mcp")
+```
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `name` | `string` |
+| `url` | `string` |
+
+## Returns
+
+`CustomMcpServerTool`
diff --git a/docs/docs/api/appkit/Function.runAgent.md b/docs/docs/api/appkit/Function.runAgent.md
new file mode 100644
index 00000000..4e1f8608
--- /dev/null
+++ b/docs/docs/api/appkit/Function.runAgent.md
@@ -0,0 +1,29 @@
+# Function: runAgent()
+
+```ts
+function runAgent(def: AgentDefinition, input: RunAgentInput): Promise<RunAgentResult>;
+```
+
+Standalone agent execution without `createApp`. Resolves the adapter, binds
+inline tools, and drives the adapter's `run()` loop to completion.
+
+Limitations vs. running through the agents() plugin:
+- No OBO (on-behalf-of-user) execution: there is no HTTP request, so plugin
+  tools run as the service principal (when they work at all).
+- Hosted tools (MCP) are not supported — they require a live MCP client
+  that only exists inside the agents plugin.
+- Sub-agents (`agents: { ... }` on the def) are executed as nested
+  `runAgent` calls with no shared thread state.
+- Plugin tools (`fromPlugin` markers or `ToolkitEntry` spreads) require
+  passing `plugins: [...]` via `RunAgentInput`.
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `def` | [`AgentDefinition`](Interface.AgentDefinition.md) |
+| `input` | [`RunAgentInput`](Interface.RunAgentInput.md) |
+
+## Returns
+
+`Promise`\<[`RunAgentResult`](Interface.RunAgentResult.md)\>
diff --git a/docs/docs/api/appkit/Function.tool.md b/docs/docs/api/appkit/Function.tool.md
new file mode 100644
index 00000000..d6799cfd
--- /dev/null
+++ b/docs/docs/api/appkit/Function.tool.md
@@ -0,0 +1,29 @@
+# Function: tool()
+
+```ts
+function tool<S>(config: ToolConfig<S>): FunctionTool;
+```
+
+Factory for defining function tools with Zod schemas.
+
+- Generates JSON Schema (for the LLM) from the Zod schema via `z.toJSONSchema()`.
+- Infers the `execute` argument type from the schema.
+- Validates tool call arguments at runtime. On validation failure, returns
+  a formatted error string to the LLM instead of throwing, so the model
+  can self-correct on its next turn.
+
+## Type Parameters
+
+| Type Parameter |
+| ------ |
+| `S` *extends* `ZodType`\<`unknown`, `unknown`, `$ZodTypeInternals`\<`unknown`, `unknown`\>\> |
+
+## Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `config` | [`ToolConfig`](Interface.ToolConfig.md)\<`S`\> |
+
+## Returns
+
+[`FunctionTool`](Interface.FunctionTool.md)
diff --git a/docs/docs/api/appkit/Interface.AgentAdapter.md b/docs/docs/api/appkit/Interface.AgentAdapter.md
new file mode 100644
index 00000000..52083157
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.AgentAdapter.md
@@ -0,0 +1,20 @@
+# Interface: AgentAdapter
+
+## Methods
+
+### run()
+
+```ts
+run(input: AgentInput, context: AgentRunContext): AsyncGenerator<AgentEvent, void, unknown>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `input` | [`AgentInput`](Interface.AgentInput.md) |
+| `context` | [`AgentRunContext`](Interface.AgentRunContext.md) |
+
+#### Returns
+
+`AsyncGenerator`\<[`AgentEvent`](TypeAlias.AgentEvent.md), `void`, `unknown`\>
diff --git a/docs/docs/api/appkit/Interface.AgentDefinition.md b/docs/docs/api/appkit/Interface.AgentDefinition.md
new file mode 100644
index 00000000..a3d7dc77
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.AgentDefinition.md
@@ -0,0 +1,82 @@
+# Interface: AgentDefinition
+
+## Properties
+
+### agents?
+
+```ts
+optional agents: Record<string, AgentDefinition>;
+```
+
+Sub-agents, exposed as `agent-<key>` tools on this agent.
+
+***
+
+### baseSystemPrompt?
+
+```ts
+optional baseSystemPrompt: BaseSystemPromptOption;
+```
+
+Override the plugin's baseSystemPrompt for this agent only.
+
+***
+
+### instructions
+
+```ts
+instructions: string;
+```
+
+System prompt body. For markdown-loaded agents this is the file body.
+
+***
+
+### maxSteps?
+
+```ts
+optional maxSteps: number;
+```
+
+***
+
+### maxTokens?
+
+```ts
+optional maxTokens: number;
+```
+
+***
+
+### model?
+
+```ts
+optional model: 
+  | string
+  | AgentAdapter
+| Promise<AgentAdapter>;
+```
+
+Model adapter (or endpoint-name string sugar for
+`DatabricksAdapter.fromServingEndpoint({ endpointName })`). Optional —
+falls back to the plugin's `defaultModel`.
+
+***
+
+### name?
+
+```ts
+optional name: string;
+```
+
+Filled in from the enclosing key when used in `agents: { foo: def }`.
+
+***
+
+### tools?
+
+```ts
+optional tools: AgentTools;
+```
+
+Per-agent tool record. Key is the LLM-visible tool-call name.
diff --git a/docs/docs/api/appkit/Interface.AgentInput.md b/docs/docs/api/appkit/Interface.AgentInput.md
new file mode 100644
index 00000000..6d2eff8b
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.AgentInput.md
@@ -0,0 +1,33 @@
+# Interface: AgentInput
+
+## Properties
+
+### messages
+
+```ts
+messages: Message[];
+```
+
+***
+
+### signal?
+
+```ts
+optional signal: AbortSignal;
+```
+
+***
+
+### threadId
+
+```ts
+threadId: string;
+```
+
+***
+
+### tools
+
+```ts
+tools: AgentToolDefinition[];
+```
diff --git a/docs/docs/api/appkit/Interface.AgentRunContext.md b/docs/docs/api/appkit/Interface.AgentRunContext.md
new file mode 100644
index 00000000..c9bfcb79
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.AgentRunContext.md
@@ -0,0 +1,28 @@
+# Interface: AgentRunContext
+
+## Properties
+
+### executeTool()
+
+```ts
+executeTool: (name: string, args: unknown) => Promise<unknown>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `name` | `string` |
+| `args` | `unknown` |
+
+#### Returns
+
+`Promise`\<`unknown`\>
+
+***
+
+### signal?
+
+```ts
+optional signal: AbortSignal;
+```
diff --git a/docs/docs/api/appkit/Interface.AgentToolDefinition.md b/docs/docs/api/appkit/Interface.AgentToolDefinition.md
new file mode 100644
index 00000000..51c37595
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.AgentToolDefinition.md
@@ -0,0 +1,33 @@
+# Interface: AgentToolDefinition
+
+## Properties
+
+### annotations?
+
+```ts
+optional annotations: ToolAnnotations;
+```
+
+***
+
+### description
+
+```ts
+description: string;
+```
+
+***
+
+### name
+
+```ts
+name: string;
+```
+
+***
+
+### parameters
+
+```ts
+parameters: JSONSchema7;
+```
diff --git a/docs/docs/api/appkit/Interface.AgentsPluginConfig.md b/docs/docs/api/appkit/Interface.AgentsPluginConfig.md
new file mode 100644
index 00000000..79af0562
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.AgentsPluginConfig.md
@@ -0,0 +1,132 @@
+# Interface: AgentsPluginConfig
+
+Configuration for the `agents()` plugin. Extends the base AppKit plugin configuration.
+
+## Extends
+
+- [`BasePluginConfig`](Interface.BasePluginConfig.md)
+
+## Indexable
+
+```ts
+[key: string]: unknown
+```
+
+## Properties
+
+### agents?
+
+```ts
+optional agents: Record<string, AgentDefinition>;
+```
+
+Code-defined agents, merged with file-loaded ones (code wins on key collision).
+
+***
+
+### autoInheritTools?
+
+```ts
+optional autoInheritTools: boolean | AutoInheritToolsConfig;
+```
+
+Whether to auto-inherit every ToolProvider plugin's toolkit. Accepts a boolean shorthand.
+
+***
+
+### baseSystemPrompt?
+
+```ts
+optional baseSystemPrompt: BaseSystemPromptOption;
+```
+
+Customize or disable the AppKit base system prompt.
+
+***
+
+### defaultAgent?
+
+```ts
+optional defaultAgent: string;
+```
+
+Agent used when clients don't specify one. Defaults to the first-registered agent or the file with `default: true` frontmatter.
+
+***
+
+### defaultModel?
+
+```ts
+optional defaultModel: 
+  | string
+  | AgentAdapter
+| Promise<AgentAdapter>;
+```
+
+Default model for agents that don't specify their own (in code or frontmatter).
+
+***
+
+### dir?
+
+```ts
+optional dir: string | false;
+```
+
+Directory to scan for markdown agent files. Default `./config/agents`. Set to `false` to disable.
+
+***
+
+### host?
+
+```ts
+optional host: string;
+```
+
+#### Inherited from
+
+[`BasePluginConfig`](Interface.BasePluginConfig.md).[`host`](Interface.BasePluginConfig.md#host)
+
+***
+
+### name?
+
+```ts
+optional name: string;
+```
+
+#### Inherited from
+
+[`BasePluginConfig`](Interface.BasePluginConfig.md).[`name`](Interface.BasePluginConfig.md#name)
+
+***
+
+### telemetry?
+
+```ts
+optional telemetry: TelemetryOptions;
+```
+
+#### Inherited from
+
+[`BasePluginConfig`](Interface.BasePluginConfig.md).[`telemetry`](Interface.BasePluginConfig.md#telemetry)
+
+***
+
+### threadStore?
+
+```ts
+optional threadStore: ThreadStore;
+```
+
+Persistent thread store. Default: in-memory.
+
+***
+
+### tools?
+
+```ts
+optional tools: Record<string, AgentTool>;
+```
+
+Ambient tool library. Keys may be referenced by markdown frontmatter via `tools: [key1, key2]`.
diff --git a/docs/docs/api/appkit/Interface.BasePluginConfig.md b/docs/docs/api/appkit/Interface.BasePluginConfig.md
index a7faffc6..130a61c1 100644
--- a/docs/docs/api/appkit/Interface.BasePluginConfig.md
+++ b/docs/docs/api/appkit/Interface.BasePluginConfig.md
@@ -2,6 +2,10 @@
 
 Base configuration interface for AppKit plugins
 
+## Extended by
+
+- [`AgentsPluginConfig`](Interface.AgentsPluginConfig.md)
+
 ## Indexable
 
 ```ts
diff --git a/docs/docs/api/appkit/Interface.FromPluginMarker.md b/docs/docs/api/appkit/Interface.FromPluginMarker.md
new file mode 100644
index 00000000..1a1fedd3
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.FromPluginMarker.md
@@ -0,0 +1,32 @@
+# Interface: FromPluginMarker
+
+A lazy reference to a plugin's tools, produced by [fromPlugin](Function.fromPlugin.md) and
+resolved to concrete `ToolkitEntry`s at `AgentsPlugin.setup()` time.
+
+The marker is spread under a unique symbol key so multiple calls to
+`fromPlugin` (even for the same plugin) coexist in an `AgentDefinition.tools`
+record without colliding.
+
+## Properties
+
+### \[FROM\_PLUGIN\_MARKER\]
+
+```ts
+readonly [FROM_PLUGIN_MARKER]: true;
+```
+
+***
+
+### opts
+
+```ts
+readonly opts: ToolkitOptions | undefined;
+```
+
+***
+
+### pluginName
+
+```ts
+readonly pluginName: string;
+```
diff --git a/docs/docs/api/appkit/Interface.FunctionTool.md b/docs/docs/api/appkit/Interface.FunctionTool.md
new file mode 100644
index 00000000..c096daca
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.FunctionTool.md
@@ -0,0 +1,59 @@
+# Interface: FunctionTool
+
+## Properties
+
+### description?
+
+```ts
+optional description: string | null;
+```
+
+***
+
+### execute()
+
+```ts
+execute: (args: Record<string, unknown>) => string | Promise<string>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `args` | `Record`\<`string`, `unknown`\> |
+
+#### Returns
+
+`string` \| `Promise`\<`string`\>
+
+***
+
+### name
+
+```ts
+name: string;
+```
+
+***
+
+### parameters?
+
+```ts
+optional parameters: Record<string, unknown> | null;
+```
+
+***
+
+### strict?
+
+```ts
+optional strict: boolean | null;
+```
+
+***
+
+### type
+
+```ts
+type: "function";
+```
diff --git a/docs/docs/api/appkit/Interface.Message.md b/docs/docs/api/appkit/Interface.Message.md
new file mode 100644
index 00000000..ed818408
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.Message.md
@@ -0,0 +1,49 @@
+# Interface: Message
+
+## Properties
+
+### content
+
+```ts
+content: string;
+```
+
+***
+
+### createdAt
+
+```ts
+createdAt: Date;
+```
+
+***
+
+### id
+
+```ts
+id: string;
+```
+
+***
+
+### role
+
+```ts
+role: "user" | "assistant" | "system" | "tool";
+```
+
+***
+
+### toolCallId?
+
+```ts
+optional toolCallId: string;
+```
+
+***
+
+### toolCalls?
+
+```ts
+optional toolCalls: ToolCall[];
+```
diff --git a/docs/docs/api/appkit/Interface.PromptContext.md b/docs/docs/api/appkit/Interface.PromptContext.md
new file mode 100644
index 00000000..e26ea167
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.PromptContext.md
@@ -0,0 +1,27 @@
+# Interface: PromptContext
+
+Context passed to `baseSystemPrompt` callbacks.
+
+## Properties
+
+### agentName
+
+```ts
+agentName: string;
+```
+
+***
+
+### pluginNames
+
+```ts
+pluginNames: string[];
+```
+
+***
+
+### toolNames
+
+```ts
+toolNames: string[];
+```
diff --git a/docs/docs/api/appkit/Interface.RunAgentInput.md b/docs/docs/api/appkit/Interface.RunAgentInput.md
new file mode 100644
index 00000000..c7fa4b02
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.RunAgentInput.md
@@ -0,0 +1,35 @@
+# Interface: RunAgentInput
+
+## Properties
+
+### messages
+
+```ts
+messages: string | Message[];
+```
+
+Seed messages for the run. Either a single user string or a full message list.
+
+***
+
+### plugins?
+
+```ts
+optional plugins: PluginData<PluginConstructor, unknown, string>[];
+```
+
+Optional plugin list used to resolve `fromPlugin` markers in `def.tools`.
+Required when the def contains any `...fromPlugin(factory)` spreads;
+ignored otherwise. `runAgent` constructs a fresh instance per plugin
+and dispatches tool calls against it as the service principal (no
+OBO — there is no HTTP request in standalone mode).
+
+***
+
+### signal?
+
+```ts
+optional signal: AbortSignal;
+```
+
+Abort signal for cancellation.
diff --git a/docs/docs/api/appkit/Interface.RunAgentResult.md b/docs/docs/api/appkit/Interface.RunAgentResult.md
new file mode 100644
index 00000000..a9ba258d
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.RunAgentResult.md
@@ -0,0 +1,21 @@
+# Interface: RunAgentResult
+
+## Properties
+
+### events
+
+```ts
+events: AgentEvent[];
+```
+
+Every event the adapter yielded, in order. Useful for inspection/tests.
+
+***
+
+### text
+
+```ts
+text: string;
+```
+
+Aggregated text output from all `message_delta` events.
diff --git a/docs/docs/api/appkit/Interface.Thread.md b/docs/docs/api/appkit/Interface.Thread.md
new file mode 100644
index 00000000..e9f15fee
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.Thread.md
@@ -0,0 +1,41 @@
+# Interface: Thread
+
+## Properties
+
+### createdAt
+
+```ts
+createdAt: Date;
+```
+
+***
+
+### id
+
+```ts
+id: string;
+```
+
+***
+
+### messages
+
+```ts
+messages: Message[];
+```
+
+***
+
+### updatedAt
+
+```ts
+updatedAt: Date;
+```
+
+***
+
+### userId
+
+```ts
+userId: string;
+```
diff --git a/docs/docs/api/appkit/Interface.ThreadStore.md b/docs/docs/api/appkit/Interface.ThreadStore.md
new file mode 100644
index 00000000..215b76a2
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.ThreadStore.md
@@ -0,0 +1,98 @@
+# Interface: ThreadStore
+
+## Methods
+
+### addMessage()
+
+```ts
+addMessage(
+   threadId: string, 
+   userId: string, 
+message: Message): Promise<void>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `threadId` | `string` |
+| `userId` | `string` |
+| `message` | [`Message`](Interface.Message.md) |
+
+#### Returns
+
+`Promise`\<`void`\>
+
+***
+
+### create()
+
+```ts
+create(userId: string): Promise<Thread>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `userId` | `string` |
+
+#### Returns
+
+`Promise`\<[`Thread`](Interface.Thread.md)\>
+
+***
+
+### delete()
+
+```ts
+delete(threadId: string, userId: string): Promise<boolean>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `threadId` | `string` |
+| `userId` | `string` |
+
+#### Returns
+
+`Promise`\<`boolean`\>
+
+***
+
+### get()
+
+```ts
+get(threadId: string, userId: string): Promise<Thread | null>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `threadId` | `string` |
+| `userId` | `string` |
+
+#### Returns
+
+`Promise`\<[`Thread`](Interface.Thread.md) \| `null`\>
+
+***
+
+### list()
+
+```ts
+list(userId: string): Promise<Thread[]>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `userId` | `string` |
+
+#### Returns
+
+`Promise`\<[`Thread`](Interface.Thread.md)[]\>
diff --git a/docs/docs/api/appkit/Interface.ToolConfig.md b/docs/docs/api/appkit/Interface.ToolConfig.md
new file mode 100644
index 00000000..48828a38
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.ToolConfig.md
@@ -0,0 +1,49 @@
+# Interface: ToolConfig\<S\>
+
+## Type Parameters
+
+| Type Parameter |
+| ------ |
+| `S` *extends* `z.ZodType` |
+
+## Properties
+
+### description?
+
+```ts
+optional description: string;
+```
+
+***
+
+### execute()
+
+```ts
+execute: (args: output<S>) => string | Promise<string>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `args` | `output`\<`S`\> |
+
+#### Returns
+
+`string` \| `Promise`\<`string`\>
+
+***
+
+### name
+
+```ts
+name: string;
+```
+
+***
+
+### schema
+
+```ts
+schema: S;
+```
diff --git a/docs/docs/api/appkit/Interface.ToolProvider.md b/docs/docs/api/appkit/Interface.ToolProvider.md
new file mode 100644
index 00000000..9c8851a0
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.ToolProvider.md
@@ -0,0 +1,36 @@
+# Interface: ToolProvider
+
+## Methods
+
+### executeAgentTool()
+
+```ts
+executeAgentTool(
+   name: string, 
+   args: unknown, 
+signal?: AbortSignal): Promise<unknown>;
+```
+
+#### Parameters
+
+| Parameter | Type |
+| ------ | ------ |
+| `name` | `string` |
+| `args` | `unknown` |
+| `signal?` | `AbortSignal` |
+
+#### Returns
+
+`Promise`\<`unknown`\>
+
+***
+
+### getAgentTools()
+
+```ts
+getAgentTools(): AgentToolDefinition[];
+```
+
+#### Returns
+
+[`AgentToolDefinition`](Interface.AgentToolDefinition.md)[]
diff --git a/docs/docs/api/appkit/Interface.ToolkitEntry.md b/docs/docs/api/appkit/Interface.ToolkitEntry.md
new file mode 100644
index 00000000..699c07b0
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.ToolkitEntry.md
@@ -0,0 +1,46 @@
+# Interface: ToolkitEntry
+
+A tool reference produced by a plugin's `.toolkit()` call. The agents plugin
+recognizes the `__toolkitRef` brand and dispatches tool invocations through
+`PluginContext.executeTool(req, pluginName, localName, ...)`, preserving
+OBO (asUser) and telemetry spans.
+
+## Properties
+
+### \_\_toolkitRef
+
+```ts
+readonly __toolkitRef: true;
+```
+
+***
+
+### annotations?
+
+```ts
+optional annotations: ToolAnnotations;
+```
+
+***
+
+### def
+
+```ts
+def: AgentToolDefinition;
+```
+
+***
+
+### localName
+
+```ts
+localName: string;
+```
+
+***
+
+### pluginName
+
+```ts
+pluginName: string;
+```
diff --git a/docs/docs/api/appkit/Interface.ToolkitOptions.md b/docs/docs/api/appkit/Interface.ToolkitOptions.md
new file mode 100644
index 00000000..1beb22b0
--- /dev/null
+++ b/docs/docs/api/appkit/Interface.ToolkitOptions.md
@@ -0,0 +1,41 @@
+# Interface: ToolkitOptions
+
+## Properties
+
+### except?
+
+```ts
+optional except: string[];
+```
+
+Exclude tools whose local name matches one of these.
+
+***
+
+### only?
+
+```ts
+optional only: string[];
+```
+
+Only include tools whose local name matches one of these.
+
+***
+
+### prefix?
+
+```ts
+optional prefix: string;
+```
+
+Key prefix to prepend to each tool's local name. Defaults to `${pluginName}.`.
+
+***
+
+### rename?
+
+```ts
+optional rename: Record<string, string>;
+```
+
+Remap specific local names to different keys (applied after prefix).
diff --git a/docs/docs/api/appkit/TypeAlias.AgentEvent.md b/docs/docs/api/appkit/TypeAlias.AgentEvent.md
new file mode 100644
index 00000000..7c7cd92c
--- /dev/null
+++ b/docs/docs/api/appkit/TypeAlias.AgentEvent.md
@@ -0,0 +1,38 @@
+# Type Alias: AgentEvent
+
+```ts
+type AgentEvent = 
+  | {
+  content: string;
+  type: "message_delta";
+}
+  | {
+  content: string;
+  type: "message";
+}
+  | {
+  args: unknown;
+  callId: string;
+  name: string;
+  type: "tool_call";
+}
+  | {
+  callId: string;
+  error?: string;
+  result: unknown;
+  type: "tool_result";
+}
+  | {
+  content: string;
+  type: "thinking";
+}
+  | {
+  error?: string;
+  status: "running" | "waiting" | "complete" | "error";
+  type: "status";
+}
+  | {
+  data: Record<string, unknown>;
+  type: "metadata";
+};
+```
diff --git a/docs/docs/api/appkit/TypeAlias.AgentTool.md b/docs/docs/api/appkit/TypeAlias.AgentTool.md
new file mode 100644
index 00000000..e165cec6
--- /dev/null
+++ b/docs/docs/api/appkit/TypeAlias.AgentTool.md
@@ -0,0 +1,12 @@
+# Type Alias: AgentTool
+
+```ts
+type AgentTool = 
+  | FunctionTool
+  | HostedTool
+  | ToolkitEntry;
+```
+
+Any tool an agent can invoke: inline function tools (`tool()`), hosted MCP
+tools (`mcpServer()` / raw hosted), or toolkit references from plugins
+(`analytics().toolkit()`).
diff --git a/docs/docs/api/appkit/TypeAlias.AgentTools.md b/docs/docs/api/appkit/TypeAlias.AgentTools.md
new file mode 100644
index 00000000..05b9ce61
--- /dev/null
+++ b/docs/docs/api/appkit/TypeAlias.AgentTools.md
@@ -0,0 +1,14 @@
+# Type Alias: AgentTools
+
+```ts
+type AgentTools = {
+[key: string]: AgentTool;
+} & {
+[key: symbol]: FromPluginMarker;
+};
+```
+
+Per-agent tool record. String keys map to inline tools, toolkit entries,
+hosted tools, etc. Symbol keys hold `FromPluginMarker` references produced
+by `fromPlugin(factory)` spreads — these are resolved at
+`AgentsPlugin.setup()` time against registered `ToolProvider` plugins.
diff --git a/docs/docs/api/appkit/TypeAlias.BaseSystemPromptOption.md b/docs/docs/api/appkit/TypeAlias.BaseSystemPromptOption.md
new file mode 100644
index 00000000..c5922661
--- /dev/null
+++ b/docs/docs/api/appkit/TypeAlias.BaseSystemPromptOption.md
@@ -0,0 +1,8 @@
+# Type Alias: BaseSystemPromptOption
+
+```ts
+type BaseSystemPromptOption = 
+  | false
+  | string
+  | (ctx: PromptContext) => string;
+```
diff --git a/docs/docs/api/appkit/TypeAlias.HostedTool.md b/docs/docs/api/appkit/TypeAlias.HostedTool.md
new file mode 100644
index 00000000..433c0ac8
--- /dev/null
+++ b/docs/docs/api/appkit/TypeAlias.HostedTool.md
@@ -0,0 +1,9 @@
+# Type Alias: HostedTool
+
+```ts
+type HostedTool = 
+  | GenieTool
+  | VectorSearchIndexTool
+  | CustomMcpServerTool
+  | ExternalMcpServerTool;
+```
diff --git a/docs/docs/api/appkit/Variable.agents.md b/docs/docs/api/appkit/Variable.agents.md
new file mode 100644
index 00000000..d5bc7a09
--- /dev/null
+++ b/docs/docs/api/appkit/Variable.agents.md
@@ -0,0 +1,19 @@
+# Variable: agents
+
+```ts
+const agents: ToPlugin<typeof AgentsPlugin, AgentsPluginConfig, string> & NamedPluginFactory<string>;
+```
+
+Plugin factory for the agents plugin. Reads `config/agents/*.md` by default,
+resolves toolkits/tools from registered plugins, exposes `appkit.agents.*`
+runtime API and mounts `/invocations`.
+
+## Example
+
+```ts
+import { agents, analytics, createApp, server } from "@databricks/appkit";
+
+await createApp({
+  plugins: [server(), analytics(), agents()],
+});
+```
diff --git a/docs/docs/api/appkit/index.md b/docs/docs/api/appkit/index.md
index f5163db4..4abfedcb 100644
--- a/docs/docs/api/appkit/index.md
+++ b/docs/docs/api/appkit/index.md
@@ -30,31 +30,54 @@ plugin architecture, and React integration.
 
 | Interface | Description |
 | ------ | ------ |
+| [AgentAdapter](Interface.AgentAdapter.md) | - |
+| [AgentDefinition](Interface.AgentDefinition.md) | - |
+| [AgentInput](Interface.AgentInput.md) | - |
+| [AgentRunContext](Interface.AgentRunContext.md) | - |
+| [AgentsPluginConfig](Interface.AgentsPluginConfig.md) | Base configuration interface for AppKit plugins |
+| [AgentToolDefinition](Interface.AgentToolDefinition.md) | - |
 | [BasePluginConfig](Interface.BasePluginConfig.md) | Base configuration interface for AppKit plugins |
 | [CacheConfig](Interface.CacheConfig.md) | Configuration for the CacheInterceptor. Controls TTL, size limits, storage backend, and probabilistic cleanup. |
 | [DatabaseCredential](Interface.DatabaseCredential.md) | Database credentials with OAuth token for Postgres connection |
 | [EndpointConfig](Interface.EndpointConfig.md) | - |
+| [FromPluginMarker](Interface.FromPluginMarker.md) | A lazy reference to a plugin's tools, produced by [fromPlugin](Function.fromPlugin.md) and resolved to concrete `ToolkitEntry`s at `AgentsPlugin.setup()` time. |
+| [FunctionTool](Interface.FunctionTool.md) | - |
 | [GenerateDatabaseCredentialRequest](Interface.GenerateDatabaseCredentialRequest.md) | Request parameters for generating database OAuth credentials |
 | [ITelemetry](Interface.ITelemetry.md) | Plugin-facing interface for OpenTelemetry instrumentation. Provides a thin abstraction over OpenTelemetry APIs for plugins. |
 | [LakebasePoolConfig](Interface.LakebasePoolConfig.md) | Configuration for creating a Lakebase connection pool |
+| [Message](Interface.Message.md) | - |
 | [PluginManifest](Interface.PluginManifest.md) | Plugin manifest that declares metadata and resource requirements. Attached to plugin classes as a static property. Extends the shared PluginManifest with strict resource types. |
+| [PromptContext](Interface.PromptContext.md) | Context passed to `baseSystemPrompt` callbacks. |
 | [RequestedClaims](Interface.RequestedClaims.md) | Optional claims for fine-grained Unity Catalog table permissions When specified, the returned token will be scoped to only the requested tables |
 | [RequestedResource](Interface.RequestedResource.md) | Resource to request permissions for in Unity Catalog |
 | [ResourceEntry](Interface.ResourceEntry.md) | Internal representation of a resource in the registry. Extends ResourceRequirement with resolution state and plugin ownership. |
 | [ResourceFieldEntry](Interface.ResourceFieldEntry.md) | Defines a single field for a resource. Each field has its own environment variable and optional description. Single-value types use one key (e.g. id); multi-value types (database, secret) use multiple (e.g. instance_name, database_name or scope, key). |
 | [ResourceRequirement](Interface.ResourceRequirement.md) | Declares a resource requirement for a plugin. Can be defined statically in a manifest or dynamically via getResourceRequirements(). Narrows the generated base: type → ResourceType enum, permission → ResourcePermission union. |
+| [RunAgentInput](Interface.RunAgentInput.md) | - |
+| [RunAgentResult](Interface.RunAgentResult.md) | - |
 | [ServingEndpointEntry](Interface.ServingEndpointEntry.md) | Shape of a single registry entry. |
 | [ServingEndpointRegistry](Interface.ServingEndpointRegistry.md) | Registry interface for serving endpoint type generation. Empty by default — augmented by the Vite type generator's `.d.ts` output via module augmentation. When populated, provides autocomplete for alias names and typed request/response/chunk per endpoint. |
 | [StreamExecutionSettings](Interface.StreamExecutionSettings.md) | Execution settings for streaming endpoints. Extends PluginExecutionSettings with SSE stream configuration. |
 | [TelemetryConfig](Interface.TelemetryConfig.md) | OpenTelemetry configuration for AppKit applications |
+| [Thread](Interface.Thread.md) | - |
+| [ThreadStore](Interface.ThreadStore.md) | - |
+| [ToolConfig](Interface.ToolConfig.md) | - |
+| [ToolkitEntry](Interface.ToolkitEntry.md) | A tool reference produced by a plugin's `.toolkit()` call. The agents plugin recognizes the `__toolkitRef` brand and dispatches tool invocations through `PluginContext.executeTool(req, pluginName, localName, ...)`, preserving OBO (asUser) and telemetry spans. |
+| [ToolkitOptions](Interface.ToolkitOptions.md) | - |
+| [ToolProvider](Interface.ToolProvider.md) | - |
 | [ValidationResult](Interface.ValidationResult.md) | Result of validating all registered resources against the environment. |
 
 ## Type Aliases
 
 | Type Alias | Description |
 | ------ | ------ |
+| [AgentEvent](TypeAlias.AgentEvent.md) | - |
+| [AgentTool](TypeAlias.AgentTool.md) | Any tool an agent can invoke: inline function tools (`tool()`), hosted MCP tools (`mcpServer()` / raw hosted), or toolkit references from plugins (`analytics().toolkit()`). |
+| [AgentTools](TypeAlias.AgentTools.md) | Per-agent tool record. String keys map to inline tools, toolkit entries, hosted tools, etc. Symbol keys hold `FromPluginMarker` references produced by `fromPlugin(factory)` spreads — these are resolved at `AgentsPlugin.setup()` time against registered `ToolProvider` plugins. |
+| [BaseSystemPromptOption](TypeAlias.BaseSystemPromptOption.md) | - |
 | [ConfigSchema](TypeAlias.ConfigSchema.md) | Configuration schema definition for plugin config. Re-exported from the standard JSON Schema Draft 7 types. |
 | [ExecutionResult](TypeAlias.ExecutionResult.md) | Discriminated union for plugin execution results. |
+| [HostedTool](TypeAlias.HostedTool.md) | - |
 | [IAppRouter](TypeAlias.IAppRouter.md) | Express router type for plugin route registration |
 | [PluginData](TypeAlias.PluginData.md) | Tuple of plugin class, config, and name. Created by `toPlugin()` and passed to `createApp()`. |
 | [ResourcePermission](TypeAlias.ResourcePermission.md) | Union of all possible permission levels across all resource types. |
@@ -65,6 +88,7 @@ plugin architecture, and React integration.
 
 | Variable | Description |
 | ------ | ------ |
+| [agents](Variable.agents.md) | Plugin factory for the agents plugin. Reads `config/agents/*.md` by default, resolves toolkits/tools from registered plugins, exposes `appkit.agents.*` runtime API and mounts `/invocations`. |
 | [sql](Variable.sql.md) | SQL helper namespace |
 
 ## Functions
@@ -73,10 +97,12 @@ plugin architecture, and React integration.
 | ------ | ------ |
 | [appKitServingTypesPlugin](Function.appKitServingTypesPlugin.md) | Vite plugin to generate TypeScript types for AppKit serving endpoints. Fetches OpenAPI schemas from Databricks and generates a .d.ts with ServingEndpointRegistry module augmentation. |
 | [appKitTypesPlugin](Function.appKitTypesPlugin.md) | Vite plugin to generate types for AppKit queries. Calls generateFromEntryPoint under the hood. |
+| [createAgent](Function.createAgent.md) | Pure factory for agent definitions. Returns the passed-in definition after cycle-detecting the sub-agent graph. Accepts the full `AgentDefinition` shape and is safe to call at module top-level. |
 | [createApp](Function.createApp.md) | Bootstraps AppKit with the provided configuration. |
 | [createLakebasePool](Function.createLakebasePool.md) | Create a Lakebase pool with appkit's logger integration. Telemetry automatically uses appkit's OpenTelemetry configuration via global registry. |
 | [extractServingEndpoints](Function.extractServingEndpoints.md) | Extract serving endpoint config from a server file by AST-parsing it. Looks for `serving({ endpoints: { alias: { env: "..." }, ... } })` calls and extracts the endpoint alias names and their environment variable mappings. |
 | [findServerFile](Function.findServerFile.md) | Find the server entry file by checking candidate paths in order. |
+| [fromPlugin](Function.fromPlugin.md) | Reference a plugin's tools inside an `AgentDefinition.tools` record without naming the plugin instance. The returned spread-friendly object carries a symbol-keyed marker that the agents plugin resolves against registered `ToolProvider`s at setup time. |
 | [generateDatabaseCredential](Function.generateDatabaseCredential.md) | Generate OAuth credentials for Postgres database connection using the proper Postgres API. |
 | [getExecutionContext](Function.getExecutionContext.md) | Get the current execution context. |
 | [getLakebaseOrmConfig](Function.getLakebaseOrmConfig.md) | Get Lakebase connection configuration for ORMs that don't accept pg.Pool directly. |
@@ -85,4 +111,13 @@ plugin architecture, and React integration.
 | [getResourceRequirements](Function.getResourceRequirements.md) | Gets the resource requirements from a plugin's manifest. |
 | [getUsernameWithApiLookup](Function.getUsernameWithApiLookup.md) | Resolves the PostgreSQL username for a Lakebase connection. |
 | [getWorkspaceClient](Function.getWorkspaceClient.md) | Get workspace client from config or SDK default auth chain |
+| [isFromPluginMarker](Function.isFromPluginMarker.md) | Type guard for [FromPluginMarker](Interface.FromPluginMarker.md). |
+| [isFunctionTool](Function.isFunctionTool.md) | - |
+| [isHostedTool](Function.isHostedTool.md) | - |
 | [isSQLTypeMarker](Function.isSQLTypeMarker.md) | Type guard to check if a value is a SQL type marker |
+| [isToolkitEntry](Function.isToolkitEntry.md) | Type guard for `ToolkitEntry` — used by the agents plugin to differentiate toolkit references from inline tools in a mixed `tools` record. |
+| [loadAgentFromFile](Function.loadAgentFromFile.md) | Loads a single markdown agent file and resolves its frontmatter against registered plugin toolkits + ambient tool library. |
+| [loadAgentsFromDir](Function.loadAgentsFromDir.md) | Scans a directory for `*.md` files and produces an `AgentDefinition` record keyed by file-stem. Throws on frontmatter errors or unresolved references. Returns an empty map if the directory does not exist. |
+| [mcpServer](Function.mcpServer.md) | Factory for declaring a custom MCP server tool. |
+| [runAgent](Function.runAgent.md) | Standalone agent execution without `createApp`. Resolves the adapter, binds inline tools, and drives the adapter's `run()` loop to completion. |
+| [tool](Function.tool.md) | Factory for defining function tools with Zod schemas. |
diff --git a/docs/docs/api/appkit/typedoc-sidebar.ts b/docs/docs/api/appkit/typedoc-sidebar.ts
index 720c78ea..cf001fcc 100644
--- a/docs/docs/api/appkit/typedoc-sidebar.ts
+++ b/docs/docs/api/appkit/typedoc-sidebar.ts
@@ -82,6 +82,36 @@ const typedocSidebar: SidebarsConfig = {
       type: "category",
       label: "Interfaces",
       items: [
+        {
+          type: "doc",
+          id: "api/appkit/Interface.AgentAdapter",
+          label: "AgentAdapter"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.AgentDefinition",
+          label: "AgentDefinition"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.AgentInput",
+          label: "AgentInput"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.AgentRunContext",
+          label: "AgentRunContext"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.AgentsPluginConfig",
+          label: "AgentsPluginConfig"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.AgentToolDefinition",
+          label: "AgentToolDefinition"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.BasePluginConfig",
@@ -102,6 +132,16 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Interface.EndpointConfig",
           label: "EndpointConfig"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.FromPluginMarker",
+          label: "FromPluginMarker"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.FunctionTool",
+          label: "FunctionTool"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.GenerateDatabaseCredentialRequest",
@@ -117,11 +157,21 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Interface.LakebasePoolConfig",
           label: "LakebasePoolConfig"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.Message",
+          label: "Message"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.PluginManifest",
           label: "PluginManifest"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.PromptContext",
+          label: "PromptContext"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.RequestedClaims",
@@ -147,6 +197,16 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Interface.ResourceRequirement",
           label: "ResourceRequirement"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.RunAgentInput",
+          label: "RunAgentInput"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.RunAgentResult",
+          label: "RunAgentResult"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.ServingEndpointEntry",
@@ -167,6 +227,36 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Interface.TelemetryConfig",
           label: "TelemetryConfig"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.Thread",
+          label: "Thread"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.ThreadStore",
+          label: "ThreadStore"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.ToolConfig",
+          label: "ToolConfig"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.ToolkitEntry",
+          label: "ToolkitEntry"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.ToolkitOptions",
+          label: "ToolkitOptions"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Interface.ToolProvider",
+          label: "ToolProvider"
+        },
         {
           type: "doc",
           id: "api/appkit/Interface.ValidationResult",
@@ -178,6 +268,26 @@ const typedocSidebar: SidebarsConfig = {
       type: "category",
       label: "Type Aliases",
       items: [
+        {
+          type: "doc",
+          id: "api/appkit/TypeAlias.AgentEvent",
+          label: "AgentEvent"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/TypeAlias.AgentTool",
+          label: "AgentTool"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/TypeAlias.AgentTools",
+          label: "AgentTools"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/TypeAlias.BaseSystemPromptOption",
+          label: "BaseSystemPromptOption"
+        },
         {
           type: "doc",
           id: "api/appkit/TypeAlias.ConfigSchema",
@@ -188,6 +298,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/TypeAlias.ExecutionResult",
           label: "ExecutionResult"
         },
+        {
+          type: "doc",
+          id: "api/appkit/TypeAlias.HostedTool",
+          label: "HostedTool"
+        },
         {
           type: "doc",
           id: "api/appkit/TypeAlias.IAppRouter",
@@ -219,6 +334,11 @@ const typedocSidebar: SidebarsConfig = {
       type: "category",
       label: "Variables",
       items: [
+        {
+          type: "doc",
+          id: "api/appkit/Variable.agents",
+          label: "agents"
+        },
         {
           type: "doc",
           id: "api/appkit/Variable.sql",
@@ -240,6 +360,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Function.appKitTypesPlugin",
           label: "appKitTypesPlugin"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Function.createAgent",
+          label: "createAgent"
+        },
         {
           type: "doc",
           id: "api/appkit/Function.createApp",
@@ -260,6 +385,11 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Function.findServerFile",
           label: "findServerFile"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Function.fromPlugin",
+          label: "fromPlugin"
+        },
         {
           type: "doc",
           id: "api/appkit/Function.generateDatabaseCredential",
@@ -300,10 +430,55 @@ const typedocSidebar: SidebarsConfig = {
           id: "api/appkit/Function.getWorkspaceClient",
           label: "getWorkspaceClient"
         },
+        {
+          type: "doc",
+          id: "api/appkit/Function.isFromPluginMarker",
+          label: "isFromPluginMarker"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.isFunctionTool",
+          label: "isFunctionTool"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.isHostedTool",
+          label: "isHostedTool"
+        },
         {
           type: "doc",
           id: "api/appkit/Function.isSQLTypeMarker",
           label: "isSQLTypeMarker"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.isToolkitEntry",
+          label: "isToolkitEntry"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.loadAgentFromFile",
+          label: "loadAgentFromFile"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.loadAgentsFromDir",
+          label: "loadAgentsFromDir"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.mcpServer",
+          label: "mcpServer"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.runAgent",
+          label: "runAgent"
+        },
+        {
+          type: "doc",
+          id: "api/appkit/Function.tool",
+          label: "tool"
         }
       ]
     }
diff --git a/docs/docs/plugins/agents.md b/docs/docs/plugins/agents.md
new file mode 100644
index 00000000..adf8dd69
--- /dev/null
+++ b/docs/docs/plugins/agents.md
@@ -0,0 +1,237 @@
+# Agents
+
+The `agents` plugin turns a Databricks AppKit app into an AI-agent host. It loads agent definitions from markdown files (convention: `config/agents/*.md`), from TypeScript (`createAgent(def)`), or both, and exposes them at `POST /invocations` alongside routes for chat, thread management, and cancellation.
+
+This page covers the full lifecycle. For the hand-written primitives, see the API reference for [`tool()`](../api/appkit/Function.tool.md) and [`mcpServer()`](../api/appkit/Function.mcpServer.md).
+
+## Install
+
+`agents` is a regular plugin. Add it to `plugins[]` alongside `server()` and any ToolProvider plugins whose tools you want agents to reach.
+
+```ts
+import { agents, analytics, createApp, files, server } from "@databricks/appkit";
+
+await createApp({
+  plugins: [server(), analytics(), files(), agents()],
+});
+```
+
+That alone gives you a live HTTP server with `POST /invocations` wired to a markdown-driven agent.
+
+## Level 1: drop a markdown file
+
+```
+my-app/
+  server.ts
+  config/agents/
+    assistant.md
+```
+
+```md
+---
+endpoint: databricks-claude-sonnet-4-5
+default: true
+---
+
+You are a helpful data assistant running on Databricks.
+
+Use the available tools to query data, browse files, and help users.
+```
+
+On startup the plugin:
+
+1. Discovers the file at `./config/agents/assistant.md`.
+2. Parses the YAML frontmatter for configuration and uses the markdown body as the agent's `instructions`.
+3. Resolves the adapter from `endpoint` (or falls back to `DATABRICKS_AGENT_ENDPOINT`).
+4. Auto-inherits every registered ToolProvider plugin's tools (`analytics.*`, `files.*`, …).
+5. Registers the agent under its file-stem name (`assistant`); `default: true` makes it the default agent.
+
+Requests land at `POST /invocations` with an OpenAI Responses-compatible body. Every tool call runs through `asUser(req)` so SQL executes as the requesting user, file access respects Unity Catalog ACLs, and telemetry spans are created automatically.
+
+## Level 2: scope tools in frontmatter
+
+```md
+---
+endpoint: databricks-claude-sonnet-4-5
+toolkits:
+  - analytics                             # all analytics.* tools
+  - files: [uploads.read, uploads.list]   # only these files tools
+  - genie: { except: [getConversation] }  # everything but getConversation
+tools: [get_weather]                      # ambient tool declared in code
+default: true
+---
+
+You are a read-only data analyst.
+```
+
+When either `toolkits:` or `tools:` is declared, the auto-inherit default is turned off — the agent sees exactly the listed tools. Ambient tools (`tools: [get_weather]`) are looked up by key in the `agents({ tools: { ... } })` config.
+
+## Level 3: code-defined agents
+
+```ts
+import {
+  agents,
+  analytics,
+  createAgent,
+  createApp,
+  files,
+  fromPlugin,
+  server,
+  tool,
+} from "@databricks/appkit";
+import { z } from "zod";
+
+const support = createAgent({
+  instructions: "You help customers with data and files.",
+  model: "databricks-claude-sonnet-4-5",                  // string sugar
+  tools: {
+    ...fromPlugin(analytics),                             // all analytics tools
+    ...fromPlugin(files, { only: ["uploads.read"] }),     // filtered subset
+    get_weather: tool({
+      name: "get_weather",
+      description: "Weather",
+      schema: z.object({ city: z.string() }),
+      execute: async ({ city }) => `Sunny in ${city}`,
+    }),
+  },
+});
+
+await createApp({
+  plugins: [server(), analytics(), files(), agents({ agents: { support } })],
+});
+```
+
+Code-defined agents start with no tools by default. `fromPlugin(factory)` is the primary way to pull in a plugin's tools — it returns a spread-friendly marker that the agents plugin resolves against registered `ToolProvider`s at setup time. No intermediate plugin-instance variables (`analyticsP`, `filesP`, …) are needed: you pass the factory reference to `fromPlugin` and call the factory as usual in `plugins: [...]`.
+
+The asymmetry (file: auto-inherit, code: strict) matches the personas: prompt authors want zero ceremony, engineers want no surprises.
+
+### Scoping tools in code
+
+`fromPlugin(factory, opts?)` accepts the same `ToolkitOptions` as markdown frontmatter:
+
+| Option | Example | Meaning |
+|---|---|---|
+| `only` | `{ only: ["query"] }` | Allowlist of local tool names |
+| `except` | `{ except: ["legacy"] }` | Denylist of local tool names |
+| `prefix` | `{ prefix: "" }` | Key prefix for each tool (default `${pluginName}.`); `""` drops the prefix |
+| `rename` | `{ rename: { query: "q" } }` | Remap specific local names |
+
+For plugins that don't expose a `.toolkit()` method (e.g., third-party `ToolProvider` plugins authored with plain `toPlugin`), `fromPlugin` falls back to walking `getAgentTools()` and synthesizing namespaced keys (`${pluginName}.${localName}`). The fallback respects `only` / `except` / `rename` / `prefix` the same way.
+
+If a referenced plugin is not registered in `createApp({ plugins })`, the agents plugin throws at setup with an `Available: …` listing so you can fix the wiring before the first request.
+
+## Level 4: sub-agents
+
+```ts
+const researcher = createAgent({
+  instructions: "Research the question. Return concise bullets.",
+  model: "databricks-claude-sonnet-4-5",
+  tools: { search: tool({ /* ... */ }) },
+});
+
+const writer = createAgent({
+  instructions: "Draft prose from notes.",
+  model: "databricks-claude-sonnet-4-5",
+});
+
+const supervisor = createAgent({
+  instructions: "Coordinate researcher and writer.",
+  model: "databricks-claude-sonnet-4-5",
+  agents: { researcher, writer },  // exposed as agent-researcher, agent-writer
+});
+
+await createApp({
+  plugins: [
+    server(),
+    agents({ agents: { supervisor, researcher, writer } }),
+  ],
+});
+```
+
+Each key in `agents: {...}` on an `AgentDefinition` becomes an `agent-<key>` tool on the parent. When invoked, the agents plugin runs the child's adapter with a fresh message list (no shared thread state) and returns the aggregated text. Cycles are rejected at load time.
+
+## Level 5: standalone (no `createApp`)
+
+```ts
+import { createAgent, runAgent, tool } from "@databricks/appkit";
+import { z } from "zod";
+
+const classifier = createAgent({
+  instructions: "Classify tickets: billing | bug | feature.",
+  model: "databricks-claude-sonnet-4-5",
+  tools: {
+    lookup_account: tool({ /* ... */ }),
+  },
+});
+
+for (const ticket of tickets) {
+  const result = await runAgent(classifier, {
+    messages: [{ role: "user", content: ticket.body }],
+  });
+  await persistClassification(ticket.id, result.text);
+}
+```
+
+`runAgent` drives the adapter without `createApp` or HTTP. Inline `tool()` calls work standalone as shown above. To use plugin tools in standalone mode, pass the plugin factories through `RunAgentInput.plugins` — `runAgent` will resolve any `fromPlugin` markers in the def against that list:
+
+```ts
+import { analytics, createAgent, fromPlugin, runAgent } from "@databricks/appkit";
+
+const classifier = createAgent({
+  instructions: "Classify tickets. Use analytics.query for historical data.",
+  model: "databricks-claude-sonnet-4-5",
+  tools: { ...fromPlugin(analytics) },
+});
+
+const result = await runAgent(classifier, {
+  messages: "is ticket 42 a duplicate?",
+  plugins: [analytics()],
+});
+```
+
+Hosted tools (MCP) are still `agents()`-only since they require the live MCP client. Plugin tool dispatch in standalone mode runs as the service principal (no OBO) since there is no HTTP request.
+
+## Configuration reference
+
+```ts
+agents({
+  dir?: string | false,         // "./config/agents" default; false disables
+  agents?: Record<string, AgentDefinition>,
+  defaultAgent?: string,
+  defaultModel?: AgentAdapter | Promise<AgentAdapter> | string,
+  tools?: Record<string, AgentTool>,
+  autoInheritTools?: boolean | { file?: boolean, code?: boolean },
+  threadStore?: ThreadStore,    // default in-memory
+  baseSystemPrompt?: false | string | ((ctx: PromptContext) => string),
+})
+```
+
+`autoInheritTools` defaults to `{ file: true, code: false }`. Boolean shorthand applies to both.
+
+## Runtime API
+
+After `createApp`, the plugin exposes:
+
+```ts
+appkit.agents.list();               // => ["support", "researcher", ...]
+appkit.agents.get("support");       // => RegisteredAgent | null
+appkit.agents.getDefault();         // => "support"
+appkit.agents.register(name, def);  // dynamic registration
+appkit.agents.reload();             // re-scan the directory
+appkit.agents.getThreads(userId);   // list user's threads
+```
+
+## Frontmatter schema
+
+| Key | Type | Notes |
+|---|---|---|
+| `endpoint` | string | Model serving endpoint name. Shortcut for `model`. |
+| `model` | string | Same as `endpoint`; either works. |
+| `toolkits` | array of string or `{ name: options }` | Spread plugin toolkits. Supports `only`, `except`, `rename`, `prefix`. |
+| `tools` | array of string | Keys into `agents({ tools: {...} })`. |
+| `default` | boolean | First file with `default: true` becomes the default agent. |
+| `maxSteps` | number | Adapter max-step hint. |
+| `maxTokens` | number | Adapter max-token hint. |
+| `baseSystemPrompt` | false \| string | Per-agent override. `false` disables the AppKit base prompt. |
+
+Unknown keys are logged and ignored. Invalid YAML and missing plugin/tool references throw at boot.
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index 307f44cf..86791f22 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -81,6 +81,76 @@ importers:
         specifier: 3.2.4
         version: 3.2.4(@types/debug@4.1.12)(@types/node@24.7.2)(jiti@2.6.1)(jsdom@27.0.0(bufferutil@4.0.9)(postcss@8.5.6))(lightningcss@1.30.2)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2)
 
+  apps/agent-app:
+    dependencies:
+      '@databricks/appkit':
+        specifier: workspace:*
+        version: link:../../packages/appkit
+      '@databricks/appkit-ui':
+        specifier: workspace:*
+        version: link:../../packages/appkit-ui
+      '@databricks/sdk-experimental':
+        specifier: ^0.16.0
+        version: 0.16.0
+      dotenv:
+        specifier: ^16.6.1
+        version: 16.6.1
+      lucide-react:
+        specifier: ^0.511.0
+        version: 0.511.0(react@19.2.0)
+      marked:
+        specifier: ^15.0.0
+        version: 15.0.12
+      react:
+        specifier: 19.2.0
+        version: 19.2.0
+      react-dom:
+        specifier: 19.2.0
+        version: 19.2.0(react@19.2.0)
+      zod:
+        specifier: ^4.0.0
+        version: 4.1.13
+    devDependencies:
+      '@tailwindcss/postcss':
+        specifier: 4.1.17
+        version: 4.1.17
+      '@types/node':
+        specifier: 24.10.1
+        version: 24.10.1
+      '@types/react':
+        specifier: 19.2.7
+        version: 19.2.7
+      '@types/react-dom':
+        specifier: 19.2.3
+        version: 19.2.3(@types/react@19.2.7)
+      '@vitejs/plugin-react':
+        specifier: 5.1.1
+        version: 5.1.1(rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2))
+      autoprefixer:
+        specifier: 10.4.21
+        version: 10.4.21(postcss@8.5.6)
+      postcss:
+        specifier: 8.5.6
+        version: 8.5.6
+      tailwindcss:
+        specifier: 4.1.17
+        version: 4.1.17
+      tailwindcss-animate:
+        specifier: 1.0.7
+        version: 1.0.7(tailwindcss@4.1.17)
+      tsx:
+        specifier: 4.20.6
+        version: 4.20.6
+      tw-animate-css:
+        specifier: 1.4.0
+        version: 1.4.0
+      typescript:
+        specifier: 5.9.3
+        version: 5.9.3
+      vite:
+        specifier: npm:rolldown-vite@7.1.14
+        version: rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2)
+
   apps/clean-app:
     dependencies:
       '@databricks/appkit':
@@ -2194,15 +2264,9 @@ packages:
     resolution: {integrity: sha512-lBSBiRruFurFKXr5Hbsl2thmGweAPmddhF3jb99U4EMDA5L+e5Y1rAkOS07Nvrup7HUMBDrCV45meaxZnt28nQ==}
     engines: {node: '>=20.0'}
 
-  '@emnapi/core@1.7.1':
-    resolution: {integrity: sha512-o1uhUASyo921r2XtHYOHy7gdkGLge8ghBEQHMWmyJFoXlpU58kIrhhN3w26lpQb6dspetweapMn2CSNwQ8I4wg==}
-
   '@emnapi/core@1.8.1':
     resolution: {integrity: sha512-AvT9QFpxK0Zd8J0jopedNm+w/2fIzvtPKPjqyw9jwvBaReTTqPBk9Hixaz7KbjimP+QNz605/XnjFcDAL2pqBg==}
 
-  '@emnapi/runtime@1.7.1':
-    resolution: {integrity: sha512-PVtJr5CmLwYAU9PZDMITZoR5iAOShYREoR45EyyLrbntV50mdePTgUn4AmOw90Ifcj+x2kRjdzr1HP3RrNiHGA==}
-
   '@emnapi/runtime@1.8.1':
     resolution: {integrity: sha512-mehfKSMWjjNol8659Z8KxEMrdSJDDot5SXMq00dM8BN4o+CLNXQ0xH2V7EchNHV4RmbZLmmPdEaXZc5H2FXmDg==}
 
@@ -2708,9 +2772,6 @@ packages:
   '@mermaid-js/parser@0.6.3':
     resolution: {integrity: sha512-lnjOhe7zyHjc+If7yT4zoedx2vo4sHaTmtkl1+or8BRTnCtDmcTpAjpzDSfCZrshM5bCoz0GyidzadJAH1xobA==}
 
-  '@napi-rs/wasm-runtime@1.0.7':
-    resolution: {integrity: sha512-SeDnOO0Tk7Okiq6DbXmmBODgOAb9dp9gjlphokTUxmt8U3liIP1ZsozBahH69j/RJv+Rfs6IwUKHTgQYJ/HBAw==}
-
   '@napi-rs/wasm-runtime@1.1.1':
     resolution: {integrity: sha512-p64ah1M1ld8xjWv3qbvFwHiFVWrq1yFvV4f7w+mzaqiR4IlSgkqhcRdHwsGgomwzBH51sRY4NEowLxnaBjcW/A==}
 
@@ -4662,39 +4723,79 @@ packages:
     resolution: {integrity: sha512-+PmQX0PiAYPMeVYe237LJAYvOMYW1j2rH5YROyS3b4CTVJum34HfRvKvAzozHAQG0TnHNdUfY9nCeUyRAs//cw==}
     engines: {node: '>=14.16'}
 
+  '@tailwindcss/node@4.1.17':
+    resolution: {integrity: sha512-csIkHIgLb3JisEFQ0vxr2Y57GUNYh447C8xzwj89U/8fdW8LhProdxvnVH6U8M2Y73QKiTIH+LWbK3V2BBZsAg==}
+
   '@tailwindcss/node@4.1.18':
     resolution: {integrity: sha512-DoR7U1P7iYhw16qJ49fgXUlry1t4CpXeErJHnQ44JgTSKMaZUdf17cfn5mHchfJ4KRBZRFA/Coo+MUF5+gOaCQ==}
 
+  '@tailwindcss/oxide-android-arm64@4.1.17':
+    resolution: {integrity: sha512-BMqpkJHgOZ5z78qqiGE6ZIRExyaHyuxjgrJ6eBO5+hfrfGkuya0lYfw8fRHG77gdTjWkNWEEm+qeG2cDMxArLQ==}
+    engines: {node: '>= 10'}
+    cpu: [arm64]
+    os: [android]
+
   '@tailwindcss/oxide-android-arm64@4.1.18':
     resolution: {integrity: sha512-dJHz7+Ugr9U/diKJA0W6N/6/cjI+ZTAoxPf9Iz9BFRF2GzEX8IvXxFIi/dZBloVJX/MZGvRuFA9rqwdiIEZQ0Q==}
     engines: {node: '>= 10'}
     cpu: [arm64]
     os: [android]
 
+  '@tailwindcss/oxide-darwin-arm64@4.1.17':
+    resolution: {integrity: sha512-EquyumkQweUBNk1zGEU/wfZo2qkp/nQKRZM8bUYO0J+Lums5+wl2CcG1f9BgAjn/u9pJzdYddHWBiFXJTcxmOg==}
+    engines: {node: '>= 10'}
+    cpu: [arm64]
+    os: [darwin]
+
   '@tailwindcss/oxide-darwin-arm64@4.1.18':
     resolution: {integrity: sha512-Gc2q4Qhs660bhjyBSKgq6BYvwDz4G+BuyJ5H1xfhmDR3D8HnHCmT/BSkvSL0vQLy/nkMLY20PQ2OoYMO15Jd0A==}
     engines: {node: '>= 10'}
     cpu: [arm64]
     os: [darwin]
 
+  '@tailwindcss/oxide-darwin-x64@4.1.17':
+    resolution: {integrity: sha512-gdhEPLzke2Pog8s12oADwYu0IAw04Y2tlmgVzIN0+046ytcgx8uZmCzEg4VcQh+AHKiS7xaL8kGo/QTiNEGRog==}
+    engines: {node: '>= 10'}
+    cpu: [x64]
+    os: [darwin]
+
   '@tailwindcss/oxide-darwin-x64@4.1.18':
     resolution: {integrity: sha512-FL5oxr2xQsFrc3X9o1fjHKBYBMD1QZNyc1Xzw/h5Qu4XnEBi3dZn96HcHm41c/euGV+GRiXFfh2hUCyKi/e+yw==}
     engines: {node: '>= 10'}
     cpu: [x64]
     os: [darwin]
 
+  '@tailwindcss/oxide-freebsd-x64@4.1.17':
+    resolution: {integrity: sha512-hxGS81KskMxML9DXsaXT1H0DyA+ZBIbyG/sSAjWNe2EDl7TkPOBI42GBV3u38itzGUOmFfCzk1iAjDXds8Oh0g==}
+    engines: {node: '>= 10'}
+    cpu: [x64]
+    os: [freebsd]
+
   '@tailwindcss/oxide-freebsd-x64@4.1.18':
     resolution: {integrity: sha512-Fj+RHgu5bDodmV1dM9yAxlfJwkkWvLiRjbhuO2LEtwtlYlBgiAT4x/j5wQr1tC3SANAgD+0YcmWVrj8R9trVMA==}
     engines: {node: '>= 10'}
     cpu: [x64]
     os: [freebsd]
 
+  '@tailwindcss/oxide-linux-arm-gnueabihf@4.1.17':
+    resolution: {integrity: sha512-k7jWk5E3ldAdw0cNglhjSgv501u7yrMf8oeZ0cElhxU6Y2o7f8yqelOp3fhf7evjIS6ujTI3U8pKUXV2I4iXHQ==}
+    engines: {node: '>= 10'}
+    cpu: [arm]
+    os: [linux]
+
   '@tailwindcss/oxide-linux-arm-gnueabihf@4.1.18':
     resolution: {integrity: sha512-Fp+Wzk/Ws4dZn+LV2Nqx3IilnhH51YZoRaYHQsVq3RQvEl+71VGKFpkfHrLM/Li+kt5c0DJe/bHXK1eHgDmdiA==}
     engines: {node: '>= 10'}
     cpu: [arm]
     os: [linux]
 
+  '@tailwindcss/oxide-linux-arm64-gnu@4.1.17':
+    resolution: {integrity: sha512-HVDOm/mxK6+TbARwdW17WrgDYEGzmoYayrCgmLEw7FxTPLcp/glBisuyWkFz/jb7ZfiAXAXUACfyItn+nTgsdQ==}
+    engines: {node: '>= 10'}
+    cpu: [arm64]
+    os: [linux]
+    libc: [glibc]
+
   '@tailwindcss/oxide-linux-arm64-gnu@4.1.18':
     resolution: {integrity: sha512-S0n3jboLysNbh55Vrt7pk9wgpyTTPD0fdQeh7wQfMqLPM/Hrxi+dVsLsPrycQjGKEQk85Kgbx+6+QnYNiHalnw==}
     engines: {node: '>= 10'}
@@ -4702,6 +4803,13 @@ packages:
     os: [linux]
     libc: [glibc]
 
+  '@tailwindcss/oxide-linux-arm64-musl@4.1.17':
+    resolution: {integrity: sha512-HvZLfGr42i5anKtIeQzxdkw/wPqIbpeZqe7vd3V9vI3RQxe3xU1fLjss0TjyhxWcBaipk7NYwSrwTwK1hJARMg==}
+    engines: {node: '>= 10'}
+    cpu: [arm64]
+    os: [linux]
+    libc: [musl]
+
   '@tailwindcss/oxide-linux-arm64-musl@4.1.18':
     resolution: {integrity: sha512-1px92582HkPQlaaCkdRcio71p8bc8i/ap5807tPRDK/uw953cauQBT8c5tVGkOwrHMfc2Yh6UuxaH4vtTjGvHg==}
     engines: {node: '>= 10'}
@@ -4709,6 +4817,13 @@ packages:
     os: [linux]
     libc: [musl]
 
+  '@tailwindcss/oxide-linux-x64-gnu@4.1.17':
+    resolution: {integrity: sha512-M3XZuORCGB7VPOEDH+nzpJ21XPvK5PyjlkSFkFziNHGLc5d6g3di2McAAblmaSUNl8IOmzYwLx9NsE7bplNkwQ==}
+    engines: {node: '>= 10'}
+    cpu: [x64]
+    os: [linux]
+    libc: [glibc]
+
   '@tailwindcss/oxide-linux-x64-gnu@4.1.18':
     resolution: {integrity: sha512-v3gyT0ivkfBLoZGF9LyHmts0Isc8jHZyVcbzio6Wpzifg/+5ZJpDiRiUhDLkcr7f/r38SWNe7ucxmGW3j3Kb/g==}
     engines: {node: '>= 10'}
@@ -4716,6 +4831,13 @@ packages:
     os: [linux]
     libc: [glibc]
 
+  '@tailwindcss/oxide-linux-x64-musl@4.1.17':
+    resolution: {integrity: sha512-k7f+pf9eXLEey4pBlw+8dgfJHY4PZ5qOUFDyNf7SI6lHjQ9Zt7+NcscjpwdCEbYi6FI5c2KDTDWyf2iHcCSyyQ==}
+    engines: {node: '>= 10'}
+    cpu: [x64]
+    os: [linux]
+    libc: [musl]
+
   '@tailwindcss/oxide-linux-x64-musl@4.1.18':
     resolution: {integrity: sha512-bhJ2y2OQNlcRwwgOAGMY0xTFStt4/wyU6pvI6LSuZpRgKQwxTec0/3Scu91O8ir7qCR3AuepQKLU/kX99FouqQ==}
     engines: {node: '>= 10'}
@@ -4723,6 +4845,18 @@ packages:
     os: [linux]
     libc: [musl]
 
+  '@tailwindcss/oxide-wasm32-wasi@4.1.17':
+    resolution: {integrity: sha512-cEytGqSSoy7zK4JRWiTCx43FsKP/zGr0CsuMawhH67ONlH+T79VteQeJQRO/X7L0juEUA8ZyuYikcRBf0vsxhg==}
+    engines: {node: '>=14.0.0'}
+    cpu: [wasm32]
+    bundledDependencies:
+      - '@napi-rs/wasm-runtime'
+      - '@emnapi/core'
+      - '@emnapi/runtime'
+      - '@tybys/wasm-util'
+      - '@emnapi/wasi-threads'
+      - tslib
+
   '@tailwindcss/oxide-wasm32-wasi@4.1.18':
     resolution: {integrity: sha512-LffYTvPjODiP6PT16oNeUQJzNVyJl1cjIebq/rWWBF+3eDst5JGEFSc5cWxyRCJ0Mxl+KyIkqRxk1XPEs9x8TA==}
     engines: {node: '>=14.0.0'}
@@ -4735,22 +4869,41 @@ packages:
       - '@emnapi/wasi-threads'
       - tslib
 
+  '@tailwindcss/oxide-win32-arm64-msvc@4.1.17':
+    resolution: {integrity: sha512-JU5AHr7gKbZlOGvMdb4722/0aYbU+tN6lv1kONx0JK2cGsh7g148zVWLM0IKR3NeKLv+L90chBVYcJ8uJWbC9A==}
+    engines: {node: '>= 10'}
+    cpu: [arm64]
+    os: [win32]
+
   '@tailwindcss/oxide-win32-arm64-msvc@4.1.18':
     resolution: {integrity: sha512-HjSA7mr9HmC8fu6bdsZvZ+dhjyGCLdotjVOgLA2vEqxEBZaQo9YTX4kwgEvPCpRh8o4uWc4J/wEoFzhEmjvPbA==}
     engines: {node: '>= 10'}
     cpu: [arm64]
     os: [win32]
 
+  '@tailwindcss/oxide-win32-x64-msvc@4.1.17':
+    resolution: {integrity: sha512-SKWM4waLuqx0IH+FMDUw6R66Hu4OuTALFgnleKbqhgGU30DY20NORZMZUKgLRjQXNN2TLzKvh48QXTig4h4bGw==}
+    engines: {node: '>= 10'}
+    cpu: [x64]
+    os: [win32]
+
   '@tailwindcss/oxide-win32-x64-msvc@4.1.18':
     resolution: {integrity: sha512-bJWbyYpUlqamC8dpR7pfjA0I7vdF6t5VpUGMWRkXVE3AXgIZjYUYAK7II1GNaxR8J1SSrSrppRar8G++JekE3Q==}
     engines: {node: '>= 10'}
     cpu: [x64]
     os: [win32]
 
+  '@tailwindcss/oxide@4.1.17':
+    resolution: {integrity: sha512-F0F7d01fmkQhsTjXezGBLdrl1KresJTcI3DB8EkScCldyKp3Msz4hub4uyYaVnk88BAS1g5DQjjF6F5qczheLA==}
+    engines: {node: '>= 10'}
+
   '@tailwindcss/oxide@4.1.18':
     resolution: {integrity: sha512-EgCR5tTS5bUSKQgzeMClT6iCY3ToqE1y+ZB0AKldj809QXk1Y+3jB0upOYZrn9aGIzPtUsP7sX4QQ4XtjBB95A==}
     engines: {node: '>= 10'}
 
+  '@tailwindcss/postcss@4.1.17':
+    resolution: {integrity: sha512-+nKl9N9mN5uJ+M7dBOOCzINw94MPstNR/GtIhz1fpZysxL/4a+No64jCBD6CPN+bIHWFx3KWuu8XJRrj/572Dw==}
+
   '@tailwindcss/postcss@4.1.18':
     resolution: {integrity: sha512-Ce0GFnzAOuPyfV5SxjXGn0CubwGcuDB0zcdaPuCSzAa/2vII24JTkH+I6jcbXLb1ctjZMZZI6OjDaLPJQL1S0g==}
 
@@ -5536,6 +5689,13 @@ packages:
   autocomplete.js@0.37.1:
     resolution: {integrity: sha512-PgSe9fHYhZEsm/9jggbjtVsGXJkPLvd+9mC7gZJ662vVL5CRWEtm/mIrrzCx0MrNxHVwxD5d00UOn6NsmL2LUQ==}
 
+  autoprefixer@10.4.21:
+    resolution: {integrity: sha512-O+A6LWV5LDHSJD3LjHYoNi4VLsj/Whi7k6zG12xTYaU4cQ8oxQGckXNX8cRHK5yOZ/ppVHe0ZBXGzSV9jXdVbQ==}
+    engines: {node: ^10 || ^12 || >=14}
+    hasBin: true
+    peerDependencies:
+      postcss: ^8.1.0
+
   autoprefixer@10.4.23:
     resolution: {integrity: sha512-YYTXSFulfwytnjAPlw8QHncHJmlvFKtczb8InXaAx9Q0LbfDnfEYDE55omerIJKihhmU61Ft+cAOSzQVaBUmeA==}
     engines: {node: ^10 || ^12 || >=14}
@@ -7304,6 +7464,9 @@ packages:
     resolution: {integrity: sha512-buRG0fpBtRHSTCOASe6hD258tEubFoRLb4ZNA6NxMVHNw2gOcwHo9wyablzMzOA5z9xA9L1KNjk/Nt6MT9aYow==}
     engines: {node: '>= 0.6'}
 
+  fraction.js@4.3.7:
+    resolution: {integrity: sha512-ZsDfxO51wGAXREY55a7la9LScWpwv9RxIrYABrlvOFBlH/ShPnrtsXeuUIfXKKOVicNxQ+o8JTbJvjS4M89yew==}
+
   fraction.js@5.3.4:
     resolution: {integrity: sha512-1X1NTtiJphryn/uLQz3whtY6jK3fTqoE3ohKs0tT+Ujr1W59oopxmoEh7Lu5p6vBaPbgoM0bzveAW4Qi5RyWDQ==}
 
@@ -8554,6 +8717,11 @@ packages:
     resolution: {integrity: sha512-jumlc0BIUrS3qJGgIkWZsyfAM7NCWiBcCDhnd+3NNM5KbBmLTgHVfWBcg6W+rLUsIpzpERPsvwUP7CckAQSOoA==}
     engines: {node: '>=12'}
 
+  lucide-react@0.511.0:
+    resolution: {integrity: sha512-VK5a2ydJ7xm8GvBeKLS9mu1pVK6ucef9780JVUjw6bAjJL/QXnd4Y0p7SPeOUMC27YhzNCZvm5d/QX0Tp3rc0w==}
+    peerDependencies:
+      react: ^16.5.1 || ^17.0.0 || ^18.0.0 || ^19.0.0
+
   lucide-react@0.554.0:
     resolution: {integrity: sha512-St+z29uthEJVx0Is7ellNkgTEhaeSoA42I7JjOCBCrc5X6LYMGSv0P/2uS5HDLTExP5tpiqRD2PyUEOS6s9UXA==}
     peerDependencies:
@@ -8604,6 +8772,11 @@ packages:
   markdown-table@3.0.4:
     resolution: {integrity: sha512-wiYz4+JrLyb/DqW2hkFJxP7Vd7JuTDm77fvbM8VfEQdmSMqcImWeeRbHwZjBjIFki/VaMK2BhFi7oUUZeM5bqw==}
 
+  marked@15.0.12:
+    resolution: {integrity: sha512-8dD6FusOQSrpv9Z1rdNMdlSgQOIP880DHqnohobOmYLElGEqAL/JvxvuxZO16r4HtjTlfPRDC1hbvxC9dPN2nA==}
+    engines: {node: '>= 18'}
+    hasBin: true
+
   marked@16.4.2:
     resolution: {integrity: sha512-TI3V8YYWvkVf3KJe1dRkpnjs68JUPyEa5vjKrp1XEEJUAOaQc+Qj+L1qWbPd0SJuAdQkFU0h73sXXqwDYxsiDA==}
     engines: {node: '>= 20'}
@@ -9118,6 +9291,10 @@ packages:
     resolution: {integrity: sha512-6eZs5Ls3WtCisHWp9S2GUy8dqkpGi4BVSz3GaqiE6ezub0512ESztXUwUB6C6IKbQkY2Pnb/mD4WYojCRwcwLA==}
     engines: {node: '>=0.10.0'}
 
+  normalize-range@0.1.2:
+    resolution: {integrity: sha512-bdok/XvKII3nUpklnV6P2hxtMNrCboOjAcyBuQnWEhO665FwrSNRxU+AqpsyvO6LgGYPspN+lu5CLtw4jPRKNA==}
+    engines: {node: '>=0.10.0'}
+
   normalize-url@8.1.0:
     resolution: {integrity: sha512-X06Mfd/5aKsRHc0O0J5CUedwnPmnDtLF2+nq+KN9KSDlJHkPuh0JUviWjEWMe0SW/9TDdSLVPuk7L5gGTIA1/w==}
     engines: {node: '>=14.16'}
@@ -14535,23 +14712,12 @@ snapshots:
       - uglify-js
       - webpack-cli
 
-  '@emnapi/core@1.7.1':
-    dependencies:
-      '@emnapi/wasi-threads': 1.1.0
-      tslib: 2.8.1
-    optional: true
-
   '@emnapi/core@1.8.1':
     dependencies:
       '@emnapi/wasi-threads': 1.1.0
       tslib: 2.8.1
     optional: true
 
-  '@emnapi/runtime@1.7.1':
-    dependencies:
-      tslib: 2.8.1
-    optional: true
-
   '@emnapi/runtime@1.8.1':
     dependencies:
       tslib: 2.8.1
@@ -15041,13 +15207,6 @@ snapshots:
     dependencies:
       langium: 3.3.1
 
-  '@napi-rs/wasm-runtime@1.0.7':
-    dependencies:
-      '@emnapi/core': 1.7.1
-      '@emnapi/runtime': 1.7.1
-      '@tybys/wasm-util': 0.10.1
-    optional: true
-
   '@napi-rs/wasm-runtime@1.1.1':
     dependencies:
       '@emnapi/core': 1.8.1
@@ -16774,7 +16933,7 @@ snapshots:
 
   '@rolldown/binding-wasm32-wasi@1.0.0-beta.41':
     dependencies:
-      '@napi-rs/wasm-runtime': 1.0.7
+      '@napi-rs/wasm-runtime': 1.1.1
     optional: true
 
   '@rolldown/binding-wasm32-wasi@1.0.0-rc.3':
@@ -17070,6 +17229,16 @@ snapshots:
     dependencies:
       defer-to-connect: 2.0.1
 
+  '@tailwindcss/node@4.1.17':
+    dependencies:
+      '@jridgewell/remapping': 2.3.5
+      enhanced-resolve: 5.18.3
+      jiti: 2.6.1
+      lightningcss: 1.30.2
+      magic-string: 0.30.21
+      source-map-js: 1.2.1
+      tailwindcss: 4.1.17
+
   '@tailwindcss/node@4.1.18':
     dependencies:
       '@jridgewell/remapping': 2.3.5
@@ -17080,42 +17249,93 @@ snapshots:
       source-map-js: 1.2.1
       tailwindcss: 4.1.18
 
+  '@tailwindcss/oxide-android-arm64@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-android-arm64@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-darwin-arm64@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-darwin-arm64@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-darwin-x64@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-darwin-x64@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-freebsd-x64@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-freebsd-x64@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-linux-arm-gnueabihf@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-linux-arm-gnueabihf@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-linux-arm64-gnu@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-linux-arm64-gnu@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-linux-arm64-musl@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-linux-arm64-musl@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-linux-x64-gnu@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-linux-x64-gnu@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-linux-x64-musl@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-linux-x64-musl@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-wasm32-wasi@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-wasm32-wasi@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-win32-arm64-msvc@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-win32-arm64-msvc@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide-win32-x64-msvc@4.1.17':
+    optional: true
+
   '@tailwindcss/oxide-win32-x64-msvc@4.1.18':
     optional: true
 
+  '@tailwindcss/oxide@4.1.17':
+    optionalDependencies:
+      '@tailwindcss/oxide-android-arm64': 4.1.17
+      '@tailwindcss/oxide-darwin-arm64': 4.1.17
+      '@tailwindcss/oxide-darwin-x64': 4.1.17
+      '@tailwindcss/oxide-freebsd-x64': 4.1.17
+      '@tailwindcss/oxide-linux-arm-gnueabihf': 4.1.17
+      '@tailwindcss/oxide-linux-arm64-gnu': 4.1.17
+      '@tailwindcss/oxide-linux-arm64-musl': 4.1.17
+      '@tailwindcss/oxide-linux-x64-gnu': 4.1.17
+      '@tailwindcss/oxide-linux-x64-musl': 4.1.17
+      '@tailwindcss/oxide-wasm32-wasi': 4.1.17
+      '@tailwindcss/oxide-win32-arm64-msvc': 4.1.17
+      '@tailwindcss/oxide-win32-x64-msvc': 4.1.17
+
   '@tailwindcss/oxide@4.1.18':
     optionalDependencies:
       '@tailwindcss/oxide-android-arm64': 4.1.18
@@ -17131,6 +17351,14 @@ snapshots:
       '@tailwindcss/oxide-win32-arm64-msvc': 4.1.18
       '@tailwindcss/oxide-win32-x64-msvc': 4.1.18
 
+  '@tailwindcss/postcss@4.1.17':
+    dependencies:
+      '@alloc/quick-lru': 5.2.0
+      '@tailwindcss/node': 4.1.17
+      '@tailwindcss/oxide': 4.1.17
+      postcss: 8.5.6
+      tailwindcss: 4.1.17
+
   '@tailwindcss/postcss@4.1.18':
     dependencies:
       '@alloc/quick-lru': 5.2.0
@@ -17712,6 +17940,18 @@ snapshots:
     transitivePeerDependencies:
       - supports-color
 
+  '@vitejs/plugin-react@5.1.1(rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2))':
+    dependencies:
+      '@babel/core': 7.28.5
+      '@babel/plugin-transform-react-jsx-self': 7.27.1(@babel/core@7.28.5)
+      '@babel/plugin-transform-react-jsx-source': 7.27.1(@babel/core@7.28.5)
+      '@rolldown/pluginutils': 1.0.0-beta.47
+      '@types/babel__core': 7.20.5
+      react-refresh: 0.18.0
+      vite: rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2)
+    transitivePeerDependencies:
+      - supports-color
+
   '@vitejs/plugin-react@5.1.1(rolldown-vite@7.1.14(@types/node@25.2.3)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2))':
     dependencies:
       '@babel/core': 7.28.5
@@ -18094,6 +18334,16 @@ snapshots:
     dependencies:
       immediate: 3.3.0
 
+  autoprefixer@10.4.21(postcss@8.5.6):
+    dependencies:
+      browserslist: 4.28.1
+      caniuse-lite: 1.0.30001760
+      fraction.js: 4.3.7
+      normalize-range: 0.1.2
+      picocolors: 1.1.1
+      postcss: 8.5.6
+      postcss-value-parser: 4.2.0
+
   autoprefixer@10.4.23(postcss@8.5.6):
     dependencies:
       browserslist: 4.28.1
@@ -18927,7 +19177,7 @@ snapshots:
 
   cssnano-preset-advanced@6.1.2(postcss@8.5.6):
     dependencies:
-      autoprefixer: 10.4.23(postcss@8.5.6)
+      autoprefixer: 10.4.21(postcss@8.5.6)
       browserslist: 4.28.1
       cssnano-preset-default: 6.1.2(postcss@8.5.6)
       postcss: 8.5.6
@@ -19959,6 +20209,8 @@ snapshots:
 
   forwarded@0.2.0: {}
 
+  fraction.js@4.3.7: {}
+
   fraction.js@5.3.4: {}
 
   fresh@0.5.2: {}
@@ -21389,6 +21641,10 @@ snapshots:
 
   lru-cache@7.18.3: {}
 
+  lucide-react@0.511.0(react@19.2.0):
+    dependencies:
+      react: 19.2.0
+
   lucide-react@0.554.0(react@19.2.0):
     dependencies:
       react: 19.2.0
@@ -21452,6 +21708,8 @@ snapshots:
 
   markdown-table@3.0.4: {}
 
+  marked@15.0.12: {}
+
   marked@16.4.2: {}
 
   marked@17.0.3: {}
@@ -22239,6 +22497,8 @@ snapshots:
 
   normalize-path@3.0.0: {}
 
+  normalize-range@0.1.2: {}
+
   normalize-url@8.1.0: {}
 
   normalize-url@8.1.1: {}
@@ -23758,6 +24018,24 @@ snapshots:
       tsx: 4.20.6
       yaml: 2.8.2
 
+  rolldown-vite@7.1.14(@types/node@24.10.1)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2):
+    dependencies:
+      '@oxc-project/runtime': 0.92.0
+      fdir: 6.5.0(picomatch@4.0.3)
+      lightningcss: 1.30.2
+      picomatch: 4.0.3
+      postcss: 8.5.6
+      rolldown: 1.0.0-beta.41
+      tinyglobby: 0.2.15
+    optionalDependencies:
+      '@types/node': 24.10.1
+      esbuild: 0.25.10
+      fsevents: 2.3.3
+      jiti: 2.6.1
+      terser: 5.44.1
+      tsx: 4.20.6
+      yaml: 2.8.2
+
   rolldown-vite@7.1.14(@types/node@25.2.3)(esbuild@0.25.10)(jiti@2.6.1)(terser@5.44.1)(tsx@4.20.6)(yaml@2.8.2):
     dependencies:
       '@oxc-project/runtime': 0.92.0
diff --git a/template/appkit.plugins.json b/template/appkit.plugins.json
index d1420d2e..8a1461a8 100644
--- a/template/appkit.plugins.json
+++ b/template/appkit.plugins.json
@@ -2,6 +2,16 @@
   "$schema": "https://databricks.github.io/appkit/schemas/template-plugins.schema.json",
   "version": "1.0",
   "plugins": {
+    "agent": {
+      "name": "agent",
+      "displayName": "Agents Plugin",
+      "description": "AI agents driven by markdown configs or code, with auto-tool-discovery from registered plugins",
+      "package": "@databricks/appkit",
+      "resources": {
+        "required": [],
+        "optional": []
+      }
+    },
     "analytics": {
       "name": "analytics",
       "displayName": "Analytics Plugin",

From 208d22c980a451fce58fdf566d1fab37b38a8c02 Mon Sep 17 00:00:00 2001
From: MarioCadenas <MarioCadenas@users.noreply.github.com>
Date: Wed, 22 Apr 2026 10:31:31 +0200
Subject: [PATCH 6/6] feat(appkit): zero-trust MCP host policy with URL
 allowlist and scoped auth
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Closes the MCP-URL token-exfiltration surface identified in the agents
stack review. Before this change, `AppKitMcpClient` accepted any
`http(s)://` URL as a hosted tool endpoint and forwarded the
service-principal token (on `initialize`/`tools/list`) plus the end-user
OBO token (on `tools/call`) to whatever host the developer wrote into
`mcpServer(name, url)`. A compromised or mistyped URL, or one pointed at
`http://169.254.169.254/latest/meta-data/`, would leak workspace
credentials on connect — no user interaction required.

### Policy surface

New `mcp` field on `AgentsPluginConfig`:

```ts
agents({
  mcp: {
    trustedHosts: ["mcp.corp.internal"],
    allowLocalhost: true, // default: NODE_ENV !== "production"
  },
});
```

By default only same-origin Databricks workspace URLs are reachable.
Workspace credentials (SP or OBO) are *never* forwarded to non-workspace
hosts — trusted external MCP servers must authenticate themselves.

### Gates enforced at connect()

1. Only `http(s):` schemes.
2. `http://` refused for everything except localhost in dev mode.
3. Hostname must match workspace, equal localhost (if permitted), or be
   in `trustedHosts`.
4. Resolved DNS addresses must not land in loopback, RFC1918, CGNAT,
   link-local (blocks cloud metadata 169.254.169.254), ULA, or
   multicast ranges. IP-literal URLs in these ranges are rejected
   without a DNS lookup. Malformed IPs fail-closed.

### Auth scoping

`AppKitMcpClient.callTool` drops any caller-supplied `Authorization`
header when the destination's `forwardWorkspaceAuth` was `false` at
connect time. `sendRpc` / `sendNotification` never invoke the
workspace `authenticate()` closure when forwarding is disallowed.

### Tests

New `mcp-host-policy.test.ts` (42 tests) covers:
- trustedHosts normalization, NODE_ENV default, invalid workspace URL
- same-origin admit with auth, trusted host admit without auth
- plaintext http rejection (including "same host wrong scheme")
- non-http(s) scheme rejection
- case-insensitive hostname match
- IP blocklist: RFC1918, link-local, CGNAT, 0.0.0.0/8, multicast,
  loopback (gated by allowLocalhost), ULA, link-local IPv6,
  IPv4-mapped IPv6, malformed IP fail-closed
- DNS-backed assertResolvedHostSafe: public, metadata, RFC1918,
  DNS failure, empty result, mixed-result "split DNS" defense

New `mcp-client.test.ts` (8 tests) covers the integrated client:
- connect rejects non-allowlisted host without any fetch
- connect rejects plaintext http without any fetch
- connect rejects DNS-resolves-to-blocked-IP without any fetch
- SP token attached only on same-origin workspace RPCs
- No auth header on any RPC to trusted external host
- callTool drops OBO token when destination is external
- callTool forwards OBO when destination is workspace
- callTool falls back to SP when no OBO override

Full appkit suite: 1361 tests passing (up from 1311).
Typecheck + biome + knip + generate:types all clean.

### Drive-by

- `json-schema.ts` formatting violation fixed (pre-existing biome drift
  on the stack tip that would fail CI regardless).
- `AppKitMcpClient` now accepts an optional `{ dnsLookup, fetchImpl }`
  for dependency injection in tests.

Refs: S1 in the stack security plan (Tier 1 — critical).
Signed-off-by: MarioCadenas <MarioCadenas@users.noreply.github.com>
---
 docs/docs/plugins/agents.md                   |  33 ++
 packages/appkit/src/plugins/agents/agents.ts  |   4 +-
 .../plugins/agents/tests/mcp-client.test.ts   | 332 ++++++++++++++++++
 .../agents/tests/mcp-host-policy.test.ts      | 324 +++++++++++++++++
 .../src/plugins/agents/tools/json-schema.ts   |   4 +-
 .../src/plugins/agents/tools/mcp-client.ts    | 128 +++++--
 .../plugins/agents/tools/mcp-host-policy.ts   | 270 ++++++++++++++
 packages/appkit/src/plugins/agents/types.ts   |   8 +
 8 files changed, 1078 insertions(+), 25 deletions(-)
 create mode 100644 packages/appkit/src/plugins/agents/tests/mcp-client.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tests/mcp-host-policy.test.ts
 create mode 100644 packages/appkit/src/plugins/agents/tools/mcp-host-policy.ts

diff --git a/docs/docs/plugins/agents.md b/docs/docs/plugins/agents.md
index adf8dd69..8eeabb5e 100644
--- a/docs/docs/plugins/agents.md
+++ b/docs/docs/plugins/agents.md
@@ -203,11 +203,44 @@ agents({
   autoInheritTools?: boolean | { file?: boolean, code?: boolean },
   threadStore?: ThreadStore,    // default in-memory
   baseSystemPrompt?: false | string | (ctx: PromptContext) => string,
+  mcp?: {
+    trustedHosts?: string[],    // extra hostnames allowed for custom MCP URLs
+    allowLocalhost?: boolean,   // default: NODE_ENV !== "production"
+  },
 })
 ```
 
 `autoInheritTools` defaults to `{ file: true, code: false }`. Boolean shorthand applies to both.
 
+### MCP host policy
+
+AppKit applies a zero-trust policy to every MCP URL used as a hosted tool. By default only **same-origin Databricks workspace URLs** (matching the resolved `DATABRICKS_HOST`) may be reached. Every other host must be explicitly allowlisted via `mcp.trustedHosts`, and workspace credentials (service-principal and on-behalf-of user tokens) are **never** forwarded to those hosts.
+
+```ts
+agents({
+  agents: {
+    support: createAgent({
+      instructions: "…",
+      tools: {
+        "mcp.internal": mcpServer("internal", "https://mcp.corp.internal/mcp"),
+      },
+    }),
+  },
+  mcp: {
+    trustedHosts: ["mcp.corp.internal"],
+  },
+});
+```
+
+The policy enforces four rules at MCP `connect()` time, before any byte is sent:
+
+1. Only `http` and `https` URLs are accepted.
+2. Plaintext `http://` is rejected for every host except `localhost`, and `localhost` itself is only permitted when `allowLocalhost` is true (on by default in development, off in production).
+3. The destination hostname must match the workspace host, equal `localhost` (if permitted), or appear in `trustedHosts`.
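+4. The resolved DNS address must not fall in loopback (unless `allowLocalhost` permits it), RFC1918, CGNAT (100.64.0.0/10), link-local (169.254.0.0/16 — covers cloud metadata services), ULA, or multicast ranges. IP-literal URLs in these ranges are rejected without a DNS lookup.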
+
+`Authorization` headers carrying workspace credentials are scoped to same-origin workspace URLs. An MCP server registered with `mcpServer(name, url)` on a trusted external host never receives them and must be authenticated by other means (for example, a custom token baked into `url`).
+
 ## Runtime API
 
 After `createApp`, the plugin exposes:
diff --git a/packages/appkit/src/plugins/agents/agents.ts b/packages/appkit/src/plugins/agents/agents.ts
index c8758ac8..a4612252 100644
--- a/packages/appkit/src/plugins/agents/agents.ts
+++ b/packages/appkit/src/plugins/agents/agents.ts
@@ -34,6 +34,7 @@ import {
   isHostedTool,
   resolveHostedTools,
 } from "./tools";
+import { buildMcpHostPolicy } from "./tools/mcp-host-policy";
 import type {
   AgentDefinition,
   AgentsPluginConfig,
@@ -447,7 +448,8 @@ export class AgentsPlugin extends Plugin implements ToolProvider {
     }
 
     if (!this.mcpClient) {
-      this.mcpClient = new AppKitMcpClient(host, authenticate);
+      const policy = buildMcpHostPolicy(this.config.mcp, host);
+      this.mcpClient = new AppKitMcpClient(host, authenticate, policy);
     }
 
     const endpoints = resolveHostedTools(hostedTools);
diff --git a/packages/appkit/src/plugins/agents/tests/mcp-client.test.ts b/packages/appkit/src/plugins/agents/tests/mcp-client.test.ts
new file mode 100644
index 00000000..bee5faa3
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/mcp-client.test.ts
@@ -0,0 +1,332 @@
+import { beforeEach, describe, expect, test, vi } from "vitest";
+import { AppKitMcpClient } from "../tools/mcp-client";
+import type { DnsLookup, McpHostPolicy } from "../tools/mcp-host-policy";
+
+const WORKSPACE = "https://test-workspace.cloud.databricks.com";
+
+const workspacePolicy: McpHostPolicy = {
+  workspaceHostname: "test-workspace.cloud.databricks.com",
+  trustedHosts: new Set(),
+  allowLocalhost: false,
+};
+
+const trustedExternalPolicy: McpHostPolicy = {
+  workspaceHostname: "test-workspace.cloud.databricks.com",
+  trustedHosts: new Set(["mcp.example.com"]),
+  allowLocalhost: false,
+};
+
+const publicDnsLookup: DnsLookup = async () => [
+  { address: "203.0.113.42", family: 4 },
+];
+
+const workspaceAuth = async (): Promise<Record<string, string>> => ({
+  Authorization: "Bearer SP-TOKEN",
+});
+
+type FetchCall = {
+  url: string;
+  init: RequestInit;
+};
+
+function recordingFetch(
+  responders: Array<(call: FetchCall) => Response | Promise<Response>>,
+) {
+  const calls: FetchCall[] = [];
+  let n = 0;
+  const fetchImpl: typeof fetch = async (input, init) => {
+    const url = typeof input === "string" ? input : (input as URL).toString();
+    const call: FetchCall = { url, init: init ?? {} };
+    calls.push(call);
+    const responder = responders[n++] ?? responders[responders.length - 1];
+    return Promise.resolve(responder(call));
+  };
+  return { fetchImpl, calls };
+}
+
+function jsonResponse(body: unknown, headers: Record<string, string> = {}) {
+  return new Response(JSON.stringify(body), {
+    status: 200,
+    headers: { "content-type": "application/json", ...headers },
+  });
+}
+
+describe("AppKitMcpClient — host allowlist", () => {
+  let authSpy: ReturnType<typeof vi.fn>;
+
+  beforeEach(() => {
+    authSpy = vi.fn(workspaceAuth);
+  });
+
+  test("connect rejects a URL whose host is not allowlisted without making any fetch", async () => {
+    const { fetchImpl, calls } = recordingFetch([() => jsonResponse({})]);
+    const client = new AppKitMcpClient(WORKSPACE, authSpy, workspacePolicy, {
+      fetchImpl,
+      dnsLookup: publicDnsLookup,
+    });
+    await expect(
+      client.connect({ name: "evil", url: "https://attacker.example.com/mcp" }),
+    ).rejects.toThrow(/attacker\.example\.com/);
+    expect(calls).toHaveLength(0);
+    expect(authSpy).not.toHaveBeenCalled();
+  });
+
+  test("connect rejects plaintext http:// for remote hosts", async () => {
+    const { fetchImpl, calls } = recordingFetch([() => jsonResponse({})]);
+    const client = new AppKitMcpClient(
+      WORKSPACE,
+      authSpy,
+      trustedExternalPolicy,
+      { fetchImpl, dnsLookup: publicDnsLookup },
+    );
+    await expect(
+      client.connect({ name: "plain", url: "http://mcp.example.com/mcp" }),
+    ).rejects.toThrow(/plaintext http/);
+    expect(calls).toHaveLength(0);
+    expect(authSpy).not.toHaveBeenCalled();
+  });
+
+  test("connect rejects a URL whose DNS resolves to a blocked IP and never sends SP token", async () => {
+    const ssrfLookup: DnsLookup = async () => [
+      { address: "169.254.169.254", family: 4 },
+    ];
+    const policy: McpHostPolicy = {
+      workspaceHostname: "test-workspace.cloud.databricks.com",
+      trustedHosts: new Set(["evil.example.com"]),
+      allowLocalhost: false,
+    };
+    const { fetchImpl, calls } = recordingFetch([() => jsonResponse({})]);
+    const client = new AppKitMcpClient(WORKSPACE, authSpy, policy, {
+      fetchImpl,
+      dnsLookup: ssrfLookup,
+    });
+    await expect(
+      client.connect({ name: "evil", url: "https://evil.example.com/mcp" }),
+    ).rejects.toThrow(/169\.254\.169\.254/);
+    expect(calls).toHaveLength(0);
+    expect(authSpy).not.toHaveBeenCalled();
+  });
+
+  test("connect to same-origin workspace forwards SP token on initialize + tools/list", async () => {
+    const { fetchImpl, calls } = recordingFetch([
+      () =>
+        jsonResponse(
+          { jsonrpc: "2.0", id: 1, result: {} },
+          {
+            "mcp-session-id": "sess-1",
+          },
+        ),
+      () => jsonResponse({ jsonrpc: "2.0", result: null }),
+      () =>
+        jsonResponse({
+          jsonrpc: "2.0",
+          id: 3,
+          result: { tools: [{ name: "echo", description: "Echo" }] },
+        }),
+    ]);
+    const client = new AppKitMcpClient(WORKSPACE, authSpy, workspacePolicy, {
+      fetchImpl,
+      dnsLookup: publicDnsLookup,
+    });
+
+    await client.connect({
+      name: "genie-1",
+      url: `${WORKSPACE}/api/2.0/mcp/genie/abc`,
+    });
+
+    // initialize + notifications/initialized + tools/list all carry SP token
+    expect(calls.map((c) => c.url)).toEqual([
+      `${WORKSPACE}/api/2.0/mcp/genie/abc`,
+      `${WORKSPACE}/api/2.0/mcp/genie/abc`,
+      `${WORKSPACE}/api/2.0/mcp/genie/abc`,
+    ]);
+    for (const call of calls) {
+      const headers = call.init.headers as Record<string, string>;
+      expect(headers.Authorization).toBe("Bearer SP-TOKEN");
+    }
+    expect(client.canForwardWorkspaceAuth("genie-1")).toBe(true);
+  });
+
+  test("connect to trusted external host does NOT forward SP token on any RPC", async () => {
+    const { fetchImpl, calls } = recordingFetch([
+      () =>
+        jsonResponse(
+          { jsonrpc: "2.0", id: 1, result: {} },
+          {
+            "mcp-session-id": "sess-1",
+          },
+        ),
+      () => jsonResponse({ jsonrpc: "2.0", result: null }),
+      () =>
+        jsonResponse({
+          jsonrpc: "2.0",
+          id: 3,
+          result: { tools: [{ name: "help" }] },
+        }),
+    ]);
+    const client = new AppKitMcpClient(
+      WORKSPACE,
+      authSpy,
+      trustedExternalPolicy,
+      { fetchImpl, dnsLookup: publicDnsLookup },
+    );
+
+    await client.connect({ name: "ext", url: "https://mcp.example.com/mcp" });
+
+    for (const call of calls) {
+      const headers = call.init.headers as Record<string, string>;
+      expect(headers.Authorization).toBeUndefined();
+    }
+    expect(authSpy).not.toHaveBeenCalled();
+    expect(client.canForwardWorkspaceAuth("ext")).toBe(false);
+  });
+});
+
+describe("AppKitMcpClient — callTool auth scoping", () => {
+  test("drops caller-supplied OBO token when destination is not workspace-origin", async () => {
+    const connectResponders = [
+      () =>
+        jsonResponse(
+          { jsonrpc: "2.0", id: 1, result: {} },
+          {
+            "mcp-session-id": "sess-1",
+          },
+        ),
+      () => jsonResponse({ jsonrpc: "2.0", result: null }),
+      () =>
+        jsonResponse({
+          jsonrpc: "2.0",
+          id: 3,
+          result: { tools: [{ name: "do" }] },
+        }),
+    ];
+    const callResponder = () =>
+      jsonResponse({
+        jsonrpc: "2.0",
+        id: 4,
+        result: { content: [{ type: "text", text: "ok" }] },
+      });
+    const { fetchImpl, calls } = recordingFetch([
+      ...connectResponders,
+      callResponder,
+    ]);
+    const client = new AppKitMcpClient(
+      WORKSPACE,
+      workspaceAuth,
+      trustedExternalPolicy,
+      { fetchImpl, dnsLookup: publicDnsLookup },
+    );
+    await client.connect({ name: "ext", url: "https://mcp.example.com/mcp" });
+
+    const output = await client.callTool(
+      "mcp.ext.do",
+      { x: 1 },
+      {
+        Authorization: "Bearer OBO-USER-TOKEN",
+      },
+    );
+    expect(output).toBe("ok");
+
+    const toolCall = calls[calls.length - 1];
+    const headers = toolCall.init.headers as Record<string, string>;
+    expect(headers.Authorization).toBeUndefined();
+  });
+
+  test("forwards caller-supplied OBO token when destination is workspace-origin", async () => {
+    const connectResponders = [
+      () =>
+        jsonResponse(
+          { jsonrpc: "2.0", id: 1, result: {} },
+          {
+            "mcp-session-id": "sess-1",
+          },
+        ),
+      () => jsonResponse({ jsonrpc: "2.0", result: null }),
+      () =>
+        jsonResponse({
+          jsonrpc: "2.0",
+          id: 3,
+          result: { tools: [{ name: "do" }] },
+        }),
+    ];
+    const callResponder = () =>
+      jsonResponse({
+        jsonrpc: "2.0",
+        id: 4,
+        result: { content: [{ type: "text", text: "ok" }] },
+      });
+    const { fetchImpl, calls } = recordingFetch([
+      ...connectResponders,
+      callResponder,
+    ]);
+    const client = new AppKitMcpClient(
+      WORKSPACE,
+      workspaceAuth,
+      workspacePolicy,
+      {
+        fetchImpl,
+        dnsLookup: publicDnsLookup,
+      },
+    );
+    await client.connect({
+      name: "genie-1",
+      url: `${WORKSPACE}/api/2.0/mcp/genie/abc`,
+    });
+
+    await client.callTool(
+      "mcp.genie-1.do",
+      {},
+      {
+        Authorization: "Bearer OBO-USER-TOKEN",
+      },
+    );
+
+    const toolCall = calls[calls.length - 1];
+    const headers = toolCall.init.headers as Record<string, string>;
+    expect(headers.Authorization).toBe("Bearer OBO-USER-TOKEN");
+  });
+
+  test("falls back to SP auth when no OBO override is provided and destination is workspace", async () => {
+    const authSpy = vi.fn(workspaceAuth);
+    const connectResponders = [
+      () =>
+        jsonResponse(
+          { jsonrpc: "2.0", id: 1, result: {} },
+          {
+            "mcp-session-id": "sess-1",
+          },
+        ),
+      () => jsonResponse({ jsonrpc: "2.0", result: null }),
+      () =>
+        jsonResponse({
+          jsonrpc: "2.0",
+          id: 3,
+          result: { tools: [{ name: "do" }] },
+        }),
+    ];
+    const callResponder = () =>
+      jsonResponse({
+        jsonrpc: "2.0",
+        id: 4,
+        result: { content: [{ type: "text", text: "ok" }] },
+      });
+    const { fetchImpl, calls } = recordingFetch([
+      ...connectResponders,
+      callResponder,
+    ]);
+    const client = new AppKitMcpClient(WORKSPACE, authSpy, workspacePolicy, {
+      fetchImpl,
+      dnsLookup: publicDnsLookup,
+    });
+    await client.connect({
+      name: "genie-1",
+      url: `${WORKSPACE}/api/2.0/mcp/genie/abc`,
+    });
+
+    await client.callTool("mcp.genie-1.do", {}, undefined);
+
+    const toolCall = calls[calls.length - 1];
+    const headers = toolCall.init.headers as Record<string, string>;
+    expect(headers.Authorization).toBe("Bearer SP-TOKEN");
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tests/mcp-host-policy.test.ts b/packages/appkit/src/plugins/agents/tests/mcp-host-policy.test.ts
new file mode 100644
index 00000000..8e8453bf
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tests/mcp-host-policy.test.ts
@@ -0,0 +1,324 @@
+import { describe, expect, test, vi } from "vitest";
+import {
+  assertResolvedHostSafe,
+  buildMcpHostPolicy,
+  checkMcpUrl,
+  type DnsLookup,
+  isBlockedIp,
+  isLoopbackHost,
+  type McpHostPolicy,
+} from "../tools/mcp-host-policy";
+
+function stubLookup(
+  addresses: Array<{ address: string; family?: number }>,
+): DnsLookup {
+  return vi
+    .fn<DnsLookup>()
+    .mockResolvedValue(addresses.map((a) => ({ family: 4, ...a })));
+}
+
+function failingLookup(message: string): DnsLookup {
+  return vi.fn<DnsLookup>().mockRejectedValue(new Error(message));
+}
+
+const WORKSPACE = "https://test-workspace.cloud.databricks.com";
+
+function policy(overrides: Partial<McpHostPolicy> = {}): McpHostPolicy {
+  return {
+    workspaceHostname: "test-workspace.cloud.databricks.com",
+    trustedHosts: new Set<string>(),
+    allowLocalhost: false,
+    ...overrides,
+  };
+}
+
+describe("buildMcpHostPolicy", () => {
+  test("extracts hostname from workspace URL", () => {
+    const p = buildMcpHostPolicy(undefined, WORKSPACE);
+    expect(p.workspaceHostname).toBe("test-workspace.cloud.databricks.com");
+  });
+
+  test("lowercases and trims trustedHosts", () => {
+    const p = buildMcpHostPolicy(
+      { trustedHosts: ["Example.COM", " corp.internal ", "mcp.example.com"] },
+      WORKSPACE,
+    );
+    expect(p.trustedHosts).toEqual(
+      new Set(["example.com", "corp.internal", "mcp.example.com"]),
+    );
+  });
+
+  test("allowLocalhost defaults to false in production", () => {
+    const prev = process.env.NODE_ENV;
+    process.env.NODE_ENV = "production";
+    try {
+      const p = buildMcpHostPolicy(undefined, WORKSPACE);
+      expect(p.allowLocalhost).toBe(false);
+    } finally {
+      process.env.NODE_ENV = prev;
+    }
+  });
+
+  test("allowLocalhost defaults to true outside production", () => {
+    const prev = process.env.NODE_ENV;
+    process.env.NODE_ENV = "development";
+    try {
+      const p = buildMcpHostPolicy(undefined, WORKSPACE);
+      expect(p.allowLocalhost).toBe(true);
+    } finally {
+      process.env.NODE_ENV = prev;
+    }
+  });
+
+  test("allowLocalhost respects explicit override", () => {
+    const prev = process.env.NODE_ENV;
+    process.env.NODE_ENV = "production";
+    try {
+      const p = buildMcpHostPolicy({ allowLocalhost: true }, WORKSPACE);
+      expect(p.allowLocalhost).toBe(true);
+    } finally {
+      process.env.NODE_ENV = prev;
+    }
+  });
+
+  test("throws on invalid workspace host", () => {
+    expect(() => buildMcpHostPolicy(undefined, "not-a-url")).toThrow(
+      /Invalid workspace host/,
+    );
+  });
+});
+
+describe("checkMcpUrl", () => {
+  test("admits same-origin workspace https URL and forwards auth", () => {
+    const result = checkMcpUrl(`${WORKSPACE}/api/2.0/mcp/genie/abc`, policy());
+    expect(result.ok).toBe(true);
+    if (result.ok) expect(result.forwardWorkspaceAuth).toBe(true);
+  });
+
+  test("admits trusted host but does NOT forward workspace auth", () => {
+    const p = policy({ trustedHosts: new Set(["mcp.example.com"]) });
+    const result = checkMcpUrl("https://mcp.example.com/mcp", p);
+    expect(result.ok).toBe(true);
+    if (result.ok) expect(result.forwardWorkspaceAuth).toBe(false);
+  });
+
+  test("rejects host that is neither workspace nor trusted", () => {
+    const result = checkMcpUrl("https://attacker.example.com/mcp", policy());
+    expect(result.ok).toBe(false);
+    if (!result.ok) {
+      expect(result.reason).toMatch(/attacker\.example\.com/);
+      expect(result.reason).toMatch(/trustedHosts/);
+    }
+  });
+
+  test("rejects plaintext http:// for remote hosts even when trusted", () => {
+    const p = policy({ trustedHosts: new Set(["mcp.example.com"]) });
+    const result = checkMcpUrl("http://mcp.example.com/mcp", p);
+    expect(result.ok).toBe(false);
+    if (!result.ok) expect(result.reason).toMatch(/plaintext http/);
+  });
+
+  test("rejects plaintext http://localhost when allowLocalhost is false", () => {
+    const result = checkMcpUrl("http://localhost:4000/mcp", policy());
+    expect(result.ok).toBe(false);
+  });
+
+  test("admits http://localhost when allowLocalhost is true, no workspace auth", () => {
+    const p = policy({ allowLocalhost: true });
+    const result = checkMcpUrl("http://localhost:4000/mcp", p);
+    expect(result.ok).toBe(true);
+    if (result.ok) expect(result.forwardWorkspaceAuth).toBe(false);
+  });
+
+  test("admits http://127.0.0.1 when allowLocalhost is true", () => {
+    const p = policy({ allowLocalhost: true });
+    const result = checkMcpUrl("http://127.0.0.1:4000/mcp", p);
+    expect(result.ok).toBe(true);
+    if (result.ok) expect(result.forwardWorkspaceAuth).toBe(false);
+  });
+
+  test("rejects non-http(s) schemes", () => {
+    for (const url of [
+      "file:///etc/passwd",
+      "ftp://host/x",
+      "gopher://host/x",
+      "javascript:alert(1)",
+    ]) {
+      const result = checkMcpUrl(url, policy());
+      expect(result.ok).toBe(false);
+    }
+  });
+
+  test("rejects obviously invalid URLs", () => {
+    const result = checkMcpUrl("not-a-url", policy());
+    expect(result.ok).toBe(false);
+  });
+
+  test("hostname comparison is case-insensitive", () => {
+    const result = checkMcpUrl(
+      "https://TEST-Workspace.CLOUD.Databricks.com/mcp",
+      policy(),
+    );
+    expect(result.ok).toBe(true);
+    if (result.ok) expect(result.forwardWorkspaceAuth).toBe(true);
+  });
+
+  test("rejects same hostname on different scheme (http) even for workspace", () => {
+    const result = checkMcpUrl(
+      "http://test-workspace.cloud.databricks.com/mcp",
+      policy(),
+    );
+    expect(result.ok).toBe(false);
+  });
+});
+
+describe("isBlockedIp", () => {
+  test("blocks RFC1918 IPv4 ranges", () => {
+    for (const addr of [
+      "10.0.0.1",
+      "10.255.255.255",
+      "172.16.0.1",
+      "172.31.255.255",
+      "192.168.0.1",
+      "192.168.255.255",
+    ]) {
+      expect(isBlockedIp(addr, true)).toBe(true);
+    }
+  });
+
+  test("blocks link-local 169.254.0.0/16 (covers cloud metadata 169.254.169.254)", () => {
+    expect(isBlockedIp("169.254.169.254", true)).toBe(true);
+    expect(isBlockedIp("169.254.0.1", true)).toBe(true);
+  });
+
+  test("blocks CGNAT 100.64.0.0/10", () => {
+    expect(isBlockedIp("100.64.0.1", true)).toBe(true);
+    expect(isBlockedIp("100.127.255.255", true)).toBe(true);
+  });
+
+  test("blocks 0.0.0.0/8 and multicast/reserved (>= 224.0.0.0)", () => {
+    expect(isBlockedIp("0.0.0.0", true)).toBe(true);
+    expect(isBlockedIp("0.1.2.3", true)).toBe(true);
+    expect(isBlockedIp("224.0.0.1", true)).toBe(true);
+    expect(isBlockedIp("255.255.255.255", true)).toBe(true);
+  });
+
+  test("blocks loopback when allowLocalhost is false", () => {
+    expect(isBlockedIp("127.0.0.1", false)).toBe(true);
+    expect(isBlockedIp("127.1.2.3", false)).toBe(true);
+    expect(isBlockedIp("::1", false)).toBe(true);
+  });
+
+  test("permits loopback when allowLocalhost is true", () => {
+    expect(isBlockedIp("127.0.0.1", true)).toBe(false);
+    expect(isBlockedIp("::1", true)).toBe(false);
+  });
+
+  test("blocks ULA (fc00::/7) and link-local (fe80::/10) IPv6", () => {
+    expect(isBlockedIp("fc00::1", true)).toBe(true);
+    expect(isBlockedIp("fd00::1", true)).toBe(true);
+    expect(isBlockedIp("fe80::1", true)).toBe(true);
+  });
+
+  test("blocks IPv4-mapped IPv6 addresses in blocked ranges", () => {
+    expect(isBlockedIp("::ffff:169.254.169.254", true)).toBe(true);
+    expect(isBlockedIp("::ffff:10.0.0.1", true)).toBe(true);
+  });
+
+  test("allows public IPv4 and IPv6 addresses", () => {
+    expect(isBlockedIp("8.8.8.8", false)).toBe(false);
+    expect(isBlockedIp("1.1.1.1", false)).toBe(false);
+    expect(isBlockedIp("2001:4860:4860::8888", false)).toBe(false);
+  });
+
+  test("treats malformed IP strings as blocked (fail-closed)", () => {
+    expect(isBlockedIp("10.0.0", true)).toBe(true);
+    expect(isBlockedIp("abc.def.ghi.jkl", true)).toBe(true);
+  });
+});
+
+describe("isLoopbackHost", () => {
+  test.each([
+    "localhost",
+    "LOCALHOST",
+    "127.0.0.1",
+    "::1",
+    "[::1]",
+    "0:0:0:0:0:0:0:1",
+  ])("recognises %s as loopback", (host) => {
+    expect(isLoopbackHost(host)).toBe(true);
+  });
+
+  test("does not match other hosts", () => {
+    expect(isLoopbackHost("example.com")).toBe(false);
+    expect(isLoopbackHost("10.0.0.1")).toBe(false);
+  });
+});
+
+describe("assertResolvedHostSafe", () => {
+  test("passes workspace hostname when resolved address is public", async () => {
+    const lookup = stubLookup([{ address: "203.0.113.42" }]);
+    await expect(
+      assertResolvedHostSafe(
+        "test-workspace.cloud.databricks.com",
+        policy(),
+        lookup,
+      ),
+    ).resolves.toBeUndefined();
+    expect(lookup).toHaveBeenCalledWith("test-workspace.cloud.databricks.com", {
+      all: true,
+    });
+  });
+
+  test("rejects hostname that resolves to link-local cloud metadata IP", async () => {
+    const lookup = stubLookup([{ address: "169.254.169.254" }]);
+    await expect(
+      assertResolvedHostSafe("evil.example.com", policy(), lookup),
+    ).rejects.toThrow(/169\.254\.169\.254/);
+  });
+
+  test("rejects hostname that resolves to RFC1918 IP", async () => {
+    const lookup = stubLookup([{ address: "10.0.0.1" }]);
+    await expect(
+      assertResolvedHostSafe("internal.example.com", policy(), lookup),
+    ).rejects.toThrow(/10\.0\.0\.1/);
+  });
+
+  test("rejects IP literal in blocked range without DNS lookup", async () => {
+    const lookup = stubLookup([{ address: "8.8.8.8" }]);
+    await expect(
+      assertResolvedHostSafe("169.254.169.254", policy(), lookup),
+    ).rejects.toThrow(/blocked IP range/);
+    expect(lookup).not.toHaveBeenCalled();
+  });
+
+  test("rejects plain 'localhost' when allowLocalhost is false", async () => {
+    await expect(assertResolvedHostSafe("localhost", policy())).rejects.toThrow(
+      /localhost is not allowed/,
+    );
+  });
+
+  test("surfaces DNS resolution failures", async () => {
+    const lookup = failingLookup("ENOTFOUND");
+    await expect(
+      assertResolvedHostSafe("nonexistent.example.com", policy(), lookup),
+    ).rejects.toThrow(/could not be resolved/);
+  });
+
+  test("rejects if any resolved address is blocked (defense against split DNS)", async () => {
+    const lookup = stubLookup([
+      { address: "8.8.8.8" },
+      { address: "169.254.169.254" },
+    ]);
+    await expect(
+      assertResolvedHostSafe("mixed.example.com", policy(), lookup),
+    ).rejects.toThrow(/169\.254\.169\.254/);
+  });
+
+  test("rejects hostname that resolves to empty DNS result", async () => {
+    const lookup = stubLookup([]);
+    await expect(
+      assertResolvedHostSafe("empty.example.com", policy(), lookup),
+    ).rejects.toThrow(/no DNS addresses/);
+  });
+});
diff --git a/packages/appkit/src/plugins/agents/tools/json-schema.ts b/packages/appkit/src/plugins/agents/tools/json-schema.ts
index 805fd48f..c5c10dbf 100644
--- a/packages/appkit/src/plugins/agents/tools/json-schema.ts
+++ b/packages/appkit/src/plugins/agents/tools/json-schema.ts
@@ -13,9 +13,7 @@ import { toJSONSchema, type z } from "zod";
  * providers either ignore the field or also trip on it, so stripping here is
  * safe across backends.
  */
-export function toToolJSONSchema(
-  schema: z.ZodType,
-): Record<string, unknown> {
+export function toToolJSONSchema(schema: z.ZodType): Record<string, unknown> {
   const raw = toJSONSchema(schema) as Record<string, unknown>;
   const { $schema: _ignored, ...rest } = raw;
   return rest;
diff --git a/packages/appkit/src/plugins/agents/tools/mcp-client.ts b/packages/appkit/src/plugins/agents/tools/mcp-client.ts
index bd96d348..8402f3bb 100644
--- a/packages/appkit/src/plugins/agents/tools/mcp-client.ts
+++ b/packages/appkit/src/plugins/agents/tools/mcp-client.ts
@@ -1,6 +1,12 @@
 import type { AgentToolDefinition } from "shared";
 import { createLogger } from "../../../logging/logger";
 import type { McpEndpointConfig } from "./hosted-tools";
+import {
+  assertResolvedHostSafe,
+  checkMcpUrl,
+  type DnsLookup,
+  type McpHostPolicy,
+} from "./mcp-host-policy";
 
 const logger = createLogger("agent:mcp");
 
@@ -32,6 +38,12 @@ interface McpToolCallResult {
 interface McpServerConnection {
   config: McpEndpointConfig;
   resolvedUrl: string;
+  /**
+   * Whether workspace auth (SP / OBO) may be forwarded to this endpoint's URL.
+   * Decided at `connect()` time via {@link McpHostPolicy} and cached for the
+   * lifetime of the connection.
+   */
+  forwardWorkspaceAuth: boolean;
   tools: Map<string, McpToolSchema>;
 }
 
@@ -41,6 +53,10 @@ interface McpServerConnection {
  * Uses raw fetch() with JSON-RPC 2.0 over HTTP — no @modelcontextprotocol/sdk
  * or LangChain dependency. Supports the Streamable HTTP transport (POST with
  * JSON-RPC request, single JSON-RPC response).
+ *
+ * Endpoint URLs are vetted by an {@link McpHostPolicy} in `connect()`: hosts
+ * off the allowlist are rejected before any request is sent, and workspace
+ * credentials go only to the same-origin workspace. See `mcp-host-policy.ts`.
  */
 export class AppKitMcpClient {
   private connections = new Map<string, McpServerConnection>();
@@ -51,6 +67,8 @@ export class AppKitMcpClient {
   constructor(
     private workspaceHost: string,
     private authenticate: () => Promise<Record<string, string>>,
+    private policy: McpHostPolicy,
+    private options: { dnsLookup?: DnsLookup; fetchImpl?: typeof fetch } = {},
   ) {}
 
   async connectAll(endpoints: McpEndpointConfig[]): Promise<void> {
@@ -79,27 +97,52 @@ export class AppKitMcpClient {
   }
 
   async connect(endpoint: McpEndpointConfig): Promise<void> {
-    const url = this.resolveUrl(endpoint);
-    logger.info("Connecting to MCP server: %s at %s", endpoint.name, url);
+    const resolvedUrl = this.resolveUrl(endpoint);
+    const check = checkMcpUrl(resolvedUrl, this.policy);
+    if (!check.ok) {
+      throw new Error(
+        `MCP endpoint '${endpoint.name}' refused at connect: ${check.reason}`,
+      );
+    }
+    await assertResolvedHostSafe(
+      check.url.hostname,
+      this.policy,
+      this.options.dnsLookup,
+    );
 
-    const initResponse = await this.sendRpc(url, "initialize", {
-      protocolVersion: "2025-03-26",
-      capabilities: {},
-      clientInfo: { name: "appkit-agent", version: "0.1.0" },
-    });
+    logger.info(
+      "Connecting to MCP server: %s at %s (forwardWorkspaceAuth=%s)",
+      endpoint.name,
+      resolvedUrl,
+      check.forwardWorkspaceAuth,
+    );
+
+    const initResponse = await this.sendRpc(
+      resolvedUrl,
+      "initialize",
+      {
+        protocolVersion: "2025-03-26",
+        capabilities: {},
+        clientInfo: { name: "appkit-agent", version: "0.1.0" },
+      },
+      { forwardWorkspaceAuth: check.forwardWorkspaceAuth },
+    );
 
     if (initResponse.sessionId) {
       this.sessionIds.set(endpoint.name, initResponse.sessionId);
     }
     const sessionId = this.sessionIds.get(endpoint.name);
 
-    await this.sendNotification(url, "notifications/initialized", sessionId);
+    await this.sendNotification(resolvedUrl, "notifications/initialized", {
+      sessionId,
+      forwardWorkspaceAuth: check.forwardWorkspaceAuth,
+    });
 
     const listResponse = await this.sendRpc(
-      url,
+      resolvedUrl,
       "tools/list",
       {},
-      { sessionId },
+      { sessionId, forwardWorkspaceAuth: check.forwardWorkspaceAuth },
     );
     const toolList =
       (listResponse.result as { tools?: McpToolSchema[] })?.tools ?? [];
@@ -111,7 +154,8 @@ export class AppKitMcpClient {
 
     this.connections.set(endpoint.name, {
       config: endpoint,
-      resolvedUrl: url,
+      resolvedUrl,
+      forwardWorkspaceAuth: check.forwardWorkspaceAuth,
       tools,
     });
     logger.info(
@@ -139,6 +183,16 @@ export class AppKitMcpClient {
     return defs;
   }
 
+  /**
+   * Whether the named MCP server may receive workspace-scoped auth headers
+   * (e.g., an OBO bearer token from an end-user request). Returns `false` for
+   * names with no registered connection. Callers should gate auth-forwarding
+   * decisions on this to avoid leaking credentials to non-workspace hosts.
+   */
+  canForwardWorkspaceAuth(serverName: string): boolean {
+    return this.connections.get(serverName)?.forwardWorkspaceAuth ?? false;
+  }
+
   async callTool(
     qualifiedName: string,
     args: unknown,
@@ -157,23 +211,34 @@ export class AppKitMcpClient {
     }
 
     const sessionId = this.sessionIds.get(serverName);
+    // authHeaders are caller-supplied credentials (typically the OBO token).
+    // Only honor them if the destination URL was admitted with
+    // forwardWorkspaceAuth=true at connect time.
+    const scopedAuthOverride = conn.forwardWorkspaceAuth
+      ? authHeaders
+      : undefined;
+
     const rpcResult = await this.sendRpc(
       conn.resolvedUrl,
       "tools/call",
       { name: toolName, arguments: args },
-      { authOverride: authHeaders, sessionId },
+      {
+        authOverride: scopedAuthOverride,
+        sessionId,
+        forwardWorkspaceAuth: conn.forwardWorkspaceAuth,
+      },
     );
     const result = rpcResult.result as McpToolCallResult;
 
     if (result.isError) {
-      const errText = result.content
+      const errText = (result.content ?? [])
         .filter((c) => c.type === "text")
         .map((c) => c.text)
         .join("\n");
       throw new Error(errText || "MCP tool call failed");
     }
 
-    return result.content
+    return (result.content ?? [])
       .filter((c) => c.type === "text")
       .map((c) => c.text)
       .join("\n");
@@ -182,6 +247,7 @@ export class AppKitMcpClient {
   async close(): Promise<void> {
     this.closed = true;
     this.connections.clear();
+    this.sessionIds.clear();
   }
 
   private async sendRpc(
@@ -191,6 +257,7 @@ export class AppKitMcpClient {
     options?: {
       authOverride?: Record<string, string>;
       sessionId?: string;
+      forwardWorkspaceAuth?: boolean;
     },
   ): Promise<{ result: unknown; sessionId?: string }> {
     if (this.closed) throw new Error("MCP client is closed");
@@ -202,7 +269,7 @@ export class AppKitMcpClient {
       ...(params && { params }),
     };
 
-    const authHeaders = options?.authOverride ?? (await this.authenticate());
+    const authHeaders = await this.resolveAuthHeaders(options);
     const headers: Record<string, string> = {
       "Content-Type": "application/json",
       Accept: "application/json, text/event-stream",
@@ -212,7 +279,8 @@ export class AppKitMcpClient {
       headers["Mcp-Session-Id"] = options.sessionId;
     }
 
-    const response = await fetch(url, {
+    const fetchImpl = this.options.fetchImpl ?? fetch;
+    const response = await fetchImpl(url, {
       method: "POST",
       headers,
       body: JSON.stringify(request),
@@ -254,25 +322,43 @@ export class AppKitMcpClient {
   private async sendNotification(
     url: string,
     method: string,
-    sessionId?: string,
+    options?: {
+      sessionId?: string;
+      forwardWorkspaceAuth?: boolean;
+    },
   ): Promise<void> {
     if (this.closed) return;
 
-    const authHeaders = await this.authenticate();
+    const authHeaders = await this.resolveAuthHeaders(options);
     const headers: Record<string, string> = {
       "Content-Type": "application/json",
       Accept: "application/json, text/event-stream",
       ...authHeaders,
     };
-    if (sessionId) {
-      headers["Mcp-Session-Id"] = sessionId;
+    if (options?.sessionId) {
+      headers["Mcp-Session-Id"] = options.sessionId;
     }
 
-    await fetch(url, {
+    const fetchImpl = this.options.fetchImpl ?? fetch;
+    await fetchImpl(url, {
       method: "POST",
       headers,
       body: JSON.stringify({ jsonrpc: "2.0", method }),
       signal: AbortSignal.timeout(30_000),
     });
   }
+
+  /**
+   * Auth headers for an outbound request. Returns `{}` (no credentials) unless
+   * `forwardWorkspaceAuth` is true; in that case a caller-supplied
+   * `authOverride` wins, otherwise the result of `authenticate()` is used.
+   */
+  private async resolveAuthHeaders(options?: {
+    authOverride?: Record<string, string>;
+    forwardWorkspaceAuth?: boolean;
+  }): Promise<Record<string, string>> {
+    if (!options?.forwardWorkspaceAuth) return {};
+    if (options.authOverride) return options.authOverride;
+    return this.authenticate();
+  }
 }
diff --git a/packages/appkit/src/plugins/agents/tools/mcp-host-policy.ts b/packages/appkit/src/plugins/agents/tools/mcp-host-policy.ts
new file mode 100644
index 00000000..462fd4ce
--- /dev/null
+++ b/packages/appkit/src/plugins/agents/tools/mcp-host-policy.ts
@@ -0,0 +1,270 @@
+import { lookup as defaultLookup } from "node:dns/promises";
+import { isIP, isIPv4 } from "node:net";
+
+/**
+ * Signature of a resolver that behaves like `dns/promises.lookup` called with
+ * `{ all: true }`. It is a parameter of {@link assertResolvedHostSafe} so that
+ * tests and custom resolvers can stand in for the default lookup.
+ */
+export type DnsLookup = (
+  hostname: string,
+  options: { all: true },
+) => Promise<{ address: string; family: number }[]>;
+
+/**
+ * Policy that decides whether a given MCP endpoint URL is allowed and whether
+ * Databricks workspace credentials (SP or OBO) may be forwarded to it.
+ *
+ * The default posture is zero-trust: only URLs whose hostname equals the
+ * workspace hostname receive workspace credentials; every other destination
+ * must be explicitly allowlisted by the application developer. Private and
+ * link-local IP ranges are rejected to prevent SSRF into metadata services.
+ */
+export interface McpHostPolicy {
+  /** Lowercased hostname of the Databricks workspace; URLs are matched against it by hostname only. */
+  readonly workspaceHostname: string;
+  /** Additional allowlisted hostnames (lowercased). Workspace auth is not forwarded to hosts accepted through this set. */
+  readonly trustedHosts: ReadonlySet<string>;
+  /** Permit `http://localhost`, `127.0.0.1`, `::1` URLs. Typically true only in development. */
+  readonly allowLocalhost: boolean;
+}
+
+/**
+ * Config shape accepted by {@link buildMcpHostPolicy}, matching the
+ * `mcp` field on `AgentsPluginConfig`.
+ */
+export interface McpHostPolicyConfig {
+  /**
+   * Additional hostnames that may host custom MCP servers beyond the workspace
+   * itself. Entries are trimmed and lowercased, then compared with the URL's
+   * hostname, so use bare hostnames (no scheme, port or path). Workspace
+   * credentials (SP / OBO) are not forwarded to hosts admitted this way.
+   */
+  trustedHosts?: string[];
+  /**
+   * Allow `http://localhost`, `127.0.0.1`, and `::1` MCP URLs for local
+   * development. Defaults to `true` when `NODE_ENV !== "production"`, otherwise
+   * `false`. Workspace credentials are not forwarded to URLs accepted as localhost.
+   */
+  allowLocalhost?: boolean;
+}
+
+/** Normalise the optional `mcp` config and the workspace URL into an {@link McpHostPolicy}; throws when the URL yields no hostname. */
+export function buildMcpHostPolicy(
+  config: McpHostPolicyConfig | undefined,
+  workspaceHost: string,
+): McpHostPolicy {
+  const workspaceHostname = safeHostname(workspaceHost);
+  if (!workspaceHostname) {
+    const shown = JSON.stringify(workspaceHost);
+    throw new Error(`Invalid workspace host for MCP policy: ${shown}`);
+  }
+  const trustedHosts = new Set<string>();
+  for (const entry of config?.trustedHosts ?? []) {
+    trustedHosts.add(entry.trim().toLowerCase());
+  }
+  const outsideProduction = process.env.NODE_ENV !== "production";
+  const allowLocalhost = config?.allowLocalhost ?? outsideProduction;
+  return { workspaceHostname, trustedHosts, allowLocalhost };
+}
+
+type McpUrlCheck =
+  | {
+      readonly ok: true;
+      /** Whether workspace-scoped credentials (SP/OBO) may be sent to this URL; `checkMcpUrl` sets it only for the workspace hostname. */
+      readonly forwardWorkspaceAuth: boolean;
+      /** The `URL` parsed from the raw string, returned so the caller can reuse it. */
+      readonly url: URL;
+    }
+  | { readonly ok: false; readonly reason: string };
+
+/**
+ * Decide, without any I/O, whether `rawUrl` may be used as an MCP endpoint
+ * under `policy` and whether workspace credentials may be sent along.
+ *
+ * Rejected outright:
+ * - Strings that are not absolute URLs, and schemes other than `http(s)`.
+ * - `http://` unless the host is a loopback alias AND `allowLocalhost` is set.
+ * - Hosts that are neither the workspace hostname, an allowed loopback alias,
+ *   nor a member of `trustedHosts`.
+ *
+ * Only a match on the workspace hostname yields `forwardWorkspaceAuth: true`;
+ * loopback and trusted hosts are accepted with it set to `false`.
+ */
+export function checkMcpUrl(
+  rawUrl: string,
+  policy: McpHostPolicy,
+): McpUrlCheck {
+  const reject = (reason: string): McpUrlCheck => ({ ok: false, reason });
+
+  let url: URL;
+  try {
+    url = new URL(rawUrl);
+  } catch {
+    return reject(`MCP URL is not a valid absolute URL: ${rawUrl}`);
+  }
+
+  const isPlainHttp = url.protocol === "http:";
+  if (!isPlainHttp && url.protocol !== "https:") {
+    return reject(
+      `MCP URL scheme '${url.protocol}' is not allowed (http(s) only): ${rawUrl}`,
+    );
+  }
+
+  const host = url.hostname.toLowerCase();
+  const loopback = isLoopbackHost(host);
+  const loopbackPermitted = loopback && policy.allowLocalhost;
+
+  // Plaintext is tolerated only for a permitted loopback dev server.
+  if (isPlainHttp && !loopbackPermitted) {
+    return reject(
+      `MCP URL uses plaintext http:// which forwards bearer tokens in cleartext: ${rawUrl}. Use https:// or enable allowLocalhost for a localhost dev server.`,
+    );
+  }
+
+  // Tested before the loopback and trustedHosts branches, so a workspace match
+  // takes precedence and is the only outcome that forwards credentials.
+  if (host === policy.workspaceHostname) {
+    return { ok: true, forwardWorkspaceAuth: true, url };
+  }
+
+  if (loopback && !policy.allowLocalhost) {
+    return reject(
+      `MCP URL points to localhost but allowLocalhost is disabled: ${rawUrl}`,
+    );
+  }
+
+  if (loopback || policy.trustedHosts.has(host)) {
+    return { ok: true, forwardWorkspaceAuth: false, url };
+  }
+
+  return reject(
+    `MCP host '${host}' is not allowed. Either use a same-origin workspace URL (${policy.workspaceHostname}) or add it to agents({ mcp: { trustedHosts: ['${host}'] } }).`,
+  );
+}
+
+/**
+ * Resolve `hostname` via DNS and assert that none of its addresses fall in a
+ * blocked IP range (loopback, RFC1918, link-local, CGNAT, cloud metadata).
+ * IP literals, bare or bracketed like `[::1]`, are checked without a lookup.
+ *
+ * Throws with a descriptive error if any resolved address is blocked. Pass
+ * `allowLocalhost: true` to permit `127.0.0.1` / `::1` specifically.
+ *
+ * Note: this is not a DNS-rebinding defense; that requires socket-level IP
+ * pinning after resolution, which is out of scope here.
+ */
+export async function assertResolvedHostSafe(
+  hostname: string,
+  policy: McpHostPolicy,
+  lookup: DnsLookup = defaultLookup,
+): Promise<void> {
+  // `URL.hostname` wraps IPv6 literals in brackets, which `isIP` and DNS reject.
+  const lowered = hostname.toLowerCase().replace(/^\[(.*)\]$/, "$1");
+  if (isIP(lowered)) {
+    if (isBlockedIp(lowered, policy.allowLocalhost)) {
+      throw new Error(`MCP host ${lowered} is in a blocked IP range`);
+    }
+    return;
+  }
+
+  if (lowered === "localhost") {
+    if (!policy.allowLocalhost) {
+      throw new Error(
+        `MCP host localhost is not allowed under the current policy`,
+      );
+    }
+    return;
+  }
+
+  let resolved: Array<{ address: string }>;
+  try {
+    resolved = await lookup(hostname, { all: true });
+  } catch (cause) {
+    throw new Error(
+      `MCP host ${hostname} could not be resolved via DNS: ${cause instanceof Error ? cause.message : String(cause)}`,
+    );
+  }
+
+  if (resolved.length === 0) {
+    throw new Error(`MCP host ${hostname} returned no DNS addresses`);
+  }
+
+  for (const { address } of resolved) {
+    if (isBlockedIp(address, policy.allowLocalhost)) {
+      throw new Error(
+        `MCP host ${hostname} resolved to blocked address ${address} (private / link-local ranges are not allowed)`,
+      );
+    }
+  }
+}
+
+/** Report whether `host`, compared case-insensitively, is one of the loopback spellings this module recognises. */
+export function isLoopbackHost(host: string): boolean {
+  const aliases = [
+    "localhost",
+    "127.0.0.1",
+    "::1",
+    "[::1]",
+    "0:0:0:0:0:0:0:1",
+  ];
+  return aliases.includes(host.toLowerCase());
+}
+
+/**
+ * Tell whether `address` must be refused. IP literals go through the per-family
+ * rules (`allowLocalhost` exempts loopback); any other string is blocked.
+ */
+export function isBlockedIp(address: string, allowLocalhost: boolean): boolean {
+  switch (isIP(address)) {
+    case 4:
+      return isBlockedIpv4(address, allowLocalhost);
+    case 6:
+      return isBlockedIpv6(address, allowLocalhost);
+    default:
+      return true;
+  }
+}
+
+/** IPv4 rules: malformed input and the ranges listed below are blocked; 127.0.0.0/8 is blocked unless `allowLocalhost`. */
+function isBlockedIpv4(addr: string, allowLocalhost: boolean): boolean {
+  const octets = addr.split(".").map((part) => Number.parseInt(part, 10));
+  if (octets.length !== 4 || !octets.every(Number.isFinite)) return true;
+  const [first, second] = octets;
+  if (first === 127) return !allowLocalhost;
+  return (
+    first === 0 || // 0.0.0.0/8
+    first === 10 || // 10.0.0.0/8
+    (first === 172 && second >= 16 && second <= 31) || // 172.16.0.0/12
+    (first === 192 && second === 168) || // 192.168.0.0/16
+    (first === 169 && second === 254) || // 169.254.0.0/16 (link-local)
+    (first === 100 && second >= 64 && second <= 127) || // 100.64.0.0/10 (CGNAT)
+    first >= 224 // 224.0.0.0 and above
+  );
+}
+
+/** IPv6 rules: `::`, fc00::/7, fe80::/10, fec0::/10 and ff-prefixed addresses are blocked, `::1` unless `allowLocalhost`; IPv4-mapped addresses follow the IPv4 rules. */
+function isBlockedIpv6(addr: string, allowLocalhost: boolean): boolean {
+  const lowered = addr.toLowerCase().replace(/^\[|\]$/g, "");
+  if (lowered === "::") return true;
+  if (lowered === "::1" || lowered === "0:0:0:0:0:0:0:1")
+    return !allowLocalhost;
+  // URL parsing serialises ::ffff:127.0.0.1 as ::ffff:7f00:1, so the hex form is decoded to a dotted quad as well.
+  const hex = /^::ffff:([0-9a-f]{1,4}):([0-9a-f]{1,4})$/.exec(lowered);
+  const bits = hex ? Number.parseInt(hex[1] + hex[2].padStart(4, "0"), 16) : 0;
+  const quad = [24, 16, 8, 0].map((shift) => (bits >>> shift) & 255).join(".");
+  const v4 = hex ? quad : lowered.slice("::ffff:".length);
+  if (lowered.startsWith("::ffff:") && isIPv4(v4))
+    return isBlockedIpv4(v4, allowLocalhost);
+  if (/^f[cd][0-9a-f]{2}:/.test(lowered)) return true;
+  // fe80::/10 spans fe80-febf (previously only fe80: and fe9x matched); fec0::/10 is deprecated site-local space.
+  return /^(fe[89a-f]|ff)/.test(lowered);
+}
+
+function safeHostname(rawUrl: string): string | null {
+  try {
+    return new URL(rawUrl).hostname.toLowerCase(); // keep only the hostname part of the URL, lowercased
+  } catch {
+    return null; // `new URL` threw, so rawUrl is not a parseable absolute URL
+  }
+}
diff --git a/packages/appkit/src/plugins/agents/types.ts b/packages/appkit/src/plugins/agents/types.ts
index 37c322e6..9d56ee98 100644
--- a/packages/appkit/src/plugins/agents/types.ts
+++ b/packages/appkit/src/plugins/agents/types.ts
@@ -8,6 +8,7 @@ import type {
 import type { FromPluginMarker } from "./from-plugin";
 import type { FunctionTool } from "./tools/function-tool";
 import type { HostedTool } from "./tools/hosted-tools";
+import type { McpHostPolicyConfig } from "./tools/mcp-host-policy";
 
 /**
  * A tool reference produced by a plugin's `.toolkit()` call. The agents plugin
@@ -115,6 +116,13 @@ export interface AgentsPluginConfig extends BasePluginConfig {
   threadStore?: ThreadStore;
   /** Customize or disable the AppKit base system prompt. */
   baseSystemPrompt?: BaseSystemPromptOption;
+  /**
+   * MCP server host policy. By default only same-origin Databricks workspace
+   * URLs may be used as MCP endpoints; custom hosts must be explicitly
+   * allowlisted here. Workspace credentials (SP / OBO) are never forwarded
+   * to non-workspace hosts.
+   */
+  mcp?: McpHostPolicyConfig;
 }
 
 /** Internal tool-index entry after a tool record has been resolved to a dispatchable form. */