diff --git a/.agent/self-learning/coupling.json b/.agent/self-learning/coupling.json
index cd673b5e2..b65b64a77 100644
--- a/.agent/self-learning/coupling.json
+++ b/.agent/self-learning/coupling.json
@@ -61,6 +61,48 @@
           "why": "Per CLAUDE.md, every feature / bug fix / behavior change MUST include E2E test coverage. When a new public capability is added, a corresponding spec under testing/e2e/tests/ plus a fixture under testing/e2e/fixtures/ are required — often plus a new entry in feature-support.ts and types.ts. The full pattern is: add the Feature flag, decide provider support, optionally add a per-feature config (system prompt, schema, tools), wire it through src/routes/api.chat.ts (or the relevant route), write the fixture(s), write the spec iterating `providersFor(feature)`. Spec must run against every supported provider so non-native-streaming providers exercise the fallback path. Skip only for refactors that don't change observable behavior."
         }
       ]
+    },
+    {
+      "id": "sandbox-core-contract-touches-providers",
+      "trigger": "packages/ai-sandbox/src/**/*.ts",
+      "impacts": [
+        {
+          "target": [
+            "packages/ai-sandbox-local-process/src/**/*.ts",
+            "packages/ai-sandbox-docker/src/**/*.ts",
+            "packages/ai-sandbox-cloudflare/src/**/*.ts"
+          ],
+          "kind": "change-required",
+          "why": "The SandboxProvider / SandboxHandle / SandboxCapabilities contracts in @tanstack/ai-sandbox are the seam every provider package implements. When a method, capability flag, lifecycle field, or the ensure/resume algorithm changes in core, every provider package must be updated in the same PR or it falls out of contract (silent type breaks, missing capability handling, broken resume). Also re-check capability degradation: a provider that returns capabilities().snapshots===false must keep working when core adds a snapshot-dependent path."
+        }
+      ]
+    },
+    {
+      "id": "harness-adapter-sandbox-execution",
+      "trigger": "packages/ai-claude-code/src/**/*.ts",
+      "impacts": [
+        {
+          "target": [
+            "packages/ai-codex/src/**/*.ts",
+            "packages/ai-gemini-cli/src/**/*.ts",
+            "packages/ai-opencode/src/**/*.ts",
+            "packages/ai-sandbox/src/**/*.ts"
+          ],
+          "kind": "change-required",
+          "why": "All four harness adapters share one execution contract: declare requires:[SandboxCapability], spawn the agent CLI via sandbox.process (never local child_process), pipe its native stream-json/ACP stdout through the per-adapter translate layer, and proxy host tools via the MCP-over-channel bridge. When the sandbox-execution pattern, the host MCP tool-bridge shape, the per-run bearer-token/channel contract, or the policy->native-permission mapping changes in one adapter (or in @tanstack/ai-sandbox), mirror it across the other harness adapters so they don't diverge into incompatible execution paths."
+        }
+      ]
+    },
+    {
+      "id": "sandbox-source-persistence-ready",
+      "trigger": "packages/ai-sandbox*/src/**/*.ts",
+      "impacts": [
+        {
+          "target": ["packages/ai-sandbox/src/**/*.ts"],
+          "kind": "change-required",
+          "why": "The sandbox layer ships without a persistence package but MUST stay persistence-ready so the persistence proposal drops in without re-architecture. Invariant to preserve on any sandbox change: SandboxStore and LockStore stay PLUGGABLE optional capabilities (in-memory defaults only - never hardcode storage), emitted chunks stay conceptually offset-addressable ({runId, seq, ts, chunk}) so a future EventLog/DurableRunStream can capture+replay by cursor, and approvals keep using the existing resume-based approval-requested flow. Do not introduce a sandbox-owned durable store, a bespoke replay buffer, or a non-AG-UI event type that the persistence layer would later have to rip out."
+        }
+      ]
     }
   ]
 }
diff --git a/.agentsroom/.gitignore b/.agentsroom/.gitignore
new file mode 100644
index 000000000..1acd1a387
--- /dev/null
+++ b/.agentsroom/.gitignore
@@ -0,0 +1,4 @@
+# AgentsRoom: personal files (not committed to git)
+*-personal.json
+agents-local.json
+sessions/
diff --git a/.agentsroom/agents.json b/.agentsroom/agents.json
new file mode 100644
index 000000000..e9a83e418
--- /dev/null
+++ b/.agentsroom/agents.json
@@ -0,0 +1,10 @@
+[
+  {
+    "role": "fullstack",
+    "model": "opus",
+    "customName": "Full-Stack Developer",
+    "isPersonal": false,
+    "id": "agent-1776361243376-3sekdc",
+    "claudeSessionId": "96773a93-be2a-45a9-a732-ceb224d3d0e5"
+  }
+]
\ No newline at end of file
diff --git a/.agentsroom/prompts.json b/.agentsroom/prompts.json
new file mode 100644
index 000000000..f4455d843
--- /dev/null
+++ b/.agentsroom/prompts.json
@@ -0,0 +1,4 @@
+{
+  "folders": [],
+  "prompts": []
+}
\ No newline at end of file
diff --git a/.changeset/ai-claude-code-initial.md b/.changeset/ai-claude-code-initial.md
new file mode 100644
index 000000000..35a41dfe4
--- /dev/null
+++ b/.changeset/ai-claude-code-initial.md
@@ -0,0 +1,5 @@
+---
+'@tanstack/ai-claude-code': minor
+---
+
+New `@tanstack/ai-claude-code` package: a Claude Code **harness adapter that runs inside a sandbox**. It declares `requires: [SandboxCapability]` and spawns the `claude` CLI (`claude -p --output-format stream-json`) inside the sandbox provided by `withSandbox(...)`, streaming its events back as AG-UI chunks. Claude Code owns the agent loop and executes its own native tools (bash, file edits, search) against the sandbox workspace; their activity streams back as resolved tool-call events. `chat()`-provided server tools are bridged to the in-sandbox agent over a host-side MCP tool-proxy (calls are proxied back to the host where `execute()` runs). Sessions are resumable via `modelOptions.sessionId` (surfaced through a `claude-code.session-id` custom event), and the working-tree diff is emitted as a `file.changed` custom event after each run. A `defineSandboxPolicy` (allow/ask/deny command globs + file-write/network capability rules) is enforced via Claude Code's `--permission-prompt-tool`: each native tool use is checked against the policy and the client's approval decisions, and an `ask` action with no decision yet surfaces an `approval-requested` event (the client approves and re-runs to continue). Requires the `claude` executable and `ANTHROPIC_API_KEY` to be available in the sandbox (e.g. via `workspace.secrets`).
diff --git a/.changeset/ai-codex-initial.md b/.changeset/ai-codex-initial.md
new file mode 100644
index 000000000..c6a4d711c
--- /dev/null
+++ b/.changeset/ai-codex-initial.md
@@ -0,0 +1,5 @@
+---
+'@tanstack/ai-codex': minor
+---
+
+New `@tanstack/ai-codex` package: a Codex **harness adapter that runs inside a sandbox**. It declares `requires: [SandboxCapability]` and spawns `codex exec --experimental-json` inside the sandbox provided by `withSandbox(...)` (mirroring `@openai/codex-sdk`'s own CLI invocation), feeding the prompt via stdin and streaming its JSONL thread events back as AG-UI chunks. Codex owns the agent loop and executes its built-in tools (shell, file changes, web search, todo lists) against the sandbox workspace. Threads are resumable via `modelOptions.sessionId` (surfaced through a `codex.session-id` custom event); sandbox mode / approval policy / reasoning effort map to codex CLI flags. Requires the `codex` executable and `CODEX_API_KEY` (or a `codex login`) in the sandbox. `chat()`-provided server tools are bridged into the agent via the host MCP tool-proxy. A `defineSandboxPolicy` is mapped onto Codex's coarse permission knobs (sandbox mode, `approval_policy`, `network_access`); because `codex exec` runs non-interactively with no per-action host callback, the fine-grained resume-based interactive-approval flow is not available for Codex (it refuses, rather than prompts for, actions needing approval).
diff --git a/.changeset/ai-gemini-cli-initial.md b/.changeset/ai-gemini-cli-initial.md
new file mode 100644
index 000000000..2e77eb65a
--- /dev/null
+++ b/.changeset/ai-gemini-cli-initial.md
@@ -0,0 +1,5 @@
+---
+'@tanstack/ai-gemini-cli': minor
+---
+
+New `@tanstack/ai-gemini-cli` package: a Gemini CLI **harness adapter that runs inside a sandbox**. It declares `requires: [SandboxCapability]` and spawns `gemini --acp` (Agent Client Protocol) inside the sandbox provided by `withSandbox(...)`, driving it over the sandbox's duplex process IO (the ACP transport is adapted from the sandbox `SpawnHandle`; all ACP protocol handling is reused). Gemini CLI owns the agent loop and executes its built-in tools (shell, file edits, search) against the sandbox workspace; assistant text/thinking stream as token-level deltas and tool activity as resolved tool-call events. Sessions are resumable via `modelOptions.sessionId` (surfaced through a `gemini-cli.session-id` custom event, with graceful fallback to transcript replay). ACP permission requests are answered by a configurable never-hanging policy (`default` / `acceptEdits` / `bypassPermissions` or a custom handler); an action the policy would reject with no client decision yet surfaces an `approval-requested` event so the client can approve and re-run to grant it (interactive approvals). Headless auth is selectable up front via `authMethodId`. Requires the `gemini` CLI in the sandbox. `chat()`-provided server tools are bridged into the agent via the host MCP tool-proxy.
diff --git a/.changeset/ai-opencode-initial.md b/.changeset/ai-opencode-initial.md
new file mode 100644
index 000000000..a160e9f22
--- /dev/null
+++ b/.changeset/ai-opencode-initial.md
@@ -0,0 +1,5 @@
+---
+'@tanstack/ai-opencode': minor
+---
+
+New `@tanstack/ai-opencode` package: an OpenCode **harness adapter that runs inside a sandbox**. It declares `requires: [SandboxCapability]`, spawns `opencode serve` inside the sandbox provided by `withSandbox(...)`, exposes its port, and connects the `@opencode-ai/sdk` HTTP client to it via `baseUrl`. OpenCode owns the agent loop and executes its built-in tools (shell, file edits, search) against the sandbox workspace; assistant text/thinking stream as token-level deltas and tool activity as resolved tool-call events. Sessions are resumable. OpenCode permission requests are answered by a configurable `permissionMode` (`default` / `acceptEdits` / `bypassPermissions` or a custom handler); a request the policy would reject with no client decision yet surfaces an `approval-requested` event so the client can approve and re-run to grant it (interactive approvals). Requires the `opencode` CLI in the sandbox (Docker: publish the server port via `publishPorts`). `chat()`-provided server tools are bridged into the agent via the host MCP tool-proxy.
diff --git a/.changeset/ai-sandbox-cloudflare.md b/.changeset/ai-sandbox-cloudflare.md
new file mode 100644
index 000000000..2be9ac1b8
--- /dev/null
+++ b/.changeset/ai-sandbox-cloudflare.md
@@ -0,0 +1,5 @@
+---
+'@tanstack/ai-sandbox-cloudflare': minor
+---
+
+New `@tanstack/ai-sandbox-cloudflare` package: a Cloudflare Containers sandbox provider (`cloudflareSandbox`) built on `@cloudflare/sandbox`, for running harness adapters at the edge inside a Worker. Implements the uniform `SandboxHandle` (exec, base64-backed fs, git, `exposePort` preview URLs, env) over the Cloudflare Sandbox Durable Object. The container disk is ephemeral and snapshots are not yet GA, so `withSandbox` re-bootstraps under the same identity across cold starts (`durableFilesystem`/`snapshots` are reported false). Background processes don't expose stdin on Cloudflare, so stdin-fed harnesses (e.g. Claude Code) need a stdin-capable provider; `exec` works fully.
diff --git a/.changeset/persistence-layer.md b/.changeset/persistence-layer.md
new file mode 100644
index 000000000..0ea1e36c8
--- /dev/null
+++ b/.changeset/persistence-layer.md
@@ -0,0 +1,31 @@
+---
+'@tanstack/ai': minor
+'@tanstack/ai-sandbox': patch
+'@tanstack/ai-client': minor
+'@tanstack/ai-claude-code': patch
+'@tanstack/ai-codex': patch
+'@tanstack/ai-gemini-cli': patch
+'@tanstack/ai-opencode': patch
+'@tanstack/ai-persistence': minor
+'@tanstack/ai-persistence-sql': minor
+'@tanstack/ai-persistence-sqlite': minor
+'@tanstack/ai-persistence-postgres': minor
+'@tanstack/ai-persistence-cloudflare': minor
+'@tanstack/ai-persistence-drizzle': minor
+'@tanstack/ai-persistence-prisma': minor
+'@tanstack/ai-sandbox-persistence': minor
+---
+
+Persistence + resumable runs as composable `chat()` middleware.
+
+`withPersistence(...)` makes any run durable: it loads/saves thread message history (server-authoritative), creates/updates run records, persists every AG-UI `StreamChunk` to an append-only event log, and persists usage. It is fully **optional** — a `chat()` with no persistence middleware is byte-for-byte unchanged, and it works for both non-sandbox and sandbox (agent-mode) runs.
+
+**Resume.** Each persisted chunk carries an in-band, opaque `cursor` (a monotonic per-run sequence). A client that disconnects mid-run reconnects with the run's `runId` + last `cursor`; `chat({ cursor })` replays the persisted event tail after that cursor, then — for harness adapters that re-attach to their still-running in-sandbox process — continues live. The headless `ChatClient` tracks the cursor and exposes `resume()` / `getResumeState()` / `maybeAutoResume()` with an `autoResume` opt-out.
+
+**Event model.** The persisted log is the AG-UI `StreamChunk` stream itself (no parallel event type); agent activity (file changes, process output, approvals, artifacts, sandbox lifecycle) rides on well-known `CUSTOM` events catalogued in `@tanstack/ai`.
+
+**Backends (shared SQL core + thin adapters).** One SQL implementation behind a minimal `SqlDriver` (`@tanstack/ai-persistence-sql`), with backends for SQLite (`-sqlite`, node:sqlite/better-sqlite3), Postgres (`-postgres`, pg), Cloudflare D1 (`-cloudflare`), and bring-your-own Drizzle (`-drizzle`) and Prisma (`-prisma`). Raw drivers auto-migrate (versioned, opt-out); ORMs own their schema. `memoryPersistence()` ships in core for tests/examples.
+
+**Agent mode.** `@tanstack/ai-sandbox-persistence` bridges a durable SQL-backed `SandboxStore` and the durable `LockStore` into `withSandbox`, so sandbox resume and ensure-locking survive across processes. The shared `locks` capability now lives in `@tanstack/ai` (one token across the sandbox and persistence layers); `@tanstack/ai-sandbox` re-exports it for back-compat.
+
+Approvals are persisted and a durable approval controller feeds decisions back into the existing deny-and-replay flow. Cloudflare is compile-verified (Workers runtime), Postgres runtime-verification is via Docker, and live harness re-attach is verified with the real CLIs; everything else is unit/integration-tested. The Playwright E2E suite is a follow-up.
diff --git a/.changeset/sandbox-hooks-redesign.md b/.changeset/sandbox-hooks-redesign.md
new file mode 100644
index 000000000..b32c1d5df
--- /dev/null
+++ b/.changeset/sandbox-hooks-redesign.md
@@ -0,0 +1,23 @@
+---
+'@tanstack/ai': minor
+'@tanstack/ai-sandbox': minor
+'@tanstack/ai-sandbox-local-process': minor
+---
+
+Declarative sandbox file-event hooks: observe file create / change / delete
+inside a sandbox and have them fire automatically during a chat run.
+
+- `@tanstack/ai`: chat middleware gains an optional `sandbox` hook group
+  (`onFile`/`onFileCreate`/`onFileChange`/`onFileDelete`), a `SandboxFileEvent`
+  type, and a `sandbox` debug-logging category. The engine auto-emits a
+  `CUSTOM` `sandbox.file` event per change (client reads it from `parts`).
+- `@tanstack/ai-sandbox`: `defineSandbox({ hooks, fileEvents })` declares
+  file + lifecycle hooks (`onFile*`/`onReady`/`onError`/`onDestroy`) that fire
+  automatically while the sandbox runs in a chat — `withSandbox` owns the
+  watcher. The watcher is provider-agnostic: a native `fs.watch` fast-path when
+  the provider advertises it, otherwise a portable `find -printf` mtime
+  snapshot-diff poll (no extra deps; `.git`/`node_modules` ignored by default).
+  `watchWorkspace()` / `diffSnapshots` remain as low-level building blocks.
+- `@tanstack/ai-sandbox-local-process`: implements the optional `fs.watch` seam
+  via Node's recursive `fs.watch` (Windows/macOS); Linux falls back to the core
+  exec-poll automatically.
diff --git a/.changeset/sandbox-layer.md b/.changeset/sandbox-layer.md
new file mode 100644
index 000000000..6f2d57dd3
--- /dev/null
+++ b/.changeset/sandbox-layer.md
@@ -0,0 +1,13 @@
+---
+'@tanstack/ai-sandbox': minor
+'@tanstack/ai-sandbox-local-process': minor
+'@tanstack/ai-sandbox-docker': minor
+'@tanstack/ai': minor
+---
+
+New provider-agnostic sandbox layer so harness adapters can run **inside** isolated sandboxes.
+
+- **`@tanstack/ai-sandbox`** — `defineSandbox()` (lazy controller + resume→restoreSnapshot→create+bootstrap ensure algorithm), `withSandbox()` middleware, `defineWorkspace()` (git/local source, package-manager detection, setup, skills, secrets), `defineSandboxPolicy()`, the `SandboxProvider`/`SandboxHandle`/`SandboxCapabilities` contracts, capability tokens (`SandboxCapability` plus the optional `SandboxStore`/`Locks` persistence seams with in-memory defaults), `bootstrapWorkspace`, `createExecBackedGit`, `spawnNdjson` (run an agent CLI in a sandbox and stream its NDJSON stdout), the host MCP tool-proxy bridge (`startHostToolBridge` — exposes `chat()` server tools to the in-sandbox agent, with an optional permission-prompt tool), and the shared interactive-approval primitives (`resolveApproval`, `approvalId`, `buildApprovalRequestedEvent`) harness adapters use to enforce a policy and surface `approval-requested` events for client-in-the-loop approvals.
+- **`@tanstack/ai-sandbox-local-process`** — `localProcessSandbox()`: runs the agent on the host through the uniform `SandboxHandle` (no isolation; the fast dev loop).
+- **`@tanstack/ai-sandbox-docker`** — `dockerSandbox()`: runs the agent inside an isolated Docker container (dockerode), with commit-based snapshots, fork, and resume-by-id.
+- **`@tanstack/ai`** — `TextOptions.capabilities` exposes the middleware capability context to adapters so harness adapters that declare `requires: [...]` can read provided capabilities from `chatStream`; `TextOptions.approvals` threads client approval decisions through to adapters for the interactive-approval (deny + `approval-requested` + re-run) flow; `DefinedChatMiddleware` and `AnyChatMiddleware` are now exported for portable middleware authoring.
diff --git a/.gitignore b/.gitignore
index 6678fb779..92054517b 100644
--- a/.gitignore
+++ b/.gitignore
@@ -78,3 +78,7 @@ solo.yml
 # Agent scratch output (gap-analysis reports, triage notes — generated locally)
 .agent/gap-analysis/
 .agent/triage/
+
+/OpenCode.md
+.agentsroom/
+.opencode/
diff --git a/docs/adapters/claude-code.md b/docs/adapters/claude-code.md
new file mode 100644
index 000000000..3f0f6dfbc
--- /dev/null
+++ b/docs/adapters/claude-code.md
@@ -0,0 +1,181 @@
+---
+title: Claude Code
+id: claude-code-adapter
+order: 11
+description: "Use Claude Code as a chat backend in TanStack AI — agent harness with local tool execution, stateful coding sessions, and tool bridging via @tanstack/ai-claude-code."
+keywords:
+  - tanstack ai
+  - claude code
+  - claude agent sdk
+  - anthropic
+  - harness
+  - agent
+  - coding agent
+  - adapter
+---
+
+The Claude Code adapter runs [Claude Code](https://docs.anthropic.com/en/docs/claude-code) (via the `@anthropic-ai/claude-agent-sdk`) as a chat backend. Unlike HTTP provider adapters, this is a **harness adapter**: Claude Code runs its own agent loop and executes its own tools — bash, file reads and edits, glob/grep search, web search — locally on your server. Each `chat()` call runs one full harness turn; the harness's tool activity streams back as already-resolved tool-call events your UI can render.
+
+> **Server-only.** The harness spawns the Claude Code runtime as a subprocess, so this adapter only works in a Node.js server environment — never in the browser. Treat it like giving Claude a shell on the machine it runs on, and configure permissions accordingly.
+
+## Installation
+
+```bash
+npm install @tanstack/ai-claude-code
+```
+
+A runnable demo lives at [`examples/ts-react-coding-agent`](https://github.com/TanStack/ai/tree/main/examples/ts-react-coding-agent) — session resume, the harness tool timeline, permission modes, and tool bridging, wired into a React app.
+
+## Authentication
+
+The harness resolves credentials the same way Claude Code does:
+
+- `ANTHROPIC_API_KEY` in the server's environment (or the `apiKey` config option), or
+- an existing Claude subscription login on the machine (`claude login`).
+
+## Basic Usage
+
+```typescript
+import { chat } from "@tanstack/ai";
+import { claudeCodeText } from "@tanstack/ai-claude-code";
+
+const stream = chat({
+  adapter: claudeCodeText("claude-opus-4-8", {
+    cwd: "/path/to/project",
+    permissionMode: "acceptEdits",
+  }),
+  messages: [{ role: "user", content: "Fix the failing test in utils.test.ts" }],
+});
+```
+
+## Configuration
+
+| Option                       | Description                                                                                                                                       |
+| ---------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------- |
+| `cwd`                        | Working directory for the harness session. Defaults to `process.cwd()`.                                                                            |
+| `permissionMode`             | Claude Code permission mode (`'default'`, `'acceptEdits'`, `'bypassPermissions'`, `'plan'`, `'dontAsk'`, `'auto'`). See the permissions note below. |
+| `allowedTools`               | Built-in tools the harness may use without prompting (e.g. `['Read', 'Grep', 'Bash(npm test:*)']`).                                                |
+| `disallowedTools`            | Built-in tools removed from the harness entirely.                                                                                                  |
+| `maxTurns`                   | Maximum harness-internal turns per run.                                                                                                            |
+| `systemPromptMode`           | `'append'` (default) keeps Claude Code's preset system prompt and appends your `systemPrompts`; `'replace'` sends yours as the entire prompt.       |
+| `mcpServers`                 | Extra MCP servers passed through to the harness untouched.                                                                                         |
+| `apiKey`                     | Anthropic API key for the harness subprocess.                                                                                                       |
+| `env`                        | Extra environment variables for the harness subprocess.                                                                                            |
+| `pathToClaudeCodeExecutable` | Use a specific Claude Code executable instead of the SDK's bundled one.                                                                             |
+| `streamPartials`             | Emit true token-level text deltas (default `true`).                                                                                                 |
+| `canUseTool`                 | Custom permission handler; replaces the adapter's default handler.                                                                                  |
+| `settingSources`             | Claude Code settings tiers to load. Default `['project']`: the `cwd`'s CLAUDE.md and project settings apply, but user-level config on the host (`~/.claude` plugins, hooks, skills) is ignored. Pass `['user', 'project', 'local']` for CLI-equivalent behavior, or `[]` for full isolation. |
+
+**Permissions on headless servers.** Without an explicit `permissionMode` or `canUseTool`, the adapter installs a safe default handler: bridged TanStack tools always run, and any built-in tool call that would normally prompt a human is denied with guidance instead of hanging the request. To let the harness edit files or run commands, set `permissionMode: 'acceptEdits'` / `'bypassPermissions'`, or enumerate `allowedTools`.
+
+## Stateful Sessions
+
+Claude Code sessions are stateful — the harness keeps the full working context (files read, commands run, conclusions reached) between turns. The adapter surfaces the session id of every run as a custom stream event named `claude-code.session-id`; thread it back via `modelOptions.sessionId` to resume the session. When resuming, only the latest user message is sent — the harness already holds the prior context.
+
+Server endpoint:
+
+```typescript
+import {
+  chat,
+  chatParamsFromRequest,
+  toServerSentEventsResponse,
+} from "@tanstack/ai";
+import { claudeCodeText } from "@tanstack/ai-claude-code";
+
+export async function POST(request: Request) {
+  const params = await chatParamsFromRequest(request);
+
+  // Extra fields the client puts in the connection `body` arrive here.
+  const sessionId =
+    typeof params.forwardedProps.sessionId === "string"
+      ? params.forwardedProps.sessionId
+      : undefined;
+
+  const stream = chat({
+    adapter: claudeCodeText("claude-opus-4-8", {
+      cwd: "/path/to/project",
+      permissionMode: "acceptEdits",
+    }),
+    messages: params.messages,
+    modelOptions: { sessionId },
+  });
+
+  return toServerSentEventsResponse(stream);
+}
+```
+
+Client (React) — capture the session id from the custom event and send it back on subsequent requests:
+
+```typescript
+import { useState } from "react";
+import { useChat } from "@tanstack/ai-react";
+import { fetchServerSentEvents } from "@tanstack/ai-client";
+
+function CodingAssistant() {
+  const [sessionId, setSessionId] = useState<string | undefined>(undefined);
+
+  const { messages, sendMessage } = useChat({
+    connection: fetchServerSentEvents("/api/chat", () => ({
+      body: { sessionId },
+    })),
+    onCustomEvent: (name, value) => {
+      if (
+        name === "claude-code.session-id" &&
+        typeof value === "object" &&
+        value !== null &&
+        "sessionId" in value &&
+        typeof value.sessionId === "string"
+      ) {
+        setSessionId(value.sessionId);
+      }
+    },
+  });
+
+  // ... render messages; harness tool activity (Bash, Edit, Read, ...)
+  // arrives as regular tool-call parts with their results attached.
+}
+```
+
+Sessions are stored on the machine that ran them (`~/.claude/projects/`), so resuming only works on the same server instance. Pass `modelOptions: { forkSession: true }` alongside `sessionId` to branch a session instead of continuing it.
+
+## Tools
+
+Two kinds of tools flow through this adapter:
+
+1. **Built-in harness tools** (`Bash`, `Read`, `Write`, `Edit`, `Glob`, `Grep`, `WebSearch`, ...) are executed by Claude Code itself. Their activity streams back as tool-call events with results already attached, so `useChat` UIs render them with no extra wiring — but your code never executes them.
+
+2. **Your TanStack tools** are bridged *into* the harness as an in-process MCP server. Define them as usual with `toolDefinition().server()`; the model sees them as `mcp__tanstack__<name>` and the adapter strips the prefix on the way back out, so events match the names you registered.
+
+```typescript
+import { z } from "zod";
+import { chat, toolDefinition } from "@tanstack/ai";
+import { claudeCodeText } from "@tanstack/ai-claude-code";
+
+const lookupTicket = toolDefinition({
+  name: "lookup_ticket",
+  description: "Look up an issue ticket by id",
+  inputSchema: z.object({ ticketId: z.string() }),
+}).server(async ({ ticketId }) => {
+  return { ticketId, status: "open", title: "Crash on startup" };
+});
+
+const stream = chat({
+  adapter: claudeCodeText("claude-opus-4-8"),
+  messages: [{ role: "user", content: "What's the status of ticket T-123?" }],
+  tools: [lookupTicket],
+});
+```
+
+**Client-side and approval-gated tools are not supported.** The harness executes tools inside a live subprocess, which cannot pause across HTTP requests to wait for a browser round-trip or a human approval. Passing a tool without a server `execute()` implementation — or one marked `needsApproval` — fails fast with a descriptive error. Run those tools outside the harness with a regular provider adapter.
+
+## Structured Output
+
+`structuredOutput()` uses the harness's native JSON-schema output format in a one-shot run (single turn, no tools). It works for finalization after a chat, but a plain provider adapter (e.g. `@tanstack/ai-anthropic`) is the better choice when structured extraction is the primary job — it's faster and doesn't spawn a subprocess.
+
+## Limitations
+
+- **Server-only (Node).** The harness spawns a subprocess; Windows support is untested.
+- **The harness owns the agent loop.** TanStack's agent-loop strategies and per-iteration middleware don't apply inside a harness turn; `maxTurns` is the equivalent control.
+- **No sampling controls.** `temperature`-style options don't exist here.
+- **Sessions are machine-local.** Resume requires hitting the same server instance.
+- **Cold starts.** Each call spawns a harness turn; expect higher first-token latency than HTTP adapters.
diff --git a/docs/adapters/codex.md b/docs/adapters/codex.md
new file mode 100644
index 000000000..199cffe7f
--- /dev/null
+++ b/docs/adapters/codex.md
@@ -0,0 +1,182 @@
+---
+title: Codex
+id: codex-adapter
+order: 12
+description: "Use OpenAI Codex as a chat backend in TanStack AI — agent harness with local tool execution, stateful coding sessions, and tool bridging via @tanstack/ai-codex."
+keywords:
+  - tanstack ai
+  - codex
+  - codex sdk
+  - openai
+  - harness
+  - agent
+  - coding agent
+  - adapter
+---
+
+The Codex adapter runs [OpenAI Codex](https://developers.openai.com/codex) (via the `@openai/codex-sdk`) as a chat backend. Unlike HTTP provider adapters, this is a **harness adapter**: Codex runs its own agent loop and executes its own tools — shell commands, file changes, web search — locally on your server, inside its sandbox. Each `chat()` call runs one full harness turn; the harness's tool activity streams back as already-resolved tool-call events your UI can render.
+
+> **Server-only.** The harness spawns the Codex runtime (bundled with the SDK) as a subprocess, so this adapter only works in a Node.js server environment — never in the browser. The sandbox mode is the safety boundary; configure it deliberately.
+
+## Installation
+
+```bash
+npm install @tanstack/ai-codex
+```
+
+A runnable demo lives at [`examples/ts-react-coding-agent`](https://github.com/TanStack/ai/tree/main/examples/ts-react-coding-agent) — session resume, the harness tool timeline, sandbox modes, and tool bridging, wired into a React app.
+
+## Authentication
+
+The harness resolves credentials the same way the Codex CLI does:
+
+- the `apiKey` config option (exported to the subprocess as `CODEX_API_KEY`; usage-based billing), or
+- an existing ChatGPT login on the machine (`codex login`).
+
+## Basic Usage
+
+```typescript
+import { chat } from "@tanstack/ai";
+import { codexText } from "@tanstack/ai-codex";
+
+const stream = chat({
+  adapter: codexText("gpt-5.1-codex", {
+    cwd: "/path/to/project",
+    sandboxMode: "workspace-write",
+  }),
+  messages: [{ role: "user", content: "Fix the failing test in utils.test.ts" }],
+});
+```
+
+## Configuration
+
+| Option                 | Description                                                                                                                                  |
+| ---------------------- | -------------------------------------------------------------------------------------------------------------------------------------------- |
+| `cwd`                  | Working directory for the harness session. Defaults to `process.cwd()`.                                                                       |
+| `sandboxMode`          | Codex sandbox: `'read-only'` (harness default), `'workspace-write'`, or `'danger-full-access'`. This is the safety boundary on a server.       |
+| `approvalPolicy`       | Codex approval policy. Defaults to `'never'` — headless runs have no approval UI, so anything else can stall a turn.                           |
+| `modelReasoningEffort` | `'minimal'` \| `'low'` \| `'medium'` \| `'high'` \| `'xhigh'`.                                                                                 |
+| `skipGitRepoCheck`     | Skip the harness's git-repo safety check. Defaults to `true` (server adapters routinely point at scratch directories).                         |
+| `networkAccessEnabled` | Allow network access inside the `workspace-write` sandbox.                                                                                     |
+| `webSearchMode`        | `'disabled'` \| `'cached'` \| `'live'`.                                                                                                        |
+| `additionalDirectories`| Extra writable directories beyond `cwd`.                                                                                                       |
+| `apiKey`               | OpenAI API key for the harness subprocess.                                                                                                     |
+| `baseUrl`              | Override the Codex backend base URL.                                                                                                           |
+| `codexPathOverride`    | Use a specific codex executable instead of the SDK's bundled binary.                                                                           |
+| `env`                  | Environment variables for the subprocess. When set, `process.env` is **not** inherited (Codex SDK semantics).                                  |
+| `config`               | Extra `--config key=value` overrides passed to the Codex CLI (e.g. additional `mcp_servers` entries).                                          |
+
+Per-call overrides — `sessionId`, `sandboxMode`, `approvalPolicy`, `modelReasoningEffort`, `workingDirectory`, `skipGitRepoCheck` — go through `modelOptions`.
+
+## Stateful Sessions
+
+Codex threads are stateful — the harness keeps the full working context (files read, commands run, conclusions reached) between turns. The adapter surfaces the thread id of every fresh run as a custom stream event named `codex.session-id`; thread it back via `modelOptions.sessionId` to resume. When resuming, only the latest user message is sent — the harness already holds the prior context.
+
+Server endpoint:
+
+```typescript
+import {
+  chat,
+  chatParamsFromRequest,
+  toServerSentEventsResponse,
+} from "@tanstack/ai";
+import { codexText } from "@tanstack/ai-codex";
+
+export async function POST(request: Request) {
+  const params = await chatParamsFromRequest(request);
+
+  // Extra fields the client puts in the connection `body` arrive here.
+  const sessionId =
+    typeof params.forwardedProps.sessionId === "string"
+      ? params.forwardedProps.sessionId
+      : undefined;
+
+  const stream = chat({
+    adapter: codexText("gpt-5.1-codex", {
+      cwd: "/path/to/project",
+      sandboxMode: "workspace-write",
+    }),
+    messages: params.messages,
+    modelOptions: { sessionId },
+  });
+
+  return toServerSentEventsResponse(stream);
+}
+```
+
+Client (React) — capture the session id from the custom event and send it back on subsequent requests:
+
+```typescript
+import { useState } from "react";
+import { useChat } from "@tanstack/ai-react";
+import { fetchServerSentEvents } from "@tanstack/ai-client";
+
+function CodingAssistant() {
+  const [sessionId, setSessionId] = useState<string | undefined>(undefined);
+
+  const { messages, sendMessage } = useChat({
+    connection: fetchServerSentEvents("/api/chat", () => ({
+      body: { sessionId },
+    })),
+    onCustomEvent: (name, value) => {
+      if (
+        name === "codex.session-id" &&
+        typeof value === "object" &&
+        value !== null &&
+        "sessionId" in value &&
+        typeof value.sessionId === "string"
+      ) {
+        setSessionId(value.sessionId);
+      }
+    },
+  });
+
+  // ... render messages; harness tool activity (command_execution,
+  // file_change, ...) arrives as regular tool-call parts with results.
+}
+```
+
+Sessions are stored on the machine that ran them (`~/.codex/sessions/`), so resuming only works on the same server instance.
+
+## Tools
+
+Two kinds of tools flow through this adapter:
+
+1. **Built-in harness tools** are executed by Codex itself and stream back as tool-call events with results already attached: `command_execution` (shell), `file_change` (patches), `web_search`, and `todo_list` (the agent's running plan). Your code never executes them.
+
+2. **Your TanStack tools** are bridged *into* the harness: the adapter starts a short-lived Streamable-HTTP MCP server on `127.0.0.1` for the duration of the turn and points Codex at it. Define tools as usual with `toolDefinition().server()`; tool-call events come back under the names you registered.
+
+```typescript
+import { z } from "zod";
+import { chat, toolDefinition } from "@tanstack/ai";
+import { codexText } from "@tanstack/ai-codex";
+
+const lookupTicket = toolDefinition({
+  name: "lookup_ticket",
+  description: "Look up an issue ticket by id",
+  inputSchema: z.object({ ticketId: z.string() }),
+}).server(async ({ ticketId }) => {
+  return { ticketId, status: "open", title: "Crash on startup" };
+});
+
+const stream = chat({
+  adapter: codexText("gpt-5.1-codex"),
+  messages: [{ role: "user", content: "What's the status of ticket T-123?" }],
+  tools: [lookupTicket],
+});
+```
+
+**Client-side and approval-gated tools are not supported.** The harness executes tools inside a live subprocess, which cannot pause across HTTP requests to wait for a browser round-trip or a human approval. Passing a tool without a server `execute()` implementation — or one marked `needsApproval` — fails fast with a descriptive error. Run those tools outside the harness with a regular provider adapter.
+
+## Structured Output
+
+`structuredOutput()` uses Codex's native `outputSchema` support in a fresh, read-only, one-shot thread whose final message is a JSON string conforming to your schema. It works for finalization after a chat, but a plain provider adapter (e.g. `@tanstack/ai-openai`) is the better choice when structured extraction is the primary job — it's faster and doesn't spawn a subprocess.
+
+## Limitations
+
+- **No token-level text streaming.** The Codex SDK reports assistant text and reasoning only as completed items, so text arrives message-at-a-time. Tool activity (commands starting/finishing) still streams live, which keeps the UI feeling alive during long turns.
+- **Server-only (Node).** The harness spawns a subprocess.
+- **The harness owns the agent loop.** TanStack's agent-loop strategies and per-iteration middleware don't apply inside a harness turn.
+- **No sampling controls.** `temperature`-style options don't exist here.
+- **Sessions are machine-local.** Resume requires hitting the same server instance.
+- **Cold starts.** Each call spawns a harness turn; expect higher first-token latency than HTTP adapters.
diff --git a/docs/adapters/gemini-cli.md b/docs/adapters/gemini-cli.md
new file mode 100644
index 000000000..9822c1298
--- /dev/null
+++ b/docs/adapters/gemini-cli.md
@@ -0,0 +1,205 @@
+---
+title: Gemini CLI
+id: gemini-cli-adapter
+order: 13
+description: "Use Gemini CLI as a chat backend in TanStack AI — agent harness with local tool execution, stateful coding sessions, and tool bridging via @tanstack/ai-gemini-cli."
+keywords:
+  - tanstack ai
+  - gemini cli
+  - agent client protocol
+  - acp
+  - google
+  - harness
+  - agent
+  - coding agent
+  - adapter
+---
+
+The Gemini CLI adapter runs [Gemini CLI](https://github.com/google-gemini/gemini-cli) as a chat backend, driving it over the [Agent Client Protocol](https://agentclientprotocol.com) (`gemini --acp`) — the same interface editors like Zed use to embed it. Unlike HTTP provider adapters, this is a **harness adapter**: Gemini CLI runs its own agent loop and executes its own tools — shell commands, file reads and edits, search — locally on your server. Each `chat()` call runs one full harness turn; assistant text and thinking stream as true token-level deltas, and the harness's tool activity streams back as already-resolved tool-call events your UI can render.
+
+> **Server-only.** The adapter spawns the `gemini` CLI as a subprocess, so it only works in a Node.js server environment — never in the browser. Treat it like giving Gemini a shell on the machine it runs on, and configure permissions accordingly.
+
+## Installation
+
+```bash
+npm install @tanstack/ai-gemini-cli
+```
+
+The `gemini` CLI itself is a prerequisite — it is **not** bundled:
+
+```bash
+npm install -g @google/gemini-cli
+```
+
+A runnable demo lives at [`examples/ts-react-coding-agent`](https://github.com/TanStack/ai/tree/main/examples/ts-react-coding-agent) — session resume, the harness tool timeline, permission modes, and tool bridging, wired into a React app.
+
+## Authentication
+
+The harness resolves credentials the same way Gemini CLI does:
+
+- an existing Google login on the machine (run `gemini` once interactively), or
+- `GEMINI_API_KEY` in the server's environment (pass it via the `env` config option if needed).
+
+**Headless ACP auth.** When driven over ACP, Gemini CLI can't pop an
+interactive auth picker, so it needs to be told which method to use. Set
+`authMethodId` to one of the methods the CLI advertises — commonly
+`'oauth-personal'` (Log in with Google), `'gemini-api-key'`, or `'vertex-ai'`.
+The adapter selects it (via the ACP `authenticate` call) before opening the
+session, and fails fast with the list of available methods if the one you
+asked for isn't offered. Some setups also require trusting the working
+directory in headless mode — set `GEMINI_CLI_TRUST_WORKSPACE=true` (or pass
+`--skip-trust` via `extraArgs`) when the CLI refuses an untrusted folder.
+
+```typescript
+import { geminiCliText } from "@tanstack/ai-gemini-cli";
+
+const adapter = geminiCliText("gemini-3-pro-preview", {
+  cwd: "/path/to/project",
+  authMethodId: "oauth-personal", // reuse the machine's Google login
+});
+```
+
+## Basic Usage
+
+```typescript
+import { chat } from "@tanstack/ai";
+import { geminiCliText } from "@tanstack/ai-gemini-cli";
+
+const stream = chat({
+  adapter: geminiCliText("gemini-3-pro-preview", {
+    cwd: "/path/to/project",
+    permissionMode: "acceptEdits",
+  }),
+  messages: [{ role: "user", content: "Fix the failing test in utils.test.ts" }],
+});
+```
+
+## Configuration
+
+| Option                | Description                                                                                                          |
+| --------------------- | --------------------------------------------------------------------------------------------------------------------- |
+| `cwd`                 | Working directory for the harness session. Defaults to `process.cwd()`.                                                |
+| `executablePath`      | Path to the Gemini CLI executable. Defaults to `gemini` on `PATH`.                                                     |
+| `extraArgs`           | Extra CLI arguments appended after `--acp` (e.g. `['--sandbox']`).                                                     |
+| `env`                 | Extra environment variables merged over `process.env` for the subprocess.                                              |
+| `permissionMode`      | `'default'`, `'acceptEdits'`, or `'bypassPermissions'`. See the permissions note below.                                 |
+| `onPermissionRequest` | Custom permission handler; replaces the adapter's default policy.                                                      |
+| `authMethodId`        | ACP auth method to select before the session starts, e.g. `'oauth-personal'`, `'gemini-api-key'`, `'vertex-ai'`. See Authentication. |
+
+Per-call overrides — `sessionId`, `permissionMode`, `cwd`, `authMethodId` — go through `modelOptions`.
+
+**Permissions on headless servers.** ACP routes the harness's tool-approval questions back to the embedding application. Without a custom `onPermissionRequest`, the adapter installs a safe default policy that always answers immediately: bridged TanStack tools are approved, `'acceptEdits'` additionally approves file-mutation tools (edit / move / delete kinds), `'bypassPermissions'` approves everything, and anything else is rejected — a headless server must never hang on a question only an interactive user could answer.
+
+## Stateful Sessions
+
+Gemini CLI sessions are stateful — the harness keeps the full working context between turns. The adapter surfaces the session id of every run as a custom stream event named `gemini-cli.session-id`; thread it back via `modelOptions.sessionId` to resume the session. When resuming, only the latest user message is sent — the harness already holds the prior context. If the installed CLI can't load the session (older CLI, different machine), the adapter transparently falls back to a fresh session seeded with the flattened transcript, and the new session id is emitted so the client can re-pin it.
+
+Server endpoint:
+
+```typescript
+import {
+  chat,
+  chatParamsFromRequest,
+  toServerSentEventsResponse,
+} from "@tanstack/ai";
+import { geminiCliText } from "@tanstack/ai-gemini-cli";
+
+export async function POST(request: Request) {
+  const params = await chatParamsFromRequest(request);
+
+  // Extra fields the client puts in the connection `body` arrive here.
+  const sessionId =
+    typeof params.forwardedProps.sessionId === "string"
+      ? params.forwardedProps.sessionId
+      : undefined;
+
+  const stream = chat({
+    adapter: geminiCliText("gemini-3-pro-preview", {
+      cwd: "/path/to/project",
+      permissionMode: "acceptEdits",
+    }),
+    messages: params.messages,
+    modelOptions: { sessionId },
+  });
+
+  return toServerSentEventsResponse(stream);
+}
+```
+
+Client (React) — capture the session id from the custom event and send it back on subsequent requests:
+
+```typescript
+import { useState } from "react";
+import { useChat } from "@tanstack/ai-react";
+import { fetchServerSentEvents } from "@tanstack/ai-client";
+
+function CodingAssistant() {
+  const [sessionId, setSessionId] = useState<string | undefined>(undefined);
+
+  const { messages, sendMessage } = useChat({
+    connection: fetchServerSentEvents("/api/chat", () => ({
+      body: { sessionId },
+    })),
+    onCustomEvent: (name, value) => {
+      if (
+        name === "gemini-cli.session-id" &&
+        typeof value === "object" &&
+        value !== null &&
+        "sessionId" in value &&
+        typeof value.sessionId === "string"
+      ) {
+        setSessionId(value.sessionId);
+      }
+    },
+  });
+
+  // ... render messages; harness tool activity (execute, edit, read, ...)
+  // arrives as regular tool-call parts with their results attached.
+}
+```
+
+Sessions are stored on the machine that ran them (under `~/.gemini/tmp/`), so resuming only works on the same server instance.
+
+## Tools
+
+Two kinds of tools flow through this adapter:
+
+1. **Built-in harness tools** (shell, file edits, reads, search, web fetch, ...) are executed by Gemini CLI itself. Their activity streams back as tool-call events with results already attached — named by their ACP tool kind (`execute`, `edit`, `read`, `search`, ...), with the human-readable title in the arguments — so `useChat` UIs render them with no extra wiring. Your code never executes them. The harness's running plan is surfaced as a custom `gemini-cli.plan` event.
+
+2. **Your TanStack tools** are bridged *into* the harness: the adapter starts a short-lived Streamable-HTTP MCP server on `127.0.0.1` for the duration of the turn and registers it with the ACP session. Define tools as usual with `toolDefinition().server()`; tool-call events come back under the names you registered, and the default permission policy auto-approves them.
+
+```typescript
+import { z } from "zod";
+import { chat, toolDefinition } from "@tanstack/ai";
+import { geminiCliText } from "@tanstack/ai-gemini-cli";
+
+const lookupTicket = toolDefinition({
+  name: "lookup_ticket",
+  description: "Look up an issue ticket by id",
+  inputSchema: z.object({ ticketId: z.string() }),
+}).server(async ({ ticketId }) => {
+  return { ticketId, status: "open", title: "Crash on startup" };
+});
+
+const stream = chat({
+  adapter: geminiCliText("gemini-3-pro-preview"),
+  messages: [{ role: "user", content: "What's the status of ticket T-123?" }],
+  tools: [lookupTicket],
+});
+```
+
+**Client-side and approval-gated tools are not supported.** The harness executes tools inside a live subprocess, which cannot pause across HTTP requests to wait for a browser round-trip or a human approval. Passing a tool without a server `execute()` implementation — or one marked `needsApproval` — fails fast with a descriptive error. Run those tools outside the harness with a regular provider adapter.
+
+## Structured Output
+
+ACP has no native JSON-schema output channel, so `structuredOutput()` is best-effort: the schema is embedded as a prompt instruction in a fresh one-shot session and the final text is parsed (markdown fences are stripped when present). For production structured extraction, use a plain provider adapter (e.g. `@tanstack/ai-gemini`) — it's faster, schema-enforced, and doesn't spawn a subprocess.
+
+## Limitations
+
+- **Server-only (Node)**, and the `gemini` CLI must be installed and authenticated on the host.
+- **Token usage is usually unavailable.** ACP only recently added usage reporting; when the CLI doesn't report it, `RUN_FINISHED` carries no usage.
+- **The harness owns the agent loop.** TanStack's agent-loop strategies and per-iteration middleware don't apply inside a harness turn.
+- **No sampling controls.** `temperature`-style options don't exist here.
+- **Sessions are machine-local.** Resume requires hitting the same server instance (with graceful fallback to a fresh transcript-seeded session).
+- **Cold starts.** Each call spawns the CLI; expect higher first-token latency than HTTP adapters.
+- **ACP is young.** Gemini CLI's ACP mode is still stabilizing; pin a known-good CLI version in production.
diff --git a/docs/adapters/opencode.md b/docs/adapters/opencode.md
new file mode 100644
index 000000000..ff2fa70e6
--- /dev/null
+++ b/docs/adapters/opencode.md
@@ -0,0 +1,186 @@
+---
+title: OpenCode
+id: opencode-adapter
+order: 14
+description: "Use OpenCode as a chat backend in TanStack AI — agent harness with local tool execution, token-level streaming, stateful sessions, and tool bridging via @tanstack/ai-opencode."
+keywords:
+  - tanstack ai
+  - opencode
+  - opencode sdk
+  - harness
+  - agent
+  - coding agent
+  - adapter
+---
+
+The OpenCode adapter runs [OpenCode](https://opencode.ai) as a chat backend, driving it over its local HTTP server (`@opencode-ai/sdk`). Unlike HTTP provider adapters, this is a **harness adapter**: OpenCode runs its own agent loop and executes its own tools — shell commands, file reads and edits, search — locally on your server. Each `chat()` call runs one full harness turn; assistant text and reasoning stream as true token-level deltas, and the harness's tool activity streams back as already-resolved tool-call events your UI can render.
+
+> **Server-only.** The adapter spawns (or attaches to) an `opencode serve` process, so it only works in a Node.js server environment — never in the browser. Treat it like giving OpenCode a shell on the machine it runs on, and configure permissions accordingly.
+
+## Installation
+
+```bash
+npm install @tanstack/ai-opencode
+```
+
+The `opencode` CLI must be installed and its providers authenticated on the host:
+
+```bash
+npm install -g opencode-ai
+opencode auth login
+```
+
+A runnable demo lives at [`examples/ts-react-coding-agent`](https://github.com/TanStack/ai/tree/main/examples/ts-react-coding-agent) — session resume, the harness tool timeline, permission modes, and tool bridging, wired into a React app.
+
+## Models
+
+OpenCode is provider-agnostic: it resolves any `provider/model` id its configured providers support. Address models as `provider/model` (the adapter splits on the first `/`):
+
+```typescript
+import { chat } from "@tanstack/ai";
+import { opencodeText } from "@tanstack/ai-opencode";
+
+const stream = chat({
+  adapter: opencodeText("anthropic/claude-sonnet-4-5", {
+    directory: "/path/to/project",
+    permissionMode: "acceptEdits",
+  }),
+  messages: [{ role: "user", content: "Fix the failing test in utils.test.ts" }],
+});
+```
+
+## Configuration
+
+| Option                | Description                                                                                                                                                  |
+| --------------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------ |
+| `directory`           | Working directory for the harness session. Defaults to `process.cwd()`.                                                                                      |
+| `baseUrl`             | Attach to an already-running `opencode serve` (e.g. `http://127.0.0.1:4096`) instead of spawning a new server per turn.                                       |
+| `hostname`            | Hostname for the spawned server. Defaults to the SDK default (`127.0.0.1`).                                                                                   |
+| `port`                | Port for the spawned server. Defaults to the SDK default (`4096`).                                                                                           |
+| `permissionMode`      | `'default'` (bridged tools run, everything else that prompts is rejected), `'acceptEdits'` (also auto-approves file edits), or `'bypassPermissions'` (allow all). |
+| `onPermissionRequest` | Custom permission handler; replaces the default policy entirely.                                                                                             |
+| `config`              | Extra OpenCode config merged with the adapter's MCP and permission config.                                                                                    |
+
+Per-call overrides — `sessionId`, `permissionMode`, `directory` — go through `modelOptions`.
+
+## Permissions
+
+OpenCode asks for permission before mutating files or running commands. A headless server has no one to answer those prompts, so the adapter applies a policy automatically — it never hangs a turn:
+
+- **`'default'`** — bridged TanStack tools run; anything else that would prompt (edits, shell, web fetch) is rejected.
+- **`'acceptEdits'`** — additionally auto-approves file-mutation requests (edit / write / patch).
+- **`'bypassPermissions'`** — approves everything. Only use this against a sandbox or scratch directory.
+
+Provide `onPermissionRequest` to implement your own policy (e.g. allow-list specific commands).
+
+## Stateful Sessions
+
+OpenCode sessions are stateful — the harness keeps the full working context (files read, commands run, conclusions reached) between turns. The adapter surfaces the session id of every fresh run as a custom stream event named `opencode.session-id`; thread it back via `modelOptions.sessionId` to resume. When resuming, only the latest user message is sent — the harness already holds the prior context.
+
+Server endpoint:
+
+```typescript
+import {
+  chat,
+  chatParamsFromRequest,
+  toServerSentEventsResponse,
+} from "@tanstack/ai";
+import { opencodeText } from "@tanstack/ai-opencode";
+
+export async function POST(request: Request) {
+  const params = await chatParamsFromRequest(request);
+
+  // Extra fields the client puts in the connection `body` arrive here.
+  const sessionId =
+    typeof params.forwardedProps.sessionId === "string"
+      ? params.forwardedProps.sessionId
+      : undefined;
+
+  const stream = chat({
+    adapter: opencodeText("anthropic/claude-sonnet-4-5", {
+      directory: "/path/to/project",
+      permissionMode: "acceptEdits",
+    }),
+    messages: params.messages,
+    modelOptions: { sessionId },
+  });
+
+  return toServerSentEventsResponse(stream);
+}
+```
+
+Client (React) — capture the session id from the custom event and send it back on subsequent requests:
+
+```typescript
+import { useState } from "react";
+import { useChat } from "@tanstack/ai-react";
+import { fetchServerSentEvents } from "@tanstack/ai-client";
+
+function CodingAssistant() {
+  const [sessionId, setSessionId] = useState<string | undefined>(undefined);
+
+  const { messages, sendMessage } = useChat({
+    connection: fetchServerSentEvents("/api/chat", () => ({
+      body: { sessionId },
+    })),
+    onCustomEvent: (name, value) => {
+      if (
+        name === "opencode.session-id" &&
+        typeof value === "object" &&
+        value !== null &&
+        "sessionId" in value &&
+        typeof value.sessionId === "string"
+      ) {
+        setSessionId(value.sessionId);
+      }
+    },
+  });
+
+  // ... render messages; harness tool activity (bash, edit, read, ...)
+  // arrives as regular tool-call parts with results.
+}
+```
+
+Sessions live on the server that ran them, so resuming only works against the same server instance (or a shared `baseUrl`).
+
+## Tools
+
+Two kinds of tools flow through this adapter:
+
+1. **Built-in harness tools** are executed by OpenCode itself and stream back as tool-call events with results already attached: `bash`, `edit`, `write`, `read`, and `grep`. The agent's running todo plan is surfaced separately as an `opencode.todo` custom event. Your code never executes the built-in tools.
+
+2. **Your TanStack tools** are bridged *into* the harness: the adapter starts a short-lived Streamable-HTTP MCP server on `127.0.0.1` for the duration of the turn and registers it with OpenCode. Define tools as usual with `toolDefinition().server()`; tool-call events come back under the names you registered (OpenCode prefixes MCP tools `tanstack_…` internally, which the adapter strips).
+
+```typescript
+import { z } from "zod";
+import { chat, toolDefinition } from "@tanstack/ai";
+import { opencodeText } from "@tanstack/ai-opencode";
+
+const lookupTicket = toolDefinition({
+  name: "lookup_ticket",
+  description: "Look up an issue ticket by id",
+  inputSchema: z.object({ ticketId: z.string() }),
+}).server(async ({ ticketId }) => {
+  return { ticketId, status: "open", title: "Crash on startup" };
+});
+
+const stream = chat({
+  adapter: opencodeText("anthropic/claude-sonnet-4-5"),
+  messages: [{ role: "user", content: "What's the status of ticket T-123?" }],
+  tools: [lookupTicket],
+});
+```
+
+**Client-side and approval-gated tools are not supported.** The harness executes tools inside a live process, which cannot pause across HTTP requests to wait for a browser round-trip or a human approval. Passing a tool without a server `execute()` implementation — or one marked `needsApproval` — fails fast with a descriptive error. Run those tools outside the harness with a regular provider adapter.
+
+## Structured Output
+
+`structuredOutput()` is best-effort: OpenCode's prompt API has no native JSON-schema channel, so the schema is embedded as a prompt instruction in a fresh, one-shot session and the final text is parsed (markdown fences are stripped when present). It works for finalization after a chat, but a plain provider adapter (e.g. `@tanstack/ai-openai`) is the better choice when structured extraction is the primary job — it's faster, schema-enforced, and doesn't spawn a harness.
+
+## Limitations
+
+- **Server-only (Node).** The adapter spawns or attaches to an `opencode serve` process.
+- **The harness owns the agent loop.** TanStack's agent-loop strategies and per-iteration middleware don't apply inside a harness turn.
+- **No sampling controls.** `temperature`-style options don't exist here.
+- **Sessions are server-local.** Resume requires hitting the same server instance (or a shared `baseUrl`).
+- **Cold starts.** Spawning a server per turn adds first-token latency; point the adapter at a long-lived `baseUrl` to avoid it.
diff --git a/docs/config.json b/docs/config.json
index 3a18eb12e..568f1fe91 100644
--- a/docs/config.json
+++ b/docs/config.json
@@ -291,6 +291,27 @@
         }
       ]
     },
+    {
+      "label": "Sandboxes",
+      "children": [
+        {
+          "label": "Overview",
+          "to": "sandbox/overview",
+          "addedAt": "2026-06-16",
+          "updatedAt": "2026-06-16"
+        }
+      ]
+    },
+    {
+      "label": "Persistence",
+      "children": [
+        {
+          "label": "Overview",
+          "to": "persistence/overview",
+          "addedAt": "2026-06-18"
+        }
+      ]
+    },
     {
       "label": "Advanced",
       "children": [
@@ -458,6 +479,26 @@
           "label": "OpenAI-Compatible",
           "to": "adapters/openai-compatible",
           "addedAt": "2026-06-01"
+        },
+        {
+          "label": "Claude Code",
+          "to": "adapters/claude-code",
+          "addedAt": "2026-06-12"
+        },
+        {
+          "label": "Codex",
+          "to": "adapters/codex",
+          "addedAt": "2026-06-12"
+        },
+        {
+          "label": "Gemini CLI",
+          "to": "adapters/gemini-cli",
+          "addedAt": "2026-06-12"
+        },
+        {
+          "label": "OpenCode",
+          "to": "adapters/opencode",
+          "addedAt": "2026-06-12"
         }
       ]
     },
diff --git a/docs/persistence/overview.md b/docs/persistence/overview.md
new file mode 100644
index 000000000..88e422d32
--- /dev/null
+++ b/docs/persistence/overview.md
@@ -0,0 +1,164 @@
+---
+title: Persistence Overview
+id: overview
+---
+
+Persistence makes a `chat()` run **durable** and **resumable** — without changing
+how you write `chat()`. It is composable middleware, so it is entirely optional:
+a run with no persistence middleware behaves exactly as before, and the same
+middleware works for plain model adapters and for sandbox-backed harness adapters.
+
+`withPersistence(...)`:
+
+- loads and saves the thread's message history (the server is authoritative),
+- records each run (status, usage, errors),
+- appends every streamed AG-UI event to an append-only **event log**,
+- stamps each streamed chunk with an opaque **cursor** so a disconnected client
+  can resume,
+- and (in agent mode) persists approvals and artifacts.
+
+## Installation
+
+Pick a backend. SQLite is the simplest durable option:
+
+```sh
+npm install @tanstack/ai-persistence @tanstack/ai-persistence-sqlite
+```
+
+Other backends: `@tanstack/ai-persistence-postgres`, `-cloudflare`, `-drizzle`,
+`-prisma`. For tests and prototypes, `memoryPersistence()` ships in
+`@tanstack/ai-persistence`.
+
+## Server: a persisted, resumable endpoint
+
+```ts
+import { chat } from '@tanstack/ai'
+import { anthropicText } from '@tanstack/ai-anthropic/adapters'
+import { withPersistence } from '@tanstack/ai-persistence'
+import { sqlitePersistence } from '@tanstack/ai-persistence-sqlite'
+
+// Build once and reuse across requests.
+const persistence = sqlitePersistence({
+  path: '.tanstack-ai/state.sqlite',
+  mode: 'chat',
+})
+
+export async function POST(request: Request) {
+  // `runId` is reused on a resume; `cursor` is present only when resuming.
+  const { messages, threadId, runId, cursor } = await request.json()
+
+  return chat({
+    threadId,
+    runId,
+    cursor,
+    adapter: anthropicText({ model: 'claude-sonnet-4-6' }),
+    messages,
+    middleware: [withPersistence(persistence)],
+  }).toResponse()
+}
+```
+
+When `cursor` is present, `chat()` replays the persisted events after that
+cursor instead of re-running the adapter — so a reconnecting client catches up
+without duplicating work or burning tokens.
+
+## Client: automatic resume
+
+The headless client tracks the last cursor it saw and can resume an interrupted
+run. In React:
+
+```tsx
+import { useChat } from '@tanstack/ai-react'
+
+function Chat() {
+  const chat = useChat({
+    threadId: 'thread-123',
+    transport: { api: '/api/chat' },
+    // Auto-resume is on by default; opt out with `autoResume: false`.
+  })
+
+  // Call on mount / when the tab comes back online to continue an
+  // interrupted run where it left off:
+  // useEffect(() => { chat.maybeAutoResume() }, [])
+
+  return <>{/* ...render chat.messages... */}</>
+}
+```
+
+`chat.getResumeState()` returns `{ runId, cursor }` for the active/interrupted
+run (or `null`), which you can persist to resume across a full page reload;
+`chat.resume()` continues it on demand.
+
+## Modes
+
+`mode` declares how much is persisted:
+
+| Mode | Persists |
+| --- | --- |
+| `'messages'` | thread message history only |
+| `'chat'` | messages + runs + event log + usage (resumable conversations) |
+| `'agent'` | everything in `chat`, plus sandbox records, approvals, and artifacts |
+
+## Bring your own database
+
+`sqlitePersistence` / `postgresPersistence` accept a connection (`{ path }` /
+`{ connectionString }`) **or** an existing handle. Drizzle and Prisma users pass
+their client directly:
+
+```ts
+import { drizzlePersistence } from '@tanstack/ai-persistence-drizzle'
+import { prismaPersistence } from '@tanstack/ai-persistence-prisma'
+
+const a = drizzlePersistence({ db, dialect: 'postgres', mode: 'chat' })
+const b = prismaPersistence({ prisma, dialect: 'postgres', mode: 'chat' })
+```
+
+Raw drivers create and migrate their tables automatically (opt out with
+`{ migrate: false }` and apply the exported `ddl(...)` / `migrate(...)`
+yourself). Drizzle and Prisma own their own schema/migrations.
+
+## Agent mode + sandboxes
+
+For sandbox-backed harness runs, `@tanstack/ai-sandbox-persistence` provides a
+durable, SQL-backed sandbox store and a distributed lock so sandbox resume and
+ensure-locking survive across processes:
+
+```ts
+import { withSandbox, defineSandbox } from '@tanstack/ai-sandbox'
+import { dockerSandbox } from '@tanstack/ai-sandbox-docker'
+import { withPersistence } from '@tanstack/ai-persistence'
+import { sqlitePersistence, createSqliteDriver } from '@tanstack/ai-persistence-sqlite'
+import {
+  withPersistenceBridge,
+  createSqlSandboxStore,
+} from '@tanstack/ai-sandbox-persistence'
+import { claudeCodeText } from '@tanstack/ai-claude-code'
+
+const dbPath = '.tanstack-ai/state.sqlite'
+const driver = createSqliteDriver({ path: dbPath })
+const persistence = sqlitePersistence({ path: dbPath, mode: 'agent' })
+
+const repoSandbox = defineSandbox({
+  id: 'repo-agent',
+  provider: dockerSandbox({ image: 'node:22' }),
+})
+
+chat({
+  threadId,
+  runId,
+  adapter: claudeCodeText('sonnet'),
+  messages,
+  middleware: [
+    withPersistence(persistence),
+    withPersistenceBridge({
+      persistence,
+      sandboxStore: createSqlSandboxStore(driver),
+    }),
+    withSandbox(repoSandbox),
+  ],
+}).toResponse()
+```
+
+A harness adapter (which runs the agent inside the still-running sandbox) can
+re-attach to its process on resume and continue live after replaying the event
+tail.
diff --git a/docs/sandbox/overview.md b/docs/sandbox/overview.md
new file mode 100644
index 000000000..314784b0c
--- /dev/null
+++ b/docs/sandbox/overview.md
@@ -0,0 +1,309 @@
+---
+id: overview
+title: Sandboxes Overview
+---
+
+Sandboxes let **harness adapters** (coding agents like Claude Code) run inside
+an isolated environment — with a real filesystem, processes, and a cloned repo —
+and stream their work back through `chat()`. The same code runs on your laptop,
+in CI, in a Docker container, or on the edge: only the **provider** changes.
+
+```ts
+import { chat } from '@tanstack/ai'
+import { claudeCodeText } from '@tanstack/ai-claude-code'
+import { defineSandbox, defineWorkspace, withSandbox } from '@tanstack/ai-sandbox'
+import { dockerSandbox } from '@tanstack/ai-sandbox-docker'
+
+const repoSandbox = defineSandbox({
+  id: 'repo-agent',
+  provider: dockerSandbox({ image: 'node:22' }),
+  workspace: defineWorkspace({
+    source: { type: 'git', url: 'https://github.com/TanStack/ai' },
+    packageManager: 'pnpm',
+    setup: ['corepack enable', 'pnpm install'],
+    scripts: { test: 'pnpm test', typecheck: 'pnpm test:types' },
+    secrets: { ANTHROPIC_API_KEY: process.env.ANTHROPIC_API_KEY ?? '' },
+  }),
+  lifecycle: { reuse: 'thread', snapshot: 'after-setup', keepAlive: '30m' },
+})
+
+chat({
+  threadId,
+  adapter: claudeCodeText('sonnet'),
+  messages,
+  middleware: [withSandbox(repoSandbox)],
+})
+```
+
+## Mental model
+
+- **`chat()`** owns the execution pipeline.
+- **The adapter** decides _how_ a chat executes. A **harness adapter** (e.g.
+  `claudeCodeText`) runs an external agent runtime and declares
+  `requires: [SandboxCapability]` — `chat()` errors at the call site if no
+  middleware provides a sandbox.
+- **`withSandbox(...)`** is middleware that _provides_ the `SandboxCapability`:
+  it resumes-or-creates the sandbox, bootstraps the workspace, and tears it
+  down per the lifecycle.
+
+```txt
+chat({ adapter: claudeCodeText(), middleware: [withSandbox(repoSandbox)] })
+  │
+  ├─ withSandbox.setup   → ensure sandbox (resume → restore snapshot → create + bootstrap), provide handle
+  ├─ adapter.chatStream  → spawn `claude` INSIDE the sandbox, stream its events back as AG-UI chunks
+  └─ withSandbox.onFinish→ snapshot / destroy per lifecycle
+```
+
+## Providers
+
+A provider owns the isolation primitive. All implement the same
+`SandboxProvider` / `SandboxHandle` contract, so adapters and workspaces are
+provider-agnostic.
+
+| Provider | Package | Isolation | Notes |
+| --- | --- | --- | --- |
+| Local process | `@tanstack/ai-sandbox-local-process` | none (host) | The fast, no-Docker dev loop. Trusted/dev use only. |
+| Docker | `@tanstack/ai-sandbox-docker` | container | Real isolation; commit-based snapshots, fork, resume-by-id. |
+
+```ts
+import { localProcessSandbox } from '@tanstack/ai-sandbox-local-process'
+import { dockerSandbox } from '@tanstack/ai-sandbox-docker'
+
+const dev = localProcessSandbox() // runs on your host
+const isolated = dockerSandbox({ image: 'node:22' }) // runs in a container
+```
+
+Providers declare what they support via `capabilities()`
+(`fs`, `exec`, `env`, `ports`, `backgroundProcesses`, `snapshots`,
+`networkPolicy`, `durableFilesystem`, `fork`). Code that uses an optional
+capability checks the flag first and degrades gracefully; calling an
+unsupported optional method throws `UnsupportedCapabilityError`.
+
+## Workspace
+
+`defineWorkspace()` describes what the agent sees. It is portable; each harness
+adapter projects it into its own native format.
+
+```ts
+import { defineWorkspace } from '@tanstack/ai-sandbox'
+
+defineWorkspace({
+  // Where the working tree comes from.
+  source: { type: 'git', url: 'https://github.com/owner/repo', ref: 'main' },
+  // Package manager (auto-detected from the lockfile when omitted).
+  packageManager: 'pnpm',
+  // Commands run once during bootstrap.
+  setup: ['corepack enable', 'pnpm install'],
+  // Named commands the agent can run.
+  scripts: { test: 'pnpm test', build: 'pnpm build' },
+  // Injected into the sandbox env at create/resume — never persisted to
+  // snapshots, the sandbox store, or the event log.
+  secrets: { ANTHROPIC_API_KEY: process.env.ANTHROPIC_API_KEY ?? '' },
+})
+```
+
+## Policy
+
+`defineSandboxPolicy()` is a portable allow/ask/deny description that each
+harness adapter maps onto its native permission system. Precedence is
+`deny` > `ask` > `allow`, with a configurable `default`.
+
+```ts group=overview
+import { defineSandboxPolicy, defineSandbox } from '@tanstack/ai-sandbox'
+
+const policy = defineSandboxPolicy({
+  commands: {
+    allow: ['pnpm test', 'pnpm typecheck', 'git diff'],
+    ask: ['pnpm install', 'curl *'],
+    deny: ['sudo *', 'rm -rf *'],
+  },
+  capabilities: { fileWrite: 'allow', network: 'ask' },
+  default: 'ask',
+})
+
+const sandbox = defineSandbox({ id: 'repo', provider, policy /* … */ })
+```
+
+## Tools
+
+The agent always has its own native tools (Bash, file edits, search) inside the
+sandbox. In addition, `chat()`-provided server tools are **bridged** to the
+in-sandbox agent over a host-side MCP tool-proxy: the agent calls them, each call
+is proxied back to the host where the tool's `execute()` runs (keeping its
+DB/secrets/closures), and the result is returned into the sandbox. The bridge is
+gated by a per-run bearer token; the sandbox reaches the host on `localhost`
+(local-process) or `host.docker.internal` (Docker).
+
+```ts
+chat({
+  threadId,
+  adapter: claudeCodeText('sonnet'),
+  messages,
+  tools: [getTodos.server(async ({ userId }) => db.todos.find({ userId }))],
+  middleware: [withSandbox(sandbox)],
+})
+```
+
+## File-event hooks
+
+Listen to files being created, changed, or deleted inside a sandbox — e.g. to
+watch what the agent edits as it works. The watcher is provider-agnostic: it
+uses native OS watching where the provider supports it (local-process) and falls
+back to a portable `find` poll everywhere else (Docker and other exec-only
+providers), with no extra dependencies or image changes.
+
+Hooks are declared directly on `defineSandbox({ hooks })` (sandbox-scoped, fire
+once per file event regardless of how many runs share the sandbox) or on any
+chat middleware via the `sandbox` group (run-scoped, fired per-run):
+
+```ts
+import { defineSandbox, defineChatMiddleware, withSandbox } from '@tanstack/ai-sandbox'
+import { dockerSandbox } from '@tanstack/ai-sandbox-docker'
+
+// Sandbox-scoped hooks — declared once on the definition.
+const repoSandbox = defineSandbox({
+  id: 'repo-agent',
+  provider: dockerSandbox({ image: 'node:22' }),
+  hooks: {
+    // catch-all: fires for every event
+    onFile:       (e) => console.log(`[${e.type}] ${e.path}`),
+    // type-specific variants
+    onFileCreate: (e) => console.log('created', e.path),
+    onFileChange: (e) => console.log('changed', e.path),
+    onFileDelete: (e) => console.log('deleted', e.path),
+    // lifecycle
+    onReady:   (handle) => console.log('sandbox ready', handle.id),
+    onError:   (err)    => console.error('sandbox error', err),
+    onDestroy: ()       => console.log('sandbox destroyed'),
+  },
+})
+```
+
+To handle file events inside a run-scoped middleware (e.g. for per-request
+audit logging), use the `sandbox` hook group on `defineChatMiddleware`:
+
+```ts
+const auditMiddleware = defineChatMiddleware({
+  name: 'audit',
+  // ctx is the ChatMiddlewareContext for the current run
+  sandbox: {
+    onFile:       (ctx, e) => console.log(ctx.runId, e.type, e.path),
+    onFileCreate: (ctx, e) => db.log({ run: ctx.runId, event: e }),
+  },
+})
+```
+
+Both hook groups fire server-side. The engine automatically emits one `CUSTOM`
+`sandbox.file` event per change into the stream — no extra middleware needed.
+Read it from the streamed chunks on the client:
+
+```ts
+for await (const chunk of stream) {
+  if (chunk.type === 'CUSTOM' && chunk.name === 'sandbox.file') {
+    const value = chunk.value
+    if (
+      value !== null &&
+      typeof value === 'object' &&
+      'type' in value &&
+      'path' in value
+    ) {
+      console.log('file event', value) // { type, path, timestamp }
+    }
+  }
+}
+```
+
+To disable file watching for a sandbox entirely, set `fileEvents: false`:
+
+```ts
+const sandbox = defineSandbox({
+  id: 'quiet-agent',
+  provider: dockerSandbox({ image: 'node:22' }),
+  fileEvents: false, // watcher not started; no sandbox.file events emitted
+})
+```
+
+To log sandbox internals (watcher start/stop, event dispatch, lifecycle
+transitions), enable debug logging — for everything, or just the `sandbox` category:
+
+```ts
+chat({ threadId, adapter, messages, debug: true })
+// or selectively:
+chat({ threadId, adapter, messages, debug: { sandbox: true } })
+```
+
+`watchWorkspace()` remains available as a low-level building block for using
+the watcher outside a `chat()` run:
+
+```ts
+import { watchWorkspace } from '@tanstack/ai-sandbox'
+
+const handle = await sandbox.ensure({ threadId, runId })
+const watcher = await watchWorkspace(handle, {
+  onEvent: (event) => {
+    // event.type is 'create' | 'change' | 'delete'
+    console.log(`${event.type} ${event.path}`)
+  },
+  ignore: ['.git', 'node_modules'], // default
+})
+// …do work outside a chat run…
+await watcher.stop()
+```
+
+## Lifecycle & resume
+
+```ts
+lifecycle: {
+  reuse: 'thread',          // one sandbox per threadId ('none' = fresh per run)
+  snapshot: 'after-setup',  // snapshot once bootstrapped (provider-permitting)
+  keepAlive: '30m',         // hint to keep the sandbox warm between runs
+  destroyOnComplete: false, // keep it for the next run
+}
+```
+
+A sandbox is keyed by a compound `sandboxInstanceKey` =
+`hash(threadId + sandbox.id + provider + workspaceHash + tenant?)`, so changing
+the repo, setup, image, or tenant safely starts a fresh sandbox rather than
+resuming a stale one. The ensure order is: **resume the running sandbox →
+restore the latest snapshot → create fresh and bootstrap**. Providers without
+durable disk or snapshots (e.g. ephemeral containers) re-create + re-bootstrap
+under the same identity.
+
+## Events
+
+Harness runs stream standard AG-UI `StreamChunk`s (text, tool calls, reasoning,
+run lifecycle) plus namespaced `CUSTOM` events for sandbox-specifics. Today a
+sandboxed Claude Code run emits:
+
+- `claude-code.session-id` — the resumable harness session id.
+- `file.changed` — the working-tree `git diff` after the run.
+- `sandbox.file` — emitted per file create/change/delete automatically when a
+  sandbox is active (see [File-event hooks](#file-event-hooks)).
+
+```ts
+for await (const chunk of stream) {
+  if (chunk.type === 'CUSTOM' && chunk.name === 'file.changed') {
+    const value = chunk.value
+    if (value !== null && typeof value === 'object' && 'diff' in value) {
+      console.log(value.diff)
+    }
+  }
+}
+```
+
+## Try it
+
+A runnable end-to-end demo lives at `examples/sandbox-coding-agent`: it clones a
+tiny repo with a deliberate bug into a sandbox, asks Claude Code to fix it,
+streams the agent's output, and prints the resulting diff. Run it with Docker or
+with `SANDBOX=local` on your host (requires `ANTHROPIC_API_KEY`).
+
+`examples/sandbox-issue-triage` goes further: it fetches the first open issue on
+`TanStack/ai`, clones the repo into a sandbox, runs Claude Code to triage it, and
+writes a Markdown report locally — using **file-event hooks** to log the agent's
+edits live. It ships two entrypoints, `pnpm start:process` and `pnpm start:docker`.
+
+> **Persistence-ready:** the sandbox layer ships with in-memory stores for
+> resume bookkeeping. The persistence packages (see the Persistence overview)
+> provide durable `SandboxStore` / `LockStore` implementations (and event-log
+> replay) by supplying those optional capabilities — no changes to the sandbox layer.
diff --git a/examples/sandbox-coding-agent/README.md b/examples/sandbox-coding-agent/README.md
new file mode 100644
index 000000000..78676301e
--- /dev/null
+++ b/examples/sandbox-coding-agent/README.md
@@ -0,0 +1,85 @@
+# Sandbox coding-agent demo
+
+Runs **Claude Code inside a sandbox** to fix a bug, end-to-end, through the
+public `chat()` API. Use this to manually verify the sandbox layer locally.
+
+It bootstraps a tiny git repo with a deliberate bug in `add.js`
+(`add(a, b)` returns `a - b`), asks Claude Code to fix it, streams the agent's
+output, and prints the resulting `git diff`.
+
+## Prerequisites
+
+1. **Build the workspace packages first** (examples consume built `dist`):
+
+   ```bash
+   # from the repo root
+   pnpm install
+   pnpm --filter "@tanstack/ai-sandbox..." --filter "@tanstack/ai-claude-code..." --filter "@tanstack/ai" build
+   # (or simply: pnpm build:all)
+   ```
+
+2. An **Anthropic API key**: `export ANTHROPIC_API_KEY=sk-ant-...`
+
+## Run it — Docker (isolated, recommended)
+
+Needs a running Docker daemon. The container image needs `git` + `node`
+(default `node:22`); the demo installs the `claude` CLI during bootstrap.
+
+```bash
+cd examples/sandbox-coding-agent
+pnpm start
+```
+
+Override the image (must have git + node):
+
+```bash
+SANDBOX_IMAGE=node:22 pnpm start
+```
+
+> First run pulls the image and runs `npm install -g @anthropic-ai/claude-code`, so
+> it takes a minute. Runs that share a `threadId` reuse the container (`run.ts` generates a fresh one each time).
+
+## Run it — local process (no Docker)
+
+Runs the agent directly on your host (no isolation — dev only). Requires the
+`claude` CLI, `git`, and `node` on your `PATH`. A local `claude` login works in
+place of `ANTHROPIC_API_KEY`.
+
+```bash
+cd examples/sandbox-coding-agent
+SANDBOX=local pnpm start
+```
+
+## What you should see
+
+- Streamed reasoning/text from Claude Code as it inspects and edits `add.js`.
+- `↳ [tool] …` lines as the agent uses its native tools (Read/Edit/Bash).
+- A final `===== git diff =====` block showing `- return a - b` → `+ return a + b`.
+- `✅ done`.
+
+## How it works
+
+```ts
+const sandbox = defineSandbox({
+  id: 'coding-agent-demo',
+  provider: dockerSandbox({ image: 'node:22' }), // or localProcessSandbox()
+  workspace: defineWorkspace({
+    source: { type: 'none' },
+    setup: ['npm install -g @anthropic-ai/claude-code' /* scaffold repo */],
+    secrets: { ANTHROPIC_API_KEY: process.env.ANTHROPIC_API_KEY! },
+  }),
+  lifecycle: { reuse: 'thread' },
+})
+
+chat({
+  threadId,
+  adapter: claudeCodeText('sonnet'), // declares requires:[SandboxCapability]
+  messages: [{ role: 'user', content: 'Fix the bug in add.js' }],
+  middleware: [withSandbox(sandbox)],
+})
+```
+
+`withSandbox` resumes-or-creates the sandbox and bootstraps the workspace; the
+`claudeCodeText` adapter spawns `claude -p --output-format stream-json` **inside**
+the sandbox, streams its events back as AG-UI chunks, and emits a `file.changed`
+event with the diff.
diff --git a/examples/sandbox-coding-agent/package.json b/examples/sandbox-coding-agent/package.json
new file mode 100644
index 000000000..fe393636e
--- /dev/null
+++ b/examples/sandbox-coding-agent/package.json
@@ -0,0 +1,18 @@
+{
+  "name": "@tanstack/example-sandbox-coding-agent",
+  "private": true,
+  "type": "module",
+  "scripts": {
+    "start": "tsx run.ts"
+  },
+  "dependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-claude-code": "workspace:*",
+    "@tanstack/ai-sandbox": "workspace:*",
+    "@tanstack/ai-sandbox-docker": "workspace:*",
+    "@tanstack/ai-sandbox-local-process": "workspace:*"
+  },
+  "devDependencies": {
+    "tsx": "^4.21.0"
+  }
+}
diff --git a/examples/sandbox-coding-agent/run.ts b/examples/sandbox-coding-agent/run.ts
new file mode 100644
index 000000000..6a68e779d
--- /dev/null
+++ b/examples/sandbox-coding-agent/run.ts
@@ -0,0 +1,120 @@
+/**
+ * Local end-to-end demo: run Claude Code INSIDE a sandbox to fix a bug.
+ *
+ * What it does:
+ *   1. Spins up a sandbox (Docker by default, or the local host process).
+ *   2. Bootstraps a tiny git repo containing a deliberate bug in `add.js`
+ *      (`add(a, b)` returns `a - b`).
+ *   3. Runs `chat()` with the in-sandbox `claudeCodeText` harness adapter and
+ *      asks it to fix the bug — Claude Code edits the file using its OWN native
+ *      tools inside the sandbox.
+ *   4. Streams the agent's text + tool activity, then prints the git diff it
+ *      produced.
+ *
+ * Run it: see README.md. Requires ANTHROPIC_API_KEY (or a local `claude` login
+ * for SANDBOX=local).
+ */
+import { chat } from '@tanstack/ai'
+import { claudeCodeText } from '@tanstack/ai-claude-code'
+import {
+  defineSandbox,
+  defineWorkspace,
+  withSandbox,
+} from '@tanstack/ai-sandbox'
+import { dockerSandbox } from '@tanstack/ai-sandbox-docker'
+import { localProcessSandbox } from '@tanstack/ai-sandbox-local-process'
+import type { StreamChunk } from '@tanstack/ai'
+
+const apiKey = process.env.ANTHROPIC_API_KEY
+const useLocal = process.env.SANDBOX === 'local'
+
+if (!apiKey && !useLocal) {
+  console.error(
+    'Set ANTHROPIC_API_KEY (or use SANDBOX=local with a local `claude` login).',
+  )
+  process.exit(1)
+}
+
+// Scaffold a tiny git repo with a deliberate bug in add.js.
+const scaffold = [
+  'git init -q',
+  'git config user.email demo@example.com',
+  'git config user.name tanstack-ai-demo',
+  `printf 'export function add(a, b) {\\n  return a - b\\n}\\n' > add.js`,
+  'git add -A',
+  'git commit -q -m "initial (with bug)"',
+]
+
+const provider = useLocal
+  ? // Runs on the host — needs `claude`, `git`, and `node` on your PATH.
+    localProcessSandbox()
+  : // Runs in an isolated Docker container. The image needs git + node; we
+    // install the claude CLI during setup. Override with SANDBOX_IMAGE.
+    dockerSandbox({ image: process.env.SANDBOX_IMAGE ?? 'node:22' })
+
+const setup = useLocal
+  ? scaffold
+  : ['npm install -g @anthropic-ai/claude-code', ...scaffold]
+
+const sandbox = defineSandbox({
+  id: 'coding-agent-demo',
+  provider,
+  workspace: defineWorkspace({
+    source: { type: 'none' },
+    setup,
+    // Injected into the sandbox env (never persisted to snapshots/logs).
+    secrets: apiKey ? { ANTHROPIC_API_KEY: apiKey } : {},
+  }),
+  lifecycle: { reuse: 'thread' },
+})
+
+async function main(): Promise<void> {
+  console.log(
+    `\n▶ Sandbox: ${useLocal ? 'local-process (host)' : 'docker'} — bootstrapping + running Claude Code...\n`,
+  )
+
+  const stream = chat({
+    threadId: `demo-${Date.now()}`,
+    adapter: claudeCodeText('sonnet'),
+    messages: [
+      {
+        role: 'user',
+        content:
+          'There is a bug in add.js: add(a, b) returns a - b instead of a + b. ' +
+          'Fix it so it correctly adds the two numbers.',
+      },
+    ],
+    middleware: [withSandbox(sandbox)],
+  }) as AsyncIterable<StreamChunk>
+
+  for await (const chunk of stream) {
+    const c = chunk as Record<string, unknown> & { type: string }
+    switch (c.type) {
+      case 'TEXT_MESSAGE_CONTENT':
+        process.stdout.write((c.delta as string) ?? '')
+        break
+      case 'TOOL_CALL_START':
+        console.log(`\n  ↳ [tool] ${(c.toolCallName as string) ?? ''}`)
+        break
+      case 'CUSTOM':
+        if (c.name === 'file.changed') {
+          const value = c.value as { diff?: string }
+          console.log('\n\n===== git diff =====\n' + (value.diff ?? '(none)'))
+        }
+        break
+      case 'RUN_FINISHED':
+        console.log('\n\n✅ done')
+        break
+      case 'RUN_ERROR':
+        console.error('\n\n❌ error:', c.message)
+        break
+      default:
+        break
+    }
+  }
+}
+
+main().catch((error) => {
+  console.error(error)
+  process.exit(1)
+})
diff --git a/examples/sandbox-issue-triage/README.md b/examples/sandbox-issue-triage/README.md
new file mode 100644
index 000000000..992361014
--- /dev/null
+++ b/examples/sandbox-issue-triage/README.md
@@ -0,0 +1,55 @@
+# Sandbox issue triage
+
+Fetches the first **open** issue on [`TanStack/ai`](https://github.com/TanStack/ai/issues),
+spins up a sandbox with the repo cloned in, runs **Claude Code inside the
+sandbox** to investigate and triage the issue, and writes a Markdown report to
+your local `reports/` directory.
+
+It demonstrates three pieces of the sandbox layer together:
+
+- **`@tanstack/ai-sandbox`** workspace bootstrap (`githubRepo` source → clone).
+- The **`@tanstack/ai-claude-code`** harness adapter running the `claude` CLI
+  inside the sandbox.
+- **Sandbox file-event hooks** — `defineSandbox({ hooks })` logs the agent's
+  create/change/delete events live; `withSandbox` owns the watcher and forwards
+  events to those hooks. File events are also automatically streamed to clients
+  as CUSTOM `sandbox.file` chunks. The observed events are appended to the
+  report.
+
+Two entrypoints, same logic ([`triage.ts`](./triage.ts)):
+
+| Command              | Sandbox              | Isolation            |
+| -------------------- | -------------------- | -------------------- |
+| `pnpm start:process` | local-process (host) | none — fast dev loop |
+| `pnpm start:docker`  | Docker container     | full                 |
+
+## Prerequisites
+
+- **Both:** `ANTHROPIC_API_KEY` in your environment (the local-process variant
+  can instead use an existing `claude` login).
+- **`start:process`:** `git`, `node`, and the `claude` CLI on your PATH.
+- **`start:docker`:** a running Docker daemon. The base image (`node:22`)
+  already has `git` + `node`; the `claude` CLI is installed during setup.
+- Optional: `GITHUB_TOKEN` to avoid GitHub API rate limits.
+- Optional: `SANDBOX_IMAGE` to override the Docker base image.
+
+## Run
+
+```bash
+# from the repo root, build the workspace packages first
+pnpm build
+
+cd examples/sandbox-issue-triage
+pnpm install
+
+# local-process sandbox
+ANTHROPIC_API_KEY=sk-... pnpm start:process
+
+# docker sandbox
+ANTHROPIC_API_KEY=sk-... pnpm start:docker
+```
+
+The report lands at `reports/issue-<number>-<process|docker>.md`.
+
+> Note: the workspace clones the **default branch** of `TanStack/ai` into the
+> sandbox. The first run pulls the full repo, so give it a moment.
diff --git a/examples/sandbox-issue-triage/docker.ts b/examples/sandbox-issue-triage/docker.ts
new file mode 100644
index 000000000..70b575f51
--- /dev/null
+++ b/examples/sandbox-issue-triage/docker.ts
@@ -0,0 +1,25 @@
+/**
+ * Issue triage with the DOCKER sandbox (isolated container).
+ *
+ * Prerequisites: a running Docker daemon and ANTHROPIC_API_KEY. The base image
+ * (`node:22` by default; override with SANDBOX_IMAGE) already ships git + node;
+ * we install the `claude` CLI during setup. Run: `pnpm start:docker`.
+ */
+import { dockerSandbox } from '@tanstack/ai-sandbox-docker'
+import { runTriage } from './triage'
+
+const apiKey = process.env.ANTHROPIC_API_KEY
+if (!apiKey) {
+  console.error('Set ANTHROPIC_API_KEY to run the Docker triage example.')
+  process.exit(1)
+}
+
+runTriage({
+  provider: dockerSandbox({ image: process.env.SANDBOX_IMAGE ?? 'node:22' }),
+  providerLabel: 'docker',
+  setup: ['npm install -g @anthropic-ai/claude-code'],
+  secrets: { ANTHROPIC_API_KEY: apiKey },
+}).catch((error) => {
+  console.error(error)
+  process.exit(1)
+})
diff --git a/examples/sandbox-issue-triage/package.json b/examples/sandbox-issue-triage/package.json
new file mode 100644
index 000000000..4ea3af36f
--- /dev/null
+++ b/examples/sandbox-issue-triage/package.json
@@ -0,0 +1,19 @@
+{
+  "name": "@tanstack/example-sandbox-issue-triage",
+  "private": true,
+  "type": "module",
+  "scripts": {
+    "start:process": "tsx process.ts",
+    "start:docker": "tsx docker.ts"
+  },
+  "dependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-claude-code": "workspace:*",
+    "@tanstack/ai-sandbox": "workspace:*",
+    "@tanstack/ai-sandbox-docker": "workspace:*",
+    "@tanstack/ai-sandbox-local-process": "workspace:*"
+  },
+  "devDependencies": {
+    "tsx": "^4.21.0"
+  }
+}
diff --git a/examples/sandbox-issue-triage/process.ts b/examples/sandbox-issue-triage/process.ts
new file mode 100644
index 000000000..6285cb3be
--- /dev/null
+++ b/examples/sandbox-issue-triage/process.ts
@@ -0,0 +1,21 @@
+/**
+ * Issue triage with the LOCAL-PROCESS sandbox (runs on the host — no isolation).
+ *
+ * Prerequisites on your PATH: `git`, `node`, and the `claude` CLI (logged in, or
+ * set ANTHROPIC_API_KEY). Run: `pnpm start:process`.
+ */
+import { localProcessSandbox } from '@tanstack/ai-sandbox-local-process'
+import { runTriage } from './triage'
+
+const apiKey = process.env.ANTHROPIC_API_KEY
+
+runTriage({
+  provider: localProcessSandbox(),
+  providerLabel: 'process',
+  // Host already has the tooling; nothing to install.
+  setup: [],
+  secrets: apiKey ? { ANTHROPIC_API_KEY: apiKey } : {},
+}).catch((error) => {
+  console.error(error)
+  process.exit(1)
+})
diff --git a/examples/sandbox-issue-triage/triage.ts b/examples/sandbox-issue-triage/triage.ts
new file mode 100644
index 000000000..6dd62e797
--- /dev/null
+++ b/examples/sandbox-issue-triage/triage.ts
@@ -0,0 +1,230 @@
+/**
+ * Shared logic for the issue-triage demo (used by process.ts and docker.ts).
+ *
+ * Flow:
+ *   1. Fetch the first OPEN issue on TanStack/ai from the GitHub API.
+ *   2. Spin up a sandbox with the repo cloned in.
+ *   3. Attach file-event hooks on the sandbox definition so we see the agent's edits live.
+ *   4. Run Claude Code INSIDE the sandbox to investigate the issue and write
+ *      `ISSUE-REPORT.md` at the repo root.
+ *   5. Read that report back out of the sandbox and persist it to ./reports/
+ *      on the HOST, with a header + the observed file events appended.
+ */
+import { mkdir, writeFile } from 'node:fs/promises'
+import { dirname, join } from 'node:path'
+import { fileURLToPath } from 'node:url'
+import { chat } from '@tanstack/ai'
+import { claudeCodeText } from '@tanstack/ai-claude-code'
+import {
+  defineSandbox,
+  defineWorkspace,
+  githubRepo,
+  withSandbox,
+} from '@tanstack/ai-sandbox'
+import type { FileEvent, SandboxProvider } from '@tanstack/ai-sandbox'
+import type { StreamChunk } from '@tanstack/ai'
+
+const REPO = 'TanStack/ai'
+
+export interface GitHubIssue {
+  number: number
+  title: string
+  body: string
+  url: string
+}
+
+/** Fetch the oldest open issue among the first 100 open items; pull requests (which this endpoint also returns) are skipped. */
+export async function fetchFirstOpenIssue(): Promise<GitHubIssue> {
+  const headers: Record<string, string> = {
+    Accept: 'application/vnd.github+json',
+    'User-Agent': 'tanstack-ai-sandbox-issue-triage',
+  }
+  if (process.env.GITHUB_TOKEN) {
+    headers.Authorization = `Bearer ${process.env.GITHUB_TOKEN}`
+  }
+  const res = await fetch(
+    `https://api.github.com/repos/${REPO}/issues?state=open&sort=created&direction=asc&per_page=100`,
+    { headers },
+  )
+  if (!res.ok) {
+    throw new Error(
+      `GitHub API ${res.status} ${res.statusText}: ${await res.text()}`,
+    )
+  }
+  const items = (await res.json()) as Array<{
+    number: number
+    title: string
+    body: string | null
+    html_url: string
+    pull_request?: unknown
+  }>
+  const issue = items.find((item) => item.pull_request === undefined)
+  if (!issue) throw new Error(`No open issues found on ${REPO}.`)
+  return {
+    number: issue.number,
+    title: issue.title,
+    body: issue.body ?? '',
+    url: issue.html_url,
+  }
+}
+
+export interface RunTriageOptions {
+  provider: SandboxProvider
+  /** Short label used in logs + the report filename (e.g. 'process', 'docker'). */
+  providerLabel: string
+  /** Bootstrap commands run once after the repo is cloned. */
+  setup: Array<string>
+  /** Secrets injected into the sandbox env (never persisted). */
+  secrets: Record<string, string>
+}
+
+const REPORT_FILE = 'ISSUE-REPORT.md'
+
+function buildPrompt(issue: GitHubIssue): string {
+  return [
+    `You are triaging a GitHub issue in the ${REPO} repository, which is checked`,
+    `out in your current working directory.`,
+    '',
+    `Issue #${issue.number}: ${issue.title}`,
+    `URL: ${issue.url}`,
+    '',
+    'Issue body:',
+    issue.body || '(no description provided)',
+    '',
+    'Investigate the repository to understand and triage this issue. Do NOT',
+    'change any source code — this is analysis only. When done, WRITE your',
+    `findings to a file named ${REPORT_FILE} in the current working directory`,
+    '(the repository root), as Markdown with these sections:',
+    '',
+    '## Summary',
+    '## Root cause / analysis',
+    '## Affected files (with paths)',
+    '## Proposed fix',
+    '## Confidence',
+  ].join('\n')
+}
+
+/** Run one triage end-to-end against the given provider; returns the report path. The sandbox is destroyed only on success — a thrown error skips cleanup. */
+export async function runTriage(options: RunTriageOptions): Promise<string> {
+  const issue = await fetchFirstOpenIssue()
+  console.log(
+    `\n▶ [${options.providerLabel}] Triaging issue #${issue.number}: ${issue.title}\n  ${issue.url}\n`,
+  )
+
+  // Collect file events via declarative hooks on the sandbox definition.
+  const fileEvents: Array<FileEvent> = []
+  const sandbox = defineSandbox({
+    id: `issue-triage-${options.providerLabel}`,
+    provider: options.provider,
+    workspace: defineWorkspace({
+      source: githubRepo({ repo: REPO }),
+      setup: options.setup,
+      secrets: options.secrets,
+    }),
+    lifecycle: { reuse: 'thread' },
+    hooks: {
+      onFile: (e) => {
+        fileEvents.push(e)
+        const mark = e.type === 'create' ? '+' : e.type === 'delete' ? '-' : '~'
+        console.log(`    [${mark}] ${e.type} ${e.path}`)
+      },
+    },
+  })
+
+  const threadId = `triage-${options.providerLabel}-${issue.number}`
+
+  console.log('  ⧗ Bootstrapping sandbox (clone + setup)…')
+
+  let assistantText = ''
+  const stream = chat({
+    threadId,
+    adapter: claudeCodeText('sonnet'),
+    messages: [{ role: 'user', content: buildPrompt(issue) }],
+    // withSandbox provides the handle and starts the file-event watcher;
+    // file events are forwarded to the hooks declared above.
+    middleware: [withSandbox(sandbox)],
+  }) as AsyncIterable<StreamChunk>
+
+  for await (const chunk of stream) {
+    const c = chunk as Record<string, unknown> & { type: string }
+    switch (c.type) {
+      case 'TEXT_MESSAGE_CONTENT': {
+        const delta = (c.delta as string) ?? ''
+        assistantText += delta
+        process.stdout.write(delta)
+        break
+      }
+      case 'TOOL_CALL_START':
+        console.log(`\n  ↳ [tool] ${(c.toolCallName as string) ?? ''}`)
+        break
+      case 'CUSTOM':
+        if (c.name === 'sandbox.file') {
+          const value = c.value as FileEvent
+          console.log(`  ⟳ [stream] ${value.type} ${value.path}`)
+        }
+        break
+      case 'RUN_FINISHED':
+        console.log('\n\n✅ agent finished')
+        break
+      case 'RUN_ERROR':
+        console.error('\n\n❌ error:', c.message)
+        break
+      default:
+        break
+    }
+  }
+
+  // Obtain the handle after the run (reuse:'thread' returns the same sandbox).
+  const ensureCtx = { threadId, runId: 'triage-read' }
+  const handle = await sandbox.ensure(ensureCtx)
+
+  // Read the report back out of the sandbox; fall back to the streamed text.
+  let report: string
+  try {
+    report = await handle.fs.read(REPORT_FILE)
+  } catch {
+    report = ''
+  }
+  if (report.trim() === '') {
+    report = assistantText.trim() || '_(the agent produced no report)_'
+  }
+
+  const observed =
+    fileEvents.length === 0
+      ? '_(none observed)_'
+      : fileEvents.map((e) => `- \`${e.type}\` ${e.path}`).join('\n')
+
+  const stamp = new Date().toISOString()
+  const out = [
+    `# Issue triage — ${REPO}#${issue.number}`,
+    '',
+    `- **Issue:** [${issue.title}](${issue.url})`,
+    `- **Sandbox provider:** ${options.providerLabel} (${handle.provider})`,
+    `- **Generated:** ${stamp}`,
+    '',
+    '---',
+    '',
+    report.trim(),
+    '',
+    '---',
+    '',
+    '## Observed file events (sandbox hooks)',
+    '',
+    observed,
+    '',
+  ].join('\n')
+
+  const here = dirname(fileURLToPath(import.meta.url))
+  const reportPath = join(
+    here,
+    'reports',
+    `issue-${issue.number}-${options.providerLabel}.md`,
+  )
+  await mkdir(dirname(reportPath), { recursive: true })
+  await writeFile(reportPath, out, 'utf8')
+
+  await sandbox.destroy(ensureCtx)
+
+  console.log(`\n📝 Report written to ${reportPath}\n`)
+  return reportPath
+}
diff --git a/examples/ts-react-coding-agent/README.md b/examples/ts-react-coding-agent/README.md
new file mode 100644
index 000000000..b40587d90
--- /dev/null
+++ b/examples/ts-react-coding-agent/README.md
@@ -0,0 +1,148 @@
+# TanStack AI — Coding Agent Example
+
+A React (TanStack Start) app that drives **coding-agent harnesses** through
+TanStack AI — [Claude Code](https://docs.anthropic.com/en/docs/claude-code)
+via `@tanstack/ai-claude-code`, [Codex](https://developers.openai.com/codex)
+via `@tanstack/ai-codex`,
+[Gemini CLI](https://github.com/google-gemini/gemini-cli) via
+`@tanstack/ai-gemini-cli`, and [OpenCode](https://opencode.ai) via
+`@tanstack/ai-opencode`, switchable from a dropdown.
+
+Unlike a normal chat example, the agent here runs its own loop server-side
+and executes its own tools — reading, searching, and (in Edit mode) editing
+the files in `workspace/`. Its tool activity streams into the UI as a
+timeline of resolved tool calls.
+
+## What it demonstrates
+
+- **Session resume** — the server emits the harness session id via a
+  `<agent>.session-id` custom event (`claude-code.session-id`,
+  `codex.session-id`, `gemini-cli.session-id`, `opencode.session-id`); the
+  client pins it and sends
+  it back through `forwardedProps` → `modelOptions.sessionId`, so follow-ups
+  continue the same stateful session. Switching agents resets the session.
+- **Harness tool timeline** — built-in tools (Read, Grep, Edit,
+  command_execution, ...) arrive as already-resolved tool-call parts and
+  render with their inputs/outputs. Note that Codex streams text
+  message-at-a-time (its SDK has no token deltas), while Claude Code,
+  Gemini CLI, and OpenCode stream token-by-token.
+- **Permission modes** — a Read-only/Edit toggle maps to each harness's
+  knobs: `disallowedTools` vs `permissionMode: 'acceptEdits'` for Claude
+  Code, `sandboxMode: 'read-only'` vs `'workspace-write'` for Codex, and
+  the default-deny vs `acceptEdits` permission policy for Gemini CLI and
+  OpenCode. With Claude Code, Gemini CLI, and OpenCode, ask it to run a
+  shell command and watch the denial show up in the timeline.
+- **Tool bridging** — `lookup_style_guide` is an ordinary TanStack server
+  tool the harness calls from inside its own loop (in-process MCP for
+  Claude Code; a localhost Streamable-HTTP MCP bridge for Codex,
+  Gemini CLI, and OpenCode).
+- **Sandboxed cwd** — the agent only works inside `workspace/`.
+
+## Running
+
+This is a server-spawning example: each chat turn launches the selected
+harness as a subprocess on your machine. You only need to set up the agent(s)
+you actually want to try — the others stay selectable in the UI and pop a
+setup dialog explaining what's missing (see [Runtime config detection](#runtime-config-detection)).
+
+### 1. Set up the agent(s) you want
+
+**Claude Code** ([docs](https://docs.anthropic.com/en/docs/claude-code))
+
+```bash
+npm i -g @anthropic-ai/claude-code   # install the CLI
+claude login                         # log in with your Claude subscription
+# …or, instead of `claude login`, set an API key in the server env:
+export ANTHROPIC_API_KEY=sk-ant-…
+```
+
+The adapter spawns the `claude` binary per turn, so the CLI must be on `PATH`.
+
+**Codex** ([docs](https://developers.openai.com/codex))
+
+```bash
+codex login                          # log in interactively
+# …or set an API key in the server env (forwarded as CODEX_API_KEY):
+export OPENAI_API_KEY=sk-…
+```
+
+The `codex` binary ships with `@openai/codex-sdk`, so there's nothing extra to
+install. Note: a **ChatGPT-account** login can't run codex models in headless
+mode — use an API key or an entitled account, otherwise the run fails with an
+entitlement error from OpenAI.
+
+**Gemini CLI** ([docs](https://github.com/google-gemini/gemini-cli))
+
+```bash
+npm i -g @google/gemini-cli          # ACP mode needs a current build
+gemini                               # log in with Google once (interactive)
+```
+
+Headless ACP runs can't show an interactive auth picker, so you must tell the
+adapter which method to use via `GEMINI_ACP_AUTH_METHOD` (e.g. `oauth-personal`
+for a Google login, or `gemini-api-key`). If the CLI refuses the scratch
+workspace as untrusted, also export `GEMINI_CLI_TRUST_WORKSPACE=true`. So, for
+a Google-login setup, start the dev server like this:
+
+```bash
+GEMINI_ACP_AUTH_METHOD=oauth-personal GEMINI_CLI_TRUST_WORKSPACE=true pnpm dev
+```
+
+To use an API key instead, set `GEMINI_API_KEY` and
+`GEMINI_ACP_AUTH_METHOD=gemini-api-key`.
+
+**OpenCode** ([docs](https://opencode.ai/docs))
+
+```bash
+npm i -g opencode-ai                  # install the CLI
+opencode auth login                   # authenticate a provider (interactive)
+# …or set the provider API key in the server env (this example uses Anthropic):
+export ANTHROPIC_API_KEY=sk-ant-…
+```
+
+The adapter spawns `opencode serve` per turn, so the CLI must be on `PATH`. The
+example drives the `anthropic/claude-sonnet-4-5` model; point it at a different
+`provider/model` in `src/routes/api.chat.ts` to use another provider.
+
+### 2. Install and run
+
+```bash
+pnpm install
+pnpm dev
+```
+
+### 3. Try it out
+
+Open http://localhost:3000 and try:
+
+- "What files are in this project, and what do they do?" (Read-only)
+- Switch to **Edit mode**: "Fix the bug in temperature.js" — note it
+  calls `lookup_style_guide` first.
+- "Now update todo.md to check off what you did" — same session, no
+  re-explaining.
+
+Reset the demo workspace afterwards with `git checkout -- workspace/`.
+
+## Runtime config detection
+
+Environment variables and CLI logins live on the server, not in the browser, so
+the route loader calls a `createServerFn` (`src/lib/agent-status.ts`) that
+reports which agents are actually runnable. Every agent stays selectable in the
+dropdown; picking one that isn't configured — or trying to send to it — opens a
+dialog with the exact setup steps (sourced from `AGENT_SETUP` in
+`src/lib/agents.ts`, which mirrors the instructions above). An agent counts as
+configured when:
+
+- **Claude Code** — `ANTHROPIC_API_KEY` / `CLAUDE_CODE_OAUTH_TOKEN` is set, or
+  a `~/.claude.json` login exists.
+- **Codex** — `OPENAI_API_KEY` / `CODEX_API_KEY` is set, or a
+  `~/.codex/auth.json` login exists.
+- **Gemini CLI** — `GEMINI_API_KEY` or `GEMINI_ACP_AUTH_METHOD` is set (a
+  cached Google login alone isn't enough for headless ACP, so it isn't
+  counted).
+- **OpenCode** — a provider key (`ANTHROPIC_API_KEY` / `OPENAI_API_KEY` /
+  `GEMINI_API_KEY`) is set, or an `opencode auth login` credential file
+  (`~/.local/share/opencode/auth.json`) exists.
+
+Detection runs on the server each time the loader runs, using the environment the
+server was started with — so set your env vars / log in **before** `pnpm dev` (or restart it after).
diff --git a/examples/ts-react-coding-agent/package.json b/examples/ts-react-coding-agent/package.json
new file mode 100644
index 000000000..2d8e74c09
--- /dev/null
+++ b/examples/ts-react-coding-agent/package.json
@@ -0,0 +1,39 @@
+{
+  "name": "ts-react-coding-agent",
+  "private": true,
+  "type": "module",
+  "scripts": {
+    "dev": "vite dev --port 3000",
+    "build": "vite build",
+    "serve": "vite preview",
+    "test": "exit 0",
+    "test:types": "tsc --noEmit"
+  },
+  "dependencies": {
+    "@tailwindcss/vite": "^4.1.18",
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-claude-code": "workspace:*",
+    "@tanstack/ai-client": "workspace:*",
+    "@tanstack/ai-codex": "workspace:*",
+    "@tanstack/ai-gemini-cli": "workspace:*",
+    "@tanstack/ai-opencode": "workspace:*",
+    "@tanstack/ai-react": "workspace:*",
+    "@tanstack/nitro-v2-vite-plugin": "^1.154.7",
+    "@tanstack/react-router": "^1.158.4",
+    "@tanstack/react-start": "^1.159.0",
+    "@tanstack/router-plugin": "^1.158.4",
+    "react": "^19.2.3",
+    "react-dom": "^19.2.3",
+    "tailwindcss": "^4.1.18",
+    "vite-tsconfig-paths": "^5.1.4",
+    "zod": "^4.2.0"
+  },
+  "devDependencies": {
+    "@types/node": "^24.10.1",
+    "@types/react": "^19.2.7",
+    "@types/react-dom": "^19.2.3",
+    "@vitejs/plugin-react": "^5.1.2",
+    "typescript": "5.9.3",
+    "vite": "^7.3.3"
+  }
+}
diff --git a/examples/ts-react-coding-agent/src/lib/agent-status.ts b/examples/ts-react-coding-agent/src/lib/agent-status.ts
new file mode 100644
index 000000000..d2db68e9c
--- /dev/null
+++ b/examples/ts-react-coding-agent/src/lib/agent-status.ts
@@ -0,0 +1,63 @@
+import { createServerFn } from '@tanstack/react-start'
+import type { AgentId } from './agents'
+
+/** Whether a path exists, swallowing any access error. */
+async function fileExists(filePath: string): Promise<boolean> {
+  try {
+    const { access } = await import('node:fs/promises')
+    await access(filePath)
+    return true
+  } catch {
+    return false
+  }
+}
+
+/**
+ * Reports, per agent, whether the server has credentials/config to actually
+ * run it. Environment variables aren't visible to the browser, so the client
+ * gets this through a server function (called from the route loader). Each
+ * agent counts as configured when an API key is present in the environment, or
+ * when a local CLI login exists — except Gemini CLI, whose headless ACP mode
+ * additionally needs an auth method selected up front (so we gate on the env
+ * vars the example's adapter actually reads).
+ */
+export const getAgentConfigFn = createServerFn({ method: 'GET' }).handler(
+  async (): Promise<Record<AgentId, boolean>> => {
+    const os = await import('node:os')
+    const path = await import('node:path')
+    const home = os.homedir()
+    const env = process.env
+
+    const claudeCode =
+      Boolean(env.ANTHROPIC_API_KEY) ||
+      Boolean(env.CLAUDE_CODE_OAUTH_TOKEN) ||
+      (await fileExists(path.join(home, '.claude.json')))
+
+    const codex =
+      Boolean(env.OPENAI_API_KEY) ||
+      Boolean(env.CODEX_API_KEY) ||
+      (await fileExists(path.join(home, '.codex', 'auth.json')))
+
+    // Gemini's headless ACP path needs an auth method (or an API key) chosen
+    // explicitly — a cached Google login alone isn't enough, so don't count it.
+    const geminiCli =
+      Boolean(env.GEMINI_API_KEY) || Boolean(env.GEMINI_ACP_AUTH_METHOD)
+
+    // OpenCode resolves any configured provider — count a provider API key in
+    // the environment or an `opencode auth login` credential file.
+    const opencode =
+      Boolean(env.ANTHROPIC_API_KEY) ||
+      Boolean(env.OPENAI_API_KEY) ||
+      Boolean(env.GEMINI_API_KEY) ||
+      (await fileExists(
+        path.join(home, '.local', 'share', 'opencode', 'auth.json'),
+      ))
+
+    return {
+      'claude-code': claudeCode,
+      codex,
+      'gemini-cli': geminiCli,
+      opencode,
+    }
+  },
+)
diff --git a/examples/ts-react-coding-agent/src/lib/agents.ts b/examples/ts-react-coding-agent/src/lib/agents.ts
new file mode 100644
index 000000000..00aaf9bad
--- /dev/null
+++ b/examples/ts-react-coding-agent/src/lib/agents.ts
@@ -0,0 +1,148 @@
+/**
+ * Registry of coding-agent harnesses this example can drive.
+ *
+ * Each entry maps to a harness adapter on the server (see
+ * `src/routes/api.chat.ts`): Claude Code (`@tanstack/ai-claude-code`),
+ * Codex (`@tanstack/ai-codex`), Gemini CLI (`@tanstack/ai-gemini-cli`), and
+ * OpenCode (`@tanstack/ai-opencode`).
+ */
+export const AGENTS = [
+  { id: 'claude-code', label: 'Claude Code' },
+  { id: 'codex', label: 'Codex' },
+  { id: 'gemini-cli', label: 'Gemini CLI' },
+  { id: 'opencode', label: 'OpenCode' },
+] as const
+
+/** Agent ids with a working adapter behind them. */
+export type AgentId = 'claude-code' | 'codex' | 'gemini-cli' | 'opencode'
+
+export const DEFAULT_AGENT: AgentId = 'claude-code'
+
+export function isAgentId(value: unknown): value is AgentId {
+  return (
+    value === 'claude-code' ||
+    value === 'codex' ||
+    value === 'gemini-cli' ||
+    value === 'opencode'
+  )
+}
+
+/** A single, optionally command-bearing step in an agent's setup guide. */
+export interface SetupStep {
+  text: string
+  /** A shell command to show in a copyable code block. */
+  code?: string
+}
+
+export interface AgentSetup {
+  /** Human label (mirrors the AGENTS entry). */
+  label: string
+  /** One-line description of what drives this agent. */
+  summary: string
+  /** Ordered setup steps shown in the "not configured" dialog. */
+  steps: Array<SetupStep>
+  /** Docs link for the underlying CLI/tool. */
+  docsUrl: string
+}
+
+/**
+ * Setup instructions surfaced in the UI when an agent isn't configured on the
+ * server at runtime. Mirrors the README "Running" section — keep them in sync.
+ */
+export const AGENT_SETUP: Record<AgentId, AgentSetup> = {
+  'claude-code': {
+    label: 'Claude Code',
+    summary:
+      'Drives the Claude Code CLI through @tanstack/ai-claude-code. Needs the CLI installed and authenticated on the server.',
+    steps: [
+      {
+        text: 'Install the Claude Code CLI:',
+        code: 'npm i -g @anthropic-ai/claude-code',
+      },
+      {
+        text: 'Log in interactively (uses your Claude subscription):',
+        code: 'claude login',
+      },
+      {
+        text: '…or set an API key in the server environment instead:',
+        code: 'export ANTHROPIC_API_KEY=sk-ant-…',
+      },
+      { text: 'Restart the dev server so it picks up new credentials.' },
+    ],
+    docsUrl: 'https://docs.anthropic.com/en/docs/claude-code',
+  },
+  codex: {
+    label: 'Codex',
+    summary:
+      'Drives OpenAI Codex through @tanstack/ai-codex. The codex binary ships with the SDK; you only need credentials.',
+    steps: [
+      { text: 'Log in interactively:', code: 'codex login' },
+      {
+        text: '…or set an API key in the server environment instead:',
+        code: 'export OPENAI_API_KEY=sk-…',
+      },
+      {
+        text: 'Heads up: ChatGPT-account logins cannot run codex models in headless mode — an API key or an entitled account is required.',
+      },
+      { text: 'Restart the dev server so it picks up new credentials.' },
+    ],
+    docsUrl: 'https://developers.openai.com/codex',
+  },
+  'gemini-cli': {
+    label: 'Gemini CLI',
+    summary:
+      'Drives the Gemini CLI over ACP through @tanstack/ai-gemini-cli. Needs a recent CLI and an ACP auth method chosen up front.',
+    steps: [
+      {
+        text: 'Install a current Gemini CLI (ACP mode needs a recent build):',
+        code: 'npm i -g @google/gemini-cli',
+      },
+      { text: 'Log in with Google once (interactive):', code: 'gemini' },
+      {
+        text: 'Headless ACP runs can’t show an auth picker, so tell the adapter which method to use and start the server:',
+        code: 'GEMINI_ACP_AUTH_METHOD=oauth-personal GEMINI_CLI_TRUST_WORKSPACE=true pnpm dev',
+      },
+      {
+        text: '…or use an API key instead (set GEMINI_ACP_AUTH_METHOD=gemini-api-key):',
+        code: 'export GEMINI_API_KEY=…',
+      },
+    ],
+    docsUrl: 'https://github.com/google-gemini/gemini-cli',
+  },
+  opencode: {
+    label: 'OpenCode',
+    summary:
+      'Drives OpenCode through @tanstack/ai-opencode. Needs the opencode CLI installed and a provider authenticated on the server.',
+    steps: [
+      {
+        text: 'Install the OpenCode CLI:',
+        code: 'npm i -g opencode-ai',
+      },
+      {
+        text: 'Authenticate a provider once (interactive):',
+        code: 'opencode auth login',
+      },
+      {
+        text: '…or set the provider API key in the server environment instead:',
+        code: 'export ANTHROPIC_API_KEY=sk-ant-…',
+      },
+      { text: 'Restart the dev server so it picks up new credentials.' },
+    ],
+    docsUrl: 'https://opencode.ai/docs',
+  },
+}
+
+/**
+ * What the agent is allowed to do in the workspace:
+ * - `read-only`: it can read and search, but file edits and shell commands
+ *   are blocked.
+ * - `edit`: file edits are auto-approved; with Claude Code, Gemini CLI, and
+ *   OpenCode, shell commands still get denied by each adapter's default
+ *   permission policy (a deliberate demo of the permission system), while
+ *   Codex sandboxes them inside the workspace instead.
+ */
+export type AgentMode = 'read-only' | 'edit'
+
+export function isAgentMode(value: unknown): value is AgentMode {
+  return value === 'read-only' || value === 'edit'
+}
diff --git a/examples/ts-react-coding-agent/src/lib/style-guide-tool.ts b/examples/ts-react-coding-agent/src/lib/style-guide-tool.ts
new file mode 100644
index 000000000..679356a48
--- /dev/null
+++ b/examples/ts-react-coding-agent/src/lib/style-guide-tool.ts
@@ -0,0 +1,26 @@
+import { z } from 'zod'
+import { toolDefinition } from '@tanstack/ai'
+
+/**
+ * A TanStack server tool bridged *into* the harness. The agent sees it as
+ * `mcp__tanstack__lookup_style_guide`, calls it like any built-in tool, and
+ * the adapter strips the prefix so the UI shows `lookup_style_guide`.
+ */
+export const lookupStyleGuide = toolDefinition({
+  name: 'lookup_style_guide',
+  description:
+    "Look up this project's coding style guide. Call this before writing or editing any code so your changes match the house style.",
+  inputSchema: z.object({
+    topic: z
+      .string()
+      .describe('What you are about to write, e.g. "functions", "naming"'),
+  }),
+}).server(({ topic }) => ({
+  topic,
+  rules: [
+    'Use arrow functions assigned to const, never function declarations.',
+    'Prefer single quotes and no semicolons.',
+    'Every exported function gets a one-line JSDoc comment.',
+    'Keep files under 100 lines; split modules instead of growing them.',
+  ],
+}))
diff --git a/examples/ts-react-coding-agent/src/routeTree.gen.ts b/examples/ts-react-coding-agent/src/routeTree.gen.ts
new file mode 100644
index 000000000..861dc17e2
--- /dev/null
+++ b/examples/ts-react-coding-agent/src/routeTree.gen.ts
@@ -0,0 +1,86 @@
+/* eslint-disable */
+
+// @ts-nocheck
+
+// noinspection JSUnusedGlobalSymbols
+
+// This file was automatically generated by TanStack Router.
+// You should NOT make any changes in this file as it will be overwritten.
+// Additionally, you should also exclude this file from your linter and/or formatter to prevent it from being checked or modified.
+
+import { Route as rootRouteImport } from './routes/__root'
+import { Route as IndexRouteImport } from './routes/index'
+import { Route as ApiChatRouteImport } from './routes/api.chat'
+
+const IndexRoute = IndexRouteImport.update({
+  id: '/',
+  path: '/',
+  getParentRoute: () => rootRouteImport,
+} as any)
+const ApiChatRoute = ApiChatRouteImport.update({
+  id: '/api/chat',
+  path: '/api/chat',
+  getParentRoute: () => rootRouteImport,
+} as any)
+
+export interface FileRoutesByFullPath {
+  '/': typeof IndexRoute
+  '/api/chat': typeof ApiChatRoute
+}
+export interface FileRoutesByTo {
+  '/': typeof IndexRoute
+  '/api/chat': typeof ApiChatRoute
+}
+export interface FileRoutesById {
+  __root__: typeof rootRouteImport
+  '/': typeof IndexRoute
+  '/api/chat': typeof ApiChatRoute
+}
+export interface FileRouteTypes {
+  fileRoutesByFullPath: FileRoutesByFullPath
+  fullPaths: '/' | '/api/chat'
+  fileRoutesByTo: FileRoutesByTo
+  to: '/' | '/api/chat'
+  id: '__root__' | '/' | '/api/chat'
+  fileRoutesById: FileRoutesById
+}
+export interface RootRouteChildren {
+  IndexRoute: typeof IndexRoute
+  ApiChatRoute: typeof ApiChatRoute
+}
+
+declare module '@tanstack/react-router' {
+  interface FileRoutesByPath {
+    '/': {
+      id: '/'
+      path: '/'
+      fullPath: '/'
+      preLoaderRoute: typeof IndexRouteImport
+      parentRoute: typeof rootRouteImport
+    }
+    '/api/chat': {
+      id: '/api/chat'
+      path: '/api/chat'
+      fullPath: '/api/chat'
+      preLoaderRoute: typeof ApiChatRouteImport
+      parentRoute: typeof rootRouteImport
+    }
+  }
+}
+
+const rootRouteChildren: RootRouteChildren = {
+  IndexRoute: IndexRoute,
+  ApiChatRoute: ApiChatRoute,
+}
+export const routeTree = rootRouteImport
+  ._addFileChildren(rootRouteChildren)
+  ._addFileTypes<FileRouteTypes>()
+
+import type { getRouter } from './router.tsx'
+import type { createStart } from '@tanstack/react-start'
+declare module '@tanstack/react-start' {
+  interface Register {
+    ssr: true
+    router: Awaited<ReturnType<typeof getRouter>>
+  }
+}
diff --git a/examples/ts-react-coding-agent/src/router.tsx b/examples/ts-react-coding-agent/src/router.tsx
new file mode 100644
index 000000000..ee1edab88
--- /dev/null
+++ b/examples/ts-react-coding-agent/src/router.tsx
@@ -0,0 +1,13 @@
+import { createRouter } from '@tanstack/react-router'
+
+// Import the generated route tree
+import { routeTree } from './routeTree.gen'
+
+// Create a new router instance
+export const getRouter = () => {
+  return createRouter({
+    routeTree,
+    scrollRestoration: true,
+    defaultPreloadStaleTime: 0,
+  })
+}
diff --git a/examples/ts-react-coding-agent/src/routes/__root.tsx b/examples/ts-react-coding-agent/src/routes/__root.tsx
new file mode 100644
index 000000000..950ce1bcc
--- /dev/null
+++ b/examples/ts-react-coding-agent/src/routes/__root.tsx
@@ -0,0 +1,41 @@
+import { HeadContent, Scripts, createRootRoute } from '@tanstack/react-router'
+import appCss from '../styles.css?url'
+
+export const Route = createRootRoute({
+  head: () => ({
+    meta: [
+      {
+        charSet: 'utf-8',
+      },
+      {
+        name: 'viewport',
+        content: 'width=device-width, initial-scale=1',
+      },
+      {
+        title: 'TanStack AI — Coding Agent',
+      },
+    ],
+    links: [
+      {
+        rel: 'stylesheet',
+        href: appCss,
+      },
+    ],
+  }),
+
+  shellComponent: RootDocument,
+})
+
+function RootDocument({ children }: { children: React.ReactNode }) {
+  return (
+    <html lang="en">
+      <head>
+        <HeadContent />
+      </head>
+      <body className="bg-gray-950 text-gray-100">
+        {children}
+        <Scripts />
+      </body>
+    </html>
+  )
+}
diff --git a/examples/ts-react-coding-agent/src/routes/api.chat.ts b/examples/ts-react-coding-agent/src/routes/api.chat.ts
new file mode 100644
index 000000000..6e4896936
--- /dev/null
+++ b/examples/ts-react-coding-agent/src/routes/api.chat.ts
@@ -0,0 +1,127 @@
+import path from 'node:path'
+import { createFileRoute } from '@tanstack/react-router'
+import {
+  chat,
+  chatParamsFromRequestBody,
+  toServerSentEventsResponse,
+} from '@tanstack/ai'
+import { claudeCodeText } from '@tanstack/ai-claude-code'
+import { codexText } from '@tanstack/ai-codex'
+import { geminiCliText } from '@tanstack/ai-gemini-cli'
+import { opencodeText } from '@tanstack/ai-opencode'
+import { isAgentId, isAgentMode } from '@/lib/agents'
+import { lookupStyleGuide } from '@/lib/style-guide-tool'
+import type { AgentId, AgentMode } from '@/lib/agents'
+import type { AnyTextAdapter } from '@tanstack/ai'
+
+const SYSTEM_PROMPT = `You are a coding assistant working on the small demo
+project mounted in your working directory. Before writing or editing any
+code, call the lookup_style_guide tool and follow what it says. Keep your
+answers short — the user is watching your tool activity stream by.`
+
+/** Create the harness adapter for `agentId`, scoped to `cwd` and `mode`. */
+function createAdapter(
+  agentId: AgentId,
+  mode: AgentMode,
+  cwd: string,
+): AnyTextAdapter {
+  switch (agentId) {
+    case 'claude-code':
+      return claudeCodeText('claude-opus-4-8', {
+        cwd,
+        maxTurns: 25,
+        ...(mode === 'edit'
+          ? // Auto-approve file edits. Shell commands still go through the
+            // adapter's default permission policy, which denies them with an
+            // explanatory message — watch for it in the tool timeline.
+            { permissionMode: 'acceptEdits' }
+          : // Read-only: searching and reading work, mutating tools are
+            // removed from the harness entirely.
+            { disallowedTools: ['Write', 'Edit', 'NotebookEdit', 'Bash'] }),
+      })
+    case 'codex':
+      // Codex has no per-tool permission prompts in headless mode; the
+      // sandbox is the safety boundary. Edit mode lets it write inside the
+      // workspace, read-only keeps every command non-mutating.
+      return codexText('gpt-5.1-codex', {
+        cwd,
+        sandboxMode: mode === 'edit' ? 'workspace-write' : 'read-only',
+      })
+    case 'gemini-cli':
+      return geminiCliText('gemini-3-pro-preview', {
+        cwd,
+        // Edit mode auto-approves file edits; shell commands still get
+        // rejected by the adapter's default permission policy, same demo
+        // as Claude Code above.
+        permissionMode: mode === 'edit' ? 'acceptEdits' : 'default',
+        // Headless ACP runs must select an auth method up front (the CLI
+        // can't pop an interactive picker). Set GEMINI_ACP_AUTH_METHOD to
+        // the method your CLI is set up for, e.g. `oauth-personal` (Log in
+        // with Google) or `gemini-api-key`. See this example's README.
+        ...(process.env.GEMINI_ACP_AUTH_METHOD && {
+          authMethodId: process.env.GEMINI_ACP_AUTH_METHOD,
+        }),
+      })
+    case 'opencode':
+      return opencodeText('anthropic/claude-sonnet-4-5', {
+        directory: cwd,
+        // Edit mode auto-approves file edits; shell commands still get
+        // rejected by the adapter's default permission policy, same demo
+        // as Claude Code and Gemini CLI above.
+        permissionMode: mode === 'edit' ? 'acceptEdits' : 'default',
+      })
+  }
+}
+
+export const Route = createFileRoute('/api/chat')({
+  server: {
+    handlers: {
+      POST: async ({ request }) => {
+        if (request.signal.aborted) {
+          return new Response(null, { status: 499 }) // request already aborted
+        }
+        const abortController = new AbortController() // shared by chat() and SSE
+
+        let params
+        try {
+          params = await chatParamsFromRequestBody(await request.json())
+        } catch (error) {
+          return new Response(
+            error instanceof Error ? error.message : 'Bad request',
+            { status: 400 },
+          )
+        }
+
+        // Client-sent settings arrive via forwardedProps. Validate against
+        // the allowlist — never feed client strings straight into config.
+        const agentId = isAgentId(params.forwardedProps.agentId)
+          ? params.forwardedProps.agentId
+          : 'claude-code'
+        const mode = isAgentMode(params.forwardedProps.mode)
+          ? params.forwardedProps.mode
+          : 'read-only'
+        const sessionId =
+          typeof params.forwardedProps.sessionId === 'string' &&
+          params.forwardedProps.sessionId !== ''
+            ? params.forwardedProps.sessionId
+            : undefined
+
+        // The agent only ever works inside the example's scratch workspace.
+        const cwd = path.join(process.cwd(), 'workspace')
+
+        const stream = chat({
+          adapter: createAdapter(agentId, mode, cwd),
+          messages: params.messages,
+          systemPrompts: [SYSTEM_PROMPT],
+          tools: [lookupStyleGuide],
+          modelOptions: { sessionId },
+          threadId: params.threadId,
+          runId: params.runId,
+          abortController,
+        })
+
+        return toServerSentEventsResponse(stream, { abortController })
+      },
+    },
+  },
+})
diff --git a/examples/ts-react-coding-agent/src/routes/index.tsx b/examples/ts-react-coding-agent/src/routes/index.tsx
new file mode 100644
index 000000000..27c487849
--- /dev/null
+++ b/examples/ts-react-coding-agent/src/routes/index.tsx
@@ -0,0 +1,324 @@
+import { useMemo, useState } from 'react'
+import { createFileRoute } from '@tanstack/react-router'
+import { fetchServerSentEvents, useChat } from '@tanstack/ai-react'
+import { AGENTS, AGENT_SETUP, DEFAULT_AGENT, isAgentId } from '@/lib/agents'
+import { getAgentConfigFn } from '@/lib/agent-status'
+import type { UIMessage } from '@tanstack/ai-react'
+import type { AgentId, AgentMode } from '@/lib/agents'
+
+export const Route = createFileRoute('/')({
+  component: CodingAgentPage,
+  // Env vars aren't available client-side, so the loader asks the server which
+  // agents are actually configured (see src/lib/agent-status.ts).
+  loader: () => getAgentConfigFn(),
+})
+
+function ToolCallCard({
+  part,
+}: {
+  part: Extract<UIMessage['parts'][number], { type: 'tool-call' }>
+}) {
+  const prettyArgs = useMemo(() => {
+    try {
+      return JSON.stringify(JSON.parse(part.arguments), null, 2)
+    } catch {
+      return part.arguments
+    }
+  }, [part.arguments])
+
+  const renderedOutput = useMemo(() => {
+    // Strings are shown verbatim; any other value is pretty-printed as JSON.
+    if (part.output === undefined) return undefined
+    if (typeof part.output === 'string') return part.output
+    return JSON.stringify(part.output, null, 2)
+  }, [part.output])
+
+  return (
+    <details className="my-1 rounded border border-gray-800 bg-gray-900/60 text-sm">
+      <summary className="cursor-pointer select-none px-3 py-1.5 font-mono text-amber-300">
+        🔧 {part.name}
+        <span className="ml-2 text-xs text-gray-500">
+          {renderedOutput === undefined ? part.state : 'done'}
+        </span>
+      </summary>
+      <div className="space-y-2 border-t border-gray-800 px-3 py-2">
+        <pre className="overflow-x-auto rounded bg-gray-950 p-2 text-xs text-gray-300">
+          {prettyArgs}
+        </pre>
+        {renderedOutput !== undefined && (
+          <pre className="max-h-48 overflow-auto rounded bg-gray-950 p-2 text-xs text-emerald-200">
+            {renderedOutput}
+          </pre>
+        )}
+      </div>
+    </details>
+  )
+}
+
+function Message({ message }: { message: UIMessage }) {
+  const fromUser = message.role === 'user'
+  // User messages render as a right-aligned bubble; everything else is a
+  // plain left-aligned block.
+  const bubbleClass = fromUser
+    ? 'inline-block max-w-[80%] rounded-lg bg-blue-600 px-3 py-2 text-left'
+    : 'block'
+  return (
+    <div className={fromUser ? 'text-right' : 'text-left'}>
+      <div className={bubbleClass}>
+        {message.parts.map((part, index) => {
+          // Whitespace-only text/thinking parts are not rendered.
+          if (part.type === 'text' && part.content.trim()) {
+            return (
+              <p key={index} className="whitespace-pre-wrap py-1">
+                {part.content}
+              </p>
+            )
+          }
+          if (part.type === 'thinking' && part.content.trim()) {
+            return (
+              <details key={index} className="my-1 text-sm text-gray-400">
+                <summary className="cursor-pointer select-none">
+                  💭 thinking…
+                </summary>
+                <p className="whitespace-pre-wrap border-l-2 border-gray-700 pl-3">
+                  {part.content}
+                </p>
+              </details>
+            )
+          }
+          if (part.type === 'tool-call') {
+            return <ToolCallCard key={part.id} part={part} />
+          }
+          return null
+        })}
+      </div>
+    </div>
+  )
+}
+
+function SetupDialog({
+  agentId,
+  onClose,
+}: {
+  agentId: AgentId
+  onClose: () => void
+}) {
+  const { label, summary, steps, docsUrl } = AGENT_SETUP[agentId]
+  return (
+    <div
+      className="fixed inset-0 z-50 flex items-center justify-center bg-black/60 p-4"
+      onClick={onClose}
+      role="presentation"
+    >
+      <div
+        className="max-h-[85vh] w-full max-w-lg overflow-y-auto rounded-lg border border-gray-700 bg-gray-900 p-5 shadow-xl"
+        onClick={(event) => event.stopPropagation()} // inner clicks must not close
+        role="dialog"
+        aria-modal="true"
+        aria-label={`${label} setup`}
+      >
+        <div className="mb-3 flex items-start justify-between gap-4">
+          <h2 className="text-base font-semibold">Set up {label}</h2>
+          <button
+            onClick={onClose}
+            aria-label="Close"
+            className="rounded px-2 text-gray-400 hover:bg-gray-800 hover:text-gray-100"
+          >
+            ✕
+          </button>
+        </div>
+        <p className="mb-4 text-sm text-gray-400">{summary}</p>
+        <ol className="space-y-3">
+          {steps.map((step, index) => (
+            <li key={index} className="text-sm">
+              <div className="flex gap-2">
+                <span className="select-none font-mono text-gray-500">
+                  {index + 1}.
+                </span>
+                <div className="flex-1 space-y-1.5">
+                  <p className="text-gray-200">{step.text}</p>
+                  {step.code && (
+                    <pre className="overflow-x-auto rounded bg-gray-950 px-3 py-2 text-xs text-emerald-200">
+                      <code>{step.code}</code>
+                    </pre>
+                  )}
+                </div>
+              </div>
+            </li>
+          ))}
+        </ol>
+        <div className="mt-5 flex items-center justify-between">
+          <a
+            href={docsUrl}
+            target="_blank"
+            rel="noreferrer"
+            className="text-sm text-blue-400 hover:underline"
+          >
+            Documentation ↗
+          </a>
+          <button
+            onClick={onClose}
+            className="rounded bg-blue-600 px-3 py-1.5 text-sm font-medium hover:bg-blue-500"
+          >
+            Got it
+          </button>
+        </div>
+      </div>
+    </div>
+  )
+}
+
+function CodingAgentPage() {
+  const configured = Route.useLoaderData()
+  const [agentId, setAgentId] = useState<AgentId>(DEFAULT_AGENT)
+  const [mode, setMode] = useState<AgentMode>('read-only')
+  const [sessionId, setSessionId] = useState<string | undefined>(undefined)
+  const [input, setInput] = useState('')
+  const [setupOpen, setSetupOpen] = useState(false)
+
+  const isConfigured = configured[agentId]
+
+  const body = useMemo(
+    () => ({ agentId, mode, sessionId }),
+    [agentId, mode, sessionId],
+  )
+
+  const { messages, sendMessage, isLoading, clear, error } = useChat({
+    connection: fetchServerSentEvents('/api/chat'),
+    body,
+    onCustomEvent: (eventType, data) => {
+      // Adapters pin their session via a `<agent>.session-id` CUSTOM event.
+      if (
+        eventType.endsWith('.session-id') &&
+        typeof data === 'object' &&
+        data !== null &&
+        'sessionId' in data &&
+        typeof data.sessionId === 'string'
+      ) {
+        setSessionId(data.sessionId)
+      }
+    },
+  })
+
+  const newSession = () => {
+    setSessionId(undefined)
+    clear()
+  }
+
+  const send = () => {
+    const text = input.trim()
+    if (!text || isLoading) return
+    // Don't fire a request the server can't fulfil — explain the setup instead.
+    if (!isConfigured) {
+      setSetupOpen(true)
+      return
+    }
+    setInput('')
+    void sendMessage(text)
+  }
+
+  const selectAgent = (value: string) => {
+    if (!isAgentId(value)) return
+    // Sessions aren't portable across harnesses — switching agents starts fresh.
+    setAgentId(value)
+    setSessionId(undefined)
+    // Selecting is always allowed; if it isn't set up, show how to fix it.
+    if (!configured[value]) setSetupOpen(true)
+  }
+
+  return (
+    <main className="mx-auto flex h-screen max-w-3xl flex-col px-4">
+      <header className="flex flex-wrap items-center gap-3 border-b border-gray-800 py-3">
+        <h1 className="mr-auto text-lg font-semibold">Coding Agent</h1>
+        <select
+          value={agentId}
+          onChange={(event) => selectAgent(event.target.value)}
+          className="rounded border border-gray-700 bg-gray-900 px-2 py-1 text-sm"
+        >
+          {AGENTS.map((agent) => (
+            <option key={agent.id} value={agent.id}>
+              {agent.label}
+              {configured[agent.id] ? '' : ' (not configured)'}
+            </option>
+          ))}
+        </select>
+        <select
+          value={mode}
+          onChange={(event) => setMode(event.target.value as AgentMode)}
+          className="rounded border border-gray-700 bg-gray-900 px-2 py-1 text-sm"
+        >
+          <option value="read-only">Read-only</option>
+          <option value="edit">Edit mode</option>
+        </select>
+        <button
+          onClick={newSession}
+          className="rounded border border-gray-700 px-2 py-1 text-sm hover:bg-gray-800"
+        >
+          New session
+        </button>
+      </header>
+
+      {!isConfigured && (
+        <div className="mt-2 flex items-center gap-3 rounded border border-amber-800 bg-amber-950/40 px-3 py-2 text-sm text-amber-200">
+          <span className="flex-1">
+            ⚠️ {AGENT_SETUP[agentId].label} isn’t configured on the server.
+          </span>
+          <button
+            onClick={() => setSetupOpen(true)}
+            className="rounded border border-amber-700 px-2 py-1 text-xs hover:bg-amber-900/50"
+          >
+            Setup instructions
+          </button>
+        </div>
+      )}
+
+      <div className="py-1 text-xs text-gray-500">
+        {sessionId
+          ? `Resuming session ${sessionId.slice(0, 8)}… — follow-ups send only your latest message.`
+          : `No session yet — the first reply starts one and pins it via the ${agentId}.session-id event.`}
+      </div>
+
+      <div className="flex-1 space-y-3 overflow-y-auto py-4">
+        {messages.length === 0 && (
+          <p className="text-gray-500">
+            Try: “What files are in this project, and what do they do?” — then
+            switch to Edit mode and ask it to fix the bug in{' '}
+            <code className="text-gray-400">workspace/temperature.js</code>.
+          </p>
+        )}
+        {messages.map((message) => (
+          <Message key={message.id} message={message} />
+        ))}
+        {error && (
+          <p className="rounded border border-red-800 bg-red-950/40 p-2 text-sm text-red-300">
+            {String(error)}
+          </p>
+        )}
+      </div>
+
+      <footer className="flex gap-2 border-t border-gray-800 py-3">
+        <input
+          value={input}
+          onChange={(event) => setInput(event.target.value)}
+          onKeyDown={(event) => {
+            // Enter sends, except while it is confirming an IME composition.
+            if (event.key === 'Enter' && !event.nativeEvent.isComposing) send()
+          }}
+          placeholder="Ask the agent to explore or change the workspace…"
+          className="flex-1 rounded border border-gray-700 bg-gray-900 px-3 py-2 outline-none focus:border-gray-500"
+        />
+        <button
+          onClick={send}
+          disabled={isLoading || !input.trim()}
+          className="rounded bg-blue-600 px-4 py-2 font-medium disabled:opacity-40"
+        >
+          {isLoading ? 'Working…' : 'Send'}
+        </button>
+      </footer>
+
+      {setupOpen && (
+        <SetupDialog agentId={agentId} onClose={() => setSetupOpen(false)} />
+      )}
+    </main>
+  )
+}
diff --git a/examples/ts-react-coding-agent/src/styles.css b/examples/ts-react-coding-agent/src/styles.css
new file mode 100644
index 000000000..d4b507858
--- /dev/null
+++ b/examples/ts-react-coding-agent/src/styles.css
@@ -0,0 +1 @@
+@import 'tailwindcss';
diff --git a/examples/ts-react-coding-agent/tsconfig.json b/examples/ts-react-coding-agent/tsconfig.json
new file mode 100644
index 000000000..477479fb7
--- /dev/null
+++ b/examples/ts-react-coding-agent/tsconfig.json
@@ -0,0 +1,28 @@
+{
+  "include": ["**/*.ts", "**/*.tsx"],
+  "compilerOptions": {
+    "target": "ES2022",
+    "jsx": "react-jsx",
+    "module": "ESNext",
+    "lib": ["ES2022", "DOM", "DOM.Iterable"],
+    "types": ["vite/client"],
+
+    /* Bundler mode */
+    "moduleResolution": "bundler",
+    "allowImportingTsExtensions": true,
+    "verbatimModuleSyntax": false,
+    "noEmit": true,
+
+    /* Linting */
+    "skipLibCheck": true,
+    "strict": true,
+    "noUnusedLocals": true,
+    "noUnusedParameters": true,
+    "noFallthroughCasesInSwitch": true,
+    "noUncheckedSideEffectImports": true,
+    "baseUrl": ".",
+    "paths": {
+      "@/*": ["./src/*"]
+    }
+  }
+}
diff --git a/examples/ts-react-coding-agent/vite.config.ts b/examples/ts-react-coding-agent/vite.config.ts
new file mode 100644
index 000000000..563d73a12
--- /dev/null
+++ b/examples/ts-react-coding-agent/vite.config.ts
@@ -0,0 +1,30 @@
+import { defineConfig } from 'vite'
+import { tanstackStart } from '@tanstack/react-start/plugin/vite'
+import viteReact from '@vitejs/plugin-react'
+import viteTsConfigPaths from 'vite-tsconfig-paths'
+import tailwindcss from '@tailwindcss/vite'
+import { nitroV2Plugin } from '@tanstack/nitro-v2-vite-plugin'
+
+const config = defineConfig({
+  // The Claude Agent SDK is server-only and ships its own bundled Claude
+  // Code runtime — keep it external so the SSR build resolves it at runtime
+  // via require() instead of inlining it into the rollup chunk.
+  ssr: {
+    external: ['@anthropic-ai/claude-agent-sdk'],
+  },
+  plugins: [
+    nitroV2Plugin({
+      externals: {
+        external: ['@anthropic-ai/claude-agent-sdk'], // same package as ssr.external
+      },
+    }),
+    viteTsConfigPaths({
+      projects: ['./tsconfig.json'],
+    }),
+    tailwindcss(),
+    tanstackStart(),
+    viteReact(),
+  ],
+})
+
+export default config
diff --git a/examples/ts-react-coding-agent/workspace/README.md b/examples/ts-react-coding-agent/workspace/README.md
new file mode 100644
index 000000000..47dc36b1a
--- /dev/null
+++ b/examples/ts-react-coding-agent/workspace/README.md
@@ -0,0 +1,13 @@
+# Demo Workspace
+
+This directory is the coding agent's working directory (`cwd`). Everything
+the agent reads, searches, and edits happens in here — nothing outside this
+folder is touched.
+
+Files:
+
+- `temperature.js` — a tiny conversion module with a deliberate bug for the
+  agent to find and fix (in Edit mode).
+- `todo.md` — a short task list the agent can read or update.
+
+Feel free to reset this directory with `git checkout -- .` after demos.
diff --git a/examples/ts-react-coding-agent/workspace/temperature.js b/examples/ts-react-coding-agent/workspace/temperature.js
new file mode 100644
index 000000000..4aaeb517b
--- /dev/null
+++ b/examples/ts-react-coding-agent/workspace/temperature.js
@@ -0,0 +1,12 @@
+/** Convert Celsius to Fahrenheit. */
+const celsiusToFahrenheit = (celsius) => {
+  return celsius * (9 / 5) + 32
+}
+
+/** Convert Fahrenheit to Celsius. */
+const fahrenheitToCelsius = (fahrenheit) => {
+  // BUG: should subtract 32 before scaling, not after.
+  return fahrenheit * (5 / 9) - 32
+}
+
+export { celsiusToFahrenheit, fahrenheitToCelsius }
diff --git a/examples/ts-react-coding-agent/workspace/todo.md b/examples/ts-react-coding-agent/workspace/todo.md
new file mode 100644
index 000000000..945973c61
--- /dev/null
+++ b/examples/ts-react-coding-agent/workspace/todo.md
@@ -0,0 +1,5 @@
+# Tasks
+
+- [ ] Fix the Fahrenheit → Celsius conversion bug
+- [ ] Add a Kelvin conversion helper
+- [ ] Write a usage example in the README
diff --git a/knip.json b/knip.json
index a5e8a03e1..39655ddab 100644
--- a/knip.json
+++ b/knip.json
@@ -44,6 +44,9 @@
     },
     "packages/ai-vue-ui": {
       "ignore": ["src/use-chat-context.ts"]
+    },
+    "packages/ai-persistence-postgres": {
+      "ignoreDependencies": ["pg"]
     }
   }
 }
diff --git a/packages/ai-claude-code/README.md b/packages/ai-claude-code/README.md
new file mode 100644
index 000000000..8532fcaae
--- /dev/null
+++ b/packages/ai-claude-code/README.md
@@ -0,0 +1,18 @@
+# @tanstack/ai-claude-code
+
+Claude Code harness adapter for [TanStack AI](https://tanstack.com/ai) — run [Claude Code](https://docs.anthropic.com/en/docs/claude-code) (via `@anthropic-ai/claude-agent-sdk`) as a chat backend with local tool execution, stateful coding sessions, and TanStack tool bridging.
+
+```typescript
+import { chat } from '@tanstack/ai'
+import { claudeCodeText } from '@tanstack/ai-claude-code'
+
+const stream = chat({
+  adapter: claudeCodeText('claude-opus-4-8', {
+    cwd: '/path/to/project',
+    permissionMode: 'acceptEdits',
+  }),
+  messages: [{ role: 'user', content: 'Fix the failing test.' }],
+})
+```
+
+Server-only (Node). See the [Claude Code adapter docs](https://tanstack.com/ai/latest/docs/adapters/claude-code) for sessions, tool bridging, permissions, and limitations.
diff --git a/packages/ai-claude-code/package.json b/packages/ai-claude-code/package.json
new file mode 100644
index 000000000..3fb3ed30b
--- /dev/null
+++ b/packages/ai-claude-code/package.json
@@ -0,0 +1,59 @@
+{
+  "name": "@tanstack/ai-claude-code",
+  "version": "0.1.0",
+  "description": "Claude Code harness adapter for TanStack AI — run Claude Code as a chat backend with local tool execution and stateful sessions.",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-claude-code"
+  },
+  "keywords": [
+    "ai",
+    "ai-sdk",
+    "typescript",
+    "tanstack",
+    "anthropic",
+    "claude",
+    "claude-code",
+    "harness",
+    "agent",
+    "adapter",
+    "chat",
+    "tool-calling"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "peerDependencies": {
+    "@tanstack/ai": "workspace:^",
+    "@tanstack/ai-sandbox": "workspace:^"
+  },
+  "devDependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-sandbox": "workspace:*",
+    "@tanstack/ai-sandbox-local-process": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-claude-code/src/adapters/policy-map.ts b/packages/ai-claude-code/src/adapters/policy-map.ts
new file mode 100644
index 000000000..02a04f664
--- /dev/null
+++ b/packages/ai-claude-code/src/adapters/policy-map.ts
@@ -0,0 +1,83 @@
+/**
+ * Map a portable {@link SandboxPolicy} onto Claude Code CLI permission flags.
+ *
+ * This is a best-effort, coarse mapping (the CLI's permission model is
+ * tool-level + a permission mode, not arbitrary command globs):
+ *
+ * - `default` decision → `--permission-mode`:
+ *     `'allow'` → `bypassPermissions`, `'ask'` → `acceptEdits` (closest match),
+ *     `'deny'` → `default` (in `-p` mode, prompts are auto-denied).
+ * - `capabilities.fileWrite === 'deny'` → disallow every tool in `WRITE_TOOLS`.
+ * - `capabilities.network === 'deny'` → disallow `WebFetch`,`WebSearch`.
+ * - `commands.deny` that name a bare built-in tool (e.g. `Bash`) are added to
+ *   `--disallowedTools`; fine-grained command-glob enforcement is left to the
+ *   MCP permission-prompt tool (interactive approvals).
+ *
+ * Returns the permission mode plus tool allow/deny additions; the adapter
+ * merges these with its own config.
+ */
+import type { PolicyDecision, SandboxPolicy } from '@tanstack/ai-sandbox'
+import type { ClaudeCodePermissionMode } from './text'
+
+export interface ClaudePolicyFlags {
+  permissionMode?: ClaudeCodePermissionMode // set only when policy.default is defined
+  allowedTools: Array<string> // de-duplicated by mapPolicyToClaudeFlags
+  disallowedTools: Array<string> // de-duplicated by mapPolicyToClaudeFlags
+}
+
+const WRITE_TOOLS = ['Write', 'Edit', 'MultiEdit', 'NotebookEdit'] // file-mutating built-ins
+const NETWORK_TOOLS = ['WebFetch', 'WebSearch'] // network-reaching built-ins
+const BUILTIN_TOOL_NAMES = new Set([
+  'Bash',
+  'Read',
+  'Write',
+  'Edit',
+  'MultiEdit',
+  'Glob',
+  'Grep',
+  'WebFetch',
+  'WebSearch',
+  'NotebookEdit',
+  'Task',
+])
+
+/** Translate a default policy decision into a Claude Code permission mode. */
+function modeFor(decision: PolicyDecision): ClaudeCodePermissionMode {
+  // 'ask' has no exact CLI counterpart; 'acceptEdits' is the nearest mode.
+  const modeByDecision: Record<PolicyDecision, ClaudeCodePermissionMode> = {
+    allow: 'bypassPermissions',
+    ask: 'acceptEdits',
+    deny: 'default',
+  }
+  return modeByDecision[decision]
+}
+
+/**
+ * Derive Claude Code permission flags from an optional sandbox policy.
+ */
+export function mapPolicyToClaudeFlags(
+  policy: SandboxPolicy | undefined,
+): ClaudePolicyFlags {
+  if (!policy) return { allowedTools: [], disallowedTools: [] }
+  const isBuiltin = (name: string) => BUILTIN_TOOL_NAMES.has(name)
+
+  // Capability denials come first, then explicit tool-name deny rules.
+  // Command patterns that are not bare tool names are skipped here and left
+  // to the permission-prompt tool.
+  const denied = new Set<string>([
+    ...(policy.capabilities?.fileWrite === 'deny' ? WRITE_TOOLS : []),
+    ...(policy.capabilities?.network === 'deny' ? NETWORK_TOOLS : []),
+    ...(policy.commands?.deny ?? []).filter(isBuiltin),
+  ])
+  const allowed = new Set((policy.commands?.allow ?? []).filter(isBuiltin))
+
+  const flags: ClaudePolicyFlags = {
+    allowedTools: [...allowed],
+    disallowedTools: [...denied],
+  }
+  // Leave permissionMode unset when the policy has no default decision.
+  if (policy.default !== undefined) {
+    flags.permissionMode = modeFor(policy.default)
+  }
+  return flags
+}
diff --git a/packages/ai-claude-code/src/adapters/text.ts b/packages/ai-claude-code/src/adapters/text.ts
new file mode 100644
index 000000000..5abb36416
--- /dev/null
+++ b/packages/ai-claude-code/src/adapters/text.ts
@@ -0,0 +1,466 @@
+import { EventType, normalizeSystemPrompts } from '@tanstack/ai'
+import { toRunErrorRawEvent } from '@tanstack/ai/adapter-internals'
+import { BaseTextAdapter } from '@tanstack/ai/adapters'
+import {
+  SandboxCapability,
+  approvalId,
+  buildApprovalRequestedEvent,
+  getSandbox,
+  getSandboxPolicy,
+  hostForSandbox,
+  resolveApproval,
+  spawnNdjson,
+  startHostToolBridge,
+} from '@tanstack/ai-sandbox'
+import { buildPrompt } from '../messages/prompt'
+import { translateSdkStream } from '../stream/translate'
+import { mapPolicyToClaudeFlags } from './policy-map'
+import type { ClaudePolicyFlags } from './policy-map'
+import type {
+  HostToolBridge,
+  PermissionToolResult,
+  SandboxHandle,
+  SandboxPolicy,
+} from '@tanstack/ai-sandbox'
+import type {
+  StructuredOutputOptions,
+  StructuredOutputResult,
+} from '@tanstack/ai/adapters'
+import type {
+  DefaultMessageMetadataByModality,
+  Modality,
+  StreamChunk,
+  TextOptions,
+} from '@tanstack/ai'
+import type { ClaudeCodeModel } from '../model-meta'
+import type { ClaudeCodeTextProviderOptions } from '../provider-options'
+import type { AgentSdkMessage } from '../stream/sdk-types'
+
+/** Values the adapter passes to the `claude` CLI via `--permission-mode`. */
+export type ClaudeCodePermissionMode =
+  | 'default'
+  | 'acceptEdits'
+  | 'bypassPermissions'
+  | 'plan'
+
+/** Working directory used when neither `modelOptions.cwd` nor the adapter config sets one. */
+const DEFAULT_WORKDIR = '/workspace'
+
+/**
+ * Adapter-level configuration for the Claude Code harness adapter. Several
+ * fields can be overridden per call through `modelOptions`.
+ */
+export interface ClaudeCodeTextConfig {
+  /**
+   * Working directory inside the sandbox where `claude` runs. Defaults to
+   * `/workspace` (the conventional sandbox workspace root). A per-call
+   * `modelOptions.cwd` takes precedence.
+   */
+  cwd?: string
+  /**
+   * Claude Code permission mode passed via `--permission-mode`. Defaults to
+   * `'bypassPermissions'` — a sandbox is isolated, so the agent is allowed to
+   * edit files and run commands without prompting. Tighten via `defineSandboxPolicy`
+   * / this option for less autonomy.
+   *
+   * Precedence: per-call `modelOptions.permissionMode`, then this option, then
+   * the mode derived from the sandbox policy, then the default.
+   */
+  permissionMode?: ClaudeCodePermissionMode
+  /**
+   * Built-in tools the harness may use (`--allowedTools`). Replaced by a
+   * per-call `modelOptions.allowedTools`; policy-derived tools are merged in
+   * either way.
+   */
+  allowedTools?: Array<string>
+  /**
+   * Built-in tools removed from the harness (`--disallowedTools`). Replaced by
+   * a per-call `modelOptions.disallowedTools`; policy-derived tools are merged
+   * in either way.
+   */
+  disallowedTools?: Array<string>
+  /** Extra directories the agent may access (`--add-dir`). */
+  addDirs?: Array<string>
+  /** Maximum harness-internal turns (`--max-turns`). */
+  maxTurns?: number
+  /**
+   * How `systemPrompts` from `chat()` are applied:
+   * - `'append'` (default): `--append-system-prompt` on top of the preset.
+   * - `'replace'`: `--system-prompt` as the entire system prompt.
+   */
+  systemPromptMode?: 'append' | 'replace'
+  /** Path/name of the claude executable inside the sandbox. Defaults to `claude`. */
+  claudeExecutable?: string
+  /** Emit token-level deltas via `--include-partial-messages` (default true). */
+  streamPartials?: boolean
+  /** Extra environment variables for the claude process inside the sandbox. */
+  env?: Record<string, string>
+  /** Emit a `file.changed` CUSTOM event with the git diff after the run (default true). */
+  emitDiff?: boolean
+}
+
+/** Wrap a value in POSIX single quotes so it can be embedded in the `claude …` command. */
+function q(value: string): string {
+  // Each embedded `'` closes the quoted run, emits an escaped quote, and reopens it.
+  const escaped = value.split("'").join(`'\\''`)
+  return "'" + escaped + "'"
+}
+
+/** Serialize a host tool-bridge into the JSON document passed to `--mcp-config`. */
+function bridgeToMcpConfig(bridge: HostToolBridge): string {
+  const { name, url, token } = bridge
+  // One HTTP MCP server entry, authenticated with the bridge's bearer token.
+  const server = {
+    type: 'http',
+    url,
+    headers: { Authorization: `Bearer ${token}` },
+  }
+  return JSON.stringify({ mcpServers: { [name]: server } })
+}
+
+/**
+ * Harness text adapter that runs the `claude` CLI inside a sandbox.
+ *
+ * `chatStream` builds the command line, pipes the prompt to the process via
+ * `spawnNdjson`, and translates the NDJSON output with `translateSdkStream`.
+ * `structuredOutput` is not supported and always rejects.
+ */
+export class ClaudeCodeTextAdapter<
+  TModel extends ClaudeCodeModel,
+> extends BaseTextAdapter<
+  TModel,
+  ClaudeCodeTextProviderOptions,
+  ReadonlyArray<Modality> & readonly ['text'],
+  DefaultMessageMetadataByModality,
+  ReadonlyArray<string>,
+  unknown,
+  never
+> {
+  readonly name = 'claude-code' as const
+
+  // Harness adapter: requires a sandbox to run the agent CLI inside.
+  override readonly requires = [SandboxCapability] as const
+
+  // The agent runs inside the (persistent) sandbox, so on resume the engine can
+  // re-attach to the still-running process and continue live after replaying the
+  // persisted event tail (rather than ending at replay). Live re-attach behavior
+  // is verified with the real CLI; the engine seam is unit-tested.
+  readonly supportsReattach = true
+
+  private readonly adapterConfig: ClaudeCodeTextConfig
+
+  /**
+   * @param config - Adapter-level defaults (cwd, permission mode, tools, …).
+   * @param model - Model id passed to the CLI via `--model`.
+   */
+  constructor(config: ClaudeCodeTextConfig, model: TModel) {
+    super({}, model)
+    this.adapterConfig = config
+  }
+
+  /**
+   * Resolve the sandbox handle from the call's capability context.
+   *
+   * @throws Error when no capability context is present on the options.
+   */
+  private sandboxFrom(
+    options: TextOptions<ClaudeCodeTextProviderOptions>,
+  ): SandboxHandle {
+    const ctx = options.capabilities
+    if (!ctx) {
+      throw new Error(
+        'Adapter "claude-code" requires a sandbox. Add withSandbox(defineSandbox({ ... })) ' +
+          'to chat() middleware (e.g. with the local-process or docker provider).',
+      )
+    }
+    return getSandbox(ctx)
+  }
+
+  /** Working directory: per-call `modelOptions.cwd`, then adapter config, then `/workspace`. */
+  private workdir(options: TextOptions<ClaudeCodeTextProviderOptions>): string {
+    return (
+      options.modelOptions?.cwd ?? this.adapterConfig.cwd ?? DEFAULT_WORKDIR
+    )
+  }
+
+  /**
+   * Build the `claude` command line (prompt goes via stdin, not argv).
+   *
+   * @param options - Call options; `modelOptions` supplies per-call overrides.
+   * @param resume - Session id to resume, or `undefined` for a fresh session.
+   * @param policyFlags - Tool lists / permission mode derived from the sandbox policy.
+   * @param mcpConfigJson - `--mcp-config` JSON for the host tool bridge, if one is running.
+   * @param permissionPromptTool - Fully-qualified MCP tool name for `--permission-prompt-tool`.
+   * @returns A shell command string; every free-form value is single-quoted with `q`.
+   */
+  private buildCommand(
+    options: TextOptions<ClaudeCodeTextProviderOptions>,
+    resume: string | undefined,
+    policyFlags: ClaudePolicyFlags,
+    mcpConfigJson: string | undefined,
+    permissionPromptTool: string | undefined,
+  ): string {
+    const config = this.adapterConfig
+    const modelOptions = options.modelOptions
+    const exe = config.claudeExecutable ?? 'claude'
+
+    const args: Array<string> = [
+      '-p',
+      '--output-format',
+      'stream-json',
+      '--verbose',
+      '--model',
+      q(this.model),
+    ]
+
+    if (config.streamPartials !== false) args.push('--include-partial-messages')
+    if (resume !== undefined) {
+      args.push('--resume', q(resume))
+      // `forkSession` only has meaning while resuming: continue under a new
+      // session id instead of appending to the original session.
+      if (modelOptions?.forkSession === true) args.push('--fork-session')
+    }
+
+    // Precedence: per-call modelOptions > adapter config > policy > sandbox default.
+    // NOTE(review): presumably the CLI does not consult `--permission-prompt-tool`
+    // in `bypassPermissions` mode — confirm that a policy without `default` is
+    // still enforced when this fallback applies.
+    const permissionMode =
+      modelOptions?.permissionMode ??
+      config.permissionMode ??
+      policyFlags.permissionMode ??
+      'bypassPermissions'
+    args.push('--permission-mode', q(permissionMode))
+
+    const maxTurns = modelOptions?.maxTurns ?? config.maxTurns
+    if (maxTurns !== undefined) args.push('--max-turns', String(maxTurns))
+
+    for (const dir of config.addDirs ?? []) args.push('--add-dir', q(dir))
+
+    // Per-call lists replace the configured ones; policy-derived tools are
+    // always merged in, then the union is de-duplicated.
+    const allowedTools = [
+      ...(modelOptions?.allowedTools ?? config.allowedTools ?? []),
+      ...policyFlags.allowedTools,
+    ]
+    if (allowedTools.length > 0) {
+      args.push('--allowedTools', q([...new Set(allowedTools)].join(',')))
+    }
+    const disallowedTools = [
+      ...(modelOptions?.disallowedTools ?? config.disallowedTools ?? []),
+      ...policyFlags.disallowedTools,
+    ]
+    if (disallowedTools.length > 0) {
+      args.push('--disallowedTools', q([...new Set(disallowedTools)].join(',')))
+    }
+
+    // Blank system prompts are dropped; the rest are joined into one flag value.
+    const systemPrompts = normalizeSystemPrompts(options.systemPrompts)
+      .map((prompt) => prompt.content)
+      .filter((content) => content.trim() !== '')
+    if (systemPrompts.length > 0) {
+      const joined = systemPrompts.join('\n\n')
+      const flag =
+        config.systemPromptMode === 'replace'
+          ? '--system-prompt'
+          : '--append-system-prompt'
+      args.push(flag, q(joined))
+    }
+
+    if (mcpConfigJson !== undefined) args.push('--mcp-config', q(mcpConfigJson))
+    if (permissionPromptTool !== undefined) {
+      args.push('--permission-prompt-tool', q(permissionPromptTool))
+    }
+
+    return `${exe} ${args.join(' ')}`
+  }
+
+  /**
+   * Build the permission-prompt resolver the host MCP bridge exposes to claude
+   * (`--permission-prompt-tool`). Maps claude's permission request onto the
+   * sandbox policy + client approvals; on an `ask` action with no decision yet,
+   * records an approval-requested event and denies (the client re-runs to grant).
+   *
+   * @param policy - Sandbox policy consulted by `resolveApproval`.
+   * @param approvals - Client decisions keyed by approval id, if any.
+   * @param sink - Array that collects approval-requested events for later emission.
+   * @param threadId - Thread id stamped on approval events.
+   * @param runId - Run id stamped on approval events.
+   */
+  private buildPermissionResolver(
+    policy: SandboxPolicy | undefined,
+    approvals: ReadonlyMap<string, boolean> | undefined,
+    sink: Array<StreamChunk>,
+    threadId: string,
+    runId: string,
+  ): (input: { tool_name?: string; input?: unknown }) => PermissionToolResult {
+    const writeTools = new Set(['Write', 'Edit', 'MultiEdit', 'NotebookEdit'])
+    const networkTools = new Set(['WebFetch', 'WebSearch'])
+    return (request) => {
+      const toolName = request.tool_name ?? 'tool'
+      const cmdInput = request.input
+      // Only Bash requests carry a shell command to match against command rules.
+      const command =
+        toolName === 'Bash' &&
+        cmdInput !== null &&
+        typeof cmdInput === 'object' &&
+        'command' in cmdInput &&
+        typeof (cmdInput as { command?: unknown }).command === 'string'
+          ? (cmdInput as { command: string }).command
+          : undefined
+      const capability = writeTools.has(toolName)
+        ? 'fileWrite'
+        : networkTools.has(toolName)
+          ? 'network'
+          : undefined
+      const id = approvalId({
+        provider: 'claude-code',
+        kind: command !== undefined ? 'command' : (capability ?? 'tool'),
+        target: command ?? toolName,
+      })
+      const outcome = resolveApproval({
+        policy,
+        approvals,
+        id,
+        ...(command !== undefined ? { command } : {}),
+        ...(capability !== undefined ? { capability } : {}),
+      })
+      if (outcome.needsApproval) {
+        sink.push(
+          buildApprovalRequestedEvent({
+            approvalId: id,
+            title: `Approve ${toolName}${command !== undefined ? `: ${command}` : ''}`,
+            threadId,
+            runId,
+            detail: { provider: 'claude-code', toolName },
+          }),
+        )
+        return {
+          behavior: 'deny',
+          message:
+            'Awaiting client approval. Approve in the UI and re-run to continue.',
+        }
+      }
+      return outcome.decision === 'allow'
+        ? { behavior: 'allow' }
+        : { behavior: 'deny', message: 'Denied by sandbox policy.' }
+    }
+  }
+
+  /**
+   * Run one harness turn inside the sandbox and stream the translated events.
+   *
+   * After the translated stream ends, optionally yields a `file.changed`
+   * CUSTOM event carrying `git diff` output, then any approval-requested
+   * events collected during the run. Failures are reported as a `RUN_ERROR`
+   * chunk rather than thrown; the host tool bridge is always closed.
+   */
+  async *chatStream(
+    options: TextOptions<ClaudeCodeTextProviderOptions>,
+  ): AsyncIterable<StreamChunk> {
+    const { logger } = options
+    let bridge: HostToolBridge | undefined
+    const approvalRequests: Array<StreamChunk> = []
+    try {
+      const sandbox = this.sandboxFrom(options)
+      const cwd = this.workdir(options)
+      const runId = options.runId ?? this.generateId()
+      const threadId = options.threadId ?? this.generateId()
+
+      const policy = options.capabilities
+        ? getSandboxPolicy(options.capabilities, { optional: true })
+        : undefined
+
+      // A permission-prompt tool gates the agent's native tools when a policy
+      // can `ask`/`deny` (interactive approvals).
+      const permission =
+        policy !== undefined
+          ? {
+              toolName: 'approval_prompt',
+              resolve: this.buildPermissionResolver(
+                policy,
+                options.approvals,
+                approvalRequests,
+                threadId,
+                runId,
+              ),
+            }
+          : undefined
+
+      // Bridge chat()-provided server tools (and/or the permission tool) into
+      // the sandbox over MCP.
+      const hasTools = options.tools !== undefined && options.tools.length > 0
+      if (hasTools || permission !== undefined) {
+        bridge = await startHostToolBridge(options.tools ?? [], {
+          hostForSandbox: hostForSandbox(sandbox.provider),
+          context: options.context,
+          ...(permission !== undefined ? { permission } : {}),
+          ...(options.abortController?.signal
+            ? { signal: options.abortController.signal }
+            : {}),
+        })
+      }
+
+      const { prompt, resume } = buildPrompt(
+        options.messages,
+        options.modelOptions?.sessionId,
+      )
+      const command = this.buildCommand(
+        options,
+        resume,
+        mapPolicyToClaudeFlags(policy),
+        bridge ? bridgeToMcpConfig(bridge) : undefined,
+        bridge && permission
+          ? `mcp__${bridge.name}__${permission.toolName}`
+          : undefined,
+      )
+
+      logger.request(
+        `activity=chat provider=claude-code model=${this.model} sandbox=${sandbox.provider} messages=${options.messages.length} resume=${resume ?? 'none'}`,
+        { provider: 'claude-code', model: this.model },
+      )
+
+      const rawEvents = spawnNdjson(sandbox, command, {
+        cwd,
+        input: prompt,
+        // Forward `env` only when configured; never pass an explicit `undefined`.
+        ...(this.adapterConfig.env !== undefined
+          ? { env: this.adapterConfig.env }
+          : {}),
+        ...(options.abortController?.signal
+          ? { signal: options.abortController.signal }
+          : options.request?.signal
+            ? { signal: options.request.signal }
+            : {}),
+        onNonJsonLine: (line) =>
+          logger.provider(`provider=claude-code non-json line: ${line}`, {
+            chunk: line,
+          }),
+      })
+
+      // The NDJSON events are treated as SDK messages without runtime validation.
+      async function* asMessages(): AsyncIterable<AgentSdkMessage> {
+        for await (const event of rawEvents) yield event as AgentSdkMessage
+      }
+
+      yield* translateSdkStream(asMessages(), {
+        model: this.model,
+        runId,
+        threadId,
+        ...(options.parentRunId !== undefined && {
+          parentRunId: options.parentRunId,
+        }),
+        genId: () => this.generateId(),
+        onSdkMessage: (message) =>
+          logger.provider(`provider=claude-code type=${message.type}`, {
+            chunk: message,
+          }),
+      })
+
+      // Surface the working-tree diff so UIs can render what the agent changed.
+      if (this.adapterConfig.emitDiff !== false) {
+        try {
+          const diff = await sandbox.process.exec(`git -C ${q(cwd)} diff`, {
+            cwd,
+          })
+          if (diff.exitCode === 0 && diff.stdout.trim() !== '') {
+            yield {
+              type: EventType.CUSTOM,
+              name: 'file.changed',
+              value: { path: '.', diff: diff.stdout },
+              timestamp: Date.now(),
+              threadId,
+              runId,
+            }
+          }
+        } catch {
+          // not a git repo / git unavailable — skip the diff event
+        }
+      }
+
+      // Surface any pending approval requests (policy `ask` actions awaiting a
+      // client decision); the client approves and re-runs to continue.
+      for (const event of approvalRequests) yield event
+    } catch (error: unknown) {
+      const err = error as Error & { code?: string }
+      const rawEvent = toRunErrorRawEvent(error)
+      logger.errors('claude-code.chatStream fatal', {
+        error,
+        source: 'claude-code.chatStream',
+      })
+      yield {
+        type: EventType.RUN_ERROR,
+        model: options.model,
+        timestamp: Date.now(),
+        message: err.message || 'Unknown error occurred',
+        ...(err.code !== undefined && { code: err.code }),
+        ...(rawEvent !== undefined && { rawEvent }),
+        error: {
+          message: err.message || 'Unknown error occurred',
+          ...(err.code !== undefined && { code: err.code }),
+        },
+      }
+    } finally {
+      if (bridge) await bridge.close()
+    }
+  }
+
+  /** Structured output is unsupported by this adapter; always rejects with an explanatory error. */
+  structuredOutput(
+    _options: StructuredOutputOptions<ClaudeCodeTextProviderOptions>,
+  ): Promise<StructuredOutputResult<unknown>> {
+    return Promise.reject(
+      new Error(
+        'Structured output is not yet supported by the in-sandbox Claude Code adapter. ' +
+          'Use a model adapter (e.g. anthropic) for structured output, or omit outputSchema.',
+      ),
+    )
+  }
+}
+
+/**
+ * Creates a Claude Code harness adapter that runs **inside a sandbox**.
+ *
+ * Unlike HTTP provider adapters, this is a *harness* adapter: it spawns the
+ * `claude` CLI inside the sandbox provided by `withSandbox(...)` (the adapter
+ * declares `requires: [SandboxCapability]`), streams its `stream-json` stdout
+ * back as AG-UI events, and lets Claude Code run its own agent loop and native
+ * tools (Bash, file edits, search, …) against the sandbox workspace. The
+ * sandbox image must provide the `claude` executable and `ANTHROPIC_API_KEY`
+ * in its environment (e.g. via `workspace.secrets`). The session id is
+ * surfaced via a CUSTOM `claude-code.session-id` event so follow-up calls can
+ * resume through `modelOptions.sessionId`.
+ *
+ * @param model - Model id (or CLI alias) passed to the CLI via `--model`.
+ * @param config - Adapter-level defaults; an empty config is used when omitted.
+ * @returns A new `ClaudeCodeTextAdapter` bound to `model` and `config`.
+ */
+export function claudeCodeText<TModel extends ClaudeCodeModel>(
+  model: TModel,
+  config: ClaudeCodeTextConfig = {},
+): ClaudeCodeTextAdapter<TModel> {
+  // Note the argument order flips: the constructor takes (config, model).
+  return new ClaudeCodeTextAdapter(config, model)
+}
diff --git a/packages/ai-claude-code/src/index.ts b/packages/ai-claude-code/src/index.ts
new file mode 100644
index 000000000..93f2352d9
--- /dev/null
+++ b/packages/ai-claude-code/src/index.ts
@@ -0,0 +1,21 @@
+export { ClaudeCodeTextAdapter, claudeCodeText } from './adapters/text'
+export type {
+  ClaudeCodeTextConfig,
+  ClaudeCodePermissionMode,
+} from './adapters/text'
+export type { ClaudeCodeTextProviderOptions } from './provider-options'
+export { CLAUDE_CODE_MODELS } from './model-meta'
+export type { ClaudeCodeModel, KnownClaudeCodeModel } from './model-meta'
+export {
+  SESSION_ID_EVENT,
+  BRIDGED_MCP_SERVER_NAME,
+  translateSdkStream,
+  stripMcpPrefix,
+} from './stream/translate'
+export type {
+  ClaudeCodeProviderUsageDetails,
+  TranslateContext,
+} from './stream/translate'
+export type { AgentSdkMessage } from './stream/sdk-types'
+export { buildPrompt } from './messages/prompt'
+export type { BuiltPrompt } from './messages/prompt'
diff --git a/packages/ai-claude-code/src/messages/prompt.ts b/packages/ai-claude-code/src/messages/prompt.ts
new file mode 100644
index 000000000..ca88b7f14
--- /dev/null
+++ b/packages/ai-claude-code/src/messages/prompt.ts
@@ -0,0 +1,68 @@
+import type { ModelMessage } from '@tanstack/ai'
+
+/** Result of `buildPrompt`: the prompt text plus an optional session to resume. */
+export interface BuiltPrompt {
+  /** Prompt text for the harness; includes a transcript preamble when prior turns were flattened. */
+  prompt: string
+  /** Claude Code session id to resume, when the caller threaded one through. */
+  resume?: string
+}
+
+/**
+ * Collect the plain text of a message's content. `null` yields an empty
+ * string, a string is returned as-is, and for part arrays the string content
+ * of every `text` part is concatenated (other parts contribute nothing).
+ */
+function extractText(content: ModelMessage['content']): string {
+  if (content === null) return ''
+  if (typeof content === 'string') return content
+
+  let text = ''
+  for (const part of content) {
+    if (part.type === 'text' && typeof part.content === 'string') {
+      text += part.content
+    }
+  }
+  return text
+}
+
+/**
+ * Turn TanStack chat history into the `{ prompt, resume }` pair the harness
+ * is started with.
+ *
+ * When a `sessionId` is given the harness already holds the conversation, so
+ * only the trailing user message is sent and the session is resumed. Otherwise
+ * earlier user/assistant turns that contain text are flattened into a
+ * plain-text transcript placed before the trailing user message (tool
+ * messages and text-less turns are skipped; prompts are text-only in v1).
+ *
+ * @param messages - Chat history; the last entry must be a user message with text.
+ * @param sessionId - Session to resume, or `undefined` to start fresh.
+ * @returns The prompt text and, when resuming, the session id.
+ * @throws Error when the last message is not a user message with non-blank text.
+ */
+export function buildPrompt(
+  messages: Array<ModelMessage>,
+  sessionId: string | undefined,
+): BuiltPrompt {
+  const trailing = messages.at(-1)
+  let lastUserText = ''
+  if (trailing?.role === 'user') {
+    lastUserText = extractText(trailing.content).trim()
+  }
+
+  if (lastUserText === '') {
+    throw new Error(
+      'Claude Code adapter requires a trailing user message with text content.',
+    )
+  }
+
+  if (sessionId !== undefined) {
+    return { prompt: lastUserText, resume: sessionId }
+  }
+
+  // Flatten every earlier user/assistant turn that carries text.
+  const transcript: Array<string> = []
+  for (const message of messages.slice(0, -1)) {
+    if (message.role !== 'user' && message.role !== 'assistant') continue
+    const text = extractText(message.content).trim()
+    if (text === '') continue
+    const speaker = message.role === 'user' ? 'User' : 'Assistant'
+    transcript.push(`${speaker}: ${text}`)
+  }
+
+  if (transcript.length === 0) {
+    return { prompt: lastUserText }
+  }
+
+  return {
+    prompt: `Previous conversation:\n${transcript.join('\n')}\n\n${lastUserText}`,
+  }
+}
diff --git a/packages/ai-claude-code/src/model-meta.ts b/packages/ai-claude-code/src/model-meta.ts
new file mode 100644
index 000000000..22edef39f
--- /dev/null
+++ b/packages/ai-claude-code/src/model-meta.ts
@@ -0,0 +1,21 @@
+/**
+ * Models known to work with Claude Code. The harness accepts any Anthropic
+ * model id (and the `opus` / `sonnet` / `haiku` aliases resolved by the CLI),
+ * so this list exists for autocomplete — any string is accepted via the
+ * `(string & {})` escape hatch in {@link ClaudeCodeModel}.
+ *
+ * Declared `as const` so the entries form the literal union
+ * {@link KnownClaudeCodeModel}.
+ */
+export const CLAUDE_CODE_MODELS = [
+  'claude-opus-4-8',
+  'claude-opus-4-7',
+  'claude-opus-4-6',
+  'claude-sonnet-4-6',
+  'claude-haiku-4-5',
+  'opus',
+  'sonnet',
+  'haiku',
+] as const
+
+/** Union of the literal ids listed in `CLAUDE_CODE_MODELS`. */
+export type KnownClaudeCodeModel = (typeof CLAUDE_CODE_MODELS)[number]
+
+/** Any Claude model id accepted by Claude Code; known ids get autocomplete. */
+export type ClaudeCodeModel = KnownClaudeCodeModel | (string & {})
diff --git a/packages/ai-claude-code/src/provider-options.ts b/packages/ai-claude-code/src/provider-options.ts
new file mode 100644
index 000000000..4a40803b2
--- /dev/null
+++ b/packages/ai-claude-code/src/provider-options.ts
@@ -0,0 +1,30 @@
+// Same members as `ClaudeCodePermissionMode` exported from ./adapters/text;
+// the two unions are declared independently, so keep them in sync.
+type PermissionMode = 'default' | 'acceptEdits' | 'bypassPermissions' | 'plan'
+
+/**
+ * Per-call provider options for the Claude Code adapter, passed via
+ * `modelOptions` on `chat()`.
+ */
+export interface ClaudeCodeTextProviderOptions {
+  /**
+   * Resume an existing Claude Code session. The adapter emits the session id
+   * of every run via a CUSTOM `claude-code.session-id` stream event; thread
+   * it back here to continue that session (only the latest user message is
+   * sent — the harness already holds the prior context).
+   */
+  sessionId?: string
+  /**
+   * When resuming, fork to a new session id instead of continuing the
+   * original session.
+   */
+  forkSession?: boolean
+  /** Per-call override of the configured max harness turns. */
+  maxTurns?: number
+  /** Per-call override of the configured permission mode. */
+  permissionMode?: PermissionMode
+  /**
+   * Per-call override of the allowed built-in tool list. Replaces the
+   * configured list; tools derived from the sandbox policy are still merged in.
+   */
+  allowedTools?: Array<string>
+  /**
+   * Per-call override of the disallowed built-in tool list. Replaces the
+   * configured list; tools derived from the sandbox policy are still merged in.
+   */
+  disallowedTools?: Array<string>
+  /** Per-call override of the harness working directory. */
+  cwd?: string
+}
diff --git a/packages/ai-claude-code/src/stream/sdk-types.ts b/packages/ai-claude-code/src/stream/sdk-types.ts
new file mode 100644
index 000000000..a4b40be74
--- /dev/null
+++ b/packages/ai-claude-code/src/stream/sdk-types.ts
@@ -0,0 +1,135 @@
+/**
+ * Structural subset of the `@anthropic-ai/claude-agent-sdk` message types that
+ * the stream translator consumes.
+ *
+ * These are intentionally defined structurally (rather than imported from the
+ * agent SDK) so the translator stays a pure, fixture-testable state machine
+ * and the package's public types don't depend on the agent SDK's bundled
+ * `@anthropic-ai/sdk` type imports.
+ */
+
+/**
+ * `system` message with subtype `init`: carries the session id, the model,
+ * the tool list and, optionally, the working directory.
+ */
+export interface SdkInitMessage {
+  type: 'system'
+  subtype: 'init'
+  session_id: string
+  model: string
+  tools: Array<string>
+  cwd?: string
+}
+
+/**
+ * One content block of an assistant message: text, thinking, or a tool call.
+ * The trailing open-ended member lets block types not listed here type-check.
+ */
+export type SdkAssistantContentBlock =
+  | { type: 'text'; text: string }
+  | { type: 'thinking'; thinking: string }
+  | { type: 'tool_use'; id: string; name: string; input: unknown }
+  | { type: string; [key: string]: unknown }
+
+/** Assistant message wrapper around a list of content blocks. */
+export interface SdkAssistantMessage {
+  type: 'assistant'
+  message: {
+    id?: string
+    content: Array<SdkAssistantContentBlock>
+  }
+  // NOTE(review): presumably non-null when the message comes from a nested
+  // (sub-agent) tool call — confirm against the agent SDK.
+  parent_tool_use_id: string | null
+}
+
+/** Payload of a tool result: a plain string or a list of typed blocks with optional `text`. */
+export type SdkToolResultContent =
+  | string
+  | Array<{ type: string; text?: string; [key: string]: unknown }>
+
+/**
+ * One content block of a user message. `tool_result` blocks reference the
+ * originating call through `tool_use_id`; any other block type is accepted
+ * through the open-ended member.
+ */
+export type SdkUserContentBlock =
+  | {
+      type: 'tool_result'
+      tool_use_id: string
+      content?: SdkToolResultContent
+      is_error?: boolean
+    }
+  | { type: string; [key: string]: unknown }
+
+/** User message whose content is either a plain string or a list of content blocks. */
+export interface SdkUserMessage {
+  type: 'user'
+  message: {
+    role: 'user'
+    content: string | Array<SdkUserContentBlock>
+  }
+  parent_tool_use_id: string | null
+}
+
+/** Raw Anthropic streaming events forwarded when `includePartialMessages` is set. */
+export type SdkRawStreamEvent =
+  | { type: 'message_start'; message: { id?: string } }
+  | {
+      type: 'content_block_start'
+      index: number
+      content_block: { type: string }
+    }
+  | {
+      type: 'content_block_delta'
+      index: number
+      // `text` and `thinking` are both optional; which one is set depends on `delta.type`.
+      delta: { type: string; text?: string; thinking?: string }
+    }
+  | { type: 'content_block_stop'; index: number }
+  | { type: 'message_delta' }
+  | { type: 'message_stop' }
+
+/** `stream_event` envelope wrapping a single raw streaming event. */
+export interface SdkPartialAssistantMessage {
+  type: 'stream_event'
+  event: SdkRawStreamEvent
+  parent_tool_use_id: string | null
+}
+
+/** Token counters reported by the harness; every field is optional. */
+export interface SdkUsage {
+  input_tokens?: number
+  output_tokens?: number
+  cache_read_input_tokens?: number
+  cache_creation_input_tokens?: number
+}
+
+/**
+ * `result` message: `subtype` is `success` or one of the `error_*` variants,
+ * with optional result text, error strings, usage, cost and structured output.
+ */
+export interface SdkResultMessage {
+  type: 'result'
+  subtype:
+    | 'success'
+    | 'error_max_turns'
+    | 'error_during_execution'
+    | 'error_max_budget_usd'
+    | 'error_max_structured_output_retries'
+  result?: string
+  errors?: Array<string>
+  usage?: SdkUsage
+  total_cost_usd?: number
+  structured_output?: unknown
+}
+
+/**
+ * Harness-internal system messages the translator deliberately ignores.
+ * (The real SDK union has many more members; unknown runtime types simply
+ * fall through every branch.)
+ */
+export interface SdkNoiseSystemMessage {
+  type: 'system'
+  subtype:
+    | 'status'
+    | 'permission_denied'
+    | 'plugin_install'
+    | 'session_state_changed'
+    | 'task_notification'
+    | 'task_progress'
+}
+
+/** Other harness-internal top-level message types the translator ignores. */
+export interface SdkNoiseMessage {
+  type:
+    | 'tool_progress'
+    | 'auth_status'
+    | 'rate_limit_event'
+    | 'prompt_suggestion'
+    | 'compact_boundary'
+}
+
+/**
+ * Union of every message shape declared in this module. Discriminate on
+ * `type` (and on `subtype` for `system` messages).
+ */
+export type AgentSdkMessage =
+  | SdkInitMessage
+  | SdkAssistantMessage
+  | SdkUserMessage
+  | SdkPartialAssistantMessage
+  | SdkResultMessage
+  | SdkNoiseSystemMessage
+  | SdkNoiseMessage
diff --git a/packages/ai-claude-code/src/stream/translate.ts b/packages/ai-claude-code/src/stream/translate.ts
new file mode 100644
index 000000000..67271d63c
--- /dev/null
+++ b/packages/ai-claude-code/src/stream/translate.ts
@@ -0,0 +1,483 @@
+import { EventType, buildBaseUsage } from '@tanstack/ai'
+import type { StreamChunk, TokenUsage } from '@tanstack/ai'
+import type {
+  AgentSdkMessage,
+  SdkAssistantMessage,
+  SdkPartialAssistantMessage,
+  SdkResultMessage,
+  SdkToolResultContent,
+  SdkUsage,
+  SdkUserMessage,
+} from './sdk-types'
+
+/** Name of the CUSTOM event carrying the Claude Code session id. */
+export const SESSION_ID_EVENT = 'claude-code.session-id'
+
+/** Server name used for bridged TanStack tools (model sees `mcp__tanstack__<name>`). */
+export const BRIDGED_MCP_SERVER_NAME = 'tanstack'
+
+const BRIDGED_MCP_PREFIX = `mcp__${BRIDGED_MCP_SERVER_NAME}__`
+
+/** Claude Code-specific usage details attached to RUN_FINISHED usage. */
+export type ClaudeCodeProviderUsageDetails = {
+  /** Total cost of the harness run in USD, as reported by Claude Code. */
+  totalCostUsd?: number
+}
+
+export interface TranslateContext {
+  model: string // stamped on every emitted chunk
+  runId: string // identifies the run on RUN_STARTED / RUN_FINISHED
+  threadId: string // identifies the thread on RUN_STARTED / RUN_FINISHED
+  parentRunId?: string // forwarded on RUN_STARTED only when defined
+  genId: () => string // id source wherever the SDK message supplies none
+  /** Called as soon as the harness reports its session id. */
+  onSessionId?: (sessionId: string) => void
+  /** Called for each raw SDK message, for logging. */
+  onSdkMessage?: (message: AgentSdkMessage) => void
+}
+
+/**
+ * Strip the bridged MCP server prefix so tool-call events match the TanStack
+ * tool names the application registered. Built-in harness tools (Bash, Read,
+ * Edit, ...) and foreign MCP tools pass through verbatim.
+ */
+export function stripMcpPrefix(name: string): string {
+  // Only names under the bridged server's namespace are rewritten.
+  if (!name.startsWith(BRIDGED_MCP_PREFIX)) return name
+  return name.slice(BRIDGED_MCP_PREFIX.length)
+}
+
+function stringifyToolResultContent(
+  content: SdkToolResultContent | undefined,
+): string {
+  // Strings pass through; absent content is ''; block lists join their text.
+  if (typeof content === 'string') return content
+  let out = ''
+  for (const b of content ?? []) if (typeof b.text === 'string') out += b.text
+  return out
+}
+
+function buildUsage(
+  usage: SdkUsage | undefined,
+  totalCostUsd: number | undefined,
+): TokenUsage<ClaudeCodeProviderUsageDetails> | undefined {
+  // No token counts means no usage object at all, even if a cost is known.
+  if (!usage) return undefined
+  const inputCount = usage.input_tokens ?? 0
+  const outputCount = usage.output_tokens ?? 0
+  const built = buildBaseUsage<ClaudeCodeProviderUsageDetails>({
+    promptTokens: inputCount,
+    completionTokens: outputCount,
+    totalTokens: inputCount + outputCount,
+  })
+  // Cache counters are attached only when present and non-zero.
+  const { cache_creation_input_tokens: cacheWriteTokens } = usage
+  const { cache_read_input_tokens: cachedTokens } = usage
+  if (cacheWriteTokens || cachedTokens) {
+    built.promptTokensDetails = {
+      ...(cacheWriteTokens ? { cacheWriteTokens } : {}),
+      ...(cachedTokens ? { cachedTokens } : {}),
+    }
+  }
+  // The harness-reported cost rides along as a provider-specific detail.
+  if (totalCostUsd !== undefined) built.providerUsageDetails = { totalCostUsd }
+  return built
+}
+
+/**
+ * Translate a Claude Code Agent SDK message stream into AG-UI StreamChunk
+ * events.
+ *
+ * The harness runs its own agent loop and executes its own tools, so the
+ * translation always ends with `finishReason: 'stop'` (or `'length'` /
+ * RUN_ERROR) — never `'tool_calls'`. Harness tool activity is emitted as
+ * already-resolved TOOL_CALL_START/ARGS/END + TOOL_CALL_RESULT sequences so
+ * UIs can render it, while the TanStack engine never tries to execute them.
+ *
+ * Invariant: every TOOL_CALL_START is eventually paired with a
+ * TOOL_CALL_RESULT (synthesized as `{"status":"interrupted"}` when the run
+ * ends or aborts before the harness reported one) so the engine's
+ * pending-tool-call scan on the next request never force-executes them.
+ */
+export async function* translateSdkStream(
+  sdkMessages: AsyncIterable<AgentSdkMessage>,
+  ctx: TranslateContext,
+): AsyncIterable<StreamChunk> {
+  const { model, runId, threadId, genId } = ctx
+  const now = () => Date.now()
+
+  let runStarted = false
+  /** Tool calls started but with no result yet. */
+  const unresolvedToolCalls = new Set<string>()
+  /** Anthropic message ids whose text/thinking already streamed via partials. */
+  const streamedMessageIds = new Set<string>()
+
+  // Partial-stream state
+  let partialMessageId: string | null = null
+  let partialBlockType: string | null = null
+  let partialTextMessageId: string | null = null
+  let partialTextContent = ''
+  let partialTextStarted = false
+  let partialReasoningId: string | null = null
+
+  // Emits RUN_STARTED on the first call only; later calls yield nothing.
+  function* startRun(): Generator<StreamChunk> {
+    if (!runStarted) {
+      runStarted = true
+      const { parentRunId } = ctx
+      // parentRunId is attached only when the caller supplied one.
+      const parentLink = parentRunId === undefined ? {} : { parentRunId }
+      const startedAt = now()
+      const base = { runId, threadId, model, timestamp: startedAt }
+      yield { type: EventType.RUN_STARTED, ...base, ...parentLink }
+    }
+  }
+
+  // Pairs every still-pending tool call with a synthetic "interrupted"
+  // TOOL_CALL_RESULT, then empties the pending set.
+  function* synthesizeUnresolvedResults(): Generator<StreamChunk> {
+    const content = JSON.stringify({ status: 'interrupted' })
+    for (const toolCallId of unresolvedToolCalls) {
+      const messageId = genId()
+      const timestamp = now()
+      const ids = { toolCallId, messageId }
+      const rest = { model, timestamp, content }
+      yield { type: EventType.TOOL_CALL_RESULT, ...ids, ...rest }
+    }
+    unresolvedToolCalls.clear()
+  }
+
+  // Ends the in-flight partial text message, if one was started, and then
+  // resets all partial-text state whether or not anything was emitted.
+  function* closePartialText(): Generator<StreamChunk> {
+    const openId = partialTextStarted ? partialTextMessageId : null
+    if (openId) {
+      const ended = { messageId: openId, model, timestamp: now() }
+      yield { type: EventType.TEXT_MESSAGE_END, ...ended }
+    }
+    // Clean slate for the next text block.
+    partialTextContent = ''
+    partialTextMessageId = null
+    partialTextStarted = false
+  }
+
+  // Ends the in-flight partial reasoning block, if any, under a single id.
+  // The id is cleared whether or not anything was emitted.
+  function* closePartialReasoning(): Generator<StreamChunk> {
+    const messageId = partialReasoningId
+    if (messageId) {
+      // The inner reasoning message closes first ...
+      const messageEnded = { messageId, model, timestamp: now() }
+      yield { type: EventType.REASONING_MESSAGE_END, ...messageEnded }
+      // ... then the enclosing reasoning block.
+      const blockEnded = { messageId, model, timestamp: now() }
+      yield { type: EventType.REASONING_END, ...blockEnded }
+    }
+
+    // Forget the id: thinking deltas are only forwarded while an id is set.
+    partialReasoningId = null
+  }
+
+
+  function* emitToolUse(
+    block: { id: string; name: string; input: unknown },
+  ): Generator<StreamChunk> {
+    const toolCallName = stripMcpPrefix(block.name)
+    const args = JSON.stringify(block.input ?? {})
+    // Emits an already-complete START/ARGS/END sequence. The call is tracked
+    // first so a consumer throw at any yield still gets a synthesized result.
+    unresolvedToolCalls.add(block.id)
+    yield {
+      type: EventType.TOOL_CALL_START,
+      toolCallId: block.id,
+      toolCallName,
+      toolName: toolCallName,
+      model,
+      timestamp: now(),
+    }
+    yield {
+      type: EventType.TOOL_CALL_ARGS,
+      toolCallId: block.id,
+      model,
+      timestamp: now(),
+      delta: args,
+      args,
+    }
+    yield {
+      type: EventType.TOOL_CALL_END,
+      toolCallId: block.id,
+      toolCallName,
+      toolName: toolCallName,
+      model,
+      timestamp: now(),
+      input: block.input ?? {},
+    }
+  }
+
+  // Translates one complete assistant message, block by block: text becomes a
+  // TEXT_MESSAGE_* triple, thinking a REASONING_* sequence, and tool_use a
+  // tool-call sequence.
+  function* handleAssistant(
+    message: SdkAssistantMessage,
+  ): Generator<StreamChunk> {
+    const { id: sdkMessageId, content: blocks } = message.message
+    // Prose already delivered through partial stream events is not replayed;
+    // tool_use blocks are emitted regardless.
+    const proseAlreadySent =
+      sdkMessageId !== undefined && streamedMessageIds.has(sdkMessageId)
+
+    for (const block of blocks) {
+      switch (block.type) {
+        case 'text': {
+          if (proseAlreadySent) break
+          const messageId = sdkMessageId ?? genId()
+          const { text } = block as { text: string }
+          yield {
+            type: EventType.TEXT_MESSAGE_START,
+            messageId,
+            model,
+            timestamp: now(),
+            role: 'assistant',
+          }
+          yield {
+            type: EventType.TEXT_MESSAGE_CONTENT,
+            messageId,
+            model,
+            timestamp: now(),
+            delta: text,
+            content: text,
+          }
+          yield {
+            type: EventType.TEXT_MESSAGE_END,
+            messageId,
+            model,
+            timestamp: now(),
+          }
+          break
+        }
+        case 'thinking': {
+          if (proseAlreadySent) break
+          const messageId = genId()
+          const { thinking: delta } = block as { thinking: string }
+          const stamp = () => ({ messageId, model, timestamp: now() })
+          yield { type: EventType.REASONING_START, ...stamp() }
+          yield {
+            type: EventType.REASONING_MESSAGE_START,
+            messageId,
+            role: 'reasoning' as const,
+            model,
+            timestamp: now(),
+          }
+          yield {
+            type: EventType.REASONING_MESSAGE_CONTENT,
+            messageId,
+            delta,
+            model,
+            timestamp: now(),
+          }
+          yield { type: EventType.REASONING_MESSAGE_END, ...stamp() }
+          yield { type: EventType.REASONING_END, ...stamp() }
+          break
+        }
+        case 'tool_use':
+          yield* emitToolUse(
+            block as { id: string; name: string; input: unknown },
+          )
+          break
+        // Any other block type carries nothing to translate.
+        default:
+          break
+      }
+    }
+  }
+
+  // Each tool_result block of a user message resolves its pending call and
+  // is re-emitted as a TOOL_CALL_RESULT; plain-string user content yields
+  // nothing.
+  function* handleUser(message: SdkUserMessage): Generator<StreamChunk> {
+    const { content: blocks } = message.message
+    if (typeof blocks === 'string') return
+    type ToolResult = {
+      tool_use_id: string
+      content?: SdkToolResultContent
+      is_error?: boolean
+    }
+    for (const block of blocks) {
+      if (block.type !== 'tool_result') continue
+      const { tool_use_id: toolCallId, content, is_error } = block as ToolResult
+      unresolvedToolCalls.delete(toolCallId)
+      const head = { toolCallId, messageId: genId(), model, timestamp: now() }
+      const body = { content: stringifyToolResultContent(content) }
+      // Only an explicit `is_error: true` marks the result as failed.
+      const failure = is_error === true && { state: 'output-error' as const }
+      yield { type: EventType.TOOL_CALL_RESULT, ...head, ...body, ...failure }
+    }
+  }
+
+  // Finalizes the run described by a result message. Open partial messages
+  // are closed and pending tool calls paired first; `success` and
+  // `error_max_turns` then finish the run ('stop' / 'length'), while every
+  // other subtype is reported as RUN_ERROR.
+  function* handleResult(message: SdkResultMessage): Generator<StreamChunk> {
+    yield* closePartialText()
+    yield* closePartialReasoning()
+    yield* synthesizeUnresolvedResults()
+    const { subtype, errors } = message
+    const usage = buildUsage(message.usage, message.total_cost_usd)
+    const usagePart = usage === undefined ? {} : { usage }
+    switch (subtype) {
+      case 'success':
+      case 'error_max_turns': {
+        const finishReason = subtype === 'success' ? 'stop' : 'length'
+        yield {
+          type: EventType.RUN_FINISHED,
+          runId,
+          threadId,
+          model,
+          timestamp: now(),
+          finishReason,
+          ...usagePart,
+        }
+        break
+      }
+      default: {
+        const errorMessage = errors?.length
+          ? errors.join('; ')
+          : `Claude Code run failed: ${subtype}`
+        yield {
+          type: EventType.RUN_ERROR,
+          model,
+          timestamp: now(),
+          message: errorMessage,
+          code: subtype,
+          error: { message: errorMessage, code: subtype },
+        }
+      }
+    }
+  }
+
+  function* handleStreamEvent(
+    message: SdkPartialAssistantMessage,
+  ): Generator<StreamChunk> { // translates one partial-stream event, updating the partial-stream state above
+    const event = message.event
+    if (event.type === 'message_start') {
+      partialMessageId = event.message.id ?? genId()
+      streamedMessageIds.add(partialMessageId) // handleAssistant skips text/thinking blocks of ids recorded here
+    } else if (event.type === 'content_block_start') {
+      partialBlockType = event.content_block.type // remembered so content_block_stop knows what to close
+      if (partialBlockType === 'text') {
+        partialTextMessageId = partialMessageId ?? genId()
+        partialTextContent = '' // the accumulated text restarts with every text block
+        if (!partialTextStarted) {
+          partialTextStarted = true
+          yield {
+            type: EventType.TEXT_MESSAGE_START,
+            messageId: partialTextMessageId,
+            model,
+            timestamp: now(),
+            role: 'assistant',
+          }
+        }
+      } else if (partialBlockType === 'thinking') {
+        partialReasoningId = genId() // reasoning ids are always generated, never taken from the SDK
+        yield {
+          type: EventType.REASONING_START,
+          messageId: partialReasoningId,
+          model,
+          timestamp: now(),
+        }
+        yield {
+          type: EventType.REASONING_MESSAGE_START,
+          messageId: partialReasoningId,
+          role: 'reasoning' as const,
+          model,
+          timestamp: now(),
+        }
+      }
+    } else if (event.type === 'content_block_delta') {
+      if (
+        event.delta.type === 'text_delta' &&
+        partialTextStarted &&
+        partialTextMessageId &&
+        typeof event.delta.text === 'string'
+      ) {
+        partialTextContent += event.delta.text // `content` below is the text so far, `delta` the increment
+        yield {
+          type: EventType.TEXT_MESSAGE_CONTENT,
+          messageId: partialTextMessageId,
+          model,
+          timestamp: now(),
+          delta: event.delta.text,
+          content: partialTextContent,
+        }
+      } else if (
+        event.delta.type === 'thinking_delta' &&
+        partialReasoningId &&
+        typeof event.delta.thinking === 'string'
+      ) {
+        yield {
+          type: EventType.REASONING_MESSAGE_CONTENT,
+          messageId: partialReasoningId,
+          delta: event.delta.thinking,
+          model,
+          timestamp: now(),
+        }
+      }
+    } else if (event.type === 'content_block_stop') {
+      if (partialBlockType === 'text') {
+        yield* closePartialText()
+      } else if (partialBlockType === 'thinking') {
+        yield* closePartialReasoning()
+      }
+      partialBlockType = null // no block is open until the next content_block_start
+    }
+  }
+
+  try {
+    for await (const sdkMessage of sdkMessages) {
+      ctx.onSdkMessage?.(sdkMessage)
+      if (sdkMessage.type === 'system' && sdkMessage.subtype === 'init') {
+        yield* startRun()
+        ctx.onSessionId?.(sdkMessage.session_id)
+        yield {
+          type: EventType.CUSTOM,
+          model,
+          timestamp: now(),
+          name: SESSION_ID_EVENT,
+          value: {
+            sessionId: sdkMessage.session_id,
+            model: sdkMessage.model,
+            tools: sdkMessage.tools,
+          },
+        }
+        continue
+      }
+      // Anything before init still needs RUN_STARTED first.
+      yield* startRun()
+      if (sdkMessage.type === 'stream_event') {
+        if (sdkMessage.parent_tool_use_id !== null) continue
+        yield* handleStreamEvent(sdkMessage)
+      } else if (sdkMessage.type === 'assistant') {
+        if (sdkMessage.parent_tool_use_id !== null) continue
+        yield* handleAssistant(sdkMessage)
+      } else if (sdkMessage.type === 'user') {
+        if (sdkMessage.parent_tool_use_id !== null) continue
+        yield* handleUser(sdkMessage)
+      } else if (sdkMessage.type === 'result') {
+        yield* handleResult(sdkMessage)
+      }
+      // All other SDK message types (status, hooks, notifications, ...) are
+      // harness-internal and intentionally ignored.
+    }
+    // No `result` arrived before the source ended? Still close open messages
+    // and pair pending tool calls; after a normal `result` these are no-ops.
+    yield* closePartialText()
+    yield* closePartialReasoning()
+    yield* synthesizeUnresolvedResults()
+  } catch (error) {
+    // Abort or SDK failure: pair started tool calls with a synthetic result,
+    // then let the adapter surface the error as RUN_ERROR.
+    yield* synthesizeUnresolvedResults()
+    throw error
+  }
+}
diff --git a/packages/ai-claude-code/tests/policy-map.test.ts b/packages/ai-claude-code/tests/policy-map.test.ts
new file mode 100644
index 000000000..d2d5f52d5
--- /dev/null
+++ b/packages/ai-claude-code/tests/policy-map.test.ts
@@ -0,0 +1,56 @@
+import { describe, expect, it } from 'vitest'
+import { defineSandboxPolicy } from '@tanstack/ai-sandbox'
+import { mapPolicyToClaudeFlags } from '../src/adapters/policy-map'
+
+describe('mapPolicyToClaudeFlags', () => {
+  it('returns empty additions for no policy', () => {
+    const flags = mapPolicyToClaudeFlags(undefined)
+    expect(flags).toEqual({ allowedTools: [], disallowedTools: [] })
+  })
+
+  it('maps the default decision to a permission mode', () => {
+    expect(
+      mapPolicyToClaudeFlags(defineSandboxPolicy({ default: 'allow' }))
+        .permissionMode,
+    ).toBe('bypassPermissions')
+    expect(
+      mapPolicyToClaudeFlags(defineSandboxPolicy({ default: 'deny' }))
+        .permissionMode,
+    ).toBe('default')
+    expect(
+      mapPolicyToClaudeFlags(defineSandboxPolicy({ default: 'ask' }))
+        .permissionMode,
+    ).toBe('acceptEdits')
+  })
+
+  it('disallows write tools when fileWrite is denied', () => {
+    const flags = mapPolicyToClaudeFlags(
+      defineSandboxPolicy({ capabilities: { fileWrite: 'deny' } }),
+    )
+    expect(flags.disallowedTools).toEqual(
+      expect.arrayContaining(['Write', 'Edit', 'MultiEdit']),
+    )
+  })
+
+  it('disallows network tools when network is denied', () => {
+    const flags = mapPolicyToClaudeFlags(
+      defineSandboxPolicy({ capabilities: { network: 'deny' } }),
+    )
+    expect(flags.disallowedTools).toEqual(
+      expect.arrayContaining(['WebFetch', 'WebSearch']),
+    )
+  })
+
+  it('maps tool-name command rules to allow/deny lists', () => {
+    const flags = mapPolicyToClaudeFlags(
+      defineSandboxPolicy({
+        commands: { allow: ['Read'], deny: ['Bash', 'pnpm *'] },
+      }),
+    )
+    // 'Bash' is a built-in tool name -> disallowed; 'pnpm *' is a command glob,
+    // not a tool name, so it's left to the permission-prompt tool.
+    expect(flags.allowedTools).toContain('Read')
+    expect(flags.disallowedTools).toContain('Bash')
+    expect(flags.disallowedTools).not.toContain('pnpm *')
+  })
+})
diff --git a/packages/ai-claude-code/tests/prompt.test.ts b/packages/ai-claude-code/tests/prompt.test.ts
new file mode 100644
index 000000000..6e8dfcdf3
--- /dev/null
+++ b/packages/ai-claude-code/tests/prompt.test.ts
@@ -0,0 +1,97 @@
+import { describe, expect, it } from 'vitest'
+import { buildPrompt } from '../src/messages/prompt'
+import type { ModelMessage } from '@tanstack/ai'
+
+/** Builds a user-role message around the given content. */
+function user(content: ModelMessage['content']): ModelMessage {
+  return { role: 'user', content }
+}
+/** Builds an assistant-role message around the given content. */
+function assistant(content: ModelMessage['content']): ModelMessage {
+  return { role: 'assistant', content }
+}
+
+describe('buildPrompt', () => {
+  it('resumes with only the last user message when sessionId is provided', () => {
+    const result = buildPrompt(
+      [
+        user('first question'),
+        assistant('first answer'),
+        user('follow-up question'),
+      ],
+      'sess-1',
+    )
+    expect(result).toEqual({
+      prompt: 'follow-up question',
+      resume: 'sess-1',
+    })
+  })
+
+  it('throws when sessionId is provided but there is no trailing user message', () => {
+    expect(() => buildPrompt([user('q'), assistant('a')], 'sess-1')).toThrow(
+      /user message/i,
+    )
+  })
+
+  it('sends a single user message as-is for a fresh session', () => {
+    expect(buildPrompt([user('hello')], undefined)).toEqual({
+      prompt: 'hello',
+    })
+  })
+
+  it('flattens prior turns into a transcript preamble for fresh multi-turn history', () => {
+    const { prompt, resume } = buildPrompt(
+      [user('What is 2+2?'), assistant('4'), user('And times 3?')],
+      undefined,
+    )
+    expect(resume).toBeUndefined()
+    expect(prompt).toBe(
+      'Previous conversation:\nUser: What is 2+2?\nAssistant: 4\n\nAnd times 3?',
+    )
+  })
+
+  it('skips tool messages and assistant tool-call-only turns when flattening', () => {
+    const messages: Array<ModelMessage> = [
+      user('list files'),
+      {
+        role: 'assistant',
+        content: null,
+        toolCalls: [
+          {
+            id: 't1',
+            type: 'function',
+            function: { name: 'ls', arguments: '{}' },
+          },
+        ],
+      } as unknown as ModelMessage,
+      { role: 'tool', content: 'file-a', toolCallId: 't1' },
+      assistant('There is one file.'),
+      user('thanks, which one?'),
+    ]
+    const { prompt } = buildPrompt(messages, undefined)
+    expect(prompt).toBe(
+      'Previous conversation:\nUser: list files\nAssistant: There is one file.\n\nthanks, which one?',
+    )
+  })
+
+  it('extracts text from content-part arrays and ignores non-text parts', () => {
+    const { prompt } = buildPrompt(
+      [
+        user([
+          { type: 'text', content: 'describe ' },
+          {
+            type: 'image',
+            source: { type: 'url', url: 'https://x/y.png' },
+          } as never,
+          { type: 'text', content: 'this' },
+        ] as ModelMessage['content']),
+      ],
+      undefined,
+    )
+    expect(prompt).toBe('describe this')
+  })
+
+  it('throws when there is no usable user content at all', () => {
+    expect(() => buildPrompt([], undefined)).toThrow(/user message/i)
+  })
+})
diff --git a/packages/ai-claude-code/tests/text-adapter.test.ts b/packages/ai-claude-code/tests/text-adapter.test.ts
new file mode 100644
index 000000000..8983050d3
--- /dev/null
+++ b/packages/ai-claude-code/tests/text-adapter.test.ts
@@ -0,0 +1,159 @@
+/**
+ * Deterministic test of the in-sandbox Claude Code adapter.
+ *
+ * Instead of the real `claude` CLI (nondeterministic, needs an API key — see
+ * the gated live smoke in testing/e2e), this runs a FAKE agent CLI: a tiny node
+ * script that reads the prompt from stdin and emits canned `stream-json`
+ * messages on stdout, exactly as `claude -p --output-format stream-json` would.
+ * It runs inside a real local-process sandbox, exercising the full
+ * spawn → stdout NDJSON → translate → StreamChunk path.
+ */
+import { afterAll, describe, expect, it } from 'vitest'
+import * as fsp from 'node:fs/promises'
+import * as os from 'node:os'
+import * as path from 'node:path'
+import { localProcessSandbox } from '@tanstack/ai-sandbox-local-process'
+import { SandboxCapability } from '@tanstack/ai-sandbox'
+import { claudeCodeText } from '../src/index'
+import type { InternalLogger } from '@tanstack/ai/adapter-internals'
+import type { CapabilityContext, StreamChunk } from '@tanstack/ai'
+import type { SandboxHandle } from '@tanstack/ai-sandbox'
+
+const baseDir = path.join(os.tmpdir(), `tanstack-ai-cc-test-${Date.now()}`)
+const provider = localProcessSandbox({ baseDir, removeOnDestroy: true })
+
+afterAll(async () => {
+  await fsp.rm(baseDir, { recursive: true, force: true })
+})
+
+// A stand-in for the `claude` CLI: ignores its flags, reads the prompt from
+// stdin, then emits stream-json (system/init → assistant text → result).
+const FAKE_CLAUDE = [
+  `let input = ''`,
+  `process.stdin.on('data', (d) => { input += d })`,
+  `process.stdin.on('end', () => {`,
+  `  const w = (o) => process.stdout.write(JSON.stringify(o) + '\\n')`,
+  `  w({ type: 'system', subtype: 'init', session_id: 'sess-abc', model: 'haiku', tools: [] })`,
+  `  w({ type: 'assistant', message: { id: 'msg-1', content: [{ type: 'text', text: 'pong' }] }, parent_tool_use_id: null })`,
+  `  w({ type: 'result', subtype: 'success', result: 'pong', usage: { input_tokens: 1, output_tokens: 1 } })`,
+  `})`,
+].join('\n')
+
+const noopLogger = {
+  request: () => {},
+  provider: () => {},
+  errors: () => {},
+  agentLoop: () => {},
+  warnings: () => {},
+  debug: () => {},
+} as unknown as InternalLogger
+
+/** Stub capability context that already has `handle` provided as its sandbox. */
+function capabilityContextWith(handle: SandboxHandle): CapabilityContext {
+  const stubRegistry = { markProvided: () => {}, has: () => true }
+  const context = { capabilities: stubRegistry } as unknown as CapabilityContext
+  // The second member of SandboxCapability is called as (context, handle).
+  const [, provide] = SandboxCapability
+  provide(context, handle)
+  return context
+}
+
+async function collect(
+  stream: AsyncIterable<StreamChunk>,
+): Promise<Array<StreamChunk>> {
+  const out: Array<StreamChunk> = []
+  for await (const chunk of stream) out.push(chunk)
+  return out
+}
+
+describe('claude-code in-sandbox adapter', () => {
+  it('spawns the agent CLI in the sandbox and streams translated events', async () => {
+    const sbx = await provider.create({})
+    await sbx.fs.write('/workspace/fake-claude.mjs', FAKE_CLAUDE)
+
+    const adapter = claudeCodeText('haiku', {
+      // Relative executable + cwd=/workspace (mapped to the sandbox root).
+      claudeExecutable: 'node fake-claude.mjs',
+      streamPartials: false,
+      emitDiff: false,
+    })
+
+    const chunks = await collect(
+      adapter.chatStream({
+        model: 'haiku',
+        messages: [{ role: 'user', content: 'say pong' }],
+        logger: noopLogger,
+        capabilities: capabilityContextWith(sbx),
+      }),
+    )
+
+    const types = chunks.map((c) => c.type as string)
+    expect(types[0]).toBe('RUN_STARTED')
+
+    const sessionEvent = chunks.find(
+      (c) =>
+        c.type === 'CUSTOM' &&
+        (c as { name?: string }).name === 'claude-code.session-id',
+    )
+    expect(sessionEvent).toBeDefined()
+    expect(
+      (sessionEvent as { value: { sessionId: string } }).value.sessionId,
+    ).toBe('sess-abc')
+
+    const text = chunks
+      .filter((c) => c.type === 'TEXT_MESSAGE_CONTENT')
+      .map((c) => (c as { delta?: string }).delta ?? '')
+      .join('')
+    expect(text).toContain('pong')
+
+    expect(chunks.some((c) => c.type === 'RUN_FINISHED')).toBe(true)
+
+    await sbx.destroy()
+  })
+
+  it('requires a sandbox capability', async () => {
+    const adapter = claudeCodeText('haiku', { emitDiff: false })
+    const chunks = await collect(
+      adapter.chatStream({
+        model: 'haiku',
+        messages: [{ role: 'user', content: 'hi' }],
+        logger: noopLogger,
+        // no capabilities provided
+      }),
+    )
+    const err = chunks.find((c) => c.type === 'RUN_ERROR')
+    expect(err).toBeDefined()
+    expect((err as { message?: string }).message).toMatch(/requires a sandbox/i)
+  })
+
+  it('bridges chat()-provided tools (starts + tears down the MCP bridge)', async () => {
+    const sbx = await provider.create({})
+    await sbx.fs.write('/workspace/fake-claude.mjs', FAKE_CLAUDE)
+    const adapter = claudeCodeText('haiku', {
+      claudeExecutable: 'node fake-claude.mjs',
+      streamPartials: false,
+      emitDiff: false,
+    })
+    // The fake claude ignores the injected --mcp-config; this checks that
+    // passing tools no longer errors and the bridge lifecycle is clean.
+    const chunks = await collect(
+      adapter.chatStream({
+        model: 'haiku',
+        messages: [{ role: 'user', content: 'say pong' }],
+        logger: noopLogger,
+        capabilities: capabilityContextWith(sbx),
+        tools: [
+          {
+            name: 'getTime',
+            description: 'x',
+            inputSchema: { type: 'object', properties: {} },
+            execute: () => Promise.resolve('now'),
+          } as never,
+        ],
+      }),
+    )
+    expect(chunks.some((c) => c.type === 'RUN_ERROR')).toBe(false)
+    expect(chunks.some((c) => c.type === 'RUN_FINISHED')).toBe(true)
+    await sbx.destroy()
+  })
+})
diff --git a/packages/ai-claude-code/tests/translate.test.ts b/packages/ai-claude-code/tests/translate.test.ts
new file mode 100644
index 000000000..607d2c457
--- /dev/null
+++ b/packages/ai-claude-code/tests/translate.test.ts
@@ -0,0 +1,485 @@
+import { describe, expect, it } from 'vitest'
+import { translateSdkStream } from '../src/stream/translate'
+import type { AgentSdkMessage } from '../src/stream/sdk-types'
+import type { StreamChunk } from '@tanstack/ai'
+
+/** Fresh translation context; `genId` yields gen-1, gen-2, … per context. */
+function makeContext() {
+  let counter = 0
+  const genId = () => `gen-${++counter}`
+  const model = 'claude-opus-4-6'
+  const runId = 'run-1'
+  const threadId = 'thread-1'
+  return { model, runId, threadId, genId }
+}
+
+/** Replays a fixed list of SDK messages as an async stream, in order. */
+async function* fromArray(
+  messages: Array<AgentSdkMessage>,
+): AsyncIterable<AgentSdkMessage> {
+  // Delegating to the array's iterator yields each message unchanged.
+  yield* messages
+}
+
+/** Runs `messages` through `translateSdkStream` and gathers every chunk. */
+async function collect(
+  messages: Array<AgentSdkMessage>,
+): Promise<Array<StreamChunk>> {
+  // A fresh context per call keeps generated ids deterministic (gen-1, …).
+  const translated = translateSdkStream(fromArray(messages), makeContext())
+  const collected: Array<StreamChunk> = []
+  for await (const piece of translated) {
+    collected.push(piece)
+  }
+  return collected
+}
+
+const init: AgentSdkMessage = {
+  type: 'system',
+  subtype: 'init',
+  session_id: 'sess-abc',
+  model: 'claude-opus-4-6',
+  tools: ['Bash', 'Read'],
+  cwd: '/tmp',
+}
+
+const usage = {
+  input_tokens: 100,
+  output_tokens: 50,
+  cache_read_input_tokens: 10,
+  cache_creation_input_tokens: 5,
+}
+
+/** Top-level assistant message with a single text block. */
+function assistantText(text: string, messageId = 'msg-1'): AgentSdkMessage {
+  const textBlock = { type: 'text' as const, text }
+  const message = { id: messageId, content: [textBlock] }
+  // `parent_tool_use_id: null` marks this as a non-subagent message.
+  return { type: 'assistant', message, parent_tool_use_id: null }
+}
+
+const resultSuccess: AgentSdkMessage = {
+  type: 'result',
+  subtype: 'success',
+  result: 'done',
+  usage,
+  total_cost_usd: 0.12,
+}
+
+describe('translateSdkStream', () => {
+  it('translates a simple text turn into RUN_STARTED → CUSTOM → TEXT_* → RUN_FINISHED(stop)', async () => {
+    const chunks = await collect([init, assistantText('Hello!'), resultSuccess])
+
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'TEXT_MESSAGE_START',
+      'TEXT_MESSAGE_CONTENT',
+      'TEXT_MESSAGE_END',
+      'RUN_FINISHED',
+    ])
+
+    expect(chunks[0]).toMatchObject({
+      type: 'RUN_STARTED',
+      runId: 'run-1',
+      threadId: 'thread-1',
+      model: 'claude-opus-4-6',
+    })
+    expect(chunks[3]).toMatchObject({
+      type: 'TEXT_MESSAGE_CONTENT',
+      delta: 'Hello!',
+      content: 'Hello!',
+    })
+    expect(chunks[5]).toMatchObject({
+      type: 'RUN_FINISHED',
+      finishReason: 'stop',
+    })
+  })
+
+  it('surfaces the session id via a CUSTOM claude-code.session-id event', async () => {
+    const chunks = await collect([init, assistantText('hi'), resultSuccess])
+    const custom = chunks.find((c) => c.type === 'CUSTOM')
+    expect(custom).toMatchObject({
+      type: 'CUSTOM',
+      name: 'claude-code.session-id',
+      value: {
+        sessionId: 'sess-abc',
+        model: 'claude-opus-4-6',
+        tools: ['Bash', 'Read'],
+      },
+    })
+  })
+
+  it('maps usage onto RUN_FINISHED including cache token details', async () => {
+    const chunks = await collect([init, assistantText('hi'), resultSuccess])
+    const finished = chunks.find((c) => c.type === 'RUN_FINISHED')
+    expect(finished).toMatchObject({
+      usage: {
+        promptTokens: 100,
+        completionTokens: 50,
+        totalTokens: 150,
+        promptTokensDetails: { cachedTokens: 10, cacheWriteTokens: 5 },
+      },
+    })
+  })
+
+  it('emits resolved TOOL_CALL_* quadruples for harness tool activity and never finishes with tool_calls', async () => {
+    const messages: Array<AgentSdkMessage> = [
+      init,
+      {
+        type: 'assistant',
+        message: {
+          id: 'msg-1',
+          content: [
+            {
+              type: 'tool_use',
+              id: 'toolu_1',
+              name: 'Bash',
+              input: { command: 'ls' },
+            },
+          ],
+        },
+        parent_tool_use_id: null,
+      },
+      {
+        type: 'user',
+        message: {
+          role: 'user',
+          content: [
+            {
+              type: 'tool_result',
+              tool_use_id: 'toolu_1',
+              content: 'file-a\nfile-b',
+            },
+          ],
+        },
+        parent_tool_use_id: null,
+      },
+      assistantText('Found two files.', 'msg-2'),
+      resultSuccess,
+    ]
+
+    const chunks = await collect(messages)
+    const types = chunks.map((c) => c.type)
+    expect(types).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'TOOL_CALL_START',
+      'TOOL_CALL_ARGS',
+      'TOOL_CALL_END',
+      'TOOL_CALL_RESULT',
+      'TEXT_MESSAGE_START',
+      'TEXT_MESSAGE_CONTENT',
+      'TEXT_MESSAGE_END',
+      'RUN_FINISHED',
+    ])
+
+    expect(chunks[2]).toMatchObject({
+      toolCallId: 'toolu_1',
+      toolCallName: 'Bash',
+    })
+    expect(chunks[3]).toMatchObject({
+      toolCallId: 'toolu_1',
+      delta: JSON.stringify({ command: 'ls' }),
+    })
+    expect(chunks[4]).toMatchObject({
+      toolCallId: 'toolu_1',
+      input: { command: 'ls' },
+    })
+    expect(chunks[5]).toMatchObject({
+      type: 'TOOL_CALL_RESULT',
+      toolCallId: 'toolu_1',
+      content: 'file-a\nfile-b',
+    })
+
+    const finished = chunks.filter((c) => c.type === 'RUN_FINISHED')
+    expect(finished).toHaveLength(1)
+    expect(finished[0]).toMatchObject({ finishReason: 'stop' })
+  })
+
+  it('strips the mcp__tanstack__ prefix from bridged tool names', async () => {
+    const chunks = await collect([
+      init,
+      {
+        type: 'assistant',
+        message: {
+          id: 'msg-1',
+          content: [
+            {
+              type: 'tool_use',
+              id: 'toolu_2',
+              name: 'mcp__tanstack__lookup_user',
+              input: { userId: 'u1' },
+            },
+          ],
+        },
+        parent_tool_use_id: null,
+      },
+      resultSuccess,
+    ])
+
+    const start = chunks.find((c) => c.type === 'TOOL_CALL_START')
+    expect(start).toMatchObject({ toolCallName: 'lookup_user' })
+  })
+
+  it('marks errored tool results with state output-error', async () => {
+    const chunks = await collect([
+      init,
+      {
+        type: 'assistant',
+        message: {
+          id: 'msg-1',
+          content: [
+            { type: 'tool_use', id: 'toolu_3', name: 'Bash', input: {} },
+          ],
+        },
+        parent_tool_use_id: null,
+      },
+      {
+        type: 'user',
+        message: {
+          role: 'user',
+          content: [
+            {
+              type: 'tool_result',
+              tool_use_id: 'toolu_3',
+              content: [{ type: 'text', text: 'command failed' }],
+              is_error: true,
+            },
+          ],
+        },
+        parent_tool_use_id: null,
+      },
+      resultSuccess,
+    ])
+
+    const result = chunks.find((c) => c.type === 'TOOL_CALL_RESULT')
+    expect(result).toMatchObject({
+      toolCallId: 'toolu_3',
+      content: 'command failed',
+      state: 'output-error',
+    })
+  })
+
+  it('synthesizes interrupted tool results for unresolved tool calls before RUN_FINISHED', async () => {
+    const chunks = await collect([
+      init,
+      {
+        type: 'assistant',
+        message: {
+          id: 'msg-1',
+          content: [
+            { type: 'tool_use', id: 'toolu_4', name: 'Bash', input: {} },
+          ],
+        },
+        parent_tool_use_id: null,
+      },
+      resultSuccess,
+    ])
+
+    const types = chunks.map((c) => c.type as string)
+    expect(types.indexOf('TOOL_CALL_RESULT')).toBeGreaterThan(-1)
+    expect(types.indexOf('TOOL_CALL_RESULT')).toBeLessThan(
+      types.indexOf('RUN_FINISHED'),
+    )
+    expect(chunks.find((c) => c.type === 'TOOL_CALL_RESULT')).toMatchObject({
+      toolCallId: 'toolu_4',
+      content: JSON.stringify({ status: 'interrupted' }),
+    })
+  })
+
+  it('translates thinking blocks into REASONING_* events', async () => {
+    const chunks = await collect([
+      init,
+      {
+        type: 'assistant',
+        message: {
+          id: 'msg-1',
+          content: [
+            { type: 'thinking', thinking: 'pondering...' },
+            { type: 'text', text: 'answer' },
+          ],
+        },
+        parent_tool_use_id: null,
+      },
+      resultSuccess,
+    ])
+
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'REASONING_START',
+      'REASONING_MESSAGE_START',
+      'REASONING_MESSAGE_CONTENT',
+      'REASONING_MESSAGE_END',
+      'REASONING_END',
+      'TEXT_MESSAGE_START',
+      'TEXT_MESSAGE_CONTENT',
+      'TEXT_MESSAGE_END',
+      'RUN_FINISHED',
+    ])
+    expect(
+      chunks.find((c) => c.type === 'REASONING_MESSAGE_CONTENT'),
+    ).toMatchObject({ delta: 'pondering...' })
+  })
+
+  it('maps error_max_turns to RUN_FINISHED(length)', async () => {
+    const chunks = await collect([
+      init,
+      assistantText('partial'),
+      {
+        type: 'result',
+        subtype: 'error_max_turns',
+        usage,
+        total_cost_usd: 0.5,
+        errors: [],
+      },
+    ])
+    expect(chunks.at(-1)).toMatchObject({
+      type: 'RUN_FINISHED',
+      finishReason: 'length',
+    })
+  })
+
+  it('maps error_during_execution to RUN_ERROR', async () => {
+    const chunks = await collect([
+      init,
+      {
+        type: 'result',
+        subtype: 'error_during_execution',
+        usage,
+        total_cost_usd: 0,
+        errors: ['boom'],
+      },
+    ])
+    expect(chunks.at(-1)).toMatchObject({
+      type: 'RUN_ERROR',
+      message: 'boom',
+      code: 'error_during_execution',
+    })
+  })
+
+  it('skips subagent messages (parent_tool_use_id set)', async () => {
+    const chunks = await collect([
+      init,
+      {
+        type: 'assistant',
+        message: { id: 'msg-sub', content: [{ type: 'text', text: 'inner' }] },
+        parent_tool_use_id: 'toolu_task',
+      },
+      assistantText('outer'),
+      resultSuccess,
+    ])
+
+    const contents = chunks.filter((c) => c.type === 'TEXT_MESSAGE_CONTENT')
+    expect(contents).toHaveLength(1)
+    expect(contents[0]).toMatchObject({ delta: 'outer' })
+  })
+
+  it('streams partial text deltas and dedupes the whole assistant message', async () => {
+    const chunks = await collect([
+      init,
+      {
+        type: 'stream_event',
+        event: { type: 'message_start', message: { id: 'msg-1' } },
+        parent_tool_use_id: null,
+      },
+      {
+        type: 'stream_event',
+        event: {
+          type: 'content_block_start',
+          index: 0,
+          content_block: { type: 'text' },
+        },
+        parent_tool_use_id: null,
+      },
+      {
+        type: 'stream_event',
+        event: {
+          type: 'content_block_delta',
+          index: 0,
+          delta: { type: 'text_delta', text: 'Hel' },
+        },
+        parent_tool_use_id: null,
+      },
+      {
+        type: 'stream_event',
+        event: {
+          type: 'content_block_delta',
+          index: 0,
+          delta: { type: 'text_delta', text: 'lo' },
+        },
+        parent_tool_use_id: null,
+      },
+      {
+        type: 'stream_event',
+        event: { type: 'content_block_stop', index: 0 },
+        parent_tool_use_id: null,
+      },
+      assistantText('Hello', 'msg-1'),
+      resultSuccess,
+    ])
+
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'TEXT_MESSAGE_START',
+      'TEXT_MESSAGE_CONTENT',
+      'TEXT_MESSAGE_CONTENT',
+      'TEXT_MESSAGE_END',
+      'RUN_FINISHED',
+    ])
+    expect(chunks[3]).toMatchObject({ delta: 'Hel', content: 'Hel' })
+    expect(chunks[4]).toMatchObject({ delta: 'lo', content: 'Hello' })
+  })
+
+  it('emits synthetic tool results then rethrows when the SDK stream throws mid-run', async () => {
+    async function* throwing(): AsyncIterable<AgentSdkMessage> {
+      yield init
+      yield {
+        type: 'assistant',
+        message: {
+          id: 'msg-1',
+          content: [
+            { type: 'tool_use', id: 'toolu_5', name: 'Bash', input: {} },
+          ],
+        },
+        parent_tool_use_id: null,
+      }
+      throw new Error('aborted')
+    }
+
+    const chunks: Array<StreamChunk> = []
+    await expect(async () => {
+      for await (const chunk of translateSdkStream(throwing(), makeContext())) {
+        chunks.push(chunk)
+      }
+    }).rejects.toThrow('aborted')
+
+    expect(chunks.find((c) => c.type === 'TOOL_CALL_RESULT')).toMatchObject({
+      toolCallId: 'toolu_5',
+      content: JSON.stringify({ status: 'interrupted' }),
+    })
+  })
+
+  it('ignores unknown SDK message types', async () => {
+    const chunks = await collect([
+      init,
+      {
+        type: 'system',
+        subtype: 'status',
+        status: 'compacting',
+      } as unknown as AgentSdkMessage,
+      assistantText('hi'),
+      resultSuccess,
+    ])
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'TEXT_MESSAGE_START',
+      'TEXT_MESSAGE_CONTENT',
+      'TEXT_MESSAGE_END',
+      'RUN_FINISHED',
+    ])
+  })
+})
diff --git a/packages/ai-claude-code/tsconfig.json b/packages/ai-claude-code/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-claude-code/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-claude-code/vite.config.ts b/packages/ai-claude-code/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-claude-code/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+const config = defineConfig({
+  test: {
+    name: packageJson.name,
+    dir: './',
+    watch: false,
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: [
+        'node_modules/',
+        'dist/',
+        'tests/',
+        '**/*.test.ts',
+        '**/*.config.ts',
+        '**/types.ts',
+      ],
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+
+export default mergeConfig(
+  config,
+  tanstackViteConfig({
+    entry: ['./src/index.ts'],
+    srcDir: './src',
+    cjs: false,
+  }),
+)
diff --git a/packages/ai-client/src/chat-client.ts b/packages/ai-client/src/chat-client.ts
index 468dc7618..7f3398d41 100644
--- a/packages/ai-client/src/chat-client.ts
+++ b/packages/ai-client/src/chat-client.ts
@@ -102,6 +102,14 @@ export class ChatClient<
   // focused on streaming. Undefined when no `persistence` adapter is configured.
   private readonly persistor?: ChatPersistor
   private currentRunId: string | null = null
+  // Resume tracking: the latest in-band cursor seen for the active run, so a
+  // reconnect can replay events after it. Cleared when the run terminates.
+  private lastResume: { runId: string; cursor: string } | null = null
+  private readonly autoResume: boolean
+  // When set, the next streamResponse() resumes this run/cursor instead of
+  // starting a fresh run (consumed once).
+  private pendingResumeRunId: string | null = null
+  private pendingResumeCursor: string | null = null
   // Track the legacy `body` option and the canonical `forwardedProps`
   // option as separate slots so that `updateOptions({ forwardedProps })`
   // doesn't wipe a previously-set `body` (and vice versa). They are
@@ -170,6 +178,7 @@ export class ChatClient<
   constructor(options: ChatClientOptions<TTools, TContext>) {
     this.uniqueId = options.id || this.generateUniqueId('chat')
     this.threadId = options.threadId || this.generateUniqueId('thread')
+    this.autoResume = options.autoResume ?? true
     if (options.persistence) {
       this.persistor = new ChatPersistor(
         options.persistence,
@@ -489,6 +498,66 @@ export class ChatClient<
     }
   }
 
+  /**
+   * Tracks the newest in-band cursor for the current run so a later reconnect
+   * can ask the server to replay from it; a terminal event drops that state.
+   */
+  private observeResumeCursor(chunk: StreamChunk): void {
+    if (chunk.type !== 'RUN_FINISHED' && chunk.type !== 'RUN_ERROR') {
+      const cursor =
+        'cursor' in chunk && typeof chunk.cursor === 'string'
+          ? chunk.cursor
+          : undefined
+      // Needs both a non-empty cursor and an active run to attribute it to.
+      if (cursor && this.currentRunId) {
+        this.lastResume = { runId: this.currentRunId, cursor }
+      }
+      return
+    }
+    // Server-signaled terminal: the run is complete, so forget its resume
+    // state. A stream that just stops (no terminal) is an interruption and
+    // deliberately keeps its state so it can be continued later.
+    const terminalRunId = getChunkRunId(chunk)
+    const matchesTracked = this.lastResume?.runId === terminalRunId
+    if (!terminalRunId || matchesTracked) this.lastResume = null
+  }
+
+  /**
+   * Copy of the tracked resume state (run id + last cursor seen), or null when
+   * nothing is resumable. Apps can persist it to resume across a full reload;
+   * in-session reconnects use it automatically via {@link maybeAutoResume}.
+   */
+  getResumeState(): { runId: string; cursor: string } | null {
+    if (this.lastResume === null) return null
+    return { runId: this.lastResume.runId, cursor: this.lastResume.cursor }
+  }
+
+  /**
+   * Reconnects to `state` (default: the tracked run) without re-sending
+   * messages; persisted events after the cursor replay, then it goes live.
+   */
+  resume(state?: { runId: string; cursor: string }): Promise<boolean> {
+    const resumeFrom = state ?? this.lastResume
+    if (resumeFrom && !this.isLoading) {
+      this.pendingResumeRunId = resumeFrom.runId
+      this.pendingResumeCursor = resumeFrom.cursor
+      return this.streamResponse()
+    }
+    return Promise.resolve(false) // nothing to resume, or already streaming
+  }
+
+  /**
+   * Entry point for framework integrations (on mount, or when the tab comes
+   * back online). Resumes only if the `autoResume` option (default true) is
+   * on, an interrupted run is tracked, and no stream is in flight.
+   */
+  maybeAutoResume(): Promise<boolean> {
+    const eligible =
+      this.autoResume && !this.isLoading && this.lastResume !== null
+    // With no explicit state, resume() falls back to the tracked run.
+    return eligible ? this.resume() : Promise.resolve(false)
+  }
+
   private generateUniqueId(prefix: string): string {
     return `${prefix}-${Date.now()}-${Math.random().toString(36).substring(7)}`
   }
@@ -696,6 +765,7 @@ export class ChatClient<
       // per-run error only clears that run, while a runId-less RUN_ERROR is
       // treated as a session-level error that clears every active run.
       this.updateRunLifecycle(chunk)
+      this.observeResumeCursor(chunk)
       // Yield control back to event loop for UI updates
       await new Promise((resolve) => setTimeout(resolve, 0))
     }
@@ -854,7 +924,14 @@ export class ChatClient<
 
     // Track generation so a superseded stream's cleanup doesn't clobber the new one
     const generation = ++this.streamGeneration
-    const runId = `run-${Date.now()}-${Math.random().toString(36).slice(2, 8)}`
+    // Resuming reuses the original runId so the server replays that run's events.
+    const resumeRunId = this.pendingResumeRunId
+    const resumeCursor = this.pendingResumeCursor
+    this.pendingResumeRunId = null
+    this.pendingResumeCursor = null
+    const runId =
+      resumeRunId ??
+      `run-${Date.now()}-${Math.random().toString(36).slice(2, 8)}`
     this.currentRunId = runId
 
     this.setIsLoading(true)
@@ -945,6 +1022,7 @@ export class ChatClient<
             : { type: 'object' },
         })),
         forwardedProps: { ...mergedBody },
+        ...(resumeCursor ? { cursor: resumeCursor } : {}),
       }
       this.devtoolsBridge.beginRun(runContext.runId, this.threadId)
       activeDevtoolsRunId = runContext.runId
diff --git a/packages/ai-client/src/connection-adapters.ts b/packages/ai-client/src/connection-adapters.ts
index 3c4010047..56e4d2e1c 100644
--- a/packages/ai-client/src/connection-adapters.ts
+++ b/packages/ai-client/src/connection-adapters.ts
@@ -199,6 +199,12 @@ export interface RunAgentInputContext {
   threadId: string
   runId: string
   parentRunId?: string
+  /**
+   * Resume cursor. When set, the request resumes `runId` — the server replays
+   * persisted events after this cursor (see `chat({ cursor })`). On a resume the
+   * client sends no new messages.
+   */
+  cursor?: string
   /** Client-declared tools to advertise in the request payload. */
   clientTools?: Array<{
     name: string
@@ -443,6 +449,7 @@ function buildRunAgentInputBody(
     ...(runContext?.parentRunId !== undefined && {
       parentRunId: runContext.parentRunId,
     }),
+    ...(runContext?.cursor !== undefined && { cursor: runContext.cursor }),
     state: {},
     messages: wireMessages,
     tools: runContext?.clientTools ?? [],
diff --git a/packages/ai-client/src/types.ts b/packages/ai-client/src/types.ts
index fa00811d7..d5cd7d3c4 100644
--- a/packages/ai-client/src/types.ts
+++ b/packages/ai-client/src/types.ts
@@ -391,6 +391,14 @@ export interface ChatClientBaseOptions<
    */
   threadId?: string
 
+  /**
+   * Whether to auto-resume an interrupted run when {@link maybeAutoResume} is
+   * called (e.g. by a framework integration on mount / when the tab comes back
+   * online). Requires server-side persistence so the run's events can be
+   * replayed by `runId + cursor`. Defaults to `true`; set `false` to opt out.
+   */
+  autoResume?: boolean
+
   /**
    * Arbitrary client-controlled JSON forwarded to the server in the
    * AG-UI `RunAgentInput.forwardedProps` field. Use this for per-session
diff --git a/packages/ai-client/tests/chat-client-resume.test.ts b/packages/ai-client/tests/chat-client-resume.test.ts
new file mode 100644
index 000000000..2c5583f9a
--- /dev/null
+++ b/packages/ai-client/tests/chat-client-resume.test.ts
@@ -0,0 +1,130 @@
+import { describe, expect, it } from 'vitest'
+import { EventType } from '@tanstack/ai/client'
+import { ChatClient } from '../src/chat-client'
+import type {
+  ConnectConnectionAdapter,
+  RunAgentInputContext,
+} from '../src/connection-adapters'
+import type { StreamChunk } from '@tanstack/ai/client'
+
+/**
+ * Adapter that records each connect's runContext and yields scripted chunks.
+ * A script can be a function of the live `runContext` (so a test can emit a
+ * RUN_FINISHED carrying the same runId the client generated and passed in).
+ */
+type Script =
+  | Array<StreamChunk>
+  | ((ctx: RunAgentInputContext | undefined) => Array<StreamChunk>)
+
+// Builds a connection adapter that logs each connect's runContext and replays
+// the scripts in order, one script per connect.
+function recordingAdapter(scripts: Array<Script>) {
+  const contexts: Array<RunAgentInputContext | undefined> = []
+  let connectCount = 0
+  const adapter: ConnectConnectionAdapter = {
+    // eslint-disable-next-line @typescript-eslint/require-await
+    async *connect(_messages, _data, _signal, runContext) {
+      contexts.push(runContext)
+      // Connects beyond the last script yield nothing.
+      const script = scripts[connectCount++]
+      yield* typeof script === 'function' ? script(runContext) : (script ?? [])
+    },
+  }
+  return { adapter, contexts }
+}
+
+const text = (delta: string, cursor?: string): StreamChunk => ({
+  type: EventType.TEXT_MESSAGE_CONTENT,
+  messageId: 'm1',
+  timestamp: Date.now(),
+  delta,
+  ...(cursor ? { cursor } : {}), // only tag the chunk when a cursor is given
+})
+const runStarted: StreamChunk = {
+  type: EventType.RUN_STARTED,
+  runId: 'run-1',
+  threadId: 'thread-1',
+  timestamp: Date.now(),
+}
+
+describe('ChatClient resume', () => {
+  it('tracks the in-band cursor of an interrupted run', async () => {
+    // No RUN_FINISHED -> the run is "interrupted", resume state retained.
+    const { adapter } = recordingAdapter([
+      [runStarted, text('a', '1'), text('b', '2')],
+    ])
+    const client = new ChatClient({ connection: adapter })
+    await client.append({
+      id: 'u1',
+      role: 'user',
+      parts: [{ type: 'text', content: 'hi' }],
+      createdAt: new Date(),
+    })
+
+    const state = client.getResumeState()
+    expect(state).not.toBeNull()
+    expect(state?.cursor).toBe('2')
+  })
+
+  it('clears resume state once the run finishes', async () => {
+    const { adapter } = recordingAdapter([
+      (ctx) => [
+        runStarted,
+        text('a', '1'),
+        {
+          type: EventType.RUN_FINISHED,
+          // Carry the runId the client generated (passed in via runContext) so
+          // the terminal correlates to the tracked resume state.
+          runId: ctx?.runId ?? 'run-1',
+          threadId: 'thread-1',
+          timestamp: Date.now(),
+          finishReason: 'stop',
+        },
+      ],
+    ])
+    const client = new ChatClient({ connection: adapter })
+    await client.append({
+      id: 'u1',
+      role: 'user',
+      parts: [{ type: 'text', content: 'hi' }],
+      createdAt: new Date(),
+    })
+    expect(client.getResumeState()).toBeNull()
+  })
+
+  it('resume() reconnects with the cursor in runContext', async () => {
+    const { adapter, contexts } = recordingAdapter([
+      [runStarted, text('a', '7')], // interrupted (no finish)
+      [text('b', '8')], // resume continuation
+    ])
+    const client = new ChatClient({ connection: adapter })
+    await client.append({
+      id: 'u1',
+      role: 'user',
+      parts: [{ type: 'text', content: 'hi' }],
+      createdAt: new Date(),
+    })
+
+    await client.resume()
+    expect(contexts).toHaveLength(2)
+    // First connect: fresh run, no cursor. Second: resume with the last cursor.
+    expect(contexts[0]?.cursor).toBeUndefined()
+    expect(contexts[1]?.cursor).toBe('7')
+  })
+
+  it('maybeAutoResume is a no-op when autoResume is false', async () => {
+    const { adapter, contexts } = recordingAdapter([
+      [runStarted, text('a', '7')],
+    ])
+    const client = new ChatClient({ connection: adapter, autoResume: false })
+    await client.append({
+      id: 'u1',
+      role: 'user',
+      parts: [{ type: 'text', content: 'hi' }],
+      createdAt: new Date(),
+    })
+    const resumed = await client.maybeAutoResume()
+    expect(resumed).toBe(false)
+    expect(contexts).toHaveLength(1)
+  })
+})
diff --git a/packages/ai-codex/README.md b/packages/ai-codex/README.md
new file mode 100644
index 000000000..21284d4a1
--- /dev/null
+++ b/packages/ai-codex/README.md
@@ -0,0 +1,18 @@
+# @tanstack/ai-codex
+
+Codex harness adapter for [TanStack AI](https://tanstack.com/ai) — run [OpenAI Codex](https://developers.openai.com/codex) (the `codex` CLI, spawned inside a TanStack AI sandbox) as a chat backend with local tool execution, stateful coding sessions, and TanStack tool bridging.
+
+```typescript
+import { chat } from '@tanstack/ai'
+import { codexText } from '@tanstack/ai-codex'
+
+const stream = chat({
+  adapter: codexText('gpt-5.1-codex', {
+    cwd: '/path/to/project',
+    sandboxMode: 'workspace-write',
+  }),
+  messages: [{ role: 'user', content: 'Fix the failing test.' }],
+})
+```
+
+Server-only (Node). See the [Codex adapter docs](https://tanstack.com/ai/latest/docs/adapters/codex) for sessions, tool bridging, sandboxing, and limitations.
diff --git a/packages/ai-codex/package.json b/packages/ai-codex/package.json
new file mode 100644
index 000000000..cf0149965
--- /dev/null
+++ b/packages/ai-codex/package.json
@@ -0,0 +1,58 @@
+{
+  "name": "@tanstack/ai-codex",
+  "version": "0.1.0",
+  "description": "Codex harness adapter for TanStack AI — run OpenAI Codex as a chat backend with local tool execution and stateful sessions.",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-codex"
+  },
+  "keywords": [
+    "ai",
+    "ai-sdk",
+    "typescript",
+    "tanstack",
+    "openai",
+    "codex",
+    "harness",
+    "agent",
+    "adapter",
+    "chat",
+    "tool-calling"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "peerDependencies": {
+    "@tanstack/ai": "workspace:^",
+    "@tanstack/ai-sandbox": "workspace:^"
+  },
+  "devDependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-sandbox": "workspace:*",
+    "@tanstack/ai-sandbox-local-process": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-codex/src/adapters/policy-map.ts b/packages/ai-codex/src/adapters/policy-map.ts
new file mode 100644
index 000000000..14c127995
--- /dev/null
+++ b/packages/ai-codex/src/adapters/policy-map.ts
@@ -0,0 +1,58 @@
+/**
+ * Map a portable {@link SandboxPolicy} onto Codex CLI settings.
+ *
+ * **Best-effort, coarse mapping.** `codex exec --experimental-json` runs
+ * non-interactively: there is no per-action host callback (unlike Claude Code's
+ * `--permission-prompt-tool`), so the fine-grained, resume-based interactive
+ * approval flow (`deny` + `approval-requested` + re-run) is NOT available for
+ * Codex. Instead the policy collapses onto Codex's coarse knobs:
+ *
+ * - `capabilities.fileWrite === 'deny'` → `--sandbox read-only`
+ *   (otherwise unset, so the adapter's `workspace-write` default applies).
+ * - `capabilities.network` → `sandbox_workspace_write.network_access`
+ *   (`'allow'` → true, `'deny'` → false; unset leaves Codex's default).
+ * - `approval_policy`: a fully-permissive policy (`default: 'allow'` with no
+ *   `ask`/`deny` rules) → `never`; a `default: 'deny'` policy → `untrusted`;
+ *   anything with `ask`/`deny` rules → `on-request`. In `exec` mode Codex will
+ *   refuse (rather than prompt for) actions that need approval.
+ *
+ * Returns only the knobs the policy actually constrains; the adapter merges
+ * these with its own config (config/modelOptions still take precedence).
+ */
+import type { SandboxPolicy } from '@tanstack/ai-sandbox'
+import type { CodexApprovalMode, CodexSandboxMode } from './text'
+
+export interface CodexPolicyFlags {
+  sandboxMode?: CodexSandboxMode // set to 'read-only' when fileWrite is denied
+  approvalPolicy?: CodexApprovalMode // derived from default + ask/deny rules
+  networkAccessEnabled?: boolean // unset leaves Codex's default in place
+}
+
+/** Maps a policy to the Codex flags it constrains; other knobs are omitted. */
+export function mapPolicyToCodexFlags(
+  policy: SandboxPolicy | undefined,
+): CodexPolicyFlags {
+  const flags: CodexPolicyFlags = {}
+  if (!policy) return flags
+  const { capabilities, commands } = policy
+  // Filesystem: only an explicit write denial tightens Codex's own sandbox.
+  if (capabilities?.fileWrite === 'deny') flags.sandboxMode = 'read-only'
+
+  // Network: explicit allow/deny becomes a boolean; anything else stays unset.
+  const network = capabilities?.network
+  if (network === 'allow' || network === 'deny') {
+    flags.networkAccessEnabled = network === 'allow'
+  }
+
+  // Approval: any ask/deny command rule outranks the policy-wide default.
+  const ruleCount =
+    (commands?.ask?.length ?? 0) + (commands?.deny?.length ?? 0)
+  if (ruleCount > 0) {
+    flags.approvalPolicy = 'on-request'
+  } else if (policy.default === 'deny') {
+    flags.approvalPolicy = 'untrusted'
+  } else if (policy.default === 'allow') {
+    flags.approvalPolicy = 'never'
+  }
+  return flags
+}
diff --git a/packages/ai-codex/src/adapters/text.ts b/packages/ai-codex/src/adapters/text.ts
new file mode 100644
index 000000000..46b2e7952
--- /dev/null
+++ b/packages/ai-codex/src/adapters/text.ts
@@ -0,0 +1,323 @@
+import { EventType, normalizeSystemPrompts } from '@tanstack/ai'
+import { toRunErrorRawEvent } from '@tanstack/ai/adapter-internals'
+import { BaseTextAdapter } from '@tanstack/ai/adapters'
+import {
+  SandboxCapability,
+  getSandbox,
+  getSandboxPolicy,
+  hostForSandbox,
+  spawnNdjson,
+  startHostToolBridge,
+} from '@tanstack/ai-sandbox'
+import { buildPrompt } from '../messages/prompt'
+import { translateThreadEvents } from '../stream/translate'
+import { mapPolicyToCodexFlags } from './policy-map'
+import type { CodexPolicyFlags } from './policy-map'
+import type { HostToolBridge, SandboxHandle } from '@tanstack/ai-sandbox'
+import type {
+  StructuredOutputOptions,
+  StructuredOutputResult,
+} from '@tanstack/ai/adapters'
+import type {
+  DefaultMessageMetadataByModality,
+  Modality,
+  StreamChunk,
+  TextOptions,
+} from '@tanstack/ai'
+import type { CodexModel } from '../model-meta'
+import type { CodexTextProviderOptions } from '../provider-options'
+import type { CodexThreadEvent } from '../stream/sdk-types'
+
+export type CodexSandboxMode = // values the adapter passes to `codex exec --sandbox`
+  | 'read-only'
+  | 'workspace-write'
+  | 'danger-full-access'
+export type CodexApprovalMode = // values the adapter passes as `--config approval_policy=`
+  | 'never'
+  | 'on-failure'
+  | 'on-request'
+  | 'untrusted'
+
+const DEFAULT_WORKDIR = '/workspace'
+
+export interface CodexTextConfig {
+  /** Working directory inside the sandbox. Defaults to `/workspace`. */
+  cwd?: string
+  /**
+   * Codex's own sandbox mode (`--sandbox`). When neither this nor the sandbox
+   * policy sets it, `'workspace-write'` is used so the agent can edit the
+   * workspace — the outer TanStack sandbox is the real isolation boundary.
+   */
+  sandboxMode?: CodexSandboxMode
+  /** Codex approval policy (`--config approval_policy=`). Falls back to the sandbox policy, then `'never'`. */
+  approvalPolicy?: CodexApprovalMode
+  /** Model reasoning effort (`--config model_reasoning_effort=`). */
+  modelReasoningEffort?: 'minimal' | 'low' | 'medium' | 'high'
+  /** Skip Codex's git-repo safety check (`--skip-git-repo-check`). Defaults to true. */
+  skipGitRepoCheck?: boolean
+  /** Allow network in `workspace-write` (`--config sandbox_workspace_write.network_access=`). Falls back to the sandbox policy. */
+  networkAccessEnabled?: boolean
+  /** Web search mode (`--config web_search=`). */
+  webSearchMode?: 'disabled' | 'live'
+  /** Extra writable directories (`--add-dir`). */
+  additionalDirectories?: Array<string>
+  /** Path/name of the codex executable inside the sandbox. Defaults to `codex`. */
+  codexExecutable?: string
+  /** Extra environment variables for the codex process inside the sandbox. */
+  env?: Record<string, string>
+  /** Extra raw `--config key=value` overrides (values passed verbatim as TOML); merged last, so they replace derived keys. */
+  config?: Record<string, string>
+}
+
+/** Single-quotes `value` for a POSIX shell; embedded quotes become `'\''`. */
+const q = (value: string): string =>
+  "'" + value.split("'").join("'\\''") + "'"
+
+/** Text adapter that drives the Codex CLI inside a sandbox and streams its thread events as chunks. */
+export class CodexTextAdapter<
+  TModel extends CodexModel,
+> extends BaseTextAdapter<
+  TModel,
+  CodexTextProviderOptions,
+  ReadonlyArray<Modality> & readonly ['text'],
+  DefaultMessageMetadataByModality,
+  ReadonlyArray<string>,
+  unknown,
+  never
+> {
+  readonly name = 'codex' as const
+
+  override readonly requires = [SandboxCapability] as const
+
+  // Agent runs inside the persistent sandbox; the engine can re-attach to the
+  // still-running process on resume (live re-attach verified with the real CLI;
+  // the engine seam is unit-tested).
+  readonly supportsReattach = true
+
+  private readonly adapterConfig: CodexTextConfig
+
+  constructor(config: CodexTextConfig, model: TModel) {
+    super({}, model)
+    this.adapterConfig = config
+  }
+
+  /** Resolves the sandbox handle from the call's capabilities; throws when the call carries none. */
+  private sandboxFrom(
+    options: TextOptions<CodexTextProviderOptions>,
+  ): SandboxHandle {
+    const ctx = options.capabilities
+    if (!ctx) {
+      throw new Error(
+        'Adapter "codex" requires a sandbox. Add withSandbox(defineSandbox({ ... })) to chat() middleware.',
+      )
+    }
+    return getSandbox(ctx)
+  }
+
+  /** Working directory: per-call option, then adapter `cwd`, then `/workspace`. */
+  private workdir(options: TextOptions<CodexTextProviderOptions>): string {
+    const perCall = options.modelOptions?.workingDirectory
+    return perCall ?? this.adapterConfig.cwd ?? DEFAULT_WORKDIR
+  }
+
+  /** Mirror @openai/codex-sdk's `codex exec --experimental-json` invocation. */
+  private buildCommand(
+    options: TextOptions<CodexTextProviderOptions>,
+    resume: string | undefined,
+    cwd: string,
+    bridge: HostToolBridge | undefined,
+    policyFlags: CodexPolicyFlags,
+  ): string {
+    const config = this.adapterConfig
+    const modelOptions = options.modelOptions
+    const exe = config.codexExecutable ?? 'codex'
+    const args: Array<string> = ['exec', '--experimental-json']
+
+    // Precedence: per-call modelOptions > adapter config > sandbox policy > default.
+    const sandboxMode =
+      modelOptions?.sandboxMode ??
+      config.sandboxMode ??
+      policyFlags.sandboxMode ??
+      'workspace-write'
+    const approvalPolicy =
+      modelOptions?.approvalPolicy ??
+      config.approvalPolicy ??
+      policyFlags.approvalPolicy ??
+      'never'
+    const networkAccessEnabled =
+      config.networkAccessEnabled ?? policyFlags.networkAccessEnabled // no per-call override or default
+    const reasoning =
+      modelOptions?.modelReasoningEffort ?? config.modelReasoningEffort
+    const skipGitRepoCheck =
+      modelOptions?.skipGitRepoCheck ?? config.skipGitRepoCheck
+
+    args.push('--model', q(this.model))
+    args.push('--sandbox', q(sandboxMode))
+    args.push('--cd', q(cwd))
+    if (skipGitRepoCheck !== false) args.push('--skip-git-repo-check')
+    for (const dir of config.additionalDirectories ?? []) {
+      args.push('--add-dir', q(dir))
+    }
+
+    const cfg: Record<string, string> = {
+      approval_policy: `"${approvalPolicy}"`,
+      ...(reasoning ? { model_reasoning_effort: `"${reasoning}"` } : {}),
+      ...(networkAccessEnabled !== undefined
+        ? {
+            'sandbox_workspace_write.network_access':
+              String(networkAccessEnabled),
+          }
+        : {}),
+      ...(config.webSearchMode
+        ? { web_search: `"${config.webSearchMode}"` }
+        : {}),
+      // Bridge chat()-provided tools via a streamable-HTTP MCP server.
+      ...(bridge
+        ? {
+            [`mcp_servers.${bridge.name}.url`]: `"${bridge.url}"`,
+            [`mcp_servers.${bridge.name}.bearer_token`]: `"${bridge.token}"`,
+          }
+        : {}),
+      ...config.config,
+    }
+    for (const [key, value] of Object.entries(cfg)) {
+      args.push('--config', q(`${key}=${value}`))
+    }
+
+    // Resume an existing thread (mirrors the SDK's `resume <threadId>`).
+    if (resume !== undefined) args.push('resume', q(resume))
+
+    return `${exe} ${args.join(' ')}`
+  }
+
+  /** Runs one Codex invocation in the sandbox and yields the translated chunks; thrown failures become RUN_ERROR. */
+  async *chatStream(
+    options: TextOptions<CodexTextProviderOptions>,
+  ): AsyncIterable<StreamChunk> {
+    const { logger } = options
+    let bridge: HostToolBridge | undefined
+    try {
+      const sandbox = this.sandboxFrom(options)
+      const cwd = this.workdir(options)
+
+      if (options.tools && options.tools.length > 0) {
+        bridge = await startHostToolBridge(options.tools, {
+          hostForSandbox: hostForSandbox(sandbox.provider),
+          context: options.context,
+          ...(options.abortController?.signal
+            ? { signal: options.abortController.signal }
+            : {}),
+        })
+      }
+
+      const { prompt, resume } = buildPrompt(
+        options.messages,
+        options.modelOptions?.sessionId,
+      )
+      const systemPrompts = normalizeSystemPrompts(options.systemPrompts)
+        .map((p) => p.content)
+        .filter((c) => c.trim() !== '')
+      const fullPrompt =
+        systemPrompts.length > 0
+          ? `${systemPrompts.join('\n\n')}\n\n${prompt}`
+          : prompt
+
+      const policy = options.capabilities
+        ? getSandboxPolicy(options.capabilities, { optional: true })
+        : undefined
+      const command = this.buildCommand(
+        options,
+        resume,
+        cwd,
+        bridge,
+        mapPolicyToCodexFlags(policy),
+      )
+
+      logger.request(
+        `activity=chat provider=codex model=${this.model} sandbox=${sandbox.provider} messages=${options.messages.length} resume=${resume ?? 'none'}`,
+        { provider: 'codex', model: this.model },
+      )
+
+      const signal = options.abortController?.signal ?? options.request?.signal
+      const rawEvents = spawnNdjson(sandbox, command, {
+        cwd,
+        input: fullPrompt,
+        ...(this.adapterConfig.env ? { env: this.adapterConfig.env } : {}),
+        ...(signal ? { signal } : {}),
+        onNonJsonLine: (line) =>
+          logger.provider(`provider=codex non-json line: ${line}`, {
+            chunk: line,
+          }),
+      })
+
+      async function* asEvents(): AsyncIterable<CodexThreadEvent> {
+        for await (const event of rawEvents) yield event as CodexThreadEvent
+      }
+
+      yield* translateThreadEvents(asEvents(), {
+        model: this.model,
+        runId: options.runId ?? this.generateId(),
+        threadId: options.threadId ?? this.generateId(),
+        ...(options.parentRunId !== undefined && {
+          parentRunId: options.parentRunId,
+        }),
+        genId: () => this.generateId(),
+        onThreadEvent: (event) =>
+          logger.provider(`provider=codex type=${event.type}`, {
+            chunk: event,
+          }),
+      })
+    } catch (error: unknown) {
+      // A thrown null/undefined has no properties; guard so the handler itself cannot throw here.
+      const err = (error ?? {}) as Partial<Error> & { code?: string }
+      const rawEvent = toRunErrorRawEvent(error)
+      logger.errors('codex.chatStream fatal', {
+        error,
+        source: 'codex.chatStream',
+      })
+      yield {
+        type: EventType.RUN_ERROR,
+        model: options.model,
+        timestamp: Date.now(),
+        message: err.message || 'Unknown error occurred',
+        ...(err.code !== undefined && { code: err.code }),
+        ...(rawEvent !== undefined && { rawEvent }),
+        error: {
+          message: err.message || 'Unknown error occurred',
+          ...(err.code !== undefined && { code: err.code }),
+        },
+      }
+    } finally {
+      await bridge?.close()
+    }
+  }
+
+  /** Always rejects: structured output is not implemented for this adapter. */
+  structuredOutput(
+    _options: StructuredOutputOptions<CodexTextProviderOptions>,
+  ): Promise<StructuredOutputResult<unknown>> {
+    return Promise.reject(
+      new Error(
+        'Structured output is not yet supported by the in-sandbox Codex adapter. ' +
+          'Use a model adapter for structured output, or omit outputSchema.',
+      ),
+    )
+  }
+}
+
+/**
+ * Factory for {@link CodexTextAdapter}, which runs Codex **inside a sandbox**.
+ *
+ * The adapter declares `requires: [SandboxCapability]` and spawns
+ * `codex exec --experimental-json` in the sandbox (the CLI invocation
+ * `@openai/codex-sdk` itself uses), piping the prompt over stdin and streaming
+ * the JSONL thread events back as AG-UI chunks. The sandbox image must supply
+ * the `codex` executable and `CODEX_API_KEY` (or a `codex login`).
+ */
+export function codexText<TModel extends CodexModel>(
+  model: TModel,
+  config: CodexTextConfig = {},
+): CodexTextAdapter<TModel> {
+  const adapter = new CodexTextAdapter<TModel>(config, model)
+  return adapter
+}
diff --git a/packages/ai-codex/src/index.ts b/packages/ai-codex/src/index.ts
new file mode 100644
index 000000000..4d127524c
--- /dev/null
+++ b/packages/ai-codex/src/index.ts
@@ -0,0 +1,23 @@
+export { CodexTextAdapter, codexText } from './adapters/text'
+export type {
+  CodexTextConfig,
+  CodexSandboxMode,
+  CodexApprovalMode,
+} from './adapters/text'
+export type { CodexTextProviderOptions } from './provider-options'
+export { CODEX_MODELS } from './model-meta'
+export type { CodexModel, KnownCodexModel } from './model-meta'
+export {
+  SESSION_ID_EVENT,
+  BRIDGED_MCP_SERVER_NAME,
+  translateThreadEvents,
+  toolNameForItem,
+} from './stream/translate'
+export type { TranslateContext } from './stream/translate'
+export type {
+  CodexThreadEvent,
+  CodexThreadItem,
+  CodexUsage,
+} from './stream/sdk-types'
+export { buildPrompt } from './messages/prompt'
+export type { BuiltPrompt } from './messages/prompt'
diff --git a/packages/ai-codex/src/messages/prompt.ts b/packages/ai-codex/src/messages/prompt.ts
new file mode 100644
index 000000000..73b9ac549
--- /dev/null
+++ b/packages/ai-codex/src/messages/prompt.ts
@@ -0,0 +1,67 @@
+import type { ModelMessage } from '@tanstack/ai'
+
+export interface BuiltPrompt {
+  prompt: string // trailing user text, preceded by a transcript preamble when prior turns are replayed
+  /** Codex thread id to resume, when the caller threaded one through. */
+  resume?: string
+}
+
+/** Joins the string-valued `text` parts of a message; other parts add nothing. */
+function extractText(content: ModelMessage['content']): string {
+  if (content === null || typeof content === 'string') return content ?? ''
+  let text = ''
+  for (const part of content) {
+    if (part.type === 'text' && typeof part.content === 'string') {
+      text += part.content
+    }
+  }
+  return text
+}
+
+/**
+ * Turn TanStack chat history into the prompt (and optional resume id) that
+ * is handed to Codex.
+ *
+ * The final message must be a user message with non-blank text, otherwise
+ * this throws. Given a `sessionId`, only that text is sent and the thread is
+ * resumed — the harness already holds the earlier context. Without one,
+ * earlier user/assistant turns that carry text are flattened into a
+ * plain-text transcript preamble; tool messages and text-less turns are
+ * dropped (prompts are text-only in v1).
+ */
+export function buildPrompt(
+  messages: Array<ModelMessage>,
+  sessionId: string | undefined,
+): BuiltPrompt {
+  const tail = messages.at(-1)
+  const question =
+    tail?.role === 'user' ? extractText(tail.content).trim() : ''
+  if (question === '') {
+    throw new Error(
+      'Codex adapter requires a trailing user message with text content.',
+    )
+  }
+
+  // Resuming: Codex already has the history, so send the new text alone.
+  if (sessionId !== undefined) {
+    return { prompt: question, resume: sessionId }
+  }
+
+  // Fresh thread: replay earlier text turns as a transcript preamble.
+  const transcript: Array<string> = []
+  for (const message of messages.slice(0, -1)) {
+    if (message.role !== 'user' && message.role !== 'assistant') continue
+    const text = extractText(message.content).trim()
+    if (text === '') continue
+    const speaker = message.role === 'user' ? 'User' : 'Assistant'
+    transcript.push(`${speaker}: ${text}`)
+  }
+
+  if (transcript.length === 0) {
+    return { prompt: question }
+  }
+
+  return {
+    prompt: `Previous conversation:\n${transcript.join('\n')}\n\n${question}`,
+  }
+}
diff --git a/packages/ai-codex/src/model-meta.ts b/packages/ai-codex/src/model-meta.ts
new file mode 100644
index 000000000..dbf2af0fe
--- /dev/null
+++ b/packages/ai-codex/src/model-meta.ts
@@ -0,0 +1,17 @@
+/**
+ * Models known to work with Codex. The harness accepts any OpenAI model id
+ * its backend supports, so this list exists for autocomplete — any string is
+ * accepted via the `(string & {})` escape hatch in {@link CodexModel}.
+ */
+export const CODEX_MODELS = [
+  'gpt-5.3-codex',
+  'gpt-5.2-codex',
+  'gpt-5.1-codex',
+  'gpt-5.1-codex-mini',
+  'gpt-5.1',
+] as const // literal tuple, so KnownCodexModel is the union of exactly these ids
+
+export type KnownCodexModel = (typeof CODEX_MODELS)[number]
+
+/** Any model id accepted by Codex; known ids get autocomplete. */
+export type CodexModel = KnownCodexModel | (string & {})
diff --git a/packages/ai-codex/src/provider-options.ts b/packages/ai-codex/src/provider-options.ts
new file mode 100644
index 000000000..5f34a3b10
--- /dev/null
+++ b/packages/ai-codex/src/provider-options.ts
@@ -0,0 +1,23 @@
+/**
+ * Per-call provider options for the Codex adapter, passed via `modelOptions`
+ * on `chat()`.
+ */
+export interface CodexTextProviderOptions {
+  /**
+   * Resume an existing Codex thread. The adapter emits the thread id of
+   * every fresh run via a CUSTOM `codex.session-id` stream event; thread it
+   * back here to continue that session (only the latest user message is
+   * sent — the harness already holds the prior context).
+   */
+  sessionId?: string
+  /** Per-call override of the sandbox mode; wins over adapter config and sandbox policy. */
+  sandboxMode?: 'read-only' | 'workspace-write' | 'danger-full-access'
+  /** Per-call override of the approval policy; wins over adapter config and sandbox policy. */
+  approvalPolicy?: 'never' | 'on-failure' | 'on-request' | 'untrusted'
+  /** Per-call override of the model reasoning effort. */
+  modelReasoningEffort?: 'minimal' | 'low' | 'medium' | 'high'
+  /** Per-call override of the harness working directory (else adapter `cwd`, else `/workspace`). */
+  workingDirectory?: string
+  /** Per-call override of the git-repo safety check (defaults to skipping). */
+  skipGitRepoCheck?: boolean
+}
diff --git a/packages/ai-codex/src/stream/sdk-types.ts b/packages/ai-codex/src/stream/sdk-types.ts
new file mode 100644
index 000000000..1e7d36726
--- /dev/null
+++ b/packages/ai-codex/src/stream/sdk-types.ts
@@ -0,0 +1,66 @@
+/**
+ * Structural subset of the `@openai/codex-sdk` event types that the stream
+ * translator consumes.
+ *
+ * These are intentionally defined structurally (rather than imported from the
+ * Codex SDK) so the translator stays a pure, fixture-testable state machine
+ * and the package's public types don't depend on the SDK's type exports.
+ * Unknown item or event types fall through every branch at runtime.
+ */
+
+export interface CodexUsage {
+  input_tokens?: number // reported as promptTokens (0 when absent)
+  cached_input_tokens?: number // reported as promptTokensDetails.cachedTokens when non-zero
+  output_tokens?: number // reported as completionTokens (0 when absent)
+  reasoning_output_tokens?: number // reported as completionTokensDetails.reasoningTokens when non-zero
+}
+
+export interface CodexMcpToolCallResult {
+  content?: Array<{ type: string; text?: string; [key: string]: unknown }> // string `text` values are concatenated into the tool result
+  structured_content?: unknown // JSON-serialized as the tool result only when no text was found
+}
+
+export type CodexThreadItem =
+  | { id: string; type: 'agent_message'; text: string } // translated to one TEXT_MESSAGE start/content/end burst
+  | { id: string; type: 'reasoning'; text: string } // translated to one REASONING start/content/end burst
+  | {
+      id: string
+      type: 'command_execution'
+      command: string
+      aggregated_output?: string
+      exit_code?: number
+      status: string // 'failed' marks the tool result as an error
+    }
+  | {
+      id: string
+      type: 'file_change'
+      changes: Array<{ path: string; kind: string }>
+      status: string // 'failed' marks the tool result as an error
+    }
+  | {
+      id: string
+      type: 'mcp_tool_call'
+      server: string
+      tool: string
+      arguments?: unknown
+      result?: CodexMcpToolCallResult
+      error?: { message: string } // when present, its message becomes the (error) tool result
+      status: string
+    }
+  | { id: string; type: 'web_search'; query: string }
+  | {
+      id: string
+      type: 'todo_list'
+      items: Array<{ text: string; completed: boolean }>
+    }
+  | { id: string; type: 'error'; message: string } // not translated into a chunk; visible via onThreadEvent only
+
+export type CodexThreadEvent =
+  | { type: 'thread.started'; thread_id: string } // thread_id is re-emitted as the `codex.session-id` CUSTOM event
+  | { type: 'turn.started' } // ignored by the translator
+  | { type: 'turn.completed'; usage?: CodexUsage } // translated to RUN_FINISHED with finishReason 'stop'
+  | { type: 'turn.failed'; error?: { message?: string } } // translated to RUN_ERROR
+  | { type: 'item.started'; item: CodexThreadItem } // opens a tool call when the item is a tool item
+  | { type: 'item.updated'; item: CodexThreadItem } // ignored by the translator
+  | { type: 'item.completed'; item: CodexThreadItem } // emits the item's text, reasoning or tool result
+  | { type: 'error'; message: string } // translated to RUN_ERROR
diff --git a/packages/ai-codex/src/stream/translate.ts b/packages/ai-codex/src/stream/translate.ts
new file mode 100644
index 000000000..082e26ba3
--- /dev/null
+++ b/packages/ai-codex/src/stream/translate.ts
@@ -0,0 +1,381 @@
+import { EventType, buildBaseUsage } from '@tanstack/ai'
+import type { StreamChunk, TokenUsage } from '@tanstack/ai'
+import type { CodexThreadEvent, CodexThreadItem, CodexUsage } from './sdk-types'
+
+/** Name of the CUSTOM event carrying the Codex thread (session) id. */
+export const SESSION_ID_EVENT = 'codex.session-id'
+
+/** Server name used for bridged TanStack tools. */
+export const BRIDGED_MCP_SERVER_NAME = 'tanstack'
+
+export interface TranslateContext {
+  model: string // stamped on every emitted chunk
+  runId: string // carried by RUN_STARTED and RUN_FINISHED
+  threadId: string // carried by RUN_STARTED and RUN_FINISHED
+  parentRunId?: string // added to RUN_STARTED when defined
+  genId: () => string // supplies the messageId of each TOOL_CALL_RESULT chunk
+  /** Called as soon as the harness reports its thread id. */
+  onSessionId?: (sessionId: string) => void
+  /** Called for each raw SDK thread event, for logging. */
+  onThreadEvent?: (event: CodexThreadEvent) => void
+}
+
+/**
+ * Pick the AG-UI tool-call name for a Codex thread item.
+ *
+ * - `mcp_tool_call` on the bridged `tanstack` server: the bare tool name,
+ *   i.e. the name the application registered.
+ * - `mcp_tool_call` on any other server: `mcp__<server>__<tool>`.
+ * - anything else: the item type verbatim (`command_execution`,
+ *   `file_change`, ...).
+ */
+export function toolNameForItem(item: CodexThreadItem): string {
+  if (item.type !== 'mcp_tool_call') return item.type
+  const { server, tool } = item
+  if (server === BRIDGED_MCP_SERVER_NAME) return tool
+  return `mcp__${server}__${tool}`
+}
+
+/** Thread items the translator surfaces as already-resolved tool calls. */
+type CodexToolItem = Extract<
+  CodexThreadItem,
+  {
+    type:
+      | 'command_execution'
+      | 'mcp_tool_call'
+      | 'file_change'
+      | 'web_search'
+      | 'todo_list'
+  }
+>
+
+/**
+ * Arguments reported for a harness tool call, taken from the item's own
+ * fields. `todo_list` items, and MCP calls that carry no arguments, report
+ * an empty object.
+ */
+function toolArgsForItem(item: CodexToolItem): unknown {
+  if (item.type === 'command_execution') return { command: item.command }
+  if (item.type === 'mcp_tool_call') return item.arguments ?? {}
+  if (item.type === 'file_change') return { changes: item.changes }
+  if (item.type === 'web_search') return { query: item.query }
+  if (item.type === 'todo_list') return {}
+  // Unreachable for typed input; matches a switch with no default branch.
+  return undefined
+}
+
+/** Result payload (content string + error flag) for a finished tool item. */
+function toolResultForItem(item: CodexToolItem): {
+  content: string
+  isError: boolean
+} {
+  switch (item.type) {
+    case 'command_execution': {
+      const payload = {
+        aggregated_output: item.aggregated_output ?? '',
+        ...(item.exit_code !== undefined && { exit_code: item.exit_code }),
+        status: item.status,
+      }
+      return {
+        content: JSON.stringify(payload),
+        isError: item.status === 'failed',
+      }
+    }
+    case 'mcp_tool_call': {
+      // An explicit error always wins, whatever the reported status.
+      if (item.error) return { content: item.error.message, isError: true }
+      const isError = item.status === 'failed'
+      let text = ''
+      for (const block of item.result?.content ?? []) {
+        if (typeof block.text === 'string') text += block.text
+      }
+      if (text !== '') return { content: text, isError }
+      // No text blocks: fall back to structured content, then bare status.
+      const structured = item.result?.structured_content
+      const fallback =
+        structured !== undefined ? structured : { status: item.status }
+      return { content: JSON.stringify(fallback), isError }
+    }
+    case 'file_change': {
+      const payload = { changes: item.changes, status: item.status }
+      return {
+        content: JSON.stringify(payload),
+        isError: item.status === 'failed',
+      }
+    }
+    // web_search items carry no status field; a fixed result is reported.
+    case 'web_search':
+      return {
+        content: JSON.stringify({ status: 'completed' }),
+        isError: false,
+      }
+    case 'todo_list':
+      return { content: JSON.stringify({ items: item.items }), isError: false }
+  }
+}
+
+/**
+ * Type guard for the item kinds surfaced as tool calls (positive checks only).
+ */
+function isToolItem(item: CodexThreadItem): item is CodexToolItem {
+  const { type } = item
+  if (type === 'command_execution' || type === 'mcp_tool_call') return true
+  if (type === 'file_change' || type === 'web_search') return true
+  return type === 'todo_list'
+}
+
+/** Converts Codex token usage into TanStack `TokenUsage`; `undefined` when absent. */
+function buildUsage(usage: CodexUsage | undefined): TokenUsage | undefined {
+  if (!usage) return undefined
+  const cached = usage.cached_input_tokens
+  const reasoning = usage.reasoning_output_tokens
+  const promptTokens = usage.input_tokens ?? 0
+  const completionTokens = usage.output_tokens ?? 0
+  const totals = buildBaseUsage({
+    promptTokens,
+    completionTokens,
+    totalTokens: promptTokens + completionTokens,
+  })
+  // Detail objects are attached only for non-zero counts.
+  if (cached) totals.promptTokensDetails = { cachedTokens: cached }
+  if (reasoning) {
+    totals.completionTokensDetails = { reasoningTokens: reasoning }
+  }
+  return totals
+}
+
+/**
+ * Translate a Codex SDK thread-event stream into AG-UI StreamChunk events.
+ *
+ * The harness runs its own agent loop and executes its own tools, so the
+ * translation always ends with `finishReason: 'stop'` (or RUN_ERROR) — never
+ * `'tool_calls'`. Harness tool activity (commands, file changes, MCP calls,
+ * web searches, todo lists) is emitted as already-resolved
+ * TOOL_CALL_START/ARGS/END + TOOL_CALL_RESULT sequences so UIs can render it
+ * while the TanStack engine never tries to execute them.
+ *
+ * Codex reports assistant text and reasoning only as completed items (no
+ * token-level deltas), so each `agent_message` / `reasoning` item becomes a
+ * single START/CONTENT/END burst.
+ *
+ * Invariant: every TOOL_CALL_START is eventually paired with a
+ * TOOL_CALL_RESULT (synthesized as `{"status":"interrupted"}` when the turn
+ * or the event stream ends, or iteration throws, before the harness reported
+ * one) so the next request's pending-tool-call scan never force-executes them.
+ */
+export async function* translateThreadEvents(
+  events: AsyncIterable<CodexThreadEvent>,
+  ctx: TranslateContext,
+): AsyncIterable<StreamChunk> {
+  const { model, runId, threadId, genId } = ctx
+  const now = () => Date.now()
+
+  let runStarted = false
+  /** Tool calls started but with no result yet. */
+  const unresolvedToolCalls = new Set<string>()
+  /** Item ids that already emitted TOOL_CALL_START/ARGS/END. */
+  const openedToolItems = new Set<string>()
+
+  function* startRun(): Generator<StreamChunk> {
+    if (runStarted) return
+    runStarted = true
+    yield {
+      type: EventType.RUN_STARTED,
+      runId,
+      threadId,
+      model,
+      timestamp: now(),
+      ...(ctx.parentRunId !== undefined && { parentRunId: ctx.parentRunId }),
+    }
+  }
+
+  function* synthesizeUnresolvedResults(): Generator<StreamChunk> {
+    for (const toolCallId of unresolvedToolCalls) {
+      yield {
+        type: EventType.TOOL_CALL_RESULT,
+        toolCallId,
+        messageId: genId(),
+        model,
+        timestamp: now(),
+        content: JSON.stringify({ status: 'interrupted' }),
+      }
+    }
+    unresolvedToolCalls.clear()
+  }
+
+  function* openToolCall(item: CodexToolItem): Generator<StreamChunk> {
+    if (openedToolItems.has(item.id)) return
+    openedToolItems.add(item.id)
+    const toolCallName = toolNameForItem(item)
+    const input = toolArgsForItem(item)
+    const args = JSON.stringify(input)
+    yield {
+      type: EventType.TOOL_CALL_START,
+      toolCallId: item.id,
+      toolCallName,
+      toolName: toolCallName,
+      model,
+      timestamp: now(),
+    }
+    yield {
+      type: EventType.TOOL_CALL_ARGS,
+      toolCallId: item.id,
+      model,
+      timestamp: now(),
+      delta: args,
+      args,
+    }
+    yield {
+      type: EventType.TOOL_CALL_END,
+      toolCallId: item.id,
+      toolCallName,
+      toolName: toolCallName,
+      model,
+      timestamp: now(),
+      input,
+    }
+    unresolvedToolCalls.add(item.id)
+  }
+
+  function* handleItemCompleted(item: CodexThreadItem): Generator<StreamChunk> {
+    if (item.type === 'agent_message') {
+      const messageId = item.id
+      yield {
+        type: EventType.TEXT_MESSAGE_START,
+        messageId,
+        model,
+        timestamp: now(),
+        role: 'assistant',
+      }
+      yield {
+        type: EventType.TEXT_MESSAGE_CONTENT,
+        messageId,
+        model,
+        timestamp: now(),
+        delta: item.text,
+        content: item.text,
+      }
+      yield {
+        type: EventType.TEXT_MESSAGE_END,
+        messageId,
+        model,
+        timestamp: now(),
+      }
+    } else if (item.type === 'reasoning') {
+      const reasoningId = item.id
+      yield {
+        type: EventType.REASONING_START,
+        messageId: reasoningId,
+        model,
+        timestamp: now(),
+      }
+      yield {
+        type: EventType.REASONING_MESSAGE_START,
+        messageId: reasoningId,
+        role: 'reasoning' as const,
+        model,
+        timestamp: now(),
+      }
+      yield {
+        type: EventType.REASONING_MESSAGE_CONTENT,
+        messageId: reasoningId,
+        delta: item.text,
+        model,
+        timestamp: now(),
+      }
+      yield {
+        type: EventType.REASONING_MESSAGE_END,
+        messageId: reasoningId,
+        model,
+        timestamp: now(),
+      }
+      yield {
+        type: EventType.REASONING_END,
+        messageId: reasoningId,
+        model,
+        timestamp: now(),
+      }
+    } else if (isToolItem(item)) {
+      yield* openToolCall(item)
+      unresolvedToolCalls.delete(item.id)
+      const { content, isError } = toolResultForItem(item)
+      yield {
+        type: EventType.TOOL_CALL_RESULT,
+        toolCallId: item.id,
+        messageId: genId(),
+        model,
+        timestamp: now(),
+        content,
+        ...(isError && { state: 'output-error' as const }),
+      }
+    }
+    // `error` items are non-fatal diagnostics; `turn.failed` is the fatal
+    // signal. They are surfaced via onThreadEvent logging only.
+  }
+
+  try {
+    for await (const event of events) {
+      ctx.onThreadEvent?.(event)
+
+      if (event.type === 'thread.started') {
+        yield* startRun()
+        ctx.onSessionId?.(event.thread_id)
+        yield {
+          type: EventType.CUSTOM,
+          model,
+          timestamp: now(),
+          name: SESSION_ID_EVENT,
+          value: { sessionId: event.thread_id },
+        }
+        continue
+      }
+
+      // Resumed threads don't re-emit thread.started; anything else still
+      // needs RUN_STARTED first.
+      yield* startRun()
+
+      if (event.type === 'item.started') {
+        if (isToolItem(event.item)) {
+          yield* openToolCall(event.item)
+        }
+      } else if (event.type === 'item.completed') {
+        yield* handleItemCompleted(event.item)
+      } else if (event.type === 'turn.completed') {
+        yield* synthesizeUnresolvedResults()
+        const usage = buildUsage(event.usage)
+        yield {
+          type: EventType.RUN_FINISHED,
+          runId,
+          threadId,
+          model,
+          timestamp: now(),
+          finishReason: 'stop',
+          ...(usage !== undefined && { usage }),
+        }
+      } else if (event.type === 'turn.failed' || event.type === 'error') {
+        yield* synthesizeUnresolvedResults()
+        const message =
+          event.type === 'turn.failed'
+            ? (event.error?.message ?? 'Codex turn failed')
+            : event.message
+        yield {
+          type: EventType.RUN_ERROR,
+          model,
+          timestamp: now(),
+          message,
+          error: { message },
+        }
+      }
+      // turn.started and item.updated are intentionally dropped: long-running
+      // items resolve via item.completed (streamed output is not forwarded).
+    }
+    // Stream ended without a terminal turn event: still pair started tool calls.
+    yield* synthesizeUnresolvedResults()
+  } catch (error) {
+    // The run is dying (abort or SDK failure). Pair started tool calls with a
+    // synthetic result so the next request's pending-tool-call scan doesn't
+    // try to execute them; the adapter then surfaces the error as RUN_ERROR.
+    yield* synthesizeUnresolvedResults()
+    throw error
+  }
+}
diff --git a/packages/ai-codex/tests/policy-map.test.ts b/packages/ai-codex/tests/policy-map.test.ts
new file mode 100644
index 000000000..0420c361f
--- /dev/null
+++ b/packages/ai-codex/tests/policy-map.test.ts
@@ -0,0 +1,56 @@
+import { describe, expect, it } from 'vitest'
+import { defineSandboxPolicy } from '@tanstack/ai-sandbox'
+import { mapPolicyToCodexFlags } from '../src/adapters/policy-map'
+
+describe('mapPolicyToCodexFlags', () => { // pins the sandbox-policy → Codex flag mapping
+  it('returns no flags for no policy', () => {
+    expect(mapPolicyToCodexFlags(undefined)).toEqual({}) // undefined policy → empty flags object
+  })
+
+  it('maps fileWrite deny to read-only sandbox mode', () => {
+    const flags = mapPolicyToCodexFlags(
+      defineSandboxPolicy({ capabilities: { fileWrite: 'deny' } }),
+    )
+    expect(flags.sandboxMode).toBe('read-only')
+  })
+
+  it('maps network capability to network_access', () => {
+    expect(
+      mapPolicyToCodexFlags(
+        defineSandboxPolicy({ capabilities: { network: 'allow' } }),
+      ).networkAccessEnabled,
+    ).toBe(true) // network: 'allow'
+    expect(
+      mapPolicyToCodexFlags(
+        defineSandboxPolicy({ capabilities: { network: 'deny' } }),
+      ).networkAccessEnabled,
+    ).toBe(false) // network: 'deny'
+  })
+
+  it('maps a fully-permissive policy to approval_policy=never', () => {
+    expect(
+      mapPolicyToCodexFlags(defineSandboxPolicy({ default: 'allow' }))
+        .approvalPolicy,
+    ).toBe('never')
+  })
+
+  it('maps a default-deny policy to approval_policy=untrusted', () => {
+    expect(
+      mapPolicyToCodexFlags(defineSandboxPolicy({ default: 'deny' }))
+        .approvalPolicy,
+    ).toBe('untrusted')
+  })
+
+  it('maps ask/deny command rules to approval_policy=on-request', () => {
+    expect(
+      mapPolicyToCodexFlags(
+        defineSandboxPolicy({ commands: { ask: ['pnpm *'] } }),
+      ).approvalPolicy,
+    ).toBe('on-request') // a single ask rule is enough
+    expect(
+      mapPolicyToCodexFlags(
+        defineSandboxPolicy({ default: 'allow', commands: { deny: ['rm *'] } }),
+      ).approvalPolicy,
+    ).toBe('on-request') // a deny rule yields on-request even with default: 'allow'
+  })
+})
diff --git a/packages/ai-codex/tests/prompt.test.ts b/packages/ai-codex/tests/prompt.test.ts
new file mode 100644
index 000000000..6e8dfcdf3
--- /dev/null
+++ b/packages/ai-codex/tests/prompt.test.ts
@@ -0,0 +1,97 @@
+import { describe, expect, it } from 'vitest'
+import { buildPrompt } from '../src/messages/prompt'
+import type { ModelMessage } from '@tanstack/ai'
+
+const user = (content: ModelMessage['content']): ModelMessage => ({
+  role: 'user', // fixture factory: wraps `content` as a user-role message
+  content,
+})
+const assistant = (content: ModelMessage['content']): ModelMessage => ({
+  role: 'assistant', // fixture factory: wraps `content` as an assistant-role message
+  content,
+})
+
+describe('buildPrompt', () => { // covers the resume path (sessionId given) and the fresh path (undefined)
+  it('resumes with only the last user message when sessionId is provided', () => {
+    const result = buildPrompt(
+      [
+        user('first question'),
+        assistant('first answer'),
+        user('follow-up question'),
+      ],
+      'sess-1', // sessionId → resume path
+    )
+    expect(result).toEqual({
+      prompt: 'follow-up question', // earlier turns are not replayed
+      resume: 'sess-1',
+    })
+  })
+
+  it('throws when sessionId is provided but there is no trailing user message', () => {
+    expect(() => buildPrompt([user('q'), assistant('a')], 'sess-1')).toThrow(
+      /user message/i, // history ends on an assistant turn, so there is nothing to send
+    )
+  })
+
+  it('sends a single user message as-is for a fresh session', () => {
+    expect(buildPrompt([user('hello')], undefined)).toEqual({
+      prompt: 'hello', // toEqual also pins that no `resume` key is set
+    })
+  })
+
+  it('flattens prior turns into a transcript preamble for fresh multi-turn history', () => {
+    const { prompt, resume } = buildPrompt(
+      [user('What is 2+2?'), assistant('4'), user('And times 3?')],
+      undefined,
+    )
+    expect(resume).toBeUndefined() // fresh path never returns a resume id
+    expect(prompt).toBe(
+      'Previous conversation:\nUser: What is 2+2?\nAssistant: 4\n\nAnd times 3?',
+    )
+  })
+
+  it('skips tool messages and assistant tool-call-only turns when flattening', () => {
+    const messages: Array<ModelMessage> = [
+      user('list files'),
+      {
+        role: 'assistant',
+        content: null, // tool-call-only turn: no text to put in the transcript
+        toolCalls: [
+          {
+            id: 't1',
+            type: 'function',
+            function: { name: 'ls', arguments: '{}' },
+          },
+        ],
+      } as unknown as ModelMessage,
+      { role: 'tool', content: 'file-a', toolCallId: 't1' }, // tool result: expected to be omitted
+      assistant('There is one file.'),
+      user('thanks, which one?'),
+    ]
+    const { prompt } = buildPrompt(messages, undefined)
+    expect(prompt).toBe(
+      'Previous conversation:\nUser: list files\nAssistant: There is one file.\n\nthanks, which one?',
+    )
+  })
+
+  it('extracts text from content-part arrays and ignores non-text parts', () => {
+    const { prompt } = buildPrompt(
+      [
+        user([
+          { type: 'text', content: 'describe ' },
+          {
+            type: 'image',
+            source: { type: 'url', url: 'https://x/y.png' },
+          } as never, // non-text part: expected to be dropped from the prompt
+          { type: 'text', content: 'this' },
+        ] as ModelMessage['content']),
+      ],
+      undefined,
+    )
+    expect(prompt).toBe('describe this') // text parts are joined with no separator
+  })
+
+  it('throws when there is no usable user content at all', () => {
+    expect(() => buildPrompt([], undefined)).toThrow(/user message/i) // empty history
+  })
+})
diff --git a/packages/ai-codex/tests/text-adapter.test.ts b/packages/ai-codex/tests/text-adapter.test.ts
new file mode 100644
index 000000000..ba0e9fae1
--- /dev/null
+++ b/packages/ai-codex/tests/text-adapter.test.ts
@@ -0,0 +1,107 @@
+/**
+ * Deterministic test of the in-sandbox Codex adapter.
+ *
+ * Runs a FAKE codex CLI (a node script that reads the prompt from stdin and
+ * emits canned `codex exec --experimental-json` JSONL thread events) inside a
+ * real local-process sandbox, exercising spawn → stdout NDJSON → translate →
+ * StreamChunk. The real `codex` CLI is covered by the gated live path.
+ */
+import { afterAll, describe, expect, it } from 'vitest'
+import * as fsp from 'node:fs/promises'
+import * as os from 'node:os'
+import * as path from 'node:path'
+import { localProcessSandbox } from '@tanstack/ai-sandbox-local-process'
+import { SandboxCapability } from '@tanstack/ai-sandbox'
+import { codexText } from '../src/index'
+import type { InternalLogger } from '@tanstack/ai/adapter-internals'
+import type { CapabilityContext, StreamChunk } from '@tanstack/ai'
+import type { SandboxHandle } from '@tanstack/ai-sandbox'
+
+const baseDir = path.join(os.tmpdir(), `tanstack-ai-codex-test-${Date.now()}`)
+const provider = localProcessSandbox({ baseDir, removeOnDestroy: true })
+
+afterAll(async () => {
+  await fsp.rm(baseDir, { recursive: true, force: true })
+})
+
+// Script source standing in for `codex exec --experimental-json`: ignores argv,
+// buffers stdin to EOF, then prints a canned thread-event sequence as JSONL.
+const FAKE_CODEX = [
+  `let input = ''`,
+  `process.stdin.on('data', (d) => { input += d })`,
+  `process.stdin.on('end', () => {`,
+  `  const w = (o) => process.stdout.write(JSON.stringify(o) + '\\n')`,
+  `  w({ type: 'thread.started', thread_id: 'th-1' })`,
+  `  w({ type: 'turn.started' })`,
+  `  w({ type: 'item.completed', item: { id: 'i1', type: 'agent_message', text: 'pong' } })`,
+  `  w({ type: 'turn.completed', usage: { input_tokens: 1, output_tokens: 1 } })`,
+  `})`,
+].join('\n') // one script line per array entry
+
+const noopLogger = { // silent logger stub: every channel below is a no-op
+  request: () => {},
+  provider: () => {},
+  errors: () => {},
+  agentLoop: () => {},
+  warnings: () => {},
+  debug: () => {},
+} as unknown as InternalLogger // cast: the stub is not built through the real logger type
+
+function capabilityContextWith(handle: SandboxHandle): CapabilityContext { // test context carrying `handle`
+  const [, provideSandbox] = SandboxCapability // second tuple entry is used as the "provide" function
+  const ctx = {
+    capabilities: { markProvided: () => {}, has: () => true }, // stub registry: has() always says yes
+  } as unknown as CapabilityContext
+  provideSandbox(ctx, handle) // attach the sandbox handle to the stub context
+  return ctx
+}
+
+async function collect( // drains a chunk stream into an array
+  stream: AsyncIterable<StreamChunk>,
+): Promise<Array<StreamChunk>> {
+  const out: Array<StreamChunk> = []
+  for await (const chunk of stream) out.push(chunk) // arrival order is preserved
+  return out
+}
+
+describe('codex in-sandbox adapter', () => {
+  it('spawns codex in the sandbox and streams translated events', async () => {
+    const sbx = await provider.create({}) // real local-process sandbox
+    try {
+      await sbx.fs.write('/workspace/fake-codex.mjs', FAKE_CODEX)
+      const adapter = codexText('gpt-5.5-codex', {
+        codexExecutable: 'node fake-codex.mjs', // run the fake CLI, not codex
+      })
+      const chunks = await collect(
+        adapter.chatStream({
+          model: 'gpt-5.5-codex',
+          messages: [{ role: 'user', content: 'say pong' }],
+          logger: noopLogger,
+          capabilities: capabilityContextWith(sbx),
+        }),
+      )
+      expect((chunks[0] as { type: string }).type).toBe('RUN_STARTED')
+      const text = chunks
+        .filter((c) => c.type === 'TEXT_MESSAGE_CONTENT')
+        .map((c) => (c as { delta?: string }).delta ?? '')
+        .join('')
+      expect(text).toContain('pong')
+      expect(chunks.some((c) => c.type === 'RUN_FINISHED')).toBe(true)
+    } finally {
+      await sbx.destroy() // always runs, even when an assertion above throws
+    }
+  })
+
+  it('requires a sandbox capability', async () => {
+    const adapter = codexText('gpt-5.5-codex')
+    const chunks = await collect(
+      adapter.chatStream({
+        model: 'gpt-5.5-codex',
+        messages: [{ role: 'user', content: 'hi' }],
+        logger: noopLogger, // no `capabilities` passed, so no sandbox is provided
+      }),
+    )
+    const err = chunks.find((c) => c.type === 'RUN_ERROR')
+    expect((err as { message?: string }).message).toMatch(/requires a sandbox/i)
+  })
+})
diff --git a/packages/ai-codex/tests/translate.test.ts b/packages/ai-codex/tests/translate.test.ts
new file mode 100644
index 000000000..b76e1d48f
--- /dev/null
+++ b/packages/ai-codex/tests/translate.test.ts
@@ -0,0 +1,454 @@
+import { describe, expect, it } from 'vitest'
+import {
+  SESSION_ID_EVENT,
+  toolNameForItem,
+  translateThreadEvents,
+} from '../src/stream/translate'
+import type { TranslateContext } from '../src/stream/translate'
+import type { CodexThreadEvent } from '../src/stream/sdk-types'
+import type { StreamChunk } from '@tanstack/ai'
+
+function makeCtx(overrides: Partial<TranslateContext> = {}): TranslateContext { // default translate context
+  let id = 0 // per-context counter, so generated ids are deterministic
+  return {
+    model: 'gpt-5.1-codex',
+    runId: 'run-1',
+    threadId: 'thread-1',
+    genId: () => `gen-${++id}`, // gen-1, gen-2, …
+    ...overrides, // spread last: caller-supplied fields win over the defaults
+  }
+}
+
+async function* fromArray( // replays fixture events as an async stream
+  events: Array<CodexThreadEvent>,
+): AsyncIterable<CodexThreadEvent> {
+  for (const event of events) yield event // same order as the input array
+}
+
+async function collect( // runs fixture events through translateThreadEvents and gathers the chunks
+  events: Array<CodexThreadEvent>,
+  ctx: TranslateContext = makeCtx(), // fresh default context per call unless one is passed
+): Promise<Array<StreamChunk>> {
+  const chunks: Array<StreamChunk> = []
+  for await (const chunk of translateThreadEvents(fromArray(events), ctx)) {
+    chunks.push(chunk) // emission order is preserved for the order-sensitive assertions
+  }
+  return chunks
+}
+
+const started: CodexThreadEvent = { // shared fixture: first event of a fresh thread
+  type: 'thread.started',
+  thread_id: 'sess-1', // the tests expect this back as the session id
+}
+
+const completedTurn: CodexThreadEvent = { // shared fixture: successful end of turn with usage
+  type: 'turn.completed',
+  usage: {
+    input_tokens: 100, // asserted below as promptTokens
+    cached_input_tokens: 40, // asserted below as promptTokensDetails.cachedTokens
+    output_tokens: 20, // asserted below as completionTokens (totalTokens is 120)
+    reasoning_output_tokens: 5, // asserted below as completionTokensDetails.reasoningTokens
+  },
+}
+
+describe('translateThreadEvents', () => {
+  it('translates a simple text turn', async () => {
+    const chunks = await collect([
+      started,
+      { type: 'turn.started' },
+      {
+        type: 'item.completed',
+        item: { id: 'item-1', type: 'agent_message', text: 'hi there' },
+      },
+      completedTurn,
+    ])
+
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'TEXT_MESSAGE_START',
+      'TEXT_MESSAGE_CONTENT',
+      'TEXT_MESSAGE_END',
+      'RUN_FINISHED',
+    ])
+    expect(chunks[1]).toMatchObject({
+      name: SESSION_ID_EVENT,
+      value: { sessionId: 'sess-1' },
+    })
+    expect(chunks[3]).toMatchObject({ delta: 'hi there', content: 'hi there' })
+    expect(chunks.at(-1)).toMatchObject({ finishReason: 'stop' })
+  })
+
+  it('reports usage with cache and reasoning details', async () => {
+    const chunks = await collect([started, completedTurn])
+    const finished = chunks.at(-1) as unknown as {
+      usage: Record<string, unknown>
+    }
+    expect(finished.usage).toMatchObject({
+      promptTokens: 100,
+      completionTokens: 20,
+      totalTokens: 120,
+      promptTokensDetails: { cachedTokens: 40 },
+      completionTokensDetails: { reasoningTokens: 5 },
+    })
+  })
+
+  it('notifies onSessionId and forwards raw events to onThreadEvent', async () => {
+    const sessionIds: Array<string> = []
+    const raw: Array<string> = []
+    await collect(
+      [started, completedTurn],
+      makeCtx({
+        onSessionId: (id) => sessionIds.push(id),
+        onThreadEvent: (event) => raw.push(event.type),
+      }),
+    )
+    expect(sessionIds).toEqual(['sess-1'])
+    expect(raw).toEqual(['thread.started', 'turn.completed'])
+  })
+
+  it('starts the run without a session event on resumed threads', async () => {
+    const chunks = await collect([
+      { type: 'turn.started' },
+      {
+        type: 'item.completed',
+        item: { id: 'item-1', type: 'agent_message', text: 'resumed' },
+      },
+      completedTurn,
+    ])
+    expect(chunks[0]).toMatchObject({ type: 'RUN_STARTED' })
+    expect(chunks.some((c) => c.type === 'CUSTOM')).toBe(false)
+  })
+
+  it('translates reasoning items into a reasoning burst', async () => {
+    const chunks = await collect([
+      started,
+      {
+        type: 'item.completed',
+        item: { id: 'item-r', type: 'reasoning', text: 'thinking...' },
+      },
+      completedTurn,
+    ])
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'REASONING_START',
+      'REASONING_MESSAGE_START',
+      'REASONING_MESSAGE_CONTENT',
+      'REASONING_MESSAGE_END',
+      'REASONING_END',
+      'RUN_FINISHED',
+    ])
+  })
+
+  it('pairs command executions across item.started and item.completed', async () => {
+    const chunks = await collect([
+      started,
+      {
+        type: 'item.started',
+        item: {
+          id: 'cmd-1',
+          type: 'command_execution',
+          command: 'ls -la',
+          status: 'in_progress',
+        },
+      },
+      {
+        type: 'item.completed',
+        item: {
+          id: 'cmd-1',
+          type: 'command_execution',
+          command: 'ls -la',
+          aggregated_output: 'file.txt',
+          exit_code: 0,
+          status: 'completed',
+        },
+      },
+      completedTurn,
+    ])
+
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'TOOL_CALL_START',
+      'TOOL_CALL_ARGS',
+      'TOOL_CALL_END',
+      'TOOL_CALL_RESULT',
+      'RUN_FINISHED',
+    ])
+    expect(chunks[2]).toMatchObject({
+      toolCallId: 'cmd-1',
+      toolCallName: 'command_execution',
+    })
+    expect(chunks[3]).toMatchObject({
+      args: JSON.stringify({ command: 'ls -la' }),
+    })
+    const result = chunks[5] as { content: string; state?: string }
+    expect(JSON.parse(result.content)).toMatchObject({
+      aggregated_output: 'file.txt',
+      exit_code: 0,
+      status: 'completed',
+    })
+    expect(result.state).toBeUndefined()
+  })
+
+  it('marks failed command executions as output-error', async () => {
+    const chunks = await collect([
+      started,
+      {
+        type: 'item.completed',
+        item: {
+          id: 'cmd-2',
+          type: 'command_execution',
+          command: 'false',
+          aggregated_output: '',
+          exit_code: 1,
+          status: 'failed',
+        },
+      },
+      completedTurn,
+    ])
+    const result = chunks.find((c) => c.type === 'TOOL_CALL_RESULT')
+    expect(result).toMatchObject({ state: 'output-error' })
+  })
+
+  it('emits a full tool pair when item.completed arrives without item.started', async () => {
+    const chunks = await collect([
+      started,
+      {
+        type: 'item.completed',
+        item: {
+          id: 'fc-1',
+          type: 'file_change',
+          changes: [{ path: 'a.ts', kind: 'update' }],
+          status: 'completed',
+        },
+      },
+      completedTurn,
+    ])
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'TOOL_CALL_START',
+      'TOOL_CALL_ARGS',
+      'TOOL_CALL_END',
+      'TOOL_CALL_RESULT',
+      'RUN_FINISHED',
+    ])
+    expect(chunks[2]).toMatchObject({ toolCallName: 'file_change' })
+  })
+
+  it('does not duplicate START events when both started and completed fire', async () => {
+    const chunks = await collect([
+      started,
+      {
+        type: 'item.started',
+        item: {
+          id: 'ws-1',
+          type: 'web_search',
+          query: 'tanstack ai',
+        },
+      },
+      {
+        type: 'item.completed',
+        item: { id: 'ws-1', type: 'web_search', query: 'tanstack ai' },
+      },
+      completedTurn,
+    ])
+    const startEvents = chunks.filter((c) => c.type === 'TOOL_CALL_START')
+    expect(startEvents).toHaveLength(1)
+  })
+
+  it('strips the tanstack server prefix from bridged MCP tool calls', async () => {
+    const chunks = await collect([
+      started,
+      {
+        type: 'item.completed',
+        item: {
+          id: 'mcp-1',
+          type: 'mcp_tool_call',
+          server: 'tanstack',
+          tool: 'lookup_user',
+          arguments: { userId: '7' },
+          result: { content: [{ type: 'text', text: '{"name":"Ada"}' }] },
+          status: 'completed',
+        },
+      },
+      completedTurn,
+    ])
+    expect(chunks.find((c) => c.type === 'TOOL_CALL_START')).toMatchObject({
+      toolCallName: 'lookup_user',
+    })
+    expect(chunks.find((c) => c.type === 'TOOL_CALL_RESULT')).toMatchObject({
+      content: '{"name":"Ada"}',
+    })
+  })
+
+  it('namespaces foreign MCP tool calls as mcp__server__tool', async () => {
+    expect(
+      toolNameForItem({
+        id: 'x',
+        type: 'mcp_tool_call',
+        server: 'github',
+        tool: 'create_issue',
+        status: 'completed',
+      }),
+    ).toBe('mcp__github__create_issue')
+  })
+
+  it('surfaces MCP tool errors as output-error results', async () => {
+    const chunks = await collect([
+      started,
+      {
+        type: 'item.completed',
+        item: {
+          id: 'mcp-2',
+          type: 'mcp_tool_call',
+          server: 'tanstack',
+          tool: 'boom',
+          error: { message: 'kaboom' },
+          status: 'failed',
+        },
+      },
+      completedTurn,
+    ])
+    expect(chunks.find((c) => c.type === 'TOOL_CALL_RESULT')).toMatchObject({
+      content: 'kaboom',
+      state: 'output-error',
+    })
+  })
+
+  it('ignores item.updated events', async () => {
+    const chunks = await collect([
+      started,
+      {
+        type: 'item.started',
+        item: {
+          id: 'todo-1',
+          type: 'todo_list',
+          items: [{ text: 'step 1', completed: false }],
+        },
+      },
+      {
+        type: 'item.updated',
+        item: {
+          id: 'todo-1',
+          type: 'todo_list',
+          items: [{ text: 'step 1', completed: true }],
+        },
+      },
+      {
+        type: 'item.completed',
+        item: {
+          id: 'todo-1',
+          type: 'todo_list',
+          items: [{ text: 'step 1', completed: true }],
+        },
+      },
+      completedTurn,
+    ])
+    expect(chunks.filter((c) => c.type === 'TOOL_CALL_ARGS')).toHaveLength(1)
+    expect(chunks.filter((c) => c.type === 'TOOL_CALL_RESULT')).toHaveLength(1)
+  })
+
+  it('synthesizes interrupted results for unresolved tool calls on turn.completed', async () => {
+    const chunks = await collect([
+      started,
+      {
+        type: 'item.started',
+        item: {
+          id: 'cmd-9',
+          type: 'command_execution',
+          command: 'sleep 100',
+          status: 'in_progress',
+        },
+      },
+      completedTurn,
+    ])
+    const result = chunks.find((c) => c.type === 'TOOL_CALL_RESULT')
+    expect(result).toMatchObject({
+      toolCallId: 'cmd-9',
+      content: JSON.stringify({ status: 'interrupted' }),
+    })
+    expect(chunks.at(-1)).toMatchObject({ type: 'RUN_FINISHED' })
+  })
+
+  it('maps turn.failed to RUN_ERROR after synthesizing results', async () => {
+    const chunks = await collect([
+      started,
+      {
+        type: 'item.started',
+        item: {
+          id: 'cmd-8',
+          type: 'command_execution',
+          command: 'x',
+          status: 'in_progress',
+        },
+      },
+      { type: 'turn.failed', error: { message: 'model exploded' } },
+    ])
+    const types: Array<string> = chunks.map((c) => c.type)
+    expect(types.indexOf('TOOL_CALL_RESULT')).toBeLessThan(
+      types.indexOf('RUN_ERROR'),
+    )
+    expect(chunks.at(-1)).toMatchObject({
+      type: 'RUN_ERROR',
+      message: 'model exploded',
+    })
+  })
+
+  it('maps stream error events to RUN_ERROR', async () => {
+    const chunks = await collect([
+      started,
+      { type: 'error', message: 'stream broke' },
+    ])
+    expect(chunks.at(-1)).toMatchObject({
+      type: 'RUN_ERROR',
+      message: 'stream broke',
+    })
+  })
+
+  it('synthesizes results then rethrows when the source stream throws', async () => {
+    async function* failing(): AsyncIterable<CodexThreadEvent> {
+      yield started
+      yield {
+        type: 'item.started',
+        item: {
+          id: 'cmd-7',
+          type: 'command_execution',
+          command: 'x',
+          status: 'in_progress',
+        },
+      }
+      throw new Error('aborted')
+    }
+
+    const chunks: Array<StreamChunk> = []
+    await expect(async () => {
+      for await (const chunk of translateThreadEvents(failing(), makeCtx())) {
+        chunks.push(chunk)
+      }
+    }).rejects.toThrow('aborted')
+    expect(chunks.at(-1)).toMatchObject({
+      type: 'TOOL_CALL_RESULT',
+      toolCallId: 'cmd-7',
+      content: JSON.stringify({ status: 'interrupted' }),
+    })
+  })
+
+  it('ignores non-fatal error items', async () => {
+    const chunks = await collect([
+      started,
+      {
+        type: 'item.completed',
+        item: { id: 'err-1', type: 'error', message: 'transient hiccup' },
+      },
+      completedTurn,
+    ])
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'RUN_FINISHED',
+    ])
+  })
+})
diff --git a/packages/ai-codex/tsconfig.json b/packages/ai-codex/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-codex/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-codex/vite.config.ts b/packages/ai-codex/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-codex/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+const config = defineConfig({ // Vitest settings for this package
+  test: {
+    name: packageJson.name, // project name is taken from package.json
+    dir: './',
+    watch: false, // single run, no watch mode
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: [
+        'node_modules/',
+        'dist/',
+        'tests/',
+        '**/*.test.ts',
+        '**/*.config.ts',
+        '**/types.ts',
+      ],
+      include: ['src/**/*.ts'], // coverage is measured on source files only
+    },
+  },
+})
+
+export default mergeConfig( // test settings merged with the shared TanStack build config
+  config,
+  tanstackViteConfig({
+    entry: ['./src/index.ts'],
+    srcDir: './src',
+    cjs: false, // presumably skips the CommonJS build — confirm against @tanstack/vite-config
+  }),
+)
diff --git a/packages/ai-gemini-cli/README.md b/packages/ai-gemini-cli/README.md
new file mode 100644
index 000000000..46876a4dd
--- /dev/null
+++ b/packages/ai-gemini-cli/README.md
@@ -0,0 +1,18 @@
+# @tanstack/ai-gemini-cli
+
+Gemini CLI harness adapter for [TanStack AI](https://tanstack.com/ai) — run [Gemini CLI](https://github.com/google-gemini/gemini-cli) (via the Agent Client Protocol) as a chat backend with local tool execution, stateful coding sessions, and TanStack tool bridging.
+
+```typescript
+import { chat } from '@tanstack/ai'
+import { geminiCliText } from '@tanstack/ai-gemini-cli'
+
+const stream = chat({
+  adapter: geminiCliText('gemini-3-pro-preview', {
+    cwd: '/path/to/project',
+    permissionMode: 'acceptEdits',
+  }),
+  messages: [{ role: 'user', content: 'Fix the failing test.' }],
+})
+```
+
+Server-only (Node). Requires the `gemini` CLI to be installed (`npm i -g @google/gemini-cli`) and authenticated. See the [Gemini CLI adapter docs](https://tanstack.com/ai/latest/docs/adapters/gemini-cli) for sessions, tool bridging, permissions, and limitations.
diff --git a/packages/ai-gemini-cli/package.json b/packages/ai-gemini-cli/package.json
new file mode 100644
index 000000000..cefedbc4e
--- /dev/null
+++ b/packages/ai-gemini-cli/package.json
@@ -0,0 +1,61 @@
+{
+  "name": "@tanstack/ai-gemini-cli",
+  "version": "0.1.0",
+  "description": "Gemini CLI harness adapter for TanStack AI — run Gemini CLI as a chat backend with local tool execution and stateful sessions.",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-gemini-cli"
+  },
+  "keywords": [
+    "ai",
+    "ai-sdk",
+    "typescript",
+    "tanstack",
+    "google",
+    "gemini",
+    "gemini-cli",
+    "harness",
+    "agent",
+    "adapter",
+    "chat",
+    "tool-calling"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "dependencies": {
+    "@agentclientprotocol/sdk": "^0.25.0"
+  },
+  "peerDependencies": {
+    "@tanstack/ai": "workspace:^",
+    "@tanstack/ai-sandbox": "workspace:^"
+  },
+  "devDependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-sandbox": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-gemini-cli/src/adapters/text.ts b/packages/ai-gemini-cli/src/adapters/text.ts
new file mode 100644
index 000000000..513e0c1c2
--- /dev/null
+++ b/packages/ai-gemini-cli/src/adapters/text.ts
@@ -0,0 +1,364 @@
+import { EventType, normalizeSystemPrompts } from '@tanstack/ai'
+import { toRunErrorRawEvent } from '@tanstack/ai/adapter-internals'
+import { BaseTextAdapter } from '@tanstack/ai/adapters'
+import {
+  SandboxCapability,
+  buildApprovalRequestedEvent,
+  getSandbox,
+  hostForSandbox,
+  startHostToolBridge,
+} from '@tanstack/ai-sandbox'
+import { buildPrompt } from '../messages/prompt'
+import { startAcpSession } from '../process/acp-client'
+import { resolveInteractivePermission } from '../process/permissions'
+import { AsyncQueue } from '../stream/queue'
+import { translateAcpStream } from '../stream/translate'
+import type { HostToolBridge, SandboxHandle } from '@tanstack/ai-sandbox'
+import type {
+  StructuredOutputOptions,
+  StructuredOutputResult,
+} from '@tanstack/ai/adapters'
+import type {
+  DefaultMessageMetadataByModality,
+  Modality,
+  StreamChunk,
+  TextOptions,
+} from '@tanstack/ai'
+import type { AcpSessionHandle } from '../process/acp-client'
+import type {
+  GeminiCliPermissionMode,
+  PermissionHandler,
+} from '../process/permissions'
+import type { AcpStreamEvent } from '../stream/translate'
+import type { GeminiCliModel } from '../model-meta'
+import type { GeminiCliTextProviderOptions } from '../provider-options'
+
+const DEFAULT_WORKDIR = '/workspace'
+
+export interface GeminiCliTextConfig {
+  /** Working directory inside the sandbox. Defaults to `/workspace`. */
+  cwd?: string
+  /** Path/name of the Gemini CLI executable inside the sandbox. Defaults to `gemini`. */
+  executablePath?: string
+  /** Extra CLI arguments appended after `--acp -m <model>`; each is shell-quoted. */
+  extraArgs?: Array<string>
+  /** Extra environment variables for the gemini process inside the sandbox. */
+  env?: Record<string, string>
+  /**
+   * Gemini CLI permission mode. Defaults to `'default'`; set `'acceptEdits'` /
+   * `'bypassPermissions'` to let the harness edit files and run commands
+   * autonomously inside the sandbox.
+   */
+  permissionMode?: GeminiCliPermissionMode
+  /** Custom permission handler; replaces the adapter's default policy. */
+  onPermissionRequest?: PermissionHandler
+  /**
+   * ACP auth method to select before starting the session, e.g.
+   * `'oauth-personal'`, `'gemini-api-key'`, or `'vertex-ai'`. Overridable per
+   * call via `modelOptions.authMethodId`.
+   */
+  authMethodId?: string
+}
+
+/** Quote `value` as a single POSIX-shell word; embedded `'` becomes `'\''`. */
+function q(value: string): string {
+  return `'${value.replace(/'/g, `'\\''`)}'`
+}
+
+/**
+ * Text adapter that drives a `gemini --acp` process spawned inside the
+ * sandbox and translates its ACP session updates into stream chunks.
+ */
+export class GeminiCliTextAdapter<
+  TModel extends GeminiCliModel,
+> extends BaseTextAdapter<
+  TModel,
+  GeminiCliTextProviderOptions,
+  ReadonlyArray<Modality> & readonly ['text'],
+  DefaultMessageMetadataByModality,
+  ReadonlyArray<string>,
+  unknown,
+  never
+> {
+  readonly name = 'gemini-cli' as const
+
+  override readonly requires = [SandboxCapability] as const
+
+  // Agent runs inside the persistent sandbox; the engine can re-attach to the
+  // still-running process on resume (live re-attach verified with the real CLI;
+  // the engine seam is unit-tested).
+  readonly supportsReattach = true
+
+  private readonly adapterConfig: GeminiCliTextConfig
+
+  constructor(config: GeminiCliTextConfig, model: TModel) {
+    super({}, model)
+    this.adapterConfig = config
+  }
+
+  /** Sandbox for this call; throws when `options.capabilities` is missing. */
+  private sandboxFrom(
+    options: TextOptions<GeminiCliTextProviderOptions>,
+  ): SandboxHandle {
+    const ctx = options.capabilities
+    if (!ctx) {
+      throw new Error(
+        'Adapter "gemini-cli" requires a sandbox. Add withSandbox(defineSandbox({ ... })) to chat() middleware.',
+      )
+    }
+    return getSandbox(ctx)
+  }
+
+  /**
+   * Shell command line that starts the CLI in ACP mode. The model and every
+   * extra argument are single-quoted; `executablePath` is interpolated
+   * verbatim, so it must already be safe to place in a shell command.
+   */
+  private acpCommand(): string {
+    const exe = this.adapterConfig.executablePath ?? 'gemini'
+    const args = ['--acp', '-m', q(this.model)]
+    for (const arg of this.adapterConfig.extraArgs ?? []) args.push(q(arg))
+    return `${exe} ${args.join(' ')}`
+  }
+
+  /** Prepend the non-blank system prompts (blank-line separated) to `prompt`. */
+  private applySystemPrompts(
+    options: TextOptions<GeminiCliTextProviderOptions>,
+    prompt: string,
+  ): string {
+    const systemPrompts = normalizeSystemPrompts(options.systemPrompts)
+      .map((systemPrompt) => systemPrompt.content)
+      .filter((content) => content.trim() !== '')
+    if (systemPrompts.length === 0) return prompt
+    return `${systemPrompts.join('\n\n')}\n\n${prompt}`
+  }
+
+  /**
+   * Run one chat turn: bridge the caller's tools, spawn the CLI, open (or
+   * resume) an ACP session, send the prompt, and yield the translated stream.
+   *
+   * Failures are reported as a single `RUN_ERROR` chunk instead of being
+   * thrown. Teardown of the session and the tool bridge is attempted on exit.
+   */
+  async *chatStream(
+    options: TextOptions<GeminiCliTextProviderOptions>,
+  ): AsyncIterable<StreamChunk> {
+    const { logger } = options
+    let handle: AcpSessionHandle | undefined
+    let bridge: HostToolBridge | undefined
+    const externalSignal =
+      options.abortController?.signal ?? options.request?.signal ?? undefined
+    let onAbort: (() => void) | undefined
+
+    try {
+      const sandbox = this.sandboxFrom(options)
+      const cwd =
+        options.modelOptions?.cwd ?? this.adapterConfig.cwd ?? DEFAULT_WORKDIR
+
+      const modelOptions = options.modelOptions
+      const sessionId = modelOptions?.sessionId
+      const authMethodId =
+        modelOptions?.authMethodId ?? this.adapterConfig.authMethodId
+      const { prompt: resumePrompt } = buildPrompt(options.messages, sessionId)
+
+      // Bridge chat()-provided tools into the agent over MCP (ACP http server).
+      const bridgedToolNames = new Set(
+        (options.tools ?? []).map((tool) => tool.name),
+      )
+      if (options.tools && options.tools.length > 0) {
+        bridge = await startHostToolBridge(options.tools, {
+          hostForSandbox: hostForSandbox(sandbox.provider),
+          context: options.context,
+          ...(externalSignal ? { signal: externalSignal } : {}),
+        })
+      }
+
+      const runId = options.runId ?? this.generateId()
+      const threadId = options.threadId ?? this.generateId()
+      // Approval-requested events collected during the run (an `ask` action with
+      // no client decision yet) and emitted after the stream so the client can
+      // approve and re-run.
+      const approvalRequests: Array<StreamChunk> = []
+
+      const queue = new AsyncQueue<AcpStreamEvent>()
+      const mode =
+        modelOptions?.permissionMode ??
+        this.adapterConfig.permissionMode ??
+        'default'
+      const permissionHandler: PermissionHandler =
+        this.adapterConfig.onPermissionRequest ??
+        ((request) => {
+          const result = resolveInteractivePermission(
+            request,
+            mode,
+            bridgedToolNames,
+            options.approvals,
+          )
+          if (result.approvalId !== undefined) {
+            approvalRequests.push(
+              buildApprovalRequestedEvent({
+                approvalId: result.approvalId,
+                title:
+                  result.title ??
+                  request.toolCall.title ??
+                  request.toolCall.toolCallId,
+                threadId,
+                runId,
+                detail: { provider: 'gemini-cli' },
+              }),
+            )
+          }
+          return result.outcome
+        })
+
+      logger.request(
+        `activity=chat provider=gemini-cli model=${this.model} sandbox=${sandbox.provider} messages=${options.messages.length} resume=${sessionId ?? 'none'}`,
+        { provider: 'gemini-cli', model: this.model },
+      )
+
+      const proc = await sandbox.process.spawn(this.acpCommand(), {
+        cwd,
+        ...(this.adapterConfig.env ? { env: this.adapterConfig.env } : {}),
+        ...(externalSignal ? { signal: externalSignal } : {}),
+      })
+
+      handle = await startAcpSession({
+        process: proc,
+        cwd,
+        ...(authMethodId !== undefined && { authMethodId }),
+        ...(sessionId !== undefined && { resumeSessionId: sessionId }),
+        ...(bridge !== undefined && {
+          mcpServers: [
+            {
+              name: bridge.name,
+              url: bridge.url,
+              headers: [
+                { name: 'Authorization', value: `Bearer ${bridge.token}` },
+              ],
+            },
+          ],
+        }),
+        onUpdate: (update) => queue.push({ kind: 'update', update }),
+        onPermissionRequest: permissionHandler,
+      })
+      const session = handle
+
+      if (externalSignal !== undefined) {
+        onAbort = () => void session.cancel().catch(() => undefined)
+        if (externalSignal.aborted) onAbort()
+        else externalSignal.addEventListener('abort', onAbort, { once: true })
+      }
+
+      queue.push({ kind: 'session', sessionId: session.sessionId })
+
+      // A requested resume that did not happen (`session.resumed === false`)
+      // starts a fresh session, so send the flattened transcript instead of
+      // only the trailing user message.
+      const promptText = this.applySystemPrompts(
+        options,
+        session.resumed || sessionId === undefined
+          ? resumePrompt
+          : buildPrompt(options.messages, undefined).prompt,
+      )
+
+      session
+        .prompt(promptText)
+        .then(({ stopReason, usage }) => {
+          queue.push({
+            kind: 'done',
+            stopReason,
+            ...(usage !== undefined && { usage }),
+          })
+          queue.end()
+        })
+        .catch((error: unknown) => queue.fail(error))
+
+      yield* translateAcpStream(queue, {
+        model: this.model,
+        runId,
+        threadId,
+        ...(options.parentRunId !== undefined && {
+          parentRunId: options.parentRunId,
+        }),
+        genId: () => this.generateId(),
+        bridgedToolNames,
+        onAcpEvent: (event) =>
+          logger.provider(`provider=gemini-cli kind=${event.kind}`, {
+            chunk: event,
+          }),
+      })
+
+      // Surface any pending approval requests (ask-policy actions awaiting a
+      // client decision); the client approves and re-runs to continue.
+      for (const event of approvalRequests) yield event
+    } catch (error: unknown) {
+      // Anything can be thrown (`null`, a bare string, ...), so read `message`
+      // and `code` defensively instead of assuming an Error instance.
+      const err = (
+        typeof error === 'object' && error !== null ? error : {}
+      ) as { message?: string; code?: string }
+      const fallback =
+        typeof error === 'string' && error !== ''
+          ? error
+          : 'Unknown error occurred'
+      const message = err.message || fallback
+      const rawEvent = toRunErrorRawEvent(error)
+      logger.errors('gemini-cli.chatStream fatal', {
+        error,
+        source: 'gemini-cli.chatStream',
+      })
+      yield {
+        type: EventType.RUN_ERROR,
+        model: options.model,
+        timestamp: Date.now(),
+        message,
+        ...(err.code !== undefined && { code: err.code }),
+        ...(rawEvent !== undefined && { rawEvent }),
+        error: {
+          message,
+          ...(err.code !== undefined && { code: err.code }),
+        },
+      }
+    } finally {
+      if (externalSignal !== undefined && onAbort !== undefined) {
+        externalSignal.removeEventListener('abort', onAbort)
+      }
+      try {
+        await handle?.dispose()
+      } finally {
+        // Close the tool bridge even when disposing the session rejects, so a
+        // failed process teardown cannot leak the bridge.
+        await bridge?.close()
+      }
+    }
+  }
+
+  /** Not supported by this adapter; always rejects with an explanatory error. */
+  structuredOutput(
+    _options: StructuredOutputOptions<GeminiCliTextProviderOptions>,
+  ): Promise<StructuredOutputResult<unknown>> {
+    return Promise.reject(
+      new Error(
+        'Structured output is not yet supported by the in-sandbox Gemini CLI adapter. ' +
+          'Use a model adapter for structured output, or omit outputSchema.',
+      ),
+    )
+  }
+}
+
+/**
+ * Creates a Gemini CLI harness adapter that runs **inside a sandbox**.
+ *
+ * It declares `requires: [SandboxCapability]` and spawns `gemini --acp` inside
+ * the sandbox provided by `withSandbox(...)`, driving it over the Agent Client
+ * Protocol via the sandbox's duplex process IO. The sandbox image must provide
+ * the `gemini` executable, authenticated for headless use (or pass
+ * `authMethodId`). chat()-provided tools are exposed to the agent through a
+ * host tool bridge registered as an MCP server on the ACP session.
+ */
+export function geminiCliText<TModel extends GeminiCliModel>(
+  model: TModel,
+  config: GeminiCliTextConfig = {},
+): GeminiCliTextAdapter<TModel> {
+  return new GeminiCliTextAdapter(config, model)
+}
diff --git a/packages/ai-gemini-cli/src/index.ts b/packages/ai-gemini-cli/src/index.ts
new file mode 100644
index 000000000..a889644af
--- /dev/null
+++ b/packages/ai-gemini-cli/src/index.ts
@@ -0,0 +1,36 @@
+export { GeminiCliTextAdapter, geminiCliText } from './adapters/text'
+export type { GeminiCliTextConfig } from './adapters/text'
+export type { GeminiCliTextProviderOptions } from './provider-options'
+export { GEMINI_CLI_MODELS } from './model-meta'
+export type { GeminiCliModel, KnownGeminiCliModel } from './model-meta'
+export {
+  SESSION_ID_EVENT,
+  PLAN_EVENT,
+  BRIDGED_MCP_SERVER_NAME,
+  translateAcpStream,
+  matchBridgedToolName,
+} from './stream/translate'
+export type { AcpStreamEvent, TranslateContext } from './stream/translate'
+export type {
+  AcpPermissionOption,
+  AcpPermissionOutcome,
+  AcpPermissionRequest,
+  AcpSessionUpdate,
+  AcpStopReason,
+  AcpToolCallUpdate,
+  AcpUsage,
+} from './stream/acp-types'
+export { resolvePermission } from './process/permissions'
+export type {
+  GeminiCliPermissionMode,
+  PermissionHandler,
+} from './process/permissions'
+export { startAcpSession } from './process/acp-client'
+export type {
+  AcpSessionHandle,
+  StartAcpSessionOptions,
+} from './process/acp-client'
+export { buildPrompt } from './messages/prompt'
+export type { BuiltPrompt } from './messages/prompt'
+export { spawnHandleToAcpTransport } from './process/sandbox-transport'
+export type { AcpTransport } from './process/sandbox-transport'
diff --git a/packages/ai-gemini-cli/src/messages/prompt.ts b/packages/ai-gemini-cli/src/messages/prompt.ts
new file mode 100644
index 000000000..ad1b069a6
--- /dev/null
+++ b/packages/ai-gemini-cli/src/messages/prompt.ts
@@ -0,0 +1,69 @@
+import type { ModelMessage } from '@tanstack/ai'
+
+export interface BuiltPrompt {
+  prompt: string
+  /** Gemini CLI session id to resume, when the caller threaded one through. */
+  resume?: string
+}
+
+/** Join the text parts of a message's content; other part types add nothing. */
+function extractText(content: ModelMessage['content']): string {
+  if (content === null) return ''
+  if (typeof content === 'string') return content
+  let text = ''
+  for (const part of content) {
+    if (part.type === 'text' && typeof part.content === 'string') {
+      text += part.content
+    }
+  }
+  return text
+}
+
+/**
+ * Turn TanStack chat history into the prompt (and resume id) for the harness.
+ *
+ * When `sessionId` is given the harness is assumed to hold the earlier
+ * context already, so only the trailing user message is returned alongside
+ * `resume`. Otherwise earlier user/assistant turns that carry text are
+ * flattened into a `Previous conversation:` preamble; tool messages and
+ * text-less turns are dropped (prompts are text-only in v1).
+ *
+ * @throws Error when the last message is not a user message with text.
+ */
+export function buildPrompt(
+  messages: Array<ModelMessage>,
+  sessionId: string | undefined,
+): BuiltPrompt {
+  const trailing = messages.at(-1)
+  const lastUserText =
+    trailing !== undefined && trailing.role === 'user'
+      ? extractText(trailing.content).trim()
+      : ''
+
+  if (lastUserText === '') {
+    throw new Error(
+      'Gemini CLI adapter requires a trailing user message with text content.',
+    )
+  }
+
+  if (sessionId !== undefined) {
+    return { prompt: lastUserText, resume: sessionId }
+  }
+
+  const transcript: Array<string> = []
+  for (const message of messages.slice(0, -1)) {
+    if (message.role !== 'user' && message.role !== 'assistant') continue
+    const text = extractText(message.content).trim()
+    if (text === '') continue
+    const speaker = message.role === 'user' ? 'User' : 'Assistant'
+    transcript.push(`${speaker}: ${text}`)
+  }
+
+  if (transcript.length === 0) {
+    return { prompt: lastUserText }
+  }
+
+  return {
+    prompt: `Previous conversation:\n${transcript.join('\n')}\n\n${lastUserText}`,
+  }
+}
diff --git a/packages/ai-gemini-cli/src/model-meta.ts b/packages/ai-gemini-cli/src/model-meta.ts
new file mode 100644
index 000000000..039769910
--- /dev/null
+++ b/packages/ai-gemini-cli/src/model-meta.ts
@@ -0,0 +1,20 @@
+/**
+ * Models known to work with Gemini CLI. The harness accepts any Gemini model
+ * id (and the `auto` / `pro` / `flash` aliases resolved by the CLI), so this
+ * list exists for autocomplete — any string is accepted via the
+ * `(string & {})` escape hatch in {@link GeminiCliModel}.
+ */
+export const GEMINI_CLI_MODELS = [
+  'gemini-3-pro-preview',
+  'gemini-3-flash-preview',
+  'gemini-2.5-pro',
+  'gemini-2.5-flash',
+  'auto',
+  'pro',
+  'flash',
+] as const
+
+export type KnownGeminiCliModel = (typeof GEMINI_CLI_MODELS)[number]
+
+/** Any model id accepted by Gemini CLI; known ids get autocomplete. */
+export type GeminiCliModel = KnownGeminiCliModel | (string & {})
diff --git a/packages/ai-gemini-cli/src/process/acp-client.ts b/packages/ai-gemini-cli/src/process/acp-client.ts
new file mode 100644
index 000000000..51e7fd863
--- /dev/null
+++ b/packages/ai-gemini-cli/src/process/acp-client.ts
@@ -0,0 +1,196 @@
+import {
+  ClientSideConnection,
+  PROTOCOL_VERSION,
+  ndJsonStream,
+} from '@agentclientprotocol/sdk'
+import { spawnHandleToAcpTransport } from './sandbox-transport'
+import type {
+  Client,
+  McpServer,
+  RequestPermissionRequest,
+  RequestPermissionResponse,
+  SessionNotification,
+} from '@agentclientprotocol/sdk'
+import type { SpawnHandle } from '@tanstack/ai-sandbox'
+import type {
+  AcpPermissionOutcome,
+  AcpPermissionRequest,
+  AcpSessionUpdate,
+  AcpStopReason,
+  AcpUsage,
+} from '../stream/acp-types'
+
+/** A live ACP session backed by a `gemini --acp` process inside the sandbox. */
+export interface AcpSessionHandle {
+  sessionId: string
+  /** Whether an existing session was actually resumed via `session/load`. */
+  resumed: boolean
+  /** Run one prompt turn; resolves with the harness's stop reason. */
+  prompt: (
+    text: string,
+  ) => Promise<{ stopReason: AcpStopReason; usage?: AcpUsage }>
+  /** Ask the harness to cancel the in-flight prompt turn. */
+  cancel: () => Promise<void>
+  /** Tear down the process. */
+  dispose: () => Promise<void>
+}
+
+export interface StartAcpSessionOptions {
+  /** The already-spawned `gemini --acp` process (via sandbox.process.spawn). */
+  process: SpawnHandle
+  /** Working directory inside the sandbox (used for ACP session params). */
+  cwd: string
+  /**
+   * ACP auth method to select (via `authenticate`) before opening a session.
+   * The agent advertises the available method ids in its `initialize`
+   * response (e.g. `'oauth-personal'`, `'gemini-api-key'`, `'vertex-ai'`).
+   */
+  authMethodId?: string
+  /** MCP servers (e.g. a host tool bridge) for the session. */
+  mcpServers?: Array<{
+    name: string
+    url: string
+    headers?: Array<{ name: string; value: string }>
+  }>
+  /** Session id to resume via `session/load`, when supported by the CLI. */
+  resumeSessionId?: string
+  onUpdate: (update: AcpSessionUpdate) => void
+  onPermissionRequest: (
+    request: AcpPermissionRequest,
+  ) => Promise<AcpPermissionOutcome> | AcpPermissionOutcome
+}
+
+/**
+ * Open an ACP session on a `gemini --acp` process that was spawned in the
+ * sandbox, speaking the Agent Client Protocol over the process's stdio via a
+ * transport adapted from its {@link SpawnHandle}.
+ *
+ * Resume semantics: `session/load` is attempted only when `resumeSessionId`
+ * is given and the CLI advertises `loadSession`; updates replayed during the
+ * load are dropped. If loading is skipped or fails, a new session is created
+ * and the handle reports `resumed: false` so the adapter can send the
+ * flattened transcript instead.
+ */
+export async function startAcpSession(
+  options: StartAcpSessionOptions,
+): Promise<AcpSessionHandle> {
+  const transport = spawnHandleToAcpTransport(options.process)
+
+  /** True only while `session/load` replays history; gates `onUpdate`. */
+  let replaying = false
+
+  const client: Client = {
+    requestPermission: async (
+      params: RequestPermissionRequest,
+    ): Promise<RequestPermissionResponse> => ({
+      outcome: await options.onPermissionRequest(params),
+    }),
+    sessionUpdate: (params: SessionNotification): Promise<void> => {
+      if (replaying) return Promise.resolve()
+      options.onUpdate(params.update as AcpSessionUpdate)
+      return Promise.resolve()
+    },
+  }
+
+  const teardown = async (): Promise<void> => {
+    await transport.kill()
+  }
+
+  try {
+    const connection = new ClientSideConnection(
+      () => client,
+      ndJsonStream(transport.writable, transport.readable),
+    )
+
+    // Each request is raced against process exit so a dead CLI fails the call.
+    const untilExit = <T>(pending: Promise<T>): Promise<T> =>
+      Promise.race([pending, transport.exited])
+
+    const initResult = await untilExit(
+      connection.initialize({
+        protocolVersion: PROTOCOL_VERSION,
+        clientCapabilities: {
+          fs: { readTextFile: false, writeTextFile: false },
+        },
+      }),
+    )
+
+    const { authMethodId, cwd, resumeSessionId } = options
+    if (authMethodId !== undefined) {
+      const advertisedIds = (initResult.authMethods ?? []).map(
+        (method) => method.id,
+      )
+      if (!advertisedIds.includes(authMethodId)) {
+        throw new Error(
+          `Gemini CLI does not advertise the ACP auth method '${authMethodId}'. Available: ${
+            advertisedIds.join(', ') || '(none)'
+          }.`,
+        )
+      }
+      await untilExit(connection.authenticate({ methodId: authMethodId }))
+    }
+
+    const mcpServers: Array<McpServer> = []
+    for (const { name, url, headers } of options.mcpServers ?? []) {
+      mcpServers.push({
+        type: 'http' as const,
+        name,
+        url,
+        headers: headers ?? [],
+      })
+    }
+
+    let sessionId: string | undefined
+    let resumed = false
+    const canLoad = initResult.agentCapabilities?.loadSession === true
+    if (resumeSessionId !== undefined && canLoad) {
+      replaying = true
+      try {
+        await untilExit(
+          connection.loadSession({
+            sessionId: resumeSessionId,
+            cwd,
+            mcpServers,
+          }),
+        )
+        sessionId = resumeSessionId
+        resumed = true
+      } catch {
+        // Session unknown to this CLI install — fall through to a fresh one.
+      } finally {
+        replaying = false
+      }
+    }
+
+    if (sessionId === undefined) {
+      const created = await untilExit(
+        connection.newSession({ cwd, mcpServers }),
+      )
+      sessionId = created.sessionId
+    }
+    const activeSessionId: string = sessionId
+
+    return {
+      sessionId: activeSessionId,
+      resumed,
+      prompt: async (text: string) => {
+        const response = await untilExit(
+          connection.prompt({
+            sessionId: activeSessionId,
+            prompt: [{ type: 'text', text }],
+          }),
+        )
+        const turn: { stopReason: AcpStopReason; usage?: AcpUsage } = {
+          stopReason: response.stopReason,
+        }
+        if (response.usage != null) turn.usage = response.usage
+        return turn
+      },
+      cancel: () => connection.cancel({ sessionId: activeSessionId }),
+      dispose: teardown,
+    }
+  } catch (error) {
+    await teardown()
+    throw error
+  }
+}
diff --git a/packages/ai-gemini-cli/src/process/permissions.ts b/packages/ai-gemini-cli/src/process/permissions.ts
new file mode 100644
index 000000000..144274e25
--- /dev/null
+++ b/packages/ai-gemini-cli/src/process/permissions.ts
@@ -0,0 +1,115 @@
+import { approvalId } from '@tanstack/ai-sandbox'
+import { matchBridgedToolName } from '../stream/translate'
+import type {
+  AcpPermissionOutcome,
+  AcpPermissionRequest,
+} from '../stream/acp-types'
+
+/**
+ * Permission modes for the Gemini CLI adapter, mirroring the Claude Code
+ * adapter's semantics:
+ *
+ * - `'default'`: bridged TanStack tools run; anything else that asks for
+ *   permission is rejected with no prompt (a headless server must never
+ *   hang on an interactive question).
+ * - `'acceptEdits'`: additionally auto-approves file-mutation tools
+ *   (edit / move / delete kinds).
+ * - `'bypassPermissions'`: approves everything.
+ */
+export type GeminiCliPermissionMode =
+  | 'default'
+  | 'acceptEdits'
+  | 'bypassPermissions'
+
+/** Custom permission handler; replaces the adapter's default policy. */
+export type PermissionHandler = (
+  request: AcpPermissionRequest,
+) => Promise<AcpPermissionOutcome> | AcpPermissionOutcome
+
+const EDIT_KINDS = new Set(['edit', 'move', 'delete'])
+const ALLOW_OPTION_KINDS = ['allow_once', 'allow_always']
+const REJECT_OPTION_KINDS = ['reject_once', 'reject_always']
+
+/**
+ * Select the first offered option matching one of `kinds`, tried in priority
+ * order; answers `cancelled` when the request offers none of them.
+ */
+function pickOption(
+  request: AcpPermissionRequest,
+  kinds: Array<string>,
+): AcpPermissionOutcome {
+  for (const kind of kinds) {
+    for (const candidate of request.options) {
+      if (candidate.kind === kind) {
+        return { outcome: 'selected', optionId: candidate.optionId }
+      }
+    }
+  }
+  return { outcome: 'cancelled' }
+}
+
+/**
+ * Whether the bridge/mode policy approves a request outright: the tool is a
+ * bridged TanStack tool, the mode bypasses permissions, or the mode accepts
+ * edits and the tool call is an edit / move / delete.
+ */
+function allowedByPolicy(
+  request: AcpPermissionRequest,
+  mode: GeminiCliPermissionMode,
+  bridgedToolNames: ReadonlySet<string> | undefined,
+  title: Parameters<typeof matchBridgedToolName>[0],
+): boolean {
+  if (matchBridgedToolName(title, bridgedToolNames) !== undefined) return true
+  if (mode === 'bypassPermissions') return true
+  return mode === 'acceptEdits' && EDIT_KINDS.has(request.toolCall.kind ?? '')
+}
+
+/**
+ * The adapter's default permission policy. Answers synchronously with an
+ * allow or reject option (or `cancelled` when the request offers neither),
+ * so a headless server never waits on an interactive question.
+ */
+export function resolvePermission(
+  request: AcpPermissionRequest,
+  mode: GeminiCliPermissionMode,
+  bridgedToolNames: ReadonlySet<string> | undefined,
+): AcpPermissionOutcome {
+  const approved = allowedByPolicy(
+    request,
+    mode,
+    bridgedToolNames,
+    request.toolCall.title,
+  )
+  return pickOption(
+    request,
+    approved ? ALLOW_OPTION_KINDS : REJECT_OPTION_KINDS,
+  )
+}
+
+/**
+ * Interactive variant: when the bridge/mode policy would reject, consult the
+ * client's approval decisions. Returns the ACP outcome plus, when no decision
+ * has been recorded yet, the `approvalId`/`title` the adapter should surface
+ * via an `approval-requested` event (the client re-runs to grant it).
+ */
+export function resolveInteractivePermission(
+  request: AcpPermissionRequest,
+  mode: GeminiCliPermissionMode,
+  bridgedToolNames: ReadonlySet<string> | undefined,
+  approvals: ReadonlyMap<string, boolean> | undefined,
+): { outcome: AcpPermissionOutcome; approvalId?: string; title?: string } {
+  const title = request.toolCall.title ?? request.toolCall.toolCallId
+  if (allowedByPolicy(request, mode, bridgedToolNames, title)) {
+    return { outcome: pickOption(request, ALLOW_OPTION_KINDS) }
+  }
+
+  // Would reject — offer client-in-the-loop approval.
+  const id = approvalId({ provider: 'gemini-cli', kind: 'tool', target: title })
+  const decision = approvals?.get(id)
+  if (decision === true) {
+    return { outcome: pickOption(request, ALLOW_OPTION_KINDS) }
+  }
+  const rejection = pickOption(request, REJECT_OPTION_KINDS)
+  if (decision === false) return { outcome: rejection }
+  return { outcome: rejection, approvalId: id, title }
+}
diff --git a/packages/ai-gemini-cli/src/process/sandbox-transport.ts b/packages/ai-gemini-cli/src/process/sandbox-transport.ts
new file mode 100644
index 000000000..8890097ea
--- /dev/null
+++ b/packages/ai-gemini-cli/src/process/sandbox-transport.ts
@@ -0,0 +1,95 @@
+/**
+ * Adapt a sandbox {@link SpawnHandle} (duplex string IO) into the
+ * `{ writable, readable }` Uint8Array WebStreams that `@agentclientprotocol`'s
+ * `ndJsonStream` consumes. This is the ONLY new transport piece needed to run
+ * `gemini --acp` inside a sandbox instead of as a local child process — the ACP
+ * protocol handling is reused unchanged.
+ */
+import type { SpawnHandle } from '@tanstack/ai-sandbox'
+
+export interface AcpTransport {
+  /** Byte sink; each chunk is UTF-8 decoded and written to the process stdin. */
+  writable: WritableStream<Uint8Array>
+  /** Byte source; each stdout chunk is UTF-8 encoded and enqueued. */
+  readable: ReadableStream<Uint8Array>
+  /** Never resolves; rejects once the underlying process exits. */
+  exited: Promise<never>
+  /** Last 4096 characters of stderr, for error messages. */
+  stderrTail: () => string
+  /** Kill the underlying process. */
+  kill: () => Promise<void>
+}
+
+/**
+ * Build an {@link AcpTransport} over an already-spawned sandbox process.
+ *
+ * stdout is pumped into `readable`, writes to `writable` are forwarded to
+ * stdin, stderr is drained in the background into a bounded tail, and
+ * `exited` rejects when `handle.wait()` settles so callers can race pending
+ * protocol requests against process exit.
+ *
+ * @param handle - The spawned process whose stdio carries the ACP traffic.
+ * @returns The stream pair plus exit/stderr/kill helpers.
+ */
+export function spawnHandleToAcpTransport(handle: SpawnHandle): AcpTransport {
+  const encoder = new TextEncoder()
+  const decoder = new TextDecoder()
+
+  const readable = new ReadableStream<Uint8Array>({
+    async start(controller) {
+      try {
+        for await (const chunk of handle.stdout) {
+          controller.enqueue(encoder.encode(chunk))
+        }
+        controller.close()
+      } catch (error) {
+        controller.error(error)
+      }
+    },
+  })
+
+  const writable = new WritableStream<Uint8Array>({
+    write(chunk) {
+      // `stream: true` keeps a trailing partial UTF-8 sequence buffered, so a
+      // multi-byte character split across two chunks is not turned into U+FFFD.
+      return handle.stdin.write(decoder.decode(chunk, { stream: true }))
+    },
+    async close() {
+      // Flush whatever the streaming decoder still holds before closing stdin.
+      const rest = decoder.decode()
+      if (rest !== '') await handle.stdin.write(rest)
+      return handle.stdin.end()
+    },
+  })
+
+  // Drain stderr in the background, keeping only a bounded tail.
+  let tail = ''
+  void (async () => {
+    try {
+      for await (const chunk of handle.stderr) {
+        tail = (tail + chunk).slice(-4096)
+      }
+    } catch {
+      // stderr closed
+    }
+  })()
+
+  const exited: Promise<never> = handle.wait().then((code) => {
+    throw new Error(
+      `Gemini CLI exited unexpectedly (code ${code}).${
+        tail.trim() !== '' ? `\nstderr: ${tail.trim()}` : ''
+      }`,
+    )
+  })
+  // Mark the rejection handled so it isn't an unhandled rejection when the
+  // consumer wins the race (consumers still observe it via Promise.race).
+  void exited.catch(() => undefined)
+
+  return {
+    writable,
+    readable,
+    exited,
+    stderrTail: () => tail,
+    kill: () => handle.kill(),
+  }
+}
diff --git a/packages/ai-gemini-cli/src/provider-options.ts b/packages/ai-gemini-cli/src/provider-options.ts
new file mode 100644
index 000000000..3d74cdc18
--- /dev/null
+++ b/packages/ai-gemini-cli/src/provider-options.ts
@@ -0,0 +1,23 @@
+import type { GeminiCliPermissionMode } from './process/permissions'
+
+/**
+ * Per-call provider options for the Gemini CLI adapter, passed via
+ * `modelOptions` on `chat()`.
+ */
+export interface GeminiCliTextProviderOptions {
+  /**
+   * Resume an existing Gemini CLI session. The adapter emits the session id
+   * of every run via a CUSTOM `gemini-cli.session-id` stream event; thread
+   * it back here to continue that session (only the latest user message is
+   * sent — the harness already holds the prior context). If the installed
+   * CLI doesn't support session loading, the adapter falls back to a fresh
+   * session seeded with the flattened transcript.
+   */
+  sessionId?: string
+  /** Per-call override of the configured permission mode. */
+  permissionMode?: GeminiCliPermissionMode
+  /** Per-call override of the harness working directory. */
+  cwd?: string
+  /** Per-call override of the configured ACP auth method id. */
+  authMethodId?: string
+}
diff --git a/packages/ai-gemini-cli/src/stream/acp-types.ts b/packages/ai-gemini-cli/src/stream/acp-types.ts
new file mode 100644
index 000000000..c59c4aa9e
--- /dev/null
+++ b/packages/ai-gemini-cli/src/stream/acp-types.ts
@@ -0,0 +1,82 @@
+/**
+ * Structural subset of the Agent Client Protocol (ACP) types that the
+ * adapter consumes.
+ *
+ * These are intentionally defined structurally (rather than imported from
+ * `@agentclientprotocol/sdk`) so the stream translator stays a pure,
+ * fixture-testable state machine and the package's public types don't depend
+ * on the ACP SDK's generated schema types. Unknown update types fall through
+ * every branch at runtime.
+ */
+
+export type AcpContentBlock =
+  | { type: 'text'; text: string } // plain-text block
+  | { type: string; [key: string]: unknown } // any other block, left opaque
+
+export type AcpToolCallStatus =
+  | 'pending'
+  | 'in_progress'
+  | 'completed' // terminal: the translator emits the tool result
+  | 'failed' // terminal: the result is flagged `output-error`
+
+export interface AcpToolCallUpdate {
+  toolCallId: string // shared by a `tool_call` and its `tool_call_update`s
+  title?: string | null // matched against bridged tool names to name the call
+  kind?: string | null // fallback tool name when the title is not bridged
+  status?: AcpToolCallStatus | null
+  rawInput?: unknown // becomes the emitted tool-call arguments
+  rawOutput?: unknown // preferred source of the tool result text
+  content?: Array<{
+    type: string
+    content?: AcpContentBlock // text blocks are the fallback result text
+    [key: string]: unknown
+  }> | null
+}
+
+/**
+ * Session-update variants the adapter models. The translator acts on the
+ * agent message/thought chunks, `tool_call`, `tool_call_update` and `plan`;
+ * every other update type (listed here or not) falls through and is ignored.
+ */
+export type AcpSessionUpdate =
+  | { sessionUpdate: 'agent_message_chunk'; content: AcpContentBlock }
+  | { sessionUpdate: 'agent_thought_chunk'; content: AcpContentBlock }
+  | ({ sessionUpdate: 'tool_call' } & AcpToolCallUpdate)
+  | ({ sessionUpdate: 'tool_call_update' } & AcpToolCallUpdate)
+  | { sessionUpdate: 'plan'; entries: Array<unknown> }
+  | { sessionUpdate: 'available_commands_update' }
+  | { sessionUpdate: 'current_mode_update' }
+  | { sessionUpdate: 'user_message_chunk'; content: AcpContentBlock }
+
+export type AcpStopReason =
+  | 'end_turn'
+  | 'max_tokens' // translated to finishReason 'length'
+  | 'max_turn_requests' // translated to finishReason 'length'
+  | 'refusal' // translated to RUN_ERROR
+  | 'cancelled'
+  | (string & {}) // any other string, while keeping literal completions
+
+/** Experimental per-turn token usage reported by the ACP prompt response. */
+export interface AcpUsage {
+  inputTokens?: number | null // becomes promptTokens (0 when absent)
+  outputTokens?: number | null // becomes completionTokens (0 when absent)
+  totalTokens?: number | null // defaults to input + output when absent
+  cachedReadTokens?: number | null // reported as cachedTokens if non-zero
+  thoughtTokens?: number | null // reported as reasoningTokens if non-zero
+}
+
+export interface AcpPermissionOption {
+  optionId: string // echoed back in a `selected` outcome
+  name: string
+  kind: 'allow_once' | 'allow_always' | 'reject_once' | 'reject_always'
+}
+
+export interface AcpPermissionRequest {
+  sessionId: string
+  toolCall: AcpToolCallUpdate // the tool call awaiting a decision
+  options: Array<AcpPermissionOption> // choices a `selected` outcome picks from
+}
+
+export type AcpPermissionOutcome =
+  | { outcome: 'cancelled' } // no option was chosen
+  | { outcome: 'selected'; optionId: string } // optionId of the chosen option
diff --git a/packages/ai-gemini-cli/src/stream/queue.ts b/packages/ai-gemini-cli/src/stream/queue.ts
new file mode 100644
index 000000000..0f095feb1
--- /dev/null
+++ b/packages/ai-gemini-cli/src/stream/queue.ts
@@ -0,0 +1,64 @@
+/**
+ * Tiny promise-backed queue that adapts the ACP connection's callback-style
+ * `session/update` notifications to the async-iterable interface the stream
+ * translator reads from. Buffered values are delivered before end/failure.
+ */
+export class AsyncQueue<T> implements AsyncIterable<T> {
+  private readonly buffer: Array<T> = []
+  private readonly readers: Array<{
+    resolve: (result: IteratorResult<T>) => void
+    reject: (error: unknown) => void
+  }> = []
+  /** `open` until the first `end()` or `fail()`; later calls are ignored. */
+  private state: 'open' | 'ended' | 'failed' = 'open'
+  private failure: unknown = undefined
+
+  push(value: T): void {
+    if (this.state !== 'open') return
+    const reader = this.readers.shift()
+    if (reader === undefined) {
+      this.buffer.push(value)
+      return
+    }
+    reader.resolve({ value, done: false })
+  }
+
+  /** Close the queue normally; waiting and later reads resolve as done. */
+  end(): void {
+    if (this.state !== 'open') return
+    this.state = 'ended'
+    for (const reader of this.readers.splice(0)) {
+      reader.resolve({ value: undefined, done: true })
+    }
+  }
+
+  /** Close the queue with an error; reads reject once the buffer is empty. */
+  fail(error: unknown): void {
+    if (this.state !== 'open') return
+    this.state = 'failed'
+    this.failure = error
+    for (const reader of this.readers.splice(0)) {
+      reader.reject(error)
+    }
+  }
+
+  [Symbol.asyncIterator](): AsyncIterator<T> {
+    const next = (): Promise<IteratorResult<T>> => {
+      if (this.buffer.length > 0) {
+        const value = this.buffer.shift() as T
+        return Promise.resolve({ value, done: false })
+      }
+      switch (this.state) {
+        case 'failed':
+          return Promise.reject(this.failure)
+        case 'ended':
+          return Promise.resolve({ value: undefined, done: true })
+        default:
+          return new Promise((resolve, reject) => {
+            this.readers.push({ resolve, reject })
+          })
+      }
+    }
+    return { next }
+  }
+}
diff --git a/packages/ai-gemini-cli/src/stream/translate.ts b/packages/ai-gemini-cli/src/stream/translate.ts
new file mode 100644
index 000000000..db18c28c8
--- /dev/null
+++ b/packages/ai-gemini-cli/src/stream/translate.ts
@@ -0,0 +1,395 @@
+import { EventType, buildBaseUsage } from '@tanstack/ai'
+import type { StreamChunk, TokenUsage } from '@tanstack/ai'
+import type {
+  AcpSessionUpdate,
+  AcpStopReason,
+  AcpToolCallUpdate,
+  AcpUsage,
+} from './acp-types'
+
+/** Name of the CUSTOM event carrying the session id as `{ sessionId }`. */
+export const SESSION_ID_EVENT = 'gemini-cli.session-id'
+
+/** Name of the CUSTOM event carrying plan updates as `{ entries }`. */
+export const PLAN_EVENT = 'gemini-cli.plan'
+
+/** MCP server name used for bridged TanStack tools. */
+export const BRIDGED_MCP_SERVER_NAME = 'tanstack'
+
+/**
+ * Events fed to the translator (produced by the adapter's async queue): the
+ * session id once established, every ACP `session/update` notification, and
+ * a terminal `done` with the prompt response's stop reason and optional usage.
+ */
+export type AcpStreamEvent =
+  | { kind: 'session'; sessionId: string }
+  | { kind: 'update'; update: AcpSessionUpdate }
+  | { kind: 'done'; stopReason: AcpStopReason; usage?: AcpUsage }
+
+export interface TranslateContext {
+  model: string // stamped on every emitted chunk
+  runId: string // reported on RUN_STARTED and RUN_FINISHED
+  threadId: string // reported on RUN_STARTED and RUN_FINISHED
+  parentRunId?: string // added to RUN_STARTED only when defined
+  genId: () => string // mints messageIds for text, reasoning and tool results
+  /**
+   * Names of bridged TanStack tools, used to surface the harness's MCP tool
+   * calls under the names the application registered.
+   */
+  bridgedToolNames?: ReadonlySet<string>
+  /** Called for each raw ACP stream event, for logging. */
+  onAcpEvent?: (event: AcpStreamEvent) => void
+}
+
+/**
+ * Resolve an ACP tool-call title to the bridged TanStack tool it names.
+ * A title matches a bridged name verbatim, or as a prefix followed by ` (`
+ * (the suffix Gemini CLI adds, e.g. `lookup_user (tanstack MCP Server)`).
+ */
+export function matchBridgedToolName(
+  title: string | null | undefined,
+  bridgedToolNames: ReadonlySet<string> | undefined,
+): string | undefined {
+  const label = title ?? ''
+  if (label === '' || !bridgedToolNames) return undefined
+  if (bridgedToolNames.has(label)) return label
+  const names = Array.from(bridgedToolNames)
+  const hit = names.find((name) => label.startsWith(`${name} (`))
+  return hit
+}
+
+/** Name a tool call: bridged tool name, else the ACP kind, else `'tool'`. */
+function resolveToolName(
+  update: AcpToolCallUpdate,
+  bridgedToolNames: ReadonlySet<string> | undefined,
+): string {
+  const bridged = matchBridgedToolName(update.title, bridgedToolNames)
+  if (bridged !== undefined) return bridged
+  if (update.kind !== undefined && update.kind !== null) return update.kind
+  return 'tool'
+}
+
+/** Tool output as a string: rawOutput, else content text, else status JSON. */
+function stringifyToolOutput(update: AcpToolCallUpdate): string {
+  const raw = update.rawOutput // null counts as absent, like rawInput
+  if (raw !== undefined && raw !== null) {
+    return typeof raw === 'string' ? raw : JSON.stringify(raw)
+  }
+  const text = (update.content ?? [])
+    .map((block) =>
+      block.content && typeof block.content.text === 'string'
+        ? block.content.text
+        : '',
+    )
+    .join('')
+  if (text !== '') return text
+  return JSON.stringify({ status: update.status ?? 'completed' })
+}
+
+/**
+ * Map ACP usage to TokenUsage; cache/thought details only when non-zero.
+ */
+function buildUsage(usage: AcpUsage | undefined): TokenUsage | undefined {
+  if (!usage) return undefined
+  const { cachedReadTokens: cached, thoughtTokens: thoughts } = usage
+  const prompt = usage.inputTokens ?? 0
+  const completion = usage.outputTokens ?? 0
+  const mapped = buildBaseUsage({
+    promptTokens: prompt,
+    completionTokens: completion,
+    totalTokens: usage.totalTokens ?? prompt + completion,
+  })
+  if (cached) mapped.promptTokensDetails = { cachedTokens: cached }
+  if (thoughts) mapped.completionTokensDetails = { reasoningTokens: thoughts }
+  return mapped
+}
+
+/**
+ * Translate a Gemini CLI ACP event stream into AG-UI StreamChunk events.
+ *
+ * The harness runs its own agent loop and executes its own tools, so the
+ * translation always ends with `finishReason: 'stop'` (or `'length'` /
+ * RUN_ERROR) — never `'tool_calls'`. Harness tool activity is emitted as
+ * already-resolved TOOL_CALL_START/ARGS/END + TOOL_CALL_RESULT sequences so
+ * UIs can render it, while the TanStack engine never tries to execute them.
+ * Text (`agent_message_chunk`) and thinking (`agent_thought_chunk`) arrive
+ * from ACP as true token-level deltas.
+ *
+ * Invariant: every TOOL_CALL_START gets exactly one TOOL_CALL_RESULT — the
+ * harness's first terminal update, or a synthesized `{"status":"interrupted"}`
+ * once `done` arrives or the stream throws — so the engine's
+ * pending-tool-call scan on the next request never force-executes them.
+ */
+export async function* translateAcpStream(
+  events: AsyncIterable<AcpStreamEvent>,
+  ctx: TranslateContext,
+): AsyncIterable<StreamChunk> {
+  const { model, runId, threadId, genId } = ctx
+  const now = () => Date.now()
+
+  let runStarted = false
+  /** Tool calls started but with no result yet. */
+  const unresolvedToolCalls = new Set<string>()
+  /** Ids of tool calls already opened; guards against opening one twice. */
+  const knownToolCalls = new Set<string>()
+
+  let textMessageId: string | null = null
+  let textContent = ''
+  let reasoningId: string | null = null
+
+  function* startRun(): Generator<StreamChunk> {
+    if (runStarted) return
+    runStarted = true
+    yield {
+      type: EventType.RUN_STARTED,
+      runId,
+      threadId,
+      model,
+      timestamp: now(),
+      ...(ctx.parentRunId !== undefined && { parentRunId: ctx.parentRunId }),
+    }
+  }
+
+  function* closeText(): Generator<StreamChunk> {
+    if (textMessageId !== null) {
+      yield {
+        type: EventType.TEXT_MESSAGE_END,
+        messageId: textMessageId,
+        model,
+        timestamp: now(),
+      }
+    }
+    textMessageId = null
+    textContent = ''
+  }
+
+  function* closeReasoning(): Generator<StreamChunk> {
+    if (reasoningId !== null) {
+      yield {
+        type: EventType.REASONING_MESSAGE_END,
+        messageId: reasoningId,
+        model,
+        timestamp: now(),
+      }
+      yield {
+        type: EventType.REASONING_END,
+        messageId: reasoningId,
+        model,
+        timestamp: now(),
+      }
+    }
+    reasoningId = null
+  }
+
+  function* synthesizeUnresolvedResults(): Generator<StreamChunk> {
+    for (const toolCallId of unresolvedToolCalls) {
+      yield {
+        type: EventType.TOOL_CALL_RESULT,
+        toolCallId,
+        messageId: genId(),
+        model,
+        timestamp: now(),
+        content: JSON.stringify({ status: 'interrupted' }),
+      }
+    }
+    unresolvedToolCalls.clear()
+  }
+
+  function* openToolCall(update: AcpToolCallUpdate): Generator<StreamChunk> {
+    if (knownToolCalls.has(update.toolCallId)) return
+    knownToolCalls.add(update.toolCallId)
+    const toolCallName = resolveToolName(update, ctx.bridgedToolNames)
+    const input = {
+      ...(update.title != null && { title: update.title }),
+      ...(update.rawInput !== undefined && update.rawInput !== null
+        ? typeof update.rawInput === 'object'
+          ? (update.rawInput as Record<string, unknown>)
+          : { input: update.rawInput }
+        : {}),
+    }
+    const args = JSON.stringify(input)
+    yield {
+      type: EventType.TOOL_CALL_START,
+      toolCallId: update.toolCallId,
+      toolCallName,
+      toolName: toolCallName,
+      model,
+      timestamp: now(),
+    }
+    yield {
+      type: EventType.TOOL_CALL_ARGS,
+      toolCallId: update.toolCallId,
+      model,
+      timestamp: now(),
+      delta: args,
+      args,
+    }
+    yield {
+      type: EventType.TOOL_CALL_END,
+      toolCallId: update.toolCallId,
+      toolCallName,
+      toolName: toolCallName,
+      model,
+      timestamp: now(),
+      input,
+    }
+    unresolvedToolCalls.add(update.toolCallId)
+  }
+
+  function* resolveToolCall(update: AcpToolCallUpdate): Generator<StreamChunk> {
+    yield* openToolCall(update)
+    // delete() returns false once a result was emitted: skip repeat updates.
+    if (!unresolvedToolCalls.delete(update.toolCallId)) return
+    yield {
+      type: EventType.TOOL_CALL_RESULT,
+      toolCallId: update.toolCallId,
+      messageId: genId(),
+      model,
+      timestamp: now(),
+      content: stringifyToolOutput(update),
+      ...(update.status === 'failed' && { state: 'output-error' as const }),
+    }
+  }
+
+  function* handleUpdate(update: AcpSessionUpdate): Generator<StreamChunk> {
+    if (update.sessionUpdate === 'agent_message_chunk') {
+      yield* closeReasoning()
+      const text =
+        typeof update.content.text === 'string' ? update.content.text : ''
+      if (text === '') return
+      if (textMessageId === null) {
+        textMessageId = genId()
+        yield {
+          type: EventType.TEXT_MESSAGE_START,
+          messageId: textMessageId,
+          model,
+          timestamp: now(),
+          role: 'assistant',
+        }
+      }
+      textContent += text
+      yield {
+        type: EventType.TEXT_MESSAGE_CONTENT,
+        messageId: textMessageId,
+        model,
+        timestamp: now(),
+        delta: text,
+        content: textContent,
+      }
+    } else if (update.sessionUpdate === 'agent_thought_chunk') {
+      yield* closeText()
+      const thought =
+        typeof update.content.text === 'string' ? update.content.text : ''
+      if (thought === '') return
+      if (reasoningId === null) {
+        reasoningId = genId()
+        yield {
+          type: EventType.REASONING_START,
+          messageId: reasoningId,
+          model,
+          timestamp: now(),
+        }
+        yield {
+          type: EventType.REASONING_MESSAGE_START,
+          messageId: reasoningId,
+          role: 'reasoning' as const,
+          model,
+          timestamp: now(),
+        }
+      }
+      yield {
+        type: EventType.REASONING_MESSAGE_CONTENT,
+        messageId: reasoningId,
+        delta: thought,
+        model,
+        timestamp: now(),
+      }
+    } else if (update.sessionUpdate === 'tool_call') {
+      yield* closeText()
+      yield* closeReasoning()
+      yield* openToolCall(update)
+      if (update.status === 'completed' || update.status === 'failed') {
+        yield* resolveToolCall(update)
+      }
+    } else if (update.sessionUpdate === 'tool_call_update') {
+      if (update.status === 'completed' || update.status === 'failed') {
+        yield* resolveToolCall(update)
+      }
+      // pending / in_progress updates carry no state the chunk stream needs.
+    } else if (update.sessionUpdate === 'plan') {
+      yield {
+        type: EventType.CUSTOM,
+        model,
+        timestamp: now(),
+        name: PLAN_EVENT,
+        value: { entries: update.entries },
+      }
+    }
+    // Other update types (available_commands_update, current_mode_update,
+    // user_message_chunk replays, ...) are harness-internal and ignored.
+  }
+
+  try {
+    for await (const event of events) {
+      ctx.onAcpEvent?.(event)
+
+      if (event.kind === 'session') {
+        yield* startRun()
+        yield {
+          type: EventType.CUSTOM,
+          model,
+          timestamp: now(),
+          name: SESSION_ID_EVENT,
+          value: { sessionId: event.sessionId },
+        }
+      } else if (event.kind === 'update') {
+        yield* startRun()
+        yield* handleUpdate(event.update)
+      } else {
+        yield* startRun()
+        yield* closeText()
+        yield* closeReasoning()
+        yield* synthesizeUnresolvedResults()
+
+        if (event.stopReason === 'refusal') {
+          yield {
+            type: EventType.RUN_ERROR,
+            model,
+            timestamp: now(),
+            message: 'Gemini CLI refused the request.',
+            code: 'refusal',
+            error: {
+              message: 'Gemini CLI refused the request.',
+              code: 'refusal',
+            },
+          }
+        } else {
+          const usage = buildUsage(event.usage)
+          const finishReason =
+            event.stopReason === 'max_tokens' ||
+            event.stopReason === 'max_turn_requests'
+              ? ('length' as const)
+              : ('stop' as const)
+          yield {
+            type: EventType.RUN_FINISHED,
+            runId,
+            threadId,
+            model,
+            timestamp: now(),
+            finishReason,
+            ...(usage !== undefined && { usage }),
+          }
+        }
+      }
+    }
+  } catch (error) {
+    // The run is dying (abort, process exit, or connection failure). Close
+    // any open message and pair started tool calls with a synthetic result
+    // first so the next request's pending-tool-call scan doesn't try to
+    // execute them, then let the adapter surface the error as RUN_ERROR.
+    yield* closeText()
+    yield* closeReasoning()
+    yield* synthesizeUnresolvedResults()
+    throw error
+  }
+}
diff --git a/packages/ai-gemini-cli/tests/permissions.test.ts b/packages/ai-gemini-cli/tests/permissions.test.ts
new file mode 100644
index 000000000..fd8dfd062
--- /dev/null
+++ b/packages/ai-gemini-cli/tests/permissions.test.ts
@@ -0,0 +1,103 @@
+import { describe, expect, it } from 'vitest'
+import { resolvePermission } from '../src/process/permissions'
+import type { AcpPermissionRequest } from '../src/stream/acp-types'
+
+function makeRequest(
+  overrides: Partial<AcpPermissionRequest['toolCall']> = {},
+): AcpPermissionRequest {
+  return {
+    sessionId: 'sess-1',
+    toolCall: {
+      toolCallId: 'tc-1',
+      title: 'Run shell command',
+      kind: 'execute', // default kind; individual tests override it
+      ...overrides, // spread last so overrides replace the defaults above
+    },
+    options: [
+      { optionId: 'allow-once', name: 'Allow once', kind: 'allow_once' },
+      { optionId: 'allow-always', name: 'Always allow', kind: 'allow_always' },
+      { optionId: 'reject-once', name: 'Reject', kind: 'reject_once' },
+    ],
+  }
+}
+
+describe('resolvePermission', () => {
+  it('rejects harness tools in default mode', () => {
+    expect(resolvePermission(makeRequest(), 'default', undefined)).toEqual({
+      outcome: 'selected',
+      optionId: 'reject-once', // the fixture's reject_once option
+    })
+  })
+
+  it('allows bridged TanStack tools in every mode', () => {
+    const request = makeRequest({
+      title: 'lookup_user (tanstack MCP Server)',
+      kind: 'other',
+    })
+    const bridged = new Set(['lookup_user']) // the title starts with this name
+    for (const mode of [
+      'default',
+      'acceptEdits',
+      'bypassPermissions',
+    ] as const) {
+      expect(resolvePermission(request, mode, bridged)).toEqual({
+        outcome: 'selected',
+        optionId: 'allow-once',
+      })
+    }
+  })
+
+  it('allows edit-kind tools only in acceptEdits and bypassPermissions', () => {
+    const edit = makeRequest({ title: 'Edit file', kind: 'edit' })
+    expect(resolvePermission(edit, 'default', undefined)).toEqual({
+      outcome: 'selected',
+      optionId: 'reject-once',
+    })
+    expect(resolvePermission(edit, 'acceptEdits', undefined)).toEqual({
+      outcome: 'selected',
+      optionId: 'allow-once',
+    })
+    expect(resolvePermission(edit, 'bypassPermissions', undefined)).toEqual({
+      outcome: 'selected',
+      optionId: 'allow-once',
+    })
+  })
+
+  it('treats move and delete as edits', () => {
+    for (const kind of ['move', 'delete']) {
+      expect(
+        resolvePermission(makeRequest({ kind }), 'acceptEdits', undefined),
+      ).toEqual({ outcome: 'selected', optionId: 'allow-once' })
+    }
+  })
+
+  it('does not auto-approve execute tools in acceptEdits mode', () => {
+    expect(
+      resolvePermission(
+        makeRequest({ kind: 'execute' }),
+        'acceptEdits',
+        undefined,
+      ),
+    ).toEqual({ outcome: 'selected', optionId: 'reject-once' })
+  })
+
+  it('allows everything in bypassPermissions mode', () => {
+    expect(
+      resolvePermission(makeRequest(), 'bypassPermissions', undefined),
+    ).toEqual({ outcome: 'selected', optionId: 'allow-once' })
+  })
+
+  it('falls back through option kinds and cancels when nothing matches', () => {
+    const request: AcpPermissionRequest = {
+      ...makeRequest(),
+      options: [{ optionId: 'always', name: 'Always', kind: 'allow_always' }],
+    }
+    expect(resolvePermission(request, 'bypassPermissions', undefined)).toEqual({
+      outcome: 'selected',
+      optionId: 'always', // allow_always is the only option offered
+    })
+    expect(resolvePermission(request, 'default', undefined)).toEqual({
+      outcome: 'cancelled', // no reject option is offered to select
+    })
+  })
+})
diff --git a/packages/ai-gemini-cli/tests/prompt.test.ts b/packages/ai-gemini-cli/tests/prompt.test.ts
new file mode 100644
index 000000000..6e8dfcdf3
--- /dev/null
+++ b/packages/ai-gemini-cli/tests/prompt.test.ts
@@ -0,0 +1,97 @@
+import { describe, expect, it } from 'vitest'
+import { buildPrompt } from '../src/messages/prompt'
+import type { ModelMessage } from '@tanstack/ai'
+
+const user = (content: ModelMessage['content']): ModelMessage => ({
+  role: 'user', // fixture builder for a user turn
+  content,
+})
+const assistant = (content: ModelMessage['content']): ModelMessage => ({
+  role: 'assistant', // fixture builder for an assistant turn
+  content,
+})
+
+describe('buildPrompt', () => {
+  it('resumes with only the last user message when sessionId is provided', () => {
+    const result = buildPrompt(
+      [
+        user('first question'),
+        assistant('first answer'),
+        user('follow-up question'),
+      ],
+      'sess-1', // session id to resume
+    )
+    expect(result).toEqual({
+      prompt: 'follow-up question',
+      resume: 'sess-1',
+    })
+  })
+
+  it('throws when sessionId is provided but there is no trailing user message', () => {
+    expect(() => buildPrompt([user('q'), assistant('a')], 'sess-1')).toThrow(
+      /user message/i,
+    )
+  })
+
+  it('sends a single user message as-is for a fresh session', () => {
+    expect(buildPrompt([user('hello')], undefined)).toEqual({
+      prompt: 'hello',
+    })
+  })
+
+  it('flattens prior turns into a transcript preamble for fresh multi-turn history', () => {
+    const { prompt, resume } = buildPrompt(
+      [user('What is 2+2?'), assistant('4'), user('And times 3?')],
+      undefined, // no session id: fresh session
+    )
+    expect(resume).toBeUndefined()
+    expect(prompt).toBe(
+      'Previous conversation:\nUser: What is 2+2?\nAssistant: 4\n\nAnd times 3?',
+    )
+  })
+
+  it('skips tool messages and assistant tool-call-only turns when flattening', () => {
+    const messages: Array<ModelMessage> = [
+      user('list files'),
+      {
+        role: 'assistant',
+        content: null, // tool-call-only turn: no text content
+        toolCalls: [
+          {
+            id: 't1',
+            type: 'function',
+            function: { name: 'ls', arguments: '{}' },
+          },
+        ],
+      } as unknown as ModelMessage,
+      { role: 'tool', content: 'file-a', toolCallId: 't1' },
+      assistant('There is one file.'),
+      user('thanks, which one?'),
+    ]
+    const { prompt } = buildPrompt(messages, undefined)
+    expect(prompt).toBe(
+      'Previous conversation:\nUser: list files\nAssistant: There is one file.\n\nthanks, which one?',
+    )
+  })
+
+  it('extracts text from content-part arrays and ignores non-text parts', () => {
+    const { prompt } = buildPrompt(
+      [
+        user([
+          { type: 'text', content: 'describe ' },
+          {
+            type: 'image',
+            source: { type: 'url', url: 'https://x/y.png' },
+          } as never, // non-text part, expected to be left out of the prompt
+          { type: 'text', content: 'this' },
+        ] as ModelMessage['content']),
+      ],
+      undefined,
+    )
+    expect(prompt).toBe('describe this')
+  })
+
+  it('throws when there is no usable user content at all', () => {
+    expect(() => buildPrompt([], undefined)).toThrow(/user message/i)
+  })
+})
diff --git a/packages/ai-gemini-cli/tests/text-adapter.test.ts b/packages/ai-gemini-cli/tests/text-adapter.test.ts
new file mode 100644
index 000000000..9d49858c4
--- /dev/null
+++ b/packages/ai-gemini-cli/tests/text-adapter.test.ts
@@ -0,0 +1,106 @@
+/**
+ * Tests for the in-sandbox Gemini CLI adapter.
+ *
+ * The ACP protocol handling itself is the `@agentclientprotocol/sdk`'s and is
+ * reused unchanged; the new piece is the transport that drives `gemini --acp`
+ * over a sandbox {@link SpawnHandle} instead of a local child process. We test
+ * that transport adapter directly (bytes flow both ways, exit propagates) and
+ * the adapter's missing-sandbox path. A full ACP round-trip is covered by the
+ * gated live path.
+ */
+import { describe, expect, it } from 'vitest'
+import { spawnHandleToAcpTransport } from '../src/process/sandbox-transport'
+import { geminiCliText } from '../src/index'
+import type { InternalLogger } from '@tanstack/ai/adapter-internals'
+import type { StreamChunk } from '@tanstack/ai'
+import type { SpawnHandle } from '@tanstack/ai-sandbox'
+
+const noopLogger = {
+  request: () => {},
+  provider: () => {},
+  errors: () => {},
+  agentLoop: () => {},
+  warnings: () => {},
+  debug: () => {},
+} as unknown as InternalLogger // only the no-op methods above are provided
+
+async function* once(value: string): AsyncIterable<string> {
+  await Promise.resolve() // defer the single chunk by one microtask
+  yield value
+}
+async function* empty(): AsyncIterable<string> {
+  // no output: the iterable completes without yielding
+}
+
+function fakeSpawn(
+  stdoutChunks: AsyncIterable<string>,
+  exitCode = 0,
+): { handle: SpawnHandle; writes: Array<string>; ended: () => boolean } {
+  const writes: Array<string> = []
+  let didEnd = false
+  const handle: SpawnHandle = {
+    pid: 1,
+    stdout: stdoutChunks,
+    stderr: empty(),
+    stdin: {
+      write: (d) => {
+        writes.push(d) // record every stdin write for assertions
+        return Promise.resolve()
+      },
+      end: () => {
+        didEnd = true // observable through ended()
+        return Promise.resolve()
+      },
+    },
+    wait: () => Promise.resolve(exitCode), // resolves at once with exitCode
+    kill: () => Promise.resolve(),
+  }
+  return { handle, writes, ended: () => didEnd }
+}
+
+async function collect(
+  stream: AsyncIterable<StreamChunk>,
+): Promise<Array<StreamChunk>> {
+  const out: Array<StreamChunk> = []
+  for await (const chunk of stream) out.push(chunk) // drain in arrival order
+  return out
+}
+
+describe('spawnHandleToAcpTransport', () => {
+  it('pipes writable bytes to stdin and stdout bytes to readable', async () => {
+    const { handle, writes } = fakeSpawn(once('{"jsonrpc":"2.0"}\n'))
+    const transport = spawnHandleToAcpTransport(handle)
+
+    // writable -> stdin: bytes written here must reach stdin.write as text
+    const writer = transport.writable.getWriter()
+    await writer.write(new TextEncoder().encode('hello'))
+    await writer.close()
+    expect(writes.join('')).toBe('hello')
+
+    // stdout -> readable: the string chunk must come back out as bytes
+    const reader = transport.readable.getReader()
+    const first = await reader.read()
+    expect(new TextDecoder().decode(first.value)).toContain('jsonrpc')
+  })
+
+  it('exited rejects when the process exits', async () => {
+    const { handle } = fakeSpawn(empty(), 1) // no stdout, exit code 1
+    const transport = spawnHandleToAcpTransport(handle)
+    await expect(transport.exited).rejects.toThrow(/exited unexpectedly/i)
+  })
+})
+
+describe('gemini-cli adapter', () => {
+  it('requires a sandbox capability', async () => {
+    const adapter = geminiCliText('gemini-2.5-pro')
+    const chunks = await collect(
+      adapter.chatStream({
+        model: 'gemini-2.5-pro',
+        messages: [{ role: 'user', content: 'hi' }],
+        logger: noopLogger, // note: no sandbox is passed in this call
+      }),
+    )
+    const err = chunks.find((c) => c.type === 'RUN_ERROR')
+    expect((err as { message?: string }).message).toMatch(/requires a sandbox/i)
+  })
+})
diff --git a/packages/ai-gemini-cli/tests/translate.test.ts b/packages/ai-gemini-cli/tests/translate.test.ts
new file mode 100644
index 000000000..d93a7c7b7
--- /dev/null
+++ b/packages/ai-gemini-cli/tests/translate.test.ts
@@ -0,0 +1,435 @@
+import { describe, expect, it } from 'vitest'
+import {
+  PLAN_EVENT,
+  SESSION_ID_EVENT,
+  matchBridgedToolName,
+  translateAcpStream,
+} from '../src/stream/translate'
+import type { AcpStreamEvent, TranslateContext } from '../src/stream/translate'
+import type { StreamChunk } from '@tanstack/ai'
+
+/**
+ * Builds a TranslateContext with fixed ids and a deterministic `genId`
+ * counter (`gen-1`, `gen-2`, ...); entries in `overrides` win over defaults.
+ */
+function makeCtx(overrides: Partial<TranslateContext> = {}): TranslateContext {
+  let counter = 0
+  const defaults: TranslateContext = {
+    model: 'gemini-3-pro-preview',
+    runId: 'run-1',
+    threadId: 'thread-1',
+    genId: () => {
+      counter += 1
+      return `gen-${counter}`
+    },
+  }
+  return { ...defaults, ...overrides }
+}
+
+/** Replays a fixed list of events as an async stream, in array order. */
+async function* fromArray(
+  events: Array<AcpStreamEvent>,
+): AsyncIterable<AcpStreamEvent> {
+  yield* events
+}
+
+/**
+ * Runs `events` through `translateAcpStream` and gathers every emitted chunk.
+ * A fresh default context is created when `ctx` is omitted.
+ */
+async function collect(
+  events: Array<AcpStreamEvent>,
+  ctx: TranslateContext = makeCtx(),
+): Promise<Array<StreamChunk>> {
+  const translated = translateAcpStream(fromArray(events), ctx)
+  const emitted: Array<StreamChunk> = []
+  for await (const item of translated) emitted.push(item)
+  return emitted
+}
+
+const session: AcpStreamEvent = { kind: 'session', sessionId: 'sess-1' }
+const done: AcpStreamEvent = { kind: 'done', stopReason: 'end_turn' }
+
+/** Builds an `agent_message_chunk` update event carrying `value` as text. */
+function text(value: string): AcpStreamEvent {
+  const event: AcpStreamEvent = {
+    kind: 'update',
+    update: {
+      sessionUpdate: 'agent_message_chunk',
+      content: { type: 'text', text: value },
+    },
+  }
+  return event
+}
+
+/** Builds an `agent_thought_chunk` update event carrying `value` as text. */
+function thought(value: string): AcpStreamEvent {
+  const event: AcpStreamEvent = {
+    kind: 'update',
+    update: {
+      sessionUpdate: 'agent_thought_chunk',
+      content: { type: 'text', text: value },
+    },
+  }
+  return event
+}
+
+describe('translateAcpStream', () => {
+  it('translates streamed text deltas into one accumulated message', async () => {
+    const chunks = await collect([session, text('Hel'), text('lo'), done])
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'TEXT_MESSAGE_START',
+      'TEXT_MESSAGE_CONTENT',
+      'TEXT_MESSAGE_CONTENT',
+      'TEXT_MESSAGE_END',
+      'RUN_FINISHED',
+    ])
+    expect(chunks[1]).toMatchObject({
+      name: SESSION_ID_EVENT,
+      value: { sessionId: 'sess-1' },
+    })
+    expect(chunks[3]).toMatchObject({ delta: 'Hel', content: 'Hel' })
+    expect(chunks[4]).toMatchObject({ delta: 'lo', content: 'Hello' })
+    expect(chunks.at(-1)).toMatchObject({ finishReason: 'stop' })
+  })
+
+  it('translates thought chunks into reasoning events', async () => {
+    const chunks = await collect([
+      session,
+      thought('hmm '),
+      thought('ok'),
+      text('answer'),
+      done,
+    ])
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'REASONING_START',
+      'REASONING_MESSAGE_START',
+      'REASONING_MESSAGE_CONTENT',
+      'REASONING_MESSAGE_CONTENT',
+      'REASONING_MESSAGE_END',
+      'REASONING_END',
+      'TEXT_MESSAGE_START',
+      'TEXT_MESSAGE_CONTENT',
+      'TEXT_MESSAGE_END',
+      'RUN_FINISHED',
+    ])
+  })
+
+  it('closes an open text message when a tool call interleaves, then reopens', async () => {
+    const chunks = await collect([
+      session,
+      text('Let me check. '),
+      {
+        kind: 'update',
+        update: {
+          sessionUpdate: 'tool_call',
+          toolCallId: 'tc-1',
+          title: 'Reading file',
+          kind: 'read',
+          status: 'in_progress',
+          rawInput: { path: 'a.ts' },
+        },
+      },
+      {
+        kind: 'update',
+        update: {
+          sessionUpdate: 'tool_call_update',
+          toolCallId: 'tc-1',
+          status: 'completed',
+          rawOutput: 'contents',
+        },
+      },
+      text('Done.'),
+      done,
+    ])
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'TEXT_MESSAGE_START',
+      'TEXT_MESSAGE_CONTENT',
+      'TEXT_MESSAGE_END',
+      'TOOL_CALL_START',
+      'TOOL_CALL_ARGS',
+      'TOOL_CALL_END',
+      'TOOL_CALL_RESULT',
+      'TEXT_MESSAGE_START',
+      'TEXT_MESSAGE_CONTENT',
+      'TEXT_MESSAGE_END',
+      'RUN_FINISHED',
+    ])
+    expect(chunks[5]).toMatchObject({
+      toolCallId: 'tc-1',
+      toolCallName: 'read',
+    })
+    expect(chunks[6]).toMatchObject({
+      args: JSON.stringify({ title: 'Reading file', path: 'a.ts' }),
+    })
+    expect(chunks[8]).toMatchObject({ content: 'contents' })
+  })
+
+  it('marks failed tool calls as output-error', async () => {
+    const chunks = await collect([
+      session,
+      {
+        kind: 'update',
+        update: {
+          sessionUpdate: 'tool_call',
+          toolCallId: 'tc-2',
+          kind: 'execute',
+          status: 'in_progress',
+        },
+      },
+      {
+        kind: 'update',
+        update: {
+          sessionUpdate: 'tool_call_update',
+          toolCallId: 'tc-2',
+          status: 'failed',
+          rawOutput: { error: 'denied' },
+        },
+      },
+      done,
+    ])
+    expect(chunks.find((c) => c.type === 'TOOL_CALL_RESULT')).toMatchObject({
+      state: 'output-error',
+      content: JSON.stringify({ error: 'denied' }),
+    })
+  })
+
+  it('resolves a tool_call that arrives already completed', async () => {
+    const chunks = await collect([
+      session,
+      {
+        kind: 'update',
+        update: {
+          sessionUpdate: 'tool_call',
+          toolCallId: 'tc-3',
+          kind: 'search',
+          status: 'completed',
+          content: [
+            { type: 'content', content: { type: 'text', text: 'found it' } },
+          ],
+        },
+      },
+      done,
+    ])
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'TOOL_CALL_START',
+      'TOOL_CALL_ARGS',
+      'TOOL_CALL_END',
+      'TOOL_CALL_RESULT',
+      'RUN_FINISHED',
+    ])
+    expect(chunks[5]).toMatchObject({ content: 'found it' })
+  })
+
+  it('opens a synthetic pair for a tool_call_update with an unknown id', async () => {
+    const chunks = await collect([
+      session,
+      {
+        kind: 'update',
+        update: {
+          sessionUpdate: 'tool_call_update',
+          toolCallId: 'tc-mystery',
+          status: 'completed',
+          rawOutput: 'late result',
+        },
+      },
+      done,
+    ])
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'TOOL_CALL_START',
+      'TOOL_CALL_ARGS',
+      'TOOL_CALL_END',
+      'TOOL_CALL_RESULT',
+      'RUN_FINISHED',
+    ])
+  })
+
+  it('surfaces bridged TanStack tool calls under their registered names', async () => {
+    const chunks = await collect(
+      [
+        session,
+        {
+          kind: 'update',
+          update: {
+            sessionUpdate: 'tool_call',
+            toolCallId: 'tc-4',
+            title: 'lookup_user (tanstack MCP Server)',
+            kind: 'other',
+            status: 'completed',
+            rawOutput: '{"name":"Ada"}',
+          },
+        },
+        done,
+      ],
+      makeCtx({ bridgedToolNames: new Set(['lookup_user']) }),
+    )
+    expect(chunks.find((c) => c.type === 'TOOL_CALL_START')).toMatchObject({
+      toolCallName: 'lookup_user',
+    })
+  })
+
+  it('emits plan updates as CUSTOM events', async () => {
+    const chunks = await collect([
+      session,
+      {
+        kind: 'update',
+        update: {
+          sessionUpdate: 'plan',
+          entries: [{ content: 'step 1', status: 'pending' }],
+        },
+      },
+      done,
+    ])
+    expect(chunks[2]).toMatchObject({
+      type: 'CUSTOM',
+      name: PLAN_EVENT,
+      value: { entries: [{ content: 'step 1', status: 'pending' }] },
+    })
+  })
+
+  it('maps max_tokens and max_turn_requests to finishReason length', async () => {
+    for (const stopReason of ['max_tokens', 'max_turn_requests'] as const) {
+      const chunks = await collect([session, { kind: 'done', stopReason }])
+      expect(chunks.at(-1)).toMatchObject({
+        type: 'RUN_FINISHED',
+        finishReason: 'length',
+      })
+    }
+  })
+
+  it('maps cancelled to a normal stop', async () => {
+    const chunks = await collect([
+      session,
+      { kind: 'done', stopReason: 'cancelled' },
+    ])
+    expect(chunks.at(-1)).toMatchObject({
+      type: 'RUN_FINISHED',
+      finishReason: 'stop',
+    })
+  })
+
+  it('maps refusal to RUN_ERROR', async () => {
+    const chunks = await collect([
+      session,
+      { kind: 'done', stopReason: 'refusal' },
+    ])
+    expect(chunks.at(-1)).toMatchObject({ type: 'RUN_ERROR', code: 'refusal' })
+  })
+
+  it('reports usage from the prompt response when present', async () => {
+    const chunks = await collect([
+      session,
+      {
+        kind: 'done',
+        stopReason: 'end_turn',
+        usage: {
+          inputTokens: 50,
+          outputTokens: 10,
+          totalTokens: 60,
+          cachedReadTokens: 20,
+          thoughtTokens: 4,
+        },
+      },
+    ])
+    const finished = chunks.at(-1) as unknown as {
+      usage: Record<string, unknown>
+    }
+    expect(finished.usage).toMatchObject({
+      promptTokens: 50,
+      completionTokens: 10,
+      totalTokens: 60,
+      promptTokensDetails: { cachedTokens: 20 },
+      completionTokensDetails: { reasoningTokens: 4 },
+    })
+  })
+
+  it('omits usage when the harness reports none', async () => {
+    const chunks = await collect([session, done])
+    expect(
+      (chunks.at(-1) as unknown as { usage?: unknown }).usage,
+    ).toBeUndefined()
+  })
+
+  it('closes open messages and synthesizes results before finishing', async () => {
+    const chunks = await collect([
+      session,
+      text('working...'),
+      {
+        kind: 'update',
+        update: {
+          sessionUpdate: 'tool_call',
+          toolCallId: 'tc-5',
+          kind: 'execute',
+          status: 'in_progress',
+        },
+      },
+      done,
+    ])
+    const types: Array<string> = chunks.map((c) => c.type)
+    expect(types.indexOf('TOOL_CALL_RESULT')).toBeGreaterThan(-1)
+    expect(chunks.find((c) => c.type === 'TOOL_CALL_RESULT')).toMatchObject({
+      content: JSON.stringify({ status: 'interrupted' }),
+    })
+    expect(types.at(-1)).toBe('RUN_FINISHED')
+  })
+
+  it('synthesizes results then rethrows when the source stream throws', async () => {
+    async function* failing(): AsyncIterable<AcpStreamEvent> {
+      yield session
+      yield {
+        kind: 'update',
+        update: {
+          sessionUpdate: 'tool_call',
+          toolCallId: 'tc-6',
+          kind: 'execute',
+          status: 'in_progress',
+        },
+      }
+      throw new Error('process died')
+    }
+
+    const chunks: Array<StreamChunk> = []
+    await expect(async () => {
+      for await (const chunk of translateAcpStream(failing(), makeCtx())) {
+        chunks.push(chunk)
+      }
+    }).rejects.toThrow('process died')
+    expect(chunks.at(-1)).toMatchObject({
+      type: 'TOOL_CALL_RESULT',
+      toolCallId: 'tc-6',
+      content: JSON.stringify({ status: 'interrupted' }),
+    })
+  })
+
+  it('ignores harness-internal update types', async () => {
+    const chunks = await collect([
+      session,
+      {
+        kind: 'update',
+        update: { sessionUpdate: 'available_commands_update' },
+      },
+      { kind: 'update', update: { sessionUpdate: 'current_mode_update' } },
+      done,
+    ])
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'RUN_FINISHED',
+    ])
+  })
+})
+
+describe('matchBridgedToolName', () => {
+  const names = new Set(['lookup_user', 'get_weather'])
+
+  it('matches exact tool names', () => {
+    expect(matchBridgedToolName('lookup_user', names)).toBe('lookup_user')
+  })
+
+  it('matches server-suffixed titles', () => {
+    expect(
+      matchBridgedToolName('get_weather (tanstack MCP Server)', names),
+    ).toBe('get_weather')
+  })
+
+  it('returns undefined for unrelated titles', () => {
+    expect(matchBridgedToolName('Run shell command', names)).toBeUndefined()
+    expect(matchBridgedToolName(undefined, names)).toBeUndefined()
+    expect(matchBridgedToolName('lookup_user', undefined)).toBeUndefined()
+  })
+})
diff --git a/packages/ai-gemini-cli/tsconfig.json b/packages/ai-gemini-cli/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-gemini-cli/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-gemini-cli/vite.config.ts b/packages/ai-gemini-cli/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-gemini-cli/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+const config = defineConfig({
+  test: {
+    name: packageJson.name,
+    dir: './',
+    watch: false,
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: [
+        'node_modules/',
+        'dist/',
+        'tests/',
+        '**/*.test.ts',
+        '**/*.config.ts',
+        '**/types.ts',
+      ],
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+
+export default mergeConfig(
+  config,
+  tanstackViteConfig({
+    entry: ['./src/index.ts'],
+    srcDir: './src',
+    cjs: false,
+  }),
+)
diff --git a/packages/ai-opencode/README.md b/packages/ai-opencode/README.md
new file mode 100644
index 000000000..80f12e243
--- /dev/null
+++ b/packages/ai-opencode/README.md
@@ -0,0 +1,18 @@
+# @tanstack/ai-opencode
+
+OpenCode harness adapter for [TanStack AI](https://tanstack.com/ai) — run [OpenCode](https://opencode.ai) (via `@opencode-ai/sdk`) as a chat backend with local tool execution, token-level streaming, stateful sessions, and TanStack tool bridging.
+
+```typescript
+import { chat } from '@tanstack/ai'
+import { opencodeText } from '@tanstack/ai-opencode'
+
+const stream = chat({
+  adapter: opencodeText('anthropic/claude-sonnet-4-5', {
+    directory: '/path/to/project',
+    permissionMode: 'acceptEdits',
+  }),
+  messages: [{ role: 'user', content: 'Fix the failing test.' }],
+})
+```
+
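+Server-only (Node). The adapter runs OpenCode inside a sandbox, so `chat()` must also be given sandbox middleware (`withSandbox(defineSandbox({ ... }))`, omitted above for brevity); the sandbox image must provide the `opencode` CLI, installed and authenticated. See the [OpenCode adapter docs](https://tanstack.com/ai/latest/docs/adapters/opencode) for sessions, tool bridging, permissions, and limitations.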
diff --git a/packages/ai-opencode/package.json b/packages/ai-opencode/package.json
new file mode 100644
index 000000000..093f72795
--- /dev/null
+++ b/packages/ai-opencode/package.json
@@ -0,0 +1,59 @@
+{
+  "name": "@tanstack/ai-opencode",
+  "version": "0.1.0",
+  "description": "OpenCode harness adapter for TanStack AI — run OpenCode as a chat backend with local tool execution and stateful sessions.",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-opencode"
+  },
+  "keywords": [
+    "ai",
+    "ai-sdk",
+    "typescript",
+    "tanstack",
+    "opencode",
+    "harness",
+    "agent",
+    "adapter",
+    "chat",
+    "tool-calling"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "dependencies": {
+    "@opencode-ai/sdk": "^1.17.4"
+  },
+  "peerDependencies": {
+    "@tanstack/ai": "workspace:^",
+    "@tanstack/ai-sandbox": "workspace:^"
+  },
+  "devDependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-sandbox": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-opencode/src/adapters/text.ts b/packages/ai-opencode/src/adapters/text.ts
new file mode 100644
index 000000000..0c0da8751
--- /dev/null
+++ b/packages/ai-opencode/src/adapters/text.ts
@@ -0,0 +1,333 @@
+import { EventType, normalizeSystemPrompts } from '@tanstack/ai'
+import { toRunErrorRawEvent } from '@tanstack/ai/adapter-internals'
+import { BaseTextAdapter } from '@tanstack/ai/adapters'
+import {
+  SandboxCapability,
+  buildApprovalRequestedEvent,
+  getSandbox,
+  hostForSandbox,
+  startHostToolBridge,
+} from '@tanstack/ai-sandbox'
+import { buildPrompt } from '../messages/prompt'
+import { startOpencodeSession } from '../process/server'
+import { startOpencodeServerInSandbox } from '../process/sandbox-server'
+import { resolveInteractivePermission } from '../process/permissions'
+import { AsyncQueue } from '../stream/queue'
+import { translateOpencodeStream } from '../stream/translate'
+import type { HostToolBridge, SandboxHandle } from '@tanstack/ai-sandbox'
+import type {
+  StructuredOutputOptions,
+  StructuredOutputResult,
+} from '@tanstack/ai/adapters'
+import type {
+  DefaultMessageMetadataByModality,
+  Modality,
+  StreamChunk,
+  TextOptions,
+} from '@tanstack/ai'
+import type { OpencodeSessionHandle } from '../process/server'
+import type {
+  OpencodePermissionMode,
+  PermissionHandler,
+} from '../process/permissions'
+import type { OpencodeStreamEvent } from '../stream/sdk-types'
+import type { OpencodeModel } from '../model-meta'
+import type { OpencodeTextProviderOptions } from '../provider-options'
+
+const DEFAULT_WORKDIR = '/workspace'
+const DEFAULT_PORT = 4096
+
+/** Construction-time settings for {@link OpencodeTextAdapter}. */
+export interface OpencodeTextConfig {
+  /**
+   * Working directory inside the sandbox. Defaults to `/workspace`. A per-call
+   * `modelOptions.directory` takes precedence over this value.
+   */
+  directory?: string
+  /**
+   * Port the in-sandbox `opencode serve` listens on. Defaults to 4096. For the
+   * Docker provider this port must also be published (`publishPorts: [4096]`)
+   * so the host can reach it.
+   */
+  port?: number
+  /** Hostname the in-sandbox server binds. Defaults to `0.0.0.0`. */
+  hostname?: string
+  /**
+   * OpenCode permission mode driving the dynamic permission handler. Defaults
+   * to `'default'`; set `'acceptEdits'` / `'bypassPermissions'` to let the
+   * harness edit files and run commands autonomously inside the sandbox.
+   * A per-call `modelOptions.permissionMode` takes precedence over this value.
+   */
+  permissionMode?: OpencodePermissionMode
+  /** Custom permission handler; replaces the adapter's default policy. */
+  onPermissionRequest?: PermissionHandler
+}
+
+/**
+ * Separates a `provider/model` id at its first `/`.
+ *
+ * @param model - Id such as `anthropic/claude-sonnet-4-5`; any later `/`
+ *   stays in the model half.
+ * @returns The provider and model halves.
+ * @throws Error when there is no `/`, or when either side of the first `/`
+ *   is empty.
+ */
+function splitModel(model: string): { providerID: string; modelID: string } {
+  const separatorAt = model.indexOf('/')
+  const hasProvider = separatorAt > 0
+  const hasModel = separatorAt < model.length - 1
+  if (!hasProvider || !hasModel) {
+    throw new Error(
+      `OpenCode models must be addressed as "provider/model" (e.g. "anthropic/claude-sonnet-4-5"); received "${model}".`,
+    )
+  }
+  const providerID = model.slice(0, separatorAt)
+  const modelID = model.slice(separatorAt + 1)
+  return { providerID, modelID }
+}
+
+/**
+ * Text adapter that drives an `opencode serve` process running inside the
+ * sandbox supplied through `options.capabilities`.
+ *
+ * Failures raised while setting up or streaming a run are reported as a
+ * `RUN_ERROR` chunk instead of being thrown. Structured output is not
+ * supported.
+ */
+export class OpencodeTextAdapter<
+  TModel extends OpencodeModel,
+> extends BaseTextAdapter<
+  TModel,
+  OpencodeTextProviderOptions,
+  ReadonlyArray<Modality> & readonly ['text'],
+  DefaultMessageMetadataByModality,
+  ReadonlyArray<string>,
+  unknown,
+  never
+> {
+  readonly name = 'opencode' as const
+
+  override readonly requires = [SandboxCapability] as const
+
+  // Agent runs inside the persistent sandbox; the engine can re-attach to the
+  // still-running process on resume (live re-attach verified with the real CLI;
+  // the engine seam is unit-tested).
+  readonly supportsReattach = true
+
+  private readonly adapterConfig: OpencodeTextConfig
+
+  constructor(config: OpencodeTextConfig, model: TModel) {
+    super({}, model)
+    this.adapterConfig = config
+  }
+
+  /**
+   * Resolves the sandbox handle from the call's capabilities.
+   *
+   * @throws Error when `options.capabilities` is missing, i.e. no sandbox
+   *   middleware was configured for this `chat()` call.
+   */
+  private sandboxFrom(
+    options: TextOptions<OpencodeTextProviderOptions>,
+  ): SandboxHandle {
+    const ctx = options.capabilities
+    if (!ctx) {
+      throw new Error(
+        'Adapter "opencode" requires a sandbox. Add withSandbox(defineSandbox({ ... })) to chat() middleware.',
+      )
+    }
+    return getSandbox(ctx)
+  }
+
+  /**
+   * Prepends the non-blank system prompts (joined by blank lines) to `prompt`;
+   * returns `prompt` unchanged when there are none.
+   */
+  private applySystemPrompts(
+    options: TextOptions<OpencodeTextProviderOptions>,
+    prompt: string,
+  ): string {
+    const systemPrompts = normalizeSystemPrompts(options.systemPrompts)
+      .map((systemPrompt) => systemPrompt.content)
+      .filter((content) => content.trim() !== '')
+    if (systemPrompts.length === 0) return prompt
+    return `${systemPrompts.join('\n\n')}\n\n${prompt}`
+  }
+
+  /**
+   * Runs one chat turn against OpenCode inside the sandbox and yields the
+   * translated stream chunks.
+   *
+   * Steps: start the host tool bridge (only when tools were passed), start the
+   * in-sandbox server, open or resume a session, send the prompt, translate
+   * session events, then yield any approval requests collected along the way.
+   * Errors from any of those steps are yielded as a `RUN_ERROR` chunk. The
+   * session, server and bridge are always disposed when the generator ends.
+   */
+  async *chatStream(
+    options: TextOptions<OpencodeTextProviderOptions>,
+  ): AsyncIterable<StreamChunk> {
+    const { logger } = options
+    let server:
+      | Awaited<ReturnType<typeof startOpencodeServerInSandbox>>
+      | undefined
+    let handle: OpencodeSessionHandle | undefined
+    let bridge: HostToolBridge | undefined
+    const externalSignal =
+      options.abortController?.signal ?? options.request?.signal ?? undefined
+    let onAbort: (() => void) | undefined
+
+    try {
+      const sandbox = this.sandboxFrom(options)
+      const directory =
+        options.modelOptions?.directory ??
+        this.adapterConfig.directory ??
+        DEFAULT_WORKDIR
+
+      const modelOptions = options.modelOptions
+      const sessionId = modelOptions?.sessionId
+      const { prompt: resumePrompt } = buildPrompt(options.messages, sessionId)
+      const { providerID, modelID } = splitModel(this.model)
+
+      // Bridge chat()-provided tools into the in-sandbox server over MCP
+      // (configured via OPENCODE_CONFIG_CONTENT at server spawn).
+      const bridgedToolNames = new Set(
+        (options.tools ?? []).map((tool) => tool.name),
+      )
+      if (options.tools && options.tools.length > 0) {
+        bridge = await startHostToolBridge(options.tools, {
+          hostForSandbox: hostForSandbox(sandbox.provider),
+          context: options.context,
+          ...(externalSignal ? { signal: externalSignal } : {}),
+        })
+      }
+
+      const runId = options.runId ?? this.generateId()
+      const threadId = options.threadId ?? this.generateId()
+      // Approval-requested events for `ask`-policy actions with no client
+      // decision yet, emitted after the stream so the client can approve + re-run.
+      const approvalRequests: Array<StreamChunk> = []
+
+      const queue = new AsyncQueue<OpencodeStreamEvent>()
+      const mode =
+        modelOptions?.permissionMode ??
+        this.adapterConfig.permissionMode ??
+        'default'
+      const permissionHandler: PermissionHandler =
+        this.adapterConfig.onPermissionRequest ??
+        ((request) => {
+          const result = resolveInteractivePermission(
+            request,
+            mode,
+            bridgedToolNames,
+            options.approvals,
+          )
+          if (result.approvalId !== undefined) {
+            approvalRequests.push(
+              buildApprovalRequestedEvent({
+                approvalId: result.approvalId,
+                title: result.title ?? request.title,
+                threadId,
+                runId,
+                detail: { provider: 'opencode' },
+              }),
+            )
+          }
+          return result.response
+        })
+
+      logger.request(
+        `activity=chat provider=opencode model=${this.model} sandbox=${sandbox.provider} messages=${options.messages.length} resume=${sessionId ?? 'none'}`,
+        { provider: 'opencode', model: this.model },
+      )
+
+      const serverEnv = bridge
+        ? {
+            OPENCODE_CONFIG_CONTENT: JSON.stringify({
+              mcp: {
+                [bridge.name]: {
+                  type: 'remote',
+                  url: bridge.url,
+                  enabled: true,
+                  headers: { Authorization: `Bearer ${bridge.token}` },
+                },
+              },
+            }),
+          }
+        : undefined
+
+      server = await startOpencodeServerInSandbox(sandbox, {
+        port: this.adapterConfig.port ?? DEFAULT_PORT,
+        ...(this.adapterConfig.hostname !== undefined && {
+          hostname: this.adapterConfig.hostname,
+        }),
+        cwd: directory,
+        ...(serverEnv ? { env: serverEnv } : {}),
+        ...(externalSignal ? { signal: externalSignal } : {}),
+      })
+
+      handle = await startOpencodeSession({
+        baseUrl: server.baseUrl,
+        directory,
+        providerID,
+        modelID,
+        ...(sessionId !== undefined && { resumeSessionId: sessionId }),
+        onEvent: (event) => queue.push({ kind: 'event', event }),
+        onPermissionRequest: permissionHandler,
+        onError: (error) => queue.fail(error),
+      })
+      const session = handle
+
+      if (externalSignal !== undefined) {
+        onAbort = () => void session.abort().catch(() => undefined)
+        if (externalSignal.aborted) onAbort()
+        else externalSignal.addEventListener('abort', onAbort, { once: true })
+      }
+
+      queue.push({ kind: 'session', sessionId: session.sessionId })
+
+      // A requested session that could not be resumed has no prior context, so
+      // fall back to the full-transcript prompt instead of the last message.
+      const promptText = this.applySystemPrompts(
+        options,
+        session.resumed || sessionId === undefined
+          ? resumePrompt
+          : buildPrompt(options.messages, undefined).prompt,
+      )
+
+      // Not awaited: the prompt settles in the background while the queue is
+      // drained below; its outcome ends or fails the queue.
+      session
+        .prompt(promptText)
+        .then(({ message }) => {
+          queue.push({ kind: 'done', message })
+          queue.end()
+        })
+        .catch((error: unknown) => queue.fail(error))
+
+      yield* translateOpencodeStream(queue, {
+        model: this.model,
+        runId,
+        threadId,
+        ...(options.parentRunId !== undefined && {
+          parentRunId: options.parentRunId,
+        }),
+        genId: () => this.generateId(),
+        bridgedToolNames,
+        onStreamEvent: (event) =>
+          logger.provider(`provider=opencode kind=${event.kind}`, {
+            chunk: event,
+          }),
+      })
+
+      // Surface pending approval requests (ask-policy actions awaiting a client
+      // decision); the client approves and re-runs to continue.
+      for (const event of approvalRequests) yield event
+    } catch (error: unknown) {
+      const err = error as Error & { code?: string }
+      const rawEvent = toRunErrorRawEvent(error)
+      logger.errors('opencode.chatStream fatal', {
+        error,
+        source: 'opencode.chatStream',
+      })
+      yield {
+        type: EventType.RUN_ERROR,
+        model: options.model,
+        timestamp: Date.now(),
+        message: err.message || 'Unknown error occurred',
+        ...(err.code !== undefined && { code: err.code }),
+        ...(rawEvent !== undefined && { rawEvent }),
+        error: {
+          message: err.message || 'Unknown error occurred',
+          ...(err.code !== undefined && { code: err.code }),
+        },
+      }
+    } finally {
+      if (externalSignal !== undefined && onAbort !== undefined) {
+        externalSignal.removeEventListener('abort', onAbort)
+      }
+      // Tear down in reverse start order. The nested `finally` blocks make sure
+      // the in-sandbox server and the host tool bridge are still disposed when
+      // an earlier teardown step rejects; a teardown error still propagates.
+      try {
+        await handle?.dispose()
+      } finally {
+        try {
+          await server?.dispose()
+        } finally {
+          await bridge?.close()
+        }
+      }
+    }
+  }
+
+  /**
+   * Not supported by this adapter.
+   *
+   * @returns A promise that always rejects with an explanatory `Error`.
+   */
+  structuredOutput(
+    _options: StructuredOutputOptions<OpencodeTextProviderOptions>,
+  ): Promise<StructuredOutputResult<unknown>> {
+    return Promise.reject(
+      new Error(
+        'Structured output is not yet supported by the in-sandbox OpenCode adapter. ' +
+          'Use a model adapter for structured output, or omit outputSchema.',
+      ),
+    )
+  }
+}
+
+/**
+ * Creates an OpenCode harness adapter that runs **inside a sandbox**.
+ *
+ * It declares `requires: [SandboxCapability]`, spawns `opencode serve` inside
+ * the sandbox provided by `withSandbox(...)`, exposes its port, and connects
+ * the `@opencode-ai/sdk` HTTP client to it. OpenCode owns the agent loop and
+ * executes its native tools against the sandbox workspace. The sandbox image
+ * must provide the `opencode` executable (Docker: also publish the server port
+ * via `publishPorts`). chat()-provided tools are bridged into the in-sandbox
+ * server over MCP when the adapter streams a chat.
+ *
+ * @param model - `provider/model` id, e.g. `anthropic/claude-sonnet-4-5`.
+ * @param config - Optional adapter settings; defaults to `{}`.
+ * @returns A new `OpencodeTextAdapter` bound to `model`.
+ */
+export function opencodeText<TModel extends OpencodeModel>(
+  model: TModel,
+  config: OpencodeTextConfig = {},
+): OpencodeTextAdapter<TModel> {
+  return new OpencodeTextAdapter(config, model)
+}
diff --git a/packages/ai-opencode/src/index.ts b/packages/ai-opencode/src/index.ts
new file mode 100644
index 000000000..9246d323e
--- /dev/null
+++ b/packages/ai-opencode/src/index.ts
@@ -0,0 +1,40 @@
+export { OpencodeTextAdapter, opencodeText } from './adapters/text'
+export type { OpencodeTextConfig } from './adapters/text'
+export type { OpencodeTextProviderOptions } from './provider-options'
+export { OPENCODE_MODELS } from './model-meta'
+export type { OpencodeModel, KnownOpencodeModel } from './model-meta'
+export {
+  SESSION_ID_EVENT,
+  TODO_EVENT,
+  BRIDGED_MCP_SERVER_NAME,
+  translateOpencodeStream,
+  resolveToolName,
+} from './stream/translate'
+export type { TranslateContext } from './stream/translate'
+export type {
+  OpencodeAssistantMessage,
+  OpencodeEvent,
+  OpencodePart,
+  OpencodeStreamEvent,
+  OpencodeTokens,
+  OpencodeToolState,
+} from './stream/sdk-types'
+export { resolvePermission, matchBridgedToolName } from './process/permissions'
+export type {
+  OpencodePermissionMode,
+  OpencodePermissionRequest,
+  OpencodePermissionResponse,
+  PermissionHandler,
+} from './process/permissions'
+export { startOpencodeSession } from './process/server'
+export type {
+  OpencodeSessionHandle,
+  StartOpencodeSessionOptions,
+} from './process/server'
+export { buildPrompt } from './messages/prompt'
+export type { BuiltPrompt } from './messages/prompt'
+export { startOpencodeServerInSandbox } from './process/sandbox-server'
+export type {
+  SandboxOpencodeServer,
+  StartServerOptions,
+} from './process/sandbox-server'
diff --git a/packages/ai-opencode/src/messages/prompt.ts b/packages/ai-opencode/src/messages/prompt.ts
new file mode 100644
index 000000000..bb2824e17
--- /dev/null
+++ b/packages/ai-opencode/src/messages/prompt.ts
@@ -0,0 +1,67 @@
+import type { ModelMessage } from '@tanstack/ai'
+
+export interface BuiltPrompt {
+  prompt: string
+  /** OpenCode session id to resume, when the caller threaded one through. */
+  resume?: string
+}
+
+/**
+ * Flattens message content to plain text: `null` becomes `''`, a string is
+ * returned as-is, and for part arrays only `text` parts with string content
+ * are concatenated (no separator).
+ */
+function extractText(content: ModelMessage['content']): string {
+  if (content === null) return ''
+  if (typeof content === 'string') return content
+
+  let joined = ''
+  for (const part of content) {
+    if (part.type === 'text' && typeof part.content === 'string') {
+      joined += part.content
+    }
+  }
+  return joined
+}
+
+/**
+ * Turns TanStack chat history into the prompt (and optional resume id) sent
+ * to OpenCode.
+ *
+ * When `sessionId` is given, only the trailing user message is sent and the
+ * id is echoed back as `resume`, since the harness already holds the earlier
+ * context. Otherwise earlier user/assistant turns that contain text are
+ * flattened into a "Previous conversation" preamble; tool messages and turns
+ * without text are left out (prompts are text-only in v1).
+ *
+ * @param messages - Conversation history; the last entry must be a user
+ *   message with non-blank text.
+ * @param sessionId - OpenCode session to resume, if any.
+ * @returns The prompt text, plus `resume` when `sessionId` was provided.
+ * @throws Error when the last message is not a user message with text.
+ */
+export function buildPrompt(
+  messages: Array<ModelMessage>,
+  sessionId: string | undefined,
+): BuiltPrompt {
+  const trailing = messages.at(-1)
+  let lastUserText = ''
+  if (trailing?.role === 'user') {
+    lastUserText = extractText(trailing.content).trim()
+  }
+
+  if (!lastUserText) {
+    throw new Error(
+      'OpenCode adapter requires a trailing user message with text content.',
+    )
+  }
+
+  if (sessionId !== undefined) {
+    return { prompt: lastUserText, resume: sessionId }
+  }
+
+  // Build the transcript of earlier turns, one "Speaker: text" line each.
+  const transcript: Array<string> = []
+  for (const message of messages.slice(0, -1)) {
+    if (message.role !== 'user' && message.role !== 'assistant') continue
+    const body = extractText(message.content).trim()
+    if (body === '') continue
+    const speaker = message.role === 'user' ? 'User' : 'Assistant'
+    transcript.push(`${speaker}: ${body}`)
+  }
+
+  if (transcript.length === 0) {
+    return { prompt: lastUserText }
+  }
+
+  return {
+    prompt: `Previous conversation:\n${transcript.join('\n')}\n\n${lastUserText}`,
+  }
+}
diff --git a/packages/ai-opencode/src/model-meta.ts b/packages/ai-opencode/src/model-meta.ts
new file mode 100644
index 000000000..95a4e8efd
--- /dev/null
+++ b/packages/ai-opencode/src/model-meta.ts
@@ -0,0 +1,24 @@
+/**
+ * Models known to work with OpenCode. OpenCode is provider-agnostic — it
+ * resolves any `provider/model` id its configured providers support (via the
+ * Vercel AI SDK + Models.dev), so this list exists for autocomplete. Any
+ * string is accepted via the `(string & {})` escape hatch in
+ * {@link OpencodeModel}.
+ *
+ * Models are addressed as `provider_id/model_id` (e.g.
+ * `anthropic/claude-sonnet-4-5`); the adapter splits on the first `/`.
+ */
+export const OPENCODE_MODELS = [
+  'anthropic/claude-opus-4-5',
+  'anthropic/claude-sonnet-4-5',
+  'openai/gpt-5.2',
+  'openai/gpt-5.1-codex',
+  'google/gemini-3-pro-preview',
+  'opencode/claude-sonnet-4-5',
+  'opencode/gpt-5.1-codex',
+] as const
+
+export type KnownOpencodeModel = (typeof OPENCODE_MODELS)[number]
+
+/** Any `provider/model` id accepted by OpenCode; known ids get autocomplete. */
+export type OpencodeModel = KnownOpencodeModel | (string & {})
diff --git a/packages/ai-opencode/src/process/permissions.ts b/packages/ai-opencode/src/process/permissions.ts
new file mode 100644
index 000000000..f77f329e4
--- /dev/null
+++ b/packages/ai-opencode/src/process/permissions.ts
@@ -0,0 +1,119 @@
+import { approvalId } from '@tanstack/ai-sandbox'
+
+/**
+ * Permission modes for the OpenCode adapter, mirroring the Claude Code and
+ * Gemini CLI adapters' semantics:
+ *
+ * - `'default'`: bridged TanStack tools run; anything else that asks for
+ *   permission is rejected with no prompt (a headless server must never hang
+ *   on an interactive question).
+ * - `'acceptEdits'`: additionally auto-approves file-mutation requests
+ *   (edit / write / patch).
+ * - `'bypassPermissions'`: approves everything.
+ */
+export type OpencodePermissionMode =
+  | 'default'
+  | 'acceptEdits'
+  | 'bypassPermissions'
+
+/** Structural subset of an OpenCode `permission.updated` payload. */
+export interface OpencodePermissionRequest {
+  id: string
+  sessionID: string
+  /** Permission category, e.g. `'edit'`, `'bash'`, `'webfetch'`, a tool id. */
+  type: string
+  title: string
+  /** Tool call id this permission gates, when it gates a tool. */
+  callID?: string
+}
+
+/** OpenCode permission reply: allow once, allow always, or reject. */
+export type OpencodePermissionResponse = 'once' | 'always' | 'reject'
+
+/** Custom permission handler; replaces the adapter's default policy. */
+export type PermissionHandler = (
+  request: OpencodePermissionRequest,
+) => Promise<OpencodePermissionResponse> | OpencodePermissionResponse
+
+/** Permission categories treated as file mutations for `'acceptEdits'`. */
+const EDIT_TYPES = new Set(['edit', 'write', 'patch'])
+
+/**
+ * Decide whether an OpenCode permission request targets one of the bridged
+ * TanStack tools. OpenCode names MCP tools `<server>_<tool>` (e.g.
+ * `tanstack_lookup_user`), so a request is bridged when its type or title is
+ * a registered tool name, or carries the `tanstack` server prefix.
+ */
+export function matchBridgedToolName(
+  request: OpencodePermissionRequest,
+  bridgedToolNames: ReadonlySet<string> | undefined,
+): boolean {
+  if (!bridgedToolNames || bridgedToolNames.size === 0) return false
+  const names = bridgedToolNames
+  // A field matches as a bare tool name, or behind a `tanstack_` /
+  // `tanstack.` prefix (both 9 characters, hence the single `slice(9)`).
+  const isBridged = (field: unknown): boolean => {
+    if (typeof field !== 'string' || field === '') return false
+    if (names.has(field)) return true
+    const prefixed =
+      field.startsWith('tanstack_') || field.startsWith('tanstack.')
+    return prefixed && names.has(field.slice(9))
+  }
+  return isBridged(request.type) || isBridged(request.title)
+}
+
+/**
+ * The adapter's default permission policy. Always answers immediately — never
+ * hangs a headless server on a question only an interactive user could
+ * answer.
+ */
+export function resolvePermission(
+  request: OpencodePermissionRequest,
+  mode: OpencodePermissionMode,
+  bridgedToolNames: ReadonlySet<string> | undefined,
+): OpencodePermissionResponse {
+  // Approval is granted (for this one request) when any of these hold:
+  //  - the request targets a bridged TanStack tool (allowed in every mode);
+  //  - the mode is `bypassPermissions`;
+  //  - the mode is `acceptEdits` and the request is a file-mutation category.
+  // Everything else is rejected immediately.
+  const approved =
+    matchBridgedToolName(request, bridgedToolNames) ||
+    mode === 'bypassPermissions' ||
+    (mode === 'acceptEdits' && EDIT_TYPES.has(request.type))
+  return approved ? 'once' : 'reject'
+}
+
+/**
+ * Interactive variant: when the mode/bridge policy would reject, consult the
+ * client's approval decisions. Returns the OpenCode response plus, when the
+ * action still needs a client decision, the `approvalId`/`title` the adapter
+ * should surface via an `approval-requested` event.
+ */
+export function resolveInteractivePermission(
+  request: OpencodePermissionRequest,
+  mode: OpencodePermissionMode,
+  bridgedToolNames: ReadonlySet<string> | undefined,
+  approvals: ReadonlyMap<string, boolean> | undefined,
+): {
+  response: OpencodePermissionResponse
+  approvalId?: string
+  title?: string
+} {
+  // Reuse the non-interactive policy so the two variants cannot drift apart;
+  // whatever it approves is approved here without consulting the client.
+  if (resolvePermission(request, mode, bridgedToolNames) === 'once') {
+    return { response: 'once' }
+  }
+  // Policy said reject: look for a client decision under the approval id
+  // for the permission category (or the title when the category is empty).
+  const id = approvalId({
+    provider: 'opencode',
+    kind: 'tool',
+    target: request.type || request.title,
+  })
+  const granted = approvals?.get(id)
+  if (granted !== undefined) return { response: granted ? 'once' : 'reject' }
+  // No decision yet: reject now and tell the adapter what to ask the client.
+  return { response: 'reject', approvalId: id, title: request.title }
+}
diff --git a/packages/ai-opencode/src/process/sandbox-server.ts b/packages/ai-opencode/src/process/sandbox-server.ts
new file mode 100644
index 000000000..3f1386342
--- /dev/null
+++ b/packages/ai-opencode/src/process/sandbox-server.ts
@@ -0,0 +1,94 @@
+/**
+ * Boot an `opencode serve` HTTP server INSIDE a sandbox and expose its port so
+ * the host `@opencode-ai/sdk` client can connect over `baseUrl`. Mirrors the
+ * SDK's own server launch (`opencode serve --hostname=H --port=P`, ready when
+ * stdout logs `opencode server listening`).
+ */
+import type { SandboxHandle, SpawnHandle } from '@tanstack/ai-sandbox'
+
+const READY_MARKER = 'opencode server listening'
+
+export interface SandboxOpencodeServer {
+  /** URL the host uses to reach the in-sandbox server. */
+  baseUrl: string
+  /** Stop the server process. */
+  dispose: () => Promise<void>
+}
+
+export interface StartServerOptions {
+  port: number
+  hostname?: string
+  cwd: string
+  /** Extra env for the server process (e.g. `OPENCODE_CONFIG_CONTENT`). */
+  env?: Record<string, string>
+  timeoutMs?: number
+  signal?: AbortSignal
+}
+
+export async function startOpencodeServerInSandbox(
+  sandbox: SandboxHandle,
+  options: StartServerOptions,
+): Promise<SandboxOpencodeServer> {
+  const hostname = options.hostname ?? '0.0.0.0'
+  const command = `opencode serve --hostname=${hostname} --port=${options.port}`
+  const proc: SpawnHandle = await sandbox.process.spawn(command, {
+    cwd: options.cwd,
+    ...(options.env ? { env: options.env } : {}),
+    ...(options.signal ? { signal: options.signal } : {}),
+  })
+  try {
+    await waitForReady(proc, options.timeoutMs ?? 30_000)
+    const channel = await sandbox.ports.connect(options.port)
+    return { baseUrl: channel.url, dispose: () => proc.kill() }
+  } catch (error) {
+    await proc.kill().catch(() => undefined) // startup failed: don't orphan it
+    throw error
+  }
+}
+
+function waitForReady(proc: SpawnHandle, timeoutMs: number): Promise<void> {
+  return new Promise<void>((resolve, reject) => {
+    // Stdout accumulated so far; the marker is searched in the whole text.
+    let seen = ''
+    // Holder object so reads stay typed as `boolean` across async closures
+    // (a plain `let` gets flow-narrowed to a literal and trips lint).
+    const state = { settled: false }
+
+    // Claims the single settlement slot and cancels the timeout. Returns
+    // false when the promise was already settled by another path.
+    const claim = (): boolean => {
+      if (state.settled) return false
+      state.settled = true
+      clearTimeout(timer)
+      return true
+    }
+    const succeed = (): void => {
+      if (claim()) resolve()
+    }
+    const fail = (error: unknown): void => {
+      if (claim()) reject(error)
+    }
+    const timer = setTimeout(() => {
+      fail(
+        new Error(`opencode serve did not become ready within ${timeoutMs}ms`),
+      )
+    }, timeoutMs)
+    // Scan stdout in the background until the marker shows up or it ends.
+    const scan = async (): Promise<void> => {
+      for await (const chunk of proc.stdout) {
+        seen += chunk
+        if (seen.includes(READY_MARKER)) {
+          succeed()
+          return
+        }
+      }
+      // Stdout closed without the marker: report the tail for diagnosis.
+      fail(
+        new Error(
+          `opencode serve exited before becoming ready: ${seen.slice(-500)}`,
+        ),
+      )
+    }
+    void scan().catch(fail)
+  })
+}
diff --git a/packages/ai-opencode/src/process/server.ts b/packages/ai-opencode/src/process/server.ts
new file mode 100644
index 000000000..199ead3a5
--- /dev/null
+++ b/packages/ai-opencode/src/process/server.ts
@@ -0,0 +1,250 @@
+import { createOpencode, createOpencodeClient } from '@opencode-ai/sdk'
+import type { Config, Event, OpencodeClient, Part } from '@opencode-ai/sdk'
+import type {
+  OpencodeAssistantMessage,
+  OpencodeEvent,
+} from '../stream/sdk-types'
+import type {
+  OpencodePermissionRequest,
+  OpencodePermissionResponse,
+} from './permissions'
+
+/** A live OpenCode session backed by an `opencode serve` HTTP server. */
+export interface OpencodeSessionHandle {
+  sessionId: string
+  /** Whether an existing session was actually resumed. */
+  resumed: boolean
+  /**
+   * Run one prompt turn. Resolves with the final assistant message (finish
+   * reason, token usage, error) and its concatenated text once the harness
+   * goes idle. Streaming deltas arrive via `onEvent` while this is pending.
+   */
+  prompt: (
+    text: string,
+  ) => Promise<{ message: OpencodeAssistantMessage; text: string }>
+  /** Ask the harness to abort the in-flight prompt turn. */
+  abort: () => Promise<void>
+  /** Tear down the event subscription and (if owned) the server. */
+  dispose: () => Promise<void>
+}
+
+export interface StartOpencodeSessionOptions {
+  /** Connect to an already-running server instead of spawning one. */
+  baseUrl?: string
+  /** Hostname for the spawned server. Defaults to the SDK default. */
+  hostname?: string
+  /** Port for the spawned server. Defaults to the SDK default. */
+  port?: number
+  /** Working directory for the session (absolute path). */
+  directory: string
+  /** Provider id (the part before `/` in the model id). */
+  providerID: string
+  /** Model id (the part after `/` in the model id). */
+  modelID: string
+  /** Extra OpenCode config merged with the adapter's mcp/permission config. */
+  config?: Config
+  /** Baseline permission policy applied to the spawned server. */
+  permission?: Config['permission']
+  /** MCP servers (e.g. the TanStack tool bridge) for the session. */
+  mcpServers?: Array<{ name: string; url: string }>
+  /** Session id to resume; falls back to a fresh session when not found. */
+  resumeSessionId?: string
+  onEvent: (event: OpencodeEvent) => void
+  onPermissionRequest: (
+    request: OpencodePermissionRequest,
+  ) => Promise<OpencodePermissionResponse> | OpencodePermissionResponse
+  /** Called when the event subscription fails mid-turn. */
+  onError?: (error: unknown) => void
+}
+
+/** Locate the session id an OpenCode event belongs to, when it carries one. */
+function sessionIdOf(event: Event): string | undefined {
+  // `properties.sessionID` wins; otherwise use the per-kind location.
+  const loose = event.properties as { sessionID?: string } | undefined
+  if (loose?.sessionID !== undefined) return loose.sessionID
+  switch (event.type) {
+    case 'message.part.updated':
+      return event.properties.part.sessionID
+    case 'message.updated':
+      return event.properties.info.sessionID
+    case 'permission.updated':
+      return event.properties.sessionID
+  }
+  return undefined
+}
+
+function buildConfig(options: StartOpencodeSessionOptions): Config {
+  // Bridge servers are layered over (and override) same-named user entries.
+  const mcp: NonNullable<Config['mcp']> = { ...options.config?.mcp }
+  for (const { name, url } of options.mcpServers ?? []) {
+    mcp[name] = { type: 'remote', url, enabled: true }
+  }
+  const merged: Config = { ...options.config }
+  if (Object.keys(mcp).length > 0) merged.mcp = mcp
+  if (options.permission !== undefined) merged.permission = options.permission
+  return merged
+}
+
+/**
+ * Boot (or attach to) an OpenCode HTTP server, resolve a session, and wire its
+ * event subscription + permission replies.
+ *
+ * This module is the only place that touches `@opencode-ai/sdk`; the rest of
+ * the package works with the structural types in `sdk-types.ts`.
+ *
+ * Resume semantics: when `resumeSessionId` is set and the server still knows
+ * the session (same machine, same data dir), it is reused. Otherwise a fresh
+ * session is created and `resumed: false` tells the adapter to send the
+ * flattened transcript.
+ */
+export async function startOpencodeSession(
+  options: StartOpencodeSessionOptions,
+): Promise<OpencodeSessionHandle> {
+  const { directory } = options
+
+  let client: OpencodeClient
+  let ownedServer: { close: () => void } | undefined
+
+  if (options.baseUrl !== undefined) {
+    client = createOpencodeClient({ baseUrl: options.baseUrl, directory })
+  } else {
+    const config = buildConfig(options)
+    const result = await createOpencode({
+      ...(options.hostname !== undefined && { hostname: options.hostname }),
+      ...(options.port !== undefined && { port: options.port }),
+      ...(Object.keys(config).length > 0 && { config }),
+    })
+    client = result.client
+    ownedServer = result.server
+  }
+
+  // Holder object: mutated from several closures, so reads stay typed as
+  // `boolean` instead of being flow-narrowed to a literal.
+  const lifecycle = { disposed: false }
+
+  const teardown = async (): Promise<void> => {
+    if (lifecycle.disposed) return
+    lifecycle.disposed = true
+    ownedServer?.close()
+    await Promise.resolve()
+  }
+
+  try {
+    // Resolve the session before subscribing so the event filter has an id.
+    let sessionId: string | undefined
+    let resumed = false
+    if (options.resumeSessionId !== undefined) {
+      const existing = await client.session.get({
+        path: { id: options.resumeSessionId },
+        query: { directory },
+      })
+      if (existing.data) {
+        sessionId = options.resumeSessionId
+        resumed = true
+      }
+    }
+    if (sessionId === undefined) {
+      const created = await client.session.create({
+        query: { directory },
+        body: {},
+        throwOnError: true,
+      })
+      sessionId = created.data.id
+    }
+    const resolvedSessionId = sessionId
+
+    const handlePermission = async (
+      permission: Extract<Event, { type: 'permission.updated' }>['properties'],
+    ): Promise<void> => {
+      try {
+        const response = await options.onPermissionRequest({
+          id: permission.id,
+          sessionID: permission.sessionID,
+          type: permission.type,
+          title: permission.title,
+          ...(permission.callID !== undefined && { callID: permission.callID }),
+        })
+        await client.postSessionIdPermissionsPermissionId({
+          path: { id: permission.sessionID, permissionID: permission.id },
+          query: { directory },
+          body: { response },
+          throwOnError: true,
+        })
+      } catch (error) {
+        if (!lifecycle.disposed) options.onError?.(error)
+      }
+    }
+
+    const { stream } = await client.event.subscribe()
+
+    void (async () => {
+      try {
+        for await (const event of stream) {
+          if (lifecycle.disposed) break
+          const sid = sessionIdOf(event)
+          if (sid !== undefined && sid !== resolvedSessionId) continue
+          if (event.type === 'permission.updated') {
+            void handlePermission(event.properties)
+            continue
+          }
+          // The SDK event union is a structural superset of the subset the
+          // translator consumes; unknown event types match no translator
+          // branch and are ignored.
+          options.onEvent(event as OpencodeEvent)
+        }
+      } catch (error) {
+        if (!lifecycle.disposed) options.onError?.(error)
+      }
+    })()
+
+    return {
+      sessionId: resolvedSessionId,
+      resumed,
+      prompt: async (text: string) => {
+        const result = await client.session.prompt({
+          path: { id: resolvedSessionId },
+          query: { directory },
+          body: {
+            model: { providerID: options.providerID, modelID: options.modelID },
+            parts: [{ type: 'text', text }],
+          },
+          throwOnError: true,
+        })
+        const data = result.data
+        const message = data.info as OpencodeAssistantMessage
+        const responseText = data.parts
+          .filter(
+            (part): part is Extract<Part, { type: 'text' }> =>
+              part.type === 'text',
+          )
+          .map((part) => part.text)
+          .join('')
+        return { message, text: responseText }
+      },
+      abort: async () => {
+        try {
+          await client.session.abort({
+            path: { id: resolvedSessionId },
+            query: { directory },
+          })
+        } catch {
+          // Best-effort: the turn may already be finishing.
+        }
+      },
+      dispose: async () => {
+        // Idempotent, like `teardown`: only the first call closes anything.
+        if (lifecycle.disposed) return
+        lifecycle.disposed = true
+        try {
+          await stream.return(undefined)
+        } catch {
+          // Ignore: stream may already be closed.
+        }
+        ownedServer?.close()
+      },
+    }
+  } catch (error) {
+    await teardown()
+    throw error
+  }
+}
diff --git a/packages/ai-opencode/src/provider-options.ts b/packages/ai-opencode/src/provider-options.ts
new file mode 100644
index 000000000..79c65e3f5
--- /dev/null
+++ b/packages/ai-opencode/src/provider-options.ts
@@ -0,0 +1,19 @@
+import type { OpencodePermissionMode } from './process/permissions'
+
+/**
+ * Per-call provider options for the OpenCode adapter, passed via
+ * `modelOptions` on `chat()`.
+ */
+export interface OpencodeTextProviderOptions {
+  /**
+   * Resume an existing OpenCode session. The adapter emits the session id of
+   * every fresh run via a CUSTOM `opencode.session-id` stream event; thread
+   * it back here to continue that session (only the latest user message is
+   * sent — the harness already holds the prior context).
+   */
+  sessionId?: string
+  /** Per-call override of the configured permission mode. */
+  permissionMode?: OpencodePermissionMode
+  /** Per-call override of the harness working directory. */
+  directory?: string
+}
diff --git a/packages/ai-opencode/src/stream/queue.ts b/packages/ai-opencode/src/stream/queue.ts
new file mode 100644
index 000000000..f0f37c5e9
--- /dev/null
+++ b/packages/ai-opencode/src/stream/queue.ts
@@ -0,0 +1,64 @@
+/**
+ * Minimal promise-based async queue bridging the OpenCode event
+ * subscription's callback-style notifications into the async-iterable world
+ * the stream translator consumes.
+ */
+export class AsyncQueue<T> implements AsyncIterable<T> {
+  /** Values pushed while no reader was waiting, oldest first. */
+  private readonly values: Array<T> = []
+  /** Readers parked in `next()` while the buffer was empty, oldest first. */
+  private readonly waiters: Array<{
+    resolve: (result: IteratorResult<T>) => void
+    reject: (error: unknown) => void
+  }> = []
+  private ended = false
+  private error: unknown = undefined
+  private failed = false
+
+  /** True once the queue has ended or failed; later signals are ignored. */
+  private get closed(): boolean {
+    return this.ended || this.failed
+  }
+
+  /** Hand `value` to the oldest parked reader, or buffer it when none waits. */
+  push(value: T): void {
+    if (this.closed) return
+    const waiter = this.waiters.shift()
+    if (waiter === undefined) this.values.push(value)
+    else waiter.resolve({ value, done: false })
+  }
+
+  /** Signal normal completion; reads resolve as done once the buffer drains. */
+  end(): void {
+    if (this.closed) return
+    this.ended = true
+    const parked = this.waiters.splice(0)
+    parked.forEach((w) => w.resolve({ value: undefined, done: true }))
+  }
+
+  /** Signal failure; reads reject with `error` once the buffer drains. */
+  fail(error: unknown): void {
+    if (this.closed) return
+    this.failed = true
+    this.error = error
+    const parked = this.waiters.splice(0)
+    parked.forEach((w) => w.reject(error))
+  }
+
+  /** Iterators are stateless views: each reads from the same shared buffer. */
+  [Symbol.asyncIterator](): AsyncIterator<T> {
+    const next = (): Promise<IteratorResult<T>> => {
+      // Buffered values are delivered before any failure or completion.
+      if (this.values.length > 0) {
+        const value = this.values.shift() as T
+        return Promise.resolve({ value, done: false })
+      }
+      if (this.failed) return Promise.reject(this.error)
+      if (this.ended) return Promise.resolve({ value: undefined, done: true })
+      return new Promise((resolve, reject) => {
+        this.waiters.push({ resolve, reject })
+      })
+    }
+    return { next }
+  }
+}
diff --git a/packages/ai-opencode/src/stream/sdk-types.ts b/packages/ai-opencode/src/stream/sdk-types.ts
new file mode 100644
index 000000000..8deb3ce87
--- /dev/null
+++ b/packages/ai-opencode/src/stream/sdk-types.ts
@@ -0,0 +1,104 @@
+/**
+ * Structural subset of the `@opencode-ai/sdk` event types that the stream
+ * translator consumes.
+ *
+ * These are intentionally defined structurally (rather than imported from the
+ * OpenCode SDK) so the translator stays a pure, fixture-testable state machine
+ * and the package's public types don't depend on the SDK's generated schema
+ * types. Unknown part or event types fall through every branch at runtime.
+ */
+
+export interface OpencodeTokens {
+  input?: number
+  output?: number
+  reasoning?: number
+  cache?: { read?: number; write?: number }
+}
+
+/** Error payload attached to a failed assistant message. */
+export interface OpencodeMessageError {
+  name: string
+  data?: { message?: string }
+}
+
+/**
+ * The final assistant message of a turn, returned by the blocking prompt
+ * call. Carries the finish reason, token usage, and any fatal error.
+ */
+export interface OpencodeAssistantMessage {
+  id: string
+  role: 'assistant'
+  finish?: string
+  error?: OpencodeMessageError
+  tokens?: OpencodeTokens
+  cost?: number
+}
+
+export type OpencodeToolState =
+  | { status: 'pending'; input?: Record<string, unknown> }
+  | {
+      status: 'running'
+      input?: Record<string, unknown>
+      title?: string
+    }
+  | {
+      status: 'completed'
+      input?: Record<string, unknown>
+      output: string
+      title?: string
+    }
+  | { status: 'error'; input?: Record<string, unknown>; error: string }
+
+/**
+ * The OpenCode message-part kinds the translator understands. The trailing
+ * catch-all member keeps the union open to other kinds (file, step-start,
+ * step-finish, snapshot, patch, agent, ...); the translator dispatches via
+ * the `is*Part` type guards, so those kinds simply match no guard.
+ */
+export type OpencodePart =
+  | { id: string; sessionID?: string; type: 'text'; text: string }
+  | { id: string; sessionID?: string; type: 'reasoning'; text: string }
+  | {
+      id: string
+      sessionID?: string
+      type: 'tool'
+      callID: string
+      tool: string
+      state: OpencodeToolState
+    }
+  | { id: string; sessionID?: string; type: string }
+
+/**
+ * The OpenCode events the translator understands. This is a closed
+ * discriminated union (so `event.type` narrows cleanly); the server forwards
+ * raw SDK events cast to this type, and any event whose `type` isn't listed
+ * here simply matches no branch and is ignored at runtime.
+ */
+export type OpencodeEvent =
+  | {
+      type: 'message.part.updated'
+      properties: { part: OpencodePart; delta?: string }
+    }
+  | {
+      type: 'message.updated'
+      properties: { info: { sessionID?: string } }
+    }
+  | { type: 'session.idle'; properties: { sessionID: string } }
+  | {
+      type: 'session.error'
+      properties: { sessionID?: string; error?: OpencodeMessageError }
+    }
+  | {
+      type: 'todo.updated'
+      properties: { sessionID: string; todos: Array<unknown> }
+    }
+
+/**
+ * Events fed to the translator: the session id once established, every
+ * session-scoped OpenCode event, and a terminal `done` carrying the final
+ * assistant message (the adapter's async queue produces these).
+ */
+export type OpencodeStreamEvent =
+  | { kind: 'session'; sessionId: string }
+  | { kind: 'event'; event: OpencodeEvent }
+  | { kind: 'done'; message: OpencodeAssistantMessage }
diff --git a/packages/ai-opencode/src/stream/translate.ts b/packages/ai-opencode/src/stream/translate.ts
new file mode 100644
index 000000000..2db145fa9
--- /dev/null
+++ b/packages/ai-opencode/src/stream/translate.ts
@@ -0,0 +1,419 @@
+import { EventType, buildBaseUsage } from '@tanstack/ai'
+import type { StreamChunk, TokenUsage } from '@tanstack/ai'
+import type {
+  OpencodeAssistantMessage,
+  OpencodeEvent,
+  OpencodePart,
+  OpencodeStreamEvent,
+  OpencodeTokens,
+} from './sdk-types'
+
+/** Name of the CUSTOM event carrying the OpenCode session id. */
+export const SESSION_ID_EVENT = 'opencode.session-id'
+
+/** Name of the CUSTOM event carrying the harness's todo list updates. */
+export const TODO_EVENT = 'opencode.todo'
+
+/** Server name used for bridged TanStack tools. */
+export const BRIDGED_MCP_SERVER_NAME = 'tanstack'
+
+export interface TranslateContext {
+  model: string
+  runId: string
+  threadId: string
+  parentRunId?: string
+  genId: () => string
+  /**
+   * Names of bridged TanStack tools, used to surface the harness's MCP tool
+   * calls under the names the application registered.
+   */
+  bridgedToolNames?: ReadonlySet<string>
+  /** Called for each raw stream event, for logging. */
+  onStreamEvent?: (event: OpencodeStreamEvent) => void
+}
+
+/**
+ * Resolve the AG-UI tool-call name for an OpenCode tool part. OpenCode names
+ * MCP tools `<server>_<tool>`, so bridged TanStack tools arrive as
+ * `tanstack_<tool>` and are surfaced under the names the application
+ * registered; everything else (built-in `read`, `edit`, `bash`, ... and
+ * foreign MCP tools) uses the harness tool name verbatim.
+ */
+export function resolveToolName(
+  tool: string,
+  bridgedToolNames: ReadonlySet<string> | undefined,
+): string {
+  // Bridged MCP tools arrive as `tanstack_<tool>`; the 9-character prefix is
+  // dropped only when the remainder is a registered tool name. Anything else
+  // (including an exact registered name) keeps the harness name verbatim.
+  const bare = tool.startsWith('tanstack_') ? tool.slice(9) : undefined
+  if (bare === undefined || bridgedToolNames?.has(tool)) return tool
+  return bridgedToolNames?.has(bare) ? bare : tool
+}
+
+function buildUsage(
+  tokens: OpencodeTokens | undefined,
+): TokenUsage | undefined {
+  if (!tokens) return undefined
+  // Missing counts are treated as zero; the total is input + output only.
+  const input = tokens.input ?? 0
+  const output = tokens.output ?? 0
+  const usage = buildBaseUsage({
+    promptTokens: input,
+    completionTokens: output,
+    totalTokens: input + output,
+  })
+  // Detail buckets are attached only for non-zero counts.
+  const cachedTokens = tokens.cache?.read
+  if (cachedTokens) usage.promptTokensDetails = { cachedTokens }
+  const reasoningTokens = tokens.reasoning
+  if (reasoningTokens) usage.completionTokensDetails = { reasoningTokens }
+  return usage
+}
+
+type TextPart = Extract<OpencodePart, { type: 'text' }>
+type ReasoningPart = Extract<OpencodePart, { type: 'reasoning' }>
+type ToolPart = Extract<OpencodePart, { type: 'tool' }>
+
+const isTextPart = (part: OpencodePart): part is TextPart =>
+  part.type === 'text'
+const isReasoningPart = (part: OpencodePart): part is ReasoningPart =>
+  part.type === 'reasoning'
+const isToolPart = (part: OpencodePart): part is ToolPart =>
+  part.type === 'tool'
+
+function messageError(
+  message: OpencodeAssistantMessage,
+): { message: string } | undefined {
+  const err = message.error // detailed message preferred, else the error name
+  return err ? { message: err.data?.message ?? err.name } : undefined
+}
+
+/**
+ * Translate an OpenCode event stream into AG-UI StreamChunk events.
+ *
+ * The harness runs its own agent loop and executes its own tools, so the
+ * translation always ends with `finishReason: 'stop'` (or `'length'` /
+ * RUN_ERROR) — never `'tool_calls'`. Harness tool activity is emitted as
+ * already-resolved TOOL_CALL_START/ARGS/END + TOOL_CALL_RESULT sequences so
+ * UIs can render it, while the TanStack engine never tries to execute them.
+ *
+ * OpenCode delivers true token-level deltas for both assistant text and
+ * reasoning via `message.part.updated` events (a `delta` string when
+ * incremental, otherwise the full part text, from which the delta is
+ * derived). The final assistant message — finish reason, token usage, and any
+ * fatal error — arrives as the terminal `done` event.
+ *
+ * Invariant: every TOOL_CALL_START is eventually paired with a
+ * TOOL_CALL_RESULT (synthesized as `{"status":"interrupted"}` when the run
+ * ends or aborts before the harness reported one) so the engine's
+ * pending-tool-call scan on the next request never force-executes them.
+ */
+export async function* translateOpencodeStream(
+  events: AsyncIterable<OpencodeStreamEvent>,
+  ctx: TranslateContext,
+): AsyncIterable<StreamChunk> {
+  const { model, runId, threadId, genId } = ctx
+  const now = () => Date.now()
+
+  let runStarted = false
+  /** Tool calls started but with no result yet, keyed by callID. */
+  const unresolvedToolCalls = new Set<string>()
+  /** Tool call ids that already emitted TOOL_CALL_START/ARGS/END. */
+  const openedToolCalls = new Set<string>()
+  /** Tool call ids that already emitted a TOOL_CALL_RESULT. */
+  const resolvedToolCalls = new Set<string>()
+
+  /** Accumulated text per text-part id, for delta derivation. */
+  const textAccumulators = new Map<string, string>()
+  let openTextId: string | null = null
+  let openReasoningId: string | null = null
+
+  function* startRun(): Generator<StreamChunk> {
+    if (runStarted) return
+    runStarted = true
+    yield {
+      type: EventType.RUN_STARTED,
+      runId,
+      threadId,
+      model,
+      timestamp: now(),
+      ...(ctx.parentRunId !== undefined && { parentRunId: ctx.parentRunId }),
+    }
+  }
+
+  function* closeText(): Generator<StreamChunk> {
+    if (openTextId !== null) {
+      yield {
+        type: EventType.TEXT_MESSAGE_END,
+        messageId: openTextId,
+        model,
+        timestamp: now(),
+      }
+      openTextId = null
+    }
+  }
+
+  function* closeReasoning(): Generator<StreamChunk> {
+    if (openReasoningId !== null) {
+      yield {
+        type: EventType.REASONING_MESSAGE_END,
+        messageId: openReasoningId,
+        model,
+        timestamp: now(),
+      }
+      yield {
+        type: EventType.REASONING_END,
+        messageId: openReasoningId,
+        model,
+        timestamp: now(),
+      }
+      openReasoningId = null
+    }
+  }
+
+  function* synthesizeUnresolvedResults(): Generator<StreamChunk> {
+    for (const toolCallId of unresolvedToolCalls) {
+      yield {
+        type: EventType.TOOL_CALL_RESULT,
+        toolCallId,
+        messageId: genId(),
+        model,
+        timestamp: now(),
+        content: JSON.stringify({ status: 'interrupted' }),
+      }
+    }
+    unresolvedToolCalls.clear()
+  }
+  // Turn a text part update into TEXT_MESSAGE_START / CONTENT chunks.
+  function* handleTextPart(
+    part: Extract<OpencodePart, { type: 'text' }>,
+    delta: string | undefined,
+  ): Generator<StreamChunk> {
+    yield* closeReasoning() // text ends any open reasoning part
+
+    const prev = textAccumulators.get(part.id) ?? ''
+    let deltaText: string
+    if (typeof delta === 'string' && delta !== '') { // explicit delta wins
+      deltaText = delta
+      textAccumulators.set(part.id, prev + delta)
+    } else { // otherwise diff the full-text snapshot against `prev`
+      const full = part.text
+      deltaText = full.startsWith(prev) ? full.slice(prev.length) : full
+      textAccumulators.set(part.id, full)
+    }
+    if (deltaText === '') return // nothing new to emit
+
+    if (openTextId !== part.id) { // switching to a different text part
+      yield* closeText()
+      openTextId = part.id
+      yield {
+        type: EventType.TEXT_MESSAGE_START,
+        messageId: part.id,
+        model,
+        timestamp: now(),
+        role: 'assistant',
+      }
+    }
+    yield {
+      type: EventType.TEXT_MESSAGE_CONTENT,
+      messageId: part.id,
+      model,
+      timestamp: now(),
+      delta: deltaText,
+      content: textAccumulators.get(part.id) ?? deltaText, // text so far
+    }
+  }
+  // Turn a reasoning part update into REASONING_* start / content chunks.
+  function* handleReasoningPart(
+    part: Extract<OpencodePart, { type: 'reasoning' }>,
+    delta: string | undefined,
+  ): Generator<StreamChunk> {
+    yield* closeText() // reasoning ends any open text message
+
+    const prev = textAccumulators.get(part.id) ?? '' // map keyed by part id
+    let deltaText: string
+    if (typeof delta === 'string' && delta !== '') { // explicit delta wins
+      deltaText = delta
+      textAccumulators.set(part.id, prev + delta)
+    } else { // otherwise diff the full-text snapshot against `prev`
+      const full = part.text
+      deltaText = full.startsWith(prev) ? full.slice(prev.length) : full
+      textAccumulators.set(part.id, full)
+    }
+    if (deltaText === '') return // nothing new to emit
+
+    if (openReasoningId !== part.id) { // switching to a different part
+      yield* closeReasoning()
+      openReasoningId = part.id
+      yield {
+        type: EventType.REASONING_START,
+        messageId: part.id,
+        model,
+        timestamp: now(),
+      }
+      yield {
+        type: EventType.REASONING_MESSAGE_START,
+        messageId: part.id,
+        role: 'reasoning' as const,
+        model,
+        timestamp: now(),
+      }
+    }
+    yield {
+      type: EventType.REASONING_MESSAGE_CONTENT,
+      messageId: part.id,
+      delta: deltaText, // only the delta is sent; no accumulated content field
+      model,
+      timestamp: now(),
+    }
+  }
+  // Emit TOOL_CALL_START/ARGS/END once per callID, then mark it unresolved.
+  function* openToolCall(
+    part: Extract<OpencodePart, { type: 'tool' }>,
+  ): Generator<StreamChunk> {
+    if (openedToolCalls.has(part.callID)) return // already opened
+    openedToolCalls.add(part.callID)
+    const toolCallName = resolveToolName(part.tool, ctx.bridgedToolNames)
+    const input = part.state.input ?? {} // missing input serializes as {}
+    const args = JSON.stringify(input)
+    yield {
+      type: EventType.TOOL_CALL_START,
+      toolCallId: part.callID,
+      toolCallName,
+      toolName: toolCallName,
+      model,
+      timestamp: now(),
+    }
+    yield {
+      type: EventType.TOOL_CALL_ARGS,
+      toolCallId: part.callID,
+      model,
+      timestamp: now(),
+      delta: args, // the whole argument JSON goes out as a single delta
+      args,
+    }
+    yield {
+      type: EventType.TOOL_CALL_END,
+      toolCallId: part.callID,
+      toolCallName,
+      toolName: toolCallName,
+      model,
+      timestamp: now(),
+      input,
+    }
+    unresolvedToolCalls.add(part.callID) // pending until a result is emitted
+  }
+  // Open the tool call if needed; emit its result once completed or errored.
+  function* handleToolPart(
+    part: Extract<OpencodePart, { type: 'tool' }>,
+  ): Generator<StreamChunk> {
+    yield* closeText()
+    yield* closeReasoning()
+    yield* openToolCall(part) // no-op when this callID was opened before
+
+    const state = part.state
+    if (state.status !== 'completed' && state.status !== 'error') return
+    if (resolvedToolCalls.has(part.callID)) return // result already emitted
+    resolvedToolCalls.add(part.callID)
+    unresolvedToolCalls.delete(part.callID)
+
+    const isError = state.status === 'error'
+    yield {
+      type: EventType.TOOL_CALL_RESULT,
+      toolCallId: part.callID,
+      messageId: genId(),
+      model,
+      timestamp: now(),
+      content: isError ? state.error : state.output,
+      ...(isError && { state: 'output-error' as const }), // errors only
+    }
+  }
+  // Dispatch one OpenCode event: part updates by kind, todo updates as CUSTOM.
+  function* handleEvent(event: OpencodeEvent): Generator<StreamChunk> {
+    if (event.type === 'message.part.updated') {
+      const { part, delta } = event.properties
+      if (isTextPart(part)) {
+        yield* handleTextPart(part, delta)
+      } else if (isReasoningPart(part)) {
+        yield* handleReasoningPart(part, delta)
+      } else if (isToolPart(part)) {
+        yield* handleToolPart(part) // tool parts carry no delta
+      }
+      // Other part kinds (file, step-start/finish, snapshot, ...) carry no
+      // state the chunk stream needs.
+    } else if (event.type === 'todo.updated') {
+      yield {
+        type: EventType.CUSTOM,
+        model,
+        timestamp: now(),
+        name: TODO_EVENT,
+        value: { todos: event.properties.todos },
+      }
+    }
+    // session.idle / session.status / message.updated are redundant with the
+    // terminal `done` event and are ignored.
+  }
+  // Terminal message: close open output, then emit RUN_ERROR or RUN_FINISHED.
+  function* finish(message: OpencodeAssistantMessage): Generator<StreamChunk> {
+    yield* startRun() // NOTE(review): presumably a no-op once started — confirm
+    yield* closeText()
+    yield* closeReasoning()
+    yield* synthesizeUnresolvedResults()
+
+    const error = messageError(message)
+    if (error) {
+      yield {
+        type: EventType.RUN_ERROR,
+        model,
+        timestamp: now(),
+        message: error.message,
+        error,
+      }
+      return // an errored run emits no RUN_FINISHED
+    }
+
+    const usage = buildUsage(message.tokens)
+    const finishReason = message.finish === 'length' ? 'length' : 'stop'
+    yield {
+      type: EventType.RUN_FINISHED,
+      runId,
+      threadId,
+      model,
+      timestamp: now(),
+      finishReason,
+      ...(usage !== undefined && { usage }), // omit the key when absent
+    }
+  }
+  // Main loop: session and event kinds are translated; anything else finishes.
+  try {
+    for await (const streamEvent of events) {
+      ctx.onStreamEvent?.(streamEvent) // optional raw-event tap, called first
+
+      if (streamEvent.kind === 'session') {
+        yield* startRun()
+        yield {
+          type: EventType.CUSTOM,
+          model,
+          timestamp: now(),
+          name: SESSION_ID_EVENT,
+          value: { sessionId: streamEvent.sessionId },
+        }
+      } else if (streamEvent.kind === 'event') {
+        yield* startRun()
+        yield* handleEvent(streamEvent.event)
+      } else {
+        yield* finish(streamEvent.message) // the loop keeps reading afterwards
+      }
+    }
+  } catch (error) {
+    // The run is dying (abort, server exit, or connection failure). Close any
+    // open message and pair started tool calls with a synthetic result first
+    // so the next request's pending-tool-call scan doesn't try to execute
+    // them, then let the adapter surface the error as RUN_ERROR.
+    yield* closeText()
+    yield* closeReasoning()
+    yield* synthesizeUnresolvedResults()
+    throw error // rethrown unchanged after the cleanup chunks
+  }
+}
diff --git a/packages/ai-opencode/tests/permissions.test.ts b/packages/ai-opencode/tests/permissions.test.ts
new file mode 100644
index 000000000..ebbb30016
--- /dev/null
+++ b/packages/ai-opencode/tests/permissions.test.ts
@@ -0,0 +1,118 @@
+import { describe, expect, it } from 'vitest'
+import {
+  matchBridgedToolName,
+  resolvePermission,
+} from '../src/process/permissions'
+import type { OpencodePermissionRequest } from '../src/process/permissions'
+// Permission-request fixture; `overrides` replace individual default fields.
+function request(
+  overrides: Partial<OpencodePermissionRequest> = {},
+): OpencodePermissionRequest {
+  return {
+    id: 'perm-1',
+    sessionID: 'sess-1',
+    type: 'bash',
+    title: 'Run a command',
+    ...overrides, // spread last so overrides win
+  }
+}
+// Which permission requests count as calls to a bridged (registered) tool.
+describe('matchBridgedToolName', () => {
+  const bridged = new Set(['lookup_user'])
+
+  it('returns false without bridged tools', () => {
+    expect(
+      matchBridgedToolName(request({ type: 'lookup_user' }), undefined),
+    ).toBe(false)
+    expect(
+      matchBridgedToolName(request({ type: 'lookup_user' }), new Set()),
+    ).toBe(false)
+  })
+
+  it('matches a bare registered tool name in type or title', () => {
+    expect(
+      matchBridgedToolName(request({ type: 'lookup_user' }), bridged),
+    ).toBe(true)
+    expect(
+      matchBridgedToolName(
+        request({ type: 'tool', title: 'lookup_user' }),
+        bridged,
+      ),
+    ).toBe(true)
+  })
+
+  it('matches the tanstack_ and tanstack. server prefixes', () => {
+    expect(
+      matchBridgedToolName(request({ type: 'tanstack_lookup_user' }), bridged),
+    ).toBe(true)
+    expect(
+      matchBridgedToolName(request({ type: 'tanstack.lookup_user' }), bridged),
+    ).toBe(true)
+  })
+
+  it('does not match foreign tools', () => {
+    expect(
+      matchBridgedToolName(request({ type: 'github_create_issue' }), bridged),
+    ).toBe(false)
+  })
+})
+// Permission decision per mode: bridged tools pass, the rest depends on mode.
+describe('resolvePermission', () => {
+  const bridged = new Set(['lookup_user'])
+
+  it('always allows bridged tools regardless of mode', () => {
+    for (const mode of [
+      'default',
+      'acceptEdits',
+      'bypassPermissions',
+    ] as const) {
+      expect(
+        resolvePermission(
+          request({ type: 'tanstack_lookup_user' }),
+          mode,
+          bridged,
+        ),
+      ).toBe('once')
+    }
+  })
+
+  it('rejects everything else in default mode', () => {
+    expect(
+      resolvePermission(request({ type: 'bash' }), 'default', bridged),
+    ).toBe('reject')
+    expect(
+      resolvePermission(request({ type: 'edit' }), 'default', bridged),
+    ).toBe('reject')
+    expect(
+      resolvePermission(request({ type: 'webfetch' }), 'default', bridged),
+    ).toBe('reject')
+  })
+
+  it('auto-approves file mutations only in acceptEdits mode', () => {
+    for (const type of ['edit', 'write', 'patch']) {
+      expect(resolvePermission(request({ type }), 'acceptEdits', bridged)).toBe(
+        'once',
+      )
+    }
+    expect(
+      resolvePermission(request({ type: 'bash' }), 'acceptEdits', bridged),
+    ).toBe('reject')
+  })
+
+  it('approves everything in bypassPermissions mode', () => {
+    expect(
+      resolvePermission(
+        request({ type: 'bash' }),
+        'bypassPermissions',
+        bridged,
+      ),
+    ).toBe('once')
+    expect(
+      resolvePermission(
+        request({ type: 'webfetch' }),
+        'bypassPermissions',
+        undefined,
+      ),
+    ).toBe('once')
+  })
+})
diff --git a/packages/ai-opencode/tests/prompt.test.ts b/packages/ai-opencode/tests/prompt.test.ts
new file mode 100644
index 000000000..b2285eeb3
--- /dev/null
+++ b/packages/ai-opencode/tests/prompt.test.ts
@@ -0,0 +1,92 @@
+import { describe, expect, it } from 'vitest'
+import { buildPrompt } from '../src/messages/prompt'
+import type { ModelMessage } from '@tanstack/ai'
+// Message fixtures: wrap `content` in a user / assistant ModelMessage.
+const user = (content: ModelMessage['content']): ModelMessage => ({
+  role: 'user',
+  content,
+})
+const assistant = (content: ModelMessage['content']): ModelMessage => ({
+  role: 'assistant',
+  content,
+})
+// buildPrompt: resume vs. fresh session, history flattening, text extraction.
+describe('buildPrompt', () => {
+  it('resumes with only the last user message when sessionId is provided', () => {
+    const result = buildPrompt(
+      [
+        user('first question'),
+        assistant('first answer'),
+        user('follow-up question'),
+      ],
+      'sess-1',
+    )
+    expect(result).toEqual({ prompt: 'follow-up question', resume: 'sess-1' })
+  })
+
+  it('throws when sessionId is provided but there is no trailing user message', () => {
+    expect(() => buildPrompt([user('q'), assistant('a')], 'sess-1')).toThrow(
+      /user message/i,
+    )
+  })
+
+  it('sends a single user message as-is for a fresh session', () => {
+    expect(buildPrompt([user('hello')], undefined)).toEqual({ prompt: 'hello' })
+  })
+
+  it('flattens prior turns into a transcript preamble for fresh multi-turn history', () => {
+    const { prompt, resume } = buildPrompt(
+      [user('What is 2+2?'), assistant('4'), user('And times 3?')],
+      undefined,
+    )
+    expect(resume).toBeUndefined()
+    expect(prompt).toBe(
+      'Previous conversation:\nUser: What is 2+2?\nAssistant: 4\n\nAnd times 3?',
+    )
+  })
+
+  it('skips tool messages and assistant tool-call-only turns when flattening', () => {
+    const messages: Array<ModelMessage> = [
+      user('list files'),
+      {
+        role: 'assistant',
+        content: null,
+        toolCalls: [
+          {
+            id: 't1',
+            type: 'function',
+            function: { name: 'ls', arguments: '{}' },
+          },
+        ],
+      } as unknown as ModelMessage,
+      { role: 'tool', content: 'file-a', toolCallId: 't1' },
+      assistant('There is one file.'),
+      user('thanks, which one?'),
+    ]
+    const { prompt } = buildPrompt(messages, undefined)
+    expect(prompt).toBe(
+      'Previous conversation:\nUser: list files\nAssistant: There is one file.\n\nthanks, which one?',
+    )
+  })
+
+  it('extracts text from content-part arrays and ignores non-text parts', () => {
+    const { prompt } = buildPrompt(
+      [
+        user([
+          { type: 'text', content: 'describe ' },
+          {
+            type: 'image',
+            source: { type: 'url', url: 'https://x/y.png' },
+          } as never,
+          { type: 'text', content: 'this' },
+        ] as ModelMessage['content']),
+      ],
+      undefined,
+    )
+    expect(prompt).toBe('describe this') // text parts are joined as-is
+  })
+
+  it('throws when there is no usable user content at all', () => {
+    expect(() => buildPrompt([], undefined)).toThrow(/user message/i)
+  })
+})
diff --git a/packages/ai-opencode/tests/text-adapter.test.ts b/packages/ai-opencode/tests/text-adapter.test.ts
new file mode 100644
index 000000000..0ab5f0fce
--- /dev/null
+++ b/packages/ai-opencode/tests/text-adapter.test.ts
@@ -0,0 +1,109 @@
+/**
+ * Tests for the in-sandbox OpenCode adapter.
+ *
+ * The OpenCode HTTP session logic belongs to `@opencode-ai/sdk` and is reused
+ * unchanged via its `baseUrl` connect path; the new piece is spawning
+ * `opencode serve` inside the sandbox and exposing its port. These tests cover
+ * that server-launch helper (readiness detection + port exposure) and the
+ * adapter's missing-sandbox path. A full session round-trip is covered by the
+ * gated live path.
+ */
+import { describe, expect, it } from 'vitest'
+import { startOpencodeServerInSandbox } from '../src/process/sandbox-server'
+import { opencodeText } from '../src/index'
+import type { InternalLogger } from '@tanstack/ai/adapter-internals'
+import type { StreamChunk } from '@tanstack/ai'
+import type { SandboxHandle, SpawnHandle } from '@tanstack/ai-sandbox'
+// Logger stub: every method is a no-op; the cast skips full type conformance.
+const noopLogger = {
+  request: () => {},
+  provider: () => {},
+  errors: () => {},
+  agentLoop: () => {},
+  warnings: () => {},
+  debug: () => {},
+} as unknown as InternalLogger
+// Async iterable over `values`; awaits a resolved promise before each item.
+async function* chunks(values: Array<string>): AsyncIterable<string> {
+  for (const v of values) {
+    await Promise.resolve()
+    yield v
+  }
+}
+
+/** Mock sandbox whose spawn emits a scripted stdout and whose port resolves. */
+function mockSandbox(stdout: Array<string>): SandboxHandle {
+  const spawnHandle: SpawnHandle = {
+    pid: 1,
+    stdout: chunks(stdout),
+    stderr: chunks([]), // stderr stays empty
+    stdin: { write: () => Promise.resolve(), end: () => Promise.resolve() },
+    wait: () => Promise.resolve(0), // presumably the exit code — confirm
+    kill: () => Promise.resolve(),
+  }
+  return {
+    id: 'sbx',
+    provider: 'mock',
+    capabilities: {} as SandboxHandle['capabilities'], // empty stub via cast
+    fs: {} as SandboxHandle['fs'], // empty stub via cast
+    git: {} as SandboxHandle['git'], // empty stub via cast
+    process: {
+      exec: () => Promise.reject(new Error('unused')),
+      spawn: () => Promise.resolve(spawnHandle), // same handle on every call
+    },
+    ports: {
+      connect: (port) => Promise.resolve({ url: `http://127.0.0.1:${port}` }),
+    },
+    env: { set: () => Promise.resolve() },
+    destroy: () => Promise.resolve(),
+  }
+}
+// Drain an async chunk stream into an array, preserving order.
+async function collect(
+  stream: AsyncIterable<StreamChunk>,
+): Promise<Array<StreamChunk>> {
+  const out: Array<StreamChunk> = []
+  for await (const chunk of stream) out.push(chunk)
+  return out
+}
+// Server-launch helper, driven by scripted stdout from the mock sandbox.
+describe('startOpencodeServerInSandbox', () => {
+  it('resolves baseUrl once the server logs readiness', async () => {
+    const sandbox = mockSandbox([
+      'booting...\n',
+      'opencode server listening on http://0.0.0.0:4096\n',
+    ])
+    const server = await startOpencodeServerInSandbox(sandbox, {
+      port: 4096,
+      cwd: '/workspace',
+    })
+    expect(server.baseUrl).toBe('http://127.0.0.1:4096') // mock connect() url
+    await server.dispose()
+  })
+
+  it('rejects if the server exits before becoming ready', async () => {
+    const sandbox = mockSandbox(['fatal: cannot bind port\n'])
+    await expect(
+      startOpencodeServerInSandbox(sandbox, {
+        port: 4096,
+        cwd: '/workspace',
+        timeoutMs: 1000,
+      }),
+    ).rejects.toThrow(/before becoming ready/i)
+  })
+})
+// Without a sandbox the adapter must surface a RUN_ERROR chunk, not throw.
+describe('opencode adapter', () => {
+  it('requires a sandbox capability', async () => {
+    const adapter = opencodeText('anthropic/claude-sonnet-4-5')
+    const result = await collect(
+      adapter.chatStream({
+        model: 'anthropic/claude-sonnet-4-5',
+        messages: [{ role: 'user', content: 'hi' }],
+        logger: noopLogger,
+      }),
+    )
+    const err = result.find((c) => c.type === 'RUN_ERROR') // may be undefined
+    expect((err as { message?: string }).message).toMatch(/requires a sandbox/i)
+  })
+})
diff --git a/packages/ai-opencode/tests/translate.test.ts b/packages/ai-opencode/tests/translate.test.ts
new file mode 100644
index 000000000..0b48da075
--- /dev/null
+++ b/packages/ai-opencode/tests/translate.test.ts
@@ -0,0 +1,410 @@
+import { describe, expect, it } from 'vitest'
+import {
+  SESSION_ID_EVENT,
+  TODO_EVENT,
+  resolveToolName,
+  translateOpencodeStream,
+} from '../src/stream/translate'
+import type { TranslateContext } from '../src/stream/translate'
+import type {
+  OpencodeAssistantMessage,
+  OpencodeStreamEvent,
+} from '../src/stream/sdk-types'
+import type { StreamChunk } from '@tanstack/ai'
+// Default TranslateContext with a deterministic genId (gen-1, gen-2, ...).
+function makeCtx(overrides: Partial<TranslateContext> = {}): TranslateContext {
+  let id = 0 // counter is private to each context
+  return {
+    model: 'anthropic/claude-sonnet-4-5',
+    runId: 'run-1',
+    threadId: 'thread-1',
+    genId: () => `gen-${++id}`,
+    ...overrides, // spread last so overrides win
+  }
+}
+// Replay an array of stream events as an async iterable, in order.
+async function* fromArray(
+  events: Array<OpencodeStreamEvent>,
+): AsyncIterable<OpencodeStreamEvent> {
+  for (const event of events) yield event
+}
+// Run the translator over `events` and gather every emitted chunk.
+async function collect(
+  events: Array<OpencodeStreamEvent>,
+  ctx: TranslateContext = makeCtx(),
+): Promise<Array<StreamChunk>> {
+  const chunks: Array<StreamChunk> = []
+  for await (const chunk of translateOpencodeStream(fromArray(events), ctx)) {
+    chunks.push(chunk)
+  }
+  return chunks
+}
+// Session event fixture that the tests below send first.
+const session: OpencodeStreamEvent = { kind: 'session', sessionId: 'sess-1' }
+// Terminal `done` event; `overrides` patch the default assistant message.
+function done(
+  overrides: Partial<OpencodeAssistantMessage> = {},
+): OpencodeStreamEvent {
+  return {
+    kind: 'done',
+    message: { id: 'msg-1', role: 'assistant', finish: 'stop', ...overrides },
+  }
+}
+// Text-part update event; the `delta` property is included only when given.
+function textPart(
+  id: string,
+  text: string,
+  delta?: string,
+): OpencodeStreamEvent {
+  return {
+    kind: 'event',
+    event: {
+      type: 'message.part.updated',
+      properties: {
+        part: { id, sessionID: 'sess-1', type: 'text', text },
+        ...(delta !== undefined && { delta }), // '' still counts as given
+      },
+    },
+  }
+}
+// Chunk sequences that translateOpencodeStream emits for scripted event lists.
+describe('translateOpencodeStream', () => {
+  it('translates a simple text turn', async () => {
+    const chunks = await collect([
+      session,
+      textPart('part-1', 'hi there', 'hi there'),
+      done(),
+    ])
+
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'TEXT_MESSAGE_START',
+      'TEXT_MESSAGE_CONTENT',
+      'TEXT_MESSAGE_END',
+      'RUN_FINISHED',
+    ])
+    expect(chunks[1]).toMatchObject({
+      name: SESSION_ID_EVENT,
+      value: { sessionId: 'sess-1' },
+    })
+    expect(chunks[3]).toMatchObject({ delta: 'hi there', content: 'hi there' })
+    expect(chunks.at(-1)).toMatchObject({ finishReason: 'stop' })
+  })
+
+  it('accumulates incremental text deltas', async () => {
+    const chunks = await collect([
+      session,
+      textPart('part-1', 'Hel', 'Hel'),
+      textPart('part-1', 'Hello', 'lo'),
+      done(),
+    ])
+    const contents = chunks.filter((c) => c.type === 'TEXT_MESSAGE_CONTENT')
+    expect(contents).toHaveLength(2)
+    expect(contents[0]).toMatchObject({ delta: 'Hel', content: 'Hel' })
+    expect(contents[1]).toMatchObject({ delta: 'lo', content: 'Hello' })
+    // A single START/END pair for the one part id.
+    expect(chunks.filter((c) => c.type === 'TEXT_MESSAGE_START')).toHaveLength(
+      1,
+    )
+    expect(chunks.filter((c) => c.type === 'TEXT_MESSAGE_END')).toHaveLength(1)
+  })
+
+  it('derives the delta from full-text snapshots when no delta is given', async () => {
+    const chunks = await collect([
+      session,
+      textPart('part-1', 'Hel'),
+      textPart('part-1', 'Hello'),
+      done(),
+    ])
+    const contents = chunks.filter((c) => c.type === 'TEXT_MESSAGE_CONTENT')
+    expect(contents[0]).toMatchObject({ delta: 'Hel' })
+    expect(contents[1]).toMatchObject({ delta: 'lo', content: 'Hello' })
+  })
+
+  it('reports usage with cache and reasoning details', async () => {
+    const chunks = await collect([
+      session,
+      done({
+        tokens: {
+          input: 100,
+          output: 20,
+          reasoning: 5,
+          cache: { read: 40, write: 0 },
+        },
+      }),
+    ])
+    const finished = chunks.at(-1) as unknown as {
+      usage: Record<string, unknown>
+    }
+    expect(finished.usage).toMatchObject({
+      promptTokens: 100,
+      completionTokens: 20,
+      totalTokens: 120,
+      promptTokensDetails: { cachedTokens: 40 },
+      completionTokensDetails: { reasoningTokens: 5 },
+    })
+  })
+
+  it('maps a length finish to finishReason length', async () => {
+    const chunks = await collect([session, done({ finish: 'length' })])
+    expect(chunks.at(-1)).toMatchObject({ finishReason: 'length' })
+  })
+
+  it('translates a reasoning part into a reasoning sequence', async () => {
+    const chunks = await collect([
+      session,
+      {
+        kind: 'event',
+        event: {
+          type: 'message.part.updated',
+          properties: {
+            part: {
+              id: 'r-1',
+              sessionID: 'sess-1',
+              type: 'reasoning',
+              text: 'thinking',
+            },
+            delta: 'thinking',
+          },
+        },
+      },
+      done(),
+    ])
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'REASONING_START',
+      'REASONING_MESSAGE_START',
+      'REASONING_MESSAGE_CONTENT',
+      'REASONING_MESSAGE_END',
+      'REASONING_END',
+      'RUN_FINISHED',
+    ])
+  })
+  // Tool-part update fixture; `state` is loosely typed and cast when embedded.
+  function toolEvent(
+    callID: string,
+    tool: string,
+    state: Record<string, unknown>,
+  ): OpencodeStreamEvent {
+    return {
+      kind: 'event',
+      event: {
+        type: 'message.part.updated',
+        properties: {
+          part: {
+            id: `part-${callID}`,
+            sessionID: 'sess-1',
+            type: 'tool',
+            callID,
+            tool,
+            state: state as never,
+          },
+        },
+      },
+    }
+  }
+
+  it('pairs a tool call across running and completed states', async () => {
+    const chunks = await collect([
+      session,
+      toolEvent('call-1', 'bash', {
+        status: 'running',
+        input: { command: 'ls' },
+      }),
+      toolEvent('call-1', 'bash', {
+        status: 'completed',
+        input: { command: 'ls' },
+        output: 'file.txt',
+        title: 'ls',
+      }),
+      done(),
+    ])
+    expect(chunks.map((c) => c.type)).toEqual([
+      'RUN_STARTED',
+      'CUSTOM',
+      'TOOL_CALL_START',
+      'TOOL_CALL_ARGS',
+      'TOOL_CALL_END',
+      'TOOL_CALL_RESULT',
+      'RUN_FINISHED',
+    ])
+    expect(chunks[2]).toMatchObject({
+      toolCallId: 'call-1',
+      toolCallName: 'bash',
+    })
+    expect(chunks[3]).toMatchObject({ args: JSON.stringify({ command: 'ls' }) })
+    expect(chunks[5]).toMatchObject({ content: 'file.txt' })
+    expect((chunks[5] as { state?: string }).state).toBeUndefined()
+  })
+
+  it('marks tool errors as output-error', async () => {
+    const chunks = await collect([
+      session,
+      toolEvent('call-2', 'bash', {
+        status: 'error',
+        input: { command: 'false' },
+        error: 'exit 1',
+      }),
+      done(),
+    ])
+    expect(chunks.find((c) => c.type === 'TOOL_CALL_RESULT')).toMatchObject({
+      content: 'exit 1',
+      state: 'output-error',
+    })
+  })
+
+  it('does not duplicate START events across repeated tool updates', async () => {
+    const chunks = await collect([
+      session,
+      toolEvent('call-3', 'read', { status: 'pending', input: {} }),
+      toolEvent('call-3', 'read', { status: 'running', input: { path: 'a' } }),
+      toolEvent('call-3', 'read', {
+        status: 'completed',
+        input: { path: 'a' },
+        output: 'data',
+        title: 'read a',
+      }),
+      done(),
+    ])
+    expect(chunks.filter((c) => c.type === 'TOOL_CALL_START')).toHaveLength(1)
+    expect(chunks.filter((c) => c.type === 'TOOL_CALL_RESULT')).toHaveLength(1)
+  })
+
+  it('surfaces bridged MCP tool calls under the registered name', async () => {
+    const chunks = await collect(
+      [
+        session,
+        toolEvent('call-4', 'tanstack_lookup_user', {
+          status: 'completed',
+          input: { userId: '7' },
+          output: '{"name":"Ada"}',
+          title: 'lookup_user',
+        }),
+        done(),
+      ],
+      makeCtx({ bridgedToolNames: new Set(['lookup_user']) }),
+    )
+    expect(chunks.find((c) => c.type === 'TOOL_CALL_START')).toMatchObject({
+      toolCallName: 'lookup_user',
+    })
+    expect(chunks.find((c) => c.type === 'TOOL_CALL_RESULT')).toMatchObject({
+      content: '{"name":"Ada"}',
+    })
+  })
+
+  it('synthesizes interrupted results for unresolved tool calls on done', async () => {
+    const chunks = await collect([
+      session,
+      toolEvent('call-9', 'bash', {
+        status: 'running',
+        input: { command: 'sleep 100' },
+      }),
+      done(),
+    ])
+    const result = chunks.find((c) => c.type === 'TOOL_CALL_RESULT')
+    expect(result).toMatchObject({
+      toolCallId: 'call-9',
+      content: JSON.stringify({ status: 'interrupted' }),
+    })
+    expect(chunks.at(-1)).toMatchObject({ type: 'RUN_FINISHED' })
+  })
+
+  it('maps a message error to RUN_ERROR', async () => {
+    const chunks = await collect([
+      session,
+      done({
+        finish: undefined,
+        error: { name: 'ProviderAuthError', data: { message: 'no key' } },
+      }),
+    ])
+    expect(chunks.at(-1)).toMatchObject({
+      type: 'RUN_ERROR',
+      message: 'no key',
+    })
+  })
+
+  it('emits a todo CUSTOM event', async () => {
+    const chunks = await collect([
+      session,
+      {
+        kind: 'event',
+        event: {
+          type: 'todo.updated',
+          properties: {
+            sessionID: 'sess-1',
+            todos: [{ content: 'step 1', status: 'pending' }],
+          },
+        },
+      },
+      done(),
+    ])
+    expect(
+      chunks.find((c) => c.type === 'CUSTOM' && c.name === TODO_EVENT),
+    ).toBeDefined()
+  })
+
+  it('forwards raw stream events to onStreamEvent', async () => {
+    const kinds: Array<string> = []
+    await collect(
+      [session, textPart('p', 'hi', 'hi'), done()],
+      makeCtx({ onStreamEvent: (event) => kinds.push(event.kind) }),
+    )
+    expect(kinds).toEqual(['session', 'event', 'done'])
+  })
+
+  it('synthesizes results then rethrows when the source stream throws', async () => {
+    async function* failing(): AsyncIterable<OpencodeStreamEvent> {
+      yield session
+      yield {
+        kind: 'event',
+        event: {
+          type: 'message.part.updated',
+          properties: {
+            part: {
+              id: 'p-c',
+              sessionID: 'sess-1',
+              type: 'tool',
+              callID: 'call-7',
+              tool: 'bash',
+              state: { status: 'running', input: {} } as never,
+            },
+          },
+        },
+      }
+      throw new Error('aborted')
+    }
+
+    const chunks: Array<StreamChunk> = []
+    await expect(async () => {
+      for await (const chunk of translateOpencodeStream(failing(), makeCtx())) {
+        chunks.push(chunk)
+      }
+    }).rejects.toThrow('aborted')
+    expect(chunks.at(-1)).toMatchObject({
+      type: 'TOOL_CALL_RESULT',
+      toolCallId: 'call-7',
+      content: JSON.stringify({ status: 'interrupted' }),
+    })
+  })
+})
+// resolveToolName: only bridged tools lose their tanstack_ prefix.
+describe('resolveToolName', () => {
+  it('returns the tool name verbatim without bridged names', () => {
+    expect(resolveToolName('bash', undefined)).toBe('bash')
+    expect(resolveToolName('edit', new Set())).toBe('edit')
+  })
+
+  it('strips the tanstack_ prefix for bridged tools', () => {
+    const bridged = new Set(['lookup_user'])
+    expect(resolveToolName('tanstack_lookup_user', bridged)).toBe('lookup_user')
+    expect(resolveToolName('lookup_user', bridged)).toBe('lookup_user')
+  })
+
+  it('leaves foreign tool names untouched', () => {
+    expect(
+      resolveToolName('github_create_issue', new Set(['lookup_user'])),
+    ).toBe('github_create_issue')
+  })
+})
diff --git a/packages/ai-opencode/tsconfig.json b/packages/ai-opencode/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-opencode/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-opencode/vite.config.ts b/packages/ai-opencode/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-opencode/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+// Vitest settings for this package: node environment, v8 coverage over src.
+const config = defineConfig({
+  test: {
+    name: packageJson.name,
+    dir: './',
+    watch: false,
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: [
+        'node_modules/',
+        'dist/',
+        'tests/',
+        '**/*.test.ts',
+        '**/*.config.ts',
+        '**/types.ts',
+      ],
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+// Combine the test config with the shared TanStack Vite build config.
+export default mergeConfig(
+  config,
+  tanstackViteConfig({
+    entry: ['./src/index.ts'],
+    srcDir: './src',
+    cjs: false, // presumably ESM-only output — confirm against vite-config
+  }),
+)
diff --git a/packages/ai-persistence-cloudflare/package.json b/packages/ai-persistence-cloudflare/package.json
new file mode 100644
index 000000000..e54b32a36
--- /dev/null
+++ b/packages/ai-persistence-cloudflare/package.json
@@ -0,0 +1,52 @@
+{
+  "name": "@tanstack/ai-persistence-cloudflare",
+  "version": "0.1.0",
+  "description": "Cloudflare backend for TanStack AI persistence — D1-backed SQL stores (compile-verified), with optional Durable Object locks; R2 artifact storage is a planned follow-up.",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-persistence-cloudflare"
+  },
+  "keywords": [
+    "ai",
+    "tanstack",
+    "persistence"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "peerDependencies": {
+    "@tanstack/ai": "workspace:^",
+    "@tanstack/ai-persistence": "workspace:^",
+    "@tanstack/ai-persistence-sql": "workspace:^"
+  },
+  "devDependencies": {
+    "@cloudflare/workers-types": "^4.20241230.0",
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-persistence": "workspace:*",
+    "@tanstack/ai-persistence-sql": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-persistence-cloudflare/src/index.ts b/packages/ai-persistence-cloudflare/src/index.ts
new file mode 100644
index 000000000..75732ecfd
--- /dev/null
+++ b/packages/ai-persistence-cloudflare/src/index.ts
@@ -0,0 +1,91 @@
+/// <reference types="@cloudflare/workers-types" />
+/**
+ * Cloudflare backend. D1 (SQLite-compatible) backs the shared SQL stores; an
+ * optional Durable Object namespace can back the distributed lock.
+ *
+ * COMPILE-VERIFIED ONLY: this package type-checks against real `@cloudflare`
+ * types but is not runtime-verified here (it needs a Workers runtime). The D1
+ * driver itself is unit-tested against a fake D1 so the adapter logic is
+ * covered. R2-backed artifact bytes are a documented follow-up — artifacts
+ * persist inline in D1 today.
+ */
+import { createSqlPersistence } from '@tanstack/ai-persistence-sql'
+import type { SqlDriver, SqlRow } from '@tanstack/ai-persistence-sql'
+import type { ChatPersistence, PersistenceMode } from '@tanstack/ai-persistence'
+import type { LockStore } from '@tanstack/ai'
+
+/**
+ * Adapt a Cloudflare D1 database to the shared {@link SqlDriver} contract,
+ * reporting the `sqlite` dialect.
+ *
+ * @param d1 - D1 binding every statement is prepared against.
+ * @returns A driver whose `exec` runs a bound statement and discards the
+ *   outcome, and whose `query` resolves to the `results` array of `all()`.
+ */
+export function createD1Driver(d1: D1Database): SqlDriver {
+  // Prepare `sql` and bind its positional parameters in one step.
+  const bindStatement = (sql: string, params: ReadonlyArray<unknown>) =>
+    d1.prepare(sql).bind(...(params as Array<never>))
+
+  const self: SqlDriver = {
+    dialect: 'sqlite',
+    async exec(sql, params = []) {
+      await bindStatement(sql, params).run()
+    },
+    async query<T extends SqlRow = SqlRow>(
+      sql: string,
+      params: ReadonlyArray<unknown> = [],
+    ) {
+      const { results } = await bindStatement(sql, params).all<T>()
+      return results
+    },
+    // D1 offers batch but no interactive transactions, so the callback runs
+    // against this same driver with no BEGIN/COMMIT around it.
+    transaction: (fn) => fn(self),
+  }
+  return self
+}
+
+/** Options accepted by {@link cloudflarePersistence}. */
+export interface CloudflarePersistenceOptions {
+  /** D1 database backing the SQL stores (wrapped via {@link createD1Driver}). */
+  d1: D1Database
+  /** Optional Durable Object namespace for the distributed lock (see {@link createDurableObjectLockStore}). */
+  durableObjects?: DurableObjectNamespace
+  /** Optional R2 bucket for artifact blobs (follow-up; artifacts persist in D1 for now). */
+  r2?: R2Bucket
+  /** Persistence mode, forwarded unchanged to `createSqlPersistence`. */
+  mode?: PersistenceMode
+  /** Run migrations on first use (default true). */
+  migrate?: boolean
+}
+
+/**
+ * Assemble a {@link ChatPersistence} whose SQL stores run on Cloudflare D1.
+ *
+ * @param opts - D1 binding plus optional lock namespace, mode and migrate flag.
+ * @returns The SQL persistence; its `locks` store is replaced by a Durable
+ *   Object lock store only when `opts.durableObjects` is provided.
+ */
+export function cloudflarePersistence(
+  opts: CloudflarePersistenceOptions,
+): ChatPersistence {
+  const { d1, durableObjects, mode, migrate } = opts
+  const stores = createSqlPersistence(createD1Driver(d1), { mode, migrate })
+  if (!durableObjects) return stores
+  stores.locks = createDurableObjectLockStore(durableObjects)
+  return stores
+}
+
+/**
+ * Distributed lock over a Durable Object namespace. The companion DO class must
+ * implement a `fetch` that serializes by holding the single-threaded DO; this
+ * acquires by calling the DO keyed by the lock name. COMPILE-VERIFIED ONLY.
+ *
+ * @param ns - Namespace whose objects are addressed via `idFromName(key)`.
+ * @returns A {@link LockStore} whose `withLock` runs `fn` between an
+ *   `/acquire` and a `/release` request to the object for `key`.
+ * @throws Error when the acquire request answers with a non-2xx status; `fn`
+ *   is not run in that case.
+ */
+export function createDurableObjectLockStore(
+  ns: DurableObjectNamespace,
+): LockStore {
+  return {
+    async withLock<T>(key: string, fn: () => Promise<T>): Promise<T> {
+      const stub = ns.get(ns.idFromName(key))
+      // Acquire: the DO returns 200 once it holds the turn for this key. Any
+      // other status means the turn was NOT granted, so running `fn` would
+      // silently drop mutual exclusion; fail loudly instead.
+      const acquired = await stub.fetch('https://lock/acquire')
+      if (!acquired.ok) {
+        throw new Error(
+          `Durable Object lock "${key}" was not acquired (HTTP ${acquired.status})`,
+        )
+      }
+      try {
+        return await fn()
+      } finally {
+        // Always hand the turn back, whether `fn` resolved or rejected.
+        await stub.fetch('https://lock/release')
+      }
+    },
+  }
+}
diff --git a/packages/ai-persistence-cloudflare/tests/d1.test.ts b/packages/ai-persistence-cloudflare/tests/d1.test.ts
new file mode 100644
index 000000000..78f93705e
--- /dev/null
+++ b/packages/ai-persistence-cloudflare/tests/d1.test.ts
@@ -0,0 +1,64 @@
+/// <reference types="@cloudflare/workers-types" />
+import { describe, expect, it } from 'vitest'
+import { DatabaseSync } from 'node:sqlite'
+import { EventType } from '@tanstack/ai'
+import type { StreamChunk } from '@tanstack/ai'
+import { cloudflarePersistence, createD1Driver } from '../src/index'
+
+/**
+ * Minimal stand-in for a D1 binding, served by an in-memory node:sqlite
+ * database. Only `prepare` exists; the statement it returns supports `bind`,
+ * `run` and `all` for real, while `first` and `raw` are inert stubs.
+ */
+function fakeD1(): D1Database {
+  const sqlite = new DatabaseSync(':memory:')
+
+  function prepare(sql: string) {
+    // Parameters captured by the latest bind() call on this statement.
+    let args: Array<unknown> = []
+    const statement = {
+      bind(...values: Array<unknown>) {
+        args = values
+        return statement
+      },
+      run() {
+        sqlite.prepare(sql).run(...(args as Array<never>))
+        return Promise.resolve({ success: true })
+      },
+      all() {
+        const results = sqlite.prepare(sql).all(...(args as Array<never>))
+        return Promise.resolve({ results })
+      },
+      first: () => Promise.resolve(null),
+      raw: () => Promise.resolve([]),
+    }
+    return statement
+  }
+
+  return { prepare } as unknown as D1Database
+}
+
+/** Build a TEXT_MESSAGE_CONTENT chunk carrying `delta` for message `m1`. */
+function text(delta: string): StreamChunk {
+  return {
+    type: EventType.TEXT_MESSAGE_CONTENT,
+    messageId: 'm1',
+    delta,
+    timestamp: 1,
+  }
+}
+
+describe('cloudflarePersistence (D1 via fake backed by node:sqlite)', () => {
+  // Writes one run and two text events, then reads the status, the latest
+  // sequence number and the replayed deltas back through the same stores.
+  it('round-trips runs and events through the D1 driver', async () => {
+    const persistence = cloudflarePersistence({ d1: fakeD1() })
+    const runs = persistence.runs!
+    const events = persistence.events!
+
+    await runs.createOrResume({ runId: 'r1', threadId: 't1', startedAt: 1 })
+    await events.append('r1', 1, text('a'))
+    await events.append('r1', 2, text('b'))
+
+    const run = await runs.get('r1')
+    expect(run?.status).toBe('running')
+    const latest = await events.latestSeq('r1')
+    expect(latest).toBe(2)
+
+    const seen: Array<string> = []
+    for await (const entry of events.read('r1', { afterSeq: 0 })) {
+      if (entry.event.type !== 'TEXT_MESSAGE_CONTENT') continue
+      seen.push(entry.event.delta)
+    }
+    expect(seen).toEqual(['a', 'b'])
+  })
+
+  it('createD1Driver reports the sqlite dialect', () => {
+    const driver = createD1Driver(fakeD1())
+    expect(driver.dialect).toBe('sqlite')
+  })
+})
diff --git a/packages/ai-persistence-cloudflare/tsconfig.json b/packages/ai-persistence-cloudflare/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-persistence-cloudflare/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-persistence-cloudflare/vite.config.ts b/packages/ai-persistence-cloudflare/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-persistence-cloudflare/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+// Paths left out of the coverage report.
+const coverageExclude = [
+  'node_modules/',
+  'dist/',
+  'tests/',
+  '**/*.test.ts',
+  '**/*.config.ts',
+  '**/types.ts',
+]
+
+// Vitest settings: project named after the package, node environment,
+// globals enabled, watch mode off.
+const config = defineConfig({
+  test: {
+    name: packageJson.name,
+    dir: './',
+    watch: false,
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: coverageExclude,
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+
+// Library build from the shared TanStack preset: single entry, `cjs: false`.
+const libraryConfig = tanstackViteConfig({
+  entry: ['./src/index.ts'],
+  srcDir: './src',
+  cjs: false,
+})
+
+export default mergeConfig(config, libraryConfig)
diff --git a/packages/ai-persistence-drizzle/package.json b/packages/ai-persistence-drizzle/package.json
new file mode 100644
index 000000000..c6ba3ab66
--- /dev/null
+++ b/packages/ai-persistence-drizzle/package.json
@@ -0,0 +1,51 @@
+{
+  "name": "@tanstack/ai-persistence-drizzle",
+  "version": "0.1.0",
+  "description": "Drizzle ORM backend for TanStack AI persistence — bring your own Drizzle db (sqlite or postgres dialect); persists over the underlying client.",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-persistence-drizzle"
+  },
+  "keywords": [
+    "ai",
+    "tanstack",
+    "persistence"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "peerDependencies": {
+    "@tanstack/ai": "workspace:^",
+    "@tanstack/ai-persistence": "workspace:^",
+    "@tanstack/ai-persistence-sql": "workspace:^"
+  },
+  "devDependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-persistence": "workspace:*",
+    "@tanstack/ai-persistence-sql": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-persistence-drizzle/src/index.ts b/packages/ai-persistence-drizzle/src/index.ts
new file mode 100644
index 000000000..315dd5fcc
--- /dev/null
+++ b/packages/ai-persistence-drizzle/src/index.ts
@@ -0,0 +1,100 @@
+/**
+ * Drizzle backend (bring-your-own). A Drizzle `db` exposes its underlying client
+ * at `db.$client`: a `better-sqlite3`/`node:sqlite`-shaped handle for the sqlite
+ * dialect, or a node-postgres `Pool` for the postgres dialect. This adapter
+ * unwraps `$client` and persists over it through the shared SQL stores — so it
+ * reuses the exact, tested driver logic rather than re-deriving SQL through
+ * Drizzle's query builder.
+ *
+ * Schema: the tables are the same as the raw SQL backend. `ddl` is re-exported
+ * so you can apply them with your own Drizzle migration workflow
+ * (`migrate: false`), or you can let the backend auto-migrate.
+ */
+import { createSqlPersistence, ddl } from '@tanstack/ai-persistence-sql'
+import type { Dialect, SqlDriver, SqlRow } from '@tanstack/ai-persistence-sql'
+import type { ChatPersistence, PersistenceMode } from '@tanstack/ai-persistence'
+
+export { ddl }
+
+/** SQLite-shaped client (node:sqlite DatabaseSync / better-sqlite3 Database). */
+interface SqliteClient {
+  /** Create a statement for `sql`; the driver prepares a new one per call. */
+  prepare: (sql: string) => {
+    /** Execute with positional parameters; the driver ignores the result. */
+    run: (...params: Array<unknown>) => unknown
+    /** Execute with positional parameters; the driver returns the array as rows. */
+    all: (...params: Array<unknown>) => Array<unknown>
+  }
+}
+/** node-postgres Pool-shaped client. */
+interface PgClient {
+  /** Run `sql` with optional positional `params`; the driver reads only `rows`. */
+  query: (
+    sql: string,
+    params?: ReadonlyArray<unknown>,
+  ) => Promise<{ rows: Array<Record<string, unknown>> }>
+}
+
+/** A Drizzle db exposing its underlying driver client. */
+export interface DrizzleDb {
+  /**
+   * Underlying driver client. Typed `unknown`; `drizzlePersistence` treats it
+   * as a sqlite- or pg-shaped client according to the `dialect` option.
+   */
+  $client: unknown
+}
+
+/**
+ * Wrap a synchronous SQLite client in the promise-based {@link SqlDriver}.
+ *
+ * `exec` and `query` are `async` so that an exception thrown synchronously by
+ * `prepare`/`run`/`all` (bad SQL, constraint violation) surfaces as a rejected
+ * promise, matching `pgDriver`, instead of escaping the call itself and
+ * bypassing `.catch()` handlers.
+ *
+ * @param client - Handle exposing `prepare(sql).run/all`.
+ * @returns A `sqlite`-dialect driver; `transaction` runs its callback against
+ *   this same driver without issuing BEGIN/COMMIT.
+ */
+function sqliteDriver(client: SqliteClient): SqlDriver {
+  const driver: SqlDriver = {
+    dialect: 'sqlite',
+    async exec(sql, params = []) {
+      client.prepare(sql).run(...params)
+    },
+    async query<T extends SqlRow = SqlRow>(
+      sql: string,
+      params: ReadonlyArray<unknown> = [],
+    ) {
+      return client.prepare(sql).all(...params) as Array<T>
+    },
+    transaction(fn) {
+      return fn(driver)
+    },
+  }
+  return driver
+}
+
+/**
+ * Wrap a node-postgres-style client in the shared {@link SqlDriver}.
+ *
+ * @param client - Anything exposing `query(sql, params)` resolving to `{ rows }`.
+ * @returns A `postgres`-dialect driver. `transaction` is a pass-through: the
+ *   callback receives this same driver and no BEGIN/COMMIT is issued.
+ */
+function pgDriver(client: PgClient): SqlDriver {
+  const self: SqlDriver = {
+    dialect: 'postgres',
+    exec: async (sql, params = []) => {
+      await client.query(sql, params)
+    },
+    async query<T extends SqlRow = SqlRow>(
+      sql: string,
+      params: ReadonlyArray<unknown> = [],
+    ) {
+      const { rows } = await client.query(sql, params)
+      return rows as Array<T>
+    },
+    // No dedicated connection is held here, so statements issued by the
+    // callback are not wrapped in a real transaction.
+    transaction: (fn) => fn(self),
+  }
+  return self
+}
+
+/** Options accepted by {@link drizzlePersistence}. */
+export interface DrizzlePersistenceOptions {
+  /** Drizzle db whose `$client` is unwrapped and used to run the SQL. */
+  db: DrizzleDb
+  /** `'postgres'` selects the pg-shaped driver; any other value the sqlite one. */
+  dialect: Dialect
+  /** Persistence mode, forwarded unchanged to `createSqlPersistence`. */
+  mode?: PersistenceMode
+  /** Run migrations on first use (default true). Set false to use drizzle-kit. */
+  migrate?: boolean
+}
+
+/** Report whether `value` is an object or function with a callable `name` member. */
+function hasMethod(value: unknown, name: string): boolean {
+  if (value === null) return false
+  if (typeof value !== 'object' && typeof value !== 'function') return false
+  return typeof (value as Record<string, unknown>)[name] === 'function'
+}
+
+/**
+ * Drizzle-backed {@link ChatPersistence}.
+ *
+ * `db.$client` is typed `unknown`, so its shape is checked before it is
+ * wrapped: the postgres driver calls `client.query(...)`, the sqlite driver
+ * calls `client.prepare(...)`. A db built on a driver with a different surface
+ * is rejected here with a descriptive error, rather than at the first
+ * statement with "x is not a function".
+ *
+ * @param opts - Drizzle db, dialect, and optional mode / migrate settings.
+ * @returns Persistence assembled by `createSqlPersistence` over the client.
+ * @throws TypeError when `db.$client` lacks the method the dialect needs.
+ */
+export function drizzlePersistence(
+  opts: DrizzlePersistenceOptions,
+): ChatPersistence {
+  const client = opts.db.$client
+  const isPostgres = opts.dialect === 'postgres'
+  const method = isPostgres ? 'query' : 'prepare'
+  if (!hasMethod(client, method)) {
+    throw new TypeError(
+      `drizzlePersistence: db.$client has no ${method}() method, ` +
+        `which the "${opts.dialect}" dialect requires`,
+    )
+  }
+  // The casts are backed by the runtime check above.
+  const driver = isPostgres
+    ? pgDriver(client as PgClient)
+    : sqliteDriver(client as SqliteClient)
+  return createSqlPersistence(driver, {
+    mode: opts.mode,
+    migrate: opts.migrate,
+  })
+}
diff --git a/packages/ai-persistence-drizzle/tests/drizzle.test.ts b/packages/ai-persistence-drizzle/tests/drizzle.test.ts
new file mode 100644
index 000000000..709888ce8
--- /dev/null
+++ b/packages/ai-persistence-drizzle/tests/drizzle.test.ts
@@ -0,0 +1,28 @@
+import { describe, expect, it } from 'vitest'
+import { DatabaseSync } from 'node:sqlite'
+import { EventType } from '@tanstack/ai'
+import type { StreamChunk } from '@tanstack/ai'
+import { drizzlePersistence } from '../src/index'
+
+/** Build a TEXT_MESSAGE_CONTENT chunk carrying `delta` for message `m1`. */
+function text(delta: string): StreamChunk {
+  return {
+    type: EventType.TEXT_MESSAGE_CONTENT,
+    messageId: 'm1',
+    delta,
+    timestamp: 1,
+  }
+}
+
+describe('drizzlePersistence (sqlite dialect, $client = node:sqlite)', () => {
+  it('persists via the unwrapped Drizzle client', async () => {
+    // Stand-in for a Drizzle sqlite db: only `$client` is consulted, and
+    // node:sqlite's DatabaseSync offers the prepare().run/all shape needed.
+    const sqlite = new DatabaseSync(':memory:')
+    const persistence = drizzlePersistence({
+      db: { $client: sqlite },
+      dialect: 'sqlite',
+    })
+    const runs = persistence.runs!
+    const events = persistence.events!
+
+    await runs.createOrResume({ runId: 'r1', threadId: 't1', startedAt: 1 })
+    await events.append('r1', 1, text('a'))
+    await events.append('r1', 2, text('b'))
+
+    const run = await runs.get('r1')
+    expect(run?.threadId).toBe('t1')
+    const latest = await events.latestSeq('r1')
+    expect(latest).toBe(2)
+  })
+})
diff --git a/packages/ai-persistence-drizzle/tsconfig.json b/packages/ai-persistence-drizzle/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-persistence-drizzle/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-persistence-drizzle/vite.config.ts b/packages/ai-persistence-drizzle/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-persistence-drizzle/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+// Paths left out of the coverage report.
+const coverageExclude = [
+  'node_modules/',
+  'dist/',
+  'tests/',
+  '**/*.test.ts',
+  '**/*.config.ts',
+  '**/types.ts',
+]
+
+// Vitest settings: project named after the package, node environment,
+// globals enabled, watch mode off.
+const config = defineConfig({
+  test: {
+    name: packageJson.name,
+    dir: './',
+    watch: false,
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: coverageExclude,
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+
+// Library build from the shared TanStack preset: single entry, `cjs: false`.
+const libraryConfig = tanstackViteConfig({
+  entry: ['./src/index.ts'],
+  srcDir: './src',
+  cjs: false,
+})
+
+export default mergeConfig(config, libraryConfig)
diff --git a/packages/ai-persistence-postgres/package.json b/packages/ai-persistence-postgres/package.json
new file mode 100644
index 000000000..4f4704d0b
--- /dev/null
+++ b/packages/ai-persistence-postgres/package.json
@@ -0,0 +1,61 @@
+{
+  "name": "@tanstack/ai-persistence-postgres",
+  "version": "0.1.0",
+  "description": "Postgres backend for TanStack AI persistence — durable runs, messages, event log, approvals, and artifacts over node-postgres (pg) or a bring-your-own pool.",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-persistence-postgres"
+  },
+  "keywords": [
+    "ai",
+    "tanstack",
+    "persistence",
+    "postgres",
+    "pg"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "peerDependencies": {
+    "@tanstack/ai": "workspace:^",
+    "@tanstack/ai-persistence": "workspace:^",
+    "@tanstack/ai-persistence-sql": "workspace:^",
+    "pg": "^8.13.0"
+  },
+  "peerDependenciesMeta": {
+    "pg": {
+      "optional": true
+    }
+  },
+  "devDependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-persistence": "workspace:*",
+    "@tanstack/ai-persistence-sql": "workspace:*",
+    "@types/pg": "^8.11.10",
+    "@vitest/coverage-v8": "4.0.14",
+    "pg": "^8.13.0"
+  }
+}
diff --git a/packages/ai-persistence-postgres/src/index.ts b/packages/ai-persistence-postgres/src/index.ts
new file mode 100644
index 000000000..fb9cadb60
--- /dev/null
+++ b/packages/ai-persistence-postgres/src/index.ts
@@ -0,0 +1,130 @@
+/**
+ * Postgres backend. Wraps a `pg`-style pool in the shared `SqlDriver` and
+ * assembles a `ChatPersistence` via `@tanstack/ai-persistence-sql`.
+ *
+ * - convenience: `postgresPersistence({ connectionString })` lazily creates a
+ *   `pg.Pool` (the `pg` package is an optional peer, imported on first use).
+ * - BYO: pass `{ client }` — any pool exposing `query(sql, params) => { rows }`
+ *   and `connect() => client` (node-postgres `Pool`).
+ */
+import { createSqlPersistence } from '@tanstack/ai-persistence-sql'
+import type { SqlDriver, SqlRow } from '@tanstack/ai-persistence-sql'
+import type { ChatPersistence, PersistenceMode } from '@tanstack/ai-persistence'
+
+/** Minimal node-postgres surface the driver relies on. */
+export interface PgQueryable {
+  /** Run `sql` with optional positional `params`; the driver reads only `rows`. */
+  query: (
+    sql: string,
+    params?: ReadonlyArray<unknown>,
+  ) => Promise<{ rows: Array<Record<string, unknown>> }>
+}
+/** Pool surface: direct queries plus `connect()` for a dedicated client. */
+export interface PgPool extends PgQueryable {
+  /** Check out a client; `makeDriver` runs BEGIN/COMMIT/ROLLBACK on it. */
+  connect: () => Promise<PgPoolClient>
+}
+/** A checked-out connection that is handed back with `release()`. */
+export interface PgPoolClient extends PgQueryable {
+  /** Return the client; `makeDriver` calls this in a `finally` after a transaction. */
+  release: () => void
+}
+
+/** Options for {@link createPostgresDriver}. */
+export interface PostgresDriverOptions {
+  /** Passed to `new Pool({ connectionString })` when no `client` is given. */
+  connectionString?: string
+  /** Bring-your-own pool (node-postgres `Pool`). When set, no `pg` Pool is created. */
+  client?: PgPool
+}
+
+/**
+ * Build a driver over a queryable. When `pool` is provided, `transaction`
+ * acquires a dedicated connection for BEGIN/COMMIT; otherwise (inside a
+ * transaction's bound client) it runs the callback directly.
+ *
+ * @param queryable - Target of `exec` / `query` (a pool or a bound client).
+ * @param pool - Pool to check a dedicated client out of for transactions, or
+ *   `null` when `queryable` is already a transaction-bound client.
+ * @returns A `postgres`-dialect {@link SqlDriver}. A failing transaction
+ *   rejects with the error that caused the failure, even when the follow-up
+ *   ROLLBACK fails as well.
+ */
+function makeDriver(queryable: PgQueryable, pool: PgPool | null): SqlDriver {
+  const driver: SqlDriver = {
+    dialect: 'postgres',
+    async exec(sql, params = []) {
+      await queryable.query(sql, params)
+    },
+    async query<T extends SqlRow = SqlRow>(
+      sql: string,
+      params: ReadonlyArray<unknown> = [],
+    ) {
+      const result = await queryable.query(sql, params)
+      return result.rows as Array<T>
+    },
+    async transaction(fn) {
+      // Already on a transaction-bound client: join the open transaction.
+      if (!pool) return fn(driver)
+      const client = await pool.connect()
+      try {
+        await client.query('BEGIN')
+        // The callback gets a driver bound to this one connection.
+        const result = await fn(makeDriver(client, null))
+        await client.query('COMMIT')
+        return result
+      } catch (err) {
+        // Best-effort rollback: on a broken connection ROLLBACK rejects too,
+        // and that secondary error must not replace the original `err`.
+        try {
+          await client.query('ROLLBACK')
+        } catch {
+          // Ignored on purpose; the original failure is rethrown below.
+        }
+        throw err
+      } finally {
+        client.release()
+      }
+    },
+  }
+  return driver
+}
+
+/**
+ * Build a {@link SqlDriver} backed by Postgres. The pool is resolved on the
+ * first call: `opts.client` when supplied, otherwise a `pg` Pool created from
+ * `opts.connectionString` (the `pg` module is imported at that point and the
+ * resulting promise is reused afterwards).
+ *
+ * @param opts - Bring-your-own pool and/or connection string.
+ * @returns A `postgres`-dialect driver delegating every call to `makeDriver`.
+ */
+export function createPostgresDriver(opts: PostgresDriverOptions): SqlDriver {
+  let lazyPool: Promise<PgPool> | undefined
+
+  // Import `pg` and expose a new Pool through the minimal PgPool surface.
+  // The params are cast because pg's typings take a mutable array.
+  async function openPool(): Promise<PgPool> {
+    const { Pool } = await import('pg')
+    const pgPool = new Pool({ connectionString: opts.connectionString })
+    return {
+      query: (sql, params) => pgPool.query(sql, params as Array<unknown>),
+      connect: async () => {
+        const conn = await pgPool.connect()
+        return {
+          query: (sql, params) => conn.query(sql, params as Array<unknown>),
+          release: () => conn.release(),
+        }
+      },
+    }
+  }
+
+  function resolvePool(): Promise<PgPool> {
+    if (opts.client) return Promise.resolve(opts.client)
+    lazyPool ??= openPool()
+    return lazyPool
+  }
+
+  // A pool-aware driver is built per call, once the pool is available.
+  const poolDriver = async (): Promise<SqlDriver> => {
+    const pool = await resolvePool()
+    return makeDriver(pool, pool)
+  }
+
+  return {
+    dialect: 'postgres',
+    async exec(sql, params) {
+      const target = await poolDriver()
+      await target.exec(sql, params)
+    },
+    async query(sql, params) {
+      const target = await poolDriver()
+      return target.query(sql, params)
+    },
+    async transaction(fn) {
+      const target = await poolDriver()
+      return target.transaction(fn)
+    },
+  }
+}
+
+/** Options for {@link postgresPersistence}: driver options plus store settings. */
+export interface PostgresPersistenceOptions extends PostgresDriverOptions {
+  /** Persistence mode, forwarded unchanged to `createSqlPersistence`. */
+  mode?: PersistenceMode
+  /** Run migrations on first use (default true). */
+  migrate?: boolean
+}
+
+/**
+ * Assemble a Postgres-backed {@link ChatPersistence}.
+ *
+ * @param opts - Pool or connection string for the driver, plus the `mode` and
+ *   `migrate` settings handed to `createSqlPersistence`.
+ * @returns Persistence whose SQL runs through {@link createPostgresDriver}.
+ */
+export function postgresPersistence(
+  opts: PostgresPersistenceOptions,
+): ChatPersistence {
+  const { connectionString, client, mode, migrate } = opts
+  const driver = createPostgresDriver({ connectionString, client })
+  return createSqlPersistence(driver, { mode, migrate })
+}
diff --git a/packages/ai-persistence-postgres/tests/driver.test.ts b/packages/ai-persistence-postgres/tests/driver.test.ts
new file mode 100644
index 000000000..2ab9d803b
--- /dev/null
+++ b/packages/ai-persistence-postgres/tests/driver.test.ts
@@ -0,0 +1,79 @@
+import { describe, expect, it } from 'vitest'
+import { createPostgresDriver } from '../src/index'
+import type { PgPool, PgPoolClient } from '../src/index'
+
+/**
+ * Fake pg pool for driver tests. The pool and its single client share one
+ * call log; statements starting with `SELECT` resolve to the rows set through
+ * `setRows`, everything else to no rows. `wasReleased` reports whether the
+ * client's `release()` has been called.
+ */
+function fakePool() {
+  const calls: Array<{ sql: string; params?: ReadonlyArray<unknown> }> = []
+  let cannedRows: Array<Record<string, unknown>> = []
+  let clientReleased = false
+
+  // Log the statement, then answer it.
+  const answer: PgPool['query'] = (sql, params) => {
+    calls.push({ sql, params })
+    const rows = sql.startsWith('SELECT') ? cannedRows : []
+    return Promise.resolve({ rows })
+  }
+
+  const client: PgPoolClient = {
+    query: answer,
+    release() {
+      clientReleased = true
+    },
+  }
+  const pool: PgPool = {
+    query: answer,
+    connect: () => Promise.resolve(client),
+  }
+
+  return {
+    pool,
+    calls,
+    setRows: (rows: Array<Record<string, unknown>>) => {
+      cannedRows = rows
+    },
+    wasReleased: () => clientReleased,
+  }
+}
+
+describe('createPostgresDriver (BYO pool)', () => {
+  it('forwards sql + params and returns rows', async () => {
+    const fake = fakePool()
+    fake.setRows([{ run_id: 'r1' }])
+    const driver = createPostgresDriver({ client: fake.pool })
+
+    const insertSql = 'INSERT INTO runs (run_id) VALUES ($1)'
+    await driver.exec(insertSql, ['r1'])
+    const selectSql = 'SELECT * FROM runs WHERE run_id = $1'
+    const rows = await driver.query(selectSql, ['r1'])
+
+    expect(rows).toEqual([{ run_id: 'r1' }])
+    // The INSERT was the first statement to reach the pool.
+    const [firstCall] = fake.calls
+    expect(firstCall).toEqual({ sql: insertSql, params: ['r1'] })
+    expect(driver.dialect).toBe('postgres')
+  })
+
+  it('wraps a transaction in BEGIN/COMMIT on a dedicated connection', async () => {
+    const fake = fakePool()
+    const driver = createPostgresDriver({ client: fake.pool })
+
+    await driver.transaction((tx) =>
+      tx.exec('UPDATE runs SET status = $1', ['done']),
+    )
+
+    const statements = fake.calls.map(({ sql }) => sql)
+    expect(statements[0]).toBe('BEGIN')
+    expect(statements).toContain('UPDATE runs SET status = $1')
+    expect(statements[statements.length - 1]).toBe('COMMIT')
+    expect(fake.wasReleased()).toBe(true)
+  })
+
+  it('rolls back and rethrows on error', async () => {
+    const fake = fakePool()
+    const driver = createPostgresDriver({ client: fake.pool })
+
+    const failing = driver.transaction(() => Promise.reject(new Error('boom')))
+    await expect(failing).rejects.toThrow('boom')
+
+    const statements = fake.calls.map(({ sql }) => sql)
+    expect(statements).toContain('ROLLBACK')
+    expect(fake.wasReleased()).toBe(true)
+  })
+})
diff --git a/packages/ai-persistence-postgres/tsconfig.json b/packages/ai-persistence-postgres/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-persistence-postgres/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-persistence-postgres/vite.config.ts b/packages/ai-persistence-postgres/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-persistence-postgres/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+// Paths left out of the coverage report.
+const coverageExclude = [
+  'node_modules/',
+  'dist/',
+  'tests/',
+  '**/*.test.ts',
+  '**/*.config.ts',
+  '**/types.ts',
+]
+
+// Vitest settings: project named after the package, node environment,
+// globals enabled, watch mode off.
+const config = defineConfig({
+  test: {
+    name: packageJson.name,
+    dir: './',
+    watch: false,
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: coverageExclude,
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+
+// Library build from the shared TanStack preset: single entry, `cjs: false`.
+const libraryConfig = tanstackViteConfig({
+  entry: ['./src/index.ts'],
+  srcDir: './src',
+  cjs: false,
+})
+
+export default mergeConfig(config, libraryConfig)
diff --git a/packages/ai-persistence-prisma/package.json b/packages/ai-persistence-prisma/package.json
new file mode 100644
index 000000000..3ec98f5fe
--- /dev/null
+++ b/packages/ai-persistence-prisma/package.json
@@ -0,0 +1,51 @@
+{
+  "name": "@tanstack/ai-persistence-prisma",
+  "version": "0.1.0",
+  "description": "Prisma backend for TanStack AI persistence — bring your own PrismaClient; persists via $queryRawUnsafe/$executeRawUnsafe (sqlite or postgres dialect).",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-persistence-prisma"
+  },
+  "keywords": [
+    "ai",
+    "tanstack",
+    "persistence"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "peerDependencies": {
+    "@tanstack/ai": "workspace:^",
+    "@tanstack/ai-persistence": "workspace:^",
+    "@tanstack/ai-persistence-sql": "workspace:^"
+  },
+  "devDependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-persistence": "workspace:*",
+    "@tanstack/ai-persistence-sql": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-persistence-prisma/src/index.ts b/packages/ai-persistence-prisma/src/index.ts
new file mode 100644
index 000000000..89d3ea35b
--- /dev/null
+++ b/packages/ai-persistence-prisma/src/index.ts
@@ -0,0 +1,65 @@
+/**
+ * Prisma backend (bring-your-own). Persists over a `PrismaClient`'s raw SQL
+ * escape hatches — `$queryRawUnsafe(sql, ...params)` for reads and
+ * `$executeRawUnsafe(sql, ...params)` for writes — which take a positional-
+ * parameter SQL string, exactly matching the shared `SqlDriver` contract.
+ *
+ * The tables are the same as the raw SQL backend; add the documented Prisma
+ * models to your `schema.prisma` and run `prisma migrate` (use `migrate: false`),
+ * or let the backend auto-migrate the tables directly.
+ */
+import { createSqlPersistence } from '@tanstack/ai-persistence-sql'
+import type { Dialect, SqlDriver, SqlRow } from '@tanstack/ai-persistence-sql'
+import type { ChatPersistence, PersistenceMode } from '@tanstack/ai-persistence'
+
+/** The PrismaClient surface this adapter relies on. */
+export interface PrismaRawClient {
+  /** Raw read with positional parameters; the driver requests an array of rows. */
+  $queryRawUnsafe: <T = unknown>(
+    sql: string,
+    ...params: Array<unknown>
+  ) => Promise<T>
+  /** Raw write with positional parameters; the driver ignores the resolved number. */
+  $executeRawUnsafe: (sql: string, ...params: Array<unknown>) => Promise<number>
+  /** Run `fn` with a transaction-scoped client; the driver wraps that client in a nested driver. */
+  $transaction: <T>(fn: (tx: PrismaRawClient) => Promise<T>) => Promise<T>
+}
+
+/**
+ * Build a {@link SqlDriver} over a PrismaClient.
+ *
+ * @param prisma - Client (or transaction-scoped client) used for raw SQL.
+ * @param dialect - Dialect reported by this driver and by nested drivers.
+ * @returns Driver mapping `exec` to `$executeRawUnsafe`, `query` to
+ *   `$queryRawUnsafe` and `transaction` to `$transaction`. Calling
+ *   `transaction` on a driver that is already transaction-scoped runs the
+ *   callback on that same driver.
+ */
+export function createPrismaDriver(
+  prisma: PrismaRawClient,
+  dialect: Dialect,
+): SqlDriver {
+  const driver: SqlDriver = {
+    dialect,
+    async exec(sql, params = []) {
+      await prisma.$executeRawUnsafe(sql, ...params)
+    },
+    async query<T extends SqlRow = SqlRow>(
+      sql: string,
+      params: ReadonlyArray<unknown> = [],
+    ) {
+      return prisma.$queryRawUnsafe<Array<T>>(sql, ...params)
+    },
+    async transaction(fn) {
+      // The client Prisma hands to an interactive-transaction callback does
+      // not expose `$transaction`, so a driver built over it cannot open
+      // another one. Run the callback on the current driver instead: its
+      // statements already belong to the enclosing transaction.
+      const begin: unknown = prisma.$transaction
+      if (typeof begin !== 'function') return fn(driver)
+      return prisma.$transaction((tx) => fn(createPrismaDriver(tx, dialect)))
+    },
+  }
+  return driver
+}
+
+/** Options accepted by {@link prismaPersistence}. */
+export interface PrismaPersistenceOptions {
+  /** Client whose raw-SQL methods carry every statement. */
+  prisma: PrismaRawClient
+  /** Dialect reported by the driver built over `prisma`. */
+  dialect: Dialect
+  /** Persistence mode, forwarded unchanged to `createSqlPersistence`. */
+  mode?: PersistenceMode
+  /** Run migrations on first use (default true). Set false to use prisma migrate. */
+  migrate?: boolean
+}
+
+/**
+ * Assemble a Prisma-backed {@link ChatPersistence}.
+ *
+ * @param opts - Prisma client and dialect for the driver, plus the `mode` and
+ *   `migrate` settings handed to `createSqlPersistence`.
+ * @returns Persistence whose SQL runs through {@link createPrismaDriver}.
+ */
+export function prismaPersistence(
+  opts: PrismaPersistenceOptions,
+): ChatPersistence {
+  const { prisma, dialect, mode, migrate } = opts
+  return createSqlPersistence(createPrismaDriver(prisma, dialect), {
+    mode,
+    migrate,
+  })
+}
diff --git a/packages/ai-persistence-prisma/tests/prisma.test.ts b/packages/ai-persistence-prisma/tests/prisma.test.ts
new file mode 100644
index 000000000..f550cf033
--- /dev/null
+++ b/packages/ai-persistence-prisma/tests/prisma.test.ts
@@ -0,0 +1,43 @@
+import { describe, expect, it } from 'vitest'
+import { DatabaseSync } from 'node:sqlite'
+import { EventType } from '@tanstack/ai'
+import type { StreamChunk } from '@tanstack/ai'
+import { prismaPersistence } from '../src/index'
+import type { PrismaRawClient } from '../src/index'
+
+/**
+ * In-memory PrismaRawClient double on node:sqlite. `$queryRawUnsafe` returns
+ * the statement's rows, `$executeRawUnsafe` runs the statement and always
+ * resolves 0, and `$transaction` simply invokes the callback with this same
+ * client (no BEGIN/COMMIT).
+ */
+function fakePrisma(): PrismaRawClient {
+  const sqlite = new DatabaseSync(':memory:')
+  const self: PrismaRawClient = {
+    $queryRawUnsafe<T>(sql: string, ...params: Array<unknown>) {
+      const rows = sqlite.prepare(sql).all(...(params as Array<never>))
+      return Promise.resolve(rows as T)
+    },
+    $executeRawUnsafe(sql: string, ...params: Array<unknown>) {
+      sqlite.prepare(sql).run(...(params as Array<never>))
+      return Promise.resolve(0)
+    },
+    $transaction(fn) {
+      return fn(self)
+    },
+  }
+  return self
+}
+
+/** Build a TEXT_MESSAGE_CONTENT chunk carrying `delta` for message `m1`. */
+function text(delta: string): StreamChunk {
+  return {
+    type: EventType.TEXT_MESSAGE_CONTENT,
+    messageId: 'm1',
+    delta,
+    timestamp: 1,
+  }
+}
+
+describe('prismaPersistence (sqlite dialect, raw escape hatches)', () => {
+  // Writes one run and one text event, then reads both back.
+  it('persists via $queryRawUnsafe / $executeRawUnsafe', async () => {
+    const persistence = prismaPersistence({
+      prisma: fakePrisma(),
+      dialect: 'sqlite',
+    })
+    const runs = persistence.runs!
+    const events = persistence.events!
+
+    await runs.createOrResume({ runId: 'r1', threadId: 't1', startedAt: 1 })
+    await events.append('r1', 1, text('a'))
+
+    const run = await runs.get('r1')
+    expect(run?.status).toBe('running')
+
+    const seen: Array<string> = []
+    for await (const entry of events.read('r1')) {
+      if (entry.event.type !== 'TEXT_MESSAGE_CONTENT') continue
+      seen.push(entry.event.delta)
+    }
+    expect(seen).toEqual(['a'])
+  })
+})
diff --git a/packages/ai-persistence-prisma/tsconfig.json b/packages/ai-persistence-prisma/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-persistence-prisma/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-persistence-prisma/vite.config.ts b/packages/ai-persistence-prisma/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-persistence-prisma/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+// Paths left out of the v8 coverage report.
+const coverageExclude = [
+  'node_modules/',
+  'dist/',
+  'tests/',
+  '**/*.test.ts',
+  '**/*.config.ts',
+  '**/types.ts',
+]
+
+// Vitest settings for this package: Node environment, specs under tests/.
+const config = defineConfig({
+  test: {
+    name: packageJson.name,
+    dir: './',
+    watch: false,
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: coverageExclude,
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+
+// Library build options (CJS output disabled), merged with the test config.
+const buildConfig = tanstackViteConfig({
+  entry: ['./src/index.ts'],
+  srcDir: './src',
+  cjs: false,
+})
+
+export default mergeConfig(config, buildConfig)
diff --git a/packages/ai-persistence-sql/package.json b/packages/ai-persistence-sql/package.json
new file mode 100644
index 000000000..48cb241ec
--- /dev/null
+++ b/packages/ai-persistence-sql/package.json
@@ -0,0 +1,55 @@
+{
+  "name": "@tanstack/ai-persistence-sql",
+  "version": "0.1.0",
+  "description": "Shared SQL store core for TanStack AI persistence — one SQL implementation of the message/run/event/approval/artifact stores behind a minimal SqlDriver (sqlite | postgres dialect), with versioned migrations. Consumed by the sqlite/postgres/cloudflare/drizzle/prisma backends.",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-persistence-sql"
+  },
+  "keywords": [
+    "ai",
+    "ai-sdk",
+    "typescript",
+    "tanstack",
+    "persistence",
+    "sql",
+    "sqlite",
+    "postgres",
+    "migrations"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "peerDependencies": {
+    "@tanstack/ai": "workspace:^",
+    "@tanstack/ai-persistence": "workspace:^"
+  },
+  "devDependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-persistence": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-persistence-sql/src/driver.ts b/packages/ai-persistence-sql/src/driver.ts
new file mode 100644
index 000000000..3df118124
--- /dev/null
+++ b/packages/ai-persistence-sql/src/driver.ts
@@ -0,0 +1,63 @@
+/**
+ * Minimal SQL driver contract the shared stores are written against. Each
+ * backend (`-sqlite`, `-postgres`, `-cloudflare`, `-drizzle`, `-prisma`)
+ * implements this over its client; the stores never see a concrete driver.
+ */
+
+/** SQL dialects the shared stores can target. */
+export type Dialect = 'sqlite' | 'postgres'
+
+/** A result row: string keys mapped to values that are not yet narrowed. */
+export type SqlRow = Record<string, unknown>
+
+/**
+ * The operations the shared stores need from a database client: statement
+ * execution, row queries and transactions, plus the dialect they run against.
+ */
+export interface SqlDriver {
+  /** Dialect of the underlying database; the helpers below branch on it. */
+  readonly dialect: Dialect
+  /** Run a statement that returns no rows (DDL, INSERT/UPDATE/DELETE). */
+  exec: (sql: string, params?: ReadonlyArray<unknown>) => Promise<void>
+  /** Run a query and return all rows. */
+  query: <T extends SqlRow = SqlRow>(
+    sql: string,
+    params?: ReadonlyArray<unknown>,
+  ) => Promise<Array<T>>
+  /** Run `fn` inside a transaction, passing a driver bound to the transaction. */
+  transaction: <T>(fn: (tx: SqlDriver) => Promise<T>) => Promise<T>
+}
+
+/**
+ * Returns the positional placeholder for `dialect`. Postgres numbers its
+ * placeholders (`$1`, `$2`, …), so `index` is 1-based; any other dialect gets
+ * a bare `?` and `index` is ignored.
+ */
+export function param(dialect: Dialect, index: number): string {
+  if (dialect === 'postgres') {
+    return '$' + String(index)
+  }
+  return '?'
+}
+
+/**
+ * Joins `count` consecutive placeholders with `, `, numbering them from
+ * `start` (1 by default) — e.g. `$1, $2, $3` for Postgres or `?, ?, ?` for
+ * SQLite.
+ */
+export function params(dialect: Dialect, count: number, start = 1): string {
+  const placeholders = Array.from({ length: count }).map((_unused, offset) =>
+    param(dialect, start + offset),
+  )
+  return placeholders.join(', ')
+}
+
+/**
+ * Column definition for an auto-incrementing integer primary key: an identity
+ * column on Postgres, `INTEGER PRIMARY KEY AUTOINCREMENT` otherwise.
+ */
+export function autoIncrementPk(dialect: Dialect): string {
+  if (dialect === 'postgres') {
+    return 'BIGINT GENERATED ALWAYS AS IDENTITY PRIMARY KEY'
+  }
+  return 'INTEGER PRIMARY KEY AUTOINCREMENT'
+}
+
+/** Column type for JSON values: `JSONB` on Postgres, `TEXT` otherwise. */
+export function jsonColumn(dialect: Dialect): string {
+  switch (dialect) {
+    case 'postgres':
+      return 'JSONB'
+    default:
+      return 'TEXT'
+  }
+}
+
+/** Column type for binary data: `BYTEA` on Postgres, `BLOB` otherwise. */
+export function blobColumn(dialect: Dialect): string {
+  const isPostgres = dialect === 'postgres'
+  if (isPostgres) return 'BYTEA'
+  return 'BLOB'
+}
+
+/**
+ * Column type wide enough for 64-bit integers. Postgres needs `BIGINT` because
+ * epoch-millisecond timestamps do not fit its `INTEGER` (INT4, max ~2.1e9);
+ * SQLite's `INTEGER` is already 64-bit, so it is used as-is.
+ */
+export function bigIntColumn(dialect: Dialect): string {
+  switch (dialect) {
+    case 'postgres':
+      return 'BIGINT'
+    default:
+      return 'INTEGER'
+  }
+}
diff --git a/packages/ai-persistence-sql/src/index.ts b/packages/ai-persistence-sql/src/index.ts
new file mode 100644
index 000000000..ea28b183f
--- /dev/null
+++ b/packages/ai-persistence-sql/src/index.ts
@@ -0,0 +1,26 @@
+// SQL driver contract + dialect helpers (the seam each backend implements).
+export {
+  param,
+  params,
+  autoIncrementPk,
+  jsonColumn,
+  blobColumn,
+  bigIntColumn,
+} from './driver'
+export type { Dialect, SqlRow, SqlDriver } from './driver'
+
+// Schema migrations + raw DDL
+export { migrate, ddl } from './migrations'
+
+// Shared SQL stores (one impl per store, dialect-parameterized)
+export {
+  createMessageStore,
+  createRunStore,
+  createEventLog,
+  createApprovalStore,
+  createArtifactStore,
+} from './stores'
+
+// Assemble a ChatPersistence from a driver
+export { createSqlPersistence } from './sql-persistence'
+export type { SqlPersistenceOptions } from './sql-persistence'
diff --git a/packages/ai-persistence-sql/src/migrations.ts b/packages/ai-persistence-sql/src/migrations.ts
new file mode 100644
index 000000000..58feead04
--- /dev/null
+++ b/packages/ai-persistence-sql/src/migrations.ts
@@ -0,0 +1,105 @@
+/**
+ * Versioned schema migrations.
+ *
+ * Raw drivers run these on first use (opt-out at the backend level). Each
+ * migration is applied at most once, tracked in `_tanstack_ai_migrations`.
+ * Idempotent: re-running `migrate` is a no-op once all versions are applied.
+ *
+ * JSON is stored as TEXT in BOTH dialects (the stores stringify/parse) so reads
+ * don't depend on a driver's JSONB return shape; bytes are stored base64-encoded
+ * in a TEXT column for the same portability reason. Epoch-ms timestamps use
+ * {@link bigIntColumn}.
+ */
+import { bigIntColumn, param } from './driver'
+import type { Dialect, SqlDriver } from './driver'
+
+/** One schema version and the statements that create it. */
+interface Migration {
+  /** Version number recorded in `_tanstack_ai_migrations` once applied. */
+  version: number
+  /** Returns the statements for this version, rendered for `dialect`. */
+  up: (dialect: Dialect) => Array<string>
+}
+
+/**
+ * DDL for schema v1: one `CREATE TABLE IF NOT EXISTS` statement per table
+ * (`message_threads`, `runs`, `run_events`, `approvals`, `artifacts`). The
+ * `*_at` timestamp columns use the dialect's 64-bit integer type.
+ */
+function v1(dialect: Dialect): Array<string> {
+  // Column type shared by every `*_at` timestamp column below.
+  const ts = bigIntColumn(dialect)
+  return [
+    // One row per thread, keyed by thread_id.
+    `CREATE TABLE IF NOT EXISTS message_threads (
+      thread_id TEXT PRIMARY KEY,
+      messages TEXT NOT NULL
+    )`,
+    // Keyed by run_id; finished_at, error and usage are nullable.
+    `CREATE TABLE IF NOT EXISTS runs (
+      run_id TEXT PRIMARY KEY,
+      thread_id TEXT NOT NULL,
+      status TEXT NOT NULL,
+      started_at ${ts} NOT NULL,
+      finished_at ${ts},
+      error TEXT,
+      usage TEXT
+    )`,
+    // Keyed by (run_id, seq).
+    `CREATE TABLE IF NOT EXISTS run_events (
+      run_id TEXT NOT NULL,
+      seq INTEGER NOT NULL,
+      event TEXT NOT NULL,
+      PRIMARY KEY (run_id, seq)
+    )`,
+    // Keyed by approval_id; resolved_at is nullable.
+    `CREATE TABLE IF NOT EXISTS approvals (
+      approval_id TEXT PRIMARY KEY,
+      run_id TEXT NOT NULL,
+      thread_id TEXT NOT NULL,
+      status TEXT NOT NULL,
+      requested_at ${ts} NOT NULL,
+      resolved_at ${ts},
+      payload TEXT NOT NULL
+    )`,
+    // Keyed by artifact_id; bytes_b64 and external_url are both nullable.
+    `CREATE TABLE IF NOT EXISTS artifacts (
+      artifact_id TEXT PRIMARY KEY,
+      run_id TEXT NOT NULL,
+      thread_id TEXT NOT NULL,
+      name TEXT NOT NULL,
+      mime_type TEXT NOT NULL,
+      size INTEGER NOT NULL,
+      bytes_b64 TEXT,
+      external_url TEXT,
+      created_at ${ts} NOT NULL
+    )`,
+  ]
+}
+
+/** Every known migration, in the order it is applied. */
+const MIGRATIONS: ReadonlyArray<Migration> = [{ version: 1, up: v1 }]
+
+/**
+ * Collects the raw DDL of every migration, in order, rendered for `dialect` —
+ * for users who manage the schema themselves.
+ */
+export function ddl(dialect: Dialect): Array<string> {
+  const statements: Array<string> = []
+  for (const migration of MIGRATIONS) {
+    statements.push(...migration.up(dialect))
+  }
+  return statements
+}
+
+/**
+ * Brings the schema up to date by applying each migration that is not yet
+ * recorded in `_tanstack_ai_migrations`. A migration's statements and its
+ * bookkeeping row go through a single `driver.transaction` call, so calling
+ * this again once every version is recorded applies nothing.
+ */
+export async function migrate(driver: SqlDriver): Promise<void> {
+  await driver.exec(
+    `CREATE TABLE IF NOT EXISTS _tanstack_ai_migrations (
+      version INTEGER PRIMARY KEY,
+      applied_at ${bigIntColumn(driver.dialect)} NOT NULL
+    )`,
+  )
+
+  const recorded = await driver.query<{ version: number }>(
+    'SELECT version FROM _tanstack_ai_migrations',
+  )
+  // Versions are normalized with Number() before they are compared.
+  const applied = new Set(recorded.map((row) => Number(row.version)))
+  const pending = MIGRATIONS.filter(({ version }) => !applied.has(version))
+
+  for (const migration of pending) {
+    await driver.transaction(async (tx) => {
+      const versionSlot = param(tx.dialect, 1)
+      const appliedAtSlot = param(tx.dialect, 2)
+      for (const statement of migration.up(tx.dialect)) {
+        await tx.exec(statement)
+      }
+      await tx.exec(
+        `INSERT INTO _tanstack_ai_migrations (version, applied_at) VALUES (${versionSlot}, ${appliedAtSlot})`,
+        [migration.version, Date.now()],
+      )
+    })
+  }
+}
diff --git a/packages/ai-persistence-sql/src/sql-persistence.ts b/packages/ai-persistence-sql/src/sql-persistence.ts
new file mode 100644
index 000000000..c5d3c662b
--- /dev/null
+++ b/packages/ai-persistence-sql/src/sql-persistence.ts
@@ -0,0 +1,68 @@
+/**
+ * Assemble a {@link ChatPersistence} backed by SQL stores over a {@link SqlDriver}.
+ *
+ * By default the schema is migrated on first use (`migrate: true`); pass
+ * `migrate: false` to manage the schema yourself (call {@link migrate}/{@link ddl}).
+ *
+ * Migration runs lazily and exactly once, gated at the DRIVER level: the stores
+ * are built on a wrapper whose every `exec`/`query`/`transaction` first awaits
+ * the (idempotent, memoized) migration. This is why it composes correctly with
+ * `EventLog.read`, which returns an async iterable synchronously — the gate fires
+ * when the generator calls `query`, not when `read` is invoked. Migration itself
+ * runs on the RAW driver to avoid recursing through the gate.
+ */
+import { migrate as runMigrations } from './migrations'
+import {
+  createApprovalStore,
+  createArtifactStore,
+  createEventLog,
+  createMessageStore,
+  createRunStore,
+} from './stores'
+import type { SqlDriver } from './driver'
+import type { ChatPersistence, PersistenceMode } from '@tanstack/ai-persistence'
+
+/** Options accepted by {@link createSqlPersistence}. */
+export interface SqlPersistenceOptions {
+  /** Persistence mode reported on the returned object (default `'agent'`). */
+  mode?: PersistenceMode
+  /** Run schema migrations on first use (default true). Set false to self-manage. */
+  migrate?: boolean
+}
+
+/**
+ * Builds a {@link ChatPersistence} whose stores all run on a gated view of
+ * `driver`: every `exec`/`query`/`transaction` first awaits the lazy schema
+ * migration, then delegates to the raw driver.
+ *
+ * @param driver - Raw driver; migrations run directly on it.
+ * @param opts - `mode` (default `'agent'`) and `migrate` (default `true`;
+ *   `false` skips the migration gate entirely).
+ * @returns Message, run, event, approval and artifact stores bound to the gate.
+ */
+export function createSqlPersistence(
+  driver: SqlDriver,
+  opts?: SqlPersistenceOptions,
+): ChatPersistence {
+  const shouldMigrate = opts?.migrate ?? true
+
+  let migrated: Promise<void> | undefined
+  const ensureSchema = (): Promise<void> => {
+    if (!shouldMigrate) return Promise.resolve()
+    if (migrated) return migrated
+    // Memoize the in-flight/successful migration, but forget a failed attempt:
+    // caching the rejection would make every later call fail with the same
+    // stale error. The migration is idempotent, so the next call can retry.
+    // Runs on the RAW driver — no recursion through the gate.
+    const attempt: Promise<void> = runMigrations(driver).catch(
+      (error: unknown) => {
+        migrated = undefined
+        throw error
+      },
+    )
+    migrated = attempt
+    return attempt
+  }
+
+  // Same dialect as the raw driver; each operation waits for the schema first.
+  const gated: SqlDriver = {
+    dialect: driver.dialect,
+    async exec(sql, params) {
+      await ensureSchema()
+      return driver.exec(sql, params)
+    },
+    async query(sql, params) {
+      await ensureSchema()
+      return driver.query(sql, params)
+    },
+    async transaction(fn) {
+      await ensureSchema()
+      return driver.transaction(fn)
+    },
+  }
+
+  return {
+    mode: opts?.mode ?? 'agent',
+    messages: createMessageStore(gated),
+    runs: createRunStore(gated),
+    events: createEventLog(gated),
+    approvals: createApprovalStore(gated),
+    artifacts: createArtifactStore(gated),
+  }
+}
diff --git a/packages/ai-persistence-sql/src/stores.ts b/packages/ai-persistence-sql/src/stores.ts
new file mode 100644
index 000000000..9ed420931
--- /dev/null
+++ b/packages/ai-persistence-sql/src/stores.ts
@@ -0,0 +1,297 @@
+/**
+ * One SQL implementation of every persistence store, written against the
+ * minimal {@link SqlDriver}. Dialect differences are confined to placeholder
+ * syntax ({@link param}) and column types (handled in migrations). JSON is
+ * stored/read as TEXT and bytes as base64 TEXT for cross-dialect portability
+ * (Postgres BIGINT comes back as a string, so numeric reads go through Number).
+ */
+import { param } from './driver'
+import type { SqlDriver } from './driver'
+import type {
+  ApprovalRecord,
+  ApprovalStore,
+  ArtifactRecord,
+  ArtifactStore,
+  EventLog,
+  MessageStore,
+  PersistedEvent,
+  RunRecord,
+  RunStatus,
+  RunStore,
+} from '@tanstack/ai-persistence'
+import type { ModelMessage, StreamChunk, TokenUsage } from '@tanstack/ai'
+
+/** Coerces a raw column value to a number (numeric columns may arrive as strings). */
+const num = (v: unknown): number => {
+  return Number(v)
+}
+/** Coerces a raw column value to a string. */
+const str = (v: unknown): string => {
+  return String(v)
+}
+
+/** Encodes `bytes` as a base64 string. */
+function toBase64(bytes: Uint8Array): string {
+  const buffer = Buffer.from(bytes)
+  return buffer.toString('base64')
+}
+/** Decodes a base64 string into a fresh `Uint8Array`. */
+function fromBase64(b64: string): Uint8Array {
+  const decoded = Buffer.from(b64, 'base64')
+  return new Uint8Array(decoded)
+}
+
+/**
+ * Message store over `message_threads`: each thread's transcript is stored as
+ * one JSON-encoded TEXT value keyed by `thread_id`.
+ */
+export function createMessageStore(driver: SqlDriver): MessageStore {
+  const p = (i: number) => param(driver.dialect, i)
+  return {
+    /** Returns the stored transcript for `threadId`, or `[]` when no row exists. */
+    async loadThread(threadId) {
+      const rows = await driver.query<{ messages: string }>(
+        `SELECT messages FROM message_threads WHERE thread_id = ${p(1)}`,
+        [threadId],
+      )
+      const row = rows[0]
+      if (!row) return []
+      return JSON.parse(row.messages) as Array<ModelMessage>
+    },
+    /** Inserts the transcript for `threadId`, replacing any existing one. */
+    async saveThread(threadId, messages) {
+      // Serialize once: the same JSON feeds both the INSERT and the
+      // ON CONFLICT update, so encoding the transcript twice is wasted work.
+      const json = JSON.stringify(messages)
+      await driver.exec(
+        `INSERT INTO message_threads (thread_id, messages) VALUES (${p(1)}, ${p(
+          2,
+        )}) ON CONFLICT (thread_id) DO UPDATE SET messages = ${p(3)}`,
+        [threadId, json, json],
+      )
+    },
+  }
+}
+
+/** Converts a `runs` row into a {@link RunRecord}; NULL columns are left off. */
+function mapRun(row: Record<string, unknown>): RunRecord {
+  const { finished_at: finishedAt, error, usage } = row
+  return {
+    runId: str(row.run_id),
+    threadId: str(row.thread_id),
+    status: str(row.status) as RunStatus,
+    startedAt: num(row.started_at),
+    ...(finishedAt == null ? {} : { finishedAt: num(finishedAt) }),
+    ...(error == null ? {} : { error: str(error) }),
+    ...(usage == null ? {} : { usage: JSON.parse(str(usage)) as TokenUsage }),
+  }
+}
+
+/**
+ * Run store over the `runs` table.
+ *
+ * `get` is a closure rather than something reached through `this`, so
+ * `createOrResume` keeps working when it is detached from the store object
+ * (destructured or passed as a callback).
+ */
+export function createRunStore(driver: SqlDriver): RunStore {
+  const p = (i: number) => param(driver.dialect, i)
+
+  /** Loads the run with `runId`, or `null` when no row exists. */
+  const get: RunStore['get'] = async (runId) => {
+    const rows = await driver.query(
+      `SELECT * FROM runs WHERE run_id = ${p(1)}`,
+      [runId],
+    )
+    const row = rows[0]
+    return row ? mapRun(row) : null
+  }
+
+  return {
+    /**
+     * Returns the stored run when `input.runId` already exists; otherwise
+     * inserts a new row (status defaults to `'running'`) and returns it.
+     */
+    async createOrResume(input) {
+      const existing = await get(input.runId)
+      if (existing) return existing
+      const record: RunRecord = {
+        runId: input.runId,
+        threadId: input.threadId,
+        status: input.status ?? 'running',
+        startedAt: input.startedAt,
+      }
+      await driver.exec(
+        `INSERT INTO runs (run_id, thread_id, status, started_at) VALUES (${p(
+          1,
+        )}, ${p(2)}, ${p(3)}, ${p(4)}) ON CONFLICT (run_id) DO NOTHING`,
+        [record.runId, record.threadId, record.status, record.startedAt],
+      )
+      // Re-read so that, if the insert hit the conflict clause, the row that
+      // is actually stored wins over the record built here.
+      return (await get(input.runId)) ?? record
+    },
+    /**
+     * Writes only the fields present in `patch`; when none of `status`,
+     * `finishedAt`, `error` or `usage` is set, no statement is issued.
+     */
+    async update(runId, patch) {
+      const sets: Array<string> = []
+      const values: Array<unknown> = []
+      let i = 1
+      if (patch.status !== undefined) {
+        sets.push(`status = ${p(i++)}`)
+        values.push(patch.status)
+      }
+      if (patch.finishedAt !== undefined) {
+        sets.push(`finished_at = ${p(i++)}`)
+        values.push(patch.finishedAt)
+      }
+      if (patch.error !== undefined) {
+        sets.push(`error = ${p(i++)}`)
+        values.push(patch.error)
+      }
+      if (patch.usage !== undefined) {
+        sets.push(`usage = ${p(i++)}`)
+        values.push(JSON.stringify(patch.usage))
+      }
+      if (!sets.length) return
+      // The run id is bound last, after every SET placeholder.
+      values.push(runId)
+      await driver.exec(
+        `UPDATE runs SET ${sets.join(', ')} WHERE run_id = ${p(i)}`,
+        values,
+      )
+    },
+    get,
+  }
+}
+
+/** Event log over `run_events`: one JSON-encoded event per `(run_id, seq)` row. */
+export function createEventLog(driver: SqlDriver): EventLog {
+  const p = (i: number) => param(driver.dialect, i)
+  return {
+    /** Stores `event` at `(runId, seq)`; an existing row at that key is kept. */
+    async append(runId, seq, event) {
+      const payload = JSON.stringify(event)
+      await driver.exec(
+        `INSERT INTO run_events (run_id, seq, event) VALUES (${p(1)}, ${p(
+          2,
+        )}, ${p(3)}) ON CONFLICT (run_id, seq) DO NOTHING`,
+        [runId, seq, payload],
+      )
+    },
+    /**
+     * Returns an async iterable over the run's events in ascending `seq`
+     * order, limited to `seq > opts.afterSeq` when that is given. The query
+     * runs only once iteration starts.
+     */
+    read(runId, opts) {
+      const after = opts?.afterSeq
+      const hasCursor = after !== undefined
+      const cursorClause = hasCursor ? ` AND seq > ${p(2)}` : ''
+      const sql = `SELECT seq, event FROM run_events WHERE run_id = ${p(1)}${cursorClause} ORDER BY seq ASC`
+      const values = hasCursor ? [runId, after] : [runId]
+
+      const replay = async function* (): AsyncIterable<PersistedEvent> {
+        const rows = await driver.query<{ seq: number; event: string }>(
+          sql,
+          values,
+        )
+        for (const { seq, event } of rows) {
+          yield { seq: num(seq), event: JSON.parse(str(event)) as StreamChunk }
+        }
+      }
+      return replay()
+    },
+    /** True when at least one event is stored for `runId`. */
+    async hasRun(runId) {
+      const rows = await driver.query(
+        `SELECT 1 AS one FROM run_events WHERE run_id = ${p(1)} LIMIT 1`,
+        [runId],
+      )
+      return rows.length > 0
+    },
+    /** Highest stored `seq` for `runId`, or 0 when the run has no events. */
+    async latestSeq(runId) {
+      const [row] = await driver.query<{ max_seq: number | null }>(
+        `SELECT MAX(seq) AS max_seq FROM run_events WHERE run_id = ${p(1)}`,
+        [runId],
+      )
+      const max = row?.max_seq
+      if (max == null) return 0
+      return num(max)
+    },
+  }
+}
+
+/** Converts an `approvals` row into an {@link ApprovalRecord}; a NULL `resolved_at` is left off. */
+function mapApproval(row: Record<string, unknown>): ApprovalRecord {
+  const { resolved_at: resolvedAt } = row
+  return {
+    approvalId: str(row.approval_id),
+    runId: str(row.run_id),
+    threadId: str(row.thread_id),
+    status: str(row.status) as ApprovalRecord['status'],
+    requestedAt: num(row.requested_at),
+    ...(resolvedAt == null ? {} : { resolvedAt: num(resolvedAt) }),
+    payload: JSON.parse(str(row.payload)) as Record<string, unknown>,
+  }
+}
+
+/** Approval store over the `approvals` table. */
+export function createApprovalStore(driver: SqlDriver): ApprovalStore {
+  const p = (i: number) => param(driver.dialect, i)
+  return {
+    /** Inserts `record`; an existing row with the same `approvalId` is kept. */
+    async create(record) {
+      const { approvalId, runId, threadId, status, requestedAt } = record
+      const payload = JSON.stringify(record.payload)
+      await driver.exec(
+        `INSERT INTO approvals (approval_id, run_id, thread_id, status, requested_at, payload)
+         VALUES (${p(1)}, ${p(2)}, ${p(3)}, ${p(4)}, ${p(5)}, ${p(6)})
+         ON CONFLICT (approval_id) DO NOTHING`,
+        [approvalId, runId, threadId, status, requestedAt, payload],
+      )
+    },
+    /** Marks the approval `'granted'` or `'denied'` and stamps `resolved_at` with the current time. */
+    async resolve(approvalId, granted) {
+      const status = granted ? 'granted' : 'denied'
+      const resolvedAt = Date.now()
+      await driver.exec(
+        `UPDATE approvals SET status = ${p(1)}, resolved_at = ${p(2)} WHERE approval_id = ${p(3)}`,
+        [status, resolvedAt, approvalId],
+      )
+    },
+    /** Loads the approval with `approvalId`, or `null` when no row exists. */
+    async get(approvalId) {
+      const [row] = await driver.query(
+        `SELECT * FROM approvals WHERE approval_id = ${p(1)}`,
+        [approvalId],
+      )
+      if (!row) return null
+      return mapApproval(row)
+    },
+    /**
+     * Maps each non-pending approval of the thread to `true` when its status
+     * is `'granted'` and `false` otherwise.
+     */
+    async decisionsForThread(threadId) {
+      const rows = await driver.query(
+        `SELECT approval_id, status FROM approvals WHERE thread_id = ${p(1)} AND status <> 'pending'`,
+        [threadId],
+      )
+      return new Map<string, boolean>(
+        rows.map((row): [string, boolean] => [
+          str(row.approval_id),
+          str(row.status) === 'granted',
+        ]),
+      )
+    },
+  }
+}
+
+/**
+ * Converts an `artifacts` row into an {@link ArtifactRecord}. `bytes` is
+ * decoded from base64; NULL `bytes_b64` / `external_url` columns are left off.
+ */
+function mapArtifact(row: Record<string, unknown>): ArtifactRecord {
+  const { bytes_b64: encoded, external_url: url } = row
+  return {
+    artifactId: str(row.artifact_id),
+    runId: str(row.run_id),
+    threadId: str(row.thread_id),
+    name: str(row.name),
+    mimeType: str(row.mime_type),
+    size: num(row.size),
+    ...(encoded == null ? {} : { bytes: fromBase64(str(encoded)) }),
+    ...(url == null ? {} : { externalUrl: str(url) }),
+    createdAt: num(row.created_at),
+  }
+}
+
+/** Artifact store over the `artifacts` table; inline bytes are kept base64-encoded. */
+export function createArtifactStore(driver: SqlDriver): ArtifactStore {
+  const p = (i: number) => param(driver.dialect, i)
+  return {
+    /** Inserts `record`; an existing row with the same `artifactId` is kept. */
+    async save(record) {
+      // One placeholder per inserted column, numbered 1 through 9.
+      const slots = [1, 2, 3, 4, 5, 6, 7, 8, 9].map((i) => p(i)).join(', ')
+      const encodedBytes = record.bytes ? toBase64(record.bytes) : null
+      const externalUrl = record.externalUrl ?? null
+      await driver.exec(
+        `INSERT INTO artifacts (artifact_id, run_id, thread_id, name, mime_type, size, bytes_b64, external_url, created_at)
+         VALUES (${slots})
+         ON CONFLICT (artifact_id) DO NOTHING`,
+        [
+          record.artifactId,
+          record.runId,
+          record.threadId,
+          record.name,
+          record.mimeType,
+          record.size,
+          encodedBytes,
+          externalUrl,
+          record.createdAt,
+        ],
+      )
+    },
+    /** Loads the artifact with `artifactId`, or `null` when no row exists. */
+    async get(artifactId) {
+      const [row] = await driver.query(
+        `SELECT * FROM artifacts WHERE artifact_id = ${p(1)}`,
+        [artifactId],
+      )
+      if (!row) return null
+      return mapArtifact(row)
+    },
+    /** Lists the run's artifacts ordered by `created_at`, oldest first. */
+    async list(runId) {
+      const rows = await driver.query(
+        `SELECT * FROM artifacts WHERE run_id = ${p(1)} ORDER BY created_at ASC`,
+        [runId],
+      )
+      return rows.map((row) => mapArtifact(row))
+    },
+  }
+}
diff --git a/packages/ai-persistence-sql/tests/sql-persistence.test.ts b/packages/ai-persistence-sql/tests/sql-persistence.test.ts
new file mode 100644
index 000000000..88cf78d80
--- /dev/null
+++ b/packages/ai-persistence-sql/tests/sql-persistence.test.ts
@@ -0,0 +1,128 @@
+import { describe, expect, it } from 'vitest'
+import { EventType } from '@tanstack/ai'
+import type { StreamChunk } from '@tanstack/ai'
+import { createSqlPersistence } from '../src/sql-persistence'
+import { migrate } from '../src/migrations'
+import { createTestSqliteDriver } from './sqlite-driver'
+
+/** Builds a TEXT_MESSAGE_CONTENT chunk for message `m1` carrying `delta`. */
+const text = (delta: string): StreamChunk => {
+  const chunk: StreamChunk = {
+    type: EventType.TEXT_MESSAGE_CONTENT,
+    messageId: 'm1',
+    delta,
+    timestamp: 1,
+  }
+  return chunk
+}
+
+describe('migrate', () => {
+  // Two consecutive runs must leave exactly one recorded version.
+  it('is idempotent (re-running applies nothing new)', async () => {
+    const driver = createTestSqliteDriver()
+    for (let pass = 0; pass < 2; pass++) {
+      await migrate(driver)
+    }
+
+    const recorded = await driver.query<{ version: number }>(
+      'SELECT version FROM _tanstack_ai_migrations',
+    )
+    const versions = recorded.map((row) => Number(row.version))
+    expect(versions).toEqual([1])
+  })
+})
+
+describe('createSqlPersistence (sqlite dialect)', () => {
+  // Each test gets its own in-memory database behind a fresh persistence.
+  const freshPersistence = () => createSqlPersistence(createTestSqliteDriver())
+
+  it('migrates lazily on first use and round-trips runs', async () => {
+    const runs = freshPersistence().runs!
+
+    const created = await runs.createOrResume({
+      runId: 'r1',
+      threadId: 't1',
+      startedAt: 100,
+    })
+    expect(created.status).toBe('running')
+
+    // Resuming an existing run returns the stored record, not the new input.
+    const resumed = await runs.createOrResume({
+      runId: 'r1',
+      threadId: 't1',
+      startedAt: 999,
+    })
+    expect(resumed.startedAt).toBe(100)
+
+    const usage = { promptTokens: 1, completionTokens: 2, totalTokens: 3 }
+    await runs.update('r1', { status: 'completed', finishedAt: 200, usage })
+
+    const stored = await runs.get('r1')
+    expect(stored?.status).toBe('completed')
+    expect(stored?.finishedAt).toBe(200)
+    expect(stored?.usage?.totalTokens).toBe(3)
+  })
+
+  it('appends events and replays after a sequence', async () => {
+    const events = freshPersistence().events!
+    for (const [index, delta] of ['a', 'b', 'c'].entries()) {
+      await events.append('r1', index + 1, text(delta))
+    }
+    expect(await events.hasRun('r1')).toBe(true)
+    expect(await events.latestSeq('r1')).toBe(3)
+
+    const replayed: Array<{ seq: number; delta: string }> = []
+    for await (const { seq, event } of events.read('r1', { afterSeq: 1 })) {
+      if (event.type === 'TEXT_MESSAGE_CONTENT') {
+        replayed.push({ seq, delta: event.delta })
+      }
+    }
+    expect(replayed).toEqual([
+      { seq: 2, delta: 'b' },
+      { seq: 3, delta: 'c' },
+    ])
+  })
+
+  it('append is idempotent on (runId, seq)', async () => {
+    const events = freshPersistence().events!
+    await events.append('r1', 1, text('a'))
+    await events.append('r1', 1, text('a-again'))
+    expect(await events.latestSeq('r1')).toBe(1)
+  })
+
+  it('round-trips the thread transcript', async () => {
+    const messages = freshPersistence().messages!
+    // A thread that was never saved loads as an empty transcript.
+    expect(await messages.loadThread('t1')).toEqual([])
+
+    await messages.saveThread('t1', [{ role: 'user', content: 'hi' }])
+    await messages.saveThread('t1', [
+      { role: 'user', content: 'hi' },
+      { role: 'assistant', content: 'hello' },
+    ])
+
+    const loaded = await messages.loadThread('t1')
+    expect(loaded).toEqual([
+      { role: 'user', content: 'hi' },
+      { role: 'assistant', content: 'hello' },
+    ])
+  })
+
+  it('persists and resolves approvals with thread decisions', async () => {
+    const approvals = freshPersistence().approvals!
+    await approvals.create({
+      approvalId: 'a1',
+      runId: 'r1',
+      threadId: 't1',
+      status: 'pending',
+      requestedAt: 1,
+      payload: { command: 'rm' },
+    })
+    await approvals.resolve('a1', true)
+
+    const resolved = await approvals.get('a1')
+    expect(resolved?.status).toBe('granted')
+    const decisions = await approvals.decisionsForThread('t1')
+    expect(decisions.get('a1')).toBe(true)
+  })
+
+  it('stores artifacts including inline bytes', async () => {
+    const artifacts = freshPersistence().artifacts!
+    await artifacts.save({
+      artifactId: 'art1',
+      runId: 'r1',
+      threadId: 't1',
+      name: 'out.bin',
+      mimeType: 'application/octet-stream',
+      size: 3,
+      bytes: new Uint8Array([1, 2, 3]),
+      createdAt: 1,
+    })
+
+    const stored = await artifacts.get('art1')
+    expect(stored?.name).toBe('out.bin')
+    expect(Array.from(stored?.bytes ?? [])).toEqual([1, 2, 3])
+    const listed = await artifacts.list('r1')
+    expect(listed).toHaveLength(1)
+  })
+})
diff --git a/packages/ai-persistence-sql/tests/sqlite-driver.ts b/packages/ai-persistence-sql/tests/sqlite-driver.ts
new file mode 100644
index 000000000..2da713987
--- /dev/null
+++ b/packages/ai-persistence-sql/tests/sqlite-driver.ts
@@ -0,0 +1,32 @@
+/**
+ * Test-only SqlDriver over Node's built-in `node:sqlite` (Node 22+). Lets the
+ * shared SQL stores be runtime-verified here without depending on the
+ * `@tanstack/ai-persistence-sqlite` package (which productionizes this same
+ * adapter). Uses an in-memory database by default.
+ */
+import { DatabaseSync } from 'node:sqlite'
+import type { SqlDriver, SqlRow } from '../src/driver'
+
+/**
+ * Creates a `SqlDriver` over a `node:sqlite` `DatabaseSync` opened at `path`
+ * (an in-memory database when omitted).
+ */
+export function createTestSqliteDriver(path = ':memory:'): SqlDriver {
+  const db = new DatabaseSync(path)
+  const bind = (params: ReadonlyArray<unknown>) => params as Array<never>
+  const driver: SqlDriver = {
+    dialect: 'sqlite',
+    exec(sql, params = []) {
+      const statement = db.prepare(sql)
+      statement.run(...bind(params))
+      return Promise.resolve()
+    },
+    query<T extends SqlRow = SqlRow>(
+      sql: string,
+      params: ReadonlyArray<unknown> = [],
+    ) {
+      const statement = db.prepare(sql)
+      const rows = statement.all(...bind(params))
+      return Promise.resolve(rows as Array<T>)
+    },
+    // node:sqlite offers no async transaction API, so the callback simply runs
+    // against this same driver. The stores only group DDL through it, which is
+    // acceptable for tests.
+    transaction(fn) {
+      return fn(driver)
+    },
+  }
+  return driver
+}
diff --git a/packages/ai-persistence-sql/tsconfig.json b/packages/ai-persistence-sql/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-persistence-sql/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-persistence-sql/vite.config.ts b/packages/ai-persistence-sql/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-persistence-sql/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+// Paths left out of the v8 coverage report.
+const coverageExclude = [
+  'node_modules/',
+  'dist/',
+  'tests/',
+  '**/*.test.ts',
+  '**/*.config.ts',
+  '**/types.ts',
+]
+
+// Vitest settings for this package: Node environment, specs under tests/.
+const config = defineConfig({
+  test: {
+    name: packageJson.name,
+    dir: './',
+    watch: false,
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: coverageExclude,
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+
+// Library build options (CJS output disabled), merged with the test config.
+const buildConfig = tanstackViteConfig({
+  entry: ['./src/index.ts'],
+  srcDir: './src',
+  cjs: false,
+})
+
+export default mergeConfig(config, buildConfig)
diff --git a/packages/ai-persistence-sqlite/package.json b/packages/ai-persistence-sqlite/package.json
new file mode 100644
index 000000000..2cafc2443
--- /dev/null
+++ b/packages/ai-persistence-sqlite/package.json
@@ -0,0 +1,54 @@
+{
+  "name": "@tanstack/ai-persistence-sqlite",
+  "version": "0.1.0",
+  "description": "SQLite backend for TanStack AI persistence — durable runs, messages, event log, approvals, and artifacts over node:sqlite (zero-dep, Node 22+) or a bring-your-own better-sqlite3 handle.",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-persistence-sqlite"
+  },
+  "keywords": [
+    "ai",
+    "tanstack",
+    "persistence",
+    "sqlite",
+    "node-sqlite",
+    "better-sqlite3"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "peerDependencies": {
+    "@tanstack/ai": "workspace:^",
+    "@tanstack/ai-persistence": "workspace:^",
+    "@tanstack/ai-persistence-sql": "workspace:^"
+  },
+  "devDependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-persistence": "workspace:*",
+    "@tanstack/ai-persistence-sql": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-persistence-sqlite/src/index.ts b/packages/ai-persistence-sqlite/src/index.ts
new file mode 100644
index 000000000..6e8827b68
--- /dev/null
+++ b/packages/ai-persistence-sqlite/src/index.ts
@@ -0,0 +1,72 @@
+/**
+ * SQLite backend. Wraps a SQLite client in the shared `SqlDriver` and assembles
+ * a `ChatPersistence` via `@tanstack/ai-persistence-sql`.
+ *
+ * Two client paths:
+ * - convenience: `sqlitePersistence({ path })` opens a `node:sqlite`
+ *   `DatabaseSync` immediately (built in to Node 22+, zero dependency).
+ * - BYO: pass `{ db }` — an existing `node:sqlite` `DatabaseSync` OR a
+ *   `better-sqlite3` `Database` (both expose `prepare(sql).run/all(...params)`).
+ */
+import { DatabaseSync } from 'node:sqlite'
+import { createSqlPersistence } from '@tanstack/ai-persistence-sql'
+import type { SqlDriver, SqlRow } from '@tanstack/ai-persistence-sql'
+import type { ChatPersistence, PersistenceMode } from '@tanstack/ai-persistence'
+
+/** Minimal structural view of a SQLite handle: the driver in this file only needs `prepare(sql)` and the statement's `run`/`all` (node:sqlite & better-sqlite3 both satisfy it). */
+interface SqliteClient {
+  prepare: (sql: string) => { // called once per exec/query with the raw SQL text
+    run: (...params: Array<unknown>) => unknown // used by exec; the return value is ignored
+    all: (...params: Array<unknown>) => Array<unknown> // used by query; rows are cast to the caller's row type
+  }
+}
+
+export interface SqliteDriverOptions { // options for createSqliteDriver; both fields are optional
+  /** File path (or ':memory:'). Used only when `db` is not provided; createSqliteDriver falls back to ':memory:' when omitted. */
+  path?: string
+  /** Bring-your-own SQLite handle (node:sqlite DatabaseSync or better-sqlite3 Database). Takes precedence over `path`. */
+  db?: SqliteClient
+}
+
+/** Build a {@link SqlDriver} backed by SQLite: uses `opts.db` when given, otherwise opens a `DatabaseSync` at `opts.path` (default ':memory:'). */
+export function createSqliteDriver(opts?: SqliteDriverOptions): SqlDriver {
+  const client: SqliteClient =
+    opts?.db ?? (new DatabaseSync(opts?.path ?? ':memory:') as SqliteClient)
+
+  // All methods are `async`, so a client throw (bad SQL, constraint failure) becomes a rejection, not a sync throw.
+  const driver: SqlDriver = {
+    dialect: 'sqlite',
+    async exec(sql, params = []) {
+      client.prepare(sql).run(...params)
+    },
+    async query<T extends SqlRow = SqlRow>(
+      sql: string,
+      params: ReadonlyArray<unknown> = [],
+    ) {
+      return client.prepare(sql).all(...params) as Array<T>
+    },
+    // Pass-through only — NOTE(review): no BEGIN/COMMIT is issued, so a failure
+    // inside `fn` leaves earlier statements applied; confirm callers accept that.
+    async transaction(fn) {
+      return fn(driver)
+    },
+  }
+  return driver
+}
+
+export interface SqlitePersistenceOptions extends SqliteDriverOptions { // driver options plus the settings forwarded to createSqlPersistence
+  mode?: PersistenceMode // passed through unchanged by sqlitePersistence
+  /** Run migrations on first use (default true). */
+  migrate?: boolean
+}
+
+/** Assemble a {@link ChatPersistence} on SQLite: build the driver from `path`/`db`, then hand `mode`/`migrate` to `createSqlPersistence`. */
+export function sqlitePersistence(
+  opts?: SqlitePersistenceOptions,
+): ChatPersistence {
+  // Split the options: connection fields feed the driver, the rest the SQL layer.
+  const connection = { path: opts?.path, db: opts?.db }
+  const settings = { mode: opts?.mode, migrate: opts?.migrate }
+  const sqliteDriver = createSqliteDriver(connection)
+  return createSqlPersistence(sqliteDriver, settings)
+}
diff --git a/packages/ai-persistence-sqlite/tests/sqlite.test.ts b/packages/ai-persistence-sqlite/tests/sqlite.test.ts
new file mode 100644
index 000000000..256af860d
--- /dev/null
+++ b/packages/ai-persistence-sqlite/tests/sqlite.test.ts
@@ -0,0 +1,44 @@
+import { describe, expect, it } from 'vitest'
+import { EventType } from '@tanstack/ai'
+import type { StreamChunk } from '@tanstack/ai'
+import { createResumeSource } from '@tanstack/ai-persistence'
+import { sqlitePersistence } from '../src/index'
+
+// Fixture builder: a text-content chunk for message 'm1' carrying `delta`.
+// The timestamp is pinned to 1 so every chunk built here is deterministic.
+function text(delta: string): StreamChunk {
+  const type = EventType.TEXT_MESSAGE_CONTENT
+  return { type, messageId: 'm1', delta, timestamp: 1 }
+}
+
+// Each test builds its own in-memory database via `sqlitePersistence()` (no path, no db).
+describe('sqlitePersistence', () => {
+  it('round-trips a run, events, and transcript on an in-memory db', async () => {
+    const p = sqlitePersistence()
+    await p.runs!.createOrResume({ runId: 'r1', threadId: 't1', startedAt: 1 })
+    await p.events!.append('r1', 1, text('a'))
+    await p.events!.append('r1', 2, text('b'))
+    await p.messages!.saveThread('t1', [{ role: 'user', content: 'hi' }])
+
+    expect(await p.events!.latestSeq('r1')).toBe(2)
+    expect((await p.runs!.get('r1'))?.status).toBe('running')
+    expect(await p.messages!.loadThread('t1')).toEqual([{ role: 'user', content: 'hi' }])
+  })
+
+  // replay() is called with no cursor here, so the whole log is expected back in order.
+  it('drives the core ResumeSource: replays the full log when no cursor is given', async () => {
+    const p = sqlitePersistence()
+    await p.events!.append('r1', 1, text('a'))
+    await p.events!.append('r1', 2, text('b'))
+    await p.events!.append('r1', 3, text('c'))
+
+    const source = createResumeSource(p.events!, p.runs)
+    expect(await source.hasRun('r1')).toBe(true)
+
+    const deltas: Array<string> = []
+    for await (const chunk of source.replay('r1', undefined)) {
+      if (chunk.type === 'TEXT_MESSAGE_CONTENT') deltas.push(chunk.delta)
+    }
+    expect(deltas).toEqual(['a', 'b', 'c'])
+  })
+})
diff --git a/packages/ai-persistence-sqlite/tsconfig.json b/packages/ai-persistence-sqlite/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-persistence-sqlite/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-persistence-sqlite/vite.config.ts b/packages/ai-persistence-sqlite/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-persistence-sqlite/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+const config = defineConfig({ // vitest settings; merged with the shared build config in the default export
+  test: {
+    name: packageJson.name, // test project name = the package name from package.json
+    dir: './',
+    watch: false, // single run by default; the `test:lib:dev` script passes --watch explicitly
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: [ // build output, tests, config files and type-only modules are left out of coverage
+        'node_modules/',
+        'dist/',
+        'tests/',
+        '**/*.test.ts',
+        '**/*.config.ts',
+        '**/types.ts',
+      ],
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+
+export default mergeConfig( // NOTE(review): tanstackViteConfig presumably supplies the library build settings — confirm in @tanstack/vite-config
+  config,
+  tanstackViteConfig({
+    entry: ['./src/index.ts'],
+    srcDir: './src',
+    cjs: false, // package.json `exports` declares only an `import` condition
+  }),
+)
diff --git a/packages/ai-persistence/package.json b/packages/ai-persistence/package.json
new file mode 100644
index 000000000..cca7bd6ef
--- /dev/null
+++ b/packages/ai-persistence/package.json
@@ -0,0 +1,54 @@
+{
+  "name": "@tanstack/ai-persistence",
+  "version": "0.1.0",
+  "description": "Headless persistence layer for TanStack AI — durable runs, message history, an append-only AG-UI event log, durable streams, approvals, artifacts, and resumable runs (runId + cursor) as composable chat() middleware (withPersistence, defineChatPersistence, memoryPersistence).",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-persistence"
+  },
+  "keywords": [
+    "ai",
+    "ai-sdk",
+    "typescript",
+    "tanstack",
+    "persistence",
+    "durable",
+    "resume",
+    "event-log",
+    "chat-history",
+    "ag-ui"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "peerDependencies": {
+    "@tanstack/ai": "workspace:^"
+  },
+  "devDependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-persistence/src/approval-controller.ts b/packages/ai-persistence/src/approval-controller.ts
new file mode 100644
index 000000000..202b672bb
--- /dev/null
+++ b/packages/ai-persistence/src/approval-controller.ts
@@ -0,0 +1,40 @@
+/**
+ * Server-side approval controller over an {@link ApprovalStore}.
+ *
+ * Approvals ride the existing deny-and-replay flow: a harness emits an
+ * `approval-requested` CUSTOM event (persisted automatically via the event log),
+ * the client POSTs a decision which `resolve()` records durably, and the next
+ * run reads the decisions via `decisionsForThread()` to build the engine's
+ * `TextOptions.approvals` map. This makes approvals durable and multi-device
+ * without the (deferred) true mid-run suspend.
+ */
+import type { ApprovalRecord, ApprovalStore } from './types'
+
+export interface ApprovalController { // server-side facade over an ApprovalStore; built by createApprovalController
+  /** Record a client decision for an approval (durably). `granted` is the decision: true = granted, false = denied. */
+  resolve: (approvalId: string, granted: boolean) => Promise<void>
+  /** Register a pending approval (usually emitted by the harness/event log). Callers omit `status`; createApprovalController sets it to 'pending'. */
+  request: (
+    record: Omit<ApprovalRecord, 'status' | 'resolvedAt'>,
+  ) => Promise<void>
+  /**
+   * Decisions for a thread as an `approvalId → granted` map, ready to pass as
+   * `chat({ approvals })` on the next/resumed run.
+   */
+  decisionsForThread: (threadId: string) => Promise<Map<string, boolean>>
+}
+
+/** Build an {@link ApprovalController} that forwards every call to `opts.store`; `request` stamps the record 'pending' first. */
+export function createApprovalController(opts: {
+  store: ApprovalStore
+}): ApprovalController {
+  const approvals = opts.store
+  const controller: ApprovalController = {
+    resolve(approvalId, granted) { return approvals.resolve(approvalId, granted) },
+    request(record) {
+      return approvals.create({ ...record, status: 'pending' })
+    },
+    decisionsForThread(threadId) { return approvals.decisionsForThread(threadId) },
+  }
+  return controller
+}
diff --git a/packages/ai-persistence/src/capabilities.ts b/packages/ai-persistence/src/capabilities.ts
new file mode 100644
index 000000000..9b4968173
--- /dev/null
+++ b/packages/ai-persistence/src/capabilities.ts
@@ -0,0 +1,36 @@
+/**
+ * Persistence capability tokens.
+ *
+ * `withPersistence` PROVIDES these so later middleware (and harness adapters)
+ * can read durable state. `LocksCapability` and `ResumeSourceCapability` are
+ * re-exported from core (`@tanstack/ai`) — they are shared, single-owner tokens
+ * (locks with the sandbox layer; the resume source with the chat engine's
+ * resume seam).
+ */
+import { createCapability } from '@tanstack/ai'
+import type { ApprovalStore, ChatPersistence, EventLog } from './types'
+
+export const PersistenceCapability =
+  createCapability<ChatPersistence>()('persistence') // token typed to carry the whole ChatPersistence aggregate
+
+export const EventsCapability =
+  createCapability<EventLog>()('persistence.events') // token typed to carry the EventLog
+
+export const ApprovalsCapability = createCapability<ApprovalStore>()(
+  'persistence.approvals', // token typed to carry the ApprovalStore
+)
+// Each token destructures into a pair. `withPersistence` calls the second member as `provideX(ctx, value)`; the first is presumably the matching reader — NOTE(review): confirm against `createCapability`.
+export const [getPersistence, providePersistence] = PersistenceCapability
+export const [getEvents, provideEvents] = EventsCapability
+export const [getApprovals, provideApprovals] = ApprovalsCapability
+
+// Shared, single-owner tokens live in core; re-export so consumers import
+// everything persistence-related from this package.
+export {
+  LocksCapability,
+  getLocks,
+  provideLocks,
+  ResumeSourceCapability,
+  getResumeSource,
+  provideResumeSource,
+} from '@tanstack/ai'
diff --git a/packages/ai-persistence/src/cursor.ts b/packages/ai-persistence/src/cursor.ts
new file mode 100644
index 000000000..62a6e66d1
--- /dev/null
+++ b/packages/ai-persistence/src/cursor.ts
@@ -0,0 +1,84 @@
+/**
+ * Resume cursors.
+ *
+ * A cursor is an OPAQUE string the client echoes back to resume a run. It
+ * encodes a `(runId, seq)` pair where `seq` is a per-run monotonic sequence
+ * assigned to each persisted event. The opacity keeps the public contract free
+ * of any "cursor is an integer" assumption — backends compare by the decoded
+ * `seq`, and the wire format can evolve without breaking clients.
+ *
+ * Encoding: base64url of `"<seq>:<runId>"`. The sequence comes first and has no
+ * colon, so the runId (which may contain colons) is everything after the first
+ * delimiter — robust regardless of runId content.
+ */
+
+/** Decode the inner `"<seq>:<runId>"` payload; null if malformed or if `seq` is not a safe integer. */
+function decodePayload(cursor: string): { runId: string; seq: number } | null {
+  let decoded: string
+  try {
+    // Lenient decode; the catch covers non-string input from untyped callers.
+    decoded = Buffer.from(cursor, 'base64url').toString('utf8')
+  } catch {
+    return null
+  }
+  // The first ':' ends the sequence; index 0 (or none) means no sequence digits.
+  const delimiter = decoded.indexOf(':')
+  if (delimiter <= 0) return null
+  const seqText = decoded.slice(0, delimiter)
+  if (!/^\d+$/.test(seqText)) return null
+  // Digit runs beyond 2^53-1 would round silently and compare as the wrong seq.
+  const seq = Number(seqText)
+  return Number.isSafeInteger(seq) ? { seq, runId: decoded.slice(delimiter + 1) } : null
+}
+
+/** Build the opaque cursor for `(runId, seq)`: base64url over the UTF-8 text `"<seq>:<runId>"`. */
+export function encodeCursor(runId: string, seq: number): string {
+  return Buffer.from(String(seq) + ':' + runId, 'utf8').toString('base64url')
+}
+
+/**
+ * Strict decode of `cursor` into its `(runId, seq)` pair; throws an `Error` quoting the cursor when it is malformed.
+ */
+export function decodeCursor(cursor: string): { runId: string; seq: number } {
+  const parsed = decodePayload(cursor)
+  if (parsed !== null) return parsed
+  throw new Error(`Invalid resume cursor: ${cursor}`)
+}
+
+/** True when `value` is non-empty and decodes to a `"<seq>:<runId>"` payload (the shape {@link encodeCursor} emits). */
+export function isValidCursor(value: string): boolean {
+  return value.length === 0 ? false : decodePayload(value) !== null
+}
+
+/**
+ * Counter that hands out a run's event sequence numbers, one `next()` at a
+ * time, each exactly one higher than the last. `withPersistence` keeps one per
+ * run; when resuming, pass the highest sequence already persisted as
+ * `initialSeq` so newly assigned numbers continue after the replayed events.
+ */
+export class RunSequence {
+  private readonly runId: string
+  private seq: number
+
+  constructor(runId: string, initialSeq = 0) {
+    this.runId = runId
+    this.seq = initialSeq
+  }
+
+  /** Advance the counter by one and return the newly assigned sequence. */
+  next(): number {
+    const assigned = this.seq + 1
+    this.seq = assigned
+    return assigned
+  }
+
+  /** Last sequence handed out (or `initialSeq` if `next()` was never called). */
+  current(): number {
+    return this.seq
+  }
+
+  /** Cursor for this run at the current sequence, via {@link encodeCursor}. */
+  toCursor(): string {
+    return encodeCursor(this.runId, this.seq)
+  }
+}
diff --git a/packages/ai-persistence/src/history.ts b/packages/ai-persistence/src/history.ts
new file mode 100644
index 000000000..18af0fdf2
--- /dev/null
+++ b/packages/ai-persistence/src/history.ts
@@ -0,0 +1,25 @@
+/**
+ * History projection — read a persisted run's events back as a `StreamChunk`
+ * timeline. This is the `events -> StreamChunk[]` projection devtools (and any
+ * client) consume to render or replay a PAST run through the exact same
+ * chunk-rendering path they use for live runs. Live devtools observation is
+ * unchanged; this adds the read-from-store side.
+ */
+import type { StreamChunk } from '@tanstack/ai'
+import type { EventLog } from './types'
+
+/**
+ * Drain `events.read(runId, opts)` and return just the chunks, in the order the
+ * log yields them. `opts` (including `afterSeq`) is passed to the log untouched.
+ */
+export async function loadRunHistory(
+  events: EventLog,
+  runId: string,
+  opts?: { afterSeq?: number },
+): Promise<Array<StreamChunk>> {
+  const timeline: Array<StreamChunk> = []
+  // Sequence numbers are dropped here; only the chunk payloads are returned.
+  const persisted = events.read(runId, opts)
+  for await (const entry of persisted) timeline.push(entry.event)
+  return timeline
+}
diff --git a/packages/ai-persistence/src/index.ts b/packages/ai-persistence/src/index.ts
new file mode 100644
index 000000000..d970db559
--- /dev/null
+++ b/packages/ai-persistence/src/index.ts
@@ -0,0 +1,61 @@
+// Store contracts + aggregate
+export { defineChatPersistence } from './types'
+export type {
+  PersistenceMode,
+  PersistedEvent,
+  MessageStore,
+  RunStatus,
+  RunRecord,
+  RunStore,
+  EventLog,
+  DurableRunStream,
+  ApprovalRecord,
+  ApprovalStore,
+  ArtifactRecord,
+  ArtifactStore,
+  ChatPersistence,
+} from './types'
+
+// Middleware
+export { withPersistence } from './middleware'
+export type { WithPersistenceOptions } from './middleware'
+
+// Reference in-memory implementation
+export { memoryPersistence } from './memory'
+
+// Cursor utilities
+export {
+  encodeCursor,
+  decodeCursor,
+  isValidCursor,
+  RunSequence,
+} from './cursor'
+
+// Resume-source adapter (EventLog + RunStore -> core ResumeSource)
+export { createResumeSource } from './resume-source'
+
+// History projection (events -> StreamChunk[] timeline for devtools / replay)
+export { loadRunHistory } from './history'
+
+// Approval controller
+export { createApprovalController } from './approval-controller'
+export type { ApprovalController } from './approval-controller'
+
+// Capabilities (incl. re-exported core Locks/ResumeSource tokens)
+export {
+  PersistenceCapability,
+  EventsCapability,
+  ApprovalsCapability,
+  getPersistence,
+  providePersistence,
+  getEvents,
+  provideEvents,
+  getApprovals,
+  provideApprovals,
+  LocksCapability,
+  getLocks,
+  provideLocks,
+  ResumeSourceCapability,
+  getResumeSource,
+  provideResumeSource,
+} from './capabilities'
diff --git a/packages/ai-persistence/src/memory.ts b/packages/ai-persistence/src/memory.ts
new file mode 100644
index 000000000..cb4ffbccb
--- /dev/null
+++ b/packages/ai-persistence/src/memory.ts
@@ -0,0 +1,156 @@
+/**
+ * In-memory {@link ChatPersistence} — the reference implementation of every
+ * store. Correct within a single process (no durability across restarts); used
+ * by tests, examples, and the devtools demo. Durable backends live in the
+ * `@tanstack/ai-persistence-*` packages.
+ */
+import { InMemoryLockStore } from '@tanstack/ai'
+import type { ModelMessage, StreamChunk } from '@tanstack/ai'
+import type {
+  ApprovalRecord,
+  ApprovalStore,
+  ArtifactRecord,
+  ArtifactStore,
+  ChatPersistence,
+  EventLog,
+  MessageStore,
+  PersistedEvent,
+  PersistenceMode,
+  RunRecord,
+  RunStore,
+} from './types'
+
+class MemoryMessageStore implements MessageStore {
+  private readonly threads = new Map<string, Array<ModelMessage>>() // threadId -> the store's own copy of the transcript
+  loadThread(threadId: string): Promise<Array<ModelMessage>> {
+    return Promise.resolve((this.threads.get(threadId) ?? []).slice()) // always a fresh array
+  }
+  saveThread(threadId: string, messages: Array<ModelMessage>): Promise<void> {
+    const snapshot = messages.slice() // copy so later caller mutations don't reach the store
+    return Promise.resolve(void this.threads.set(threadId, snapshot))
+  }
+}
+
+/** Run records keyed by runId. Creating is idempotent; updating an unknown run is a silent no-op. */
+class MemoryRunStore implements RunStore {
+  private readonly runs = new Map<string, RunRecord>()
+  createOrResume(input: {
+    runId: string
+    threadId: string
+    status?: RunRecord['status']
+    startedAt: number
+  }): Promise<RunRecord> {
+    const { runId, threadId, startedAt } = input
+    let record = this.runs.get(runId)
+    if (!record) {
+      // First sighting of this runId: store a fresh record, 'running' by default.
+      record = { runId, threadId, status: input.status ?? 'running', startedAt }
+      this.runs.set(runId, record)
+    }
+    return Promise.resolve(record)
+  }
+  update(
+    runId: string,
+    patch: Partial<
+      Pick<RunRecord, 'status' | 'finishedAt' | 'error' | 'usage'>
+    >,
+  ): Promise<void> {
+    const current = this.runs.get(runId)
+    // Replace (not mutate) the stored record so earlier snapshots stay unchanged.
+    if (current !== undefined) this.runs.set(runId, { ...current, ...patch })
+    return Promise.resolve()
+  }
+  get(runId: string): Promise<RunRecord | null> {
+    return Promise.resolve(this.runs.get(runId) ?? null)
+  }
+}
+
+class MemoryEventLog implements EventLog {
+  private readonly logs = new Map<string, Array<PersistedEvent>>() // runId -> entries in append order
+  append(runId: string, seq: number, event: StreamChunk): Promise<void> {
+    // Stored arrays are never empty, so an empty array here means "not registered yet".
+    const entries = this.logs.get(runId) ?? []
+    if (entries.length === 0) this.logs.set(runId, entries)
+    entries.push({ seq, event })
+    return Promise.resolve()
+  }
+  read(
+    runId: string,
+    opts?: { afterSeq?: number },
+  ): AsyncIterable<PersistedEvent> {
+    const floor = opts?.afterSeq ?? -Infinity
+    const snapshot = (this.logs.get(runId) ?? []).filter(({ seq }) => seq > floor)
+    return (async function* () {
+      for (const entry of snapshot) yield entry
+    })()
+  }
+  hasRun(runId: string): Promise<boolean> {
+    return Promise.resolve((this.logs.get(runId) ?? []).length > 0)
+  }
+  latestSeq(runId: string): Promise<number> {
+    const entries = this.logs.get(runId) ?? []
+    return Promise.resolve(entries.length > 0 ? entries[entries.length - 1].seq : 0)
+  }
+}
+
+/** Approvals keyed by approvalId. `resolve` replaces the stored record instead of mutating it, so a record returned by an earlier `get` is not changed by a later `resolve`. Resolving an unknown id is a silent no-op. */
+class MemoryApprovalStore implements ApprovalStore {
+  private readonly approvals = new Map<string, ApprovalRecord>()
+  create(record: Omit<ApprovalRecord, 'resolvedAt'>): Promise<void> {
+    this.approvals.set(record.approvalId, { ...record })
+    return Promise.resolve()
+  }
+  resolve(approvalId: string, granted: boolean): Promise<void> {
+    const existing = this.approvals.get(approvalId)
+    if (existing) {
+      const status = granted ? 'granted' : 'denied'
+      this.approvals.set(approvalId, { ...existing, status, resolvedAt: Date.now() })
+    }
+    return Promise.resolve()
+  }
+  get(approvalId: string): Promise<ApprovalRecord | null> {
+    return Promise.resolve(this.approvals.get(approvalId) ?? null)
+  }
+  decisionsForThread(threadId: string): Promise<Map<string, boolean>> {
+    const decisions = new Map<string, boolean>()
+    for (const a of this.approvals.values()) {
+      if (a.threadId !== threadId || a.status === 'pending') continue // other thread, or not decided yet
+      decisions.set(a.approvalId, a.status === 'granted')
+    }
+    return Promise.resolve(decisions)
+  }
+}
+
+/** Artifacts keyed by artifactId; `save` keeps a shallow copy, replacing any earlier record with that id. */
+class MemoryArtifactStore implements ArtifactStore {
+  private readonly artifacts = new Map<string, ArtifactRecord>()
+  save(record: ArtifactRecord): Promise<void> {
+    this.artifacts.set(record.artifactId, { ...record })
+    return Promise.resolve()
+  }
+  get(artifactId: string): Promise<ArtifactRecord | null> {
+    return Promise.resolve(this.artifacts.get(artifactId) ?? null)
+  }
+  list(runId: string): Promise<Array<ArtifactRecord>> {
+    const all = Array.from(this.artifacts.values())
+    return Promise.resolve(all.filter((artifact) => artifact.runId === runId))
+  }
+}
+
+/** Fresh in-memory stores bundled as one `ChatPersistence`. Every store is populated whatever `mode` says; `mode` defaults to 'agent'. State lives only in this process. */
+export function memoryPersistence(opts?: {
+  mode?: PersistenceMode
+}): ChatPersistence {
+  // Each call builds new store instances, so separate aggregates never share state.
+  const mode: PersistenceMode = opts?.mode ?? 'agent'
+  const aggregate: ChatPersistence = {
+    mode,
+    messages: new MemoryMessageStore(),
+    runs: new MemoryRunStore(),
+    events: new MemoryEventLog(),
+    approvals: new MemoryApprovalStore(),
+    artifacts: new MemoryArtifactStore(),
+    locks: new InMemoryLockStore(),
+  }
+  return aggregate
+}
diff --git a/packages/ai-persistence/src/middleware.ts b/packages/ai-persistence/src/middleware.ts
new file mode 100644
index 000000000..425238de4
--- /dev/null
+++ b/packages/ai-persistence/src/middleware.ts
@@ -0,0 +1,172 @@
+/**
+ * `withPersistence` — composable chat() middleware that makes a run durable.
+ *
+ * Maps onto the real middleware hooks:
+ * - `setup`     → create/resume the run record; provide capabilities; seed the
+ *                 per-run sequence (continuing past any already-persisted events).
+ * - `onConfig`  → (init only) load the thread transcript and choose the run's
+ *                 messages: the client's messages when it sent any, else the
+ *                 stored transcript (so a thin/resume request with no messages
+ *                 still runs on history).
+ * - `onChunk`   → assign the next per-run sequence, stamp the in-band `cursor`,
+ *                 append to the event log, publish to the durable stream.
+ * - `onFinish`  → mark the run completed, persist usage + the final transcript.
+ * - `onError`   → mark the run failed; `onAbort` → interrupted.
+ *
+ * Everything is gated on the presence of the relevant store, so a `messages`-only
+ * persistence is as valid as a full `agent` one, and a non-persisted run is
+ * completely unaffected (this middleware simply isn't in the stack).
+ *
+ * NOTE on message reconciliation: `ModelMessage` has no stable id (ids live on
+ * the client `UIMessage` and are stripped before the engine sees messages), so
+ * reconciliation is whole-transcript, server-authoritative, not id-level. True
+ * id/delta thin-client merging is a documented follow-up.
+ */
+import { defineChatMiddleware } from '@tanstack/ai'
+import {
+  ApprovalsCapability,
+  EventsCapability,
+  LocksCapability,
+  PersistenceCapability,
+  ResumeSourceCapability,
+  provideApprovals,
+  provideEvents,
+  provideLocks,
+  providePersistence,
+  provideResumeSource,
+} from './capabilities'
+import { RunSequence, encodeCursor } from './cursor'
+import { createResumeSource } from './resume-source'
+import type {
+  ChatMiddleware,
+  ChatMiddlewareConfig,
+  ChatMiddlewareContext,
+  StreamChunk,
+} from '@tanstack/ai'
+import type { ChatPersistence, PersistenceMode } from './types'
+
+export interface WithPersistenceOptions { // per-call options for withPersistence
+  /** Override the persistence aggregate's declared mode for this run. When omitted, `persistence.mode` is used. */
+  mode?: PersistenceMode
+}
+
+/** Per-run state, keyed by the stable middleware context: `seq` is the run's sequence counter, `merged` records that onConfig already chose the messages. Held in a WeakMap, so an entry does not keep its context alive. */
+const runState = new WeakMap<object, { seq: RunSequence; merged: boolean }>()
+
+/** Build the `chat()` middleware that persists a run through `persistence`. `opts.mode` overrides `persistence.mode`; each hook only touches stores that are present. */
+export function withPersistence(
+  persistence: ChatPersistence,
+  opts?: WithPersistenceOptions,
+): ChatMiddleware {
+  const mode = opts?.mode ?? persistence.mode
+  // Gates: events are off in 'messages' mode; approvals need 'agent' mode.
+  const wantsMessages = !!persistence.messages
+  const wantsEvents = mode !== 'messages' && !!persistence.events
+  const wantsApprovals = mode === 'agent' && !!persistence.approvals
+  const wantsLocks = !!persistence.locks
+
+  // Declared provisions must match what setup actually provides (array
+  // middleware is runtime-validated for coverage).
+  const provides = [
+    PersistenceCapability,
+    ...(wantsEvents ? [EventsCapability, ResumeSourceCapability] : []),
+    ...(wantsApprovals ? [ApprovalsCapability] : []),
+    ...(wantsLocks ? [LocksCapability] : []),
+  ]
+
+  return defineChatMiddleware({
+    name: 'persistence',
+    provides,
+    async setup(ctx: ChatMiddlewareContext) {
+      providePersistence(ctx, persistence)
+
+      if (persistence.runs) {
+        await persistence.runs.createOrResume({
+          runId: ctx.runId,
+          threadId: ctx.threadId,
+          startedAt: Date.now(),
+        })
+      }
+
+      // Continue the sequence past anything already persisted (resume-safe).
+      const initialSeq =
+        wantsEvents && persistence.events
+          ? await persistence.events.latestSeq(ctx.runId)
+          : 0
+      runState.set(ctx, {
+        seq: new RunSequence(ctx.runId, initialSeq),
+        merged: false,
+      })
+
+      if (wantsEvents && persistence.events) {
+        provideEvents(ctx, persistence.events)
+        provideResumeSource(
+          ctx,
+          createResumeSource(persistence.events, persistence.runs),
+        )
+      }
+      if (wantsApprovals && persistence.approvals) {
+        provideApprovals(ctx, persistence.approvals)
+      }
+      if (wantsLocks && persistence.locks) {
+        provideLocks(ctx, persistence.locks)
+      }
+    },
+
+    async onConfig(ctx: ChatMiddlewareContext, config: ChatMiddlewareConfig) {
+      if (ctx.phase !== 'init' || !wantsMessages || !persistence.messages) {
+        return
+      }
+      const state = runState.get(ctx)
+      if (state?.merged) return
+      if (state) state.merged = true
+
+      const stored = await persistence.messages.loadThread(ctx.threadId)
+      // Client messages win when present (full-history client); the stored
+      // transcript is only the fallback for a thin/resume request.
+      const merged = config.messages.length > 0 ? config.messages : stored
+      return { messages: merged }
+    },
+
+    async onChunk(ctx: ChatMiddlewareContext, chunk: StreamChunk) {
+      if (!wantsEvents || !persistence.events) return
+      const state = runState.get(ctx)
+      if (!state) return
+      const seq = state.seq.next()
+      const stamped: StreamChunk = {
+        ...chunk,
+        cursor: encodeCursor(ctx.runId, seq),
+      }
+      await persistence.events.append(ctx.runId, seq, stamped)
+      await persistence.stream?.publish(ctx.runId, seq, stamped)
+      return stamped
+    },
+
+    async onFinish(ctx: ChatMiddlewareContext, info) {
+      await persistence.runs?.update(ctx.runId, {
+        status: 'completed',
+        finishedAt: Date.now(),
+        ...(info.usage ? { usage: info.usage } : {}),
+      })
+      if (wantsMessages && persistence.messages) {
+        await persistence.messages.saveThread(ctx.threadId, [...ctx.messages])
+      }
+    },
+
+    async onError(ctx: ChatMiddlewareContext, info) {
+      await persistence.runs?.update(ctx.runId, {
+        status: 'failed',
+        finishedAt: Date.now(),
+        error:
+          info.error instanceof Error ? info.error.message : String(info.error),
+      })
+    },
+
+    async onAbort(ctx: ChatMiddlewareContext) {
+      await persistence.runs?.update(ctx.runId, {
+        status: 'interrupted',
+        finishedAt: Date.now(),
+      })
+    },
+  })
+}
diff --git a/packages/ai-persistence/src/resume-source.ts b/packages/ai-persistence/src/resume-source.ts
new file mode 100644
index 000000000..db52c83b1
--- /dev/null
+++ b/packages/ai-persistence/src/resume-source.ts
@@ -0,0 +1,34 @@
+/**
+ * Adapts the persistence {@link EventLog} (+ optional {@link RunStore}) to the
+ * core `ResumeSource` contract the `chat()` resume seam consumes. Cursors are
+ * decoded to a per-run sequence so replay returns only events after the point
+ * the client last saw.
+ */
+import { decodeCursor, isValidCursor } from './cursor'
+import type { ResumeSource, RunStatus, StreamChunk } from '@tanstack/ai'
+import type { EventLog, RunStore } from './types'
+
+/** Build a `ResumeSource` over `events` (+ optional `runs`); `getStatus` resolves null when there is no run store or no record for the run. */
+export function createResumeSource(
+  events: EventLog,
+  runs?: RunStore,
+): ResumeSource {
+  return {
+    hasRun: (runId) => events.hasRun(runId),
+    async *replay(runId, afterCursor): AsyncIterable<StreamChunk> {
+      // Honor a cursor only if it is well-formed AND was minted for this run; a
+      // missing, malformed, or foreign-run cursor falls back to a full replay.
+      const decoded =
+        afterCursor && isValidCursor(afterCursor) ? decodeCursor(afterCursor) : null
+      const readOpts =
+        decoded && decoded.runId === runId ? { afterSeq: decoded.seq } : undefined
+      for await (const { event } of events.read(runId, readOpts)) {
+        yield event
+      }
+    },
+    async getStatus(runId): Promise<RunStatus | null> {
+      const run = await runs?.get(runId)
+      return run ? run.status : null
+    },
+  }
+}
diff --git a/packages/ai-persistence/src/types.ts b/packages/ai-persistence/src/types.ts
new file mode 100644
index 000000000..dd2ea7454
--- /dev/null
+++ b/packages/ai-persistence/src/types.ts
@@ -0,0 +1,151 @@
+/**
+ * Persistence store contracts.
+ *
+ * The persisted run log is the AG-UI `StreamChunk` stream itself — there is no
+ * separate event type. Each store is an independently swappable seam; a
+ * `ChatPersistence` aggregate bundles the ones a deployment uses, gated by
+ * {@link PersistenceMode}.
+ */
+import type {
+  LockStore,
+  ModelMessage,
+  StreamChunk,
+  TokenUsage,
+} from '@tanstack/ai'
+
+/**
+ * How much to persist.
+ * - `messages`: thread message history only.
+ * - `chat`: messages + runs + event log + durable stream + usage (everything
+ *   needed for resumable conversations).
+ * - `agent`: everything in `chat` plus sandbox records, approvals, and
+ *   artifacts (for sandbox-backed harness runs).
+ */
+export type PersistenceMode = 'messages' | 'chat' | 'agent'
+
+/** A persisted, sequenced event (a chunk plus its per-run sequence). */
+export interface PersistedEvent {
+  seq: number
+  event: StreamChunk
+}
+
+/** Conversation history, keyed by threadId. Holds server-canonical messages. */
+export interface MessageStore {
+  loadThread: (threadId: string) => Promise<Array<ModelMessage>>
+  saveThread: (threadId: string, messages: Array<ModelMessage>) => Promise<void>
+}
+
+/** Lifecycle status of a run. */
+export type RunStatus = 'running' | 'completed' | 'failed' | 'interrupted'
+
+/** One execution attempt of `chat()`. */
+export interface RunRecord {
+  runId: string
+  threadId: string
+  status: RunStatus
+  startedAt: number // presumably epoch ms, like finishedAt — TODO confirm
+  finishedAt?: number // the persistence middleware stamps this with Date.now()
+  error?: string // message recorded when the middleware marks a run 'failed'
+  usage?: TokenUsage
+}
+
+export interface RunStore {
+  /** Create the run if new, or return the existing record (idempotent resume). */
+  createOrResume: (
+    input: Pick<RunRecord, 'runId' | 'threadId'> & {
+      status?: RunStatus // the memory store's tests see 'running' when omitted
+      startedAt: number // on resume the memory store keeps the stored value
+    },
+  ) => Promise<RunRecord>
+  update: (
+    runId: string,
+    patch: Partial<
+      Pick<RunRecord, 'status' | 'finishedAt' | 'error' | 'usage'>
+    >,
+  ) => Promise<void>
+  get: (runId: string) => Promise<RunRecord | null>
+}
+
+/** Append-only AG-UI event log — the source of truth for a run. */
+export interface EventLog {
+  append: (runId: string, seq: number, event: StreamChunk) => Promise<void>
+  /** Replay a run's persisted events, optionally only those with seq > afterSeq. */
+  read: (
+    runId: string,
+    opts?: { afterSeq?: number },
+  ) => AsyncIterable<PersistedEvent>
+  /** Whether any events have been persisted for the run. */
+  hasRun: (runId: string) => Promise<boolean>
+  /** Highest persisted seq for the run, or 0 when none. */
+  latestSeq: (runId: string) => Promise<number>
+}
+
+/** Live fan-out of run events to subscribers (e.g. CF Durable Objects). */
+export interface DurableRunStream {
+  publish: (runId: string, seq: number, event: StreamChunk) => Promise<void>
+}
+
+/** A persisted approval request + its resolution. */
+export interface ApprovalRecord {
+  approvalId: string
+  runId: string
+  threadId: string
+  status: 'pending' | 'granted' | 'denied'
+  requestedAt: number
+  resolvedAt?: number
+  payload: Record<string, unknown>
+}
+
+export interface ApprovalStore {
+  create: (record: Omit<ApprovalRecord, 'resolvedAt'>) => Promise<void>
+  resolve: (approvalId: string, granted: boolean) => Promise<void>
+  get: (approvalId: string) => Promise<ApprovalRecord | null>
+  /** All decided approvals for a thread, as an approvalId→granted map. */
+  decisionsForThread: (threadId: string) => Promise<Map<string, boolean>>
+}
+
+/** Metadata (and optionally inline bytes) for an agent-produced artifact. */
+export interface ArtifactRecord {
+  artifactId: string
+  runId: string
+  threadId: string
+  name: string
+  mimeType: string
+  size: number
+  /** Inline bytes for small artifacts; large ones use an external store (R2). */
+  bytes?: Uint8Array
+  externalUrl?: string
+  createdAt: number
+}
+
+export interface ArtifactStore {
+  save: (record: ArtifactRecord) => Promise<void>
+  get: (artifactId: string) => Promise<ArtifactRecord | null>
+  list: (runId: string) => Promise<Array<ArtifactRecord>>
+}
+
+/**
+ * Aggregate of the stores a deployment uses. `mode` declares the intended
+ * coverage; individual stores are present according to it (and to what a
+ * backend supports). `locks` (durable mutex) is the core {@link LockStore}.
+ */
+export interface ChatPersistence {
+  mode: PersistenceMode
+  messages?: MessageStore
+  runs?: RunStore
+  events?: EventLog
+  stream?: DurableRunStream
+  approvals?: ApprovalStore
+  artifacts?: ArtifactStore
+  locks?: LockStore
+}
+
+/**
+ * Identity helper for assembling a {@link ChatPersistence} from low-level
+ * stores. Pure pass-through today; the named entry point advanced users wire.
+ */
+export function defineChatPersistence(
+  persistence: ChatPersistence,
+): ChatPersistence {
+  return persistence
+}
diff --git a/packages/ai-persistence/tests/cursor.test.ts b/packages/ai-persistence/tests/cursor.test.ts
new file mode 100644
index 000000000..953a23129
--- /dev/null
+++ b/packages/ai-persistence/tests/cursor.test.ts
@@ -0,0 +1,65 @@
+import { describe, expect, it } from 'vitest'
+import {
+  RunSequence,
+  decodeCursor,
+  encodeCursor,
+  isValidCursor,
+} from '../src/cursor'
+
+describe('encodeCursor / decodeCursor', () => {
+  it('round-trips a runId and sequence', () => {
+    const cursor = encodeCursor('run-1', 42)
+    expect(decodeCursor(cursor)).toEqual({ runId: 'run-1', seq: 42 })
+  })
+
+  it('is opaque (not the raw "runId:seq")', () => {
+    const cursor = encodeCursor('run-1', 42)
+    expect(cursor).not.toContain('run-1')
+    expect(cursor).not.toBe('run-1:42')
+  })
+
+  it('round-trips runIds that contain the delimiter', () => {
+    const cursor = encodeCursor('thread:run:1', 7)
+    expect(decodeCursor(cursor)).toEqual({ runId: 'thread:run:1', seq: 7 })
+  })
+
+  it('orders by sequence within a run via the decoded seq', () => {
+    const a = decodeCursor(encodeCursor('r', 1)).seq
+    const b = decodeCursor(encodeCursor('r', 2)).seq
+    expect(b).toBeGreaterThan(a)
+  })
+})
+
+describe('isValidCursor', () => {
+  it('accepts a value produced by encodeCursor', () => {
+    expect(isValidCursor(encodeCursor('run-1', 1))).toBe(true)
+  })
+
+  it('rejects arbitrary / malformed strings', () => {
+    expect(isValidCursor('not-a-cursor')).toBe(false)
+    expect(isValidCursor('')).toBe(false)
+  })
+})
+
+describe('RunSequence', () => {
+  it('hands out monotonically increasing sequence numbers', () => {
+    const seq = new RunSequence('run-1')
+    expect(seq.next()).toBe(1)
+    expect(seq.next()).toBe(2)
+    expect(seq.next()).toBe(3)
+    expect(seq.current()).toBe(3)
+  })
+
+  it('resumes after an initial sequence (so resumed runs keep climbing)', () => {
+    const seq = new RunSequence('run-1', 10)
+    expect(seq.next()).toBe(11)
+    expect(seq.current()).toBe(11)
+  })
+
+  it('toCursor encodes the current sequence for this run', () => {
+    const seq = new RunSequence('run-1')
+    seq.next() // 1
+    seq.next() // 2
+    expect(decodeCursor(seq.toCursor())).toEqual({ runId: 'run-1', seq: 2 })
+  })
+})
diff --git a/packages/ai-persistence/tests/history.test.ts b/packages/ai-persistence/tests/history.test.ts
new file mode 100644
index 000000000..550e53ba9
--- /dev/null
+++ b/packages/ai-persistence/tests/history.test.ts
@@ -0,0 +1,41 @@
+import { describe, expect, it } from 'vitest'
+import { EventType } from '@tanstack/ai'
+import type { StreamChunk } from '@tanstack/ai'
+import { memoryPersistence } from '../src/memory'
+import { loadRunHistory } from '../src/history'
+
+const text = (delta: string): StreamChunk => ({
+  type: EventType.TEXT_MESSAGE_CONTENT,
+  messageId: 'm1',
+  delta,
+  timestamp: 1,
+})
+
+describe('loadRunHistory', () => {
+  it('projects a persisted run into an ordered StreamChunk timeline', async () => {
+    const { events } = memoryPersistence()
+    await events!.append('r1', 1, text('a'))
+    await events!.append('r1', 2, text('b'))
+    await events!.append('r1', 3, text('c'))
+
+    const timeline = await loadRunHistory(events!, 'r1')
+    expect(
+      timeline.map((c) =>
+        c.type === 'TEXT_MESSAGE_CONTENT' ? c.delta : c.type,
+      ),
+    ).toEqual(['a', 'b', 'c'])
+  })
+
+  it('supports paging via afterSeq', async () => {
+    const { events } = memoryPersistence()
+    await events!.append('r1', 1, text('a'))
+    await events!.append('r1', 2, text('b'))
+    const timeline = await loadRunHistory(events!, 'r1', { afterSeq: 1 })
+    expect(timeline).toHaveLength(1)
+  })
+
+  it('returns an empty timeline for an unknown run', async () => {
+    const { events } = memoryPersistence()
+    expect(await loadRunHistory(events!, 'nope')).toEqual([])
+  })
+})
diff --git a/packages/ai-persistence/tests/memory.test.ts b/packages/ai-persistence/tests/memory.test.ts
new file mode 100644
index 000000000..67d50a336
--- /dev/null
+++ b/packages/ai-persistence/tests/memory.test.ts
@@ -0,0 +1,129 @@
+import { describe, expect, it } from 'vitest'
+import { EventType } from '@tanstack/ai'
+import { memoryPersistence } from '../src/memory'
+import type { StreamChunk } from '@tanstack/ai'
+
+const chunk = (delta: string): StreamChunk => ({
+  type: EventType.TEXT_MESSAGE_CONTENT,
+  messageId: 'm1',
+  delta,
+  timestamp: 1,
+})
+
+describe('memoryPersistence', () => {
+  it('defaults to agent mode with every store present', () => {
+    const p = memoryPersistence()
+    expect(p.mode).toBe('agent')
+    expect(p.messages).toBeDefined()
+    expect(p.runs).toBeDefined()
+    expect(p.events).toBeDefined()
+    expect(p.approvals).toBeDefined()
+    expect(p.artifacts).toBeDefined()
+    expect(p.locks).toBeDefined()
+  })
+
+  it('honors a requested mode', () => {
+    expect(memoryPersistence({ mode: 'chat' }).mode).toBe('chat')
+  })
+
+  describe('runs', () => {
+    it('createOrResume is idempotent and update patches status', async () => {
+      const { runs } = memoryPersistence()
+      const a = await runs!.createOrResume({
+        runId: 'r1',
+        threadId: 't1',
+        startedAt: 100,
+      })
+      expect(a.status).toBe('running')
+      // Resume returns the SAME record, not a fresh one.
+      const b = await runs!.createOrResume({
+        runId: 'r1',
+        threadId: 't1',
+        startedAt: 999,
+      })
+      expect(b.startedAt).toBe(100)
+
+      await runs!.update('r1', { status: 'completed', finishedAt: 200 })
+      const got = await runs!.get('r1')
+      expect(got?.status).toBe('completed')
+      expect(got?.finishedAt).toBe(200)
+    })
+  })
+
+  describe('events', () => {
+    it('appends, reports hasRun/latestSeq, and reads after a seq', async () => {
+      const { events } = memoryPersistence()
+      expect(await events!.hasRun('r1')).toBe(false)
+      await events!.append('r1', 1, chunk('a'))
+      await events!.append('r1', 2, chunk('b'))
+      await events!.append('r1', 3, chunk('c'))
+      expect(await events!.hasRun('r1')).toBe(true)
+      expect(await events!.latestSeq('r1')).toBe(3)
+
+      const seen: Array<number> = []
+      for await (const e of events!.read('r1', { afterSeq: 1 })) {
+        seen.push(e.seq)
+      }
+      expect(seen).toEqual([2, 3])
+    })
+
+    it('reads all events when no afterSeq is given', async () => {
+      const { events } = memoryPersistence()
+      await events!.append('r1', 1, chunk('a'))
+      await events!.append('r1', 2, chunk('b'))
+      const seen: Array<string> = []
+      for await (const e of events!.read('r1')) {
+        if (e.event.type === 'TEXT_MESSAGE_CONTENT') seen.push(e.event.delta)
+      }
+      expect(seen).toEqual(['a', 'b'])
+    })
+  })
+
+  describe('messages', () => {
+    it('round-trips a thread transcript', async () => {
+      const { messages } = memoryPersistence()
+      expect(await messages!.loadThread('t1')).toEqual([])
+      await messages!.saveThread('t1', [{ role: 'user', content: 'hi' }])
+      expect(await messages!.loadThread('t1')).toEqual([
+        { role: 'user', content: 'hi' },
+      ])
+    })
+  })
+
+  describe('approvals', () => {
+    it('creates, resolves, and reports thread decisions', async () => {
+      const { approvals } = memoryPersistence()
+      await approvals!.create({
+        approvalId: 'a1',
+        runId: 'r1',
+        threadId: 't1',
+        status: 'pending',
+        requestedAt: 1,
+        payload: {},
+      })
+      expect((await approvals!.get('a1'))?.status).toBe('pending')
+      await approvals!.resolve('a1', true)
+      expect((await approvals!.get('a1'))?.status).toBe('granted')
+      const decisions = await approvals!.decisionsForThread('t1')
+      expect(decisions.get('a1')).toBe(true)
+    })
+  })
+
+  describe('artifacts', () => {
+    it('saves, gets, and lists by run', async () => {
+      const { artifacts } = memoryPersistence()
+      await artifacts!.save({
+        artifactId: 'art1',
+        runId: 'r1',
+        threadId: 't1',
+        name: 'out.txt',
+        mimeType: 'text/plain',
+        size: 3,
+        createdAt: 1,
+      })
+      expect((await artifacts!.get('art1'))?.name).toBe('out.txt')
+      expect(await artifacts!.list('r1')).toHaveLength(1)
+      expect(await artifacts!.list('other')).toHaveLength(0)
+    })
+  })
+})
diff --git a/packages/ai-persistence/tests/with-persistence.test.ts b/packages/ai-persistence/tests/with-persistence.test.ts
new file mode 100644
index 000000000..ca12d3112
--- /dev/null
+++ b/packages/ai-persistence/tests/with-persistence.test.ts
@@ -0,0 +1,138 @@
+import { describe, expect, it } from 'vitest'
+import { EventType, chat } from '@tanstack/ai'
+import type { AnyTextAdapter, StreamChunk } from '@tanstack/ai'
+import { memoryPersistence } from '../src/memory'
+import { withPersistence } from '../src/middleware'
+
+// --- minimal mock text adapter ---------------------------------------------
+
+/** Scripted adapter: the n-th `chatStream` call replays `iterations[n]`. */
+function mockAdapter(iterations: Array<Array<StreamChunk>>) {
+  const calls: Array<unknown> = []
+  let turn = 0
+  async function* emit(script: Array<StreamChunk>) {
+    yield* script
+  }
+  const adapter = {
+    kind: 'text',
+    name: 'mock',
+    model: 'test-model',
+    '~types': {},
+    chatStream: (opts: unknown) => {
+      calls.push(opts)
+      return emit(iterations[turn++] ?? [])
+    },
+    structuredOutput: async () => ({ data: {}, rawText: '{}' }),
+  } as unknown as AnyTextAdapter
+  return { adapter, calls }
+}
+
+const ev = {
+  runStarted: (runId = 'r1', threadId = 't1'): StreamChunk => ({
+    type: EventType.RUN_STARTED,
+    runId,
+    threadId,
+    timestamp: 1,
+  }),
+  text: (delta: string): StreamChunk => ({
+    type: EventType.TEXT_MESSAGE_CONTENT,
+    messageId: 'm1',
+    delta,
+    timestamp: 1,
+  }),
+  runFinished: (runId = 'r1', threadId = 't1'): StreamChunk => ({
+    type: EventType.RUN_FINISHED,
+    runId,
+    threadId,
+    finishReason: 'stop',
+    timestamp: 1,
+  }),
+}
+
+async function collect(stream: AsyncIterable<StreamChunk>) {
+  const out: Array<StreamChunk> = []
+  for await (const c of stream) out.push(c)
+  return out
+}
+
+describe('withPersistence (no sandbox)', () => {
+  it('persists events with cursors, completes the run, and saves the transcript', async () => {
+    const persistence = memoryPersistence()
+    const { adapter } = mockAdapter([
+      [ev.runStarted(), ev.text('hello'), ev.runFinished()],
+    ])
+
+    const chunks = await collect(
+      chat({
+        adapter,
+        messages: [{ role: 'user', content: 'hi' }],
+        runId: 'r1',
+        threadId: 't1',
+        middleware: [withPersistence(persistence)],
+      }) as AsyncIterable<StreamChunk>,
+    )
+
+    // Every emitted chunk carries an in-band cursor.
+    expect(chunks.length).toBeGreaterThan(0)
+    expect(chunks.every((c) => typeof c.cursor === 'string')).toBe(true)
+
+    // Events are in the log, run is completed, transcript saved.
+    expect(await persistence.events!.hasRun('r1')).toBe(true)
+    expect((await persistence.runs!.get('r1'))?.status).toBe('completed')
+    expect(
+      (await persistence.messages!.loadThread('t1')).length,
+    ).toBeGreaterThan(0)
+  })
+
+  it('resumes by replaying events after the cursor without running the adapter', async () => {
+    const persistence = memoryPersistence()
+    const first = mockAdapter([
+      [ev.runStarted(), ev.text('hello'), ev.text(' world'), ev.runFinished()],
+    ])
+
+    const original = await collect(
+      chat({
+        adapter: first.adapter,
+        messages: [{ role: 'user', content: 'hi' }],
+        runId: 'r1',
+        threadId: 't1',
+        middleware: [withPersistence(persistence)],
+      }) as AsyncIterable<StreamChunk>,
+    )
+
+    // Resume from the first chunk's cursor — should replay the rest, no adapter.
+    const afterCursor = original[0]!.cursor!
+    const resumeAdapter = mockAdapter([[ev.text('SHOULD NOT RUN')]])
+    const replay = await collect(
+      chat({
+        adapter: resumeAdapter.adapter,
+        messages: [],
+        runId: 'r1',
+        threadId: 't1',
+        cursor: afterCursor,
+        middleware: [withPersistence(persistence)],
+      }) as AsyncIterable<StreamChunk>,
+    )
+
+    expect(resumeAdapter.calls.length).toBe(0)
+    // Replayed cursors are exactly the original tail after the resume point.
+    expect(replay.map((c) => c.cursor)).toEqual(
+      original.slice(1).map((c) => c.cursor),
+    )
+  })
+
+  it('is a no-op without the middleware: chunks carry no cursor', async () => {
+    const { adapter } = mockAdapter([
+      [ev.runStarted(), ev.text('plain'), ev.runFinished()],
+    ])
+    const chunks = await collect(
+      chat({
+        adapter,
+        messages: [{ role: 'user', content: 'hi' }],
+        runId: 'r1',
+        threadId: 't1',
+      }) as AsyncIterable<StreamChunk>,
+    )
+    expect(chunks.every((c) => c.cursor === undefined)).toBe(true)
+  })
+})
diff --git a/packages/ai-persistence/tsconfig.json b/packages/ai-persistence/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-persistence/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-persistence/vite.config.ts b/packages/ai-persistence/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-persistence/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+const config = defineConfig({
+  test: {
+    name: packageJson.name,
+    dir: './',
+    watch: false,
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: [
+        'node_modules/',
+        'dist/',
+        'tests/',
+        '**/*.test.ts',
+        '**/*.config.ts',
+        '**/types.ts',
+      ],
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+
+export default mergeConfig(
+  config,
+  tanstackViteConfig({
+    entry: ['./src/index.ts'],
+    srcDir: './src',
+    cjs: false,
+  }),
+)
diff --git a/packages/ai-sandbox-cloudflare/package.json b/packages/ai-sandbox-cloudflare/package.json
new file mode 100644
index 000000000..f89a5dc80
--- /dev/null
+++ b/packages/ai-sandbox-cloudflare/package.json
@@ -0,0 +1,56 @@
+{
+  "name": "@tanstack/ai-sandbox-cloudflare",
+  "version": "0.1.0",
+  "description": "Cloudflare sandbox provider for TanStack AI — run harness adapters inside Cloudflare Containers (edge) through the uniform SandboxHandle.",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-sandbox-cloudflare"
+  },
+  "keywords": [
+    "ai",
+    "tanstack",
+    "sandbox",
+    "cloudflare",
+    "workers",
+    "edge",
+    "harness",
+    "agent"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "dependencies": {
+    "@cloudflare/sandbox": "^0.12.1"
+  },
+  "peerDependencies": {
+    "@tanstack/ai-sandbox": "workspace:^"
+  },
+  "devDependencies": {
+    "@cloudflare/workers-types": "^4.20241230.0",
+    "@tanstack/ai-sandbox": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-sandbox-cloudflare/src/handle.ts b/packages/ai-sandbox-cloudflare/src/handle.ts
new file mode 100644
index 000000000..804688a51
--- /dev/null
+++ b/packages/ai-sandbox-cloudflare/src/handle.ts
@@ -0,0 +1,263 @@
+/**
+ * SandboxHandle backed by a Cloudflare Sandbox (Containers + Durable Objects),
+ * via `@cloudflare/sandbox`. Runs at the edge inside a Worker.
+ *
+ * fs is implemented over `exec` with base64 piping (binary-safe), matching the
+ * Docker provider. The container disk is EPHEMERAL (wiped to the image on
+ * restart) and snapshots are not yet GA, so `capabilities.snapshots` and
+ * `durableFilesystem` are false — `withSandbox` re-bootstraps under the same
+ * identity across cold starts.
+ *
+ * LIMITATION: Cloudflare background processes do not expose a writable stdin,
+ * so `spawn().stdin.write` throws. Harness adapters that feed the prompt via
+ * stdin (e.g. the Claude Code adapter) therefore need a stdin-capable provider
+ * (local-process / Docker) or a future Cloudflare stdin path. `exec` (one-shot)
+ * works fully.
+ *
+ * NOTE: not runtime-verified in this repo (requires a Workers runtime); it
+ * compiles against the real `@cloudflare/sandbox` types and follows the proven
+ * provider contract.
+ */
+import { createExecBackedGit } from '@tanstack/ai-sandbox'
+import type { Sandbox } from '@cloudflare/sandbox'
+import type {
+  ExecResult,
+  ProcessOptions,
+  SandboxCapabilities,
+  SandboxChannel,
+  SandboxHandle,
+  SpawnHandle,
+} from '@tanstack/ai-sandbox'
+
+export const CLOUDFLARE_CAPS: SandboxCapabilities = {
+  fs: true, // implemented over exec with base64 piping
+  exec: true,
+  env: true,
+  ports: true, // ports.connect additionally requires a previewHostname
+  backgroundProcesses: true, // spawned processes have no writable stdin
+  snapshots: false, // snapshots are not yet GA on Cloudflare
+  networkPolicy: false,
+  durableFilesystem: false, // container disk is wiped to the image on restart
+  fork: false,
+}
+
+/** Wrap `value` in single quotes for `sh -c`, rewriting each `'` as `'\''`. */
+function q(value: string): string {
+  return "'" + value.split("'").join("'\\''") + "'"
+}
+
+/** Async-iterable string queue that adapts CF's push-style onOutput callback. */
+class OutputQueue {
+  private readonly pending: Array<string> = []
+  private readonly parked: Array<(r: IteratorResult<string>) => void> = []
+  private closed = false
+
+  push(value: string): void {
+    const consumer = this.parked.shift()
+    if (consumer === undefined) this.pending.push(value)
+    else consumer({ value, done: false })
+  }
+
+  /** Mark the queue finished and release every parked consumer with `done`. */
+  end(): void {
+    this.closed = true
+    for (const consumer of this.parked.splice(0)) {
+      consumer({ value: undefined, done: true })
+    }
+  }
+
+  async *[Symbol.asyncIterator](): AsyncIterator<string> {
+    while (this.pending.length > 0 || !this.closed) {
+      const head = this.pending.shift()
+      if (head !== undefined) {
+        yield head
+        continue
+      }
+      const next = await new Promise<IteratorResult<string>>((resolve) =>
+        this.parked.push(resolve),
+      )
+      if (next.done) return
+      yield next.value
+    }
+  }
+}
+
+/** SandboxHandle over one Cloudflare Sandbox; fs is emulated via exec + base64. */
+export class CloudflareHandle implements SandboxHandle {
+  readonly id: string
+  readonly provider = 'cloudflare'
+  readonly capabilities = CLOUDFLARE_CAPS
+  readonly fs: SandboxHandle['fs']
+  readonly git: SandboxHandle['git']
+  readonly process: SandboxHandle['process']
+  readonly ports: SandboxHandle['ports']
+  readonly env: SandboxHandle['env']
+
+  private readonly sandbox: Sandbox
+  private readonly workdir: string
+  private readonly previewHostname: string | undefined
+
+  constructor(
+    id: string,
+    sandbox: Sandbox,
+    workdir: string,
+    previewHostname?: string,
+  ) {
+    this.id = id
+    this.sandbox = sandbox
+    this.workdir = workdir
+    this.previewHostname = previewHostname
+
+    this.process = {
+      exec: (command, opts) => this.exec(command, opts),
+      spawn: (command, opts) => this.spawnProcess(command, opts),
+    }
+
+    this.fs = {
+      read: async (p) => {
+        const r = await this.exec(`base64 ${q(this.abs(p))}`)
+        if (r.exitCode !== 0) throw new Error(`read failed: ${r.stderr.trim()}`)
+        return Buffer.from(r.stdout, 'base64').toString('utf8')
+      },
+      readBytes: async (p) => {
+        const r = await this.exec(`base64 ${q(this.abs(p))}`)
+        if (r.exitCode !== 0) throw new Error(`read failed: ${r.stderr.trim()}`)
+        return new Uint8Array(Buffer.from(r.stdout, 'base64'))
+      },
+      write: async (p, data) => {
+        const abs = this.abs(p)
+        const b64 = Buffer.from(
+          typeof data === 'string' ? Buffer.from(data, 'utf8') : data,
+        ).toString('base64')
+        // A slash-less relative name has no parent segment: use '.', not itself.
+        const cut = abs.lastIndexOf('/')
+        const dir = cut < 0 ? '.' : abs.slice(0, cut) || '/'
+        const r = await this.exec(
+          `mkdir -p ${q(dir)} && printf %s ${q(b64)} | base64 -d > ${q(abs)}`,
+        )
+        if (r.exitCode !== 0)
+          throw new Error(`write failed: ${r.stderr.trim()}`)
+      },
+      list: async (p) => {
+        const r = await this.exec(`ls -1Ap ${q(this.abs(p))}`)
+        if (r.exitCode !== 0) throw new Error(`list failed: ${r.stderr.trim()}`)
+        return r.stdout
+          .split('\n')
+          .filter((line) => line.trim() !== '')
+          .map((entry) => {
+            const isDir = entry.endsWith('/')
+            const name = isDir ? entry.slice(0, -1) : entry
+            return {
+              name,
+              path: `${p.replace(/\/$/, '')}/${name}`,
+              type: isDir ? ('dir' as const) : ('file' as const),
+            }
+          })
+      },
+      mkdir: async (p) => {
+        await this.exec(`mkdir -p ${q(this.abs(p))}`)
+      },
+      remove: async (p) => {
+        await this.exec(`rm -rf ${q(this.abs(p))}`)
+      },
+      rename: async (from, to) => {
+        await this.exec(`mv ${q(this.abs(from))} ${q(this.abs(to))}`)
+      },
+      exists: async (p) => {
+        const r = await this.exec(`test -e ${q(this.abs(p))}`)
+        return r.exitCode === 0
+      },
+    }
+
+    this.git = createExecBackedGit(this.process, this.workdir)
+
+    this.ports = {
+      connect: (port) => this.connectPort(port),
+    }
+
+    this.env = {
+      set: (vars) => this.sandbox.setEnvVars(vars),
+    }
+  }
+
+  private abs(p: string): string {
+    if (this.workdir === '/workspace') return p
+    if (p === '/workspace') return this.workdir
+    if (p.startsWith('/workspace/')) {
+      return `${this.workdir}/${p.slice('/workspace/'.length)}`
+    }
+    return p
+  }
+
+  private async exec(
+    command: string,
+    opts?: ProcessOptions,
+  ): Promise<ExecResult> {
+    const { stdout, stderr, exitCode } = await this.sandbox.exec(command, {
+      ...(opts?.cwd ? { cwd: this.abs(opts.cwd) } : { cwd: this.workdir }),
+      ...(opts?.env ? { env: opts.env } : {}),
+    })
+    return { stdout, stderr, exitCode }
+  }
+
+  private async spawnProcess(
+    command: string,
+    opts?: ProcessOptions,
+  ): Promise<SpawnHandle> {
+    const stdout = new OutputQueue()
+    const stderr = new OutputQueue()
+    let resolveExit: (code: number) => void
+    const exitPromise = new Promise<number>((resolve) => {
+      resolveExit = resolve
+    })
+
+    const proc = await this.sandbox.startProcess(command, {
+      ...(opts?.cwd ? { cwd: this.abs(opts.cwd) } : { cwd: this.workdir }),
+      ...(opts?.env ? { env: opts.env } : {}),
+      onOutput: (stream, data) => {
+        if (stream === 'stdout') stdout.push(data)
+        else stderr.push(data)
+      },
+      onExit: (code) => {
+        stdout.end()
+        stderr.end()
+        // NOTE(review): a missing exit code is reported as 0 — confirm intended.
+        resolveExit(code ?? 0)
+      },
+    })
+
+    return {
+      pid: -1,
+      stdout,
+      stderr,
+      stdin: {
+        write: () =>
+          Promise.reject(
+            new Error(
+              'cloudflare: background processes do not expose stdin. Use exec(), or a stdin-capable provider (local-process / docker) for stdin-fed harnesses.',
+            ),
+          ),
+        end: () => Promise.resolve(),
+      },
+      wait: () => exitPromise,
+      kill: (signal) =>
+        proc.kill(typeof signal === 'string' ? signal : undefined),
+    }
+  }
+
+  private async connectPort(port: number): Promise<SandboxChannel> {
+    if (this.previewHostname === undefined) {
+      throw new Error(
+        'cloudflare: ports.connect requires a previewHostname. Pass previewHostname (your Worker request hostname) to cloudflareSandbox(...).',
+      )
+    }
+    const { url } = await this.sandbox.exposePort(port, {
+      hostname: this.previewHostname,
+    })
+    return { url }
+  }
+
+  async destroy(): Promise<void> {
+    await this.sandbox.destroy()
+  }
+}
diff --git a/packages/ai-sandbox-cloudflare/src/index.ts b/packages/ai-sandbox-cloudflare/src/index.ts
new file mode 100644
index 000000000..4e020fe42
--- /dev/null
+++ b/packages/ai-sandbox-cloudflare/src/index.ts
@@ -0,0 +1,5 @@
+export { cloudflareSandbox } from './provider'
+export type { CloudflareSandboxConfig } from './provider'
+export { CloudflareHandle, CLOUDFLARE_CAPS } from './handle'
+// Re-export the Sandbox class so users can wire the Durable Object binding.
+export { Sandbox } from '@cloudflare/sandbox'
diff --git a/packages/ai-sandbox-cloudflare/src/provider.ts b/packages/ai-sandbox-cloudflare/src/provider.ts
new file mode 100644
index 000000000..ac82d531f
--- /dev/null
+++ b/packages/ai-sandbox-cloudflare/src/provider.ts
@@ -0,0 +1,88 @@
+import { getSandbox } from '@cloudflare/sandbox'
+import { CLOUDFLARE_CAPS, CloudflareHandle } from './handle'
+import type { Sandbox } from '@cloudflare/sandbox'
+import type {
+  SandboxCapabilities,
+  SandboxCreateInput,
+  SandboxDestroyInput,
+  SandboxHandle,
+  SandboxProvider,
+  SandboxResumeInput,
+} from '@tanstack/ai-sandbox'
+
+const DEFAULT_WORKDIR = '/workspace'
+
+export interface CloudflareSandboxConfig {
+  /**
+   * The Sandbox Durable Object namespace binding (e.g. `env.Sandbox`).
+   * Available inside a Worker `fetch` handler.
+   */
+  binding: DurableObjectNamespace<Sandbox>
+  /** Working directory (made by `create()`); defaults to `/workspace`. */
+  workdir?: string
+  /**
+   * Your Worker's request hostname. `ports.connect` throws without it, since
+   * Cloudflare routes exposed ports (preview URLs) by hostname.
+   */
+  previewHostname?: string
+}
+
+/** `SandboxProvider` that addresses Cloudflare sandboxes by Durable Object id. */
+class CloudflareProvider implements SandboxProvider {
+  readonly name = 'cloudflare'
+
+  constructor(private readonly config: CloudflareSandboxConfig) {}
+
+  capabilities(): SandboxCapabilities {
+    return CLOUDFLARE_CAPS
+  }
+
+  private get workdir(): string {
+    return this.config.workdir ?? DEFAULT_WORKDIR
+  }
+
+  /** Wrap an addressed sandbox in the uniform handle. */
+  private wrap(id: string, sandbox: Sandbox): SandboxHandle {
+    const { previewHostname } = this.config
+    return new CloudflareHandle(id, sandbox, this.workdir, previewHostname)
+  }
+
+  /** Mint a fresh id, apply any initial env, and ensure the workdir exists. */
+  async create(input: SandboxCreateInput): Promise<SandboxHandle> {
+    const id = crypto.randomUUID()
+    const sandbox = getSandbox(this.config.binding, id)
+    const initialEnv = input.env
+    if (initialEnv && Object.keys(initialEnv).length > 0) {
+      await sandbox.setEnvVars(initialEnv)
+    }
+    await sandbox.mkdir(this.workdir, { recursive: true })
+    return this.wrap(id, sandbox)
+  }
+
+  /** Re-address an existing sandbox by its id. */
+  resume(input: SandboxResumeInput): Promise<SandboxHandle | null> {
+    // The Durable Object is durable, so the id is always addressable and this
+    // never resolves to null. A cold start may have wiped the container disk;
+    // withSandbox re-bootstraps under the same identity in that case
+    // (durableFilesystem is false).
+    const sandbox = getSandbox(this.config.binding, input.id)
+    return Promise.resolve(this.wrap(input.id, sandbox))
+  }
+
+  /** Destroy the sandbox addressed by `input.id`. */
+  async destroy(input: SandboxDestroyInput): Promise<void> {
+    const sandbox = getSandbox(this.config.binding, input.id)
+    await sandbox.destroy()
+  }
+}
+
+/**
+ * Create the Cloudflare sandbox provider, which runs harness adapters inside
+ * Cloudflare Containers at the edge. Construct it inside a Worker, passing the
+ * Sandbox Durable Object namespace binding. The stdin and snapshot limitations
+ * are described in the header comment of `handle.ts`.
+ */
+export function cloudflareSandbox(
+  config: CloudflareSandboxConfig,
+): SandboxProvider {
+  return new CloudflareProvider(config)
+}
diff --git a/packages/ai-sandbox-cloudflare/tests/handle.test.ts b/packages/ai-sandbox-cloudflare/tests/handle.test.ts
new file mode 100644
index 000000000..e0cc7983c
--- /dev/null
+++ b/packages/ai-sandbox-cloudflare/tests/handle.test.ts
@@ -0,0 +1,138 @@
+/**
+ * Deterministic tests for the Cloudflare handle against a MOCK Sandbox stub
+ * (no Workers runtime): verify exec pass-through, base64 fs round-trip, the
+ * spawn output queue, capabilities, and the documented stdin limitation.
+ */
+import { describe, expect, it } from 'vitest'
+import { CLOUDFLARE_CAPS, CloudflareHandle } from '../src/handle'
+import type { Sandbox } from '@cloudflare/sandbox'
+import type { ExecResult } from '@tanstack/ai-sandbox'
+
+/** Callback options the mock `startProcess` below accepts. */
+interface MockProc {
+  /** Called with each chunk of process output and the stream it belongs to. */
+  onOutput?: (stream: 'stdout' | 'stderr', data: string) => void
+  /** Called with the exit code when the mock process finishes. */
+  onExit?: (code: number | null) => void
+}
+
+/**
+ * A minimal in-memory Sandbox stub: fs lives in a Map; exec emulates the
+ * base64/test/mkdir commands the handle issues.
+ *
+ * @returns The stub (cast to `Sandbox`) plus the backing `files` map so tests
+ *   can inspect what was written.
+ */
+function mockSandbox(): { sandbox: Sandbox; files: Map<string, string> } {
+  const files = new Map<string, string>()
+
+  const exec = (command: string): Promise<ExecResult> => {
+    const ok = (stdout = ''): ExecResult => ({
+      stdout,
+      stderr: '',
+      exitCode: 0,
+    })
+    const fail = (stderr: string): ExecResult => ({
+      stdout: '',
+      stderr,
+      exitCode: 1,
+    })
+
+    // base64 '<path>'  -> read
+    const read = command.match(/^base64 '([^']+)'$/)
+    if (read) {
+      const path = read[1]!
+      if (!files.has(path)) return Promise.resolve(fail('no such file'))
+      return Promise.resolve(
+        ok(Buffer.from(files.get(path)!, 'utf8').toString('base64')),
+      )
+    }
+    // mkdir -p '<dir>' && printf %s '<b64>' | base64 -d > '<path>'  -> write
+    const write = command.match(/base64 -d > '([^']+)'$/)
+    // `*` (not `+`): an empty file has an empty base64 payload (`printf %s ''`),
+    // which must still register as a write instead of falling through.
+    const b64 = command.match(/printf %s '([^']*)'/)
+    if (write && b64) {
+      files.set(write[1]!, Buffer.from(b64[1]!, 'base64').toString('utf8'))
+      return Promise.resolve(ok())
+    }
+    // test -e '<path>'
+    const exists = command.match(/^test -e '([^']+)'$/)
+    if (exists) {
+      return Promise.resolve(files.has(exists[1]!) ? ok() : fail(''))
+    }
+    if (command.startsWith('mkdir -p')) return Promise.resolve(ok())
+    // `echo <text>` answers with everything after the 5-character prefix.
+    if (command.startsWith('echo '))
+      return Promise.resolve(ok(command.slice(5)))
+    // Any other command succeeds with empty output.
+    return Promise.resolve(ok())
+  }
+
+  const sandbox = {
+    exec,
+    setEnvVars: () => Promise.resolve(),
+    exposePort: (port: number) =>
+      Promise.resolve({ url: `https://${port}.example.workers.dev` }),
+    destroy: () => Promise.resolve(),
+    startProcess: (_cmd: string, opts: MockProc) => {
+      // Emit one line then exit on the next tick.
+      queueMicrotask(() => {
+        opts.onOutput?.('stdout', 'streamed-line\n')
+        opts.onExit?.(0)
+      })
+      return Promise.resolve({ kill: () => Promise.resolve() })
+    },
+  } as unknown as Sandbox
+
+  return { sandbox, files }
+}
+
+describe('CloudflareHandle', () => {
+  /**
+   * Builds a handle over a fresh mock sandbox. The preview hostname is only
+   * passed to the constructor when the test supplies one.
+   */
+  const makeHandle = (previewHostname?: string): CloudflareHandle => {
+    const { sandbox } = mockSandbox()
+    return previewHostname === undefined
+      ? new CloudflareHandle('sbx-1', sandbox, '/workspace')
+      : new CloudflareHandle('sbx-1', sandbox, '/workspace', previewHostname)
+  }
+
+  it('advertises edge capabilities (ephemeral disk, no snapshots/fork)', () => {
+    expect(CLOUDFLARE_CAPS).toMatchObject({
+      snapshots: false,
+      durableFilesystem: false,
+      fork: false,
+      exec: true,
+      fs: true,
+    })
+  })
+
+  it('round-trips files over base64 exec', async () => {
+    const handle = makeHandle()
+    const target = '/workspace/a.txt'
+    await handle.fs.write(target, 'hello edge')
+    expect(await handle.fs.exists(target)).toBe(true)
+    expect(await handle.fs.read(target)).toBe('hello edge')
+  })
+
+  it('exec passes stdout/exit through', async () => {
+    const result = await makeHandle().process.exec('echo hi')
+    expect(result.stdout).toContain('hi')
+    expect(result.exitCode).toBe(0)
+  })
+
+  it('spawn streams output via the queue and resolves wait()', async () => {
+    const proc = await makeHandle().process.spawn('run something')
+    const pieces: Array<string> = []
+    for await (const chunk of proc.stdout) {
+      pieces.push(chunk)
+    }
+    expect(pieces.join('')).toContain('streamed-line')
+    expect(await proc.wait()).toBe(0)
+  })
+
+  it('rejects stdin writes (documented CF limitation)', async () => {
+    const proc = await makeHandle().process.spawn('run something')
+    await expect(proc.stdin.write('x')).rejects.toThrow(/do not expose stdin/i)
+  })
+
+  it('exposes a port to a preview URL when a previewHostname is configured', async () => {
+    const handle = makeHandle('my.worker.dev')
+    const { url } = await handle.ports.connect(3000)
+    expect(url).toContain('3000')
+  })
+
+  it('ports.connect throws without a previewHostname', async () => {
+    const attempt = makeHandle().ports.connect(3000)
+    await expect(attempt).rejects.toThrow(/previewHostname/i)
+  })
+})
diff --git a/packages/ai-sandbox-cloudflare/tsconfig.json b/packages/ai-sandbox-cloudflare/tsconfig.json
new file mode 100644
index 000000000..1ca53bbf0
--- /dev/null
+++ b/packages/ai-sandbox-cloudflare/tsconfig.json
@@ -0,0 +1,9 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist",
+    "types": ["node", "@cloudflare/workers-types"]
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-sandbox-cloudflare/vite.config.ts b/packages/ai-sandbox-cloudflare/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-sandbox-cloudflare/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+// Paths excluded from the coverage report.
+const coverageExclude = [
+  'node_modules/',
+  'dist/',
+  'tests/',
+  '**/*.test.ts',
+  '**/*.config.ts',
+  '**/types.ts',
+]
+
+// Vitest settings for this package; merged with the shared library build below.
+const config = defineConfig({
+  test: {
+    name: packageJson.name,
+    dir: './',
+    watch: false,
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: coverageExclude,
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+
+// ESM-only library build rooted at src/index.ts.
+const libraryBuild = tanstackViteConfig({
+  entry: ['./src/index.ts'],
+  srcDir: './src',
+  cjs: false,
+})
+
+export default mergeConfig(config, libraryBuild)
diff --git a/packages/ai-sandbox-docker/package.json b/packages/ai-sandbox-docker/package.json
new file mode 100644
index 000000000..327b01ea6
--- /dev/null
+++ b/packages/ai-sandbox-docker/package.json
@@ -0,0 +1,55 @@
+{
+  "name": "@tanstack/ai-sandbox-docker",
+  "version": "0.1.0",
+  "description": "Docker sandbox provider for TanStack AI — run harness adapters inside isolated Docker containers through the uniform SandboxHandle.",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-sandbox-docker"
+  },
+  "keywords": [
+    "ai",
+    "tanstack",
+    "sandbox",
+    "docker",
+    "harness",
+    "agent",
+    "isolation"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "dependencies": {
+    "dockerode": "^4.0.2"
+  },
+  "peerDependencies": {
+    "@tanstack/ai-sandbox": "workspace:^"
+  },
+  "devDependencies": {
+    "@tanstack/ai-sandbox": "workspace:*",
+    "@types/dockerode": "^3.3.31",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-sandbox-docker/src/handle.ts b/packages/ai-sandbox-docker/src/handle.ts
new file mode 100644
index 000000000..e9b26e0aa
--- /dev/null
+++ b/packages/ai-sandbox-docker/src/handle.ts
@@ -0,0 +1,310 @@
+/**
+ * SandboxHandle backed by a Docker container (via dockerode). Real isolation:
+ * fs/exec/git operate inside the container; paths are real container paths
+ * (default workdir `/workspace`).
+ *
+ * fs is implemented over `exec` with base64 piping (binary-safe, no tar
+ * dependency); the container image must provide `sh`, `base64`, and coreutils
+ * (true for node:* / debian-based images).
+ */
+import { PassThrough, Writable } from 'node:stream'
+import {
+  UnsupportedCapabilityError,
+  createExecBackedGit,
+} from '@tanstack/ai-sandbox'
+import type Dockerode from 'dockerode'
+import type { Readable } from 'node:stream'
+import type {
+  ExecResult,
+  ProcessOptions,
+  SandboxCapabilities,
+  SandboxChannel,
+  SandboxHandle,
+  SnapshotRef,
+  SpawnHandle,
+} from '@tanstack/ai-sandbox'
+
+/**
+ * Capability flags for the Docker provider; exposed both as
+ * `DockerHandle.capabilities` and from `DockerProvider.capabilities()`.
+ */
+export const DOCKER_CAPS: SandboxCapabilities = {
+  fs: true,
+  exec: true,
+  env: true,
+  ports: true,
+  backgroundProcesses: true,
+  snapshots: true,
+  networkPolicy: false,
+  durableFilesystem: true, // container fs persists across stop/start (not removal)
+  fork: true,
+}
+
+/**
+ * POSIX single-quote escape for embedding paths in `sh -c`: wraps `value` in
+ * single quotes and rewrites every embedded `'` as `'\''`.
+ */
+function q(value: string): string {
+  const escaped = value.split("'").join(`'\\''`)
+  return "'" + escaped + "'"
+}
+
+/**
+ * Decode a readable stream into UTF-8 text chunks.
+ *
+ * String chunks are yielded unchanged. Binary chunks go through one streaming
+ * decoder, so a multi-byte character split across two chunks is reassembled
+ * instead of turning into replacement characters. Chunks that decode to an
+ * empty string (e.g. only the first bytes of a character) are not yielded.
+ *
+ * @param stream - Source stream of `string` or `Buffer` chunks.
+ * @returns An async iterable of decoded text pieces.
+ */
+async function* decodeStream(stream: Readable): AsyncIterable<string> {
+  // `ignoreBOM: true` keeps a leading U+FEFF in the output, matching what
+  // `Buffer#toString('utf8')` produces.
+  const decoder = new TextDecoder('utf-8', { ignoreBOM: true })
+  for await (const chunk of stream) {
+    if (typeof chunk === 'string') {
+      yield chunk
+      continue
+    }
+    const text = decoder.decode(chunk as Buffer, { stream: true })
+    if (text !== '') yield text
+  }
+  // Flush bytes of a trailing, incomplete sequence (decoded as U+FFFD).
+  const tail = decoder.decode()
+  if (tail !== '') yield tail
+}
+
+/** Constructor dependencies for `DockerHandle`. */
+export interface DockerHandleDeps {
+  /** Dockerode client; its modem demultiplexes exec output streams. */
+  docker: Dockerode
+  /** The container this handle operates on; its id becomes the handle id. */
+  container: Dockerode.Container
+  /** Default working directory for exec/spawn and the git helper. */
+  workdir: string
+  /** Factory used by fork: commit + create a new container from the image. */
+  forkFactory: (sourceContainerId: string) => Promise<SandboxHandle>
+  /** Remove the container on destroy (vs. just stop). */
+  removeOnDestroy: boolean
+}
+
+/**
+ * `SandboxHandle` for a single Docker container.
+ *
+ * Every fs / git / process operation is a `docker exec` of `sh -c <command>`
+ * inside the container; file contents travel base64-encoded through the
+ * command line and stdout. Failed fs commands throw with the command's stderr.
+ */
+export class DockerHandle implements SandboxHandle {
+  readonly id: string
+  readonly provider = 'docker'
+  readonly capabilities = DOCKER_CAPS
+  readonly fs: SandboxHandle['fs']
+  readonly git: SandboxHandle['git']
+  readonly process: SandboxHandle['process']
+  readonly ports: SandboxHandle['ports']
+  readonly env: SandboxHandle['env']
+
+  private readonly docker: Dockerode
+  private readonly container: Dockerode.Container
+  private readonly workdir: string
+  private readonly deps: DockerHandleDeps
+  /** Variables set through `env.set`; merged into every later exec/spawn. */
+  private readonly envVars: Record<string, string> = {}
+
+  /**
+   * @param deps - Docker client, target container, workdir, fork factory and
+   *   destroy policy. The handle id is the container id.
+   */
+  constructor(deps: DockerHandleDeps) {
+    this.docker = deps.docker
+    this.container = deps.container
+    this.workdir = deps.workdir
+    this.deps = deps
+    this.id = deps.container.id
+
+    this.process = {
+      exec: (command, opts) => this.exec(command, opts),
+      spawn: (command, opts) => this.spawnProcess(command, opts),
+    }
+
+    this.fs = {
+      read: async (p) => {
+        const r = await this.exec(`base64 ${q(this.abs(p))}`)
+        if (r.exitCode !== 0) throw new Error(`read failed: ${r.stderr.trim()}`)
+        return Buffer.from(r.stdout, 'base64').toString('utf8')
+      },
+      readBytes: async (p) => {
+        const r = await this.exec(`base64 ${q(this.abs(p))}`)
+        if (r.exitCode !== 0) throw new Error(`read failed: ${r.stderr.trim()}`)
+        return new Uint8Array(Buffer.from(r.stdout, 'base64'))
+      },
+      write: async (p, data) => {
+        const abs = this.abs(p)
+        const b64 = Buffer.from(
+          typeof data === 'string' ? Buffer.from(data, 'utf8') : data,
+        ).toString('base64')
+        // Parent directory of the target. A path without any '/' lives in the
+        // current directory; using the path itself here would make `mkdir -p`
+        // create a directory where the file is supposed to go.
+        const slash = abs.lastIndexOf('/')
+        const dir = slash < 0 ? '.' : slash === 0 ? '/' : abs.slice(0, slash)
+        const r = await this.exec(
+          `mkdir -p ${q(dir)} && printf %s ${q(b64)} | base64 -d > ${q(abs)}`,
+        )
+        if (r.exitCode !== 0)
+          throw new Error(`write failed: ${r.stderr.trim()}`)
+      },
+      list: async (p) => {
+        // -1: one entry per line, -A: include dotfiles, -p: '/' suffix on dirs
+        const r = await this.exec(`ls -1Ap ${q(this.abs(p))}`)
+        if (r.exitCode !== 0) throw new Error(`list failed: ${r.stderr.trim()}`)
+        return r.stdout
+          .split('\n')
+          .filter((line) => line.trim() !== '')
+          .map((entry) => {
+            const isDir = entry.endsWith('/')
+            const name = isDir ? entry.slice(0, -1) : entry
+            return {
+              name,
+              // Reported relative to the path the caller passed in.
+              path: `${p.replace(/\/$/, '')}/${name}`,
+              type: isDir ? ('dir' as const) : ('file' as const),
+            }
+          })
+      },
+      // mkdir / remove / rename report failures like read / write / list do,
+      // instead of silently ignoring a non-zero exit code.
+      mkdir: async (p) => {
+        const r = await this.exec(`mkdir -p ${q(this.abs(p))}`)
+        if (r.exitCode !== 0)
+          throw new Error(`mkdir failed: ${r.stderr.trim()}`)
+      },
+      remove: async (p) => {
+        const r = await this.exec(`rm -rf ${q(this.abs(p))}`)
+        if (r.exitCode !== 0)
+          throw new Error(`remove failed: ${r.stderr.trim()}`)
+      },
+      rename: async (from, to) => {
+        const r = await this.exec(
+          `mv ${q(this.abs(from))} ${q(this.abs(to))}`,
+        )
+        if (r.exitCode !== 0)
+          throw new Error(`rename failed: ${r.stderr.trim()}`)
+      },
+      exists: async (p) => {
+        const r = await this.exec(`test -e ${q(this.abs(p))}`)
+        return r.exitCode === 0
+      },
+    }
+
+    this.git = createExecBackedGit(this.process, this.workdir)
+
+    this.ports = {
+      connect: (port) => this.connectPort(port),
+    }
+
+    this.env = {
+      set: (vars) => {
+        Object.assign(this.envVars, vars)
+        return Promise.resolve()
+      },
+    }
+  }
+
+  /** Map the conventional `/workspace` virtual root to the container workdir. */
+  private abs(p: string): string {
+    if (this.workdir === '/workspace') return p
+    if (p === '/workspace') return this.workdir
+    if (p.startsWith('/workspace/'))
+      return `${this.workdir}/${p.slice('/workspace/'.length)}`
+    return p
+  }
+
+  /** `KEY=value` list for Docker: handle-level vars overlaid by `extra`. */
+  private envArray(extra?: Record<string, string>): Array<string> {
+    return Object.entries({ ...this.envVars, ...extra }).map(
+      ([k, v]) => `${k}=${v}`,
+    )
+  }
+
+  /** Error to throw for an aborted operation: the signal's reason when it is an Error. */
+  private static abortError(signal: AbortSignal): Error {
+    const reason: unknown = signal.reason
+    return reason instanceof Error ? reason : new Error('docker: exec aborted')
+  }
+
+  /**
+   * Run `command` through `sh -c` in the container and collect its output.
+   *
+   * @param command - Shell command line.
+   * @param opts - Optional cwd, extra env and abort signal.
+   * @returns Captured stdout/stderr and the exit code (0 when Docker reports none).
+   * @throws The abort reason when `opts.signal` aborts before or during the
+   *   run; the attach stream's error if the stream fails.
+   */
+  private async exec(
+    command: string,
+    opts?: ProcessOptions,
+  ): Promise<ExecResult> {
+    const signal = opts?.signal
+    if (signal?.aborted) throw DockerHandle.abortError(signal)
+
+    const exec = await this.container.exec({
+      Cmd: ['sh', '-c', command],
+      AttachStdout: true,
+      AttachStderr: true,
+      WorkingDir: opts?.cwd ? this.abs(opts.cwd) : this.workdir,
+      Env: this.envArray(opts?.env),
+    })
+    const stream = await exec.start({ hijack: true, stdin: false })
+
+    const stdoutChunks: Array<Buffer> = []
+    const stderrChunks: Array<Buffer> = []
+    const outW = new Writable({
+      write(chunk, _enc, cb) {
+        stdoutChunks.push(chunk as Buffer)
+        cb()
+      },
+    })
+    const errW = new Writable({
+      write(chunk, _enc, cb) {
+        stderrChunks.push(chunk as Buffer)
+        cb()
+      },
+    })
+    this.docker.modem.demuxStream(stream, outW, errW)
+
+    const state = { aborted: false }
+    const onAbort = (): void => {
+      state.aborted = true
+      // Only detaches from the exec; Docker offers no way to kill it.
+      stream.destroy()
+    }
+    if (signal?.aborted) {
+      // Aborted while the exec was being created: the event already fired.
+      onAbort()
+    } else {
+      signal?.addEventListener('abort', onAbort, { once: true })
+    }
+
+    try {
+      await new Promise<void>((resolve, reject) => {
+        stream.once('end', resolve)
+        // destroy() emits 'close' without 'end'; without this listener an
+        // aborted exec would never settle.
+        stream.once('close', resolve)
+        stream.once('error', reject)
+      })
+    } finally {
+      signal?.removeEventListener('abort', onAbort)
+    }
+    if (state.aborted && signal) throw DockerHandle.abortError(signal)
+
+    const info = await exec.inspect()
+    return {
+      stdout: Buffer.concat(stdoutChunks).toString('utf8'),
+      stderr: Buffer.concat(stderrChunks).toString('utf8'),
+      exitCode: info.ExitCode ?? 0,
+    }
+  }
+
+  /**
+   * Start `command` through `sh -c` with stdin attached and stream its output.
+   *
+   * @param command - Shell command line.
+   * @param opts - Optional cwd, extra env and abort signal.
+   * @returns A handle whose stdout/stderr iterables end, and whose `wait()`
+   *   resolves, once the attach stream ends or is closed (kill / abort).
+   */
+  private async spawnProcess(
+    command: string,
+    opts?: ProcessOptions,
+  ): Promise<SpawnHandle> {
+    const exec = await this.container.exec({
+      Cmd: ['sh', '-c', command],
+      AttachStdin: true,
+      AttachStdout: true,
+      AttachStderr: true,
+      WorkingDir: opts?.cwd ? this.abs(opts.cwd) : this.workdir,
+      Env: this.envArray(opts?.env),
+    })
+    const stream = await exec.start({ hijack: true, stdin: true })
+    const outPT = new PassThrough()
+    const errPT = new PassThrough()
+    this.docker.modem.demuxStream(stream, outPT, errPT)
+
+    // Registered at spawn time so a later wait() cannot miss the event, and
+    // on 'close' too because destroy() (kill / abort) never emits 'end'.
+    const finished = new Promise<void>((resolve) => {
+      const done = (): void => {
+        outPT.end()
+        errPT.end()
+        resolve()
+      }
+      stream.once('end', done)
+      stream.once('close', done)
+    })
+
+    const signal = opts?.signal
+    if (signal?.aborted) {
+      stream.destroy()
+    } else {
+      signal?.addEventListener('abort', () => stream.destroy(), {
+        once: true,
+      })
+    }
+
+    return {
+      pid: -1, // docker exec does not surface a host-visible pid
+      stdout: decodeStream(outPT),
+      stderr: decodeStream(errPT),
+      stdin: {
+        write: (data) =>
+          new Promise<void>((resolve, reject) => {
+            stream.write(data, (err) => (err ? reject(err) : resolve()))
+          }),
+        end: () => {
+          stream.end()
+          return Promise.resolve()
+        },
+      },
+      wait: async () => {
+        await finished
+        const info = await exec.inspect()
+        return info.ExitCode ?? 0
+      },
+      kill: () => {
+        stream.destroy()
+        return Promise.resolve()
+      },
+    }
+  }
+
+  /**
+   * Resolve a container port to its published host URL.
+   *
+   * @throws When the port has no host binding.
+   */
+  private async connectPort(port: number): Promise<SandboxChannel> {
+    const info = await this.container.inspect()
+    const mapping = info.NetworkSettings.Ports[`${port}/tcp`]
+    const hostPort = mapping?.[0]?.HostPort
+    if (!hostPort) {
+      throw new Error(
+        `docker: container port ${port} is not published. Pass publishPorts: [${port}] to dockerSandbox() to reach it from the host.`,
+      )
+    }
+    return { url: `http://localhost:${hostPort}` }
+  }
+
+  /**
+   * Commit the container to an image tagged
+   * `tanstack-ai-sandbox-snapshot:<id12>-<label>`.
+   *
+   * @param label - Optional label (default `snap`). Characters outside
+   *   `[A-Za-z0-9_.-]` are replaced with `-` in the tag so the returned id
+   *   always names the committed image; the label is returned unchanged.
+   * @returns The snapshot reference; `id` is the full `repo:tag`.
+   */
+  async snapshot(label?: string): Promise<SnapshotRef> {
+    const repo = 'tanstack-ai-sandbox-snapshot'
+    const safeLabel = (label ?? 'snap').replace(/[^A-Za-z0-9_.-]/g, '-')
+    // Docker limits a tag to 128 characters.
+    const tagName = `${this.id.slice(0, 12)}-${safeLabel}`.slice(0, 128)
+    await this.container.commit({ repo, tag: tagName })
+    return { id: `${repo}:${tagName}`, label }
+  }
+
+  /** Create an independent copy of this sandbox via the injected fork factory. */
+  fork = async (): Promise<SandboxHandle> => {
+    if (!this.capabilities.fork) {
+      throw new UnsupportedCapabilityError('docker', 'fork')
+    }
+    return this.deps.forkFactory(this.id)
+  }
+
+  /** Stop the container (5s grace) and, if configured, remove it with its volumes. */
+  async destroy(): Promise<void> {
+    try {
+      await this.container.stop({ t: 5 })
+    } catch {
+      // already stopped
+    }
+    if (this.deps.removeOnDestroy) {
+      await this.container.remove({ force: true, v: true })
+    }
+  }
+}
diff --git a/packages/ai-sandbox-docker/src/index.ts b/packages/ai-sandbox-docker/src/index.ts
new file mode 100644
index 000000000..d5ca43901
--- /dev/null
+++ b/packages/ai-sandbox-docker/src/index.ts
@@ -0,0 +1,4 @@
+export { dockerSandbox } from './provider'
+export type { DockerSandboxConfig } from './provider'
+export { DockerHandle, DOCKER_CAPS } from './handle'
+export type { DockerHandleDeps } from './handle'
diff --git a/packages/ai-sandbox-docker/src/provider.ts b/packages/ai-sandbox-docker/src/provider.ts
new file mode 100644
index 000000000..003c82490
--- /dev/null
+++ b/packages/ai-sandbox-docker/src/provider.ts
@@ -0,0 +1,177 @@
+import Dockerode from 'dockerode'
+import { DOCKER_CAPS, DockerHandle } from './handle'
+import type {
+  SandboxCapabilities,
+  SandboxCreateInput,
+  SandboxDestroyInput,
+  SandboxHandle,
+  SandboxProvider,
+  SandboxRestoreInput,
+  SandboxResumeInput,
+} from '@tanstack/ai-sandbox'
+
+/** Configuration accepted by `dockerSandbox()`. */
+export interface DockerSandboxConfig {
+  /** Image to run, e.g. `node:22`. Pulled automatically if absent locally. */
+  image: string
+  /** Working directory inside the container. Defaults to `/workspace`. */
+  workdir?: string
+  /** Options forwarded to `new Dockerode(...)` (socketPath, host, port, …). */
+  dockerodeOptions?: Dockerode.DockerOptions
+  /** Command that keeps the container alive. Defaults to `tail -f /dev/null`. */
+  keepAliveCommand?: Array<string>
+  /** Container ports to publish to the host (for `ports.connect`). */
+  publishPorts?: Array<number>
+  /**
+   * Add `host.docker.internal:host-gateway` so the container can reach the
+   * host (e.g. a host-side MCP tool-bridge). Defaults to true.
+   */
+  hostGateway?: boolean
+  /** Remove the container on destroy (vs. just stop). Defaults to true. */
+  removeOnDestroy?: boolean
+}
+
+/** Container working directory used when `DockerSandboxConfig.workdir` is unset. */
+const DEFAULT_WORKDIR = '/workspace'
+
+/**
+ * `SandboxProvider` that creates, resumes, forks, restores and destroys
+ * Docker containers through one Dockerode client.
+ */
+class DockerProvider implements SandboxProvider {
+  readonly name = 'docker'
+  private readonly docker: Dockerode
+
+  /** @param config - Image, workdir, port and lifecycle settings. */
+  constructor(private readonly config: DockerSandboxConfig) {
+    this.docker = new Dockerode(config.dockerodeOptions)
+  }
+
+  /** Returns the shared `DOCKER_CAPS` capability object. */
+  capabilities(): SandboxCapabilities {
+    return DOCKER_CAPS
+  }
+
+  private get workdir(): string {
+    return this.config.workdir ?? DEFAULT_WORKDIR
+  }
+
+  /** Pull `image` unless inspecting it locally succeeds. */
+  private async ensureImage(image: string): Promise<void> {
+    try {
+      await this.docker.getImage(image).inspect()
+      return
+    } catch {
+      // not present locally — pull it
+    }
+    const stream = await this.docker.pull(image)
+    await new Promise<void>((resolve, reject) => {
+      this.docker.modem.followProgress(stream, (err) =>
+        err ? reject(err) : resolve(),
+      )
+    })
+  }
+
+  /** Wrap a container in a handle configured like every other handle here. */
+  private wrap(container: Dockerode.Container): DockerHandle {
+    return new DockerHandle({
+      docker: this.docker,
+      container,
+      workdir: this.workdir,
+      forkFactory: this.forkFactory,
+      removeOnDestroy: this.config.removeOnDestroy ?? true,
+    })
+  }
+
+  /**
+   * Fork: commit the source container to an image and start a new container
+   * from it. Arrow property so it can be handed to handles unbound.
+   */
+  private readonly forkFactory = async (
+    sourceContainerId: string,
+  ): Promise<SandboxHandle> => {
+    const source = this.docker.getContainer(sourceContainerId)
+    const repo = 'tanstack-ai-sandbox-fork'
+    const tag = `${sourceContainerId.slice(0, 12)}-${Date.now()}`
+    const image = await source.commit({ repo, tag })
+    // Prefer the image id; otherwise fall back to the tag that was actually
+    // committed (no `:latest` tag is ever created for forks).
+    const imageRef =
+      typeof image.Id === 'string' ? image.Id : `${repo}:${tag}`
+    return this.startContainer(imageRef)
+  }
+
+  /**
+   * Create and start a container from `image`, then ensure the workdir exists.
+   *
+   * @param image - Image reference to run.
+   * @param env - Optional container environment.
+   * @returns A handle for the running container.
+   * @throws Rethrows start/bootstrap failures after a best-effort removal of
+   *   the container, which would otherwise be orphaned.
+   */
+  private async startContainer(
+    image: string,
+    env?: Record<string, string>,
+  ): Promise<SandboxHandle> {
+    const exposed: Record<string, Record<string, never>> = {}
+    const bindings: Record<string, Array<{ HostPort: string }>> = {}
+    for (const port of this.config.publishPorts ?? []) {
+      exposed[`${port}/tcp`] = {}
+      bindings[`${port}/tcp`] = [{ HostPort: '' }] // let Docker pick a free host port
+    }
+
+    const container = await this.docker.createContainer({
+      Image: image,
+      Cmd: this.config.keepAliveCommand ?? ['sh', '-c', 'tail -f /dev/null'],
+      Tty: false,
+      WorkingDir: this.workdir,
+      Env: env ? Object.entries(env).map(([k, v]) => `${k}=${v}`) : undefined,
+      ExposedPorts: Object.keys(exposed).length ? exposed : undefined,
+      HostConfig: {
+        ...(Object.keys(bindings).length ? { PortBindings: bindings } : {}),
+        ...(this.config.hostGateway !== false
+          ? { ExtraHosts: ['host.docker.internal:host-gateway'] }
+          : {}),
+      },
+    })
+
+    try {
+      await container.start()
+      const handle = this.wrap(container)
+      // Ensure the workspace dir exists.
+      await handle.fs.mkdir(this.workdir)
+      return handle
+    } catch (error: unknown) {
+      // The caller never receives this container's id, so remove it here.
+      try {
+        await container.remove({ force: true, v: true })
+      } catch {
+        // best-effort cleanup; report the original failure
+      }
+      throw error
+    }
+  }
+
+  /** Start a fresh container from the configured image, pulling it if needed. */
+  async create(input: SandboxCreateInput): Promise<SandboxHandle> {
+    await this.ensureImage(this.config.image)
+    return this.startContainer(this.config.image, input.env)
+  }
+
+  /**
+   * Re-attach to container `input.id`, starting it if it is stopped.
+   *
+   * @returns The handle, or `null` when the container cannot be inspected or
+   *   started.
+   */
+  async resume(input: SandboxResumeInput): Promise<SandboxHandle | null> {
+    const container = this.docker.getContainer(input.id)
+    let info: Dockerode.ContainerInspectInfo
+    try {
+      info = await container.inspect()
+    } catch {
+      return null
+    }
+    if (!info.State.Running) {
+      try {
+        await container.start()
+      } catch {
+        return null
+      }
+    }
+    return this.wrap(container)
+  }
+
+  /** Start a new container from the image named by `input.snapshotId`. */
+  async restoreSnapshot(input: SandboxRestoreInput): Promise<SandboxHandle> {
+    return this.startContainer(input.snapshotId, input.env)
+  }
+
+  /** Stop container `input.id` and, if configured, remove it; both best-effort. */
+  async destroy(input: SandboxDestroyInput): Promise<void> {
+    const container = this.docker.getContainer(input.id)
+    try {
+      await container.stop({ t: 5 })
+    } catch {
+      // already stopped / gone
+    }
+    if (this.config.removeOnDestroy ?? true) {
+      try {
+        await container.remove({ force: true, v: true })
+      } catch {
+        // already removed
+      }
+    }
+  }
+}
+
+/**
+ * Docker sandbox provider — runs harness adapters inside isolated containers.
+ * Requires a reachable Docker daemon (local socket by default; override via
+ * `dockerodeOptions`).
+ *
+ * @param config - Image and container settings for every sandbox it creates.
+ * @returns A `SandboxProvider` backed by a new `DockerProvider`.
+ */
+export function dockerSandbox(config: DockerSandboxConfig): SandboxProvider {
+  return new DockerProvider(config)
+}
diff --git a/packages/ai-sandbox-docker/tests/docker.test.ts b/packages/ai-sandbox-docker/tests/docker.test.ts
new file mode 100644
index 000000000..527d1023e
--- /dev/null
+++ b/packages/ai-sandbox-docker/tests/docker.test.ts
@@ -0,0 +1,92 @@
+import { describe, expect, it } from 'vitest'
+import Dockerode from 'dockerode'
+import { defineSandbox, defineWorkspace } from '@tanstack/ai-sandbox'
+import { dockerSandbox } from '../src/index'
+import type { SandboxHandle } from '@tanstack/ai-sandbox'
+
+/** Resolves true when a Docker daemon answers a ping, false on any failure. */
+async function isDockerReachable(): Promise<boolean> {
+  try {
+    await new Dockerode().ping()
+    return true
+  } catch {
+    // no daemon — these tests are skipped
+    return false
+  }
+}
+
+// Auto-gate: only run when a Docker daemon is reachable.
+const dockerAvailable = await isDockerReachable()
+
+const IMAGE = 'alpine:3'
+
+// Integration tests against a real daemon; each test destroys what it creates.
+describe.skipIf(!dockerAvailable)(
+  'docker provider (gated on a reachable daemon)',
+  () => {
+    it('creates a container, runs exec, fs round-trip, snapshot + destroy', async () => {
+      const provider = dockerSandbox({ image: IMAGE })
+      let sbx: SandboxHandle | undefined
+      let snapshotId: string | undefined
+      try {
+        sbx = await provider.create({})
+
+        const echo = await sbx.process.exec('echo hello-docker')
+        expect(echo.stdout.trim()).toBe('hello-docker')
+        expect(echo.exitCode).toBe(0)
+
+        await sbx.fs.write('/workspace/note.txt', 'inside the container')
+        expect(await sbx.fs.exists('/workspace/note.txt')).toBe(true)
+        expect(await sbx.fs.read('/workspace/note.txt')).toBe(
+          'inside the container',
+        )
+
+        // Bytes that are not valid UTF-8 must survive the base64 transport.
+        const bytes = new Uint8Array([0, 1, 2, 250])
+        await sbx.fs.write('/workspace/bin', bytes)
+        expect(Array.from(await sbx.fs.readBytes('/workspace/bin'))).toEqual([
+          0, 1, 2, 250,
+        ])
+
+        const snap = await sbx.snapshot?.('test')
+        snapshotId = snap?.id
+        expect(snap?.id).toMatch(/tanstack-ai-sandbox-snapshot/)
+      } finally {
+        await sbx?.destroy()
+        if (snapshotId) {
+          // destroy() removes the container only; drop the committed snapshot
+          // image too so repeated runs do not pile up images. Best-effort.
+          await new Dockerode()
+            .getImage(snapshotId)
+            .remove({ force: true })
+            .catch(() => undefined)
+        }
+      }
+    }, 120_000)
+
+    it('resumes a running container by id and streams a spawned process', async () => {
+      const provider = dockerSandbox({ image: IMAGE })
+      let sbx: SandboxHandle | undefined
+      try {
+        sbx = await provider.create({})
+        await sbx.fs.write('/workspace/keep.txt', 'persisted')
+
+        const resumed = await provider.resume({ id: sbx.id })
+        expect(resumed?.id).toBe(sbx.id)
+        expect(await resumed!.fs.read('/workspace/keep.txt')).toBe('persisted')
+
+        const proc = await resumed!.process.spawn('echo streamed-line')
+        let out = ''
+        for await (const chunk of proc.stdout) out += chunk
+        expect(out).toContain('streamed-line')
+        expect(await proc.wait()).toBe(0)
+      } finally {
+        await sbx?.destroy()
+      }
+    }, 120_000)
+
+    it('ensure() bootstraps a workspace (setup command runs)', async () => {
+      const provider = dockerSandbox({ image: IMAGE })
+      const def = defineSandbox({
+        id: 'docker-ensure',
+        provider,
+        workspace: defineWorkspace({
+          source: { type: 'none' },
+          setup: ['echo bootstrapped > /workspace/setup-marker'],
+        }),
+      })
+      const ctx = { threadId: 'docker-t', runId: 'r1' }
+      try {
+        const sbx = await def.ensure(ctx)
+        expect((await sbx.fs.read('/workspace/setup-marker')).trim()).toBe(
+          'bootstrapped',
+        )
+      } finally {
+        await def.destroy(ctx)
+      }
+    }, 120_000)
+  },
+)
diff --git a/packages/ai-sandbox-docker/tsconfig.json b/packages/ai-sandbox-docker/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-sandbox-docker/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-sandbox-docker/vite.config.ts b/packages/ai-sandbox-docker/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-sandbox-docker/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+// Paths excluded from the coverage report.
+const coverageExclude = [
+  'node_modules/',
+  'dist/',
+  'tests/',
+  '**/*.test.ts',
+  '**/*.config.ts',
+  '**/types.ts',
+]
+
+// Vitest settings for this package; merged with the shared library build below.
+const config = defineConfig({
+  test: {
+    name: packageJson.name,
+    dir: './',
+    watch: false,
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: coverageExclude,
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+
+// ESM-only library build rooted at src/index.ts.
+const libraryBuild = tanstackViteConfig({
+  entry: ['./src/index.ts'],
+  srcDir: './src',
+  cjs: false,
+})
+
+export default mergeConfig(config, libraryBuild)
diff --git a/packages/ai-sandbox-local-process/package.json b/packages/ai-sandbox-local-process/package.json
new file mode 100644
index 000000000..46f9f7983
--- /dev/null
+++ b/packages/ai-sandbox-local-process/package.json
@@ -0,0 +1,50 @@
+{
+  "name": "@tanstack/ai-sandbox-local-process",
+  "version": "0.1.0",
+  "description": "Local-process sandbox provider for TanStack AI — runs the agent directly on the host through the uniform SandboxHandle (no isolation; trusted/dev use).",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-sandbox-local-process"
+  },
+  "keywords": [
+    "ai",
+    "tanstack",
+    "sandbox",
+    "local",
+    "harness",
+    "agent"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "peerDependencies": {
+    "@tanstack/ai-sandbox": "workspace:^"
+  },
+  "devDependencies": {
+    "@tanstack/ai-sandbox": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-sandbox-local-process/src/handle.ts b/packages/ai-sandbox-local-process/src/handle.ts
new file mode 100644
index 000000000..9d4f4bd1b
--- /dev/null
+++ b/packages/ai-sandbox-local-process/src/handle.ts
@@ -0,0 +1,325 @@
+/**
+ * SandboxHandle backed by the host machine — no isolation. The "sandbox" is a
+ * real host directory; fs/exec/git operate directly on it.
+ *
+ * TRUST BOUNDARY: local-process runs commands and file writes on the HOST with
+ * the privileges of the current process. It provides NO isolation, NO network
+ * policy, and `exec` runs through a shell. Use it only in trusted/dev contexts
+ * (the fast no-Docker dev loop); never expose it to untrusted prompts in a
+ * context where host compromise matters. For isolation use the Docker or
+ * Cloudflare providers.
+ */
+import { spawn } from 'node:child_process'
+import { watch as watchFs } from 'node:fs'
+import * as fsp from 'node:fs/promises'
+import * as path from 'node:path'
+import {
+  DEFAULT_WORKSPACE_ROOT,
+  UnsupportedCapabilityError,
+  createExecBackedGit,
+} from '@tanstack/ai-sandbox'
+import type { Readable } from 'node:stream'
+import type {
+  ExecResult,
+  ProcessOptions,
+  SandboxCapabilities,
+  SandboxHandle,
+  SpawnHandle,
+} from '@tanstack/ai-sandbox'
+
+/** Capability flags reported by every local-process sandbox handle. */
+export const LOCAL_PROCESS_CAPS: SandboxCapabilities = {
+  fs: true,
+  exec: true,
+  env: true,
+  ports: true,
+  backgroundProcesses: true,
+  snapshots: false,
+  networkPolicy: false,
+  durableFilesystem: true,
+  fork: true,
+}
+
+/**
+ * Adapt a child-process stdio stream into an async iterable of UTF-8 text.
+ *
+ * The stream is switched to string mode with `setEncoding`, so a multi-byte
+ * character split across two chunks is decoded intact rather than being
+ * corrupted by decoding each chunk on its own. A `null` stream yields nothing.
+ */
+async function* decodeStream(stream: Readable | null): AsyncIterable<string> {
+  if (!stream) return
+  stream.setEncoding('utf8')
+  for await (const chunk of stream) {
+    yield typeof chunk === 'string' ? chunk : (chunk as Buffer).toString('utf8')
+  }
+}
+
+export interface LocalProcessHandleOptions {
+  /** Real host directory backing this sandbox (its workspace root). */
+  root: string
+  /** Remove the backing dir on destroy. */
+  removeOnDestroy: boolean
+  /** Create a fork by copying this sandbox's dir to a new root. */
+  forkFactory: (sourceRoot: string) => Promise<SandboxHandle>
+}
+
+/**
+ * {@link SandboxHandle} whose filesystem, processes and git all act directly
+ * on a host directory. Virtual `/workspace/...` paths are mapped onto `root`.
+ */
+export class LocalProcessHandle implements SandboxHandle {
+  readonly id: string
+  readonly provider = 'local-process'
+  readonly capabilities = LOCAL_PROCESS_CAPS
+  readonly fs: SandboxHandle['fs']
+  readonly git: SandboxHandle['git']
+  readonly process: SandboxHandle['process']
+  readonly ports: SandboxHandle['ports']
+  readonly env: SandboxHandle['env']
+
+  private readonly root: string
+  private readonly options: LocalProcessHandleOptions
+  private readonly envVars: Record<string, string> = {}
+
+  constructor(options: LocalProcessHandleOptions) {
+    // Normalise to an absolute path. `resolve()` compares candidates against
+    // the output of `path.resolve`, so a relative or trailing-slash root would
+    // make every path look as if it escaped the sandbox.
+    this.root = path.resolve(options.root)
+    this.id = this.root
+    this.options = options
+
+    this.fs = {
+      read: async (p) => fsp.readFile(this.resolve(p), 'utf8'),
+      readBytes: async (p) =>
+        new Uint8Array(await fsp.readFile(this.resolve(p))),
+      write: async (p, data) => {
+        const target = this.resolve(p)
+        await fsp.mkdir(path.dirname(target), { recursive: true })
+        await fsp.writeFile(
+          target,
+          typeof data === 'string' ? data : Buffer.from(data),
+        )
+      },
+      list: async (p) => {
+        const entries = await fsp.readdir(this.resolve(p), {
+          withFileTypes: true,
+        })
+        return entries.map((e) => ({
+          name: e.name,
+          path: `${p.replace(/\/$/, '')}/${e.name}`,
+          type: e.isDirectory() ? ('dir' as const) : ('file' as const),
+        }))
+      },
+      mkdir: async (p) => {
+        await fsp.mkdir(this.resolve(p), { recursive: true })
+      },
+      remove: async (p) => {
+        await fsp.rm(this.resolve(p), { recursive: true, force: true })
+      },
+      rename: async (from, to) => {
+        await fsp.rename(this.resolve(from), this.resolve(to))
+      },
+      exists: async (p) => {
+        try {
+          await fsp.access(this.resolve(p))
+          return true
+        } catch {
+          return false
+        }
+      },
+    }
+
+    // Native recursive file watching is supported on Windows/macOS but not
+    // Linux (Node throws ERR_FEATURE_UNAVAILABLE_ON_PLATFORM). Expose the
+    // optional `fs.watch` seam only where it works; on Linux it stays
+    // undefined so `watchWorkspace` falls back to the portable exec-poll path.
+    if (process.platform !== 'linux') {
+      this.fs.watch = (p, onEvent) => {
+        const dir = this.resolve(p)
+        // Emit paths under the requested watch root `p` (not a hardcoded
+        // `/workspace`), so callers watching a sub-path get consistent paths.
+        const base = p.replace(/\/+$/, '')
+        const watcher = watchFs(
+          dir,
+          { recursive: true },
+          (eventType, filename) => {
+            if (filename === null) return
+            const rel = filename.toString().split(path.sep).join('/')
+            onEvent({ type: eventType, path: `${base}/${rel}` })
+          },
+        )
+        return Promise.resolve({
+          stop: () => {
+            watcher.close()
+            return Promise.resolve()
+          },
+        })
+      }
+    }
+
+    this.process = {
+      exec: (command, opts) => this.exec(command, opts),
+      spawn: (command, opts) => this.spawnProcess(command, opts),
+    }
+
+    // NOTE(review): git is given the host root here; confirm the helper does
+    // not hand it back as `opts.cwd`, which `resolveCwd` treats as virtual.
+    this.git = createExecBackedGit(this.process, this.root)
+
+    this.ports = {
+      // The host can always reach the process directly on localhost.
+      connect: (port) => Promise.resolve({ url: `http://127.0.0.1:${port}` }),
+    }
+
+    this.env = {
+      set: (vars) => {
+        Object.assign(this.envVars, vars)
+        return Promise.resolve()
+      },
+    }
+  }
+
+  /** Map a virtual `/workspace` (or other absolute/relative) path onto the host root. */
+  private resolve(p: string): string {
+    let rel: string
+    if (p === DEFAULT_WORKSPACE_ROOT) rel = ''
+    else if (p.startsWith(`${DEFAULT_WORKSPACE_ROOT}/`)) {
+      rel = p.slice(DEFAULT_WORKSPACE_ROOT.length + 1)
+    } else if (p.startsWith('/')) rel = p.slice(1)
+    else rel = p
+    const resolved = path.resolve(this.root, rel)
+    // Containment: never let an agent's path escape the sandbox dir.
+    const rootWithSep = this.root.endsWith(path.sep)
+      ? this.root
+      : this.root + path.sep
+    if (resolved !== this.root && !resolved.startsWith(rootWithSep)) {
+      throw new Error(
+        `local-process: path "${p}" resolves outside the sandbox root "${this.root}".`,
+      )
+    }
+    return resolved
+  }
+
+  private resolveCwd(cwd: string | undefined): string {
+    return cwd ? this.resolve(cwd) : this.root
+  }
+
+  private mergedEnv(extra?: Record<string, string>): NodeJS.ProcessEnv {
+    return { ...process.env, ...this.envVars, ...extra }
+  }
+
+  /**
+   * Run `command` through the host shell and buffer its output.
+   *
+   * Resolves with the captured stdout/stderr and exit code once the child's
+   * stdio has closed; rejects if the child emits 'error' (e.g. spawn failure).
+   * Aborting `opts.signal`, before or during the run, kills the child.
+   */
+  private exec(command: string, opts?: ProcessOptions): Promise<ExecResult> {
+    return new Promise<ExecResult>((resolve, reject) => {
+      const child = spawn(command, {
+        shell: true,
+        cwd: this.resolveCwd(opts?.cwd),
+        env: this.mergedEnv(opts?.env),
+      })
+      const abortSignal = opts?.signal
+      const onAbort = (): void => {
+        child.kill()
+      }
+      const detach = (): void =>
+        abortSignal?.removeEventListener('abort', onAbort)
+      let stdout = ''
+      let stderr = ''
+      // String mode keeps multi-byte characters intact across chunk boundaries.
+      child.stdout.setEncoding('utf8').on('data', (d: string) => (stdout += d))
+      child.stderr.setEncoding('utf8').on('data', (d: string) => (stderr += d))
+      child.on('error', (err) => {
+        detach()
+        reject(err)
+      })
+      child.on('close', (code) => {
+        detach()
+        // NOTE(review): `code` is null when the child was ended by a signal
+        // (e.g. after an abort), so that case is reported as exit code 0.
+        resolve({ stdout, stderr, exitCode: code ?? 0 })
+      })
+      // An already-aborted signal will not fire 'abort' again; honour it now.
+      if (abortSignal?.aborted) onAbort()
+      else abortSignal?.addEventListener('abort', onAbort, { once: true })
+    })
+  }
+
+  /**
+   * Start `command` through the host shell without waiting for it to finish.
+   *
+   * Exit is tracked from the moment of spawning, so `wait()` settles even when
+   * first called after the process has already exited, and an 'error' event
+   * rejects `wait()` instead of being emitted with no listener attached.
+   * Aborting `opts.signal`, before or during the run, kills the child.
+   */
+  private spawnProcess(
+    command: string,
+    opts?: ProcessOptions,
+  ): Promise<SpawnHandle> {
+    const child = spawn(command, {
+      shell: true,
+      cwd: this.resolveCwd(opts?.cwd),
+      env: this.mergedEnv(opts?.env),
+    })
+    const abortSignal = opts?.signal
+    const onAbort = (): void => {
+      child.kill()
+    }
+    const exited = new Promise<number>((resolve, reject) => {
+      child.once('error', reject)
+      child.once('close', (code) => resolve(code ?? 0))
+    }).finally(() => abortSignal?.removeEventListener('abort', onAbort))
+    // A caller may never call wait(); keep a failure from becoming an
+    // unhandled rejection. wait() still rejects for anyone who awaits it.
+    exited.catch(() => undefined)
+    // An already-aborted signal will not fire 'abort' again; honour it now.
+    if (abortSignal?.aborted) onAbort()
+    else abortSignal?.addEventListener('abort', onAbort, { once: true })
+    const handle: SpawnHandle = {
+      pid: child.pid ?? -1,
+      stdout: decodeStream(child.stdout),
+      stderr: decodeStream(child.stderr),
+      stdin: {
+        write: (data) =>
+          new Promise<void>((resolve, reject) => {
+            child.stdin.write(data, (err) => (err ? reject(err) : resolve()))
+          }),
+        end: () =>
+          new Promise<void>((resolve) => {
+            child.stdin.end(() => resolve())
+          }),
+      },
+      wait: () => exited,
+      kill: (signal) => {
+        child.kill(signal)
+        return Promise.resolve()
+      },
+    }
+    return Promise.resolve(handle)
+  }
+
+  // local-process has no snapshot primitive; fork copies the dir instead.
+  snapshot = undefined
+
+  /** Create a new sandbox from this one's directory via `options.forkFactory`. */
+  fork = (): Promise<SandboxHandle> => {
+    if (!this.capabilities.fork) {
+      throw new UnsupportedCapabilityError('local-process', 'fork')
+    }
+    return this.options.forkFactory(this.root)
+  }
+
+  /** Delete the backing directory when `removeOnDestroy` is set; otherwise do nothing. */
+  async destroy(): Promise<void> {
+    if (this.options.removeOnDestroy) {
+      await fsp.rm(this.root, { recursive: true, force: true })
+    }
+  }
+}
diff --git a/packages/ai-sandbox-local-process/src/index.ts b/packages/ai-sandbox-local-process/src/index.ts
new file mode 100644
index 000000000..58da39d4b
--- /dev/null
+++ b/packages/ai-sandbox-local-process/src/index.ts
@@ -0,0 +1,4 @@
+export { localProcessSandbox } from './provider'
+export type { LocalProcessSandboxConfig } from './provider'
+export { LocalProcessHandle, LOCAL_PROCESS_CAPS } from './handle'
+export type { LocalProcessHandleOptions } from './handle'
diff --git a/packages/ai-sandbox-local-process/src/provider.ts b/packages/ai-sandbox-local-process/src/provider.ts
new file mode 100644
index 000000000..8911db1bb
--- /dev/null
+++ b/packages/ai-sandbox-local-process/src/provider.ts
@@ -0,0 +1,125 @@
+import { randomUUID } from 'node:crypto'
+import * as fsp from 'node:fs/promises'
+import * as os from 'node:os'
+import * as path from 'node:path'
+import { LOCAL_PROCESS_CAPS, LocalProcessHandle } from './handle'
+import type {
+  SandboxCapabilities,
+  SandboxCreateInput,
+  SandboxDestroyInput,
+  SandboxHandle,
+  SandboxProvider,
+  SandboxResumeInput,
+} from '@tanstack/ai-sandbox'
+
+export interface LocalProcessSandboxConfig {
+  /**
+   * Fixed host directory to use as the workspace (e.g. an existing local repo
+   * checkout). When set, every create/resume uses this exact dir and it is NOT
+   * removed on destroy unless `removeOnDestroy` is explicitly true. When
+   * omitted, each create allocates a fresh temp dir that IS removed on destroy.
+   */
+  dir?: string
+  /** Override the default temp base dir for generated sandboxes. */
+  baseDir?: string
+  /** Remove the backing dir on destroy. Defaults: true (generated), false (fixed `dir`). */
+  removeOnDestroy?: boolean
+}
+
+/** {@link SandboxProvider} that backs each sandbox with a directory on the host. */
+class LocalProcessProvider implements SandboxProvider {
+  readonly name = 'local-process'
+
+  constructor(private readonly config: LocalProcessSandboxConfig) {}
+
+  capabilities(): SandboxCapabilities {
+    return LOCAL_PROCESS_CAPS
+  }
+
+  /** Whether backing dirs are deleted on destroy (explicit setting, else true only without a fixed `dir`). */
+  private removeDefault(): boolean {
+    return this.config.removeOnDestroy ?? this.config.dir === undefined
+  }
+
+  /** Wrap `root` in a handle whose `fork()` copies it under the base dir. */
+  private makeHandle(root: string): SandboxHandle {
+    return new LocalProcessHandle({
+      root,
+      removeOnDestroy: this.removeDefault(),
+      forkFactory: (sourceRoot) => this.forkFrom(sourceRoot),
+    })
+  }
+
+  /**
+   * Copy `sourceRoot` into a fresh `fork-<uuid>` dir and wrap it in a handle.
+   *
+   * Forks are always removed on destroy and can themselves be forked, matching
+   * the `fork: true` capability every handle advertises. If the copy fails the
+   * partially written destination is removed before the error is rethrown.
+   */
+  private async forkFrom(sourceRoot: string): Promise<SandboxHandle> {
+    const dest = path.join(this.baseDir(), `fork-${randomUUID()}`)
+    await fsp.mkdir(dest, { recursive: true })
+    try {
+      await fsp.cp(sourceRoot, dest, { recursive: true })
+    } catch (err) {
+      // Best-effort cleanup; the copy error is the one worth reporting.
+      await fsp
+        .rm(dest, { recursive: true, force: true })
+        .catch(() => undefined)
+      throw err
+    }
+    return new LocalProcessHandle({
+      root: dest,
+      removeOnDestroy: true,
+      forkFactory: (nestedSource) => this.forkFrom(nestedSource),
+    })
+  }
+
+  /** Absolute base dir for generated sandboxes and forks, so sandbox ids are absolute paths. */
+  private baseDir(): string {
+    return path.resolve(
+      this.config.baseDir ?? path.join(os.tmpdir(), 'tanstack-ai-sandboxes'),
+    )
+  }
+
+  /** Create the workspace dir (the fixed `dir`, or a fresh one under the base dir) and return its handle. */
+  async create(_input: SandboxCreateInput): Promise<SandboxHandle> {
+    const root =
+      this.config.dir !== undefined
+        ? path.resolve(this.config.dir)
+        : path.join(this.baseDir(), randomUUID())
+    await fsp.mkdir(root, { recursive: true })
+    return this.makeHandle(root)
+  }
+
+  /** Re-attach to the sandbox whose id is its backing dir; resolves to `null` when that dir is gone. */
+  async resume(input: SandboxResumeInput): Promise<SandboxHandle | null> {
+    // The id is the backing dir path; resume only if it still exists.
+    try {
+      const stat = await fsp.stat(input.id)
+      if (!stat.isDirectory()) return null
+    } catch {
+      return null
+    }
+    return this.makeHandle(input.id)
+  }
+
+  /** Remove the dir named by `input.id`, but only when removal is enabled for this provider. */
+  async destroy(input: SandboxDestroyInput): Promise<void> {
+    if (this.removeDefault()) {
+      await fsp.rm(input.id, { recursive: true, force: true })
+    }
+  }
+}
+
+/**
+ * Local-process sandbox provider — runs the agent directly on the host with no
+ * isolation. The fast no-Docker dev loop. See the trust-boundary note in
+ * `handle.ts`.
+ */
+export function localProcessSandbox(
+  config: LocalProcessSandboxConfig = {},
+): SandboxProvider {
+  return new LocalProcessProvider(config)
+}
diff --git a/packages/ai-sandbox-local-process/tests/local-process.test.ts b/packages/ai-sandbox-local-process/tests/local-process.test.ts
new file mode 100644
index 000000000..af949c793
--- /dev/null
+++ b/packages/ai-sandbox-local-process/tests/local-process.test.ts
@@ -0,0 +1,174 @@
+import { afterAll, describe, expect, it } from 'vitest'
+import * as fsp from 'node:fs/promises'
+import * as os from 'node:os'
+import * as path from 'node:path'
+import {
+  bootstrapWorkspace,
+  defineSandbox,
+  defineWorkspace,
+  detectPackageManager,
+  spawnNdjson,
+} from '@tanstack/ai-sandbox'
+import { localProcessSandbox } from '../src/index'
+import type { SandboxHandle } from '@tanstack/ai-sandbox'
+
+const baseDir = path.join(os.tmpdir(), `tanstack-ai-lp-test-${Date.now()}`) // per-run temp base dir
+const provider = localProcessSandbox({ baseDir, removeOnDestroy: true }) // shared by every test below
+
+afterAll(async () => {
+  await fsp.rm(baseDir, { recursive: true, force: true }) // remove whatever the suite left behind
+})
+
+async function fresh(): Promise<SandboxHandle> {
+  return provider.create({}) // no fixed `dir` configured, so each call gets its own dir under baseDir
+}
+
+describe('local-process fs', () => { // fs operations addressed through virtual /workspace paths
+  it('writes, reads, lists, renames, removes', async () => {
+    const sbx = await fresh()
+    await sbx.fs.write('/workspace/a.txt', 'hello')
+    expect(await sbx.fs.read('/workspace/a.txt')).toBe('hello')
+    expect(await sbx.fs.exists('/workspace/a.txt')).toBe(true)
+
+    await sbx.fs.mkdir('/workspace/sub')
+    await sbx.fs.write('/workspace/sub/b.txt', 'world')
+    const listed = await sbx.fs.list('/workspace')
+    expect(listed.map((e) => e.name).sort()).toContain('a.txt')
+
+    await sbx.fs.rename('/workspace/a.txt', '/workspace/c.txt')
+    expect(await sbx.fs.exists('/workspace/a.txt')).toBe(false) // old name is gone
+    expect(await sbx.fs.read('/workspace/c.txt')).toBe('hello') // content moved with the rename
+
+    await sbx.fs.remove('/workspace/c.txt')
+    expect(await sbx.fs.exists('/workspace/c.txt')).toBe(false)
+    await sbx.destroy()
+  })
+
+  it('reads/writes bytes', async () => {
+    const sbx = await fresh()
+    await sbx.fs.write('/workspace/bin', new Uint8Array([1, 2, 3])) // binary payload, not a string
+    expect(Array.from(await sbx.fs.readBytes('/workspace/bin'))).toEqual([
+      1, 2, 3,
+    ])
+    await sbx.destroy()
+  })
+
+  it('contains paths within the sandbox root', async () => {
+    const sbx = await fresh()
+    await expect(sbx.fs.read('/workspace/../../../etc/hosts')).rejects.toThrow( // `..` traversal must be refused
+      /outside the sandbox root/,
+    )
+    await sbx.destroy()
+  })
+})
+
+describe('local-process process', () => { // exec (buffered) and spawn (streamed) on the host shell
+  it('exec captures stdout + exit code', async () => {
+    const sbx = await fresh()
+    const r = await sbx.process.exec('echo hello')
+    expect(r.stdout.trim()).toContain('hello')
+    expect(r.exitCode).toBe(0)
+    await sbx.destroy()
+  })
+
+  it('exec surfaces non-zero exit codes', async () => {
+    const sbx = await fresh()
+    const r = await sbx.process.exec('exit 7') // a failing command resolves; it does not reject
+    expect(r.exitCode).toBe(7)
+    await sbx.destroy()
+  })
+
+  it('spawn streams stdout and resolves wait()', async () => {
+    const sbx = await fresh()
+    const proc = await sbx.process.spawn('echo streamed')
+    let out = ''
+    for await (const chunk of proc.stdout) out += chunk // drain stdout fully before waiting
+    const code = await proc.wait()
+    expect(out.trim()).toContain('streamed')
+    expect(code).toBe(0)
+    await sbx.destroy()
+  })
+})
+
+describe('local-process + spawnNdjson (real agent-CLI streaming)', () => {
+  it('streams NDJSON events emitted by a spawned process', async () => {
+    const sbx = await fresh()
+    // A stand-in "agent CLI": a script that writes two JSON lines to stdout,
+    // in the style of `claude -p` stream-json output.
+      '/workspace/fake-agent.mjs',
+      [
+        `process.stdout.write(JSON.stringify({ type: 'text', delta: 'pong' }) + '\\n')`,
+        `process.stdout.write(JSON.stringify({ type: 'result', ok: true }) + '\\n')`,
+      ].join('\n'),
+    )
+    const events: Array<unknown> = []
+    for await (const ev of spawnNdjson(sbx, 'node fake-agent.mjs', {
+      cwd: '/workspace', // virtual path; the script was written to the sandbox root
+    })) {
+      events.push(ev)
+    }
+    expect(events).toEqual([ // one parsed object per emitted line, in order
+      { type: 'text', delta: 'pong' },
+      { type: 'result', ok: true },
+    ])
+    await sbx.destroy()
+  })
+})
+
+describe('local-process lifecycle', () => { // provider-level resume and handle-level fork
+  it('resume returns a handle for an existing dir, null otherwise', async () => {
+    const sbx = await fresh()
+    const resumed = await provider.resume({ id: sbx.id }) // the id is the backing dir path
+    expect(resumed?.id).toBe(sbx.id)
+    expect(
+      await provider.resume({ id: path.join(baseDir, 'does-not-exist') }),
+    ).toBeNull()
+    await sbx.destroy()
+  })
+
+  it('fork copies the working tree into a new sandbox', async () => {
+    const sbx = await fresh()
+    await sbx.fs.write('/workspace/seed.txt', 'forked')
+    const forked = await sbx.fork?.()
+    expect(forked).toBeDefined()
+    expect(await forked!.fs.read('/workspace/seed.txt')).toBe('forked') // file came along with the copy
+    expect(forked!.id).not.toBe(sbx.id) // the fork has its own backing dir
+    await forked!.destroy()
+    await sbx.destroy()
+  })
+})
+
+describe('local-process + bootstrap + ensure', () => { // integration with the core workspace helpers
+  it('runs setup commands and detects package manager', async () => {
+    const sbx = await fresh()
+    await sbx.fs.write('/workspace/pnpm-lock.yaml', 'lockfileVersion: 9') // lockfile the detection is expected to find
+    const workspace = defineWorkspace({
+      source: { type: 'none' },
+      setup: ['echo setup-ran'],
+    })
+    const result = await bootstrapWorkspace(sbx, workspace)
+    expect(result.ranSetup).toEqual(['echo setup-ran'])
+    expect(result.packageManager).toBe('pnpm')
+    expect(await detectPackageManager(sbx, workspace, '/workspace')).toBe(
+      'pnpm',
+    )
+    await sbx.destroy()
+  })
+
+  it('ensure() creates a sandbox and resumes it on a second run', async () => {
+    const def = defineSandbox({
+      id: 'lp-repo',
+      provider,
+      workspace: defineWorkspace({ source: { type: 'none' } }),
+    })
+    const ctx = { threadId: 't-lp', runId: 'r1' }
+    const first = await def.ensure(ctx)
+    await first.fs.write('/workspace/persist.txt', 'kept')
+
+    const second = await def.ensure({ ...ctx, runId: 'r2' }) // same thread, new run
+    // Durable filesystem + resume by id: the second run gets the same dir, so the file survives.
+    expect(second.id).toBe(first.id)
+    expect(await second.fs.read('/workspace/persist.txt')).toBe('kept')
+    await def.destroy(ctx)
+  })
+})
diff --git a/packages/ai-sandbox-local-process/tsconfig.json b/packages/ai-sandbox-local-process/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-sandbox-local-process/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-sandbox-local-process/vite.config.ts b/packages/ai-sandbox-local-process/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-sandbox-local-process/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+const config = defineConfig({ // Vitest settings for this package
+  test: {
+    name: packageJson.name, // test project is named after the package
+    dir: './',
+    watch: false,
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'], // only specs under tests/ are collected
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: [
+        'node_modules/',
+        'dist/',
+        'tests/',
+        '**/*.test.ts',
+        '**/*.config.ts',
+        '**/types.ts',
+      ],
+      include: ['src/**/*.ts'], // coverage is measured over src/ only
+    },
+  },
+})
+
+export default mergeConfig(
+  config, // the Vitest settings declared above
+  tanstackViteConfig({
+    entry: ['./src/index.ts'], // single library entry point
+    srcDir: './src',
+    cjs: false, // presumably ESM-only output, matching the import-only `exports` in package.json — confirm
+  }),
+)
diff --git a/packages/ai-sandbox-persistence/package.json b/packages/ai-sandbox-persistence/package.json
new file mode 100644
index 000000000..55d366c8e
--- /dev/null
+++ b/packages/ai-sandbox-persistence/package.json
@@ -0,0 +1,55 @@
+{
+  "name": "@tanstack/ai-sandbox-persistence",
+  "version": "0.1.0",
+  "description": "Bridge between @tanstack/ai-sandbox and the persistence layer — provides a durable SQL-backed SandboxStore and wires a durable LockStore into withSandbox, so sandbox resume + ensure-locking survive across processes (agent mode).",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-sandbox-persistence"
+  },
+  "keywords": [
+    "ai",
+    "tanstack",
+    "sandbox",
+    "persistence",
+    "bridge"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "peerDependencies": {
+    "@tanstack/ai": "workspace:^",
+    "@tanstack/ai-persistence": "workspace:^",
+    "@tanstack/ai-persistence-sql": "workspace:^",
+    "@tanstack/ai-sandbox": "workspace:^"
+  },
+  "devDependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@tanstack/ai-persistence": "workspace:*",
+    "@tanstack/ai-persistence-sql": "workspace:*",
+    "@tanstack/ai-sandbox": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-sandbox-persistence/src/index.ts b/packages/ai-sandbox-persistence/src/index.ts
new file mode 100644
index 000000000..263fe7e50
--- /dev/null
+++ b/packages/ai-sandbox-persistence/src/index.ts
@@ -0,0 +1,150 @@
+/**
+ * Bridge between the sandbox layer and persistence (agent mode).
+ *
+ * - {@link createSqlSandboxStore} — a durable, SQL-backed `SandboxStore` so the
+ *   sandbox `ensure` algorithm can resume the same provider sandbox across
+ *   processes (the in-memory default only resumes within one process).
+ * - {@link withPersistenceBridge} — middleware that provides the durable
+ *   `LockStore` (from a `ChatPersistence`) and/or a durable `SandboxStore` into
+ *   the capabilities `withSandbox` optionally requires. Ordered BETWEEN
+ *   `withPersistence` and `withSandbox`.
+ *
+ * This package depends on both sides so neither core package has to: persistence
+ * stays sandbox-free, and ai-sandbox doesn't force a SQL dependency.
+ */
+import {
+  LocksCapability,
+  defineChatMiddleware,
+  provideLocks,
+} from '@tanstack/ai'
+import {
+  SandboxStoreCapability,
+  provideSandboxStore,
+} from '@tanstack/ai-sandbox'
+import { param } from '@tanstack/ai-persistence-sql'
+import type { SqlDriver } from '@tanstack/ai-persistence-sql'
+import type { SandboxRecord, SandboxStore } from '@tanstack/ai-sandbox'
+import type { ChatMiddleware } from '@tanstack/ai'
+import type { ChatPersistence } from '@tanstack/ai-persistence'
+
+/**
+ * Durable, SQL-backed {@link SandboxStore}. Creates its table lazily on first
+ * use; if that creation fails, the next operation attempts it again.
+ *
+ * @param driver SQL driver used for every statement. Its `dialect` is passed
+ *   to `param` for placeholders and selects the `updated_at` column type.
+ */
+export function createSqlSandboxStore(driver: SqlDriver): SandboxStore {
+  const p = (i: number) => param(driver.dialect, i)
+  let ready: Promise<void> | undefined
+  // Create the table at most once per store. A failed attempt is forgotten so
+  // the next call retries instead of replaying the cached rejection forever.
+  const ensure = (): Promise<void> => {
+    ready ??= driver
+      .exec(
+        `CREATE TABLE IF NOT EXISTS sandbox_instances (
+        key TEXT PRIMARY KEY,
+        provider TEXT NOT NULL,
+        provider_sandbox_id TEXT NOT NULL,
+        latest_snapshot_id TEXT,
+        thread_id TEXT NOT NULL,
+        latest_run_id TEXT,
+        updated_at ${driver.dialect === 'postgres' ? 'BIGINT' : 'INTEGER'} NOT NULL
+      )`,
+      )
+      .catch((err: unknown) => {
+        ready = undefined
+        throw err
+      })
+    return ready
+  }
+
+  return {
+    async get(key) {
+      await ensure()
+      const rows = await driver.query(
+        `SELECT * FROM sandbox_instances WHERE key = ${p(1)}`,
+        [key],
+      )
+      const row = rows[0]
+      if (!row) return null
+      const record: SandboxRecord = {
+        key: String(row.key),
+        provider: String(row.provider),
+        providerSandboxId: String(row.provider_sandbox_id),
+        threadId: String(row.thread_id),
+        updatedAt: Number(row.updated_at),
+        ...(row.latest_snapshot_id != null
+          ? { latestSnapshotId: String(row.latest_snapshot_id) }
+          : {}),
+        ...(row.latest_run_id != null
+          ? { latestRunId: String(row.latest_run_id) }
+          : {}),
+      }
+      return record
+    },
+    async upsert(record) {
+      await ensure()
+      // Use `excluded.*` (not re-bound params) in the UPDATE so the statement
+      // works on BOTH sqlite (positional `?`, no reuse) and postgres.
+      await driver.exec(
+        `INSERT INTO sandbox_instances
+          (key, provider, provider_sandbox_id, latest_snapshot_id, thread_id, latest_run_id, updated_at)
+         VALUES (${p(1)}, ${p(2)}, ${p(3)}, ${p(4)}, ${p(5)}, ${p(6)}, ${p(7)})
+         ON CONFLICT (key) DO UPDATE SET
+          provider = excluded.provider,
+          provider_sandbox_id = excluded.provider_sandbox_id,
+          latest_snapshot_id = excluded.latest_snapshot_id,
+          thread_id = excluded.thread_id,
+          latest_run_id = excluded.latest_run_id,
+          updated_at = excluded.updated_at`,
+        [
+          record.key,
+          record.provider,
+          record.providerSandboxId,
+          record.latestSnapshotId ?? null,
+          record.threadId,
+          record.latestRunId ?? null,
+          record.updatedAt,
+        ],
+      )
+    },
+    async delete(key) {
+      await ensure()
+      await driver.exec(`DELETE FROM sandbox_instances WHERE key = ${p(1)}`, [
+        key,
+      ])
+    },
+  }
+}
+
+export interface PersistenceBridgeOptions {
+  /** Source of the durable `LockStore` (uses `persistence.locks` when present). */
+  persistence?: ChatPersistence
+  /** Durable sandbox store (e.g. {@link createSqlSandboxStore}). */
+  sandboxStore?: SandboxStore
+}
+
+/**
+ * Wire durable sandbox capabilities into the stack. Provides `LocksCapability`
+ * when the persistence aggregate carries a lock store, and `SandboxStoreCapability`
+ * when a durable sandbox store is supplied. Place after `withPersistence` and
+ * before `withSandbox`.
+ */
+export function withPersistenceBridge(
+  opts: PersistenceBridgeOptions,
+): ChatMiddleware {
+  const lock = opts.persistence?.locks
+  const provides = [
+    ...(lock ? [LocksCapability] : []),
+    ...(opts.sandboxStore ? [SandboxStoreCapability] : []),
+  ]
+  return defineChatMiddleware({
+    name: 'persistence-bridge',
+    provides,
+    setup(ctx) {
+      if (lock) provideLocks(ctx, lock)
+      if (opts.sandboxStore) provideSandboxStore(ctx, opts.sandboxStore)
+    },
+  })
+}
diff --git a/packages/ai-sandbox-persistence/tests/bridge.test.ts b/packages/ai-sandbox-persistence/tests/bridge.test.ts
new file mode 100644
index 000000000..9f96b8b07
--- /dev/null
+++ b/packages/ai-sandbox-persistence/tests/bridge.test.ts
@@ -0,0 +1,89 @@
+import { describe, expect, it } from 'vitest'
+import { DatabaseSync } from 'node:sqlite'
+import { getLocks, InMemoryLockStore } from '@tanstack/ai'
+import { getSandboxStore } from '@tanstack/ai-sandbox'
+import { memoryPersistence } from '@tanstack/ai-persistence'
+import type { SqlDriver, SqlRow } from '@tanstack/ai-persistence-sql'
+import { createSqlSandboxStore, withPersistenceBridge } from '../src/index'
+
+/** Minimal capability context (provide/get key their WeakMap by this object). */
+function fakeCtx() {
+  return { capabilities: { markProvided: () => {} } } // markProvided is stubbed as a no-op
+}
+
+function sqliteDriver(): SqlDriver { // SqlDriver test double over an in-memory node:sqlite database
+  const db = new DatabaseSync(':memory:')
+  const driver: SqlDriver = {
+    dialect: 'sqlite',
+    exec(sql, params = []) {
+      db.prepare(sql).run(...(params as Array<never>)) // synchronous call wrapped in a resolved promise below
+      return Promise.resolve()
+    },
+    query<T extends SqlRow = SqlRow>(
+      sql: string,
+      params: ReadonlyArray<unknown> = [],
+    ) {
+      return Promise.resolve(
+        db.prepare(sql).all(...(params as Array<never>)) as Array<T>,
+      )
+    },
+    transaction(fn) {
+      return fn(driver) // no BEGIN/COMMIT is issued; the callback just runs against the same driver
+    },
+  }
+  return driver
+}
+
+describe('createSqlSandboxStore', () => {
+  it('round-trips upsert / get / delete', async () => {
+    const store = createSqlSandboxStore(sqliteDriver())
+    expect(await store.get('k')).toBeNull() // first call also creates the table lazily
+    await store.upsert({
+      key: 'k',
+      provider: 'docker',
+      providerSandboxId: 'sb-1',
+      threadId: 't1',
+      latestRunId: 'r1',
+      updatedAt: 123,
+    })
+    const got = await store.get('k')
+    expect(got?.providerSandboxId).toBe('sb-1')
+    expect(got?.threadId).toBe('t1')
+    expect(got?.latestRunId).toBe('r1')
+
+    await store.upsert({ // same key again: exercises the ON CONFLICT update path
+      key: 'k',
+      provider: 'docker',
+      providerSandboxId: 'sb-2',
+      threadId: 't1',
+      updatedAt: 456,
+    })
+    expect((await store.get('k'))?.providerSandboxId).toBe('sb-2')
+
+    await store.delete('k')
+    expect(await store.get('k')).toBeNull()
+  })
+})
+
+describe('withPersistenceBridge', () => {
+  it('provides the durable LockStore and SandboxStore into the context', async () => {
+    const persistence = memoryPersistence()
+    const lock = new InMemoryLockStore()
+    persistence.locks = lock // the bridge reads `persistence.locks`
+    const sandboxStore = createSqlSandboxStore(sqliteDriver())
+
+    const mw = withPersistenceBridge({ persistence, sandboxStore })
+    const ctx = fakeCtx() as unknown as Parameters< // cast the stub to the setup() context type
+      NonNullable<typeof mw.setup>
+    >[0]
+    await mw.setup!(ctx)
+
+    expect(getLocks(ctx)).toBe(lock) // the very same instances are retrievable from ctx
+    expect(getSandboxStore(ctx)).toBe(sandboxStore)
+  })
+
+  it('declares only the capabilities it can provide', () => {
+    const mw = withPersistenceBridge({}) // neither a lock store nor a sandbox store supplied
+    expect(mw.provides ?? []).toEqual([])
+  })
+})
diff --git a/packages/ai-sandbox-persistence/tsconfig.json b/packages/ai-sandbox-persistence/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-sandbox-persistence/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-sandbox-persistence/vite.config.ts b/packages/ai-sandbox-persistence/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-sandbox-persistence/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+const config = defineConfig({
+  test: {
+    name: packageJson.name,
+    dir: './',
+    watch: false,
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: [
+        'node_modules/',
+        'dist/',
+        'tests/',
+        '**/*.test.ts',
+        '**/*.config.ts',
+        '**/types.ts',
+      ],
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+
+export default mergeConfig(
+  config,
+  tanstackViteConfig({
+    entry: ['./src/index.ts'],
+    srcDir: './src',
+    cjs: false,
+  }),
+)
diff --git a/packages/ai-sandbox/package.json b/packages/ai-sandbox/package.json
new file mode 100644
index 000000000..0c39788bd
--- /dev/null
+++ b/packages/ai-sandbox/package.json
@@ -0,0 +1,58 @@
+{
+  "name": "@tanstack/ai-sandbox",
+  "version": "0.1.0",
+  "description": "Provider-agnostic sandbox layer for TanStack AI — run harness adapters inside isolated sandboxes (defineSandbox, defineWorkspace, withSandbox) with a uniform SandboxHandle, workspace bootstrap, policy, and resumable lifecycle.",
+  "author": "",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/TanStack/ai.git",
+    "directory": "packages/ai-sandbox"
+  },
+  "keywords": [
+    "ai",
+    "ai-sdk",
+    "typescript",
+    "tanstack",
+    "sandbox",
+    "harness",
+    "agent",
+    "coding-agent",
+    "isolation",
+    "workspace"
+  ],
+  "type": "module",
+  "module": "./dist/esm/index.js",
+  "types": "./dist/esm/index.d.ts",
+  "exports": {
+    ".": {
+      "types": "./dist/esm/index.d.ts",
+      "import": "./dist/esm/index.js"
+    }
+  },
+  "files": [
+    "dist",
+    "src",
+    "skills"
+  ],
+  "scripts": {
+    "build": "vite build",
+    "clean": "premove ./build ./dist",
+    "lint:fix": "eslint ./src --fix",
+    "test:build": "publint --strict",
+    "test:eslint": "eslint ./src",
+    "test:lib": "vitest",
+    "test:lib:dev": "pnpm test:lib --watch",
+    "test:types": "tsc"
+  },
+  "dependencies": {
+    "@modelcontextprotocol/sdk": "^1.29.0"
+  },
+  "peerDependencies": {
+    "@tanstack/ai": "workspace:^"
+  },
+  "devDependencies": {
+    "@tanstack/ai": "workspace:*",
+    "@vitest/coverage-v8": "4.0.14"
+  }
+}
diff --git a/packages/ai-sandbox/skills/ai-sandbox/SKILL.md b/packages/ai-sandbox/skills/ai-sandbox/SKILL.md
new file mode 100644
index 000000000..348290fa3
--- /dev/null
+++ b/packages/ai-sandbox/skills/ai-sandbox/SKILL.md
@@ -0,0 +1,199 @@
+---
+name: ai-sandbox
+description: >
+  Run harness adapters (Claude Code) INSIDE isolated sandboxes via
+  defineSandbox + withSandbox + a provider (localProcessSandbox / dockerSandbox).
+  Covers defineWorkspace (git/setup/scripts/skills/secrets), defineSandboxPolicy
+  (allow/ask/deny), lifecycle/resume, the SandboxHandle (fs/git/process/ports),
+  capability tokens, defineSandbox hooks (onFile/onFileCreate/onFileChange/
+  onFileDelete/onReady/onError/onDestroy) + fileEvents flag, chat middleware
+  sandbox group (defineChatMiddleware sandbox hooks), the sandbox debug category,
+  watchWorkspace as a low-level building block, and the file.changed /
+  sandbox.file / claude-code.session-id events. Use whenever a harness adapter
+  needs a sandbox or when building sandbox providers.
+type: sub-skill
+library: tanstack-ai
+library_version: '0.1.0'
+sources:
+  - 'TanStack/ai:docs/sandbox/overview.md'
+---
+
+# Sandboxes
+
+Harness adapters declare `requires: [SandboxCapability]`. `chat()` errors unless
+some middleware provides it — `withSandbox(...)` does. The adapter then runs the
+agent CLI **inside** the sandbox and streams its events back.
+
+## Setup — Claude Code in a Docker sandbox
+
+```typescript
+import { chat } from '@tanstack/ai'
+import { claudeCodeText } from '@tanstack/ai-claude-code'
+import {
+  defineSandbox,
+  defineWorkspace,
+  withSandbox,
+} from '@tanstack/ai-sandbox'
+import { dockerSandbox } from '@tanstack/ai-sandbox-docker'
+
+const sandbox = defineSandbox({
+  id: 'repo-agent',
+  provider: dockerSandbox({ image: 'node:22' }),
+  workspace: defineWorkspace({
+    source: { type: 'git', url: 'https://github.com/owner/repo', ref: 'main' },
+    packageManager: 'pnpm',
+    setup: ['corepack enable', 'pnpm install'],
+    scripts: { test: 'pnpm test' },
+    secrets: { ANTHROPIC_API_KEY: process.env.ANTHROPIC_API_KEY ?? '' },
+  }),
+  lifecycle: { reuse: 'thread', snapshot: 'after-setup', keepAlive: '30m' },
+})
+
+const stream = chat({
+  threadId,
+  adapter: claudeCodeText('sonnet'),
+  messages,
+  middleware: [withSandbox(sandbox)],
+})
+```
+
+## Providers
+
+- `localProcessSandbox()` — runs on the host (no isolation; dev loop only).
+- `dockerSandbox({ image })` — isolated container; snapshots, fork, resume-by-id.
+
+Both implement the same `SandboxHandle`: `fs` (read/write/list/mkdir/remove/
+rename/exists), `git` (clone/status/add/commit/push/pull/branch), `process`
+(`exec` + duplex `spawn`), `ports.connect(port)`, `env.set`, optional
+`snapshot()`/`fork()`, `destroy()`. Providers advertise support via
+`capabilities()`; calling an unsupported optional method throws
+`UnsupportedCapabilityError`.
+
+## Policy
+
+```typescript
+import { defineSandboxPolicy } from '@tanstack/ai-sandbox'
+
+const policy = defineSandboxPolicy({
+  commands: {
+    allow: ['pnpm test'],
+    ask: ['curl *'],
+    deny: ['sudo *', 'rm -rf *'],
+  },
+  capabilities: { fileWrite: 'allow', network: 'ask' },
+  default: 'ask', // deny > ask > allow
+})
+// pass to defineSandbox({ policy }); harness adapters map it to native permissions
+```
+
+## Lifecycle & resume
+
+`reuse: 'thread'` resumes one sandbox per `threadId`; the compound key folds in
+provider + workspace hash + tenant so changing the repo/setup/image starts
+fresh. Ensure order: resume running → restore snapshot → create + bootstrap.
+
+## File-event hooks
+
+Watch the workspace for create/change/delete events. Provider-agnostic: native
+`fs.watch` on local-process, a portable `find` poll on Docker/exec-only
+providers (no extra deps or image changes).
+
+Declare hooks on `defineSandbox({ hooks })` (sandbox-scoped) or on any chat
+middleware via the `sandbox` group (run-scoped):
+
+```typescript
+import {
+  defineSandbox,
+  defineChatMiddleware,
+  withSandbox,
+} from '@tanstack/ai-sandbox'
+import { dockerSandbox } from '@tanstack/ai-sandbox-docker'
+
+// Sandbox-scoped hooks (all optional):
+const sandbox = defineSandbox({
+  id: 'repo-agent',
+  provider: dockerSandbox({ image: 'node:22' }),
+  hooks: {
+    onFile: (e) => console.log(e.type, e.path), // catch-all
+    onFileCreate: (e) => console.log('created', e.path),
+    onFileChange: (e) => console.log('changed', e.path),
+    onFileDelete: (e) => console.log('deleted', e.path),
+    onReady: (handle) => console.log('ready', handle.id),
+    onError: (err) => console.error(err),
+    onDestroy: () => console.log('destroyed'),
+  },
+  fileEvents: true, // default; set false to disable watching entirely
+})
+
+// Run-scoped hooks via chat middleware (ctx is ChatMiddlewareContext):
+const auditMiddleware = defineChatMiddleware({
+  name: 'audit',
+  sandbox: {
+    onFile: (ctx, e) => console.log(ctx.runId, e.type, e.path),
+    onFileCreate: (ctx, e) => db.log({ run: ctx.runId, event: e }),
+    onFileChange: (ctx, e) => metrics.increment('file.change'),
+    onFileDelete: (ctx, e) => console.warn('deleted', e.path),
+  },
+})
+
+// No extra middleware needed — sandbox.file CUSTOM events are emitted
+// automatically. Read them from the stream:
+for await (const chunk of stream) {
+  if (chunk.type === 'CUSTOM' && chunk.name === 'sandbox.file') {
+    const value = chunk.value
+    if (
+      value !== null &&
+      typeof value === 'object' &&
+      'type' in value &&
+      'path' in value
+    ) {
+      console.log('file event', value) // { type, path, timestamp }
+    }
+  }
+}
+```
+
+`watchWorkspace()` is available as a low-level building block for watching
+outside a `chat()` run:
+
+```typescript
+import { watchWorkspace } from '@tanstack/ai-sandbox'
+
+const watcher = await watchWorkspace(handle, {
+  onEvent: (e) => console.log(e.type, e.path),
+  ignore: ['.git', 'node_modules'], // default
+})
+await watcher.stop()
+```
+
+Enable the `sandbox` debug category to log watcher start/stop, event dispatch,
+and lifecycle transitions:
+
+```typescript
+chat({ threadId, adapter, messages, debug: { sandbox: true } })
+// or debug: true to enable all categories
+```
+
+## Events
+
+- `claude-code.session-id` (CUSTOM) — resumable session id → pass back via
+  `modelOptions.sessionId`.
+- `file.changed` (CUSTOM) — `{ path, diff }` working-tree diff after the run.
+- `sandbox.file` (CUSTOM) — `{ type, path, timestamp }` per file create/change/
+  delete, emitted automatically when a sandbox is active.
+
+## Critical rules
+
+- **Harness adapters require a sandbox.** Always include `withSandbox(...)` in
+  `middleware` — without it `chat()` throws a missing-capability error.
+- **Secrets** (`workspace.secrets`, e.g. `ANTHROPIC_API_KEY`) are injected into
+  the sandbox env and never persisted. The agent binary (`claude`) must exist in
+  the sandbox image (install it in `setup` or bake it into the image).
+- **chat()-provided `tools` are bridged** into the in-sandbox agent over a
+  host-side MCP tool-proxy: the agent calls them as `mcp__tanstack__<tool>` and
+  each call is proxied back to the host where the tool's `execute()` runs (with
+  its closures / DB / secrets). The agent also has its own native tools
+  (Bash/Edit/Read/…). The host bridge binds on the host; the sandbox reaches it
+  (localhost, or `host.docker.internal` for Docker), gated by a per-run bearer
+  token.
+- Use `localProcessSandbox()` only in trusted/dev contexts (no isolation).
diff --git a/packages/ai-sandbox/src/approvals.ts b/packages/ai-sandbox/src/approvals.ts
new file mode 100644
index 000000000..b1c6cac7f
--- /dev/null
+++ b/packages/ai-sandbox/src/approvals.ts
@@ -0,0 +1,94 @@
+/**
+ * Shared interactive-approval logic for harness adapters.
+ *
+ * Flow (rides chat()'s existing resume-based approval mechanism):
+ *  1. The agent (inside the sandbox) asks to run a risky action; the harness's
+ *     host-side permission callback fires.
+ *  2. `resolveApproval` evaluates the sandbox policy: `allow`/`deny` are final;
+ *     `ask` consults the client's approval decisions (threaded via
+ *     `TextOptions.approvals`, keyed by a stable `approvalId`).
+ *  3. On `ask` with no decision yet, the adapter emits an `approval-requested`
+ *     CUSTOM event (carrying the `approvalId`) and denies the action this turn.
+ *     The client shows UI, then re-runs chat() with the decision in the message;
+ *     the engine surfaces it as `approvals`, and the next run allows it.
+ *
+ * `approvalId` is stable for a given (provider, kind, target) so a client grant
+ * matches the same action on the resumed run.
+ */
+import { EventType } from '@tanstack/ai'
+import { evaluateCommand } from './policy'
+import type { SandboxPolicy } from './policy'
+import type { StreamChunk } from '@tanstack/ai'
+
+/** CUSTOM event name emitted when a harness action needs client approval. */
+export const APPROVAL_REQUESTED_EVENT = 'approval-requested'
+
+/** A stable, opaque approval id for a harness action. */
+export function approvalId(input: {
+  provider: string
+  kind: 'command' | 'fileWrite' | 'network' | 'tool'
+  target: string
+}): string {
+  return `${input.provider}:${input.kind}:${input.target}`
+}
+
+export interface ResolveApprovalInput {
+  policy: SandboxPolicy | undefined
+  /** Client approval decisions, keyed by `approvalId`. */
+  approvals: ReadonlyMap<string, boolean> | undefined
+  /** Precomputed approval id for this action. */
+  id: string
+  /** A shell command to match against `policy.commands`. */
+  command?: string
+  /** A coarse capability to match against `policy.capabilities`. */
+  capability?: 'fileWrite' | 'network'
+}
+
+export interface ApprovalOutcome {
+  decision: 'allow' | 'deny'
+  /** True when policy said `ask` and the client hasn't decided yet. */
+  needsApproval: boolean
+}
+
+/** Settle a harness permission request from policy first, then client approvals. */
+export function resolveApproval(input: ResolveApprovalInput): ApprovalOutcome {
+  const { policy, approvals, id, command, capability } = input
+  const fromCapability =
+    capability === undefined ? undefined : policy?.capabilities?.[capability]
+  const verdict =
+    command === undefined
+      ? (fromCapability ?? policy?.default ?? 'ask')
+      : evaluateCommand(command, policy)
+  if (verdict === 'allow' || verdict === 'deny') {
+    return { decision: verdict, needsApproval: false }
+  }
+
+  // Policy verdict is `ask`: defer to the client's recorded decision, if any.
+  const granted = approvals?.get(id)
+  if (typeof granted === 'boolean') {
+    return { decision: granted ? 'allow' : 'deny', needsApproval: false }
+  }
+  return { decision: 'deny', needsApproval: true }
+}
+
+/**
+ * Build the AG-UI `approval-requested` CUSTOM event for a harness action.
+ * `detail` is spread first so it can never clobber `approvalId` / `title`.
+ */
+export function buildApprovalRequestedEvent(input: {
+  approvalId: string
+  title: string
+  threadId: string
+  runId: string
+  detail?: Record<string, unknown>
+}): StreamChunk {
+  const { approvalId: id, title, threadId, runId, detail } = input
+  return {
+    type: EventType.CUSTOM,
+    name: APPROVAL_REQUESTED_EVENT,
+    value: { ...detail, approvalId: id, title },
+    timestamp: Date.now(),
+    threadId,
+    runId,
+  }
+}
diff --git a/packages/ai-sandbox/src/bootstrap.ts b/packages/ai-sandbox/src/bootstrap.ts
new file mode 100644
index 000000000..86e3875b4
--- /dev/null
+++ b/packages/ai-sandbox/src/bootstrap.ts
@@ -0,0 +1,86 @@
+/**
+ * Workspace bootstrap engine — provider-agnostic because it only uses the
+ * {@link SandboxHandle} contract. Runs once when a sandbox is freshly created
+ * (or restored without its working tree): land the source, inject secrets,
+ * detect the package manager, and run setup commands.
+ *
+ * Harness-specific projection (CLAUDE.md, agent skills, MCP config) is NOT done
+ * here — that's each adapter's `projectWorkspace()` hook, since the format
+ * differs per harness.
+ */
+import type { SandboxHandle } from './contracts'
+import type { PackageManager, WorkspaceDefinition } from './workspace'
+
+// Lockfile → package manager, probed in order (first match wins).
+const LOCKFILES: Array<[Exclude<PackageManager, 'auto'>, string]> = [
+  ['pnpm', 'pnpm-lock.yaml'],
+  ['yarn', 'yarn.lock'],
+  ['bun', 'bun.lockb'],
+  ['bun', 'bun.lock'], // text lockfile, the default since Bun 1.2
+  ['npm', 'package-lock.json'],
+]
+
+export const DEFAULT_WORKSPACE_ROOT = '/workspace'
+
+/** Resolve the package manager, detecting from a lockfile when `'auto'`. */
+export async function detectPackageManager(
+  handle: SandboxHandle,
+  workspace: WorkspaceDefinition,
+  root: string,
+): Promise<Exclude<PackageManager, 'auto'> | undefined> {
+  const pm = workspace.packageManager ?? 'auto'
+  if (pm !== 'auto') return pm
+  for (const [manager, lockfile] of LOCKFILES) {
+    if (await handle.fs.exists(`${root}/${lockfile}`)) return manager
+  }
+  return undefined
+}
+
+export interface BootstrapResult {
+  packageManager?: Exclude<PackageManager, 'auto'>
+  ranSetup: Array<string>
+}
+
+/**
+ * Bootstrap a freshly created sandbox's workspace: inject secrets, land the
+ * source, detect the package manager, then run the setup commands in order.
+ * Safe to re-run on restore — the clone is skipped when `<root>/.git` exists.
+ * @throws Error if a setup command exits non-zero; later commands are not run.
+ */
+export async function bootstrapWorkspace(
+  handle: SandboxHandle,
+  workspace: WorkspaceDefinition,
+  options: { signal?: AbortSignal } = {},
+): Promise<BootstrapResult> {
+  const root = workspace.root ?? DEFAULT_WORKSPACE_ROOT
+
+  // Secrets live only in the running sandbox env (never persisted).
+  if (workspace.secrets && Object.keys(workspace.secrets).length > 0) {
+    await handle.env.set(workspace.secrets)
+  }
+
+  // Land the source. Clone into the handle's own default root (each provider
+  // maps the conventional `/workspace` virtual root to its real backing dir),
+  // rather than passing a virtual `dir` that can't be remapped inside a shell
+  // command string. 'local' is provider-pre-populated; 'none' starts empty.
+  const { source } = workspace
+  if (source.type === 'git' && !(await handle.fs.exists(`${root}/.git`))) {
+    const { url, ref, auth } = source
+    await handle.git.clone({ url, ref, auth })
+  }
+
+  const packageManager = await detectPackageManager(handle, workspace, root)
+  const ranSetup: Array<string> = []
+  for (const command of workspace.setup ?? []) {
+    const execOptions = { cwd: root, signal: options.signal }
+    const result = await handle.process.exec(command, execOptions)
+    if (result.exitCode !== 0) {
+      throw new Error(
+        `Workspace setup command "${command}" failed (exit code ${result.exitCode}): ${result.stderr.trim()}`,
+      )
+    }
+    ranSetup.push(command)
+  }
+
+  return { packageManager, ranSetup }
+}
diff --git a/packages/ai-sandbox/src/capabilities.ts b/packages/ai-sandbox/src/capabilities.ts
new file mode 100644
index 000000000..dc815a659
--- /dev/null
+++ b/packages/ai-sandbox/src/capabilities.ts
@@ -0,0 +1,45 @@
+/**
+ * Capability tokens the sandbox layer provides/consumes through the
+ * `@tanstack/ai` middleware capability system.
+ *
+ * - `SandboxCapability` is PROVIDED by `withSandbox` and REQUIRED by harness
+ *   adapters (`requires: [SandboxCapability]`).
+ * - `SandboxStoreCapability` / `LocksCapability` are OPTIONALLY required by
+ *   `withSandbox`. v1 falls back to in-memory defaults; durable implementations
+ *   are PROVIDED by persistence middleware (e.g. `withPersistenceBridge`).
+ */
+import {
+  LocksCapability,
+  createCapability,
+  getLocks,
+  provideLocks,
+} from '@tanstack/ai'
+import type { SandboxHandle } from './contracts'
+import type { SandboxStore } from './store'
+import type { SandboxPolicy } from './policy'
+
+export const SandboxCapability = createCapability<SandboxHandle>()('sandbox')
+
+export const SandboxStoreCapability =
+  createCapability<SandboxStore>()('sandbox-store')
+
+/**
+ * The lock capability now lives in core (`@tanstack/ai`) so there is exactly
+ * ONE global `'locks'` token shared by `withSandbox` (optional require) and
+ * `withPersistence` (durable provider). Re-exported here for back-compat so
+ * existing `@tanstack/ai-sandbox` imports keep working.
+ */
+export { LocksCapability, getLocks, provideLocks }
+
+/**
+ * The active sandbox policy, provided by `withSandbox` from the definition.
+ * Harness adapters read it to map allow/ask/deny rules onto their native
+ * permission system.
+ */
+export const SandboxPolicyCapability =
+  createCapability<SandboxPolicy>()('sandbox-policy')
+
+/** Destructured accessors for adapters: `getSandbox(ctx)` reads the handle. */
+export const [getSandbox, provideSandbox] = SandboxCapability
+export const [getSandboxStore, provideSandboxStore] = SandboxStoreCapability
+export const [getSandboxPolicy, provideSandboxPolicy] = SandboxPolicyCapability
diff --git a/packages/ai-sandbox/src/contracts.ts b/packages/ai-sandbox/src/contracts.ts
new file mode 100644
index 000000000..1e25b4cb5
--- /dev/null
+++ b/packages/ai-sandbox/src/contracts.ts
@@ -0,0 +1,212 @@
+/**
+ * Provider-agnostic sandbox contracts.
+ *
+ * A {@link SandboxProvider} owns an isolation primitive (Docker container,
+ * Cloudflare DO-backed container, a local OS process tree, …) and knows how to
+ * create / resume / restore / destroy a {@link SandboxHandle}. A
+ * `SandboxHandle` is the uniform runtime surface every consumer (harness
+ * adapters, the workspace bootstrap engine, advanced users) codes against.
+ *
+ * Providers differ in what they can do — see {@link SandboxCapabilities}. The
+ * mandatory `fs` and `exec` capabilities are guaranteed by the contract;
+ * everything else is optional and capability-gated. Calling an unsupported
+ * optional method throws {@link UnsupportedCapabilityError} rather than
+ * silently no-opping.
+ */
+import type { WorkspaceDefinition } from './workspace'
+import type { SandboxPolicy } from './policy'
+
+/** Static description of what a provider supports. */
+export interface SandboxCapabilities {
+  /** Read/write/list/… via {@link SandboxFs}. Always true (mandatory). */
+  fs: boolean
+  /** Blocking command execution via {@link SandboxProcess.exec}. Always true (mandatory). */
+  exec: boolean
+  /** Per-create / per-command environment variables. */
+  env: boolean
+  /** Expose a port and resolve a reachable channel via {@link SandboxPorts}. */
+  ports: boolean
+  /** Long-running/background processes via {@link SandboxProcess.spawn}. */
+  backgroundProcesses: boolean
+  /** Capture/restore filesystem snapshots via {@link SandboxHandle.snapshot}. */
+  snapshots: boolean
+  /** Declarative network egress allow/deny policy. */
+  networkPolicy: boolean
+  /** Filesystem persists across sandbox stop/restart without a snapshot. */
+  durableFilesystem: boolean
+  /** Branch a new sandbox from current state via {@link SandboxHandle.fork}. */
+  fork: boolean
+}
+
+/** Result of a blocking command. */
+export interface ExecResult {
+  stdout: string
+  stderr: string
+  exitCode: number
+}
+
+/** Options for {@link SandboxProcess.exec} / {@link SandboxProcess.spawn}. */
+export interface ProcessOptions {
+  /** Working directory inside the sandbox. Defaults to the workspace root. */
+  cwd?: string
+  /** Per-command environment variables, merged over the sandbox env. */
+  env?: Record<string, string>
+  /** Abort the command/process when this signal fires. */
+  signal?: AbortSignal
+}
+
+/**
+ * A live background process. `stdout`/`stderr` are async-iterables of decoded
+ * chunks; `stdin.write` feeds the process (duplex — required for ACP harness
+ * protocols such as Codex / Gemini CLI). There is intentionally NO
+ * reconnect-to-a-running-process in v1 — that belongs to the durable-stream /
+ * persistence layer.
+ */
+export interface SpawnHandle {
+  readonly pid: number
+  readonly stdout: AsyncIterable<string>
+  readonly stderr: AsyncIterable<string>
+  readonly stdin: {
+    write: (data: string) => Promise<void>
+    end: () => Promise<void>
+  }
+  /** Resolves with the exit code when the process exits. */
+  wait: () => Promise<number>
+  kill: (signal?: NodeJS.Signals | number) => Promise<void>
+}
+
+export interface SandboxProcess {
+  /** Run a command to completion and capture stdout/stderr/exit code. */
+  exec: (command: string, options?: ProcessOptions) => Promise<ExecResult>
+  /** Start a long-running/background process with streamable, duplex IO. */
+  spawn: (command: string, options?: ProcessOptions) => Promise<SpawnHandle>
+}
+
+/** Common, portable filesystem operations every provider implements. */
+export interface SandboxFs {
+  read: (path: string) => Promise<string>
+  readBytes: (path: string) => Promise<Uint8Array>
+  write: (path: string, data: string | Uint8Array) => Promise<void>
+  list: (
+    path: string,
+  ) => Promise<Array<{ name: string; path: string; type: 'file' | 'dir' }>>
+  mkdir: (path: string) => Promise<void>
+  remove: (path: string) => Promise<void>
+  rename: (from: string, to: string) => Promise<void>
+  exists: (path: string) => Promise<boolean>
+  /** Optional — no capability flag covers it; check `watch` is defined before calling. */
+  watch?: (
+    path: string,
+    onEvent: (event: { type: string; path: string }) => void,
+  ) => Promise<{ stop: () => Promise<void> }>
+}
+
+/**
+ * Uniform git surface. Implementations either delegate to the provider's
+ * native git (when advertised) or desugar to `process.exec("git …")`, so the
+ * contract is identical across providers.
+ */
+export interface SandboxGit {
+  clone: (input: {
+    url: string
+    dir?: string
+    ref?: string
+    auth?: { username?: string; token: string }
+  }) => Promise<void>
+  status: (dir?: string) => Promise<string>
+  add: (paths: Array<string>, dir?: string) => Promise<void>
+  commit: (message: string, dir?: string) => Promise<void>
+  push: (dir?: string) => Promise<void>
+  pull: (dir?: string) => Promise<void>
+  /** Returns the current branch name. */
+  branch: (dir?: string) => Promise<string>
+}
+
+/** A reachable channel to a port inside the sandbox. */
+export interface SandboxChannel {
+  /** URL the host can reach (localhost / host-bound port / authenticated preview URL). */
+  url: string
+  /** Bearer token gating the channel, when the provider issues one. */
+  token?: string
+}
+
+export interface SandboxPorts {
+  /** Expose `port` and resolve the best reachable channel for the host. */
+  connect: (port: number) => Promise<SandboxChannel>
+}
+
+export interface SandboxEnv {
+  set: (vars: Record<string, string>) => Promise<void>
+}
+
+/** Opaque reference to a stored snapshot, used to restore later. */
+export interface SnapshotRef {
+  id: string
+  label?: string
+}
+
+/** The uniform runtime surface a sandbox exposes. */
+export interface SandboxHandle {
+  /** Provider-assigned id used to reconnect to this sandbox. */
+  readonly id: string
+  /** Provider name (e.g. "docker", "cloudflare", "local-process"). */
+  readonly provider: string
+  /** What this sandbox can do. */
+  readonly capabilities: SandboxCapabilities
+  readonly fs: SandboxFs
+  readonly git: SandboxGit
+  readonly process: SandboxProcess
+  readonly ports: SandboxPorts
+  readonly env: SandboxEnv
+  /** Capability-gated: throws UnsupportedCapabilityError if `capabilities.snapshots` is false. */
+  snapshot?: (label?: string) => Promise<SnapshotRef>
+  /** Capability-gated: throws UnsupportedCapabilityError if `capabilities.fork` is false. */
+  fork?: () => Promise<SandboxHandle>
+  destroy: () => Promise<void>
+}
+
+/** Input passed to {@link SandboxProvider.create}. */
+export interface SandboxCreateInput {
+  workspace?: WorkspaceDefinition
+  policy?: SandboxPolicy
+  env?: Record<string, string>
+  signal?: AbortSignal
+}
+
+/** Input passed to {@link SandboxProvider.resume}. */
+export interface SandboxResumeInput {
+  /** Provider-assigned sandbox id recorded by a prior run. */
+  id: string
+  signal?: AbortSignal
+}
+
+/** Input passed to {@link SandboxProvider.restoreSnapshot}. */
+export interface SandboxRestoreInput {
+  snapshotId: string
+  workspace?: WorkspaceDefinition
+  policy?: SandboxPolicy
+  env?: Record<string, string>
+  signal?: AbortSignal
+}
+
+/** Input passed to {@link SandboxProvider.destroy}. */
+export interface SandboxDestroyInput {
+  id: string
+  signal?: AbortSignal
+}
+
+/**
+ * Owns an isolation primitive. Implemented by `@tanstack/ai-sandbox-*`
+ * provider packages.
+ */
+export interface SandboxProvider {
+  readonly name: string
+  /** Static capability descriptor. */
+  capabilities: () => SandboxCapabilities
+  create: (input: SandboxCreateInput) => Promise<SandboxHandle>
+  /** Reconnect to an existing sandbox by id; resolves null if it's gone. */
+  resume: (input: SandboxResumeInput) => Promise<SandboxHandle | null>
+  /** Capability-gated: present only when `capabilities().snapshots` is true. */
+  restoreSnapshot?: (input: SandboxRestoreInput) => Promise<SandboxHandle>
+  destroy: (input: SandboxDestroyInput) => Promise<void>
+}
diff --git a/packages/ai-sandbox/src/errors.ts b/packages/ai-sandbox/src/errors.ts
new file mode 100644
index 000000000..40a33b2d7
--- /dev/null
+++ b/packages/ai-sandbox/src/errors.ts
@@ -0,0 +1,31 @@
+/**
+ * Raised when an optional sandbox capability is invoked on a provider that
+ * lacks it. Callers are expected to consult `handle.capabilities` first and
+ * degrade gracefully; a direct call fails loud rather than silently no-opping.
+ */
+export class UnsupportedCapabilityError extends Error {
+  readonly provider: string
+  readonly capability: string
+
+  constructor(provider: string, capability: string, hint?: string) {
+    super(
+      [
+        `Sandbox provider "${provider}" does not support the "${capability}" capability.`,
+        ...(hint ? [hint] : []),
+      ].join(' '),
+    )
+    this.name = 'UnsupportedCapabilityError'
+    this.provider = provider
+    this.capability = capability
+  }
+}
+
+/** Thrown when a harness adapter requires a sandbox but none was provided. */
+export class MissingSandboxError extends Error {
+  constructor(adapterName: string) {
+    super(
+      `Adapter "${adapterName}" requires a sandbox. Add withSandbox(defineSandbox({ ... })) to chat() middleware.`,
+    )
+    this.name = 'MissingSandboxError'
+  }
+}
diff --git a/packages/ai-sandbox/src/git-exec.ts b/packages/ai-sandbox/src/git-exec.ts
new file mode 100644
index 000000000..8820cdbe6
--- /dev/null
+++ b/packages/ai-sandbox/src/git-exec.ts
@@ -0,0 +1,98 @@
+/**
+ * An exec-backed {@link SandboxGit} implementation. Providers without a native
+ * git API (local-process, Docker) get a uniform `sandbox.git` by desugaring to
+ * `process.exec("git …")`. Providers WITH native git (Daytona, Cloudflare) may
+ * supply their own implementation instead.
+ *
+ * Security:
+ * - Every interpolated value is single-quote escaped (no shell injection).
+ * - A `--` end-of-options separator precedes untrusted positionals and values
+ *   are rejected if they begin with `-`, so a repo URL / ref / path can't
+ *   smuggle a git flag (e.g. `--upload-pack=…`).
+ * - Auth tokens NEVER appear in argv (they'd leak via `ps` / process logs).
+ *   Instead a one-shot `credential.helper` reads the token from the child
+ *   process ENV. The helper string is single-quoted so the OUTER shell never
+ *   expands the env var — only git's own helper subshell does, at use time.
+ *
+ * NOTE: `SandboxProcess.exec` takes a command STRING by design (the sandbox
+ * runs shell commands), so we mitigate flag smuggling with `--` + validation
+ * rather than an argv array.
+ */
+import type { SandboxGit, SandboxProcess } from './contracts'
+
+/** POSIX-shell quoting: wrap in '…', rewriting each embedded ' as '\''. */
+function q(value: string): string {
+  return `'${value.split("'").join("'\\''")}'`
+}
+
+/** Guard a positional argument against being parsed by git as an option. */
+function assertNoLeadingDash(value: string, name: string): void {
+  if (!value.startsWith('-')) return
+  // A leading dash would let the value smuggle a flag such as `--upload-pack=…`.
+  throw new Error(
+    `git-exec: ${name} "${value}" must not begin with "-" (argument-injection guard).`,
+  )
+}
+
+// Credential helper that prints creds read from the child ENV. Single-quoted at
+// the call site so the outer shell passes it literally; git expands the vars in
+// its own helper subshell, keeping the token out of argv.
+const CREDENTIAL_HELPER =
+  '!f() { echo "username=${GIT_ASKPASS_USER}"; echo "password=${GIT_ASKPASS_TOKEN}"; }; f'
+
+/** Build a {@link SandboxGit} that shells out to `git` via `process.exec`. */
+export function createExecBackedGit(
+  process: SandboxProcess,
+  defaultRoot: string,
+): SandboxGit {
+  const at = (dir?: string): string => {
+    const resolved = dir ?? defaultRoot
+    assertNoLeadingDash(resolved, 'dir')
+    return q(resolved)
+  }
+  // Run `git -C <dir> <args>`; `args` must already be quoted by the caller.
+  const inRepo = (dir: string | undefined, args: string) =>
+    process.exec(`git -C ${at(dir)} ${args}`)
+
+  return {
+    clone: async ({ url, dir, ref, auth }) => {
+      assertNoLeadingDash(url, 'url')
+      const target = dir ?? defaultRoot
+      assertNoLeadingDash(target, 'dir')
+      if (ref !== undefined) assertNoLeadingDash(ref, 'ref')
+      const branchFlag = ref ? `--branch ${q(ref)} ` : ''
+      const cloneArgs = `clone ${branchFlag}-- ${q(url)} ${q(target)}`
+      if (!auth?.token) {
+        await process.exec(`git ${cloneArgs}`)
+        return
+      }
+      // Token lives only in the child env, never in argv.
+      await process.exec(
+        `git -c credential.helper=${q(CREDENTIAL_HELPER)} ${cloneArgs}`,
+        {
+          env: {
+            GIT_ASKPASS_USER: auth.username ?? 'x-access-token',
+            GIT_ASKPASS_TOKEN: auth.token,
+            GIT_TERMINAL_PROMPT: '0',
+          },
+        },
+      )
+    },
+    status: async (dir) => (await inRepo(dir, 'status --porcelain')).stdout,
+    add: async (paths, dir) => {
+      paths.forEach((p, i) => assertNoLeadingDash(p, `path[${i}]`))
+      await inRepo(dir, `add -- ${paths.map(q).join(' ')}`)
+    },
+    commit: async (message, dir) => {
+      await inRepo(dir, `commit -m ${q(message)}`)
+    },
+    push: async (dir) => {
+      await inRepo(dir, 'push')
+    },
+    pull: async (dir) => {
+      await inRepo(dir, 'pull')
+    },
+    branch: async (dir) =>
+      (await inRepo(dir, 'rev-parse --abbrev-ref HEAD')).stdout.trim(),
+  }
+}
diff --git a/packages/ai-sandbox/src/index.ts b/packages/ai-sandbox/src/index.ts
new file mode 100644
index 000000000..156bc9f4f
--- /dev/null
+++ b/packages/ai-sandbox/src/index.ts
@@ -0,0 +1,134 @@
+// Capability tokens + accessors
+export {
+  SandboxCapability,
+  SandboxStoreCapability,
+  LocksCapability,
+  SandboxPolicyCapability,
+  getSandbox,
+  provideSandbox,
+  getSandboxStore,
+  provideSandboxStore,
+  getLocks,
+  provideLocks,
+  getSandboxPolicy,
+  provideSandboxPolicy,
+} from './capabilities'
+
+// Middleware
+export { withSandbox } from './middleware'
+
+// Sandbox definition + lifecycle
+export { defineSandbox } from './sandbox'
+export type {
+  SandboxConfig,
+  SandboxDefinition,
+  SandboxEnsureContext,
+  SandboxLifecycle,
+  SandboxHooks,
+  ReuseStrategy,
+  SnapshotStrategy,
+} from './sandbox'
+
+// Workspace
+export {
+  defineWorkspace,
+  gitSource,
+  githubRepo,
+  localSource,
+  fileSkill,
+  agentSkill,
+  mcpSkill,
+} from './workspace'
+export type {
+  WorkspaceDefinition,
+  WorkspaceSource,
+  WorkspaceSkill,
+  PackageManager,
+} from './workspace'
+
+// Policy
+export { defineSandboxPolicy, evaluateCommand } from './policy'
+export type {
+  SandboxPolicy,
+  PolicyDecision,
+  CommandRules,
+  CapabilityRules,
+} from './policy'
+
+// Provider + handle contracts
+export type {
+  SandboxProvider,
+  SandboxHandle,
+  SandboxCapabilities,
+  SandboxFs,
+  SandboxGit,
+  SandboxProcess,
+  SandboxPorts,
+  SandboxEnv,
+  SandboxChannel,
+  SpawnHandle,
+  ExecResult,
+  ProcessOptions,
+  SnapshotRef,
+  SandboxCreateInput,
+  SandboxResumeInput,
+  SandboxRestoreInput,
+  SandboxDestroyInput,
+} from './contracts'
+
+// Stores (interfaces + in-memory defaults)
+export { InMemorySandboxStore, InMemoryLockStore } from './store'
+export type { SandboxStore, LockStore, SandboxRecord } from './store'
+
+// Bootstrap engine (exported for provider/adapter authors + tests)
+export {
+  bootstrapWorkspace,
+  detectPackageManager,
+  DEFAULT_WORKSPACE_ROOT,
+} from './bootstrap'
+export type { BootstrapResult } from './bootstrap'
+
+// Exec-backed git helper (for providers without native git)
+export { createExecBackedGit } from './git-exec'
+
+// Harness runner: spawn an agent CLI in a sandbox + stream NDJSON stdout
+export { spawnNdjson, toLines } from './runner'
+export type { SpawnNdjsonOptions } from './runner'
+
+// Host-side MCP tool-proxy bridge (shared by harness adapters)
+export {
+  startHostToolBridge,
+  hostForSandbox,
+  BRIDGED_MCP_SERVER_NAME,
+} from './tool-bridge'
+export type {
+  HostToolBridge,
+  StartBridgeOptions,
+  PermissionToolResult,
+} from './tool-bridge'
+
+// Interactive approvals (shared by harness adapters)
+export {
+  resolveApproval,
+  approvalId,
+  buildApprovalRequestedEvent,
+  APPROVAL_REQUESTED_EVENT,
+} from './approvals'
+export type { ResolveApprovalInput, ApprovalOutcome } from './approvals'
+
+// File-event watch (low-level workspace observer)
+export { watchWorkspace, diffSnapshots } from './watch'
+export type {
+  SandboxFileEvent,
+  FileEvent,
+  FileEventType,
+  WatchOptions,
+  SandboxWatchHandle,
+} from './watch'
+
+// Keying
+export { computeSandboxKey, computeWorkspaceHash } from './key'
+export type { SandboxKeyInput } from './key'
+
+// Errors
+export { UnsupportedCapabilityError, MissingSandboxError } from './errors'
diff --git a/packages/ai-sandbox/src/key.ts b/packages/ai-sandbox/src/key.ts
new file mode 100644
index 000000000..4cba73526
--- /dev/null
+++ b/packages/ai-sandbox/src/key.ts
@@ -0,0 +1,70 @@
+/**
+ * Compound sandbox identity. We never key a resumable sandbox on `threadId`
+ * alone — that would resume the WRONG environment when the provider,
+ * workspace, image, or tenant changes. The key folds all of those in, so any
+ * change busts the sandbox and forces a fresh create+bootstrap (safe default).
+ */
+import type { WorkspaceDefinition } from './workspace'
+
+/** Inputs that, together, identify one resumable sandbox instance. */
+export interface SandboxKeyInput {
+  threadId: string
+  sandboxId: string
+  providerName: string
+  workspace?: WorkspaceDefinition // hashed via computeWorkspaceHash (no secrets)
+  /** Optional tenant scoping pulled from runtimeContext; absent hashes as null. */
+  tenant?: { userId?: string; orgId?: string }
+}
+
+/** Deterministic, dependency-free 64-bit hash (two 32-bit lanes) → hex. */
+function fnv1a(input: string): string {
+  // Lane 1: FNV-1a over each low byte. Lane 2: mixes the WHOLE code unit, so
+  // it stays content-dependent for ASCII input (not merely length-dependent).
+  let h1 = 0x811c9dc5
+  let h2 = 0x811c9dc5
+  for (let i = 0; i < input.length; i++) {
+    const c = input.charCodeAt(i)
+    h1 = Math.imul(h1 ^ (c & 0xff), 0x01000193)
+    h2 = Math.imul(h2 ^ c, 0x85ebca6b)
+    h2 ^= h2 >>> 15
+  }
+  const hex = (n: number): string => (n >>> 0).toString(16).padStart(8, '0')
+  return hex(h1) + hex(h2)
+}
+
+/** Canonical JSON with object keys sorted, so equal inputs hash identically. */
+function canonical(value: unknown): string {
+  if (Array.isArray(value)) return `[${value.map(canonical).join(',')}]`
+  // Primitives and `null` serialise exactly as JSON.stringify emits them.
+  if (value === null || typeof value !== 'object') return JSON.stringify(value)
+  const record = value as Record<string, unknown>
+  const entries: Array<string> = []
+  for (const name of Object.keys(record).sort()) {
+    entries.push(`${JSON.stringify(name)}:${canonical(record[name])}`)
+  }
+  return `{${entries.join(',')}}`
+}
+
+/**
+ * Hash the parts of a workspace that the agent can observe. `secrets` is left
+ * out on purpose: rotating a token must not orphan the existing sandbox.
+ */
+export function computeWorkspaceHash(
+  workspace: WorkspaceDefinition | undefined,
+): string {
+  // Strip `secrets`, keep every other field for hashing.
+  const visible = ({ secrets: _s, ...rest }: WorkspaceDefinition) => rest
+  return fnv1a(workspace ? canonical(visible(workspace)) : 'no-workspace')
+}
+
+/**
+ * Compute the compound sandbox instance key: a hash over thread, sandbox id,
+ * provider, workspace hash and tenant (`null` when no tenant is given).
+ */
+export function computeSandboxKey(input: SandboxKeyInput): string {
+  const { threadId, sandboxId, providerName } = input
+  const workspaceHash = computeWorkspaceHash(input.workspace)
+  const tenant = input.tenant ?? null
+  const identity = { threadId, sandboxId, providerName, workspaceHash, tenant }
+  return fnv1a(canonical(identity))
+}
diff --git a/packages/ai-sandbox/src/middleware.ts b/packages/ai-sandbox/src/middleware.ts
new file mode 100644
index 000000000..d7aafc038
--- /dev/null
+++ b/packages/ai-sandbox/src/middleware.ts
@@ -0,0 +1,201 @@
+/**
+ * `withSandbox(definition)` — the middleware that PROVIDES the
+ * {@link SandboxCapability} a harness adapter requires.
+ *
+ * - `setup`: resume-or-create the sandbox (via the definition's ensure
+ *   algorithm), provide the handle, using the optional SandboxStore/Locks
+ *   capabilities when a persistence middleware supplied them (in-memory
+ *   fallback otherwise). If `fileEvents` is not false, starts a watcher
+ *   that dispatches to sandbox-scoped hooks and forwards to the runtime sink.
+ * - `onFinish`/`onAbort`/`onError`: stop the watcher, snapshot (`after-run`)
+ *   and/or destroy per lifecycle.
+ *
+ * NOTE: streamed sandbox lifecycle events (sandbox.created, workspace.setup.*)
+ * are emitted by the harness adapter's chatStream (which can yield CUSTOM
+ * chunks), not from here — middleware setup runs before streaming begins.
+ */
+import { defineChatMiddleware } from '@tanstack/ai'
+import { getSandboxRuntime } from '@tanstack/ai/adapter-internals'
+import {
+  LocksCapability,
+  SandboxCapability,
+  SandboxStoreCapability,
+  provideSandbox,
+  provideSandboxPolicy,
+} from './capabilities'
+import { watchWorkspace } from './watch'
+import type {
+  AbortInfo,
+  ChatMiddlewareContext,
+  DefinedChatMiddleware,
+  SandboxFileEvent,
+} from '@tanstack/ai'
+import type { SandboxHandle } from './contracts'
+import type {
+  SandboxDefinition,
+  SandboxEnsureContext,
+  SandboxHooks,
+} from './sandbox'
+import type { SandboxWatchHandle } from './watch'
+
+/** Per-request state we need to carry from `setup` to the terminal hooks. */
+interface SandboxRunState {
+  handle: SandboxHandle // returned by `definition.ensure`
+  ensureCtx: SandboxEnsureContext // reused for `definition.destroy` / `key`
+  watcher?: SandboxWatchHandle // only set when file events are enabled
+}
+
+const runState = new WeakMap<object, SandboxRunState>() // keyed by middleware ctx
+
+/** Best-effort tenant scoping from an untyped runtime context (strings only). */
+function tenantFrom(
+  context: unknown,
+): { userId?: string; orgId?: string } | undefined {
+  if (typeof context !== 'object' || context === null) return undefined
+  const { userId: u, orgId: o } = context as Record<string, unknown>
+  const userId = typeof u === 'string' ? u : undefined
+  const orgId = typeof o === 'string' ? o : undefined
+  const hasScope = userId !== undefined || orgId !== undefined
+  return hasScope ? { userId, orgId } : undefined
+}
+
+/**
+ * Assemble the `ensure`/`destroy` context from the middleware context.
+ */
+function buildEnsureCtx(ctx: ChatMiddlewareContext): SandboxEnsureContext {
+  const { threadId, runId, signal } = ctx
+  const store = ctx.getOptional(SandboxStoreCapability)
+  const locks = ctx.getOptional(LocksCapability)
+  const tenant = tenantFrom(ctx.context)
+  return { threadId, runId, store, locks, tenant, signal }
+}
+
+/**
+ * Fan one sandbox file event out to the definition's hooks: the catch-all
+ * `onFile` first, then the hook matching `event.type`. Hooks are awaited one
+ * at a time, and a throwing hook is ignored so it cannot break the run.
+ */
+async function dispatchDefinitionHooks(
+  hooks: SandboxHooks | undefined,
+  event: SandboxFileEvent,
+): Promise<void> {
+  if (!hooks) return
+  const hookNameByType = {
+    create: 'onFileCreate',
+    change: 'onFileChange',
+    delete: 'onFileDelete',
+  } as const
+  // Order matters: the generic hook runs before the type-specific one.
+  const candidates = [hooks.onFile, hooks[hookNameByType[event.type]]]
+  for (const hook of candidates) {
+    if (!hook) continue
+    try {
+      await hook(event)
+    } catch {
+      // Deliberately ignored — one bad hook must not break the run.
+    }
+  }
+}
+
+/**
+ * Middleware that resumes-or-creates the sandbox in `setup` and provides it as
+ * {@link SandboxCapability}. Each terminal hook stops the watcher and then
+ * ALWAYS attempts the `destroyOnComplete` teardown, even if an earlier step
+ * (watcher stop, snapshot, user `onError` hook) throws, so it cannot leak.
+ */
+export function withSandbox(
+  definition: SandboxDefinition,
+): DefinedChatMiddleware<
+  unknown,
+  readonly [],
+  readonly [typeof SandboxCapability]
+> {
+  const teardown = async (ensureCtx: SandboxEnsureContext): Promise<void> => {
+    if (!definition.lifecycle?.destroyOnComplete) return
+    await definition.destroy(ensureCtx)
+    await definition.hooks?.onDestroy?.()
+  }
+  return defineChatMiddleware({
+    name: 'sandbox',
+    provides: [SandboxCapability],
+    // SandboxPolicyCapability is provided conditionally (only when the
+    // definition has a policy), so it is intentionally NOT declared here —
+    // consumers read it via `getOptional`.
+    optionalRequires: [SandboxStoreCapability, LocksCapability],
+
+    async setup(ctx) {
+      const ensureCtx = buildEnsureCtx(ctx)
+      const handle = await definition.ensure(ensureCtx)
+      provideSandbox(ctx, handle)
+      if (definition.policy) provideSandboxPolicy(ctx, definition.policy)
+      const hooks = definition.hooks
+      await hooks?.onReady?.(handle)
+
+      let watcher: SandboxWatchHandle | undefined
+      if (definition.fileEvents !== false) {
+        const runtime = getSandboxRuntime(ctx, { optional: true })
+        watcher = await watchWorkspace(handle, {
+          onEvent: (event: SandboxFileEvent) => {
+            void dispatchDefinitionHooks(hooks, event)
+            runtime?.emit(event)
+          },
+          ...(ctx.signal !== undefined ? { signal: ctx.signal } : {}),
+        })
+      }
+
+      runState.set(ctx, { handle, ensureCtx, ...(watcher ? { watcher } : {}) })
+    },
+
+    async onFinish(ctx) {
+      const state = runState.get(ctx)
+      if (!state) return
+      const { handle, ensureCtx } = state
+      try {
+        await state.watcher?.stop()
+        if (
+          definition.lifecycle?.snapshot === 'after-run' &&
+          handle.capabilities.snapshots &&
+          handle.snapshot
+        ) {
+          const snapshot = await handle.snapshot(`after-run-${ctx.runId}`)
+          // NOTE(review): recorded only when a store was injected — confirm.
+          const store = ensureCtx.store
+          if (store) {
+            const existing = await store.get(definition.key(ensureCtx))
+            if (existing) {
+              await store.upsert({
+                ...existing,
+                latestSnapshotId: snapshot.id,
+                updatedAt: Date.now(),
+              })
+            }
+          }
+        }
+      } finally {
+        await teardown(ensureCtx)
+      }
+    },
+
+    async onAbort(ctx, _info: AbortInfo) {
+      const state = runState.get(ctx)
+      if (!state) return
+      try {
+        await state.watcher?.stop()
+      } finally {
+        await teardown(state.ensureCtx)
+      }
+    },
+
+    async onError(ctx, info) {
+      const state = runState.get(ctx)
+      if (!state) return
+      try {
+        await state.watcher?.stop()
+        await definition.hooks?.onError?.(info.error)
+      } finally {
+        // Without `destroyOnComplete` the sandbox is kept for a resumed retry.
+        await teardown(state.ensureCtx)
+      }
+    },
+  })
+}
diff --git a/packages/ai-sandbox/src/policy.ts b/packages/ai-sandbox/src/policy.ts
new file mode 100644
index 000000000..5d727d3b1
--- /dev/null
+++ b/packages/ai-sandbox/src/policy.ts
@@ -0,0 +1,70 @@
+/**
+ * Sandbox policy — a portable, harness-agnostic description of what the agent
+ * may do. Each harness adapter MAPS this onto its native permission system
+ * (Claude Code → canUseTool + allowedTools/disallowedTools/permissionMode).
+ *
+ * Command rules are globs ('*' = any text) anchored to the whole command line.
+ * Precedence is deny > ask > allow; unmatched commands fall to `default`.
+ * `'ask'` surfaces the existing resume-based `approval-requested` flow.
+ */
+
+export type PolicyDecision = 'allow' | 'ask' | 'deny'
+
+export interface CommandRules {
+  /** Globs matched against the whole trimmed command to allow (e.g. 'pnpm *'). */
+  allow?: Array<string>
+  /** Patterns that require approval before running. */
+  ask?: Array<string>
+  /** Patterns to refuse (e.g. 'sudo *', 'rm -rf *'). */
+  deny?: Array<string>
+}
+
+/** Coarse, non-command capability gates for tools like Write/Edit and network. */
+export interface CapabilityRules {
+  /** File-modifying tools (Write/Edit). Defaults to the policy `default`. */
+  fileWrite?: PolicyDecision
+  /** Outbound network access. Defaults to the policy `default`. */
+  network?: PolicyDecision
+}
+
+export interface SandboxPolicy {
+  commands?: CommandRules
+  capabilities?: CapabilityRules // NOTE(review): not read by evaluateCommand
+  /** Decision for anything not matched by a rule. Defaults to `'ask'`. */
+  default?: PolicyDecision
+}
+
+export function defineSandboxPolicy(policy: SandboxPolicy): SandboxPolicy {
+  return policy // identity: the policy object is returned unchanged
+}
+
+/**
+ * Glob → RegExp anchored to the full command. `*` spans ANY characters,
+ * newlines included, so multi-line commands cannot dodge a deny rule.
+ */
+function patternToRegExp(pattern: string): RegExp {
+  const escaped = pattern.replace(/[.+?^${}()|[\]\\]/g, '\\$&')
+  return new RegExp(`^${escaped.replace(/\*/g, '[\\s\\S]*')}$`)
+}
+
+/**
+ * Decide how `command` is treated under `policy`. Rule lists are consulted in
+ * precedence order deny > ask > allow; if nothing matches (or the policy has
+ * no command rules) the policy `default` applies, itself defaulting to
+ * `'ask'`. Exported for adapter permission mappers and unit tests.
+ */
+export function evaluateCommand(
+  command: string,
+  policy: SandboxPolicy | undefined,
+): PolicyDecision {
+  const rules = policy?.commands
+  if (rules) {
+    // Listed strictest-first so that the first hit wins.
+    for (const decision of ['deny', 'ask', 'allow'] as const) {
+      const patterns = rules[decision] ?? []
+      const hit = patterns.some((p) => patternToRegExp(p).test(command.trim()))
+      if (hit) return decision
+    }
+  }
+  return policy?.default ?? 'ask'
+}
diff --git a/packages/ai-sandbox/src/runner.ts b/packages/ai-sandbox/src/runner.ts
new file mode 100644
index 000000000..59820051a
--- /dev/null
+++ b/packages/ai-sandbox/src/runner.ts
@@ -0,0 +1,75 @@
+/**
+ * The reusable "run an agent CLI inside a sandbox and stream its events out"
+ * primitive. Harness adapters (claude-code, codex, …) spawn their CLI via the
+ * uniform {@link SandboxHandle} and consume newline-delimited JSON from stdout,
+ * which they then translate into AG-UI StreamChunks.
+ *
+ * This is intentionally transport-minimal: a stdout NDJSON pipe. Multi-client
+ * reconnect / replay belongs to the persistence/EventLog layer, not here.
+ */
+import type { ProcessOptions, SandboxHandle } from './contracts'
+
+export interface SpawnNdjsonOptions extends ProcessOptions {
+  /**
+   * Called with the trimmed text of each non-empty stdout line that fails JSON
+   * parsing (e.g. a CLI banner). Ignored by default. Stderr is never parsed.
+   */
+  onNonJsonLine?: (line: string) => void
+  /**
+   * Written to the process stdin (then stdin is closed) right after spawn —
+   * e.g. the agent prompt for `claude -p`. Avoids putting the prompt in argv.
+   */
+  input?: string
+}
+
+/**
+ * Re-chunk a stream of arbitrary string pieces into complete lines. Lines are
+ * split on '\n' (the newline itself is dropped); a final piece without a
+ * trailing newline is emitted once the input ends, unless it is empty.
+ */
+export async function* toLines(
+  chunks: AsyncIterable<string>,
+): AsyncIterable<string> {
+  let pending = ''
+  for await (const chunk of chunks) {
+    const pieces = (pending + chunk).split('\n')
+    // The last piece is not newline-terminated yet: carry it forward.
+    pending = pieces.pop() ?? ''
+    yield* pieces
+  }
+  if (pending.length > 0) yield pending
+}
+
+/**
+ * Run `command` in the sandbox and yield each non-blank stdout line parsed as
+ * JSON; unparseable lines go to `onNonJsonLine` (if given) and are skipped.
+ * After stdout closes the exit is awaited via `wait()` (status not checked).
+ */
+export async function* spawnNdjson(
+  handle: SandboxHandle,
+  command: string,
+  options: SpawnNdjsonOptions = {},
+): AsyncIterable<unknown> {
+  const { onNonJsonLine, input, ...spawnOptions } = options
+  const child = await handle.process.spawn(command, spawnOptions)
+
+  if (input !== undefined) {
+    await child.stdin.write(input)
+    await child.stdin.end()
+  }
+
+  for await (const rawLine of toLines(child.stdout)) {
+    const text = rawLine.trim()
+    if (text.length === 0) continue
+    let event: unknown
+    try {
+      event = JSON.parse(text)
+    } catch {
+      onNonJsonLine?.(text)
+      continue
+    }
+    yield event
+  }
+
+  await child.wait()
+}
diff --git a/packages/ai-sandbox/src/sandbox.ts b/packages/ai-sandbox/src/sandbox.ts
new file mode 100644
index 000000000..8686f34c2
--- /dev/null
+++ b/packages/ai-sandbox/src/sandbox.ts
@@ -0,0 +1,212 @@
+/**
+ * `defineSandbox()` returns a LAZY controller — it never creates a sandbox at
+ * definition time. `withSandbox()` (and advanced users) call `ensure()` to
+ * resume-or-create, following: provider.resume → provider.restoreSnapshot →
+ * create + bootstrap. The controller folds provider/workspace/policy/lifecycle
+ * into a stable instance key and coordinates through the (optional) lock +
+ * sandbox stores.
+ */
+import { bootstrapWorkspace } from './bootstrap'
+import { computeSandboxKey } from './key'
+import { InMemoryLockStore, InMemorySandboxStore } from './store'
+import type { SandboxFileEvent } from '@tanstack/ai'
+import type { SandboxHandle, SandboxProvider } from './contracts'
+import type { SandboxKeyInput } from './key'
+import type { LockStore, SandboxStore } from './store'
+import type { SandboxPolicy } from './policy'
+import type { WorkspaceDefinition } from './workspace'
+
+/**
+ * Sandbox-scoped hooks declared on `defineSandbox`. File hooks fire for every
+ * create/change/delete during a chat run; lifecycle hooks fire server-side.
+ */
+export interface SandboxHooks {
+  onFile?: (e: SandboxFileEvent) => void | Promise<void> // any event; runs first
+  onFileCreate?: (e: SandboxFileEvent) => void | Promise<void>
+  onFileChange?: (e: SandboxFileEvent) => void | Promise<void>
+  onFileDelete?: (e: SandboxFileEvent) => void | Promise<void>
+  onReady?: (handle: SandboxHandle) => void | Promise<void> // after ensure()
+  onError?: (err: unknown) => void | Promise<void>
+  onDestroy?: () => void | Promise<void> // after a destroyOnComplete teardown
+}
+
+export type ReuseStrategy = 'thread' | 'none'
+export type SnapshotStrategy = 'after-setup' | 'after-run' | 'none'
+
+export interface SandboxLifecycle {
+  /** `'thread'` resumes one sandbox per thread; `'none'` keys it per run too. */
+  reuse?: ReuseStrategy
+  /** When to snapshot; skipped unless the provider reports `snapshots`. */
+  snapshot?: SnapshotStrategy
+  /** Keep-warm hint. NOTE(review): not read in this file — confirm consumer. */
+  keepAlive?: string
+  /** Destroy the sandbox after the run completes. */
+  destroyOnComplete?: boolean
+}
+
+export interface SandboxConfig {
+  id: string // folded into the instance key as `sandboxId`
+  provider: SandboxProvider
+  workspace?: WorkspaceDefinition // bootstrapped after create, when present
+  policy?: SandboxPolicy
+  lifecycle?: SandboxLifecycle
+  /** Sandbox-scoped file/lifecycle hooks. */
+  hooks?: SandboxHooks
+  /** Watch the workspace for file events (default true). Set false to disable. */
+  fileEvents?: boolean
+}
+
+/** Context passed to `ensure()` by `withSandbox` (or advanced callers). */
+export interface SandboxEnsureContext {
+  threadId: string
+  runId: string
+  /** Persistence seam; falls back to an in-memory store when absent. */
+  store?: SandboxStore
+  /** Lock seam; falls back to an in-memory lock when absent. */
+  locks?: LockStore
+  tenant?: { userId?: string; orgId?: string } // part of the instance key
+  signal?: AbortSignal // forwarded to provider calls and workspace bootstrap
+}
+
+export interface SandboxDefinition {
+  readonly id: string
+  readonly provider: SandboxProvider
+  readonly workspace?: WorkspaceDefinition
+  readonly policy?: SandboxPolicy
+  readonly lifecycle?: SandboxLifecycle
+  /** Sandbox-scoped file/lifecycle hooks. */
+  readonly hooks?: SandboxHooks
+  /** Watch the workspace for file events (default true). Set false to disable. */
+  readonly fileEvents?: boolean
+  /** Compound instance key for a given run context. */
+  key: (ctx: SandboxEnsureContext) => string
+  /** Resume-or-create the sandbox for this thread/run. */
+  ensure: (ctx: SandboxEnsureContext) => Promise<SandboxHandle>
+  /** Tear down the sandbox recorded for this key; no-op if none is stored. */
+  destroy: (ctx: SandboxEnsureContext) => Promise<void>
+}
+
+// Process-lifetime fallbacks shared across all definitions so concurrent
+// ensures for the same key serialize even without an injected store/lock.
+const fallbackStore = new InMemorySandboxStore()
+const fallbackLocks = new InMemoryLockStore()
+
+/**
+ * Build a LAZY sandbox controller: `ensure()` resumes, else restores, else
+ * creates + bootstraps; a sandbox whose setup fails is destroyed, not leaked.
+ */
+export function defineSandbox(config: SandboxConfig): SandboxDefinition {
+  const keyInputFor = (ctx: SandboxEnsureContext): SandboxKeyInput => ({
+    threadId:
+      config.lifecycle?.reuse === 'none'
+        ? `${ctx.threadId}:${ctx.runId}`
+        : ctx.threadId,
+    sandboxId: config.id,
+    providerName: config.provider.name,
+    workspace: config.workspace,
+    tenant: ctx.tenant,
+  })
+  const ensure = async (ctx: SandboxEnsureContext): Promise<SandboxHandle> => {
+    const { signal } = ctx
+    const store = ctx.store ?? fallbackStore
+    const locks = ctx.locks ?? fallbackLocks
+    const key = computeSandboxKey(keyInputFor(ctx))
+    const caps = config.provider.capabilities()
+    const stamp = () => ({ latestRunId: ctx.runId, updatedAt: Date.now() })
+    return locks.withLock(`sandbox:${key}`, async () => {
+      const existing = await store.get(key)
+      if (existing) {
+        // 1) Try to reconnect to the still-running sandbox.
+        const resumed = await config.provider.resume({
+          id: existing.providerSandboxId,
+          signal,
+        })
+        if (resumed) {
+          await store.upsert({ ...existing, ...stamp() })
+          return resumed
+        }
+        // 2) Else restore from the latest snapshot, if supported.
+        if (
+          existing.latestSnapshotId &&
+          caps.snapshots &&
+          config.provider.restoreSnapshot
+        ) {
+          const restored = await config.provider.restoreSnapshot({
+            snapshotId: existing.latestSnapshotId,
+            workspace: config.workspace,
+            policy: config.policy,
+            env: config.workspace?.secrets,
+            signal,
+          })
+          await store.upsert({
+            ...existing,
+            providerSandboxId: restored.id,
+            ...stamp(),
+          })
+          return restored
+        }
+        // 3) Else fall through and re-create under the same identity.
+      }
+
+      const created = await config.provider.create({
+        workspace: config.workspace,
+        policy: config.policy,
+        env: config.workspace?.secrets,
+        signal,
+      })
+      try {
+        if (config.workspace) {
+          await bootstrapWorkspace(created, config.workspace, { signal })
+        }
+        let latestSnapshotId: string | undefined
+        if (
+          config.lifecycle?.snapshot === 'after-setup' &&
+          caps.snapshots &&
+          created.snapshot
+        ) {
+          latestSnapshotId = (await created.snapshot('after-setup')).id
+        }
+        await store.upsert({
+          key,
+          provider: config.provider.name,
+          providerSandboxId: created.id,
+          latestSnapshotId,
+          threadId: ctx.threadId,
+          ...stamp(),
+        })
+        return created
+      } catch (error) {
+        // Untracked sandbox: destroy best-effort (no signal — may be aborted).
+        try {
+          await config.provider.destroy({ id: created.id, signal: undefined })
+        } catch {}
+        throw error
+      }
+    })
+  }
+
+  const destroy = async (ctx: SandboxEnsureContext): Promise<void> => {
+    const store = ctx.store ?? fallbackStore
+    const key = computeSandboxKey(keyInputFor(ctx))
+    const existing = await store.get(key)
+    if (!existing) return
+    await config.provider.destroy({
+      id: existing.providerSandboxId,
+      signal: ctx.signal,
+    })
+    await store.delete(key)
+  }
+
+  return {
+    id: config.id,
+    provider: config.provider,
+    workspace: config.workspace,
+    policy: config.policy,
+    lifecycle: config.lifecycle,
+    hooks: config.hooks,
+    fileEvents: config.fileEvents,
+    key: (ctx) => computeSandboxKey(keyInputFor(ctx)),
+    ensure,
+    destroy,
+  }
+}
diff --git a/packages/ai-sandbox/src/store.ts b/packages/ai-sandbox/src/store.ts
new file mode 100644
index 000000000..bf33adaab
--- /dev/null
+++ b/packages/ai-sandbox/src/store.ts
@@ -0,0 +1,58 @@
+/**
+ * Persistence seams for the sandbox layer.
+ *
+ * v1 ships ONLY in-memory implementations (single-process resume). These are
+ * deliberately pluggable OPTIONAL capabilities so the future persistence
+ * package can `provide` durable implementations (D1/Postgres/Durable Objects)
+ * without the sandbox layer changing. Do NOT hardcode storage here.
+ */
+
+/** One persisted sandbox instance, keyed by the compound sandbox instance key. */
+export interface SandboxRecord {
+  /** Compound key (see computeSandboxKey). */
+  key: string
+  /** Provider name that owns `providerSandboxId`. */
+  provider: string
+  /** Provider-assigned sandbox id used to resume. */
+  providerSandboxId: string
+  /** Most recent snapshot id, when the provider supports snapshots. */
+  latestSnapshotId?: string
+  threadId: string // thread the record was created for
+  latestRunId?: string // run id of the most recent ensure
+  /** Epoch ms of last write (for keepAlive / GC by the persistence layer). */
+  updatedAt: number
+}
+
+/** Maps a compound key to the provider sandbox that should be resumed. */
+export interface SandboxStore {
+  get: (key: string) => Promise<SandboxRecord | null> // null when unknown
+  upsert: (record: SandboxRecord) => Promise<void> // stored under `record.key`
+  delete: (key: string) => Promise<void>
+}
+
+/**
+ * The lock primitive (`LockStore` + `InMemoryLockStore`) now lives in core
+ * (`@tanstack/ai`) so the `'locks'` capability is a single shared token across
+ * the sandbox and persistence layers. Re-exported here for back-compat.
+ */
+export { InMemoryLockStore } from '@tanstack/ai'
+export type { LockStore } from '@tanstack/ai'
+
+/**
+ * In-memory {@link SandboxStore} over a `Map`; resume works in one process only.
+ */
+export class InMemorySandboxStore implements SandboxStore {
+  private readonly records = new Map<string, SandboxRecord>()
+
+  async get(key: string): Promise<SandboxRecord | null> {
+    return this.records.get(key) ?? null
+  }
+
+  async upsert(record: SandboxRecord): Promise<void> {
+    this.records.set(record.key, record)
+  }
+
+  async delete(key: string): Promise<void> {
+    this.records.delete(key)
+  }
+}
diff --git a/packages/ai-sandbox/src/tool-bridge.ts b/packages/ai-sandbox/src/tool-bridge.ts
new file mode 100644
index 000000000..98a1ba7ec
--- /dev/null
+++ b/packages/ai-sandbox/src/tool-bridge.ts
@@ -0,0 +1,199 @@
+/**
+ * Host-side MCP tool-proxy bridge, shared by all harness adapters.
+ *
+ * Exposes chat()-provided server tools to an in-sandbox agent as an MCP server
+ * reachable over HTTP. The agent (inside the sandbox) calls
+ * `mcp__tanstack__<tool>`; the call is proxied OUT to this host server, where
+ * the tool's `execute()` runs in the host process (with its closures / DB /
+ * secrets), and the result is returned into the sandbox.
+ *
+ * Transport: Streamable HTTP in stateless mode (a fresh server + transport per
+ * request), bound on all interfaces so a Docker container can reach it via
+ * `host.docker.internal`, and gated by a per-run bearer token.
+ *
+ * Each harness adapter formats the bridge into its own MCP config shape
+ * (`claude --mcp-config`, ACP `mcpServers`, opencode `OPENCODE_CONFIG_CONTENT`,
+ * `codex --config mcp_servers.*`).
+ */
+import { createServer } from 'node:http'
+import { randomBytes } from 'node:crypto'
+import { McpServer } from '@modelcontextprotocol/sdk/server/mcp.js'
+import { StreamableHTTPServerTransport } from '@modelcontextprotocol/sdk/server/streamableHttp.js'
+import {
+  CallToolRequestSchema,
+  ListToolsRequestSchema,
+} from '@modelcontextprotocol/sdk/types.js'
+import type { AddressInfo } from 'node:net'
+import type { AnyTool } from '@tanstack/ai'
+
+/**
+ * Name of the bridged MCP server. The agent sees tools as
+ * `mcp__tanstack__<tool>`; each adapter's stream translator strips this prefix
+ * so tool-call events match the names the application registered.
+ *
+ * Also reported as the `name` of every bridge returned by
+ * `startHostToolBridge`.
+ */
+export const BRIDGED_MCP_SERVER_NAME = 'tanstack'
+
+/**
+ * Pick the hostname a sandbox should dial to reach a server running on the
+ * host.
+ *
+ * @param provider - Sandbox provider name.
+ * @returns `host.docker.internal` for the `docker` provider, the loopback
+ *   address `127.0.0.1` for every other provider.
+ */
+export function hostForSandbox(provider: string): string {
+  if (provider === 'docker') {
+    return 'host.docker.internal'
+  }
+  return '127.0.0.1'
+}
+
+/** A running host-side tool bridge, as returned by `startHostToolBridge`. */
+export interface HostToolBridge {
+  /** MCP server name; tools appear to the agent as `mcp__<name>__<tool>`. */
+  name: string
+  /** URL the SANDBOX uses to reach this bridge. */
+  url: string
+  /** Per-run bearer token gating the endpoint. */
+  token: string
+  /** Shut the bridge's HTTP server down; resolves once it has closed. */
+  close: () => Promise<void>
+}
+
+/**
+ * Result of a permission decision returned to the harness's prompt tool.
+ * The bridge sends it back JSON-serialized as the tool call's text content.
+ */
+export interface PermissionToolResult {
+  /** Whether the requested action is allowed or denied. */
+  behavior: 'allow' | 'deny'
+  /** Optional text accompanying the decision. */
+  message?: string
+  /**
+   * Optional replacement input for the action.
+   * NOTE(review): how the harness applies this is not visible here — confirm
+   * against the harness's permission-prompt contract.
+   */
+  updatedInput?: unknown
+}
+
+/** Options accepted by `startHostToolBridge`. */
+export interface StartBridgeOptions {
+  /** Hostname the sandbox uses to reach the host (e.g. `host.docker.internal`). */
+  hostForSandbox: string
+  /** Runtime context forwarded to each tool's `execute()`. */
+  context?: unknown
+  /** Abort signal forwarded to each tool's `execute()`. */
+  signal?: AbortSignal
+  /**
+   * Optional permission-prompt tool (e.g. for Claude Code's
+   * `--permission-prompt-tool`). When set, the bridge exposes an extra MCP tool
+   * named `toolName` whose handler returns the host's allow/deny decision for
+   * an action.
+   */
+  permission?: {
+    /** Name under which the permission tool is listed and called. */
+    toolName: string
+    /**
+     * Decides the request. Receives the tool call's arguments (an empty object
+     * when the call carried none); may answer synchronously or via a promise.
+     */
+    resolve: (input: {
+      tool_name?: string
+      input?: unknown
+    }) => PermissionToolResult | Promise<PermissionToolResult>
+  }
+}
+
+/**
+ * Serialize a tool's return value into the text of an MCP content item.
+ * Strings pass through untouched; everything else is JSON-encoded.
+ */
+function toToolText(result: unknown): string {
+  if (typeof result === 'string') return result
+  // `JSON.stringify` returns `undefined` (not a string) for `undefined`,
+  // functions and symbols — e.g. a tool whose `execute()` returns nothing.
+  // A text content item must carry a string, so fall back to JSON `null`.
+  const encoded = JSON.stringify(result) as string | undefined
+  return encoded ?? 'null'
+}
+
+/**
+ * Build an MCP server that lists `tools` (plus the optional permission-prompt
+ * tool) and dispatches tool calls to them.
+ *
+ * @param tools - Application tools to expose; each call runs the tool's
+ *   `execute()` with `options.context` and `options.signal`.
+ * @param options - Bridge options; `permission`, when set, adds one extra tool
+ *   that answers with the host's allow/deny decision.
+ * @returns A server with its list-tools and call-tool handlers installed; the
+ *   caller connects it to a transport.
+ */
+function buildServer(
+  tools: Array<AnyTool>,
+  options: StartBridgeOptions,
+): McpServer {
+  const server = new McpServer(
+    { name: BRIDGED_MCP_SERVER_NAME, version: '1.0.0' },
+    { capabilities: { tools: {} } },
+  )
+  const toolsByName = new Map(tools.map((tool) => [tool.name, tool]))
+
+  const permissionTool = options.permission
+    ? {
+        name: options.permission.toolName,
+        description:
+          'Permission prompt: returns {behavior:"allow"|"deny"} for a requested action.',
+        inputSchema: { type: 'object' as const, properties: {} },
+      }
+    : undefined
+
+  server.server.setRequestHandler(ListToolsRequestSchema, () => ({
+    tools: [
+      ...tools.map((tool) => ({
+        name: tool.name,
+        description: tool.description,
+        // Tools without a schema are advertised as taking an empty object.
+        inputSchema: (tool.inputSchema ?? {
+          type: 'object',
+          properties: {},
+        }) as { type: 'object'; [key: string]: unknown },
+      })),
+      ...(permissionTool ? [permissionTool] : []),
+    ],
+  }))
+
+  server.server.setRequestHandler(CallToolRequestSchema, async (request) => {
+    // Permission-prompt tool: return the host's allow/deny decision.
+    if (
+      options.permission &&
+      request.params.name === options.permission.toolName
+    ) {
+      const result = await options.permission.resolve(
+        request.params.arguments ?? {},
+      )
+      return {
+        content: [{ type: 'text' as const, text: JSON.stringify(result) }],
+      }
+    }
+    const tool = toolsByName.get(request.params.name)
+    // A tool that is not registered, or has no `execute`, cannot be run here.
+    if (!tool?.execute) {
+      throw new Error(`Unknown tool: ${request.params.name}`)
+    }
+    try {
+      const result: unknown = await tool.execute(
+        request.params.arguments ?? {},
+        {
+          context: options.context,
+          abortSignal: options.signal,
+        },
+      )
+      // Serialization stays inside the try so an unserializable result (e.g. a
+      // circular object) is reported as a tool error rather than escaping.
+      return { content: [{ type: 'text' as const, text: toToolText(result) }] }
+    } catch (error) {
+      // Failures are returned as an error RESULT so the agent can read the
+      // message, instead of failing the whole request.
+      const message = error instanceof Error ? error.message : String(error)
+      return {
+        isError: true,
+        content: [
+          { type: 'text' as const, text: `Tool execution failed: ${message}` },
+        ],
+      }
+    }
+  })
+
+  return server
+}
+
+/**
+ * Start the host MCP tool-proxy bridge for the given tools.
+ *
+ * Opens an HTTP server on an ephemeral port, bound on all interfaces. Every
+ * request must carry `Authorization: Bearer <token>`; an authorized request
+ * gets a fresh MCP server + stateless transport that are closed again when the
+ * response closes.
+ *
+ * @param tools - Tools to expose to the in-sandbox agent.
+ * @param options - Bridge options; `hostForSandbox` is used to build the URL
+ *   the sandbox dials.
+ * @returns The bridge's name, sandbox-facing URL, bearer token and a `close()`
+ *   that shuts the HTTP server down.
+ * @throws Rejects when the HTTP server fails to start listening.
+ */
+export async function startHostToolBridge(
+  tools: Array<AnyTool>,
+  options: StartBridgeOptions,
+): Promise<HostToolBridge> {
+  const token = randomBytes(24).toString('hex')
+
+  const httpServer = createServer((req, res) => {
+    void (async () => {
+      if (req.headers['authorization'] !== `Bearer ${token}`) {
+        res.writeHead(401).end('unauthorized')
+        return
+      }
+      const server = buildServer(tools, options)
+      const transport = new StreamableHTTPServerTransport({
+        sessionIdGenerator: undefined,
+      })
+      res.on('close', () => {
+        void transport.close()
+        void server.close()
+      })
+      await server.connect(transport)
+
+      // Collect raw chunks and decode ONCE: decoding chunk-by-chunk would
+      // corrupt a multi-byte UTF-8 character split across two chunks.
+      const chunks: Array<Buffer> = []
+      for await (const chunk of req) {
+        chunks.push(
+          typeof chunk === 'string' ? Buffer.from(chunk) : (chunk as Buffer),
+        )
+      }
+      const body = Buffer.concat(chunks).toString('utf8')
+      await transport.handleRequest(
+        req,
+        res,
+        body ? (JSON.parse(body) as unknown) : undefined,
+      )
+    })().catch(() => {
+      if (!res.headersSent) res.writeHead(500).end('bridge error')
+      // Headers already out: the status can't change, but the response must
+      // still be finished so the client isn't left waiting.
+      else if (!res.writableEnded) res.end()
+    })
+  })
+
+  // Surface bind failures as a rejection; without an 'error' listener the
+  // server would emit an unhandled 'error' event instead.
+  await new Promise<void>((resolve, reject) => {
+    httpServer.once('error', reject)
+    httpServer.listen(0, '0.0.0.0', () => {
+      httpServer.off('error', reject)
+      resolve()
+    })
+  })
+  const port = (httpServer.address() as AddressInfo).port
+  const url = `http://${options.hostForSandbox}:${port}/mcp`
+
+  return {
+    name: BRIDGED_MCP_SERVER_NAME,
+    url,
+    token,
+    close: () =>
+      new Promise<void>((resolve) => httpServer.close(() => resolve())),
+  }
+}
diff --git a/packages/ai-sandbox/src/watch.ts b/packages/ai-sandbox/src/watch.ts
new file mode 100644
index 000000000..bf38e3b65
--- /dev/null
+++ b/packages/ai-sandbox/src/watch.ts
@@ -0,0 +1,256 @@
+/**
+ * Sandbox file-event hooks — observe create / change / delete of files inside a
+ * sandbox (e.g. as an in-sandbox agent edits the workspace).
+ *
+ * Provider-agnostic: coded against the {@link SandboxHandle} contract only.
+ * Two mechanisms, auto-selected:
+ *
+ * - **Native** — when a provider implements the optional `fs.watch` seam
+ *   (local-process does, via Node `fs.watch`), OS events drive the feed with low
+ *   latency.
+ * - **Exec-poll** — otherwise (Docker, Cloudflare, any exec-only provider), a
+ *   single `find … -printf` snapshot of `mtime\tsize\tpath` is taken every
+ *   `intervalMs` and diffed. Works on any Linux container with GNU findutils
+ *   (true for `node:*` / debian images) with no extra deps or image changes.
+ *
+ * The feed intentionally rides only the portable surface, so the same
+ * `watchWorkspace` call behaves identically across providers.
+ */
+import { DEFAULT_WORKSPACE_ROOT } from './bootstrap'
+import type { SandboxHandle } from './contracts'
+import type { SandboxFileEvent } from '@tanstack/ai'
+
+export type { SandboxFileEvent } from '@tanstack/ai'
+/** @deprecated Alias of `SandboxFileEvent`, retained for the low-level watch API. */
+export type FileEvent = SandboxFileEvent
+/** The `type` discriminant of a `SandboxFileEvent`. */
+export type FileEventType = SandboxFileEvent['type']
+
+/** Options accepted by `watchWorkspace`. */
+export interface WatchOptions {
+  /** Called for every observed file event. */
+  onEvent: (event: SandboxFileEvent) => void
+  /** Workspace root to watch. Defaults to `/workspace`. */
+  root?: string
+  /**
+   * Poll interval for the exec-poll fallback, in ms. Defaults to 700.
+   * Not used when the provider supplies a native `fs.watch`.
+   */
+  intervalMs?: number
+  /**
+   * Directory-name fragments to ignore (a path containing `/<entry>/` is
+   * skipped). Defaults to `['.git', 'node_modules']`.
+   */
+  ignore?: Array<string>
+  /** Stop watching when this signal aborts. */
+  signal?: AbortSignal
+}
+
+/** Handle for a running workspace watcher, returned by `watchWorkspace`. */
+export interface SandboxWatchHandle {
+  /** Stop the watcher and release its resources. */
+  stop: () => Promise<void>
+}
+
+/** Exec-poll interval used when `WatchOptions.intervalMs` is not given. */
+const DEFAULT_INTERVAL_MS = 700
+/** Directory names ignored when `WatchOptions.ignore` is not given. */
+const DEFAULT_IGNORE = ['.git', 'node_modules']
+
+/**
+ * Quote `value` for a POSIX shell: wrap it in single quotes and rewrite each
+ * embedded single quote as `'\''` (close quote, escaped quote, reopen quote).
+ */
+function q(value: string): string {
+  const pieces = value.split("'")
+  const escaped = pieces.join("'\\''")
+  return "'" + escaped + "'"
+}
+
+/**
+ * Compare two file snapshots and describe how to get from `prev` to `next`.
+ * Both maps go from path to a signature string (`mtime\tsize`).
+ *
+ * Pure function — this is the core of the exec-poll path and is unit-tested on
+ * its own.
+ *
+ * @param prev - Snapshot taken on the previous poll.
+ * @param next - Snapshot taken on the current poll.
+ * @param timestamp - Timestamp stamped onto every emitted event.
+ * @returns `create` / `change` events in `next`'s iteration order, followed by
+ *   `delete` events in `prev`'s iteration order.
+ */
+export function diffSnapshots(
+  prev: Map<string, string>,
+  next: Map<string, string>,
+  timestamp: number,
+): Array<SandboxFileEvent> {
+  const emitted: Array<SandboxFileEvent> = []
+
+  // Pass 1: paths present now — either brand new or with a new signature.
+  next.forEach((signature, path) => {
+    const earlier = prev.get(path)
+    if (earlier === undefined) {
+      emitted.push({ type: 'create', path, timestamp })
+      return
+    }
+    if (earlier !== signature) {
+      emitted.push({ type: 'change', path, timestamp })
+    }
+  })
+
+  // Pass 2: paths that were there before and are gone now.
+  prev.forEach((_signature, path) => {
+    if (!next.has(path)) {
+      emitted.push({ type: 'delete', path, timestamp })
+    }
+  })
+
+  return emitted
+}
+
+/**
+ * Assemble the shell command used by the exec-poll path: a `find` over `root`
+ * that prints one `mtime\tsize\tpath` line per regular file, leaving out every
+ * path that matches `*\/<entry>/*` for an entry of `ignore`.
+ *
+ * NOTE(review): `-not -path` only filters what is printed; `find` still
+ * descends into the ignored directories on every poll.
+ */
+function buildFindCommand(root: string, ignore: Array<string>): string {
+  const exclusions: Array<string> = []
+  for (const entry of ignore) {
+    const pattern = q(`*/${entry}/*`)
+    exclusions.push(`-not -path ${pattern}`)
+  }
+  const filter = exclusions.join(' ')
+  return `find ${q(root)} -type f ${filter} -printf '%T@\\t%s\\t%p\\n'`
+}
+
+/**
+ * Turn `find -printf` output into a snapshot map of path to `mtime\tsize`.
+ *
+ * Each line is split on its first two tabs only, so tabs inside the path are
+ * kept. Empty lines and lines with fewer than two tabs are dropped.
+ */
+function parseFindOutput(stdout: string): Map<string, string> {
+  const entries = new Map<string, string>()
+  const rows = stdout.split('\n').filter((row) => row !== '')
+  for (const row of rows) {
+    const mtimeEnd = row.indexOf('\t')
+    if (mtimeEnd === -1) continue
+    const sizeEnd = row.indexOf('\t', mtimeEnd + 1)
+    if (sizeEnd === -1) continue
+    const signature = `${row.slice(0, mtimeEnd)}\t${row.slice(mtimeEnd + 1, sizeEnd)}`
+    entries.set(row.slice(sizeEnd + 1), signature)
+  }
+  return entries
+}
+
+/**
+ * Report whether `path` lies under an ignored directory, i.e. contains a
+ * `/<entry>/` fragment for at least one entry of `ignore`.
+ */
+function isIgnored(path: string, ignore: Array<string>): boolean {
+  for (const entry of ignore) {
+    if (path.includes(`/${entry}/`)) return true
+  }
+  return false
+}
+
+/**
+ * Begin observing a sandbox workspace for file events.
+ *
+ * Uses the provider's native `fs.watch` when the handle has one and falls back
+ * to polling with `find` otherwise. A signal that is already aborted yields a
+ * no-op handle without starting any work.
+ *
+ * @param handle - Sandbox to observe.
+ * @param options - Callback plus optional root / ignore / interval / signal.
+ * @returns A handle whose `stop()` tears the watcher down.
+ */
+export async function watchWorkspace(
+  handle: SandboxHandle,
+  options: WatchOptions,
+): Promise<SandboxWatchHandle> {
+  // Already aborted before we start — don't begin any async work.
+  if (options.signal?.aborted) {
+    return { stop: () => Promise.resolve() }
+  }
+
+  const resolved = {
+    ...options,
+    root: options.root ?? DEFAULT_WORKSPACE_ROOT,
+    ignore: options.ignore ?? DEFAULT_IGNORE,
+  }
+
+  return handle.fs.watch
+    ? startNativeWatch(handle, resolved)
+    : startPollWatch(handle, {
+        ...resolved,
+        intervalMs: options.intervalMs ?? DEFAULT_INTERVAL_MS,
+      })
+}
+
+/**
+ * Native fs.watch path: OS events, disambiguated against a known-path set.
+ *
+ * A raw event only names a path, so each one is classified by checking whether
+ * the path currently exists and whether it was already known:
+ * gone + known is `delete`, present + known is `change`, present + unknown is
+ * `create`. A path that is gone and was never known produces no event.
+ *
+ * @param handle - Sandbox whose `fs.watch` is used.
+ * @param options - Watch options with `root` and `ignore` already defaulted.
+ * @returns A handle whose `stop()` detaches the abort listener and stops the
+ *   provider subscription.
+ * @throws When the handle has no `fs.watch`.
+ */
+async function startNativeWatch(
+  handle: SandboxHandle,
+  options: WatchOptions & { root: string; ignore: Array<string> },
+): Promise<SandboxWatchHandle> {
+  const { onEvent, root, ignore } = options
+  const watch = handle.fs.watch
+  if (!watch) throw new Error('native watch is unavailable on this provider')
+  // Seed the set of existing files so the first event per path is classified
+  // correctly (create vs change).
+  const known = await collectPaths(handle, root, ignore)
+
+  const subscription = await watch(root, (raw) => {
+    const path = raw.path
+    if (isIgnored(path, ignore)) return
+    // Classification needs an async existence check; run it detached so the
+    // watch callback itself stays synchronous.
+    void (async () => {
+      const exists = await handle.fs.exists(path)
+      const timestamp = Date.now()
+      if (!exists) {
+        // Only report a delete for a path we had seen; `known.delete` returns
+        // false for anything else.
+        if (known.delete(path)) onEvent({ type: 'delete', path, timestamp })
+        return
+      }
+      if (known.has(path)) onEvent({ type: 'change', path, timestamp })
+      else {
+        known.add(path)
+        onEvent({ type: 'create', path, timestamp })
+      }
+      // Failures while classifying (or thrown by `onEvent`) are dropped.
+    })().catch(() => undefined)
+  })
+
+  const onAbort = (): void => void subscription.stop().catch(() => undefined)
+  options.signal?.addEventListener('abort', onAbort, { once: true })
+  // The signal may have aborted during the awaits above (the once-listener
+  // would have missed it) — tear down now if so.
+  if (options.signal?.aborted) void subscription.stop().catch(() => undefined)
+
+  return {
+    stop: async () => {
+      options.signal?.removeEventListener('abort', onAbort)
+      await subscription.stop()
+    },
+  }
+}
+
+/**
+ * Exec-poll path: snapshot `find -printf` on an interval and diff.
+ *
+ * Takes one baseline snapshot up front, then every `intervalMs` takes another,
+ * reports the differences through `onEvent` and makes the new snapshot the
+ * baseline.
+ *
+ * A poll whose `find` exits non-zero is skipped rather than treated as an
+ * empty workspace. `find` exits non-zero for transient conditions such as a
+ * file disappearing mid-walk; diffing against an empty snapshot would report
+ * every file as deleted and, one poll later, as created again.
+ * NOTE(review): as a consequence, a root that disappears for good no longer
+ * produces `delete` events — confirm that is acceptable for callers.
+ *
+ * @param handle - Sandbox whose `process.exec` runs the `find` command.
+ * @param options - Watch options with `root`, `ignore` and `intervalMs`
+ *   already defaulted.
+ * @returns A handle whose `stop()` clears the timer, aborts any in-flight
+ *   `find` and detaches the abort listener. `stop()` is idempotent.
+ */
+async function startPollWatch(
+  handle: SandboxHandle,
+  options: WatchOptions & {
+    root: string
+    ignore: Array<string>
+    intervalMs: number
+  },
+): Promise<SandboxWatchHandle> {
+  const { onEvent, root, ignore, intervalMs } = options
+  const command = buildFindCommand(root, ignore)
+  const controller = new AbortController()
+
+  /** Resolves to the current snapshot, or `null` when `find` failed. */
+  const snapshot = async (): Promise<Map<string, string> | null> => {
+    const result = await handle.process.exec(command, {
+      cwd: root,
+      signal: controller.signal,
+    })
+    return result.exitCode === 0 ? parseFindOutput(result.stdout) : null
+  }
+
+  // If the baseline listing fails, start from an empty baseline: files show up
+  // as `create` once a later poll succeeds.
+  let previous = (await snapshot()) ?? new Map<string, string>()
+  const state = { running: true, polling: false }
+
+  const tick = async (): Promise<void> => {
+    // Never overlap polls: a `find` slower than the interval would otherwise
+    // let an older snapshot overwrite a newer baseline.
+    if (!state.running || state.polling) return
+    state.polling = true
+    try {
+      const next = await snapshot()
+      // Skip failed listings, and stay silent if stop() ran while we waited.
+      if (next === null || !state.running) return
+      for (const event of diffSnapshots(previous, next, Date.now())) {
+        onEvent(event)
+      }
+      previous = next
+    } catch {
+      // transient exec failure (e.g. mid-teardown) — try again next tick
+    } finally {
+      state.polling = false
+    }
+  }
+
+  const timer = setInterval(() => void tick(), intervalMs)
+  // Don't keep the event loop alive on the watcher alone.
+  if (typeof timer.unref === 'function') timer.unref()
+
+  const stop = (): Promise<void> => {
+    if (state.running) {
+      state.running = false
+      clearInterval(timer)
+      controller.abort()
+      options.signal?.removeEventListener('abort', onAbort)
+    }
+    return Promise.resolve()
+  }
+  const onAbort = (): void => void stop()
+  options.signal?.addEventListener('abort', onAbort, { once: true })
+  // The signal may have aborted during the initial `await snapshot()` above
+  // (the once-listener would have missed it) — tear down now if so.
+  if (options.signal?.aborted) void stop()
+
+  return { stop }
+}
+
+/**
+ * Walk the tree under `root` depth-first and gather the path of every entry
+ * that is not a directory.
+ *
+ * Entries whose name appears in `ignore` are skipped (directories are not
+ * descended into). A directory that cannot be listed is silently treated as
+ * empty.
+ */
+async function collectPaths(
+  handle: SandboxHandle,
+  root: string,
+  ignore: Array<string>,
+): Promise<Set<string>> {
+  const found = new Set<string>()
+
+  async function visit(directory: string): Promise<void> {
+    let listing: Awaited<ReturnType<SandboxHandle['fs']['list']>>
+    try {
+      listing = await handle.fs.list(directory)
+    } catch {
+      // Unreadable directory: nothing to collect below it.
+      return
+    }
+    for (const item of listing) {
+      if (ignore.includes(item.name)) continue
+      if (item.type !== 'dir') {
+        found.add(item.path)
+        continue
+      }
+      await visit(item.path)
+    }
+  }
+
+  await visit(root)
+  return found
+}
diff --git a/packages/ai-sandbox/src/workspace.ts b/packages/ai-sandbox/src/workspace.ts
new file mode 100644
index 000000000..1bb4741ca
--- /dev/null
+++ b/packages/ai-sandbox/src/workspace.ts
@@ -0,0 +1,100 @@
+/**
+ * Workspace definition — the portable description of what the agent sees
+ * inside the sandbox. Each harness adapter PROJECTS this into its own native
+ * format via `projectWorkspace()` (e.g. Claude Code → CLAUDE.md + .claude/skills
+ * + --mcp-config). The definition itself is provider- and harness-agnostic.
+ */
+
+/**
+ * Where the working tree comes from. Discriminated on `type`:
+ *
+ * - `'git'` — a repository URL, with an optional ref and optional credentials.
+ * - `'local'` — a filesystem path.
+ * - `'none'` — no source.
+ */
+export type WorkspaceSource =
+  | {
+      type: 'git'
+      url: string
+      ref?: string
+      auth?: { username?: string; token: string }
+    }
+  | { type: 'local'; path: string }
+  | { type: 'none' }
+
+/**
+ * Describe a workspace whose working tree is cloned from a git repository.
+ * For GitHub repositories, `githubRepo` is a convenience wrapper.
+ *
+ * @param input - Repository URL plus optional ref and credentials.
+ * @returns A `'git'` {@link WorkspaceSource} carrying the given fields.
+ */
+export function gitSource(input: {
+  url: string
+  ref?: string
+  auth?: { username?: string; token: string }
+}): WorkspaceSource {
+  const tagged = { type: 'git' as const }
+  return Object.assign(tagged, input)
+}
+
+/**
+ * Describe a workspace cloned from a GitHub repository.
+ *
+ * `repo` is either `owner/name` shorthand, which is expanded to
+ * `https://github.com/<owner>/<name>.git`, or a full clone URL, which is used
+ * verbatim.
+ *
+ * @param input - Repository reference plus optional ref and credentials.
+ * @returns A `'git'` {@link WorkspaceSource}.
+ */
+export function githubRepo(input: {
+  repo: string
+  ref?: string
+  auth?: { username?: string; token: string }
+}): WorkspaceSource {
+  // A clone URL has a scheme (`https://`, `ssh://`, …) or the scp-like `git@`
+  // form. A bare `startsWith('http')` check would also match shorthand such as
+  // `httpie/cli` and pass it through as if it were a URL.
+  const isCloneUrl = /^(?:[a-z][a-z0-9+.-]*:\/\/|git@)/i.test(input.repo)
+  const url = isCloneUrl
+    ? input.repo
+    : // Tolerate `owner/name.git` shorthand without producing `.git.git`.
+      `https://github.com/${input.repo.replace(/\.git$/, '')}.git`
+  return { type: 'git', url, ref: input.ref, auth: input.auth }
+}
+
+/**
+ * Describe a workspace whose working tree comes from a local path.
+ *
+ * @param path - Path to use as the source.
+ * @returns A `'local'` {@link WorkspaceSource} for `path`.
+ */
+export function localSource(path: string): WorkspaceSource {
+  const source: WorkspaceSource = { type: 'local', path }
+  return source
+}
+
+/**
+ * A unit of agent guidance/config projected into the harness's native format.
+ * Discriminated on `kind`:
+ *
+ * - `'file'` — a file path and the content to write there.
+ * - `'agent-skill'` — a named agent skill.
+ * - `'mcp'` — a named MCP server and its configuration object.
+ */
+export type WorkspaceSkill =
+  | { kind: 'file'; path: string; content: string }
+  | { kind: 'agent-skill'; name: string }
+  | {
+      kind: 'mcp'
+      name: string
+      config: Record<string, unknown>
+    }
+
+/**
+ * Skill that writes a file (e.g. CLAUDE.md) into the workspace / harness
+ * config.
+ *
+ * @param input - Destination path and file content.
+ * @returns A `'file'` {@link WorkspaceSkill} carrying the given fields.
+ */
+export function fileSkill(input: {
+  path: string
+  content: string
+}): WorkspaceSkill {
+  const tagged = { kind: 'file' as const }
+  return Object.assign(tagged, input)
+}
+
+/**
+ * Skill that points at a named agent skill for the harness to load.
+ *
+ * @param name - Name of the agent skill.
+ * @returns An `'agent-skill'` {@link WorkspaceSkill} for `name`.
+ */
+export function agentSkill(name: string): WorkspaceSkill {
+  const skill: WorkspaceSkill = { kind: 'agent-skill', name }
+  return skill
+}
+
+/**
+ * Skill that projects an MCP server into the harness.
+ *
+ * @param name - Name of the MCP server.
+ * @param config - Server configuration; stored by reference, not copied.
+ * @returns An `'mcp'` {@link WorkspaceSkill} for the server.
+ */
+export function mcpSkill(
+  name: string,
+  config: Record<string, unknown>,
+): WorkspaceSkill {
+  const skill: WorkspaceSkill = { kind: 'mcp', name, config }
+  return skill
+}
+
+/** Package manager to use in the workspace; `'auto'` means detect it. */
+export type PackageManager = 'npm' | 'pnpm' | 'yarn' | 'bun' | 'auto'
+
+/**
+ * Portable description of a workspace: where its source comes from, how it is
+ * set up, and what guidance/config the agent receives.
+ */
+export interface WorkspaceDefinition {
+  /** Where the working tree comes from. */
+  source: WorkspaceSource
+  /** Defaults to `'auto'` — detect from the lockfile after the source lands. */
+  packageManager?: PackageManager
+  /** Commands run once during bootstrap, in order (e.g. install). */
+  setup?: Array<string>
+  /** Named commands the agent/user can invoke (e.g. { test: 'pnpm test' }). */
+  scripts?: Record<string, string>
+  /** Guidance/config projected into the harness. */
+  skills?: Array<WorkspaceSkill>
+  /**
+   * Secrets injected into the sandbox env at create/resume. NEVER written to
+   * snapshots, the SandboxStore, or the event log — they live only in the
+   * running sandbox's environment and are re-injected each create/resume.
+   */
+  secrets?: Record<string, string>
+  /** Workspace root inside the sandbox. Defaults to `/workspace`. */
+  root?: string
+}
+
+/**
+ * Identity helper for declaring a workspace: returns the very object it is
+ * given, so its only effect is to type-check the literal against
+ * {@link WorkspaceDefinition}.
+ */
+export function defineWorkspace(
+  definition: WorkspaceDefinition,
+): WorkspaceDefinition {
+  const workspace = definition
+  return workspace
+}
diff --git a/packages/ai-sandbox/tests/approvals.test.ts b/packages/ai-sandbox/tests/approvals.test.ts
new file mode 100644
index 000000000..5bba93337
--- /dev/null
+++ b/packages/ai-sandbox/tests/approvals.test.ts
@@ -0,0 +1,131 @@
+import { describe, expect, it } from 'vitest'
+import {
+  APPROVAL_REQUESTED_EVENT,
+  approvalId,
+  buildApprovalRequestedEvent,
+  resolveApproval,
+} from '../src/approvals'
+import { defineSandboxPolicy } from '../src/policy'
+
+// approvalId: the id is derived from the action alone, so the same action maps
+// to the same id on every call and a different target maps to a different id.
+describe('approvalId', () => {
+  it('is stable for the same action across runs', () => {
+    const a = approvalId({
+      provider: 'codex',
+      kind: 'command',
+      target: 'rm -rf x',
+    })
+    const b = approvalId({
+      provider: 'codex',
+      kind: 'command',
+      target: 'rm -rf x',
+    })
+    expect(a).toBe(b)
+    // Same provider and kind, different target: must not collide.
+    expect(a).not.toBe(
+      approvalId({ provider: 'codex', kind: 'command', target: 'ls' }),
+    )
+  })
+})
+
+// resolveApproval: combines the sandbox policy with any decisions already made
+// by the client. Every result is a { decision, needsApproval } pair; "ask"
+// surfaces as decision 'deny' with needsApproval true.
+describe('resolveApproval', () => {
+  // Shared policy: one command rule per outcome, two coarse capability rules,
+  // and 'ask' as the fallback.
+  const policy = defineSandboxPolicy({
+    commands: { allow: ['ls'], ask: ['rm *'], deny: ['sudo *'] },
+    capabilities: { fileWrite: 'ask', network: 'deny' },
+    default: 'ask',
+  })
+
+  it('allows / denies per command policy without asking', () => {
+    expect(
+      resolveApproval({ policy, approvals: undefined, id: 'x', command: 'ls' }),
+    ).toEqual({
+      decision: 'allow',
+      needsApproval: false,
+    })
+    expect(
+      resolveApproval({
+        policy,
+        approvals: undefined,
+        id: 'x',
+        command: 'sudo reboot',
+      }),
+    ).toEqual({ decision: 'deny', needsApproval: false })
+  })
+
+  it('asks (deny + needsApproval) when policy says ask and no decision yet', () => {
+    expect(
+      resolveApproval({
+        policy,
+        approvals: undefined,
+        id: 'rm',
+        command: 'rm file',
+      }),
+    ).toEqual({ decision: 'deny', needsApproval: true })
+  })
+
+  it('honors the client decision on the resumed run', () => {
+    // A recorded decision for this id settles the question either way, so
+    // needsApproval is false in both cases.
+    const granted = new Map([['rm', true]])
+    expect(
+      resolveApproval({
+        policy,
+        approvals: granted,
+        id: 'rm',
+        command: 'rm file',
+      }),
+    ).toEqual({ decision: 'allow', needsApproval: false })
+    const denied = new Map([['rm', false]])
+    expect(
+      resolveApproval({
+        policy,
+        approvals: denied,
+        id: 'rm',
+        command: 'rm file',
+      }),
+    ).toEqual({ decision: 'deny', needsApproval: false })
+  })
+
+  it('resolves coarse capability rules (fileWrite ask, network deny)', () => {
+    expect(
+      resolveApproval({
+        policy,
+        approvals: undefined,
+        id: 'w',
+        capability: 'fileWrite',
+      }),
+    ).toEqual({ decision: 'deny', needsApproval: true })
+    expect(
+      resolveApproval({
+        policy,
+        approvals: undefined,
+        id: 'n',
+        capability: 'network',
+      }),
+    ).toEqual({ decision: 'deny', needsApproval: false })
+  })
+
+  it('defaults to ask when no policy', () => {
+    expect(
+      resolveApproval({
+        policy: undefined,
+        approvals: undefined,
+        id: 'x',
+        command: 'anything',
+      }),
+    ).toEqual({
+      decision: 'deny',
+      needsApproval: true,
+    })
+  })
+})
+
+// buildApprovalRequestedEvent: the event must be a CUSTOM event named
+// APPROVAL_REQUESTED_EVENT whose value carries the approvalId unchanged.
+describe('buildApprovalRequestedEvent', () => {
+  it('builds an AG-UI CUSTOM event carrying the approvalId', () => {
+    // The cast narrows the result to just the fields asserted on below.
+    const event = buildApprovalRequestedEvent({
+      approvalId: 'codex:command:rm -rf x',
+      title: 'Run: rm -rf x',
+      threadId: 't',
+      runId: 'r',
+    }) as { type: string; name: string; value: { approvalId: string } }
+    expect(event.type).toBe('CUSTOM')
+    expect(event.name).toBe(APPROVAL_REQUESTED_EVENT)
+    expect(event.value.approvalId).toBe('codex:command:rm -rf x')
+  })
+})
diff --git a/packages/ai-sandbox/tests/ensure.test.ts b/packages/ai-sandbox/tests/ensure.test.ts
new file mode 100644
index 000000000..506bb579c
--- /dev/null
+++ b/packages/ai-sandbox/tests/ensure.test.ts
@@ -0,0 +1,143 @@
+import { describe, expect, it } from 'vitest'
+import { defineSandbox } from '../src/sandbox'
+import { defineWorkspace, githubRepo } from '../src/workspace'
+import { InMemoryLockStore, InMemorySandboxStore } from '../src/store'
+import { FULL_CAPS, makeFakeProvider } from './fakes'
+import type { SandboxCapabilities } from '../src/contracts'
+
+/**
+ * Fresh ensure-context for one test: fixed thread/run ids plus brand-new
+ * in-memory stores, so no state leaks from one test into the next.
+ */
+const baseCtx = () => {
+  const store = new InMemorySandboxStore()
+  const locks = new InMemoryLockStore()
+  return {
+    threadId: 'thread-1',
+    runId: 'run-1',
+    store,
+    locks,
+  }
+}
+
+// Workspace shared by every test below: a GitHub source plus two setup
+// commands.
+const workspace = defineWorkspace({
+  source: githubRepo({ repo: 'TanStack/ai' }),
+  setup: ['corepack enable', 'pnpm install'],
+})
+
+// ensureSandbox: drives `def.ensure` / `def.destroy` against a fake provider
+// and asserts on the provider's call counters and on the SandboxStore record.
+// Each test builds its own provider and context, so counters start at zero.
+describe('ensureSandbox algorithm', () => {
+  it('creates + bootstraps + records on first run', async () => {
+    const provider = makeFakeProvider()
+    const def = defineSandbox({ id: 'repo', provider, workspace })
+    const ctx = baseCtx()
+
+    const handle = await def.ensure(ctx)
+
+    expect(provider.calls.create).toBe(1)
+    expect(provider.calls.resume).toBe(0)
+    // bootstrap cloned the repo + can run setup (fake handle tracks files)
+    const files = (handle as unknown as { files: Map<string, string> }).files
+    expect(files.has('/workspace/.git')).toBe(true)
+    // recorded in the store under the compound key
+    const rec = await ctx.store.get(def.key(ctx))
+    expect(rec?.providerSandboxId).toBe(handle.id)
+    expect(rec?.threadId).toBe('thread-1')
+  })
+
+  it('resumes the same provider sandbox on a second run (reuse: thread)', async () => {
+    const provider = makeFakeProvider()
+    const def = defineSandbox({ id: 'repo', provider, workspace })
+    const ctx = baseCtx()
+
+    // Same thread and store, different run id.
+    const first = await def.ensure(ctx)
+    const second = await def.ensure({ ...ctx, runId: 'run-2' })
+
+    expect(provider.calls.create).toBe(1)
+    expect(provider.calls.resume).toBe(1)
+    expect(second.id).toBe(first.id)
+    // latestRunId advanced
+    const rec = await ctx.store.get(def.key(ctx))
+    expect(rec?.latestRunId).toBe('run-2')
+  })
+
+  it('falls back to snapshot restore when resume returns null', async () => {
+    const provider = makeFakeProvider({ resumeReturnsNull: true })
+    const def = defineSandbox({
+      id: 'repo',
+      provider,
+      workspace,
+      lifecycle: { reuse: 'thread', snapshot: 'after-setup' },
+    })
+    const ctx = baseCtx()
+
+    await def.ensure(ctx) // create + after-setup snapshot recorded
+    const restored = await def.ensure({ ...ctx, runId: 'run-2' })
+
+    expect(provider.calls.resume).toBe(1)
+    expect(provider.calls.restoreSnapshot).toBe(1)
+    // The fake provider puts "restored" in the id of restored handles.
+    expect(restored.id).toContain('restored')
+  })
+
+  it('re-creates under the same identity when provider lacks durable fs + snapshots', async () => {
+    const ephemeralCaps: SandboxCapabilities = {
+      ...FULL_CAPS,
+      snapshots: false,
+      durableFilesystem: false,
+    }
+    const provider = makeFakeProvider({
+      resumeReturnsNull: true,
+      caps: ephemeralCaps,
+    })
+    const def = defineSandbox({
+      id: 'repo',
+      provider,
+      workspace,
+      lifecycle: { reuse: 'thread', snapshot: 'after-setup' },
+    })
+    const ctx = baseCtx()
+
+    await def.ensure(ctx)
+    await def.ensure({ ...ctx, runId: 'run-2' })
+
+    // resume tried + failed, no snapshot path, so a fresh create both times
+    expect(provider.calls.create).toBe(2)
+    expect(provider.calls.restoreSnapshot).toBe(0)
+  })
+
+  it('reuse: none keys each run separately (no resume)', async () => {
+    const provider = makeFakeProvider()
+    const def = defineSandbox({
+      id: 'repo',
+      provider,
+      workspace,
+      lifecycle: { reuse: 'none' },
+    })
+    const ctx = baseCtx()
+
+    await def.ensure(ctx)
+    await def.ensure({ ...ctx, runId: 'run-2' })
+
+    expect(provider.calls.create).toBe(2)
+    expect(provider.calls.resume).toBe(0)
+  })
+
+  it('destroy removes the record and destroys the provider sandbox', async () => {
+    const provider = makeFakeProvider()
+    const def = defineSandbox({ id: 'repo', provider, workspace })
+    const ctx = baseCtx()
+
+    await def.ensure(ctx)
+    await def.destroy(ctx)
+
+    expect(provider.calls.destroy).toBe(1)
+    expect(await ctx.store.get(def.key(ctx))).toBeNull()
+  })
+
+  it('serializes concurrent ensures for the same key (one create)', async () => {
+    const provider = makeFakeProvider()
+    const def = defineSandbox({ id: 'repo', provider, workspace })
+    const ctx = baseCtx()
+
+    // Both calls start before either finishes and share one store + lock store.
+    const [a, b] = await Promise.all([
+      def.ensure(ctx),
+      def.ensure({ ...ctx, runId: 'run-2' }),
+    ])
+
+    // The lock forces serialization: the second sees the first's record and resumes.
+    expect(provider.calls.create).toBe(1)
+    expect(provider.calls.resume).toBe(1)
+    expect(a.id).toBe(b.id)
+  })
+})
diff --git a/packages/ai-sandbox/tests/fakes.ts b/packages/ai-sandbox/tests/fakes.ts
new file mode 100644
index 000000000..e95bf04f7
--- /dev/null
+++ b/packages/ai-sandbox/tests/fakes.ts
@@ -0,0 +1,156 @@
+import type {
+  ExecResult,
+  SandboxCapabilities,
+  SandboxCreateInput,
+  SandboxDestroyInput,
+  SandboxHandle,
+  SandboxProvider,
+  SandboxResumeInput,
+  SandboxRestoreInput,
+  SnapshotRef,
+} from '../src/contracts'
+
+/**
+ * Capability set with every flag switched on. Used as the default for the
+ * fakes below; spread it and override individual flags to model a more
+ * limited provider.
+ */
+export const FULL_CAPS: SandboxCapabilities = {
+  fs: true,
+  exec: true,
+  env: true,
+  ports: true,
+  backgroundProcesses: true,
+  snapshots: true,
+  networkPolicy: true,
+  durableFilesystem: true,
+  fork: true,
+}
+
+/**
+ * Build a fake {@link SandboxHandle} for tests.
+ *
+ * File contents live in an in-memory `files` map that `fs.read`, `fs.write`,
+ * `fs.remove` and `fs.exists` operate on; `git.clone` records a `.git` entry
+ * under the target directory. Everything else is a stub that resolves to a
+ * fixed value. `destroy()` flips the exposed `destroyed` flag.
+ *
+ * @param id - Handle id; also embedded in generated snapshot ids.
+ * @param provider - Provider name reported by the handle.
+ * @param caps - Capabilities reported by the handle; `snapshot` is only
+ *   defined when `caps.snapshots` is true.
+ */
+export function makeFakeHandle(
+  id: string,
+  provider: string,
+  caps: SandboxCapabilities = FULL_CAPS,
+): SandboxHandle & { destroyed: boolean; files: Map<string, string> } {
+  const files = new Map<string, string>()
+  let snapshotCounter = 0
+
+  // In-memory filesystem: only read/write/remove/exists touch `files`.
+  const fs: SandboxHandle['fs'] = {
+    read: (p) => Promise.resolve(files.get(p) ?? ''),
+    readBytes: (p) =>
+      Promise.resolve(new TextEncoder().encode(files.get(p) ?? '')),
+    write: (p, d) => {
+      const text = typeof d === 'string' ? d : new TextDecoder().decode(d)
+      files.set(p, text)
+      return Promise.resolve()
+    },
+    list: () => Promise.resolve([]),
+    mkdir: () => Promise.resolve(),
+    remove: (p) => {
+      files.delete(p)
+      return Promise.resolve()
+    },
+    rename: () => Promise.resolve(),
+    exists: (p) => Promise.resolve(files.has(p)),
+  }
+
+  // Git stub: clone leaves a marker file, everything else is a no-op.
+  const git: SandboxHandle['git'] = {
+    clone: ({ dir }) => {
+      files.set(`${dir ?? '/workspace'}/.git`, 'cloned')
+      return Promise.resolve()
+    },
+    status: () => Promise.resolve(''),
+    add: () => Promise.resolve(),
+    commit: () => Promise.resolve(),
+    push: () => Promise.resolve(),
+    pull: () => Promise.resolve(),
+    branch: () => Promise.resolve('main'),
+  }
+
+  // Process stub: every exec succeeds with empty output.
+  const process: SandboxHandle['process'] = {
+    exec: (): Promise<ExecResult> =>
+      Promise.resolve({ stdout: '', stderr: '', exitCode: 0 }),
+    spawn: () => Promise.reject(new Error('not used in this fake')),
+  }
+
+  // Snapshots exist only for providers that advertise them.
+  let snapshot: SandboxHandle['snapshot'] = undefined
+  if (caps.snapshots) {
+    snapshot = (label) =>
+      Promise.resolve<SnapshotRef>({
+        id: `snap-${id}-${++snapshotCounter}`,
+        label,
+      })
+  }
+
+  const handle: SandboxHandle & {
+    destroyed: boolean
+    files: Map<string, string>
+  } = {
+    id,
+    provider,
+    capabilities: caps,
+    destroyed: false,
+    files,
+    fs,
+    git,
+    process,
+    ports: {
+      connect: (port) => Promise.resolve({ url: `http://localhost:${port}` }),
+    },
+    env: { set: () => Promise.resolve() },
+    snapshot,
+    destroy: () => {
+      handle.destroyed = true
+      return Promise.resolve()
+    },
+  }
+  return handle
+}
+
+/** Knobs for `makeFakeProvider`. */
+export interface FakeProviderOptions {
+  /** Provider name; defaults to `'fake'`. Also prefixes generated handle ids. */
+  name?: string
+  /** Capabilities reported by the provider and its handles; defaults to FULL_CAPS. */
+  caps?: SandboxCapabilities
+  /** Make resume() return null (simulate a sandbox that's gone). */
+  resumeReturnsNull?: boolean
+}
+
+/** A {@link SandboxProvider} that also exposes what was done to it. */
+export interface FakeProvider extends SandboxProvider {
+  /** Number of times each provider method has been invoked. */
+  readonly calls: {
+    create: number
+    resume: number
+    restoreSnapshot: number
+    destroy: number
+  }
+  /** Handles minted by `create` and `restoreSnapshot`, in creation order. */
+  readonly created: Array<SandboxHandle>
+}
+
+/**
+ * Build a fake {@link SandboxProvider} that counts its calls.
+ *
+ * - `create` mints a handle with id `<name>-<n>`.
+ * - `resume` returns a new handle under the requested id, or `null` when
+ *   `resumeReturnsNull` is set. Resumed handles are not added to `created`.
+ * - `restoreSnapshot` exists only when the capabilities include snapshots and
+ *   mints a handle with id `<name>-restored-<n>`.
+ * - `destroy` only counts the call.
+ *
+ * `create` and `restoreSnapshot` share one id counter.
+ */
+export function makeFakeProvider(
+  options: FakeProviderOptions = {},
+): FakeProvider {
+  const name = options.name ?? 'fake'
+  const caps = options.caps ?? FULL_CAPS
+  const calls = { create: 0, resume: 0, restoreSnapshot: 0, destroy: 0 }
+  const created: Array<SandboxHandle> = []
+  let counter = 0
+
+  /** Mint a handle under `handleId` and remember it in `created`. */
+  const mint = (handleId: string): SandboxHandle => {
+    const minted = makeFakeHandle(handleId, name, caps)
+    created.push(minted)
+    return minted
+  }
+
+  const provider: FakeProvider = {
+    name,
+    calls,
+    created,
+    capabilities: () => caps,
+    create: (_input: SandboxCreateInput) => {
+      calls.create++
+      return Promise.resolve(mint(`${name}-${++counter}`))
+    },
+    resume: (_input: SandboxResumeInput) => {
+      calls.resume++
+      return options.resumeReturnsNull
+        ? Promise.resolve(null)
+        : Promise.resolve(makeFakeHandle(_input.id, name, caps))
+    },
+    restoreSnapshot: caps.snapshots
+      ? (_input: SandboxRestoreInput) => {
+          calls.restoreSnapshot++
+          return Promise.resolve(mint(`${name}-restored-${++counter}`))
+        }
+      : undefined,
+    destroy: (_input: SandboxDestroyInput) => {
+      calls.destroy++
+      return Promise.resolve()
+    },
+  }
+  return provider
+}
diff --git a/packages/ai-sandbox/tests/git-exec.test.ts b/packages/ai-sandbox/tests/git-exec.test.ts
new file mode 100644
index 000000000..6efe75388
--- /dev/null
+++ b/packages/ai-sandbox/tests/git-exec.test.ts
@@ -0,0 +1,77 @@
+import { describe, expect, it } from 'vitest'
+import { createExecBackedGit } from '../src/git-exec'
+import type {
+  ExecResult,
+  ProcessOptions,
+  SandboxProcess,
+} from '../src/contracts'
+
+interface ExecCall {
+  command: string // first exec() argument, recorded verbatim
+  options?: ProcessOptions // second exec() argument, if one was passed
+}
+
+/**
+ * Stub SandboxProcess that records every exec() call and resolves it with
+ * exit code 0 and the given stdout; spawn() always rejects as unused.
+ */
+function recordingProcess(stdout = '') {
+  const calls: Array<ExecCall> = []
+  const exec: SandboxProcess['exec'] = (command, options) => {
+    calls.push({ command, options })
+    return Promise.resolve<ExecResult>({ stdout, stderr: '', exitCode: 0 })
+  }
+  const spawn: SandboxProcess['spawn'] = () =>
+    Promise.reject(new Error('unused'))
+  return { process: { exec, spawn }, calls }
+}
+
+describe('createExecBackedGit security', () => {
+  it('keeps the auth token out of argv (env-only credential helper)', async () => {
+    const { process, calls } = recordingProcess()
+    const git = createExecBackedGit(process, '/workspace')
+    await git.clone({
+      url: 'https://github.com/org/repo.git',
+      auth: { username: 'x-access-token', token: 'super-secret-token' },
+    })
+    const { command, options } = calls[0]!
+    // Token must NOT appear in ANY command line (would leak via ps/logs).
+    for (const c of calls) expect(c.command).not.toContain('super-secret-token')
+    // It must be supplied via the child env instead.
+    expect(options?.env?.GIT_ASKPASS_TOKEN).toBe('super-secret-token')
+    // The helper references the env var, not the literal token.
+    expect(command).toContain('credential.helper')
+    expect(command).toContain('${GIT_ASKPASS_TOKEN}')
+  })
+
+  it('inserts a -- end-of-options separator before positionals', async () => {
+    const { process, calls } = recordingProcess()
+    const git = createExecBackedGit(process, '/workspace')
+    await git.clone({ url: 'https://example.com/r.git', dir: '/workspace' })
+    expect(calls[0]!.command).toContain('clone -- ')
+    await git.add(['a.ts', 'b.ts'])
+    expect(calls[1]!.command).toContain('add -- ')
+  })
+
+  it('rejects flag-smuggling values (leading dash)', async () => {
+    const { process } = recordingProcess()
+    const git = createExecBackedGit(process, '/workspace')
+    await expect(
+      git.clone({ url: '--upload-pack=touch /tmp/pwned' }),
+    ).rejects.toThrow(/argument-injection guard/)
+    await expect(git.add(['--output=/etc/x'])).rejects.toThrow(
+      /argument-injection guard/,
+    )
+    await expect(git.status('-C/evil')).rejects.toThrow(
+      /argument-injection guard/,
+    )
+  })
+
+  it('escapes embedded single quotes in values', async () => {
+    const { process, calls } = recordingProcess()
+    const git = createExecBackedGit(process, '/workspace')
+    await git.commit("it's done")
+    // POSIX quoting: close the quote, emit \', reopen - so ' becomes '\''.
+    expect(calls[0]!.command).toContain(`commit -m 'it'\\''s done'`)
+  })
+})
diff --git a/packages/ai-sandbox/tests/key.test.ts b/packages/ai-sandbox/tests/key.test.ts
new file mode 100644
index 000000000..00891c198
--- /dev/null
+++ b/packages/ai-sandbox/tests/key.test.ts
@@ -0,0 +1,76 @@
+import { describe, expect, it } from 'vitest'
+import { computeSandboxKey, computeWorkspaceHash } from '../src/key'
+import { defineWorkspace, githubRepo } from '../src/workspace'
+import type { SandboxKeyInput } from '../src/key'
+
+const base: SandboxKeyInput = {
+  threadId: 'thread-1',
+  sandboxId: 'repo',
+  providerName: 'docker',
+  workspace: defineWorkspace({
+    source: githubRepo({ repo: 'TanStack/ai', ref: 'main' }),
+  }),
+}
+
+describe('computeSandboxKey', () => {
+  it('is stable for identical inputs', () => {
+    expect(computeSandboxKey(base)).toBe(computeSandboxKey({ ...base }))
+  })
+
+  it('changes when thread, sandbox id, provider, or tenant change', () => {
+    const k = computeSandboxKey(base) // baseline; each case varies one field
+    expect(computeSandboxKey({ ...base, threadId: 'thread-2' })).not.toBe(k)
+    expect(computeSandboxKey({ ...base, sandboxId: 'other' })).not.toBe(k)
+    expect(computeSandboxKey({ ...base, providerName: 'cloudflare' })).not.toBe(
+      k,
+    )
+    expect(computeSandboxKey({ ...base, tenant: { orgId: 'acme' } })).not.toBe(
+      k,
+    )
+  })
+
+  it('changes when the workspace source/ref changes (busts stale env)', () => {
+    const k = computeSandboxKey(base) // base workspace pins ref 'main'
+    const otherRef = computeSandboxKey({
+      ...base,
+      workspace: defineWorkspace({
+        source: githubRepo({ repo: 'TanStack/ai', ref: 'next' }),
+      }),
+    })
+    expect(otherRef).not.toBe(k)
+  })
+})
+
+describe('computeWorkspaceHash', () => {
+  it('excludes secrets (rotating a token must not orphan the sandbox)', () => {
+    const a = computeWorkspaceHash(
+      defineWorkspace({
+        source: githubRepo({ repo: 'TanStack/ai' }),
+        secrets: { A: '1' }, // only this secret value differs from `b`
+      }),
+    )
+    const b = computeWorkspaceHash(
+      defineWorkspace({
+        source: githubRepo({ repo: 'TanStack/ai' }),
+        secrets: { A: '2' },
+      }),
+    )
+    expect(a).toBe(b)
+  })
+
+  it('changes when setup/scripts change', () => {
+    const a = computeWorkspaceHash(
+      defineWorkspace({
+        source: githubRepo({ repo: 'TanStack/ai' }),
+        setup: ['pnpm i'], // only this setup command differs from `b`
+      }),
+    )
+    const b = computeWorkspaceHash(
+      defineWorkspace({
+        source: githubRepo({ repo: 'TanStack/ai' }),
+        setup: ['npm i'],
+      }),
+    )
+    expect(a).not.toBe(b)
+  })
+})
diff --git a/packages/ai-sandbox/tests/locks-identity.test.ts b/packages/ai-sandbox/tests/locks-identity.test.ts
new file mode 100644
index 000000000..d448c3970
--- /dev/null
+++ b/packages/ai-sandbox/tests/locks-identity.test.ts
@@ -0,0 +1,17 @@
+import { describe, expect, it } from 'vitest'
+import { LocksCapability as CoreLocksCapability } from '@tanstack/ai'
+import { LocksCapability as SandboxLocksCapability } from '../src/capabilities'
+
+describe('LocksCapability identity', () => {
+  it('is the SAME token object as the one exported by @tanstack/ai', () => {
+    // Capability names must be globally unique; runtime identity is the object
+    // reference, hence `toBe` (Object.is). The sandbox layer must reference the
+    // core token (not a second 'locks' capability) so a persistence-provided
+    // LockStore is visible to withSandbox's optional requirement.
+    expect(SandboxLocksCapability).toBe(CoreLocksCapability)
+  })
+
+  it('is named "locks"', () => {
+    expect(SandboxLocksCapability.capabilityName).toBe('locks')
+  })
+})
diff --git a/packages/ai-sandbox/tests/policy.test.ts b/packages/ai-sandbox/tests/policy.test.ts
new file mode 100644
index 000000000..b591a9015
--- /dev/null
+++ b/packages/ai-sandbox/tests/policy.test.ts
@@ -0,0 +1,54 @@
+import { describe, expect, it } from 'vitest'
+import { defineSandboxPolicy, evaluateCommand } from '../src/policy'
+
+describe('evaluateCommand', () => {
+  const policy = defineSandboxPolicy({
+    commands: {
+      allow: ['pnpm test', 'pnpm typecheck', 'git diff'],
+      ask: ['pnpm install', 'curl *', 'wget *'],
+      deny: ['sudo *', 'rm -rf *'],
+    },
+    default: 'ask',
+  })
+
+  it('allows exact allow matches', () => {
+    expect(evaluateCommand('pnpm test', policy)).toBe('allow')
+    expect(evaluateCommand('git diff', policy)).toBe('allow')
+  })
+
+  it('asks for ask matches incl. globs', () => {
+    expect(evaluateCommand('pnpm install', policy)).toBe('ask')
+    expect(evaluateCommand('curl https://example.com', policy)).toBe('ask')
+  })
+
+  it('denies deny matches incl. globs', () => {
+    expect(evaluateCommand('sudo apt-get update', policy)).toBe('deny')
+    expect(evaluateCommand('rm -rf /', policy)).toBe('deny')
+  })
+
+  it('deny beats ask beats allow (precedence)', () => {
+    const overlap = defineSandboxPolicy({
+      commands: {
+        allow: ['git *'],
+        ask: ['git push *'],
+        deny: ['git push --force*'],
+      },
+    })
+    expect(evaluateCommand('git status', overlap)).toBe('allow')
+    expect(evaluateCommand('git push origin main', overlap)).toBe('ask')
+    expect(evaluateCommand('git push --force origin main', overlap)).toBe(
+      'deny',
+    )
+  })
+
+  it('falls back to default for unmatched commands', () => {
+    expect(evaluateCommand('node script.js', policy)).toBe('ask')
+    expect(evaluateCommand('node script.js', { default: 'deny' })).toBe('deny')
+    expect(evaluateCommand('node script.js', undefined)).toBe('ask')
+  })
+
+  it('does not let glob metachars leak across command boundaries', () => {
+    // 'confirm -rf safe' contains 'rm -rf safe'; a substring hit must not deny.
+    expect(evaluateCommand('confirm -rf safe', policy)).toBe('ask')
+  })
+})
diff --git a/packages/ai-sandbox/tests/runner.test.ts b/packages/ai-sandbox/tests/runner.test.ts
new file mode 100644
index 000000000..62a84642b
--- /dev/null
+++ b/packages/ai-sandbox/tests/runner.test.ts
@@ -0,0 +1,90 @@
+import { describe, expect, it } from 'vitest'
+import { spawnNdjson, toLines } from '../src/runner'
+import type { SandboxHandle, SpawnHandle } from '../src/contracts'
+
+/** Replay `chunks` in order, hopping one microtask before each yield. */
+async function* fromChunks(chunks: Array<string>): AsyncIterable<string> {
+  for (const chunk of chunks) {
+    await Promise.resolve() // defer to mimic real stream scheduling
+    yield chunk
+  }
+}
+
+async function collect<T>(it: AsyncIterable<T>): Promise<Array<T>> {
+  const items: Array<T> = [] // filled in the order the iterable yields
+  for await (const item of it) items.push(item)
+  return items
+}
+
+/** Handle whose process.spawn replays `chunks` as stdout; one-shot stream. */
+function handleSpawning(chunks: Array<string>): SandboxHandle {
+  const spawnHandle: SpawnHandle = {
+    pid: 1,
+    stdout: fromChunks(chunks),
+    stderr: fromChunks([]),
+    stdin: { write: () => Promise.resolve(), end: () => Promise.resolve() },
+    wait: () => Promise.resolve(0),
+    kill: () => Promise.resolve(),
+  }
+  return {
+    id: 'fake',
+    provider: 'fake',
+    capabilities: {
+      fs: true,
+      exec: true,
+      env: true,
+      ports: false,
+      backgroundProcesses: true,
+      snapshots: false,
+      networkPolicy: false,
+      durableFilesystem: false,
+      fork: false,
+    },
+    // Only process.spawn is exercised here; fs and git are empty placeholders.
+    fs: {} as SandboxHandle['fs'],
+    git: {} as SandboxHandle['git'],
+    process: {
+      exec: () => Promise.reject(new Error('unused')),
+      spawn: () => Promise.resolve(spawnHandle),
+    },
+    ports: { connect: () => Promise.reject(new Error('unused')) },
+    env: { set: () => Promise.resolve() },
+    destroy: () => Promise.resolve(),
+  }
+}
+
+describe('toLines', () => {
+  it('reassembles lines split across chunk boundaries', async () => {
+    const lines = await collect(
+      toLines(fromChunks(['{"a":', '1}\n{"b":2', '}\n'])),
+    )
+    expect(lines).toEqual(['{"a":1}', '{"b":2}']) // no '\n' in the output
+  })
+
+  it('emits a trailing unterminated line', async () => {
+    const lines = await collect(toLines(fromChunks(['one\ntwo'])))
+    expect(lines).toEqual(['one', 'two']) // 'two' had no final newline
+  })
+})
+
+describe('spawnNdjson', () => {
+  it('parses NDJSON events from stdout, skipping blank + non-JSON lines', async () => {
+    const nonJson: Array<string> = [] // lines reported via onNonJsonLine
+    const handle = handleSpawning([
+      'Claude Code starting...\n', // banner -> onNonJsonLine
+      '{"type":"text","delta":"hi"}\n',
+      '\n', // blank -> skipped
+      '{"type":"result","ok":true}\n',
+    ])
+    const events = await collect(
+      spawnNdjson(handle, 'claude -p --output-format stream-json', {
+        onNonJsonLine: (l) => nonJson.push(l),
+      }),
+    )
+    expect(events).toEqual([
+      { type: 'text', delta: 'hi' },
+      { type: 'result', ok: true },
+    ])
+    expect(nonJson).toEqual(['Claude Code starting...'])
+  })
+})
diff --git a/packages/ai-sandbox/tests/store.test.ts b/packages/ai-sandbox/tests/store.test.ts
new file mode 100644
index 000000000..184d0d807
--- /dev/null
+++ b/packages/ai-sandbox/tests/store.test.ts
@@ -0,0 +1,64 @@
+import { describe, expect, it } from 'vitest'
+import { InMemoryLockStore, InMemorySandboxStore } from '../src/store'
+
+describe('InMemorySandboxStore', () => {
+  it('round-trips upsert/get/delete', async () => {
+    const store = new InMemorySandboxStore()
+    expect(await store.get('k')).toBeNull() // unknown key reads as null
+    await store.upsert({
+      key: 'k',
+      provider: 'docker',
+      providerSandboxId: 'sbx-1',
+      threadId: 't',
+      updatedAt: 1,
+    })
+    expect((await store.get('k'))?.providerSandboxId).toBe('sbx-1')
+    await store.delete('k')
+    expect(await store.get('k')).toBeNull() // gone again after delete
+  })
+})
+
+describe('InMemoryLockStore', () => {
+  it('serializes same-key critical sections', async () => {
+    const locks = new InMemoryLockStore()
+    const order: Array<string> = []
+    const slow = (tag: string, ms: number) =>
+      locks.withLock('k', async () => {
+        order.push(`${tag}:start`)
+        await new Promise((r) => setTimeout(r, ms))
+        order.push(`${tag}:end`)
+      })
+
+    await Promise.all([slow('a', 20), slow('b', 1)]) // a requests the lock first
+
+    // b cannot start until a fully ends.
+    expect(order).toEqual(['a:start', 'a:end', 'b:start', 'b:end'])
+  })
+
+  it('a rejection in one holder does not poison the lock', async () => {
+    const locks = new InMemoryLockStore()
+    await expect(
+      locks.withLock('k', () => Promise.reject(new Error('boom'))),
+    ).rejects.toThrow('boom')
+    // subsequent acquire still works
+    await expect(
+      locks.withLock('k', () => Promise.resolve('ok')),
+    ).resolves.toBe('ok')
+  })
+
+  it('runs different keys concurrently', async () => {
+    const locks = new InMemoryLockStore()
+    const order: Array<string> = []
+    await Promise.all([
+      locks.withLock('a', async () => {
+        await new Promise((r) => setTimeout(r, 20))
+        order.push('a')
+      }),
+      locks.withLock('b', async () => {
+        order.push('b')
+      }),
+    ])
+    // b (different key) finishes first despite a starting first
+    expect(order).toEqual(['b', 'a'])
+  })
+})
diff --git a/packages/ai-sandbox/tests/tool-bridge.test.ts b/packages/ai-sandbox/tests/tool-bridge.test.ts
new file mode 100644
index 000000000..4f805e732
--- /dev/null
+++ b/packages/ai-sandbox/tests/tool-bridge.test.ts
@@ -0,0 +1,90 @@
+/**
+ * Verifies the host-side MCP tool-proxy bridge using the MCP SDK's own HTTP
+ * client (no `claude` needed): list tools + call a tool, asserting the host
+ * `execute()` runs and the result comes back, plus bearer-token enforcement.
+ */
+import { afterEach, describe, expect, it } from 'vitest'
+import { Client } from '@modelcontextprotocol/sdk/client/index.js'
+import { StreamableHTTPClientTransport } from '@modelcontextprotocol/sdk/client/streamableHttp.js'
+import { startHostToolBridge } from '../src/tool-bridge'
+import type { HostToolBridge } from '../src/tool-bridge'
+import type { AnyTool } from '@tanstack/ai'
+
+let bridge: HostToolBridge | undefined
+
+afterEach(async () => {
+  // Clear the slot even if close() rejects, so no stale bridge is re-closed.
+  await bridge?.close().finally(() => (bridge = undefined))
+})
+
+function tool(name: string, execute: (args: unknown) => unknown): AnyTool {
+  return {
+    name,
+    description: `${name} tool`,
+    inputSchema: { type: 'object', properties: {} },
+    execute,
+  } as unknown as AnyTool // NOTE(review): double cast skips AnyTool checks
+}
+
+describe('startHostToolBridge', () => {
+  it('serves chat() tools over MCP and proxies calls to the host', async () => {
+    let calledWith: unknown
+    bridge = await startHostToolBridge(
+      [
+        tool('getTime', (args) => {
+          calledWith = args
+          return 'high noon'
+        }),
+      ],
+      { hostForSandbox: '127.0.0.1' },
+    )
+
+    const client = new Client({ name: 'test', version: '1.0.0' })
+    const transport = new StreamableHTTPClientTransport(new URL(bridge.url), {
+      requestInit: { headers: { Authorization: `Bearer ${bridge.token}` } },
+    })
+    await client.connect(transport)
+
+    const list = await client.listTools()
+    expect(list.tools.map((t) => t.name)).toContain('getTime')
+
+    const result = await client.callTool({
+      name: 'getTime',
+      arguments: { tz: 'utc' },
+    })
+    expect(calledWith).toEqual({ tz: 'utc' }) // args reached the host execute()
+    expect(JSON.stringify(result.content)).toContain('high noon')
+
+    await client.close()
+  })
+
+  it('reports tool execution errors as MCP tool errors', async () => {
+    bridge = await startHostToolBridge(
+      [
+        tool('boom', () => {
+          throw new Error('kaboom')
+        }),
+      ],
+      { hostForSandbox: '127.0.0.1' },
+    )
+    const client = new Client({ name: 'test', version: '1.0.0' })
+    const transport = new StreamableHTTPClientTransport(new URL(bridge.url), {
+      requestInit: { headers: { Authorization: `Bearer ${bridge.token}` } },
+    })
+    await client.connect(transport)
+    const result = await client.callTool({ name: 'boom', arguments: {} })
+    expect(result.isError).toBe(true)
+    expect(JSON.stringify(result.content)).toContain('kaboom')
+    await client.close()
+  })
+
+  it('rejects requests without the bearer token', async () => {
+    bridge = await startHostToolBridge([tool('noop', () => 'ok')], {
+      hostForSandbox: '127.0.0.1',
+    })
+    const client = new Client({ name: 'test', version: '1.0.0' })
+    const transport = new StreamableHTTPClientTransport(new URL(bridge.url))
+    await expect(client.connect(transport)).rejects.toThrow()
+    await client.close().catch(() => {}) // best-effort after a failed connect
+  })
+})
diff --git a/packages/ai-sandbox/tests/watch.test.ts b/packages/ai-sandbox/tests/watch.test.ts
new file mode 100644
index 000000000..d904ba962
--- /dev/null
+++ b/packages/ai-sandbox/tests/watch.test.ts
@@ -0,0 +1,215 @@
+import { afterEach, describe, expect, it, vi } from 'vitest'
+import { diffSnapshots, watchWorkspace } from '../src/watch'
+import type { SandboxHandle } from '../src/contracts'
+import type { FileEvent } from '../src/watch'
+
+/** Wait on a 5 ms timer so the native watcher's async classify can settle. */
+function flush(): Promise<void> {
+  return new Promise<void>((done) => setTimeout(done, 5))
+}
+
+/** Minimal handle for watcher tests; `fs` overrides win over the defaults. */
+function fakeHandle(fs: Partial<SandboxHandle['fs']>): SandboxHandle {
+  return {
+    id: 'fake',
+    provider: 'fake',
+    capabilities: {
+      fs: true,
+      exec: true,
+      env: true,
+      ports: false,
+      backgroundProcesses: false,
+      snapshots: false,
+      networkPolicy: false,
+      durableFilesystem: false,
+      fork: false,
+    },
+    fs: {
+      read: () => Promise.reject(new Error('unused')),
+      readBytes: () => Promise.reject(new Error('unused')),
+      write: () => Promise.resolve(),
+      list: () => Promise.resolve([]),
+      mkdir: () => Promise.resolve(),
+      remove: () => Promise.resolve(),
+      rename: () => Promise.resolve(),
+      exists: () => Promise.resolve(false),
+      ...fs,
+    },
+    git: {} as SandboxHandle['git'],
+    process: {
+      exec: () => Promise.reject(new Error('unused')),
+      spawn: () => Promise.reject(new Error('unused')),
+    },
+    ports: { connect: () => Promise.reject(new Error('unused')) },
+    env: { set: () => Promise.resolve() },
+    destroy: () => Promise.resolve(),
+  }
+}
+
+describe('diffSnapshots', () => {
+  it('detects create, change, and delete', () => {
+    const prev = new Map([
+      ['/workspace/a.js', '1\t10'],
+      ['/workspace/b.js', '2\t20'],
+    ])
+    const next = new Map([
+      ['/workspace/b.js', '2.5\t25'], // changed signature
+      ['/workspace/c.js', '3\t30'], // new
+    ])
+    const events = diffSnapshots(prev, next, 123) // 123 = event timestamp
+    expect(events).toEqual(
+      expect.arrayContaining([
+        { type: 'change', path: '/workspace/b.js', timestamp: 123 },
+        { type: 'create', path: '/workspace/c.js', timestamp: 123 },
+        { type: 'delete', path: '/workspace/a.js', timestamp: 123 },
+      ]),
+    )
+    expect(events).toHaveLength(3) // arrayContaining alone would allow extras
+  })
+
+  it('emits nothing for identical snapshots', () => {
+    const snap = new Map([['/workspace/a.js', '1\t10']])
+    expect(diffSnapshots(snap, new Map(snap), 1)).toEqual([])
+  })
+})
+
+describe('watchWorkspace (exec-poll)', () => {
+  afterEach(() => vi.useRealTimers())
+
+  it('diffs successive `find` snapshots into file events', async () => {
+    vi.useFakeTimers()
+    const snapshots = [
+      // initial
+      '1.0\t10\t/workspace/a.js\n2.0\t20\t/workspace/b.js\n',
+      // after the agent edits b, adds c, removes a
+      '2.5\t25\t/workspace/b.js\n3.0\t30\t/workspace/c.js\n',
+    ]
+    let call = 0 // exec() count; calls past the end replay the last snapshot
+    const handle = fakeHandle({})
+    handle.process.exec = () =>
+      Promise.resolve({
+        stdout: snapshots[Math.min(call++, snapshots.length - 1)] ?? '',
+        stderr: '',
+        exitCode: 0,
+      })
+
+    const events: Array<FileEvent> = []
+    const watcher = await watchWorkspace(handle, {
+      onEvent: (e) => events.push(e),
+      intervalMs: 100,
+    })
+
+    await vi.advanceTimersByTimeAsync(120) // just past one 100 ms interval
+    await watcher.stop()
+
+    expect(events.map((e) => `${e.type} ${e.path}`).sort()).toEqual([
+      'change /workspace/b.js',
+      'create /workspace/c.js',
+      'delete /workspace/a.js',
+    ])
+  })
+
+  it('does not start polling when the signal is already aborted', async () => {
+    const controller = new AbortController()
+    controller.abort()
+    let execCalls = 0
+    const handle = fakeHandle({})
+    handle.process.exec = () => {
+      execCalls++
+      return Promise.resolve({ stdout: '', stderr: '', exitCode: 0 })
+    }
+    const events: Array<FileEvent> = []
+    const watcher = await watchWorkspace(handle, {
+      onEvent: (e) => events.push(e),
+      intervalMs: 10,
+      signal: controller.signal,
+    })
+    await new Promise((resolve) => setTimeout(resolve, 30)) // 3 intervals, real time
+    await watcher.stop()
+    expect(execCalls).toBe(0)
+    expect(events).toEqual([])
+  })
+})
+
+describe('watchWorkspace (native fs.watch)', () => {
+  it('classifies raw events as create/change/delete via a known-path set', async () => {
+    const present = new Set<string>()
+    let onRaw: (e: { type: string; path: string }) => void = () => undefined
+    const handle = fakeHandle({
+      list: () => Promise.resolve([]),
+      exists: (p) => Promise.resolve(present.has(p)),
+      watch: (_path, cb) => {
+        onRaw = cb
+        return Promise.resolve({ stop: () => Promise.resolve() })
+      },
+    })
+
+    const events: Array<FileEvent> = []
+    const watcher = await watchWorkspace(handle, {
+      onEvent: (e) => events.push(e),
+    })
+
+    present.add('/workspace/x.js')
+    onRaw({ type: 'rename', path: '/workspace/x.js' }) // exists now -> create
+    await flush()
+    onRaw({ type: 'change', path: '/workspace/x.js' })
+    await flush()
+    present.delete('/workspace/x.js')
+    onRaw({ type: 'rename', path: '/workspace/x.js' }) // gone now -> delete
+    await flush()
+
+    await watcher.stop()
+    expect(events.map((e) => e.type)).toEqual(['create', 'change', 'delete'])
+  })
+
+  it('ignores .git / node_modules paths', async () => {
+    let onRaw: (e: { type: string; path: string }) => void = () => undefined
+    const handle = fakeHandle({
+      list: () => Promise.resolve([]),
+      exists: () => Promise.resolve(true),
+      watch: (_path, cb) => {
+        onRaw = cb
+        return Promise.resolve({ stop: () => Promise.resolve() })
+      },
+    })
+    const events: Array<FileEvent> = []
+    const watcher = await watchWorkspace(handle, {
+      onEvent: (e) => events.push(e),
+    })
+
+    onRaw({ type: 'change', path: '/workspace/.git/index' })
+    onRaw({ type: 'change', path: '/workspace/node_modules/x/index.js' })
+    await flush()
+
+    await watcher.stop()
+    expect(events).toEqual([])
+  })
+
+  it('honors a custom root when classifying native events', async () => {
+    const present = new Set<string>()
+    let onRaw: (e: { type: string; path: string }) => void = () => undefined
+    const handle = fakeHandle({
+      list: () => Promise.resolve([]),
+      exists: (p) => Promise.resolve(present.has(p)),
+      watch: (_path, cb) => {
+        onRaw = cb
+        return Promise.resolve({ stop: () => Promise.resolve() })
+      },
+    })
+    const events: Array<FileEvent> = []
+    const watcher = await watchWorkspace(handle, {
+      onEvent: (e) => events.push(e),
+      root: '/workspace/sub',
+    })
+
+    present.add('/workspace/sub/a.ts')
+    onRaw({ type: 'rename', path: '/workspace/sub/a.ts' }) // exists -> create
+    await flush()
+    present.delete('/workspace/sub/a.ts')
+    onRaw({ type: 'rename', path: '/workspace/sub/a.ts' }) // gone -> delete
+    await flush()
+
+    await watcher.stop()
+    expect(events.map((e) => e.type)).toEqual(['create', 'delete'])
+  })
+})
diff --git a/packages/ai-sandbox/tests/with-sandbox-hooks.test.ts b/packages/ai-sandbox/tests/with-sandbox-hooks.test.ts
new file mode 100644
index 000000000..74cfb83d5
--- /dev/null
+++ b/packages/ai-sandbox/tests/with-sandbox-hooks.test.ts
@@ -0,0 +1,126 @@
+import { describe, expect, it } from 'vitest'
+import { provideSandboxRuntime } from '@tanstack/ai/adapter-internals'
+import { resolveDebugOption } from '@tanstack/ai/adapter-internals'
+import { defineSandbox } from '../src/sandbox'
+import { withSandbox } from '../src/middleware'
+import type { SandboxFileEvent } from '@tanstack/ai'
+import type { ChatMiddlewareContext } from '@tanstack/ai'
+import type { SandboxHandle, SandboxProvider } from '../src/contracts'
+
+// Fake handle whose fs.watch captures the callback so tests can fire events.
+function fakeHandleAndFire(present: Set<string>) {
+  let onRaw: (e: { type: string; path: string }) => void = () => undefined
+  const handle: SandboxHandle = {
+    id: 'fake',
+    provider: 'fake',
+    capabilities: {
+      fs: true,
+      exec: true,
+      env: true,
+      ports: false,
+      backgroundProcesses: false,
+      snapshots: false,
+      networkPolicy: false,
+      durableFilesystem: false,
+      fork: false,
+    },
+    fs: {
+      read: () => Promise.reject(new Error('x')),
+      readBytes: () => Promise.reject(new Error('x')),
+      write: () => Promise.resolve(),
+      list: () => Promise.resolve([]),
+      mkdir: () => Promise.resolve(),
+      remove: () => Promise.resolve(),
+      rename: () => Promise.resolve(),
+      exists: (p) => Promise.resolve(present.has(p)),
+      watch: (_p, cb) => {
+        onRaw = cb // until watch() is called, fire() hits the no-op default
+        return Promise.resolve({ stop: () => Promise.resolve() })
+      },
+    },
+    git: {} as SandboxHandle['git'],
+    process: {
+      exec: () => Promise.reject(new Error('x')),
+      spawn: () => Promise.reject(new Error('x')),
+    },
+    ports: { connect: () => Promise.reject(new Error('x')) },
+    env: { set: () => Promise.resolve() },
+    destroy: () => Promise.resolve(),
+  }
+  return { handle, fire: (e: { type: string; path: string }) => onRaw(e) }
+}
+
+/** Provider stub wired to a single pre-built handle. */
+function fakeProvider(handle: SandboxHandle): SandboxProvider {
+  // create() and resume() both resolve to the one handle passed in.
+  const give = () => Promise.resolve(handle)
+  // Read lazily so callers always see the handle's current capabilities.
+  const capabilities = () => handle.capabilities
+  const destroy = () => Promise.resolve()
+  return { name: 'fake', capabilities, create: give, resume: give, destroy }
+}
+
+function makeCtx(): ChatMiddlewareContext {
+  return {
+    threadId: 't',
+    runId: 'r',
+    capabilities: { markProvided: () => undefined },
+    getOptional: () => undefined,
+  } as unknown as ChatMiddlewareContext // partial stub: only these four fields
+}
+
+const flush = () => new Promise((r) => setTimeout(r, 5)) // 5 ms timer wait
+
+describe('withSandbox hooks', () => {
+  it('fires defineSandbox file hooks and emits via the runtime sink', async () => {
+    const present = new Set<string>()
+    const { handle, fire } = fakeHandleAndFire(present)
+    const created: Array<SandboxFileEvent> = []
+    const emitted: Array<SandboxFileEvent> = []
+
+    const sandbox = defineSandbox({
+      id: 's',
+      provider: fakeProvider(handle),
+      hooks: { onFileCreate: (e) => void created.push(e) },
+    })
+
+    const ctx = makeCtx()
+    provideSandboxRuntime(ctx, {
+      logger: resolveDebugOption(false),
+      emit: (e) => void emitted.push(e),
+    })
+
+    const mw = withSandbox(sandbox)
+    await mw.setup!(ctx)
+
+    present.add('/workspace/new.ts')
+    fire({ type: 'rename', path: '/workspace/new.ts' }) // exists -> create
+    await flush()
+
+    expect(created.map((e) => e.type)).toEqual(['create'])
+    expect(emitted.map((e) => e.path)).toEqual(['/workspace/new.ts'])
+
+    await mw.onFinish!(ctx, { finishReason: 'stop', duration: 0, content: '' })
+  })
+
+  it('does not watch when fileEvents is false', async () => {
+    const { handle, fire } = fakeHandleAndFire(new Set())
+    const emitted: Array<SandboxFileEvent> = []
+    const sandbox = defineSandbox({
+      id: 's',
+      provider: fakeProvider(handle),
+      fileEvents: false,
+    })
+    const ctx = makeCtx()
+    provideSandboxRuntime(ctx, {
+      logger: resolveDebugOption(false),
+      emit: (e) => void emitted.push(e),
+    })
+    const mw = withSandbox(sandbox)
+    await mw.setup!(ctx)
+    fire({ type: 'rename', path: '/workspace/x.ts' })
+    await flush()
+    expect(emitted).toEqual([]) // nothing reached the runtime sink
+    await mw.onFinish!(ctx, { finishReason: 'stop', duration: 0, content: '' })
+  })
+})
diff --git a/packages/ai-sandbox/tsconfig.json b/packages/ai-sandbox/tsconfig.json
new file mode 100644
index 000000000..c38689f4e
--- /dev/null
+++ b/packages/ai-sandbox/tsconfig.json
@@ -0,0 +1,8 @@
+{
+  "extends": "../../tsconfig.base.json",
+  "compilerOptions": {
+    "outDir": "dist"
+  },
+  "include": ["src", "tests"],
+  "exclude": ["node_modules", "dist"]
+}
diff --git a/packages/ai-sandbox/vite.config.ts b/packages/ai-sandbox/vite.config.ts
new file mode 100644
index 000000000..11f5b20b7
--- /dev/null
+++ b/packages/ai-sandbox/vite.config.ts
@@ -0,0 +1,37 @@
+import { defineConfig, mergeConfig } from 'vitest/config'
+import { tanstackViteConfig } from '@tanstack/vite-config'
+import packageJson from './package.json'
+
+const config = defineConfig({
+  test: {
+    name: packageJson.name,
+    dir: './',
+    watch: false, // run once; never enter watch mode
+
+    globals: true,
+    environment: 'node',
+    include: ['tests/**/*.test.ts'],
+    coverage: {
+      provider: 'v8',
+      reporter: ['text', 'json', 'html', 'lcov'],
+      exclude: [
+        'node_modules/',
+        'dist/',
+        'tests/',
+        '**/*.test.ts',
+        '**/*.config.ts',
+        '**/types.ts',
+      ],
+      include: ['src/**/*.ts'],
+    },
+  },
+})
+
+export default mergeConfig(
+  config,
+  tanstackViteConfig({
+    entry: ['./src/index.ts'],
+    srcDir: './src',
+    cjs: false, // NOTE(review): presumably ESM-only output - confirm
+  }),
+)
diff --git a/packages/ai/skills/ai-core/persistence/SKILL.md b/packages/ai/skills/ai-core/persistence/SKILL.md
new file mode 100644
index 000000000..34f40026a
--- /dev/null
+++ b/packages/ai/skills/ai-core/persistence/SKILL.md
@@ -0,0 +1,100 @@
+---
+name: ai-core/persistence
+description: >
+  Durable, resumable chat() via withPersistence middleware. Persists thread
+  messages, run records, an append-only AG-UI event log, usage, approvals, and
+  artifacts. Stamps each chunk with an opaque resume cursor; chat({ cursor })
+  replays the event tail and (for harness adapters) re-attaches live. Backends:
+  memoryPersistence, sqlitePersistence, postgresPersistence, cloudflarePersistence,
+  drizzlePersistence, prismaPersistence (shared SQL core). Use for resumable
+  conversations, multi-device threads, audit/history, and agent-mode sandboxes.
+type: sub-skill
+library: tanstack-ai
+library_version: '0.30.0'
+sources:
+  - 'TanStack/ai:docs/persistence/overview.md'
+---
+
+# Persistence
+
+> **Dependency note:** This skill builds on ai-core and ai-core/middleware. Read those first.
+
+## Core rules
+
+- Persistence is **opt-in middleware** and fully optional. A `chat()` with no
+  persistence middleware is unchanged. It works with AND without a sandbox.
+- `withPersistence(persistence, { mode? })` maps onto the real middleware hooks:
+  `setup` (create/resume run + provide capabilities), `onConfig` (load+merge
+  thread messages, server-authoritative), `onChunk` (assign per-run seq, stamp
+  in-band `cursor`, append to the event log), `onFinish`/`onError`/`onAbort`
+  (run status + usage + transcript save).
+- The persisted log is the AG-UI `StreamChunk` stream itself — there is NO
+  separate event type. Agent activity rides on well-known `CUSTOM` events
+  (`CUSTOM_EVENT.FILE_CHANGED`, `PROCESS_STDOUT`, `APPROVAL_REQUESTED`, …,
+  exported from `@tanstack/ai`).
+- A `cursor` is opaque (a monotonic per-run sequence). Pass the client's last
+  cursor as `chat({ cursor })` to replay the tail after it. Do NOT parse it.
+- `mode`: `'messages'` (history only) | `'chat'` (messages + runs + events +
+  usage) | `'agent'` (+ sandbox records, approvals, artifacts).
+
+## Server — persisted, resumable endpoint
+
+```ts
+import { chat } from '@tanstack/ai'
+import { anthropicText } from '@tanstack/ai-anthropic/adapters'
+import { withPersistence } from '@tanstack/ai-persistence'
+import { sqlitePersistence } from '@tanstack/ai-persistence-sqlite'
+
+const persistence = sqlitePersistence({
+  path: '.tanstack-ai/state.sqlite',
+  mode: 'chat',
+})
+
+export async function POST(request: Request) {
+  const { messages, threadId, runId, cursor } = await request.json()
+  return chat({
+    threadId,
+    runId,
+    cursor,
+    adapter: anthropicText({ model: 'claude-sonnet-4-6' }),
+    messages,
+    middleware: [withPersistence(persistence)],
+  }).toResponse()
+}
+```
+
+## Client — auto-resume
+
+`useChat` auto-resumes by default (`autoResume: false` to opt out). The headless
+client tracks the cursor; `chat.maybeAutoResume()` (call on mount / online),
+`chat.resume()`, and `chat.getResumeState()` drive it.
+
+## Backends
+
+```ts
+import { memoryPersistence } from '@tanstack/ai-persistence' // tests/prototypes
+import { sqlitePersistence } from '@tanstack/ai-persistence-sqlite' // { path } | { db }
+import { postgresPersistence } from '@tanstack/ai-persistence-postgres' // { connectionString } | { client }
+import { drizzlePersistence } from '@tanstack/ai-persistence-drizzle' // { db, dialect }
+import { prismaPersistence } from '@tanstack/ai-persistence-prisma' // { prisma, dialect }
+import { cloudflarePersistence } from '@tanstack/ai-persistence-cloudflare' // { d1, durableObjects?, r2? }
+```
+
+Raw drivers auto-migrate (opt out with `{ migrate: false }` + the exported
+`migrate`/`ddl`). Drizzle and Prisma own their schema.
+
+## Agent mode (sandboxes)
+
+`@tanstack/ai-sandbox-persistence` provides `createSqlSandboxStore(driver)` and
+`withPersistenceBridge({ persistence, sandboxStore })` — order it between
+`withPersistence` and `withSandbox` to make sandbox resume + ensure-locking
+durable across processes. The shared `locks` capability lives in `@tanstack/ai`.
+
+## Gotchas
+
+- `ModelMessage` has no id; message reconciliation is whole-transcript and
+  server-authoritative (client messages win when present, else stored history).
+- Replaying a run does NOT re-run the adapter; a still-running harness adapter
+  (`supportsReattach`) continues live after the replay.
+- Custom middleware that returns a chunk must spread it (`{ ...chunk }`) so the
+  in-band `cursor` survives.
diff --git a/packages/ai/src/activities/chat/index.ts b/packages/ai/src/activities/chat/index.ts
index 9a71cb9cc..b5933d78d 100644
--- a/packages/ai/src/activities/chat/index.ts
+++ b/packages/ai/src/activities/chat/index.ts
@@ -10,6 +10,7 @@ import { stripToSpecMiddleware } from '../../strip-to-spec-middleware'
 import { streamToText } from '../../stream-to-response.js'
 import { resolveDebugOption } from '../../logger/resolve'
 import { EventType } from '../../types'
+import { getResumeSource } from '../../resume'
 import { normalizeToolResult } from '../../utilities/tool-result'
 import { LazyToolManager } from './tools/lazy-tool-manager'
 import {
@@ -25,6 +26,7 @@ import {
 import { maxIterations as maxIterationsStrategy } from './agent-loop-strategies'
 import { convertMessagesToModelMessages, generateMessageId } from './messages'
 import { MiddlewareRunner } from './middleware/compose'
+import { provideSandboxRuntime } from './middleware/sandbox-runtime'
 import { CapabilityRegistry } from './middleware/capabilities'
 import { validateCapabilities } from './middleware/validate'
 import { MCPManager } from './mcp/manager'
@@ -60,6 +62,7 @@ import type {
   ChatMiddleware,
   ChatMiddlewareConfig,
   ChatMiddlewareContext,
+  SandboxFileEvent,
   StructuredOutputMiddlewareConfig,
 } from './middleware/types'
 import type { CheckCoverage } from './middleware/builder'
@@ -237,6 +240,12 @@ export interface TextActivityOptions<
   runId?: TextOptions['runId']
   /** Parent run ID for AG-UI protocol nested run correlation. */
   parentRunId?: TextOptions['parentRunId']
+  /**
+   * Resume cursor. When provided with a resume source (e.g. via
+   * `withPersistence`), the engine replays persisted events after this cursor
+   * instead of running the adapter. A no-op when no resume source is present.
+   */
+  cursor?: TextOptions['cursor']
   /**
    * Optional Standard Schema for structured output.
    * When provided, the activity will:
@@ -514,10 +523,13 @@ class TextEngine<
   private readonly threadId: string
   private readonly runIdOverride?: string
   private readonly parentRunIdOverride?: string
+  /** Resume cursor supplied by the caller; drives the resume seam (no-op without a resume source). */
+  private readonly cursorInput?: string
 
   // Middleware support
   private readonly middlewareRunner: MiddlewareRunner<TContext>
   private readonly middlewareCtx: ChatMiddlewareContext<TContext>
+  private readonly sandboxFileQueue: Array<StreamChunk> = []
   private readonly deferredPromises: Array<Promise<unknown>> = []
   private abortReason?: string
   private readonly middlewareAbortController?: AbortController
@@ -609,6 +621,7 @@ class TextEngine<
       this.createId('thread')
     this.runIdOverride = config.params.runId
     this.parentRunIdOverride = config.params.parentRunId
+    this.cursorInput = config.params.cursor
 
     // Initialize middleware — devtools first, strip-to-spec always last.
     // handleStreamChunk processes raw chunks BEFORE middleware, so internal
@@ -674,6 +687,21 @@ class TextEngine<
         capability[0](this.middlewareCtx, { optional: true }),
       provide: (capability, value) => capability[1](this.middlewareCtx, value),
     }
+
+    // Provide the internal SandboxRuntime capability so harness adapters and
+    // sandbox middleware can emit file events. The sink logs, fans the event
+    // out through the middleware `onFile*` hooks (fire-and-forget), and queues
+    // a `sandbox.file` custom chunk to be drained into the public stream.
+    provideSandboxRuntime(this.middlewareCtx, {
+      logger: this.logger,
+      emit: (event: SandboxFileEvent) => {
+        this.logger.sandbox(`file ${event.type} ${event.path}`, { event })
+        void this.middlewareRunner.runSandboxFile(this.middlewareCtx, event)
+        this.sandboxFileQueue.push(
+          this.createCustomEventChunk('sandbox.file', { ...event }),
+        )
+      },
+    })
   }
 
   /** Get the accumulated content after the chat loop completes */
@@ -713,6 +741,52 @@ class TextEngine<
     return this.finalizationError
   }
 
+  /**
+   * Resume seam. When the caller supplied a `cursor` and a `ResumeSource` was
+   * provided by middleware (e.g. `withPersistence`) for this run, replay the
+   * persisted event tail after the cursor and return `true` (run handled by
+   * replay). Returns `false` without yielding when there is no cursor, no
+   * resume source, or no persisted run — so a normal run proceeds unchanged.
+   *
+   * Also returns `false` AFTER replaying when the run is still `'running'` and
+   * the adapter declares `supportsReattach`, so the agent loop continues live
+   * from where the replayed tail ended.
+   */
+  private async *maybeResume(): AsyncGenerator<StreamChunk, boolean> {
+    const cursor = this.cursorInput
+    if (cursor === undefined) {
+      return false
+    }
+    const source = getResumeSource(this.middlewareCtx, { optional: true })
+    if (!source) {
+      return false
+    }
+    const runId = this.middlewareCtx.runId
+    if (!(await source.hasRun(runId))) {
+      return false
+    }
+    for await (const chunk of source.replay(runId, cursor)) {
+      yield chunk
+    }
+    // If the run is still in flight AND the adapter can re-attach to its live
+    // source (a harness adapter re-attaching to the still-running in-sandbox
+    // process), fall through to the agent loop to continue live. Otherwise
+    // (completed run, or a model adapter with no live source) replay is terminal.
+    const status = await source.getStatus(runId)
+    if (status === 'running' && this.adapterSupportsReattach()) {
+      return false
+    }
+    return true
+  }
+
+  /** Whether the adapter declares it can re-attach to a live run on resume. */
+  private adapterSupportsReattach(): boolean {
+    return (
+      'supportsReattach' in this.adapter &&
+      (this.adapter as { supportsReattach?: boolean }).supportsReattach === true
+    )
+  }
+
   async *run(): AsyncGenerator<StreamChunk> {
     this.beforeRun()
     this.logger.agentLoop('run started', {
@@ -735,6 +809,15 @@ class TextEngine<
       // Run onStart (devtools middleware emits text:request:started and initial messages here)
       await this.middlewareRunner.runOnStart(this.middlewareCtx)
 
+      // Resume seam: when a cursor was supplied AND a resume source is available
+      // for this run, replay the persisted event tail. Stop here when replay was
+      // terminal; fall through when nothing was replayed (no resume source/run)
+      // or when a re-attachable adapter should continue the still-running run.
+      const resumed = yield* this.maybeResume()
+      if (resumed) {
+        return
+      }
+
       const pendingPhase = yield* this.checkForPendingToolCalls()
       if (pendingPhase === 'wait') {
         return
@@ -994,6 +1077,10 @@ class TextEngine<
       threadId: this.threadId,
       runId: this.runIdOverride,
       parentRunId: this.parentRunIdOverride,
+      // Expose provided capabilities (e.g. sandbox) to harness adapters.
+      capabilities: this.middlewareCtx,
+      // Client approval decisions, for harness interactive-approval resolution.
+      approvals: this.initialApprovals,
       ...(combinedSchema ? { outputSchema: combinedSchema } : {}),
     })) {
       if (this.isCancelled()) {
@@ -1078,10 +1165,16 @@ class TextEngine<
         await this.middlewareRunner.runOnUsage(this.middlewareCtx, chunk.usage)
       }
 
+      // Drain any sandbox.file events emitted while processing this chunk.
+      yield* this.drainSandboxFileQueue()
+
       if (this.earlyTermination) {
         break
       }
     }
+
+    // Drain any remaining sandbox.file events emitted after the stream ended.
+    yield* this.drainSandboxFileQueue()
   }
 
   private handleStreamChunk(chunk: StreamChunk): void {
@@ -2437,6 +2530,17 @@ class TextEngine<
     }
   }
 
+  /**
+   * Drain queued `sandbox.file` chunks (emitted via the SandboxRuntime sink),
+   * oldest first, through the middleware pipeline into the public stream.
+   */
+  private async *drainSandboxFileQueue(): AsyncGenerator<StreamChunk> {
+    while (this.sandboxFileQueue.length > 0) {
+      const chunk = this.sandboxFileQueue.shift()
+      if (chunk) yield* this.pipeThroughMiddleware(chunk)
+    }
+  }
+
   /**
    * Drain an executeToolCalls async generator, yielding any CustomEvent chunks
    * through the middleware pipeline and returning the final ExecuteToolCallsResult.
diff --git a/packages/ai/src/activities/chat/middleware/compose.ts b/packages/ai/src/activities/chat/middleware/compose.ts
index bab6a9a03..cdd4ca552 100644
--- a/packages/ai/src/activities/chat/middleware/compose.ts
+++ b/packages/ai/src/activities/chat/middleware/compose.ts
@@ -11,6 +11,7 @@ import type {
   ErrorInfo,
   FinishInfo,
   IterationInfo,
+  SandboxFileEvent,
   StructuredOutputMiddlewareConfig,
   ToolCallHookContext,
   ToolPhaseCompleteInfo,
@@ -344,6 +345,39 @@ export class MiddlewareRunner<TContext = unknown> {
     return chunks
   }
 
+  /**
+   * Dispatch a sandbox file event to every middleware's `sandbox` hooks, in
+   * array order: the catch-all `onFile` then the type-specific hook, awaited
+   * one at a time. A throwing hook is logged under its own name and swallowed.
+   */
+  async runSandboxFile(
+    ctx: ChatMiddlewareContext<TContext>,
+    event: SandboxFileEvent,
+  ): Promise<void> {
+    const typed = (
+      {
+        create: 'onFileCreate',
+        change: 'onFileChange',
+        delete: 'onFileDelete',
+      } as const
+    )[event.type]
+    for (const mw of this.middlewares) {
+      const hooks = mw.sandbox
+      if (!hooks) continue
+      for (const hook of ['onFile', typed] as const) {
+        const fn = hooks[hook]
+        if (!fn) continue
+        try {
+          await fn(ctx, event)
+        } catch (error) {
+          const middleware = mw.name ?? 'unnamed'
+          const message = `hook=${hook} middleware=${middleware} threw`
+          this.logger.sandbox(message, { middleware, error })
+        }
+      }
+    }
+  }
+
   /**
    * Run onBeforeToolCall through middleware in order.
    * Returns the first non-void decision, or undefined to continue normally.
diff --git a/packages/ai/src/activities/chat/middleware/index.ts b/packages/ai/src/activities/chat/middleware/index.ts
index 98e2f02f9..b45333234 100644
--- a/packages/ai/src/activities/chat/middleware/index.ts
+++ b/packages/ai/src/activities/chat/middleware/index.ts
@@ -13,6 +13,8 @@ export type {
   FinishInfo,
   AbortInfo,
   ErrorInfo,
+  SandboxFileEvent,
+  ChatSandboxHooks,
 } from './types'
 
 export { MiddlewareRunner } from './compose'
diff --git a/packages/ai/src/activities/chat/middleware/sandbox-runtime.ts b/packages/ai/src/activities/chat/middleware/sandbox-runtime.ts
new file mode 100644
index 000000000..bf1a85070
--- /dev/null
+++ b/packages/ai/src/activities/chat/middleware/sandbox-runtime.ts
@@ -0,0 +1,21 @@
+/**
+ * Internal runtime seam the chat engine PROVIDES so the sandbox middleware can
+ * surface file events without a public ctx method. `emit` runs every
+ * middleware's `sandbox` hooks AND emits a CUSTOM `sandbox.file` chunk into the
+ * stream; `logger` lets the sandbox layer log under the `sandbox` debug
+ * category. Consumed (optionally) by `withSandbox` in `@tanstack/ai-sandbox`.
+ */
+import { createCapability } from './capabilities'
+import type { InternalLogger } from '../../../logger/internal-logger'
+import type { SandboxFileEvent } from './types'
+
+export interface SandboxRuntime {
+  emit: (event: SandboxFileEvent) => void
+  logger: InternalLogger
+}
+
+export const SandboxRuntimeCapability =
+  createCapability<SandboxRuntime>()('sandbox-runtime')
+
+export const [getSandboxRuntime, provideSandboxRuntime] =
+  SandboxRuntimeCapability
diff --git a/packages/ai/src/activities/chat/middleware/types.ts b/packages/ai/src/activities/chat/middleware/types.ts
index f3b7d3ff8..a87c92e6f 100644
--- a/packages/ai/src/activities/chat/middleware/types.ts
+++ b/packages/ai/src/activities/chat/middleware/types.ts
@@ -13,6 +13,37 @@ import type {
   CapabilityRegistry,
 } from './capabilities'
 
+/** A file change observed inside a sandbox during a chat run. */
+export interface SandboxFileEvent {
+  type: 'create' | 'change' | 'delete'
+  /** Absolute path inside the sandbox (under the workspace root). */
+  path: string
+  timestamp: number
+}
+
+/**
+ * Sandbox file-event hooks a chat middleware can declare. Fire server-side per
+ * observed file event: the catch-all `onFile` first, then the `e.type` hook.
+ */
+export interface ChatSandboxHooks<TContext = unknown> {
+  onFile?: (
+    ctx: ChatMiddlewareContext<TContext>,
+    e: SandboxFileEvent,
+  ) => void | Promise<void>
+  onFileCreate?: (
+    ctx: ChatMiddlewareContext<TContext>,
+    e: SandboxFileEvent,
+  ) => void | Promise<void>
+  onFileChange?: (
+    ctx: ChatMiddlewareContext<TContext>,
+    e: SandboxFileEvent,
+  ) => void | Promise<void>
+  onFileDelete?: (
+    ctx: ChatMiddlewareContext<TContext>,
+    e: SandboxFileEvent,
+  ) => void | Promise<void>
+}
+
 // ===========================
 // Middleware Context
 // ===========================
@@ -532,6 +563,12 @@ export interface ChatMiddleware<TContext = unknown> {
     ctx: ChatMiddlewareContext<TContext>,
     info: ErrorInfo,
   ) => void | Promise<void>
+
+  /**
+   * Sandbox file-event hooks. Fire when a sandbox provided by `withSandbox` is
+   * active during the run and a file is created/changed/deleted. Server-side.
+   */
+  sandbox?: ChatSandboxHooks<TContext>
 }
 
 /** A `ChatMiddleware` with a permissive context — for use as a constraint. */
diff --git a/packages/ai/src/adapter-internals.ts b/packages/ai/src/adapter-internals.ts
index f45fafc12..c5672d68d 100644
--- a/packages/ai/src/adapter-internals.ts
+++ b/packages/ai/src/adapter-internals.ts
@@ -10,3 +10,9 @@ export {
   toRunErrorPayload,
   toRunErrorRawEvent,
 } from './activities/error-payload'
+export {
+  getSandboxRuntime,
+  provideSandboxRuntime,
+  SandboxRuntimeCapability,
+} from './activities/chat/middleware/sandbox-runtime'
+export type { SandboxRuntime } from './activities/chat/middleware/sandbox-runtime'
diff --git a/packages/ai/src/custom-events.ts b/packages/ai/src/custom-events.ts
new file mode 100644
index 000000000..7829924ab
--- /dev/null
+++ b/packages/ai/src/custom-events.ts
@@ -0,0 +1,107 @@
+/**
+ * Catalog of well-known AG-UI `CUSTOM` event names used by the sandbox/agent
+ * layers, plus their payload shapes.
+ *
+ * The persisted run log is the AG-UI `StreamChunk` stream itself — there is no
+ * separate `RunEvent` type. Agent activity that has no first-class AG-UI event
+ * (process output, file diffs, ports, approvals, artifacts, sandbox lifecycle)
+ * rides on `CUSTOM` events carrying one of these names. Centralizing the names +
+ * payloads here keeps emitters (harness adapters, sandbox) and consumers
+ * (persistence projections, devtools, diff/terminal panels) in agreement without
+ * inventing a parallel event union.
+ */
+import { EventType } from './types'
+import type { CustomEvent, StreamChunk } from './types'
+
+/** Well-known CUSTOM event names. NOTE(review): engine-emitted 'sandbox.file' is not listed — confirm. */
+export const CUSTOM_EVENT = {
+  FILE_CHANGED: 'file.changed',
+  PROCESS_STDOUT: 'process.stdout',
+  PROCESS_STDERR: 'process.stderr',
+  PORT_OPENED: 'port.opened',
+  APPROVAL_REQUESTED: 'approval.requested',
+  APPROVAL_RESOLVED: 'approval.resolved',
+  ARTIFACT_CREATED: 'artifact.created',
+  SANDBOX_CREATED: 'sandbox.created',
+  SANDBOX_RESUMED: 'sandbox.resumed',
+} as const
+
+/** Union of the well-known CUSTOM event name literals. */
+export type WellKnownCustomEventName =
+  (typeof CUSTOM_EVENT)[keyof typeof CUSTOM_EVENT]
+
+// ---- Payload shapes ----
+
+export interface FileChangedPayload {
+  type: 'create' | 'change' | 'delete'
+  /** Absolute path inside the sandbox (under the workspace root). */
+  path: string
+  /** Unified diff, when the harness can produce one. */
+  diff?: string
+  timestamp: number
+}
+
+export interface ProcessOutputPayload {
+  /** Stable id for the spawned process whose output this is. */
+  processId: string
+  /** A chunk of stdout/stderr text. */
+  chunk: string
+}
+
+export interface PortOpenedPayload {
+  port: number
+  /** Externally reachable URL, when the provider exposes one. */
+  url?: string
+}
+
+export interface ApprovalRequestedPayload {
+  approvalId: string
+  title: string
+  /** Free-form detail describing the action awaiting approval. */
+  [key: string]: unknown
+}
+
+export interface ApprovalResolvedPayload {
+  approvalId: string
+  granted: boolean
+}
+
+export interface ArtifactCreatedPayload {
+  artifactId: string
+  name: string
+  mimeType: string
+  size: number
+}
+
+export interface SandboxLifecyclePayload {
+  sandboxId: string
+  provider: string
+}
+
+/** Maps each well-known name to its payload type. */
+export interface CustomEventPayloads {
+  [CUSTOM_EVENT.FILE_CHANGED]: FileChangedPayload
+  [CUSTOM_EVENT.PROCESS_STDOUT]: ProcessOutputPayload
+  [CUSTOM_EVENT.PROCESS_STDERR]: ProcessOutputPayload
+  [CUSTOM_EVENT.PORT_OPENED]: PortOpenedPayload
+  [CUSTOM_EVENT.APPROVAL_REQUESTED]: ApprovalRequestedPayload
+  [CUSTOM_EVENT.APPROVAL_RESOLVED]: ApprovalResolvedPayload
+  [CUSTOM_EVENT.ARTIFACT_CREATED]: ArtifactCreatedPayload
+  [CUSTOM_EVENT.SANDBOX_CREATED]: SandboxLifecyclePayload
+  [CUSTOM_EVENT.SANDBOX_RESUMED]: SandboxLifecyclePayload
+}
+
+/** A CUSTOM event narrowed to a specific well-known name and its payload. */
+export type WellKnownCustomEvent<TName extends WellKnownCustomEventName> =
+  CustomEvent & { name: TName; value: CustomEventPayloads[TName] }
+
+/**
+ * Type guard: is `chunk` a CUSTOM event with the given well-known `name`?
+ * Narrows the payload type when true, so consumers read `chunk.value` typed.
+ */
+export function isCustomEvent<TName extends WellKnownCustomEventName>(
+  chunk: StreamChunk,
+  name: TName,
+): chunk is WellKnownCustomEvent<TName> {
+  return chunk.type === EventType.CUSTOM && (chunk as CustomEvent).name === name
+}
diff --git a/packages/ai/src/index.ts b/packages/ai/src/index.ts
index f44d44b43..e6d87a1f1 100644
--- a/packages/ai/src/index.ts
+++ b/packages/ai/src/index.ts
@@ -116,6 +116,8 @@ export type {
   FinishInfo,
   AbortInfo,
   ErrorInfo,
+  SandboxFileEvent,
+  ChatSandboxHooks,
 } from './activities/chat/middleware/index'
 
 // Capability primitives + middleware builder
@@ -130,8 +132,40 @@ export type {
   CapabilityContext,
   CapabilityGetter,
   CapabilityProvider,
+  DefinedChatMiddleware,
+  AnyChatMiddleware,
 } from './activities/chat/middleware/index'
 
+// Shared lock primitive (one global 'locks' capability; see locks.ts)
+export {
+  LocksCapability,
+  getLocks,
+  provideLocks,
+  InMemoryLockStore,
+} from './locks'
+export type { LockStore } from './locks'
+
+// Resume-source capability (consumed by chat()'s resume seam; provided by persistence)
+export {
+  ResumeSourceCapability,
+  getResumeSource,
+  provideResumeSource,
+} from './resume'
+export type { ResumeSource, RunStatus } from './resume'
+
+// Well-known AG-UI CUSTOM event catalog (agent activity rides on CUSTOM events)
+export { CUSTOM_EVENT, isCustomEvent } from './custom-events'
+export type {
+  WellKnownCustomEventName,
+  FileChangedPayload,
+  ProcessOutputPayload,
+  PortOpenedPayload,
+  ApprovalRequestedPayload,
+  ApprovalResolvedPayload,
+  ArtifactCreatedPayload,
+  SandboxLifecyclePayload,
+} from './custom-events'
+
 // All types
 export * from './types'
 
diff --git a/packages/ai/src/locks.ts b/packages/ai/src/locks.ts
new file mode 100644
index 000000000..621a3c04c
--- /dev/null
+++ b/packages/ai/src/locks.ts
@@ -0,0 +1,56 @@
+/**
+ * Distributed-mutex primitive, shared across the sandbox and persistence
+ * layers via the middleware capability system.
+ *
+ * `LocksCapability` lives in core (rather than in `@tanstack/ai-sandbox` or
+ * `@tanstack/ai-persistence`) so there is exactly ONE `'locks'` token: capability
+ * names must be globally unique, and both `withSandbox` (which optionally
+ * requires it) and `withPersistence` (which provides a durable implementation)
+ * must reference the same handle. The in-memory default here is correct within a
+ * single process; the persistence layer provides a distributed lock (e.g. a
+ * Durable Object) for multi-instance deployments.
+ */
+import { createCapability } from './activities/chat/middleware/capabilities'
+
+/**
+ * Mutual exclusion around a critical section keyed by `key`. Used by the
+ * sandbox `ensure` algorithm so two concurrent runs for the same thread don't
+ * both create a sandbox, and available to any middleware that needs a named lock.
+ */
+export interface LockStore {
+  withLock: <T>(key: string, fn: () => Promise<T>) => Promise<T>
+}
+
+/**
+ * The lock capability. PROVIDED by `withPersistence` (durable) and OPTIONALLY
+ * required by `withSandbox`. Falls back to {@link InMemoryLockStore} when no
+ * middleware provides it.
+ */
+export const LocksCapability = createCapability<LockStore>()('locks')
+
+/** Destructured accessors: `getLocks(ctx)` / `provideLocks(ctx, store)`. */
+export const [getLocks, provideLocks] = LocksCapability
+
+/**
+ * In-memory {@link LockStore} — a per-key promise chain. Correct within a
+ * single process; multi-instance correctness needs a distributed lock from the
+ * persistence layer. A key's entry is removed once its last holder settles.
+ */
+export class InMemoryLockStore implements LockStore {
+  private readonly chains = new Map<string, Promise<unknown>>()
+
+  withLock<T>(key: string, fn: () => Promise<T>): Promise<T> {
+    const prior = this.chains.get(key) ?? Promise.resolve()
+    // Chain after the prior holder regardless of how it settled.
+    const run = prior.then(fn, fn)
+    // Swallow rejections so one failure doesn't poison the lock, then drop the
+    // entry if no later caller has queued behind it, so idle keys don't leak.
+    const tail: Promise<void> = run
+      .catch(() => undefined)
+      .then(() => {
+        if (this.chains.get(key) === tail) this.chains.delete(key)
+      })
+    this.chains.set(key, tail)
+    return run
+  }
+}
diff --git a/packages/ai/src/logger/internal-logger.ts b/packages/ai/src/logger/internal-logger.ts
index e9eb0eb60..61914c296 100644
--- a/packages/ai/src/logger/internal-logger.ts
+++ b/packages/ai/src/logger/internal-logger.ts
@@ -31,6 +31,7 @@ const CATEGORY_EMOJI: Record<keyof ResolvedCategories, string> = {
   agentLoop: '🔁',
   config: '⚙️',
   errors: '❌',
+  sandbox: '📦',
 }
 
 export class InternalLogger {
@@ -82,6 +83,11 @@ export class InternalLogger {
     this.emit('debug', 'tools', message, meta)
   }
 
+  /** Log sandbox internals (watcher, file events, hook dispatch). Chat-only. */
+  sandbox(message: string, meta?: Record<string, unknown>): void {
+    this.emit('debug', 'sandbox', message, meta)
+  }
+
   /** Log an agent-loop iteration marker or phase transition. Chat-only. */
   agentLoop(message: string, meta?: Record<string, unknown>): void {
     this.emit('debug', 'agentLoop', message, meta)
diff --git a/packages/ai/src/logger/resolve.ts b/packages/ai/src/logger/resolve.ts
index 688240d48..dbfb42b0a 100644
--- a/packages/ai/src/logger/resolve.ts
+++ b/packages/ai/src/logger/resolve.ts
@@ -12,6 +12,7 @@ const ALL_OFF: ResolvedCategories = {
   config: false,
   errors: false,
   request: false,
+  sandbox: false,
 }
 
 const ALL_ON: ResolvedCategories = {
@@ -23,6 +24,7 @@ const ALL_ON: ResolvedCategories = {
   config: true,
   errors: true,
   request: true,
+  sandbox: true,
 }
 
 const errorsOnlyCategories = (): ResolvedCategories => ({
@@ -41,6 +43,7 @@ const resolveCategoriesFromPartial = (
   config: partial.config ?? true,
   errors: partial.errors ?? true,
   request: partial.request ?? true,
+  sandbox: partial.sandbox ?? true,
 })
 
 /**
diff --git a/packages/ai/src/logger/types.ts b/packages/ai/src/logger/types.ts
index 41611cf30..420606804 100644
--- a/packages/ai/src/logger/types.ts
+++ b/packages/ai/src/logger/types.ts
@@ -60,6 +60,11 @@ export interface DebugCategories {
    * Outgoing call metadata (provider, model, message/tool counts) emitted before each adapter SDK call.
    */
   request?: boolean
+  /**
+   * Sandbox internals: watcher start/stop + mechanism, file events, sandbox
+   * hook dispatch, ensure/bootstrap and lifecycle transitions. Chat-only.
+   */
+  sandbox?: boolean
 }
 
 /**
diff --git a/packages/ai/src/resume.ts b/packages/ai/src/resume.ts
new file mode 100644
index 000000000..8936e4f5d
--- /dev/null
+++ b/packages/ai/src/resume.ts
@@ -0,0 +1,46 @@
+/**
+ * Resume-source capability — the core seam that lets a reconnecting client pick
+ * up a run where it left off.
+ *
+ * The contract lives in core (not in `@tanstack/ai-persistence`) because the
+ * `chat()` engine itself owns the resume decision: when a `cursor` is supplied
+ * and a `ResumeSource` has been provided by middleware, the engine replays the
+ * persisted event tail instead of running the adapter again. `withPersistence`
+ * PROVIDES a `ResumeSource` backed by its event log + run store; without it, the
+ * `cursor` option is a silent no-op (a normal run is unaffected).
+ *
+ * Core depends only on this small read contract — never on the persistence
+ * package — mirroring how {@link LocksCapability} lives in core.
+ */
+import { createCapability } from './activities/chat/middleware/capabilities'
+import type { StreamChunk } from './types'
+
+/** Lifecycle status of a persisted run. */
+export type RunStatus = 'running' | 'completed' | 'failed' | 'interrupted'
+
+/**
+ * A read-only view of persisted run history sufficient for the engine to resume.
+ * Provided by `withPersistence`; consumed by the `chat()` resume seam.
+ */
+export interface ResumeSource {
+  /** Whether any events have been persisted for `runId`. */
+  hasRun: (runId: string) => Promise<boolean>
+  /**
+   * Replay persisted chunks for `runId` whose cursor is strictly after
+   * `afterCursor` (or from the beginning when omitted). Each yielded chunk
+   * carries its stamped `cursor`.
+   */
+  replay: (runId: string, afterCursor?: string) => AsyncIterable<StreamChunk>
+  /** Current status of `runId`, or null when unknown. */
+  getStatus: (runId: string) => Promise<RunStatus | null>
+}
+
+/**
+ * The resume capability. PROVIDED by `withPersistence`; OPTIONALLY consumed by
+ * the chat engine. When absent, a supplied `cursor` is ignored.
+ */
+export const ResumeSourceCapability =
+  createCapability<ResumeSource>()('resume-source')
+
+/** Destructured accessors: `getResumeSource(ctx)` / `provideResumeSource(ctx, src)`. */
+export const [getResumeSource, provideResumeSource] = ResumeSourceCapability
diff --git a/packages/ai/src/types.ts b/packages/ai/src/types.ts
index 798b381b4..c83cf2d0a 100644
--- a/packages/ai/src/types.ts
+++ b/packages/ai/src/types.ts
@@ -4,6 +4,7 @@ import type {
 } from '@standard-schema/spec'
 import type { InternalLogger } from './logger/internal-logger'
 import type { SystemPrompt } from './system-prompts'
+import type { CapabilityContext } from './activities/chat/middleware/capabilities'
 // The canonical usage types live in the leaf `@tanstack/ai-event-client`
 // package (which `@tanstack/ai` already depends on) so there is a single source
 // of truth without a dependency cycle. They are re-exported below.
@@ -906,6 +907,35 @@ export interface TextOptions<
    * Surfaced for observability/middleware; not consumed by the LLM call.
    */
   parentRunId?: string
+
+  /**
+   * Resume cursor for persistence-backed runs. When provided alongside `runId`,
+   * and a resume source has been provided by middleware (e.g. `withPersistence`),
+   * the engine replays persisted events after this cursor instead of running the
+   * adapter fresh. Opaque string; generated/consumed by `@tanstack/ai-persistence`.
+   * Ignored (a no-op) when no resume source is present or it has no record of
+   * `runId` — the run then proceeds normally. See {@link StreamChunk.cursor}.
+   */
+  cursor?: string
+
+  /**
+   * Middleware capability context for this run. The engine populates it with
+   * the live middleware context so harness adapters that declare
+   * `requires: [SomeCapability]` can read provided capabilities from inside
+   * `chatStream` — e.g. `getSandbox(options.capabilities)`. Capabilities are
+   * provisioned by middleware `setup` before the adapter runs. Undefined for
+   * direct adapter usage outside the chat engine.
+   */
+  capabilities?: CapabilityContext
+
+  /**
+   * Client approval decisions for this run, keyed by approval id. The engine
+   * populates this from approvals carried on the incoming messages. Harness
+   * adapters consult it to resolve `ask`-policy permission requests (the agent
+   * pauses on a risky action; the client re-runs with a decision recorded
+   * here). Undefined for direct adapter usage outside the chat engine.
+   */
+  approvals?: ReadonlyMap<string, boolean>
 }
 
 // ============================================================================
@@ -1428,8 +1458,16 @@ export type AGUIEvent =
 /**
  * Chunk returned by the SDK during streaming chat completions.
  * Uses the AG-UI protocol event format.
+ *
+ * `cursor` is an OPTIONAL, opaque per-event resume cursor. It is absent on a
+ * normal (non-persisted) run and stamped by `withPersistence` when persistence
+ * is active, so a reconnecting client can resume with the last cursor it saw.
+ * It rides in-band so both the SSE and ndjson transports carry it unchanged.
  */
-export type StreamChunk = AGUIEvent
+export type StreamChunk = AGUIEvent & {
+  /** Opaque per-event resume cursor (present only on persisted runs). */
+  cursor?: string
+}
 
 // Simple streaming format for basic text completions
 // Converted to StreamChunk format by convertTextCompletionStream()
diff --git a/packages/ai/tests/custom-events.test.ts b/packages/ai/tests/custom-events.test.ts
new file mode 100644
index 000000000..6566c0ab8
--- /dev/null
+++ b/packages/ai/tests/custom-events.test.ts
@@ -0,0 +1,52 @@
+import { describe, expect, it } from 'vitest'
+import { CUSTOM_EVENT, isCustomEvent } from '../src/custom-events'
+import { EventType } from '../src/types'
+import type { StreamChunk } from '../src/types'
+
+describe('CUSTOM_EVENT catalog', () => {
+  it('exposes the well-known agent-activity event names', () => {
+    expect(CUSTOM_EVENT.FILE_CHANGED).toBe('file.changed')
+    expect(CUSTOM_EVENT.PROCESS_STDOUT).toBe('process.stdout')
+    expect(CUSTOM_EVENT.PROCESS_STDERR).toBe('process.stderr')
+    expect(CUSTOM_EVENT.PORT_OPENED).toBe('port.opened')
+    expect(CUSTOM_EVENT.APPROVAL_REQUESTED).toBe('approval.requested')
+    expect(CUSTOM_EVENT.APPROVAL_RESOLVED).toBe('approval.resolved')
+    expect(CUSTOM_EVENT.ARTIFACT_CREATED).toBe('artifact.created')
+    expect(CUSTOM_EVENT.SANDBOX_CREATED).toBe('sandbox.created')
+    expect(CUSTOM_EVENT.SANDBOX_RESUMED).toBe('sandbox.resumed')
+  })
+})
+
+describe('isCustomEvent', () => {
+  const fileChanged: StreamChunk = {
+    type: EventType.CUSTOM,
+    name: CUSTOM_EVENT.FILE_CHANGED,
+    value: { type: 'change', path: '/workspace/a.ts', timestamp: 1 },
+    timestamp: 1,
+  }
+
+  it('returns true for a matching CUSTOM event name', () => {
+    expect(isCustomEvent(fileChanged, CUSTOM_EVENT.FILE_CHANGED)).toBe(true)
+  })
+
+  it('returns false for a CUSTOM event with a different name', () => {
+    expect(isCustomEvent(fileChanged, CUSTOM_EVENT.PORT_OPENED)).toBe(false)
+  })
+
+  it('returns false for a non-CUSTOM chunk', () => {
+    const runStarted: StreamChunk = {
+      type: EventType.RUN_STARTED,
+      runId: 'r',
+      threadId: 't',
+      timestamp: 1,
+    }
+    expect(isCustomEvent(runStarted, CUSTOM_EVENT.FILE_CHANGED)).toBe(false)
+  })
+
+  it('narrows the payload type when matched', () => {
+    if (!isCustomEvent(fileChanged, CUSTOM_EVENT.FILE_CHANGED)) {
+      throw new Error('guard did not match; assertion would be skipped')
+    }
+    expect(fileChanged.value.path).toBe('/workspace/a.ts') // narrowed: string
+  })
+})
diff --git a/packages/ai/tests/locks.test.ts b/packages/ai/tests/locks.test.ts
new file mode 100644
index 000000000..bf1972d97
--- /dev/null
+++ b/packages/ai/tests/locks.test.ts
@@ -0,0 +1,88 @@
+import { describe, expect, it } from 'vitest'
+import {
+  InMemoryLockStore,
+  LocksCapability,
+  getLocks,
+  provideLocks,
+} from '../src/locks'
+import { CapabilityRegistry } from '../src/activities/chat/middleware/capabilities'
+
+describe('InMemoryLockStore', () => {
+  it('serializes concurrent withLock calls for the same key', async () => {
+    const store = new InMemoryLockStore()
+    const order: Array<string> = []
+
+    const first = store.withLock('k', async () => {
+      order.push('first-start')
+      await new Promise((r) => setTimeout(r, 20))
+      order.push('first-end')
+      return 1
+    })
+    // Second acquire happens while first holds the lock.
+    const second = store.withLock('k', async () => {
+      order.push('second-start')
+      order.push('second-end')
+      return 2
+    })
+
+    const [a, b] = await Promise.all([first, second])
+    expect(a).toBe(1)
+    expect(b).toBe(2)
+    // Second must not interleave: it starts only after first fully ends.
+    expect(order).toEqual([
+      'first-start',
+      'first-end',
+      'second-start',
+      'second-end',
+    ])
+  })
+
+  it('runs different keys concurrently', async () => {
+    const store = new InMemoryLockStore()
+    const order: Array<string> = []
+
+    const a = store.withLock('a', async () => {
+      order.push('a-start')
+      await new Promise((r) => setTimeout(r, 20))
+      order.push('a-end')
+    })
+    const b = store.withLock('b', async () => {
+      order.push('b-start')
+      order.push('b-end')
+    })
+
+    await Promise.all([a, b])
+    // b (different key) runs while a is still waiting on its timeout.
+    expect(order.slice(0, 2)).toEqual(['a-start', 'b-start'])
+  })
+
+  it('keeps the lock usable after a holder throws', async () => {
+    const store = new InMemoryLockStore()
+    await expect(
+      store.withLock('k', async () => {
+        throw new Error('boom')
+      }),
+    ).rejects.toThrow('boom')
+
+    // Lock is not poisoned: a subsequent acquire still runs.
+    await expect(store.withLock('k', async () => 'ok')).resolves.toBe('ok')
+  })
+})
+
+describe('LocksCapability', () => {
+  it('is named "locks"', () => {
+    expect(LocksCapability.capabilityName).toBe('locks')
+  })
+
+  it('round-trips a LockStore through provide/get', () => {
+    const ctx = { capabilities: new CapabilityRegistry() }
+    const store = new InMemoryLockStore()
+    provideLocks(ctx, store)
+    expect(getLocks(ctx)).toBe(store)
+  })
+
+  it('getLocks returns undefined when optional and not provided', () => {
+    const ctx = { capabilities: new CapabilityRegistry() }
+    expect(getLocks(ctx, { optional: true })).toBeUndefined()
+  })
+})
diff --git a/packages/ai/tests/logger/internal-logger.test.ts b/packages/ai/tests/logger/internal-logger.test.ts
index da8592b27..0a8c0e87b 100644
--- a/packages/ai/tests/logger/internal-logger.test.ts
+++ b/packages/ai/tests/logger/internal-logger.test.ts
@@ -32,6 +32,7 @@ const allOn = {
   config: true,
   errors: true,
   request: true,
+  sandbox: true,
 }
 
 const allOff = {
@@ -43,6 +44,7 @@ const allOff = {
   config: false,
   errors: false,
   request: false,
+  sandbox: false,
 }
 
 describe('InternalLogger', () => {
diff --git a/packages/ai/tests/logger/types.test.ts b/packages/ai/tests/logger/types.test.ts
index 6af840385..12d4bb3bb 100644
--- a/packages/ai/tests/logger/types.test.ts
+++ b/packages/ai/tests/logger/types.test.ts
@@ -29,7 +29,7 @@ describe('logger types', () => {
     expectTypeOf<Logger['error']>().returns.toEqualTypeOf<void>()
   })
 
-  it('DebugCategories has all eight optional boolean flags and allows empty object', () => {
+  it('DebugCategories has all optional boolean flags and allows empty object', () => {
     expectTypeOf<DebugCategories>().toEqualTypeOf<{
       provider?: boolean
       output?: boolean
@@ -39,6 +39,7 @@ describe('logger types', () => {
       config?: boolean
       errors?: boolean
       request?: boolean
+      sandbox?: boolean
     }>()
     const empty: DebugCategories = {}
     void empty
diff --git a/packages/ai/tests/resume-seam.test.ts b/packages/ai/tests/resume-seam.test.ts
new file mode 100644
index 000000000..ff684ecfa
--- /dev/null
+++ b/packages/ai/tests/resume-seam.test.ts
@@ -0,0 +1,161 @@
+import { describe, expect, it } from 'vitest'
+import { chat } from '../src/activities/chat/index'
+import { defineChatMiddleware } from '../src/activities/chat/middleware/index'
+import { ResumeSourceCapability, provideResumeSource } from '../src/resume'
+import type { ResumeSource } from '../src/resume'
+import type { StreamChunk } from '../src/types'
+import { ev, createMockAdapter, collectChunks, getDeltas } from './test-utils'
+
+/** Middleware that provides a fixed ResumeSource (stands in for withPersistence). */
+function withFakeResumeSource(source: ResumeSource) {
+  return defineChatMiddleware({
+    name: 'fake-resume-source',
+    provides: [ResumeSourceCapability],
+    setup(ctx) {
+      provideResumeSource(ctx, source)
+    },
+  })
+}
+
+describe('chat() resume seam', () => {
+  it('ignores `cursor` when no resume source is provided (no-op invariant)', async () => {
+    const { adapter, calls } = createMockAdapter({
+      iterations: [
+        [ev.runStarted(), ev.textContent('hello'), ev.runFinished('stop')],
+      ],
+    })
+
+    const stream = chat({
+      adapter,
+      messages: [{ role: 'user', content: 'Hi' }],
+      runId: 'run-1',
+      cursor: 'some-cursor',
+    })
+
+    const chunks = await collectChunks(stream as AsyncIterable<StreamChunk>)
+    // Adapter ran normally — cursor was ignored.
+    expect(calls.length).toBe(1)
+    expect(getDeltas(chunks).join('')).toBe('hello')
+  })
+
+  it('replays persisted events after the cursor and does NOT run the adapter', async () => {
+    const replayed: Array<StreamChunk> = [
+      { ...ev.textContent(' world'), cursor: '3' },
+      { ...ev.runFinished('stop'), cursor: '4' },
+    ]
+    const source: ResumeSource = {
+      hasRun: async (runId) => runId === 'run-1',
+      replay: async function* (runId, afterCursor) {
+        expect(runId).toBe('run-1')
+        expect(afterCursor).toBe('2')
+        for (const c of replayed) yield c
+      },
+      getStatus: async () => 'completed',
+    }
+
+    const { adapter, calls } = createMockAdapter({
+      iterations: [
+        [ev.runStarted(), ev.textContent('SHOULD NOT RUN'), ev.runFinished()],
+      ],
+    })
+
+    const stream = chat({
+      adapter,
+      messages: [],
+      runId: 'run-1',
+      cursor: '2',
+      middleware: [withFakeResumeSource(source)],
+    })
+
+    const chunks = await collectChunks(stream as AsyncIterable<StreamChunk>)
+    // The adapter must never run on a resume.
+    expect(calls.length).toBe(0)
+    // Output is exactly the replayed tail, cursors intact.
+    expect(getDeltas(chunks).join('')).toBe(' world')
+    expect(chunks.map((c) => c.cursor)).toEqual(['3', '4'])
+  })
+
+  it('re-attaches (continues the agent loop) when the run is still running and the adapter supports it', async () => {
+    const source: ResumeSource = {
+      hasRun: async () => true,
+      replay: async function* () {
+        yield { ...ev.textContent('replayed'), cursor: '2' }
+      },
+      getStatus: async () => 'running', // still in flight
+    }
+
+    const { adapter, calls } = createMockAdapter({
+      iterations: [
+        [ev.runStarted(), ev.textContent(' live'), ev.runFinished('stop')],
+      ],
+    })
+    // Mark the adapter as re-attach capable (a harness adapter would).
+    ;(adapter as { supportsReattach?: boolean }).supportsReattach = true
+
+    const stream = chat({
+      adapter,
+      messages: [],
+      runId: 'run-1',
+      cursor: '1',
+      middleware: [withFakeResumeSource(source)],
+    })
+
+    const chunks = await collectChunks(stream as AsyncIterable<StreamChunk>)
+    // Adapter ran (live continuation) AND the replayed tail was delivered first.
+    expect(calls.length).toBe(1)
+    expect(getDeltas(chunks).join('')).toBe('replayed live')
+  })
+
+  it('does NOT re-attach for a finished run even if the adapter supports it', async () => {
+    const source: ResumeSource = {
+      hasRun: async () => true,
+      replay: async function* () {
+        yield { ...ev.textContent('replayed'), cursor: '2' }
+      },
+      getStatus: async () => 'completed',
+    }
+    const { adapter, calls } = createMockAdapter({
+      iterations: [[ev.runStarted(), ev.textContent('NOPE'), ev.runFinished()]],
+    })
+    ;(adapter as { supportsReattach?: boolean }).supportsReattach = true
+
+    const stream = chat({
+      adapter,
+      messages: [],
+      runId: 'run-1',
+      cursor: '1',
+      middleware: [withFakeResumeSource(source)],
+    })
+    const chunks = await collectChunks(stream as AsyncIterable<StreamChunk>)
+    expect(calls.length).toBe(0)
+    expect(getDeltas(chunks).join('')).toBe('replayed')
+  })
+
+  it('falls through to a normal run when the resume source has no such run', async () => {
+    const source: ResumeSource = {
+      hasRun: async () => false,
+      replay: async function* () {
+        throw new Error('replay should not be called')
+      },
+      getStatus: async () => null,
+    }
+
+    const { adapter, calls } = createMockAdapter({
+      iterations: [
+        [ev.runStarted(), ev.textContent('fresh'), ev.runFinished('stop')],
+      ],
+    })
+
+    const stream = chat({
+      adapter,
+      messages: [{ role: 'user', content: 'Hi' }],
+      runId: 'run-unknown',
+      cursor: '5',
+      middleware: [withFakeResumeSource(source)],
+    })
+
+    const chunks = await collectChunks(stream as AsyncIterable<StreamChunk>)
+    expect(calls.length).toBe(1)
+    expect(getDeltas(chunks).join('')).toBe('fresh')
+  })
+})
diff --git a/packages/ai/tests/sandbox-debug-category.test.ts b/packages/ai/tests/sandbox-debug-category.test.ts
new file mode 100644
index 000000000..6397978bd
--- /dev/null
+++ b/packages/ai/tests/sandbox-debug-category.test.ts
@@ -0,0 +1,22 @@
+import { describe, expect, it, vi } from 'vitest'
+import { resolveDebugOption } from '../src/logger/resolve'
+
+describe('sandbox debug category', () => {
+  it('is enabled by debug: true and disabled by { sandbox: false }', () => {
+    expect(resolveDebugOption(true).isEnabled('sandbox')).toBe(true)
+    expect(resolveDebugOption({ sandbox: false }).isEnabled('sandbox')).toBe(
+      false,
+    )
+    expect(resolveDebugOption(false).isEnabled('sandbox')).toBe(false)
+  })
+
+  it('sandbox() routes to logger.debug when enabled', () => {
+    const debug = vi.fn()
+    const logger = { debug, info() {}, warn() {}, error() {} }
+    resolveDebugOption({ logger, sandbox: true }).sandbox('watch start', {
+      x: 1,
+    })
+    expect(debug).toHaveBeenCalledOnce()
+    expect(debug.mock.calls[0]?.[0]).toContain('tanstack-ai:sandbox')
+  })
+})
diff --git a/packages/ai/tests/sandbox-file-dispatch.test.ts b/packages/ai/tests/sandbox-file-dispatch.test.ts
new file mode 100644
index 000000000..ddab55753
--- /dev/null
+++ b/packages/ai/tests/sandbox-file-dispatch.test.ts
@@ -0,0 +1,53 @@
+import { describe, expect, it } from 'vitest'
+import { MiddlewareRunner } from '../src/activities/chat/middleware/compose'
+import { resolveDebugOption } from '../src/logger/resolve'
+import type {
+  ChatMiddleware,
+  ChatMiddlewareContext,
+  SandboxFileEvent,
+} from '../src/activities/chat/middleware/types'
+
+const ctx = {} as ChatMiddlewareContext
+const ev = (type: SandboxFileEvent['type']): SandboxFileEvent => ({
+  type,
+  path: `/workspace/a-${type}.ts`,
+  timestamp: 1,
+})
+
+describe('MiddlewareRunner.runSandboxFile', () => {
+  it('calls onFile (catch-all) + the type-specific hook, in array order', async () => {
+    const calls: Array<string> = []
+    const mws: Array<ChatMiddleware> = [
+      {
+        name: 'a',
+        sandbox: {
+          onFile: () => void calls.push('a:onFile'),
+          onFileCreate: () => void calls.push('a:onFileCreate'),
+          onFileChange: () => void calls.push('a:onFileChange'),
+        },
+      },
+      { name: 'b', sandbox: { onFile: () => void calls.push('b:onFile') } },
+    ]
+    const runner = new MiddlewareRunner(mws, resolveDebugOption(false))
+    await runner.runSandboxFile(ctx, ev('create'))
+    expect(calls).toEqual(['a:onFile', 'a:onFileCreate', 'b:onFile'])
+  })
+
+  it('isolates hook errors (one throwing does not stop the rest)', async () => {
+    const calls: Array<string> = []
+    const mws: Array<ChatMiddleware> = [
+      {
+        name: 'a',
+        sandbox: {
+          onFileDelete: () => {
+            throw new Error('boom')
+          },
+        },
+      },
+      { name: 'b', sandbox: { onFileDelete: () => void calls.push('b') } },
+    ]
+    const runner = new MiddlewareRunner(mws, resolveDebugOption(false))
+    await runner.runSandboxFile(ctx, ev('delete'))
+    expect(calls).toEqual(['b'])
+  })
+})
diff --git a/packages/ai/tests/sandbox-runtime-emit.test.ts b/packages/ai/tests/sandbox-runtime-emit.test.ts
new file mode 100644
index 000000000..33d80d753
--- /dev/null
+++ b/packages/ai/tests/sandbox-runtime-emit.test.ts
@@ -0,0 +1,57 @@
+import { describe, expect, it } from 'vitest'
+import { MiddlewareRunner } from '../src/activities/chat/middleware/compose'
+import { resolveDebugOption } from '../src/logger/resolve'
+import { EventType } from '../src/types'
+import type {
+  ChatMiddleware,
+  ChatMiddlewareContext,
+  SandboxFileEvent,
+} from '../src/activities/chat/middleware/types'
+import type { StreamChunk } from '../src/types'
+
+// Mirrors the engine sink built in index.ts (Step 5) so we can unit-test the
+// contract: emit() runs middleware sandbox hooks AND enqueues a CUSTOM chunk.
+function makeSink(
+  runner: MiddlewareRunner,
+  ctx: ChatMiddlewareContext,
+  queue: Array<StreamChunk>,
+) {
+  return (event: SandboxFileEvent) => {
+    void runner.runSandboxFile(ctx, event)
+    queue.push({
+      type: EventType.CUSTOM,
+      name: 'sandbox.file',
+      value: { ...event },
+      timestamp: event.timestamp,
+    } as StreamChunk)
+  }
+}
+
+describe('sandbox runtime emit', () => {
+  it('runs middleware sandbox hooks and enqueues a CUSTOM sandbox.file chunk', async () => {
+    const seen: Array<SandboxFileEvent> = []
+    const mw: ChatMiddleware = {
+      name: 'audit',
+      sandbox: { onFileChange: (_ctx, e) => void seen.push(e) },
+    }
+    const runner = new MiddlewareRunner([mw], resolveDebugOption(false))
+    const queue: Array<StreamChunk> = []
+    const sink = makeSink(runner, {} as ChatMiddlewareContext, queue)
+
+    const event: SandboxFileEvent = {
+      type: 'change',
+      path: '/workspace/x.ts',
+      timestamp: 1,
+    }
+    sink(event)
+    await new Promise((r) => setTimeout(r, 0)) // let the un-awaited hooks settle
+
+    expect(seen).toEqual([event])
+    expect(queue).toHaveLength(1)
+    expect(queue[0]).toMatchObject({
+      type: EventType.CUSTOM,
+      name: 'sandbox.file',
+      value: { type: 'change', path: '/workspace/x.ts' },
+    })
+  })
+})
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index aee0c7730..e13789245 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -105,6 +105,50 @@ importers:
         specifier: ^4.0.14
         version: 4.1.4(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jsdom@27.3.0(postcss@8.5.15))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
 
+  examples/sandbox-coding-agent:
+    dependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../../packages/ai
+      '@tanstack/ai-claude-code':
+        specifier: workspace:*
+        version: link:../../packages/ai-claude-code
+      '@tanstack/ai-sandbox':
+        specifier: workspace:*
+        version: link:../../packages/ai-sandbox
+      '@tanstack/ai-sandbox-docker':
+        specifier: workspace:*
+        version: link:../../packages/ai-sandbox-docker
+      '@tanstack/ai-sandbox-local-process':
+        specifier: workspace:*
+        version: link:../../packages/ai-sandbox-local-process
+    devDependencies:
+      tsx:
+        specifier: ^4.21.0
+        version: 4.21.0
+
+  examples/sandbox-issue-triage:
+    dependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../../packages/ai
+      '@tanstack/ai-claude-code':
+        specifier: workspace:*
+        version: link:../../packages/ai-claude-code
+      '@tanstack/ai-sandbox':
+        specifier: workspace:*
+        version: link:../../packages/ai-sandbox
+      '@tanstack/ai-sandbox-docker':
+        specifier: workspace:*
+        version: link:../../packages/ai-sandbox-docker
+      '@tanstack/ai-sandbox-local-process':
+        specifier: workspace:*
+        version: link:../../packages/ai-sandbox-local-process
+    devDependencies:
+      tsx:
+        specifier: ^4.21.0
+        version: 4.21.0
+
   examples/ts-angular-chat:
     dependencies:
       '@angular/common':
@@ -212,7 +256,7 @@ importers:
         version: link:../../packages/ai-react
       '@tanstack/nitro-v2-vite-plugin':
         specifier: ^1.154.7
-        version: 1.154.7(rolldown@1.0.0-rc.17)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+        version: 1.154.7(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       '@tanstack/react-router':
         specifier: ^1.158.4
         version: 1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3)
@@ -439,7 +483,7 @@ importers:
         version: link:../../packages/ai-react-ui
       '@tanstack/nitro-v2-vite-plugin':
         specifier: ^1.154.7
-        version: 1.154.7(rolldown@1.0.0-rc.17)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+        version: 1.154.7(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       '@tanstack/react-devtools':
         specifier: ^0.9.10
         version: 0.9.10(@types/react-dom@19.2.3(@types/react@19.2.7))(@types/react@19.2.7)(csstype@3.2.3)(react-dom@19.2.3(react@19.2.3))(react@19.2.3)(solid-js@1.9.10)
@@ -541,6 +585,79 @@ importers:
         specifier: ^5.1.0
         version: 5.1.0
 
+  examples/ts-react-coding-agent:
+    dependencies:
+      '@tailwindcss/vite':
+        specifier: ^4.1.18
+        version: 4.1.18(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../../packages/ai
+      '@tanstack/ai-claude-code':
+        specifier: workspace:*
+        version: link:../../packages/ai-claude-code
+      '@tanstack/ai-client':
+        specifier: workspace:*
+        version: link:../../packages/ai-client
+      '@tanstack/ai-codex':
+        specifier: workspace:*
+        version: link:../../packages/ai-codex
+      '@tanstack/ai-gemini-cli':
+        specifier: workspace:*
+        version: link:../../packages/ai-gemini-cli
+      '@tanstack/ai-opencode':
+        specifier: workspace:*
+        version: link:../../packages/ai-opencode
+      '@tanstack/ai-react':
+        specifier: workspace:*
+        version: link:../../packages/ai-react
+      '@tanstack/nitro-v2-vite-plugin':
+        specifier: ^1.154.7
+        version: 1.154.7(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+      '@tanstack/react-router':
+        specifier: ^1.158.4
+        version: 1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3)
+      '@tanstack/react-start':
+        specifier: ^1.159.0
+        version: 1.159.5(crossws@0.4.5(srvx@0.11.15))(react-dom@19.2.3(react@19.2.3))(react@19.2.3)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+      '@tanstack/router-plugin':
+        specifier: ^1.158.4
+        version: 1.159.5(@tanstack/react-router@1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3))(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+      react:
+        specifier: ^19.2.3
+        version: 19.2.3
+      react-dom:
+        specifier: ^19.2.3
+        version: 19.2.3(react@19.2.3)
+      tailwindcss:
+        specifier: ^4.1.18
+        version: 4.1.18
+      vite-tsconfig-paths:
+        specifier: ^5.1.4
+        version: 5.1.4(typescript@5.9.3)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+      zod:
+        specifier: ^4.2.0
+        version: 4.3.6
+    devDependencies:
+      '@types/node':
+        specifier: ^24.10.1
+        version: 24.10.3
+      '@types/react':
+        specifier: ^19.2.7
+        version: 19.2.7
+      '@types/react-dom':
+        specifier: ^19.2.3
+        version: 19.2.3(@types/react@19.2.7)
+      '@vitejs/plugin-react':
+        specifier: ^5.1.2
+        version: 5.1.2(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+      typescript:
+        specifier: 5.9.3
+        version: 5.9.3
+      vite:
+        specifier: ^7.3.3
+        version: 7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
+
   examples/ts-react-media:
     dependencies:
       '@tailwindcss/vite':
@@ -569,7 +686,7 @@ importers:
         version: 0.561.0(react@19.2.3)
       nitro:
         specifier: 3.0.1-alpha.2
-        version: 3.0.1-alpha.2(chokidar@5.0.0)(ioredis@5.9.2)(lru-cache@11.2.4)(rolldown@1.0.0-rc.17)(rollup@4.60.1)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+        version: 3.0.1-alpha.2(aws4fetch@1.0.20)(chokidar@5.0.0)(ioredis@5.9.2)(lru-cache@11.2.4)(rolldown@1.0.0-rc.17)(rollup@4.60.1)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       react:
         specifier: ^19.2.3
         version: 19.2.3
@@ -706,7 +823,7 @@ importers:
         version: 0.561.0(react@19.2.3)
       nitro:
         specifier: latest
-        version: 3.0.260429-beta(chokidar@5.0.0)(dotenv@17.2.3)(giget@2.0.0)(jiti@2.6.1)(miniflare@4.20260609.0)(rollup@4.60.1)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+        version: 3.0.260429-beta(aws4fetch@1.0.20)(chokidar@5.0.0)(dotenv@17.2.3)(giget@2.0.0)(jiti@2.6.1)(miniflare@4.20260609.0)(rollup@4.60.1)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       radix-ui:
         specifier: ^1.4.3
         version: 1.4.3(@types/react-dom@19.2.3(@types/react@19.2.7))(@types/react@19.2.7)(react-dom@19.2.3(react@19.2.3))(react@19.2.3)
@@ -806,7 +923,7 @@ importers:
         version: link:../../packages/ai-solid-ui
       '@tanstack/nitro-v2-vite-plugin':
         specifier: ^1.154.7
-        version: 1.154.7(rolldown@1.0.0-rc.17)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+        version: 1.154.7(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       '@tanstack/router-plugin':
         specifier: ^1.158.4
         version: 1.159.5(@tanstack/react-router@1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3))(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
@@ -1151,6 +1268,21 @@ importers:
         specifier: ^4.2.0
         version: 4.2.1
 
+  packages/ai-claude-code:
+    devDependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../ai
+      '@tanstack/ai-sandbox':
+        specifier: workspace:*
+        version: link:../ai-sandbox
+      '@tanstack/ai-sandbox-local-process':
+        specifier: workspace:*
+        version: link:../ai-sandbox-local-process
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
   packages/ai-client:
     dependencies:
       '@tanstack/ai':
@@ -1266,6 +1398,21 @@ importers:
         specifier: ^4.21.0
         version: 4.21.0
 
+  packages/ai-codex:
+    devDependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../ai
+      '@tanstack/ai-sandbox':
+        specifier: workspace:*
+        version: link:../ai-sandbox
+      '@tanstack/ai-sandbox-local-process':
+        specifier: workspace:*
+        version: link:../ai-sandbox-local-process
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
   packages/ai-devtools:
     dependencies:
       '@tanstack/ai':
@@ -1382,6 +1529,22 @@ importers:
         specifier: ^4.2.0
         version: 4.3.6
 
+  packages/ai-gemini-cli:
+    dependencies:
+      '@agentclientprotocol/sdk':
+        specifier: ^0.25.0
+        version: 0.25.1(zod@4.3.6)
+    devDependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../ai
+      '@tanstack/ai-sandbox':
+        specifier: workspace:*
+        version: link:../ai-sandbox
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
   packages/ai-grok:
     dependencies:
       '@tanstack/ai-utils':
@@ -1552,6 +1715,22 @@ importers:
         specifier: ^4.2.0
         version: 4.3.6
 
+  packages/ai-opencode:
+    dependencies:
+      '@opencode-ai/sdk':
+        specifier: ^1.17.4
+        version: 1.17.7
+    devDependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../ai
+      '@tanstack/ai-sandbox':
+        specifier: workspace:*
+        version: link:../ai-sandbox
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
   packages/ai-openrouter:
     dependencies:
       '@openrouter/sdk':
@@ -1574,6 +1753,111 @@ importers:
         specifier: ^4.2.0
         version: 4.3.6
 
+  packages/ai-persistence:
+    devDependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../ai
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
+  packages/ai-persistence-cloudflare:
+    devDependencies:
+      '@cloudflare/workers-types':
+        specifier: ^4.20241230.0
+        version: 4.20260317.1
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../ai
+      '@tanstack/ai-persistence':
+        specifier: workspace:*
+        version: link:../ai-persistence
+      '@tanstack/ai-persistence-sql':
+        specifier: workspace:*
+        version: link:../ai-persistence-sql
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
+  packages/ai-persistence-drizzle:
+    devDependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../ai
+      '@tanstack/ai-persistence':
+        specifier: workspace:*
+        version: link:../ai-persistence
+      '@tanstack/ai-persistence-sql':
+        specifier: workspace:*
+        version: link:../ai-persistence-sql
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
+  packages/ai-persistence-postgres:
+    devDependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../ai
+      '@tanstack/ai-persistence':
+        specifier: workspace:*
+        version: link:../ai-persistence
+      '@tanstack/ai-persistence-sql':
+        specifier: workspace:*
+        version: link:../ai-persistence-sql
+      '@types/pg':
+        specifier: ^8.11.10
+        version: 8.20.0
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+      pg:
+        specifier: ^8.13.0
+        version: 8.21.0
+
+  packages/ai-persistence-prisma:
+    devDependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../ai
+      '@tanstack/ai-persistence':
+        specifier: workspace:*
+        version: link:../ai-persistence
+      '@tanstack/ai-persistence-sql':
+        specifier: workspace:*
+        version: link:../ai-persistence-sql
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
+  packages/ai-persistence-sql:
+    devDependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../ai
+      '@tanstack/ai-persistence':
+        specifier: workspace:*
+        version: link:../ai-persistence
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
+  packages/ai-persistence-sqlite:
+    devDependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../ai
+      '@tanstack/ai-persistence':
+        specifier: workspace:*
+        version: link:../ai-persistence
+      '@tanstack/ai-persistence-sql':
+        specifier: workspace:*
+        version: link:../ai-persistence-sql
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
   packages/ai-preact:
     dependencies:
       '@tanstack/ai':
@@ -1670,6 +1954,78 @@ importers:
         specifier: ^7.3.3
         version: 7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
 
+  packages/ai-sandbox:
+    dependencies:
+      '@modelcontextprotocol/sdk':
+        specifier: ^1.29.0
+        version: 1.29.0(zod@4.3.6)
+    devDependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../ai
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
+  packages/ai-sandbox-cloudflare:
+    dependencies:
+      '@cloudflare/sandbox':
+        specifier: ^0.12.1
+        version: 0.12.1(@opencode-ai/sdk@1.17.7)
+    devDependencies:
+      '@cloudflare/workers-types':
+        specifier: ^4.20241230.0
+        version: 4.20260317.1
+      '@tanstack/ai-sandbox':
+        specifier: workspace:*
+        version: link:../ai-sandbox
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
+  packages/ai-sandbox-docker:
+    dependencies:
+      dockerode:
+        specifier: ^4.0.2
+        version: 4.0.12
+    devDependencies:
+      '@tanstack/ai-sandbox':
+        specifier: workspace:*
+        version: link:../ai-sandbox
+      '@types/dockerode':
+        specifier: ^3.3.31
+        version: 3.3.47
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
+  packages/ai-sandbox-local-process:
+    devDependencies:
+      '@tanstack/ai-sandbox':
+        specifier: workspace:*
+        version: link:../ai-sandbox
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
+  packages/ai-sandbox-persistence:
+    devDependencies:
+      '@tanstack/ai':
+        specifier: workspace:*
+        version: link:../ai
+      '@tanstack/ai-persistence':
+        specifier: workspace:*
+        version: link:../ai-persistence
+      '@tanstack/ai-persistence-sql':
+        specifier: workspace:*
+        version: link:../ai-persistence-sql
+      '@tanstack/ai-sandbox':
+        specifier: workspace:*
+        version: link:../ai-sandbox
+      '@vitest/coverage-v8':
+        specifier: 4.0.14
+        version: 4.0.14(vitest@4.0.14(@opentelemetry/api@1.9.1)(@types/node@24.10.3)(happy-dom@20.0.11)(jiti@2.6.1)(jsdom@27.3.0(postcss@8.5.15))(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+
   packages/ai-solid:
     dependencies:
       '@tanstack/ai-client':
@@ -1972,6 +2328,9 @@ importers:
       '@tanstack/ai-anthropic':
         specifier: workspace:*
         version: link:../../packages/ai-anthropic
+      '@tanstack/ai-claude-code':
+        specifier: workspace:*
+        version: link:../../packages/ai-claude-code
       '@tanstack/ai-client':
         specifier: workspace:*
         version: link:../../packages/ai-client
@@ -2010,7 +2369,7 @@ importers:
         version: 0.4.1
       '@tanstack/nitro-v2-vite-plugin':
         specifier: ^1.154.7
-        version: 1.154.7(rolldown@1.0.0-rc.17)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+        version: 1.154.7(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       '@tanstack/react-ai-devtools':
         specifier: workspace:*
         version: link:../../packages/react-ai-devtools
@@ -2122,7 +2481,7 @@ importers:
         version: link:../../packages/ai-react-ui
       '@tanstack/nitro-v2-vite-plugin':
         specifier: ^1.154.7
-        version: 1.154.7(rolldown@1.0.0-rc.17)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+        version: 1.154.7(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       '@tanstack/react-router':
         specifier: ^1.158.4
         version: 1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3)
@@ -2131,7 +2490,7 @@ importers:
         version: 1.159.5(crossws@0.4.5(srvx@0.11.15))(react-dom@19.2.3(react@19.2.3))(react@19.2.3)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       '@tanstack/start':
         specifier: ^1.120.20
-        version: 1.120.20(@types/node@24.10.3)(crossws@0.4.5(srvx@0.11.15))(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(react-dom@19.2.3(react@19.2.3))(react@19.2.3)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))(yaml@2.8.2)
+        version: 1.120.20(@types/node@24.10.3)(aws4fetch@1.0.20)(crossws@0.4.5(srvx@0.11.15))(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(react-dom@19.2.3(react@19.2.3))(react@19.2.3)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))(yaml@2.8.2)
       highlight.js:
         specifier: ^11.11.1
         version: 11.11.1
@@ -2236,6 +2595,11 @@ packages:
   '@ag-ui/core@0.0.52':
     resolution: {integrity: sha512-Xo0bUaNV56EqylzcrAuhUkQX7et7+SZIrqZZtEByGwEq/I1EHny6ZMkWHLkKR7UNi0FJZwJyhKYmKJS3B2SEgA==}
 
+  '@agentclientprotocol/sdk@0.25.1':
+    resolution: {integrity: sha512-jx2rF3bdpGwZ75Q/meyEDLLbYmbtxk82Uh9hDCdxDvcEedBnNSF5hZAnL/kJR5VNz56JqwOmqnAqasC84MwwkQ==}
+    peerDependencies:
+      zod: ^3.25.0 || ^4.0.0
+
   '@ampproject/remapping@2.3.0':
     resolution: {integrity: sha512-30iZtAPgz+LTIYoeivqYo853f02jBYSd5uGnGpkFV0M3xOt9aN73erkgYAmZU43x4VfqcnLxW9Kpg3R5LC4YYw==}
     engines: {node: '>=6.0.0'}
@@ -2934,6 +3298,9 @@ packages:
     resolution: {integrity: sha512-4zBIxpPzowiZpusoFkyGVwakdRJUyuH5PxQ/PrqghfdFWWasvnCdPfQXHrenDai+gyLARulZjZowCOj6fjT4pA==}
     engines: {node: '>=6.9.0'}
 
+  '@balena/dockerignore@1.0.2':
+    resolution: {integrity: sha512-wMue2Sy4GAVTk6Ic4tJVcnfdau+gx2EnG7S+uAEe+TWJFqE4YoWN4/H8MSLj4eYJKxGg26lZwboEniNiNwZQ6Q==}
+
   '@bcoe/v8-coverage@1.0.2':
     resolution: {integrity: sha512-6zABk/ECA/QYSCQ1NGiVwwbQerUCZ+TQbp64Q3AgmfNvurHH0j8TtXa1qbShXA6qqkpAj4V5W8pP6mLe1mcMqA==}
     engines: {node: '>=18'}
@@ -3002,6 +3369,9 @@ packages:
   '@changesets/write@0.4.0':
     resolution: {integrity: sha512-CdTLvIOPiCNuH71pyDu3rA+Q0n65cmAbXnwWH84rKGiFumFzkmHNT8KHTMEchcxN+Kl8I54xGUhJ7l3E7X396Q==}
 
+  '@cloudflare/containers@0.3.7':
+    resolution: {integrity: sha512-DM9dm3FnIBSyiSJ1FLavKwl/lk3oAmTaynCzZQ9pZR0ncRPquSxkxd8Nu2MFILxmDDsPkxKsSNEh9mHHMty4Fw==}
+
   '@cloudflare/kv-asset-handler@0.4.2':
     resolution: {integrity: sha512-SIOD2DxrRRwQ+jgzlXCqoEFiKOFqaPjhnNTGKXSRLvp1HiOvapLaFG2kEr9dYQTYe8rKrd9uvDUzmAITeNyaHQ==}
     engines: {node: '>=18.0.0'}
@@ -3010,6 +3380,20 @@ packages:
     resolution: {integrity: sha512-jxQYkj8dSIzc0cD6cMMNdOc1UVjqSqu8BZdor5s8cGjW2I8BjODt/kWPVdY+u9zj3ms75Q5qaZgnxUad83+eAg==}
     engines: {node: '>=22.0.0'}
 
+  '@cloudflare/sandbox@0.12.1':
+    resolution: {integrity: sha512-P1ZmNDLYtuEY1ZUcAx0OgTol98VqS617LGd4nf1RTOjSV2yHLDAp59NI36/gg3/pxkHPgmAEyFIjH/ie8FoA7g==}
+    peerDependencies:
+      '@openai/agents': ^0.3.3
+      '@opencode-ai/sdk': ^1.1.40
+      '@xterm/xterm': '>=5.0.0'
+    peerDependenciesMeta:
+      '@openai/agents':
+        optional: true
+      '@opencode-ai/sdk':
+        optional: true
+      '@xterm/xterm':
+        optional: true
+
   '@cloudflare/unenv-preset@2.16.1':
     resolution: {integrity: sha512-ECxObrMfyTl5bhQf/lZCXwo5G6xX9IAUo+nDMKK4SZ8m4Jvvxp52vilxyySSWh2YTZz8+HQ07qGH/2rEom1vDw==}
     peerDependencies:
@@ -3188,12 +3572,6 @@ packages:
     cpu: [ppc64]
     os: [aix]
 
-  '@esbuild/aix-ppc64@0.27.2':
-    resolution: {integrity: sha512-GZMB+a0mOMZs4MpDbj8RJp4cw+w1WV5NYD6xzgvzUJ5Ek2jerwfO2eADyI6ExDSUED+1X8aMbegahsJi+8mgpw==}
-    engines: {node: '>=18'}
-    cpu: [ppc64]
-    os: [aix]
-
   '@esbuild/aix-ppc64@0.27.3':
     resolution: {integrity: sha512-9fJMTNFTWZMh5qwrBItuziu834eOCUcEqymSH7pY+zoMVEZg3gcPuBNxH1EvfVYe9h0x/Ptw8KBzv7qxb7l8dg==}
     engines: {node: '>=18'}
@@ -3218,12 +3596,6 @@ packages:
     cpu: [arm64]
     os: [android]
 
-  '@esbuild/android-arm64@0.27.2':
-    resolution: {integrity: sha512-pvz8ZZ7ot/RBphf8fv60ljmaoydPU12VuXHImtAs0XhLLw+EXBi2BLe3OYSBslR4rryHvweW5gmkKFwTiFy6KA==}
-    engines: {node: '>=18'}
-    cpu: [arm64]
-    os: [android]
-
   '@esbuild/android-arm64@0.27.3':
     resolution: {integrity: sha512-YdghPYUmj/FX2SYKJ0OZxf+iaKgMsKHVPF1MAq/P8WirnSpCStzKJFjOjzsW0QQ7oIAiccHdcqjbHmJxRb/dmg==}
     engines: {node: '>=18'}
@@ -3248,12 +3620,6 @@ packages:
     cpu: [arm]
     os: [android]
 
-  '@esbuild/android-arm@0.27.2':
-    resolution: {integrity: sha512-DVNI8jlPa7Ujbr1yjU2PfUSRtAUZPG9I1RwW4F4xFB1Imiu2on0ADiI/c3td+KmDtVKNbi+nffGDQMfcIMkwIA==}
-    engines: {node: '>=18'}
-    cpu: [arm]
-    os: [android]
-
   '@esbuild/android-arm@0.27.3':
     resolution: {integrity: sha512-i5D1hPY7GIQmXlXhs2w8AWHhenb00+GxjxRncS2ZM7YNVGNfaMxgzSGuO8o8SJzRc/oZwU2bcScvVERk03QhzA==}
     engines: {node: '>=18'}
@@ -3278,12 +3644,6 @@ packages:
     cpu: [x64]
     os: [android]
 
-  '@esbuild/android-x64@0.27.2':
-    resolution: {integrity: sha512-z8Ank4Byh4TJJOh4wpz8g2vDy75zFL0TlZlkUkEwYXuPSgX8yzep596n6mT7905kA9uHZsf/o2OJZubl2l3M7A==}
-    engines: {node: '>=18'}
-    cpu: [x64]
-    os: [android]
-
   '@esbuild/android-x64@0.27.3':
     resolution: {integrity: sha512-IN/0BNTkHtk8lkOM8JWAYFg4ORxBkZQf9zXiEOfERX/CzxW3Vg1ewAhU7QSWQpVIzTW+b8Xy+lGzdYXV6UZObQ==}
     engines: {node: '>=18'}
@@ -3308,12 +3668,6 @@ packages:
     cpu: [arm64]
     os: [darwin]
 
-  '@esbuild/darwin-arm64@0.27.2':
-    resolution: {integrity: sha512-davCD2Zc80nzDVRwXTcQP/28fiJbcOwvdolL0sOiOsbwBa72kegmVU0Wrh1MYrbuCL98Omp5dVhQFWRKR2ZAlg==}
-    engines: {node: '>=18'}
-    cpu: [arm64]
-    os: [darwin]
-
   '@esbuild/darwin-arm64@0.27.3':
     resolution: {integrity: sha512-Re491k7ByTVRy0t3EKWajdLIr0gz2kKKfzafkth4Q8A5n1xTHrkqZgLLjFEHVD+AXdUGgQMq+Godfq45mGpCKg==}
     engines: {node: '>=18'}
@@ -3338,12 +3692,6 @@ packages:
     cpu: [x64]
     os: [darwin]
 
-  '@esbuild/darwin-x64@0.27.2':
-    resolution: {integrity: sha512-ZxtijOmlQCBWGwbVmwOF/UCzuGIbUkqB1faQRf5akQmxRJ1ujusWsb3CVfk/9iZKr2L5SMU5wPBi1UWbvL+VQA==}
-    engines: {node: '>=18'}
-    cpu: [x64]
-    os: [darwin]
-
   '@esbuild/darwin-x64@0.27.3':
     resolution: {integrity: sha512-vHk/hA7/1AckjGzRqi6wbo+jaShzRowYip6rt6q7VYEDX4LEy1pZfDpdxCBnGtl+A5zq8iXDcyuxwtv3hNtHFg==}
     engines: {node: '>=18'}
@@ -3368,12 +3716,6 @@ packages:
     cpu: [arm64]
     os: [freebsd]
 
-  '@esbuild/freebsd-arm64@0.27.2':
-    resolution: {integrity: sha512-lS/9CN+rgqQ9czogxlMcBMGd+l8Q3Nj1MFQwBZJyoEKI50XGxwuzznYdwcav6lpOGv5BqaZXqvBSiB/kJ5op+g==}
-    engines: {node: '>=18'}
-    cpu: [arm64]
-    os: [freebsd]
-
   '@esbuild/freebsd-arm64@0.27.3':
     resolution: {integrity: sha512-ipTYM2fjt3kQAYOvo6vcxJx3nBYAzPjgTCk7QEgZG8AUO3ydUhvelmhrbOheMnGOlaSFUoHXB6un+A7q4ygY9w==}
     engines: {node: '>=18'}
@@ -3398,12 +3740,6 @@ packages:
     cpu: [x64]
     os: [freebsd]
 
-  '@esbuild/freebsd-x64@0.27.2':
-    resolution: {integrity: sha512-tAfqtNYb4YgPnJlEFu4c212HYjQWSO/w/h/lQaBK7RbwGIkBOuNKQI9tqWzx7Wtp7bTPaGC6MJvWI608P3wXYA==}
-    engines: {node: '>=18'}
-    cpu: [x64]
-    os: [freebsd]
-
   '@esbuild/freebsd-x64@0.27.3':
     resolution: {integrity: sha512-dDk0X87T7mI6U3K9VjWtHOXqwAMJBNN2r7bejDsc+j03SEjtD9HrOl8gVFByeM0aJksoUuUVU9TBaZa2rgj0oA==}
     engines: {node: '>=18'}
@@ -3428,12 +3764,6 @@ packages:
     cpu: [arm64]
     os: [linux]
 
-  '@esbuild/linux-arm64@0.27.2':
-    resolution: {integrity: sha512-hYxN8pr66NsCCiRFkHUAsxylNOcAQaxSSkHMMjcpx0si13t1LHFphxJZUiGwojB1a/Hd5OiPIqDdXONia6bhTw==}
-    engines: {node: '>=18'}
-    cpu: [arm64]
-    os: [linux]
-
   '@esbuild/linux-arm64@0.27.3':
     resolution: {integrity: sha512-sZOuFz/xWnZ4KH3YfFrKCf1WyPZHakVzTiqji3WDc0BCl2kBwiJLCXpzLzUBLgmp4veFZdvN5ChW4Eq/8Fc2Fg==}
     engines: {node: '>=18'}
@@ -3458,12 +3788,6 @@ packages:
     cpu: [arm]
     os: [linux]
 
-  '@esbuild/linux-arm@0.27.2':
-    resolution: {integrity: sha512-vWfq4GaIMP9AIe4yj1ZUW18RDhx6EPQKjwe7n8BbIecFtCQG4CfHGaHuh7fdfq+y3LIA2vGS/o9ZBGVxIDi9hw==}
-    engines: {node: '>=18'}
-    cpu: [arm]
-    os: [linux]
-
   '@esbuild/linux-arm@0.27.3':
     resolution: {integrity: sha512-s6nPv2QkSupJwLYyfS+gwdirm0ukyTFNl3KTgZEAiJDd+iHZcbTPPcWCcRYH+WlNbwChgH2QkE9NSlNrMT8Gfw==}
     engines: {node: '>=18'}
@@ -3488,12 +3812,6 @@ packages:
     cpu: [ia32]
     os: [linux]
 
-  '@esbuild/linux-ia32@0.27.2':
-    resolution: {integrity: sha512-MJt5BRRSScPDwG2hLelYhAAKh9imjHK5+NE/tvnRLbIqUWa+0E9N4WNMjmp/kXXPHZGqPLxggwVhz7QP8CTR8w==}
-    engines: {node: '>=18'}
-    cpu: [ia32]
-    os: [linux]
-
   '@esbuild/linux-ia32@0.27.3':
     resolution: {integrity: sha512-yGlQYjdxtLdh0a3jHjuwOrxQjOZYD/C9PfdbgJJF3TIZWnm/tMd/RcNiLngiu4iwcBAOezdnSLAwQDPqTmtTYg==}
     engines: {node: '>=18'}
@@ -3518,12 +3836,6 @@ packages:
     cpu: [loong64]
     os: [linux]
 
-  '@esbuild/linux-loong64@0.27.2':
-    resolution: {integrity: sha512-lugyF1atnAT463aO6KPshVCJK5NgRnU4yb3FUumyVz+cGvZbontBgzeGFO1nF+dPueHD367a2ZXe1NtUkAjOtg==}
-    engines: {node: '>=18'}
-    cpu: [loong64]
-    os: [linux]
-
   '@esbuild/linux-loong64@0.27.3':
     resolution: {integrity: sha512-WO60Sn8ly3gtzhyjATDgieJNet/KqsDlX5nRC5Y3oTFcS1l0KWba+SEa9Ja1GfDqSF1z6hif/SkpQJbL63cgOA==}
     engines: {node: '>=18'}
@@ -3548,12 +3860,6 @@ packages:
     cpu: [mips64el]
     os: [linux]
 
-  '@esbuild/linux-mips64el@0.27.2':
-    resolution: {integrity: sha512-nlP2I6ArEBewvJ2gjrrkESEZkB5mIoaTswuqNFRv/WYd+ATtUpe9Y09RnJvgvdag7he0OWgEZWhviS1OTOKixw==}
-    engines: {node: '>=18'}
-    cpu: [mips64el]
-    os: [linux]
-
   '@esbuild/linux-mips64el@0.27.3':
     resolution: {integrity: sha512-APsymYA6sGcZ4pD6k+UxbDjOFSvPWyZhjaiPyl/f79xKxwTnrn5QUnXR5prvetuaSMsb4jgeHewIDCIWljrSxw==}
     engines: {node: '>=18'}
@@ -3578,12 +3884,6 @@ packages:
     cpu: [ppc64]
     os: [linux]
 
-  '@esbuild/linux-ppc64@0.27.2':
-    resolution: {integrity: sha512-C92gnpey7tUQONqg1n6dKVbx3vphKtTHJaNG2Ok9lGwbZil6DrfyecMsp9CrmXGQJmZ7iiVXvvZH6Ml5hL6XdQ==}
-    engines: {node: '>=18'}
-    cpu: [ppc64]
-    os: [linux]
-
   '@esbuild/linux-ppc64@0.27.3':
     resolution: {integrity: sha512-eizBnTeBefojtDb9nSh4vvVQ3V9Qf9Df01PfawPcRzJH4gFSgrObw+LveUyDoKU3kxi5+9RJTCWlj4FjYXVPEA==}
     engines: {node: '>=18'}
@@ -3608,12 +3908,6 @@ packages:
     cpu: [riscv64]
     os: [linux]
 
-  '@esbuild/linux-riscv64@0.27.2':
-    resolution: {integrity: sha512-B5BOmojNtUyN8AXlK0QJyvjEZkWwy/FKvakkTDCziX95AowLZKR6aCDhG7LeF7uMCXEJqwa8Bejz5LTPYm8AvA==}
-    engines: {node: '>=18'}
-    cpu: [riscv64]
-    os: [linux]
-
   '@esbuild/linux-riscv64@0.27.3':
     resolution: {integrity: sha512-3Emwh0r5wmfm3ssTWRQSyVhbOHvqegUDRd0WhmXKX2mkHJe1SFCMJhagUleMq+Uci34wLSipf8Lagt4LlpRFWQ==}
     engines: {node: '>=18'}
@@ -3638,12 +3932,6 @@ packages:
     cpu: [s390x]
     os: [linux]
 
-  '@esbuild/linux-s390x@0.27.2':
-    resolution: {integrity: sha512-p4bm9+wsPwup5Z8f4EpfN63qNagQ47Ua2znaqGH6bqLlmJ4bx97Y9JdqxgGZ6Y8xVTixUnEkoKSHcpRlDnNr5w==}
-    engines: {node: '>=18'}
-    cpu: [s390x]
-    os: [linux]
-
   '@esbuild/linux-s390x@0.27.3':
     resolution: {integrity: sha512-pBHUx9LzXWBc7MFIEEL0yD/ZVtNgLytvx60gES28GcWMqil8ElCYR4kvbV2BDqsHOvVDRrOxGySBM9Fcv744hw==}
     engines: {node: '>=18'}
@@ -3668,12 +3956,6 @@ packages:
     cpu: [x64]
     os: [linux]
 
-  '@esbuild/linux-x64@0.27.2':
-    resolution: {integrity: sha512-uwp2Tip5aPmH+NRUwTcfLb+W32WXjpFejTIOWZFw/v7/KnpCDKG66u4DLcurQpiYTiYwQ9B7KOeMJvLCu/OvbA==}
-    engines: {node: '>=18'}
-    cpu: [x64]
-    os: [linux]
-
   '@esbuild/linux-x64@0.27.3':
     resolution: {integrity: sha512-Czi8yzXUWIQYAtL/2y6vogER8pvcsOsk5cpwL4Gk5nJqH5UZiVByIY8Eorm5R13gq+DQKYg0+JyQoytLQas4dA==}
     engines: {node: '>=18'}
@@ -3692,12 +3974,6 @@ packages:
     cpu: [arm64]
     os: [netbsd]
 
-  '@esbuild/netbsd-arm64@0.27.2':
-    resolution: {integrity: sha512-Kj6DiBlwXrPsCRDeRvGAUb/LNrBASrfqAIok+xB0LxK8CHqxZ037viF13ugfsIpePH93mX7xfJp97cyDuTZ3cw==}
-    engines: {node: '>=18'}
-    cpu: [arm64]
-    os: [netbsd]
-
   '@esbuild/netbsd-arm64@0.27.3':
     resolution: {integrity: sha512-sDpk0RgmTCR/5HguIZa9n9u+HVKf40fbEUt+iTzSnCaGvY9kFP0YKBWZtJaraonFnqef5SlJ8/TiPAxzyS+UoA==}
     engines: {node: '>=18'}
@@ -3722,12 +3998,6 @@ packages:
     cpu: [x64]
     os: [netbsd]
 
-  '@esbuild/netbsd-x64@0.27.2':
-    resolution: {integrity: sha512-HwGDZ0VLVBY3Y+Nw0JexZy9o/nUAWq9MlV7cahpaXKW6TOzfVno3y3/M8Ga8u8Yr7GldLOov27xiCnqRZf0tCA==}
-    engines: {node: '>=18'}
-    cpu: [x64]
-    os: [netbsd]
-
   '@esbuild/netbsd-x64@0.27.3':
     resolution: {integrity: sha512-P14lFKJl/DdaE00LItAukUdZO5iqNH7+PjoBm+fLQjtxfcfFE20Xf5CrLsmZdq5LFFZzb5JMZ9grUwvtVYzjiA==}
     engines: {node: '>=18'}
@@ -3746,12 +4016,6 @@ packages:
     cpu: [arm64]
     os: [openbsd]
 
-  '@esbuild/openbsd-arm64@0.27.2':
-    resolution: {integrity: sha512-DNIHH2BPQ5551A7oSHD0CKbwIA/Ox7+78/AWkbS5QoRzaqlev2uFayfSxq68EkonB+IKjiuxBFoV8ESJy8bOHA==}
-    engines: {node: '>=18'}
-    cpu: [arm64]
-    os: [openbsd]
-
   '@esbuild/openbsd-arm64@0.27.3':
     resolution: {integrity: sha512-AIcMP77AvirGbRl/UZFTq5hjXK+2wC7qFRGoHSDrZ5v5b8DK/GYpXW3CPRL53NkvDqb9D+alBiC/dV0Fb7eJcw==}
     engines: {node: '>=18'}
@@ -3776,12 +4040,6 @@ packages:
     cpu: [x64]
     os: [openbsd]
 
-  '@esbuild/openbsd-x64@0.27.2':
-    resolution: {integrity: sha512-/it7w9Nb7+0KFIzjalNJVR5bOzA9Vay+yIPLVHfIQYG/j+j9VTH84aNB8ExGKPU4AzfaEvN9/V4HV+F+vo8OEg==}
-    engines: {node: '>=18'}
-    cpu: [x64]
-    os: [openbsd]
-
   '@esbuild/openbsd-x64@0.27.3':
     resolution: {integrity: sha512-DnW2sRrBzA+YnE70LKqnM3P+z8vehfJWHXECbwBmH/CU51z6FiqTQTHFenPlHmo3a8UgpLyH3PT+87OViOh1AQ==}
     engines: {node: '>=18'}
@@ -3800,12 +4058,6 @@ packages:
     cpu: [arm64]
     os: [openharmony]
 
-  '@esbuild/openharmony-arm64@0.27.2':
-    resolution: {integrity: sha512-LRBbCmiU51IXfeXk59csuX/aSaToeG7w48nMwA6049Y4J4+VbWALAuXcs+qcD04rHDuSCSRKdmY63sruDS5qag==}
-    engines: {node: '>=18'}
-    cpu: [arm64]
-    os: [openharmony]
-
   '@esbuild/openharmony-arm64@0.27.3':
     resolution: {integrity: sha512-NinAEgr/etERPTsZJ7aEZQvvg/A6IsZG/LgZy+81wON2huV7SrK3e63dU0XhyZP4RKGyTm7aOgmQk0bGp0fy2g==}
     engines: {node: '>=18'}
@@ -3830,12 +4082,6 @@ packages:
     cpu: [x64]
     os: [sunos]
 
-  '@esbuild/sunos-x64@0.27.2':
-    resolution: {integrity: sha512-kMtx1yqJHTmqaqHPAzKCAkDaKsffmXkPHThSfRwZGyuqyIeBvf08KSsYXl+abf5HDAPMJIPnbBfXvP2ZC2TfHg==}
-    engines: {node: '>=18'}
-    cpu: [x64]
-    os: [sunos]
-
   '@esbuild/sunos-x64@0.27.3':
     resolution: {integrity: sha512-PanZ+nEz+eWoBJ8/f8HKxTTD172SKwdXebZ0ndd953gt1HRBbhMsaNqjTyYLGLPdoWHy4zLU7bDVJztF5f3BHA==}
     engines: {node: '>=18'}
@@ -3860,12 +4106,6 @@ packages:
     cpu: [arm64]
     os: [win32]
 
-  '@esbuild/win32-arm64@0.27.2':
-    resolution: {integrity: sha512-Yaf78O/B3Kkh+nKABUF++bvJv5Ijoy9AN1ww904rOXZFLWVc5OLOfL56W+C8F9xn5JQZa3UX6m+IktJnIb1Jjg==}
-    engines: {node: '>=18'}
-    cpu: [arm64]
-    os: [win32]
-
   '@esbuild/win32-arm64@0.27.3':
     resolution: {integrity: sha512-B2t59lWWYrbRDw/tjiWOuzSsFh1Y/E95ofKz7rIVYSQkUYBjfSgf6oeYPNWHToFRr2zx52JKApIcAS/D5TUBnA==}
     engines: {node: '>=18'}
@@ -3890,12 +4130,6 @@ packages:
     cpu: [ia32]
     os: [win32]
 
-  '@esbuild/win32-ia32@0.27.2':
-    resolution: {integrity: sha512-Iuws0kxo4yusk7sw70Xa2E2imZU5HoixzxfGCdxwBdhiDgt9vX9VUCBhqcwY7/uh//78A1hMkkROMJq9l27oLQ==}
-    engines: {node: '>=18'}
-    cpu: [ia32]
-    os: [win32]
-
   '@esbuild/win32-ia32@0.27.3':
     resolution: {integrity: sha512-QLKSFeXNS8+tHW7tZpMtjlNb7HKau0QDpwm49u0vUp9y1WOF+PEzkU84y9GqYaAVW8aH8f3GcBck26jh54cX4Q==}
     engines: {node: '>=18'}
@@ -3920,12 +4154,6 @@ packages:
     cpu: [x64]
     os: [win32]
 
-  '@esbuild/win32-x64@0.27.2':
-    resolution: {integrity: sha512-sRdU18mcKf7F+YgheI/zGf5alZatMUTKj/jNS6l744f9u3WFu4v7twcUI9vu4mknF4Y9aDlblIie0IM+5xxaqQ==}
-    engines: {node: '>=18'}
-    cpu: [x64]
-    os: [win32]
-
   '@esbuild/win32-x64@0.27.3':
     resolution: {integrity: sha512-4uJGhsxuptu3OcpVAzli+/gWusVGwZZHTlS63hh++ehExkVT8SgiEf7/uC/PclrPPkLhZqGgCTjd0VWLo6xMqA==}
     engines: {node: '>=18'}
@@ -4192,6 +4420,20 @@ packages:
       '@modelcontextprotocol/sdk':
         optional: true
 
+  '@grpc/grpc-js@1.14.4':
+    resolution: {integrity: sha512-k9Dj3DV/itK9D06Y8f190Qgop7/Ui+D0njFV3LHMPwPT75DpXLQohE9Wmz0QElrJnzsjB7KPWiKJbOl7IPDArQ==}
+    engines: {node: '>=12.10.0'}
+
+  '@grpc/proto-loader@0.7.15':
+    resolution: {integrity: sha512-tMXdRCfYVixjuFK+Hk0Q1s38gV9zDiDJfWL3h1rv4Qc39oILCu1TRTDt7+fGUI8K4G1Fj125Hx/ru3azECWTyQ==}
+    engines: {node: '>=6'}
+    hasBin: true
+
+  '@grpc/proto-loader@0.8.1':
+    resolution: {integrity: sha512-wtF6h+DY6M3YaDBPAmvuuA6jV8Sif9MjtOI5euKFWRgCDl5PeDpPsHR9u2l6St5ceY8AZgoNDww5+HvEsXFsGg==}
+    engines: {node: '>=6'}
+    hasBin: true
+
   '@harperfast/extended-iterable@1.0.3':
     resolution: {integrity: sha512-sSAYhQca3rDWtQUHSAPeO7axFIUJOI6hn1gjRC5APVE1a90tuyT8f5WIgRsFhhWA7htNkju2veB9eWL6YHi/Lw==}
 
@@ -4513,6 +4755,9 @@ packages:
   '@jridgewell/trace-mapping@0.3.9':
     resolution: {integrity: sha512-3Belt6tdc8bPgAtbcmdtNJlirVoTmEb5e2gC94PnkwEW9jI6CAHUeoG85tjWP5WquqfavoMtMwiG4P926ZKKuQ==}
 
+  '@js-sdsl/ordered-map@4.4.2':
+    resolution: {integrity: sha512-iUKgm52T8HOE/makSxjqoWhe95ZJA1/G1sYsGev2JDKUSS14KAgg1LHb+Ba+IPow0xflbnSkOsZcO08C7w1gYw==}
+
   '@jsdevtools/ono@7.1.3':
     resolution: {integrity: sha512-4JQNk+3mVzK3xh2rqd6RB4J46qUR19azEHBneZyTZM+c456qOrbbM/5xcR8huNCCcbVt7+UmizG6GuUvPvKUYg==}
 
@@ -4860,6 +5105,9 @@ packages:
     resolution: {integrity: sha512-T8TbSnGsxo6TDBJx/Sgv/BlVJL3tshxZP7Aq5R1mSnM5OcHY2dQaxLMu2+E8u3gN0MLOzdjurqN4ZRVuzQycOQ==}
     engines: {node: '>=8.0'}
 
+  '@opencode-ai/sdk@1.17.7':
+    resolution: {integrity: sha512-7q7StGM+N0OwUgRsmDc8Gyz3hMIH1XGig+qZ4lzWUpmSgFEjLx8U7R14GXY7KiMJVdbVf6FeaYloRz2Rcsma4A==}
+
   '@openrouter/sdk@0.12.35':
     resolution: {integrity: sha512-s4QVLLnG1AmfW3TjnnHUqGfsCkzwVK+kboGcZmKbde09m1DPqgzl4RUFt/HJ5v97MX8aEaN0UG3mKv2S+qj2Gw==}
 
@@ -5368,12 +5616,21 @@ packages:
   '@protobufjs/codegen@2.0.4':
     resolution: {integrity: sha512-YyFaikqM5sH0ziFZCN3xDC7zeGaB/d0IUb9CATugHWbd1FRFwWwt4ld4OYMPWu5a3Xe01mGAULCdqhMlPl29Jg==}
 
+  '@protobufjs/codegen@2.0.5':
+    resolution: {integrity: sha512-zgXFLzW3Ap33e6d0Wlj4MGIm6Ce8O89n/apUaGNB/jx+hw+ruWEp7EwGUshdLKVRCxZW12fp9r40E1mQrf/34g==}
+
   '@protobufjs/eventemitter@1.1.0':
     resolution: {integrity: sha512-j9ednRT81vYJ9OfVuXG6ERSTdEL1xVsNgqpkxMsbIabzSo3goCjDIveeGv5d03om39ML71RdmrGNjG5SReBP/Q==}
 
+  '@protobufjs/eventemitter@1.1.1':
+    resolution: {integrity: sha512-vW1GmwMZNnL+gMRaovlh9yZX74kc+TTU3FObkkurpMaRtBfLP3ldjS9KQWlwZgraRE0+dheEEoAxdzcJQ8eXZg==}
+
   '@protobufjs/fetch@1.1.0':
     resolution: {integrity: sha512-lljVXpqXebpsijW71PZaCYeIcE5on1w5DlQy5WH6GLbFryLUrBD4932W/E2BSpfRJWseIL4v/KPgBFxDOIdKpQ==}
 
+  '@protobufjs/fetch@1.1.1':
+    resolution: {integrity: sha512-GpptLrs57adMSuHi3VNj0mAF8dwh36LMaYF6XyJ6JMWlVsc+t42tm1HSEDmOs3A8fC9yyeisgLhsTVQokOZ0zw==}
+
   '@protobufjs/float@1.0.2':
     resolution: {integrity: sha512-Ddb+kVXlXst9d+R9PfTIxh1EdNkgoRe5tOX6t01f1lYWOvJnSPDBlG241QLzcyPdoNTsblLUdujGSE4RzrTZGQ==}
 
@@ -5389,6 +5646,9 @@ packages:
   '@protobufjs/utf8@1.1.0':
     resolution: {integrity: sha512-Vvn3zZrhQZkkBE8LSuW3em98c0FwgO4nxzv6OdSxPKJIEKY2bGbHn+mhGIPerzI4twdxaP8/0+06HBpwf345Lw==}
 
+  '@protobufjs/utf8@1.1.1':
+    resolution: {integrity: sha512-oOAWABowe8EAbMyWKM0tYDKi8Yaox52D+HWZhAIJqQXbqe0xI/GV7FhLWqlEKreMkfDjshR5FKgi3mnle0h6Eg==}
+
   '@publint/pack@0.1.2':
     resolution: {integrity: sha512-S+9ANAvUmjutrshV4jZjaiG8XQyuJIZ8a4utWmN/vW1sgQ9IfBnPndwkmQYw53QmouOIytT874u65HEmu6H5jw==}
     engines: {node: '>=18'}
@@ -7783,6 +8043,12 @@ packages:
   '@types/deep-eql@4.0.2':
     resolution: {integrity: sha512-c9h9dVVMigMPc4bwTvC5dxqtqJZwQPePsWjPlpSOnojbor6pGqdk541lfA7AqFQr5pB1BRdq0juY9db81BwyFw==}
 
+  '@types/docker-modem@3.0.6':
+    resolution: {integrity: sha512-yKpAGEuKRSS8wwx0joknWxsmLha78wNMe9R2S3UNsVOkZded8UqOrV8KoeDXoXsjndxwyF3eIhyClGbO1SEhEg==}
+
+  '@types/dockerode@3.3.47':
+    resolution: {integrity: sha512-ShM1mz7rCjdssXt7Xz0u1/R2BJC7piWa3SJpUBiVjCf2A3XNn4cP6pUVaD8bLanpPVVn4IKzJuw3dOvkJ8IbYw==}
+
   '@types/dom-mediacapture-record@1.0.22':
     resolution: {integrity: sha512-mUMZLK3NvwRLcAAT9qmcK+9p7tpU2FHdDsntR3YI4+GY88XrgG4XiE7u1Q2LAN2/FZOz/tdMDC3GQCR4T8nFuw==}
 
@@ -7828,12 +8094,18 @@ packages:
   '@types/node@12.20.55':
     resolution: {integrity: sha512-J8xLz7q2OFulZ2cyGTLE1TbbZcjpno7FaN6zdJNrgAdrJ+DZzh/uFR6YrTb4C+nXakvud8Q4+rbhoIWlYQbUFQ==}
 
+  '@types/node@18.19.130':
+    resolution: {integrity: sha512-GRaXQx6jGfL8sKfaIDD6OupbIHBr9jv7Jnaml9tB7l4v068PAOXqfcujMMo5PhbIs6ggR1XODELqahT2R8v0fg==}
+
   '@types/node@20.19.26':
     resolution: {integrity: sha512-0l6cjgF0XnihUpndDhk+nyD3exio3iKaYROSgvh/qSevPXax3L8p5DBRFjbvalnwatGgHEQn2R88y2fA3g4irg==}
 
   '@types/node@24.10.3':
     resolution: {integrity: sha512-gqkrWUsS8hcm0r44yn7/xZeV1ERva/nLgrLxFRUGb7aoNMIJfZJ3AC261zDQuOAKC7MiXai1WCpYc48jAHoShQ==}
 
+  '@types/pg@8.20.0':
+    resolution: {integrity: sha512-bEPFOaMAHTEP1EzpvHTbmwR8UsFyHSKsRisLIHVMXnpNefSbGA1bD6CVy+qKjGSqmZqNqBDV2azOBo8TgkcVow==}
+
   '@types/react-dom@19.2.3':
     resolution: {integrity: sha512-jp2L/eY6fn+KgVVQAOqYItbF0VY/YApe5Mz2F0aykSO8gx31bYCZyvSeYxCHKvzHG5eZjc+zyaS5BrBWya2+kQ==}
     peerDependencies:
@@ -7848,6 +8120,9 @@ packages:
   '@types/retry@0.12.0':
     resolution: {integrity: sha512-wWKOClTTiizcZhXnPY4wikVAwmdYHp8q6DmC+EJUzAMsycb7HB32Kh9RN4+0gExjmPmZSAQjgURXIGATPegAvA==}
 
+  '@types/ssh2@1.15.5':
+    resolution: {integrity: sha512-N1ASjp/nXH3ovBHddRJpli4ozpk6UdDYIX4RJWFa9L1YKnzdhTlVmiGHm4DZnj/jLbqZpes4aeR30EFGQtvhQQ==}
+
   '@types/unist@2.0.11':
     resolution: {integrity: sha512-CmBKiL6NNo/OqgmMn95Fk9Whlp2mtvIv+KNpQKN2F4SjvrEesubTRWGYSg+BnWZOnlCaSTU1sMpsBOzgbYhnsA==}
 
@@ -8475,6 +8750,9 @@ packages:
   asap@2.0.6:
     resolution: {integrity: sha512-BSHWgDSAiKs50o2Re8ppvp3seVHXSRM44cdSsT9FfNEUUZLOGWVCsiWaRPWM1Znn+mqZ1OfVZ3z3DWEzSp7hRA==}
 
+  asn1@0.2.6:
+    resolution: {integrity: sha512-ix/FxPn0MDjeyJ7i/yoHGFt/EX6LyNbxSEhPPXODPL+KB0VPk86UYfL0lMdy+KCnv+fmvIzySwaK5COwqVbWTQ==}
+
   assertion-error@2.0.1:
     resolution: {integrity: sha512-Izi8RQcffqCeNVgFigKli1ssklIbpHnCYc6AknXGYoB6grJqyeby7jv12JUQgmTAnIDnbck1uxksT4dzN3PWBA==}
     engines: {node: '>=12'}
@@ -8514,6 +8792,9 @@ packages:
     resolution: {integrity: sha512-wvUjBtSGN7+7SjNpq/9M2Tg350UZD3q62IFZLbRAR1bSMlCo1ZaeW+BJ+D090e4hIIZLBcTDWe4Mh4jvUDajzQ==}
     engines: {node: '>= 0.4'}
 
+  aws4fetch@1.0.20:
+    resolution: {integrity: sha512-/djoAN709iY65ETD6LKCtyyEI04XIBP5xVvfmNxsEP0uJB5tyaGBztSryRr4HqMStr9R06PisQE7m9zDTXKu6g==}
+
   axios@1.13.2:
     resolution: {integrity: sha512-VPk9ebNqPcy5lRGuSlKx752IlDatOjT9paPlm8A7yOuW2Fbvp4X3JznJtT4f0GzGLLiWE9W8onz51SqLYwzGaA==}
 
@@ -8651,6 +8932,9 @@ packages:
     engines: {node: '>=10.0.0'}
     deprecated: Security vulnerability fixed in 5.2.1, please upgrade
 
+  bcrypt-pbkdf@1.0.2:
+    resolution: {integrity: sha512-qeFIXtP4MSoi6NLqO12WfqARWWuCKi2Rn/9hJLEmtB5yTNr9DqFWkJRCf2qShWzPeAMRnOgCrq0sg/KLv5ES9w==}
+
   beasties@0.4.1:
     resolution: {integrity: sha512-2Imdcw3LznDuxAbJM26RHniOLAzE6WgrK8OuvVXCQtNBS8rsnD9zsSEa3fHl4hHpUY7BYTlrpvtPVbvu9G6neg==}
     engines: {node: '>=18.0.0'}
@@ -8751,6 +9035,10 @@ packages:
   buffer@6.0.3:
     resolution: {integrity: sha512-FTiCpNxtwiZZHEZbcbTIcZjERVICn9yq/pDFkTl95/AxzD1naBctN7YO68riM/gLSDY7sdrMby8hofADYuuqOA==}
 
+  buildcheck@0.0.7:
+    resolution: {integrity: sha512-lHblz4ahamxpTmnsk+MNTRWsjYKv965MwOrSJyeD588rR3Jcu7swE+0wN5F+PbL5cjgu/9ObkhfzEPuofEMwLA==}
+    engines: {node: '>=10.0.0'}
+
   bundle-require@5.1.0:
     resolution: {integrity: sha512-3WrrOuZiyaaZPWiEt4G3+IffISVC9HYlWueJEBWED4ZH4aIAC2PnkdnuRrR94M+w6yGWn4AglWtJtBI8YqvgoA==}
     engines: {node: ^12.20.0 || ^14.13.1 || >=16.0.0}
@@ -8811,6 +9099,9 @@ packages:
   capnweb@0.1.0:
     resolution: {integrity: sha512-+pygKx1JFTZTRdd1hHgaBRg5BwULEDZq8ZoHXkYP2GXNV3lrjXLj5qzlGz+SgBCJjWUmNBtlh7JPWdr0wIbY8w==}
 
+  capnweb@0.8.0:
+    resolution: {integrity: sha512-BK/TuXUiyfLSKsmjojn70yN7oYG/JJzoURZ3tckjg5Zj2KcygPm0A5jyOlswK7SYB4f0Gh9tt+RZ132b80iLfA==}
+
   ccount@2.0.1:
     resolution: {integrity: sha512-eyrF0jiFpY+3drT6383f1qhkbGsLSifNAjA61IUjZjmLCWjItY6LB9ft9YhoDgwfmclB2zhu51Lc7+95b8NRAg==}
 
@@ -8868,6 +9159,9 @@ packages:
     resolution: {integrity: sha512-TQMmc3w+5AxjpL8iIiwebF73dRDF4fBIieAqGn9RGCWaEVwQ6Fb2cGe31Yns0RRIzii5goJ1Y7xbMwo1TxMplw==}
     engines: {node: '>= 20.19.0'}
 
+  chownr@1.1.4:
+    resolution: {integrity: sha512-jJ0bqzaylmJtVnNgzTeSOs8DPavpbYgEr/b0YL8/2GO3xJEhInFmhKMUnEJQjZumK7KXGFhUy89PrsJWlakBVg==}
+
   chownr@3.0.0:
     resolution: {integrity: sha512-+IxzY9BZOQd/XuYPRmrvEVjF/nqj5kgT4kEq7VofrDoM1MxoRjEWkrCC3EtLi59TVawxTAn+orJwFQcrqEN1+g==}
     engines: {node: '>=18'}
@@ -9132,6 +9426,10 @@ packages:
       typescript:
         optional: true
 
+  cpu-features@0.0.10:
+    resolution: {integrity: sha512-9IkYqtX3YHPCzoVg1Py+o9057a3i0fp7S530UWokCSaFVTc7CwXPRiOjRjBQQ18ZCNafx78YfnG+HALxtVmOGA==}
+    engines: {node: '>=10.0.0'}
+
   crc-32@1.2.2:
     resolution: {integrity: sha512-ROmzCKrTnOwybPcJApAA6WBWij23HVfGVNKqqrZpuyZOHqK2CwHSvpGuyt/UNNvaIjEd8X5IFGp4Mh+Ie1IHJQ==}
     engines: {node: '>=0.8'}
@@ -9424,6 +9722,14 @@ packages:
   dnssd-advertise@1.1.4:
     resolution: {integrity: sha512-AmGyK9WpNf06WeP5TjHZq/wNzP76OuEeaiTlKr9E/EEelYLczywUKoqRz+DPRq/ErssjT4lU+/W7wzJW+7K/ZA==}
 
+  docker-modem@5.0.7:
+    resolution: {integrity: sha512-XJgGhoR/CLpqshm4d3L7rzH6t8NgDFUIIpztYlLHIApeJjMZKYJMz2zxPsYxnejq5h3ELYSw/RBsi3t5h7gNTA==}
+    engines: {node: '>= 8.0'}
+
+  dockerode@4.0.12:
+    resolution: {integrity: sha512-/bCZd6KlGcjZO8Buqmi/vXuqEGVEZ0PNjx/biBNqJD3MhK9DmdiAuKxqfNhflgDESDIiBz3qF+0e55+CpnrUcw==}
+    engines: {node: '>= 8.0'}
+
   dom-accessibility-api@0.5.16:
     resolution: {integrity: sha512-X7BJ2yElsnOJ30pZF4uIIDfBEVgF4XEBxL9Bxhy6dnrm5hkzqmsWHGTiHqRiITNhMyFLyAiWndIJP7Z1NTteDg==}
 
@@ -9621,11 +9927,6 @@ packages:
     engines: {node: '>=18'}
     hasBin: true
 
-  esbuild@0.27.2:
-    resolution: {integrity: sha512-HyNQImnsOC7X9PMNaCIeAm4ISCQXs5a5YasTXVliKv4uuBo1dKrG0A+uQS8M5eXjVMnLg3WgXaKvprHlFJQffw==}
-    engines: {node: '>=18'}
-    hasBin: true
-
   esbuild@0.27.3:
     resolution: {integrity: sha512-8VwMnyGCONIs6cWue2IdpHxHnAjzxnw2Zr7MkVxB2vjmQ2ivqGFb4LEG3SMnv0Gb2F/G/2yA8zUaiL1gywDCCg==}
     engines: {node: '>=18'}
@@ -10583,10 +10884,6 @@ packages:
     resolution: {integrity: sha512-tAAg/72/VxOUW7RQSX1pIxJVucYKcjFjfvj60L57jrZpYCHC3XN0WCQ3sNYL4Gmvv+7GPvTAjc+KSdeNuE8oWQ==}
     engines: {node: '>=12.22.0'}
 
-  ip-address@10.1.0:
-    resolution: {integrity: sha512-XXADHxXmvT9+CRxhXg56LJovE+bmWnEWB78LB83VZTprKTmaC5QfruXocxzTZ2Kl0DNwKuBdlIhjL8LeY8Sf8Q==}
-    engines: {node: '>= 12'}
-
   ip-address@10.2.0:
     resolution: {integrity: sha512-/+S6j4E9AHvW9SWMSEY9Xfy66O5PWvVEJ08O0y5JGyEKQpojb0K0GKpz/v5HJ/G0vi3D2sjGK78119oXZeE0qA==}
     engines: {node: '>= 12'}
@@ -11189,6 +11486,9 @@ packages:
     resolution: {integrity: sha512-iPZK6eYjbxRu3uB4/WZ3EsEIMJFMqAoopl3R+zuq0UjcAm/MO6KCweDgPfP3elTztoKP3KtnVHxTn2NHBSDVUw==}
     engines: {node: '>=10'}
 
+  lodash.camelcase@4.3.0:
+    resolution: {integrity: sha512-TwuEnCnxbc3rAvhf/LbG7tJUDzhqXyFnv3dtzLOPgCG/hODL7WFnsbwktkD7yUV0RrreP/l1PALq/YSg6VvjlA==}
+
   lodash.debounce@4.0.8:
     resolution: {integrity: sha512-FT1yDzDYEoYWhnSGnpE/4Kj1fLZkDFyqRb7fNt6FdYOSxlUWAtp42Eh6Wb0rGIv/m9Bgo7x4GhQbm5Ys4SG5ow==}
 
@@ -11679,6 +11979,9 @@ packages:
   mitt@3.0.1:
     resolution: {integrity: sha512-vKivATfr97l2/QBCYAkXYDbrIWPM2IIKEl7YPhjCvKlG3kE2gm+uBo6nEXK3M5/Ffh/FLpKExzOQ3JJoJGFKBw==}
 
+  mkdirp-classic@0.5.3:
+    resolution: {integrity: sha512-gKLcREMhtuZRwRAfqP3RFW+TK4JqApVBtOIftVgjuABpAtpxhPGaDcfvbhNvD0B8iD1oUr/txX35NjcaY6Ns/A==}
+
   mkdirp@1.0.4:
     resolution: {integrity: sha512-vVqVZQyf3WLx2Shd0qJ9xuvqgAyKPLAiqITEtqW0oIUjzo3PePDd6fW9iFz30ef7Ysp/oiWqbhszeGWW2T6Gzw==}
     engines: {node: '>=10'}
@@ -11735,6 +12038,9 @@ packages:
   mz@2.7.0:
     resolution: {integrity: sha512-z81GNO7nnYMEhrGh9LeymoE4+Yr0Wn5McHIZMK5cfQCl+NDX08sCZgUc9/6MHni9IWuFLm1Z3HTCXu2z9fN62Q==}
 
+  nan@2.27.0:
+    resolution: {integrity: sha512-hC+0LidcL3XE4rp1C4H54KujgXKzbfyTngZTwBByQxsOxCEKZT0MPQ4hOKUH2jU1OYstqdDH4onyHPDzcV0XdQ==}
+
   nanoid@3.3.11:
     resolution: {integrity: sha512-N8SpfPUnUp1bK+PMYW8qSWdl9U+wwNWI4QKxOYDy9JAro3WMX7p2OeVRF9v+347pnakNevPmiHhNmZ2HbFA76w==}
     engines: {node: ^10 || ^12 || ^13.7 || ^14 || >=15.0.1}
@@ -12251,6 +12557,40 @@ packages:
   perfect-debounce@2.0.0:
     resolution: {integrity: sha512-fkEH/OBiKrqqI/yIgjR92lMfs2K8105zt/VT6+7eTjNwisrsh47CeIED9z58zI7DfKdH3uHAn25ziRZn3kgAow==}
 
+  pg-cloudflare@1.4.0:
+    resolution: {integrity: sha512-Vo7z/6rrQYxpNRylp4Tlob2elzbh+N/MOQbxFVWCxS7oEx6jF53GTJFxK2WWpKuBRkmiin4Mt+xofFDjx09R0A==}
+
+  pg-connection-string@2.13.0:
+    resolution: {integrity: sha512-EMnU9E2fSULdsbErBbMaXJvFeD9B4+nPcM3f+4lsiCR0BHLPrLVjv3DbyM2hgQQviKJaTWIRRTjKjWlHg3p2ig==}
+
+  pg-int8@1.0.1:
+    resolution: {integrity: sha512-WCtabS6t3c8SkpDBUlb1kjOs7l66xsGdKpIPZsg4wR+B3+u9UAum2odSsF9tnvxg80h4ZxLWMy4pRjOsFIqQpw==}
+    engines: {node: '>=4.0.0'}
+
+  pg-pool@3.14.0:
+    resolution: {integrity: sha512-gKtPkFdQPU3DksooVLi9LsjZxrsBUZIpa+7aVx+LV5pNh0KzP4Zleud2po+ConrxbuXGBJ6Hfer6hdgpIBpBaw==}
+    peerDependencies:
+      pg: '>=8.0'
+
+  pg-protocol@1.14.0:
+    resolution: {integrity: sha512-n5taZ1kO3s9ngDTVxsEznOqCyToTgz0FLuPq0B33COy5pPpuWJpY3/2oRBVETuOgzdqRXfWpM9HIhp2LBBT1BA==}
+
+  pg-types@2.2.0:
+    resolution: {integrity: sha512-qTAAlrEsl8s4OiEQY69wDvcMIdQN6wdz5ojQiOy6YRMuynxenON0O5oCpJI6lshc6scgAY8qvJ2On/p+CXY0GA==}
+    engines: {node: '>=4'}
+
+  pg@8.21.0:
+    resolution: {integrity: sha512-AUP1EYJuHraQGsVoCQVIcM7TEJVGtDzxWtGFZd8rds9d+CCXlU5Js1rYgfLNvxy9iJrpHjGrRjoi/3BT9fRyiA==}
+    engines: {node: '>= 16.0.0'}
+    peerDependencies:
+      pg-native: '>=3.0.1'
+    peerDependenciesMeta:
+      pg-native:
+        optional: true
+
+  pgpass@1.0.5:
+    resolution: {integrity: sha512-FdW9r/jQZhSeohs1Z3sI1yxFQNFvMcnmfuj4WBMUTxOrAyLMaTcE1aAMBiTlbMNaXvBCQuVi0R7hd8udDSP7ug==}
+
   picocolors@1.1.1:
     resolution: {integrity: sha512-xceH2snhtb5M9liqDsmEw56le376mTZkEX/jEb/RxNFyegNul7eNslCXP9FDj/Lcu0X8KEyMceP2ntpaHrDEVA==}
 
@@ -12364,6 +12704,22 @@ packages:
     resolution: {integrity: sha512-7a70Nsot+EMX9fFU3064K/kdHWZqGVY+BADLyXc8Dfv+mTLLVl6JzJpPaCZ2kQL9gIJvKXSLMHhqdRRjwQeFtw==}
     engines: {node: ^10 || ^12 || >=14}
 
+  postgres-array@2.0.0:
+    resolution: {integrity: sha512-VpZrUqU5A69eQyW2c5CA1jtLecCsN2U/bD6VilrFDWq5+5UIEVO7nazS3TEcHf1zuPYO/sqGvUvW62g86RXZuA==}
+    engines: {node: '>=4'}
+
+  postgres-bytea@1.0.1:
+    resolution: {integrity: sha512-5+5HqXnsZPE65IJZSMkZtURARZelel2oXUEO8rH83VS/hxH5vv1uHquPg5wZs8yMAfdv971IU+kcPUczi7NVBQ==}
+    engines: {node: '>=0.10.0'}
+
+  postgres-date@1.0.7:
+    resolution: {integrity: sha512-suDmjLVQg78nMK2UZ454hAG+OAW+HQPZ6n++TNDUX+L0+uUlLywnoxJKDou51Zm+zTCjrCl0Nq6J9C5hP9vK/Q==}
+    engines: {node: '>=0.10.0'}
+
+  postgres-interval@1.2.0:
+    resolution: {integrity: sha512-9ZhXKM/rw350N1ovuWHbGxnGh/SNJ4cnxHiM0rxE4VN41wsg8P8zWn9hv/buK00RP4WvlOyr/RBDiptyxVbkZQ==}
+    engines: {node: '>=0.10.0'}
+
   preact@10.28.1:
     resolution: {integrity: sha512-u1/ixq/lVQI0CakKNvLDEcW5zfCjUQfZdK9qqWuIJtsezuyG6pk9TWj75GMuI/EzRSZB/VAE43sNWWZfiy8psw==}
 
@@ -12449,6 +12805,10 @@ packages:
     resolution: {integrity: sha512-CvexbZtbov6jW2eXAvLukXjXUW1TzFaivC46BpWc/3BpcCysb5Vffu+B3XHMm8lVEuy2Mm4XGex8hBSg1yapPg==}
     engines: {node: '>=12.0.0'}
 
+  protobufjs@7.6.4:
+    resolution: {integrity: sha512-RJJPTTpvFfHcWLkIa2JFWK4XvtSzS0yEWDmunqHXli1h3JlkbcQZXDZdcWxv+JK3Xsl5/UFDPZ0iGm7DAengYw==}
+    engines: {node: '>=12.0.0'}
+
   proxy-addr@2.0.7:
     resolution: {integrity: sha512-llQsMLSUDUPT44jdrU/O37qlnifitDP+ZwrmmZcoSKyLKvtZxpyV0n2/bD/N4tBAAZ/gJEdZU7KMraoK1+XYAg==}
     engines: {node: '>= 0.10'}
@@ -13229,6 +13589,13 @@ packages:
   spawndamnit@3.0.1:
     resolution: {integrity: sha512-MmnduQUuHCoFckZoWnXsTg7JaiLBJrKFj9UI2MbRPGaJeVpsLcVBu6P/IGZovziM/YBsellCmsprgNA+w0CzVg==}
 
+  split-ca@1.0.1:
+    resolution: {integrity: sha512-Q5thBSxp5t8WPTTJQS59LrGqOZqOsrhDGDVm8azCqIBjSBd7nd9o2PM+mDulQQkh8h//4U6hFZnc/mul8t5pWQ==}
+
+  split2@4.2.0:
+    resolution: {integrity: sha512-UcjcJOWknrNkF6PLX83qcHM6KHgVKNkV62Y8a5uYDVv9ydGQVwAHMKqHdJje1VTWpljG0WYpCDhrCdAOYH4TWg==}
+    engines: {node: '>= 10.x'}
+
   sprintf-js@1.0.3:
     resolution: {integrity: sha512-D9cPgkvLlV3t3IzL0D0YLvGA9Ahk4PcvVwUbN0dSGr1aP0Nrt4AEnTUbuGvquEC0mA64Gqt1fzirlRs5ibXx8g==}
 
@@ -13252,6 +13619,10 @@ packages:
     engines: {node: '>=20.16.0'}
     hasBin: true
 
+  ssh2@1.17.0:
+    resolution: {integrity: sha512-wPldCk3asibAjQ/kziWQQt1Wh3PgDFpC0XpwclzKcdT1vql6KeYxf5LIt4nlFkUeR8WuphYMKqUA56X4rjbfgQ==}
+    engines: {node: '>=10.16.0'}
+
   stable-hash-x@0.2.0:
     resolution: {integrity: sha512-o3yWv49B/o4QZk5ZcsALc6t0+eCelPc44zZsLtCQnZPDwFpDYSWcDnrv2TtMmMbQ7uKo3J0HTURCqckw23czNQ==}
     engines: {node: '>=12.0.0'}
@@ -13445,6 +13816,9 @@ packages:
     resolution: {integrity: sha512-g9ljZiwki/LfxmQADO3dEY1CbpmXT5Hm2fJ+QaGKwSXUylMybePR7/67YW7jOrrvjEgL1Fmz5kzyAjWVWLlucg==}
     engines: {node: '>=6'}
 
+  tar-fs@2.1.4:
+    resolution: {integrity: sha512-mDAjwmZdh7LTT6pNleZ05Yt65HC3E+NiQzl672vQG38jIrehtJk/J3mNwIg+vShQPcLF/LV7CMnDW6vjj6sfYQ==}
+
   tar-fs@3.1.2:
     resolution: {integrity: sha512-QGxxTxxyleAdyM3kpFs14ymbYmNFrfY+pHj7Z8FgtbZ7w2//VAgLMac7sT6nRpIHjppXO2AwwEOg0bPFVRcmXw==}
 
@@ -13679,6 +14053,9 @@ packages:
   tw-animate-css@1.4.0:
     resolution: {integrity: sha512-7bziOlRqH0hJx80h/3mbicLW7o8qLsH5+RaLR2t+OHM3D0JlWGODQKQ4cxbK7WlvmUxpcj6Kgu6EKqjrGFe3QQ==}
 
+  tweetnacl@0.14.5:
+    resolution: {integrity: sha512-KXXFFdAbFXY4geFIwoyNK+f5Z1b7swfXABfL7HXCmoIWMKU3dmS26672A4EeQtDzLKy7SXmfBu51JolvEKwtGA==}
+
   type-check@0.4.0:
     resolution: {integrity: sha512-XleUoc9uwGXqjWwXaUTZAmzMcFZ5858QA2vvx1Ur5xIcixXIP+8LnFDgRplU30us6teqdlskFfu+ae4K79Ooew==}
     engines: {node: '>= 0.8.0'}
@@ -13768,6 +14145,9 @@ packages:
   unctx@2.5.0:
     resolution: {integrity: sha512-p+Rz9x0R7X+CYDkT+Xg8/GhpcShTlU8n+cf9OtOEf7zEQsNcCZO1dPKNRDqvUTaq+P32PMMkxWHwfrxkqfqAYg==}
 
+  undici-types@5.26.5:
+    resolution: {integrity: sha512-JlCMO+ehdEIKqlFxk6IfVoAUVmgz7cU7zD/h9XZ0qzeosSHmUJVOzSQvvYSYWXkFXC+IfLKSIffhv0sVZup6pA==}
+
   undici-types@5.28.4:
     resolution: {integrity: sha512-3OeMF5Lyowe8VW0skf5qaIE7Or3yS9LS7fvMUI0gg4YxpIBVg0L8BxCmROw2CcYhSkpR68Epz7CGc8MPj94Uww==}
 
@@ -14154,6 +14534,11 @@ packages:
     resolution: {integrity: sha512-pMZTvIkT1d+TFGvDOqodOclx0QWkkgi6Tdoa8gC8ffGAAqz9pzPTZWAybbsHHoED/ztMtkv/VoYTYyShUn81hA==}
     engines: {node: '>= 0.4.0'}
 
+  uuid@10.0.0:
+    resolution: {integrity: sha512-8XkAphELsDnEGrDxUOHB3RGvXz6TeuYSGEZBOjtTtPm2lwhGBjLgOzLHB63IUWfBpNucQjND6d3AOudO+H3RWQ==}
+    deprecated: uuid@10 and below is no longer supported.  For ESM codebases, update to uuid@latest.  For CommonJS codebases, use uuid@11 (but be aware this version will likely be deprecated in 2028).
+    hasBin: true
+
   uuid@7.0.3:
     resolution: {integrity: sha512-DPSke0pXhTZgoF/d+WSt2QaKMCFSfx7QegxEWT+JOuHF5aWrKEn0G+ztjuJg/gG8/ItK+rbPCD/yNv8yyih6Cg==}
     deprecated: uuid@10 and below is no longer supported.  For ESM codebases, update to uuid@latest.  For CommonJS codebases, use uuid@11 (but be aware this version will likely be deprecated in 2028).
@@ -14770,6 +15155,10 @@ packages:
   xmlchars@2.2.0:
     resolution: {integrity: sha512-JZnDKK8B0RCDw84FNdDAIpZK+JuJw+s7Lz8nksI7SIuU3UXJJslUthsi+uWBUYOwPFwW7W7PRLRfUKpxjtjFCw==}
 
+  xtend@4.0.2:
+    resolution: {integrity: sha512-LKYU1iAXJXUgAXn9URjiu+MWhyUXHsvfp7mcuYm9dSUKK0/CjtrUwFAxD82/mCWbtLsGjFIad0wIsod4zrTAEQ==}
+    engines: {node: '>=0.4'}
+
   y18n@5.0.8:
     resolution: {integrity: sha512-0pfFzegeDWJHJIAmTLRP2DwHjdF5s7jo9tuztdQxAhINCdvS+3nGINqPd00AphqJR/0LhANUS6/+7SCb98YOfA==}
     engines: {node: '>=10'}
@@ -14864,6 +15253,10 @@ snapshots:
     dependencies:
       zod: 3.25.76
 
+  '@agentclientprotocol/sdk@0.25.1(zod@4.3.6)':
+    dependencies:
+      zod: 4.3.6
+
   '@ampproject/remapping@2.3.0':
     dependencies:
       '@jridgewell/gen-mapping': 0.3.13
@@ -15958,6 +16351,8 @@ snapshots:
       '@babel/helper-string-parser': 7.29.7
       '@babel/helper-validator-identifier': 7.29.7
 
+  '@balena/dockerignore@1.0.2': {}
+
   '@bcoe/v8-coverage@1.0.2': {}
 
   '@bufbuild/protobuf@1.10.1': {}
@@ -16120,10 +16515,21 @@ snapshots:
       human-id: 4.1.3
       prettier: 2.8.8
 
+  '@cloudflare/containers@0.3.7': {}
+
   '@cloudflare/kv-asset-handler@0.4.2': {}
 
   '@cloudflare/kv-asset-handler@0.5.0': {}
 
+  '@cloudflare/sandbox@0.12.1(@opencode-ai/sdk@1.17.7)':
+    dependencies:
+      '@cloudflare/containers': 0.3.7
+      aws4fetch: 1.0.20
+      capnweb: 0.8.0
+      hono: 4.12.23
+    optionalDependencies:
+      '@opencode-ai/sdk': 1.17.7
+
   '@cloudflare/unenv-preset@2.16.1(unenv@2.0.0-rc.24)(workerd@1.20260504.1)':
     dependencies:
       unenv: 2.0.0-rc.24
@@ -16269,9 +16675,6 @@ snapshots:
   '@esbuild/aix-ppc64@0.25.12':
     optional: true
 
-  '@esbuild/aix-ppc64@0.27.2':
-    optional: true
-
   '@esbuild/aix-ppc64@0.27.3':
     optional: true
 
@@ -16284,9 +16687,6 @@ snapshots:
   '@esbuild/android-arm64@0.25.12':
     optional: true
 
-  '@esbuild/android-arm64@0.27.2':
-    optional: true
-
   '@esbuild/android-arm64@0.27.3':
     optional: true
 
@@ -16299,9 +16699,6 @@ snapshots:
   '@esbuild/android-arm@0.25.12':
     optional: true
 
-  '@esbuild/android-arm@0.27.2':
-    optional: true
-
   '@esbuild/android-arm@0.27.3':
     optional: true
 
@@ -16314,9 +16711,6 @@ snapshots:
   '@esbuild/android-x64@0.25.12':
     optional: true
 
-  '@esbuild/android-x64@0.27.2':
-    optional: true
-
   '@esbuild/android-x64@0.27.3':
     optional: true
 
@@ -16329,9 +16723,6 @@ snapshots:
   '@esbuild/darwin-arm64@0.25.12':
     optional: true
 
-  '@esbuild/darwin-arm64@0.27.2':
-    optional: true
-
   '@esbuild/darwin-arm64@0.27.3':
     optional: true
 
@@ -16344,9 +16735,6 @@ snapshots:
   '@esbuild/darwin-x64@0.25.12':
     optional: true
 
-  '@esbuild/darwin-x64@0.27.2':
-    optional: true
-
   '@esbuild/darwin-x64@0.27.3':
     optional: true
 
@@ -16359,9 +16747,6 @@ snapshots:
   '@esbuild/freebsd-arm64@0.25.12':
     optional: true
 
-  '@esbuild/freebsd-arm64@0.27.2':
-    optional: true
-
   '@esbuild/freebsd-arm64@0.27.3':
     optional: true
 
@@ -16374,9 +16759,6 @@ snapshots:
   '@esbuild/freebsd-x64@0.25.12':
     optional: true
 
-  '@esbuild/freebsd-x64@0.27.2':
-    optional: true
-
   '@esbuild/freebsd-x64@0.27.3':
     optional: true
 
@@ -16389,9 +16771,6 @@ snapshots:
   '@esbuild/linux-arm64@0.25.12':
     optional: true
 
-  '@esbuild/linux-arm64@0.27.2':
-    optional: true
-
   '@esbuild/linux-arm64@0.27.3':
     optional: true
 
@@ -16404,9 +16783,6 @@ snapshots:
   '@esbuild/linux-arm@0.25.12':
     optional: true
 
-  '@esbuild/linux-arm@0.27.2':
-    optional: true
-
   '@esbuild/linux-arm@0.27.3':
     optional: true
 
@@ -16419,9 +16795,6 @@ snapshots:
   '@esbuild/linux-ia32@0.25.12':
     optional: true
 
-  '@esbuild/linux-ia32@0.27.2':
-    optional: true
-
   '@esbuild/linux-ia32@0.27.3':
     optional: true
 
@@ -16434,9 +16807,6 @@ snapshots:
   '@esbuild/linux-loong64@0.25.12':
     optional: true
 
-  '@esbuild/linux-loong64@0.27.2':
-    optional: true
-
   '@esbuild/linux-loong64@0.27.3':
     optional: true
 
@@ -16449,9 +16819,6 @@ snapshots:
   '@esbuild/linux-mips64el@0.25.12':
     optional: true
 
-  '@esbuild/linux-mips64el@0.27.2':
-    optional: true
-
   '@esbuild/linux-mips64el@0.27.3':
     optional: true
 
@@ -16464,9 +16831,6 @@ snapshots:
   '@esbuild/linux-ppc64@0.25.12':
     optional: true
 
-  '@esbuild/linux-ppc64@0.27.2':
-    optional: true
-
   '@esbuild/linux-ppc64@0.27.3':
     optional: true
 
@@ -16479,9 +16843,6 @@ snapshots:
   '@esbuild/linux-riscv64@0.25.12':
     optional: true
 
-  '@esbuild/linux-riscv64@0.27.2':
-    optional: true
-
   '@esbuild/linux-riscv64@0.27.3':
     optional: true
 
@@ -16494,9 +16855,6 @@ snapshots:
   '@esbuild/linux-s390x@0.25.12':
     optional: true
 
-  '@esbuild/linux-s390x@0.27.2':
-    optional: true
-
   '@esbuild/linux-s390x@0.27.3':
     optional: true
 
@@ -16509,9 +16867,6 @@ snapshots:
   '@esbuild/linux-x64@0.25.12':
     optional: true
 
-  '@esbuild/linux-x64@0.27.2':
-    optional: true
-
   '@esbuild/linux-x64@0.27.3':
     optional: true
 
@@ -16521,9 +16876,6 @@ snapshots:
   '@esbuild/netbsd-arm64@0.25.12':
     optional: true
 
-  '@esbuild/netbsd-arm64@0.27.2':
-    optional: true
-
   '@esbuild/netbsd-arm64@0.27.3':
     optional: true
 
@@ -16536,9 +16888,6 @@ snapshots:
   '@esbuild/netbsd-x64@0.25.12':
     optional: true
 
-  '@esbuild/netbsd-x64@0.27.2':
-    optional: true
-
   '@esbuild/netbsd-x64@0.27.3':
     optional: true
 
@@ -16548,9 +16897,6 @@ snapshots:
   '@esbuild/openbsd-arm64@0.25.12':
     optional: true
 
-  '@esbuild/openbsd-arm64@0.27.2':
-    optional: true
-
   '@esbuild/openbsd-arm64@0.27.3':
     optional: true
 
@@ -16563,9 +16909,6 @@ snapshots:
   '@esbuild/openbsd-x64@0.25.12':
     optional: true
 
-  '@esbuild/openbsd-x64@0.27.2':
-    optional: true
-
   '@esbuild/openbsd-x64@0.27.3':
     optional: true
 
@@ -16575,9 +16918,6 @@ snapshots:
   '@esbuild/openharmony-arm64@0.25.12':
     optional: true
 
-  '@esbuild/openharmony-arm64@0.27.2':
-    optional: true
-
   '@esbuild/openharmony-arm64@0.27.3':
     optional: true
 
@@ -16590,9 +16930,6 @@ snapshots:
   '@esbuild/sunos-x64@0.25.12':
     optional: true
 
-  '@esbuild/sunos-x64@0.27.2':
-    optional: true
-
   '@esbuild/sunos-x64@0.27.3':
     optional: true
 
@@ -16605,9 +16942,6 @@ snapshots:
   '@esbuild/win32-arm64@0.25.12':
     optional: true
 
-  '@esbuild/win32-arm64@0.27.2':
-    optional: true
-
   '@esbuild/win32-arm64@0.27.3':
     optional: true
 
@@ -16620,9 +16954,6 @@ snapshots:
   '@esbuild/win32-ia32@0.25.12':
     optional: true
 
-  '@esbuild/win32-ia32@0.27.2':
-    optional: true
-
   '@esbuild/win32-ia32@0.27.3':
     optional: true
 
@@ -16635,9 +16966,6 @@ snapshots:
   '@esbuild/win32-x64@0.25.12':
     optional: true
 
-  '@esbuild/win32-x64@0.27.2':
-    optional: true
-
   '@esbuild/win32-x64@0.27.3':
     optional: true
 
@@ -17125,6 +17453,25 @@ snapshots:
       - supports-color
       - utf-8-validate
 
+  '@grpc/grpc-js@1.14.4':
+    dependencies:
+      '@grpc/proto-loader': 0.8.1
+      '@js-sdsl/ordered-map': 4.4.2
+
+  '@grpc/proto-loader@0.7.15':
+    dependencies:
+      lodash.camelcase: 4.3.0
+      long: 5.3.2
+      protobufjs: 7.5.4
+      yargs: 17.7.2
+
+  '@grpc/proto-loader@0.8.1':
+    dependencies:
+      lodash.camelcase: 4.3.0
+      long: 5.3.2
+      protobufjs: 7.6.4
+      yargs: 17.7.2
+
   '@harperfast/extended-iterable@1.0.3':
     optional: true
 
@@ -17381,6 +17728,8 @@ snapshots:
       '@jridgewell/resolve-uri': 3.1.2
       '@jridgewell/sourcemap-codec': 1.5.5
 
+  '@js-sdsl/ordered-map@4.4.2': {}
+
   '@jsdevtools/ono@7.1.3': {}
 
   '@livekit/mutex@1.1.1': {}
@@ -17702,6 +18051,10 @@ snapshots:
 
   '@oozcitak/util@8.3.8': {}
 
+  '@opencode-ai/sdk@1.17.7':
+    dependencies:
+      cross-spawn: 7.0.6
+
   '@openrouter/sdk@0.12.35':
     dependencies:
       zod: 4.3.6
@@ -17997,13 +18350,21 @@ snapshots:
 
   '@protobufjs/codegen@2.0.4': {}
 
+  '@protobufjs/codegen@2.0.5': {}
+
   '@protobufjs/eventemitter@1.1.0': {}
 
+  '@protobufjs/eventemitter@1.1.1': {}
+
   '@protobufjs/fetch@1.1.0':
     dependencies:
       '@protobufjs/aspromise': 1.1.2
       '@protobufjs/inquire': 1.1.0
 
+  '@protobufjs/fetch@1.1.1':
+    dependencies:
+      '@protobufjs/aspromise': 1.1.2
+
   '@protobufjs/float@1.0.2': {}
 
   '@protobufjs/inquire@1.1.0': {}
@@ -18014,6 +18375,8 @@ snapshots:
 
   '@protobufjs/utf8@1.1.0': {}
 
+  '@protobufjs/utf8@1.1.1': {}
+
   '@publint/pack@0.1.2': {}
 
   '@puppeteer/browsers@2.13.0':
@@ -19799,9 +20162,9 @@ snapshots:
 
   '@tanstack/history@1.154.14': {}
 
-  '@tanstack/nitro-v2-vite-plugin@1.154.7(rolldown@1.0.0-rc.17)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))':
+  '@tanstack/nitro-v2-vite-plugin@1.154.7(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))':
     dependencies:
-      nitropack: 2.13.1(rolldown@1.0.0-rc.17)
+      nitropack: 2.13.1(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)
       pathe: 2.0.3
       vite: 7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
     transitivePeerDependencies:
@@ -19936,9 +20299,9 @@ snapshots:
       tiny-invariant: 1.3.3
       tiny-warning: 1.0.3
 
-  '@tanstack/react-start-plugin@1.131.50(@tanstack/react-router@1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3))(@vitejs/plugin-react@4.7.0(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(rolldown@1.0.0-rc.17)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))':
+  '@tanstack/react-start-plugin@1.131.50(@tanstack/react-router@1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3))(@vitejs/plugin-react@4.7.0(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))':
     dependencies:
-      '@tanstack/start-plugin-core': 1.131.50(@tanstack/react-router@1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3))(rolldown@1.0.0-rc.17)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+      '@tanstack/start-plugin-core': 1.131.50(@tanstack/react-router@1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3))(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       '@vitejs/plugin-react': 4.7.0(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       pathe: 2.0.3
       vite: 7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
@@ -19978,11 +20341,11 @@ snapshots:
       - webpack
       - xml2js
 
-  '@tanstack/react-start-router-manifest@1.120.19(@types/node@24.10.3)(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)':
+  '@tanstack/react-start-router-manifest@1.120.19(@types/node@24.10.3)(aws4fetch@1.0.20)(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)':
     dependencies:
       '@tanstack/router-core': 1.157.16
       tiny-invariant: 1.3.3
-      vinxi: 0.5.3(@types/node@24.10.3)(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
+      vinxi: 0.5.3(@types/node@24.10.3)(aws4fetch@1.0.20)(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
     transitivePeerDependencies:
       - '@azure/app-configuration'
       - '@azure/cosmos'
@@ -20453,11 +20816,11 @@ snapshots:
       '@tanstack/store': 0.8.0
       solid-js: 1.9.10
 
-  '@tanstack/start-api-routes@1.120.19(@types/node@24.10.3)(crossws@0.4.5(srvx@0.11.15))(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)':
+  '@tanstack/start-api-routes@1.120.19(@types/node@24.10.3)(aws4fetch@1.0.20)(crossws@0.4.5(srvx@0.11.15))(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)':
     dependencies:
       '@tanstack/router-core': 1.157.16
       '@tanstack/start-server-core': 1.141.1(crossws@0.4.5(srvx@0.11.15))
-      vinxi: 0.5.3(@types/node@24.10.3)(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
+      vinxi: 0.5.3(@types/node@24.10.3)(aws4fetch@1.0.20)(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
     transitivePeerDependencies:
       - '@azure/app-configuration'
       - '@azure/cosmos'
@@ -20529,21 +20892,21 @@ snapshots:
       tiny-invariant: 1.3.3
       tiny-warning: 1.0.3
 
-  '@tanstack/start-config@1.120.20(@types/node@24.10.3)(crossws@0.4.5(srvx@0.11.15))(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(react-dom@19.2.3(react@19.2.3))(react@19.2.3)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))(yaml@2.8.2)':
+  '@tanstack/start-config@1.120.20(@types/node@24.10.3)(aws4fetch@1.0.20)(crossws@0.4.5(srvx@0.11.15))(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(react-dom@19.2.3(react@19.2.3))(react@19.2.3)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))(yaml@2.8.2)':
     dependencies:
       '@tanstack/react-router': 1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3)
-      '@tanstack/react-start-plugin': 1.131.50(@tanstack/react-router@1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3))(@vitejs/plugin-react@4.7.0(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(rolldown@1.0.0-rc.17)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
+      '@tanstack/react-start-plugin': 1.131.50(@tanstack/react-router@1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3))(@vitejs/plugin-react@4.7.0(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       '@tanstack/router-generator': 1.141.1
       '@tanstack/router-plugin': 1.159.5(@tanstack/react-router@1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3))(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       '@tanstack/server-functions-plugin': 1.141.0(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       '@tanstack/start-server-functions-handler': 1.120.19(crossws@0.4.5(srvx@0.11.15))
       '@vitejs/plugin-react': 4.7.0(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       import-meta-resolve: 4.2.0
-      nitropack: 2.12.9(rolldown@1.0.0-rc.17)
+      nitropack: 2.12.9(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)
       ofetch: 1.5.1
       react: 19.2.3
       react-dom: 19.2.3(react@19.2.3)
-      vinxi: 0.5.3(@types/node@24.10.3)(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
+      vinxi: 0.5.3(@types/node@24.10.3)(aws4fetch@1.0.20)(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
       vite: 7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
       zod: 3.25.76
     transitivePeerDependencies:
@@ -20597,7 +20960,7 @@ snapshots:
 
   '@tanstack/start-fn-stubs@1.154.7': {}
 
-  '@tanstack/start-plugin-core@1.131.50(@tanstack/react-router@1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3))(rolldown@1.0.0-rc.17)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))':
+  '@tanstack/start-plugin-core@1.131.50(@tanstack/react-router@1.159.5(react-dom@19.2.3(react@19.2.3))(react@19.2.3))(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))':
     dependencies:
       '@babel/code-frame': 7.26.2
       '@babel/core': 7.29.0
@@ -20613,7 +20976,7 @@ snapshots:
       babel-dead-code-elimination: 1.0.10
       cheerio: 1.1.2
       h3: 1.13.0
-      nitropack: 2.12.9(rolldown@1.0.0-rc.17)
+      nitropack: 2.12.9(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)
       pathe: 2.0.3
       ufo: 1.6.1
       vite: 7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
@@ -20849,13 +21212,13 @@ snapshots:
     dependencies:
       '@tanstack/router-core': 1.159.4
 
-  '@tanstack/start@1.120.20(@types/node@24.10.3)(crossws@0.4.5(srvx@0.11.15))(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(react-dom@19.2.3(react@19.2.3))(react@19.2.3)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))(yaml@2.8.2)':
+  '@tanstack/start@1.120.20(@types/node@24.10.3)(aws4fetch@1.0.20)(crossws@0.4.5(srvx@0.11.15))(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(react-dom@19.2.3(react@19.2.3))(react@19.2.3)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))(yaml@2.8.2)':
     dependencies:
       '@tanstack/react-start-client': 1.141.1(react-dom@19.2.3(react@19.2.3))(react@19.2.3)
-      '@tanstack/react-start-router-manifest': 1.120.19(@types/node@24.10.3)(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
+      '@tanstack/react-start-router-manifest': 1.120.19(@types/node@24.10.3)(aws4fetch@1.0.20)(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
       '@tanstack/react-start-server': 1.141.1(crossws@0.4.5(srvx@0.11.15))(react-dom@19.2.3(react@19.2.3))(react@19.2.3)
-      '@tanstack/start-api-routes': 1.120.19(@types/node@24.10.3)(crossws@0.4.5(srvx@0.11.15))(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
-      '@tanstack/start-config': 1.120.20(@types/node@24.10.3)(crossws@0.4.5(srvx@0.11.15))(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(react-dom@19.2.3(react@19.2.3))(react@19.2.3)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))(yaml@2.8.2)
+      '@tanstack/start-api-routes': 1.120.19(@types/node@24.10.3)(aws4fetch@1.0.20)(crossws@0.4.5(srvx@0.11.15))(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
+      '@tanstack/start-config': 1.120.20(@types/node@24.10.3)(aws4fetch@1.0.20)(crossws@0.4.5(srvx@0.11.15))(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(react-dom@19.2.3(react@19.2.3))(react@19.2.3)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(vite-plugin-solid@2.11.10(solid-js@1.9.10)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)))(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))(yaml@2.8.2)
       '@tanstack/start-server-functions-client': 1.131.50(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
       '@tanstack/start-server-functions-handler': 1.120.19(crossws@0.4.5(srvx@0.11.15))
       '@tanstack/start-server-functions-server': 1.131.2(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2))
@@ -21069,6 +21432,17 @@ snapshots:
 
   '@types/deep-eql@4.0.2': {}
 
+  '@types/docker-modem@3.0.6':
+    dependencies:
+      '@types/node': 24.10.3
+      '@types/ssh2': 1.15.5
+
+  '@types/dockerode@3.3.47':
+    dependencies:
+      '@types/docker-modem': 3.0.6
+      '@types/node': 24.10.3
+      '@types/ssh2': 1.15.5
+
   '@types/dom-mediacapture-record@1.0.22': {}
 
   '@types/estree-jsx@1.0.5':
@@ -21114,6 +21488,10 @@ snapshots:
 
   '@types/node@12.20.55': {}
 
+  '@types/node@18.19.130':
+    dependencies:
+      undici-types: 5.26.5
+
   '@types/node@20.19.26':
     dependencies:
       undici-types: 6.21.0
@@ -21122,6 +21500,12 @@ snapshots:
     dependencies:
       undici-types: 7.16.0
 
+  '@types/pg@8.20.0':
+    dependencies:
+      '@types/node': 24.10.3
+      pg-protocol: 1.14.0
+      pg-types: 2.2.0
+
   '@types/react-dom@19.2.3(@types/react@19.2.7)':
     dependencies:
       '@types/react': 19.2.7
@@ -21134,6 +21518,10 @@ snapshots:
 
   '@types/retry@0.12.0': {}
 
+  '@types/ssh2@1.15.5':
+    dependencies:
+      '@types/node': 18.19.130
+
   '@types/unist@2.0.11': {}
 
   '@types/unist@3.0.3': {}
@@ -21938,6 +22326,10 @@ snapshots:
 
   asap@2.0.6: {}
 
+  asn1@0.2.6:
+    dependencies:
+      safer-buffer: 2.1.2
+
   assertion-error@2.0.1: {}
 
   ast-kit@2.2.0:
@@ -21979,6 +22371,8 @@ snapshots:
     dependencies:
       possible-typed-array-names: 1.1.0
 
+  aws4fetch@1.0.20: {}
+
   axios@1.13.2:
     dependencies:
       follow-redirects: 1.15.11
@@ -22183,6 +22577,10 @@ snapshots:
 
   basic-ftp@5.2.0: {}
 
+  bcrypt-pbkdf@1.0.2:
+    dependencies:
+      tweetnacl: 0.14.5
+
   beasties@0.4.1:
     dependencies:
       css-select: 6.0.0
@@ -22314,6 +22712,9 @@ snapshots:
       base64-js: 1.5.1
       ieee754: 1.2.1
 
+  buildcheck@0.0.7:
+    optional: true
+
   bundle-require@5.1.0(esbuild@0.27.3):
     dependencies:
       esbuild: 0.27.3
@@ -22384,6 +22785,8 @@ snapshots:
 
   capnweb@0.1.0: {}
 
+  capnweb@0.8.0: {}
+
   ccount@2.0.1: {}
 
   chai@6.2.1: {}
@@ -22456,6 +22859,8 @@ snapshots:
     dependencies:
       readdirp: 5.0.0
 
+  chownr@1.1.4: {}
+
   chownr@3.0.0: {}
 
   chrome-launcher@0.15.2:
@@ -22701,6 +23106,12 @@ snapshots:
     optionalDependencies:
       typescript: 5.9.3
 
+  cpu-features@0.0.10:
+    dependencies:
+      buildcheck: 0.0.7
+      nan: 2.27.0
+    optional: true
+
   crc-32@1.2.2: {}
 
   crc32-stream@6.0.0:
@@ -22938,6 +23349,27 @@ snapshots:
 
   dnssd-advertise@1.1.4: {}
 
+  docker-modem@5.0.7:
+    dependencies:
+      debug: 4.4.3
+      readable-stream: 3.6.2
+      split-ca: 1.0.1
+      ssh2: 1.17.0
+    transitivePeerDependencies:
+      - supports-color
+
+  dockerode@4.0.12:
+    dependencies:
+      '@balena/dockerignore': 1.0.2
+      '@grpc/grpc-js': 1.14.4
+      '@grpc/proto-loader': 0.7.15
+      docker-modem: 5.0.7
+      protobufjs: 7.5.4
+      tar-fs: 2.1.4
+      uuid: 10.0.0
+    transitivePeerDependencies:
+      - supports-color
+
   dom-accessibility-api@0.5.16: {}
 
   dom-helpers@5.2.1:
@@ -23171,35 +23603,6 @@ snapshots:
       '@esbuild/win32-ia32': 0.25.12
       '@esbuild/win32-x64': 0.25.12
 
-  esbuild@0.27.2:
-    optionalDependencies:
-      '@esbuild/aix-ppc64': 0.27.2
-      '@esbuild/android-arm': 0.27.2
-      '@esbuild/android-arm64': 0.27.2
-      '@esbuild/android-x64': 0.27.2
-      '@esbuild/darwin-arm64': 0.27.2
-      '@esbuild/darwin-x64': 0.27.2
-      '@esbuild/freebsd-arm64': 0.27.2
-      '@esbuild/freebsd-x64': 0.27.2
-      '@esbuild/linux-arm': 0.27.2
-      '@esbuild/linux-arm64': 0.27.2
-      '@esbuild/linux-ia32': 0.27.2
-      '@esbuild/linux-loong64': 0.27.2
-      '@esbuild/linux-mips64el': 0.27.2
-      '@esbuild/linux-ppc64': 0.27.2
-      '@esbuild/linux-riscv64': 0.27.2
-      '@esbuild/linux-s390x': 0.27.2
-      '@esbuild/linux-x64': 0.27.2
-      '@esbuild/netbsd-arm64': 0.27.2
-      '@esbuild/netbsd-x64': 0.27.2
-      '@esbuild/openbsd-arm64': 0.27.2
-      '@esbuild/openbsd-x64': 0.27.2
-      '@esbuild/openharmony-arm64': 0.27.2
-      '@esbuild/sunos-x64': 0.27.2
-      '@esbuild/win32-arm64': 0.27.2
-      '@esbuild/win32-ia32': 0.27.2
-      '@esbuild/win32-x64': 0.27.2
-
   esbuild@0.27.3:
     optionalDependencies:
       '@esbuild/aix-ppc64': 0.27.3
@@ -24414,8 +24817,6 @@ snapshots:
     transitivePeerDependencies:
       - supports-color
 
-  ip-address@10.1.0: {}
-
   ip-address@10.2.0: {}
 
   ipaddr.js@1.9.1: {}
@@ -25050,6 +25451,8 @@ snapshots:
     dependencies:
       p-locate: 5.0.0
 
+  lodash.camelcase@4.3.0: {}
+
   lodash.debounce@4.0.8: {}
 
   lodash.defaults@4.2.0: {}
@@ -25842,6 +26245,8 @@ snapshots:
 
   mitt@3.0.1: {}
 
+  mkdirp-classic@0.5.3: {}
+
   mkdirp@1.0.4: {}
 
   mkdirp@3.0.1: {}
@@ -25900,6 +26305,9 @@ snapshots:
       object-assign: 4.1.1
       thenify-all: 1.6.0
 
+  nan@2.27.0:
+    optional: true
+
   nanoid@3.3.11: {}
 
   nanoid@3.3.12: {}
@@ -25958,7 +26366,7 @@ snapshots:
       rollup: 4.60.1
       tailwindcss: 4.1.18
 
-  nitro@3.0.1-alpha.2(chokidar@5.0.0)(ioredis@5.9.2)(lru-cache@11.2.4)(rolldown@1.0.0-rc.17)(rollup@4.60.1)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)):
+  nitro@3.0.1-alpha.2(aws4fetch@1.0.20)(chokidar@5.0.0)(ioredis@5.9.2)(lru-cache@11.2.4)(rolldown@1.0.0-rc.17)(rollup@4.60.1)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)):
     dependencies:
       consola: 3.4.2
       crossws: 0.4.4(srvx@0.10.1)
@@ -25973,7 +26381,7 @@ snapshots:
       srvx: 0.10.1
       undici: 7.21.0
       unenv: 2.0.0-rc.24
-      unstorage: 2.0.0-alpha.5(chokidar@5.0.0)(db0@0.3.4)(ioredis@5.9.2)(lru-cache@11.2.4)(ofetch@2.0.0-alpha.3)
+      unstorage: 2.0.0-alpha.5(aws4fetch@1.0.20)(chokidar@5.0.0)(db0@0.3.4)(ioredis@5.9.2)(lru-cache@11.2.4)(ofetch@2.0.0-alpha.3)
     optionalDependencies:
       rolldown: 1.0.0-rc.17
       rollup: 4.60.1
@@ -26007,7 +26415,7 @@ snapshots:
       - sqlite3
       - uploadthing
 
-  nitro@3.0.260429-beta(chokidar@5.0.0)(dotenv@17.2.3)(giget@2.0.0)(jiti@2.6.1)(miniflare@4.20260609.0)(rollup@4.60.1)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)):
+  nitro@3.0.260429-beta(aws4fetch@1.0.20)(chokidar@5.0.0)(dotenv@17.2.3)(giget@2.0.0)(jiti@2.6.1)(miniflare@4.20260609.0)(rollup@4.60.1)(vite@7.3.3(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)):
     dependencies:
       consola: 3.4.2
       crossws: 0.4.5(srvx@0.11.15)
@@ -26022,7 +26430,7 @@ snapshots:
       rolldown: 1.0.0-rc.17
       srvx: 0.11.15
       unenv: 2.0.0-rc.24
-      unstorage: 2.0.0-alpha.7(chokidar@5.0.0)(db0@0.3.4)(ofetch@2.0.0-alpha.3)
+      unstorage: 2.0.0-alpha.7(aws4fetch@1.0.20)(chokidar@5.0.0)(db0@0.3.4)(ofetch@2.0.0-alpha.3)
     optionalDependencies:
       dotenv: 17.2.3
       giget: 2.0.0
@@ -26060,7 +26468,7 @@ snapshots:
       - sqlite3
       - uploadthing
 
-  nitropack@2.12.9(rolldown@1.0.0-rc.17):
+  nitropack@2.12.9(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17):
     dependencies:
       '@cloudflare/kv-asset-handler': 0.4.2
       '@rollup/plugin-alias': 5.1.1(rollup@4.60.1)
@@ -26127,7 +26535,7 @@ snapshots:
       unenv: 2.0.0-rc.24
       unimport: 5.5.0
       unplugin-utils: 0.3.1
-      unstorage: 1.17.4(db0@0.3.4)(ioredis@5.8.2)
+      unstorage: 1.17.4(aws4fetch@1.0.20)(db0@0.3.4)(ioredis@5.8.2)
       untyped: 2.0.0
       unwasm: 0.3.11
       youch: 4.1.0-beta.13
@@ -26162,7 +26570,7 @@ snapshots:
       - supports-color
       - uploadthing
 
-  nitropack@2.13.1(rolldown@1.0.0-rc.17):
+  nitropack@2.13.1(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17):
     dependencies:
       '@cloudflare/kv-asset-handler': 0.4.2
       '@rollup/plugin-alias': 6.0.0(rollup@4.57.1)
@@ -26229,7 +26637,7 @@ snapshots:
       unenv: 2.0.0-rc.24
       unimport: 5.6.0
       unplugin-utils: 0.3.1
-      unstorage: 1.17.4(db0@0.3.4)(ioredis@5.9.2)
+      unstorage: 1.17.4(aws4fetch@1.0.20)(db0@0.3.4)(ioredis@5.9.2)
       untyped: 2.0.0
       unwasm: 0.5.3
       youch: 4.1.0-beta.13
@@ -26753,6 +27161,41 @@ snapshots:
 
   perfect-debounce@2.0.0: {}
 
+  pg-cloudflare@1.4.0:
+    optional: true
+
+  pg-connection-string@2.13.0: {}
+
+  pg-int8@1.0.1: {}
+
+  pg-pool@3.14.0(pg@8.21.0):
+    dependencies:
+      pg: 8.21.0
+
+  pg-protocol@1.14.0: {}
+
+  pg-types@2.2.0:
+    dependencies:
+      pg-int8: 1.0.1
+      postgres-array: 2.0.0
+      postgres-bytea: 1.0.1
+      postgres-date: 1.0.7
+      postgres-interval: 1.2.0
+
+  pg@8.21.0:
+    dependencies:
+      pg-connection-string: 2.13.0
+      pg-pool: 3.14.0(pg@8.21.0)
+      pg-protocol: 1.14.0
+      pg-types: 2.2.0
+      pgpass: 1.0.5
+    optionalDependencies:
+      pg-cloudflare: 1.4.0
+
+  pgpass@1.0.5:
+    dependencies:
+      split2: 4.2.0
+
   picocolors@1.1.1: {}
 
   picomatch@2.3.1: {}
@@ -26848,6 +27291,16 @@ snapshots:
       picocolors: 1.1.1
       source-map-js: 1.2.1
 
+  postgres-array@2.0.0: {}
+
+  postgres-bytea@1.0.1: {}
+
+  postgres-date@1.0.7: {}
+
+  postgres-interval@1.2.0:
+    dependencies:
+      xtend: 4.0.2
+
   preact@10.28.1: {}
 
   preact@10.28.2: {}
@@ -26929,6 +27382,20 @@ snapshots:
       '@types/node': 24.10.3
       long: 5.3.2
 
+  protobufjs@7.6.4:
+    dependencies:
+      '@protobufjs/aspromise': 1.1.2
+      '@protobufjs/base64': 1.1.2
+      '@protobufjs/codegen': 2.0.5
+      '@protobufjs/eventemitter': 1.1.1
+      '@protobufjs/fetch': 1.1.1
+      '@protobufjs/float': 1.0.2
+      '@protobufjs/path': 1.1.2
+      '@protobufjs/pool': 1.1.0
+      '@protobufjs/utf8': 1.1.1
+      '@types/node': 24.10.3
+      long: 5.3.2
+
   proxy-addr@2.0.7:
     dependencies:
       forwarded: 0.2.0
@@ -27998,7 +28465,7 @@ snapshots:
 
   socks@2.8.7:
     dependencies:
-      ip-address: 10.1.0
+      ip-address: 10.2.0
       smart-buffer: 4.2.0
 
   solid-js@1.9.10:
@@ -28053,6 +28520,10 @@ snapshots:
       cross-spawn: 7.0.6
       signal-exit: 4.1.0
 
+  split-ca@1.0.1: {}
+
+  split2@4.2.0: {}
+
   sprintf-js@1.0.3: {}
 
   srvx@0.10.1: {}
@@ -28063,6 +28534,14 @@ snapshots:
 
   srvx@0.8.16: {}
 
+  ssh2@1.17.0:
+    dependencies:
+      asn1: 0.2.6
+      bcrypt-pbkdf: 1.0.2
+    optionalDependencies:
+      cpu-features: 0.0.10
+      nan: 2.27.0
+
   stable-hash-x@0.2.0: {}
 
   stackback@0.0.2: {}
@@ -28264,6 +28743,13 @@ snapshots:
 
   tapable@2.3.0: {}
 
+  tar-fs@2.1.4:
+    dependencies:
+      chownr: 1.1.4
+      mkdirp-classic: 0.5.3
+      pump: 3.0.4
+      tar-stream: 2.2.0
+
   tar-fs@3.1.2:
     dependencies:
       pump: 3.0.4
@@ -28504,13 +28990,15 @@ snapshots:
 
   tsx@4.21.0:
     dependencies:
-      esbuild: 0.27.2
+      esbuild: 0.27.7
       get-tsconfig: 4.13.0
     optionalDependencies:
       fsevents: 2.3.3
 
   tw-animate-css@1.4.0: {}
 
+  tweetnacl@0.14.5: {}
+
   type-check@0.4.0:
     dependencies:
       prelude-ls: 1.2.1
@@ -28599,6 +29087,8 @@ snapshots:
       magic-string: 0.30.21
       unplugin: 2.3.11
 
+  undici-types@5.26.5: {}
+
   undici-types@5.28.4: {}
 
   undici-types@6.21.0: {}
@@ -28769,7 +29259,7 @@ snapshots:
     dependencies:
       rolldown: 1.0.0-beta.53
 
-  unstorage@1.17.4(db0@0.3.4)(ioredis@5.8.2):
+  unstorage@1.17.4(aws4fetch@1.0.20)(db0@0.3.4)(ioredis@5.8.2):
     dependencies:
       anymatch: 3.1.3
       chokidar: 5.0.0
@@ -28780,10 +29270,11 @@ snapshots:
       ofetch: 1.5.1
       ufo: 1.6.3
     optionalDependencies:
+      aws4fetch: 1.0.20
       db0: 0.3.4
       ioredis: 5.8.2
 
-  unstorage@1.17.4(db0@0.3.4)(ioredis@5.9.2):
+  unstorage@1.17.4(aws4fetch@1.0.20)(db0@0.3.4)(ioredis@5.9.2):
     dependencies:
       anymatch: 3.1.3
       chokidar: 5.0.0
@@ -28794,19 +29285,22 @@ snapshots:
       ofetch: 1.5.1
       ufo: 1.6.3
     optionalDependencies:
+      aws4fetch: 1.0.20
       db0: 0.3.4
       ioredis: 5.9.2
 
-  unstorage@2.0.0-alpha.5(chokidar@5.0.0)(db0@0.3.4)(ioredis@5.9.2)(lru-cache@11.2.4)(ofetch@2.0.0-alpha.3):
+  unstorage@2.0.0-alpha.5(aws4fetch@1.0.20)(chokidar@5.0.0)(db0@0.3.4)(ioredis@5.9.2)(lru-cache@11.2.4)(ofetch@2.0.0-alpha.3):
     optionalDependencies:
+      aws4fetch: 1.0.20
       chokidar: 5.0.0
       db0: 0.3.4
       ioredis: 5.9.2
       lru-cache: 11.2.4
       ofetch: 2.0.0-alpha.3
 
-  unstorage@2.0.0-alpha.7(chokidar@5.0.0)(db0@0.3.4)(ofetch@2.0.0-alpha.3):
+  unstorage@2.0.0-alpha.7(aws4fetch@1.0.20)(chokidar@5.0.0)(db0@0.3.4)(ofetch@2.0.0-alpha.3):
     optionalDependencies:
+      aws4fetch: 1.0.20
       chokidar: 5.0.0
       db0: 0.3.4
       ofetch: 2.0.0-alpha.3
@@ -28878,6 +29372,8 @@ snapshots:
 
   utils-merge@1.0.1: {}
 
+  uuid@10.0.0: {}
+
   uuid@7.0.3: {}
 
   validate-npm-package-name@5.0.1: {}
@@ -28916,7 +29412,7 @@ snapshots:
       d3-time: 3.1.0
       d3-timer: 3.0.1
 
-  vinxi@0.5.3(@types/node@24.10.3)(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2):
+  vinxi@0.5.3(@types/node@24.10.3)(aws4fetch@1.0.20)(db0@0.3.4)(ioredis@5.8.2)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(rolldown@1.0.0-rc.17)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2):
     dependencies:
       '@babel/core': 7.29.0
       '@babel/plugin-syntax-jsx': 7.27.1(@babel/core@7.29.0)
@@ -28938,7 +29434,7 @@ snapshots:
       hookable: 5.5.3
       http-proxy: 1.18.1
       micromatch: 4.0.8
-      nitropack: 2.12.9(rolldown@1.0.0-rc.17)
+      nitropack: 2.12.9(aws4fetch@1.0.20)(rolldown@1.0.0-rc.17)
       node-fetch-native: 1.6.7
       path-to-regexp: 6.3.0
       pathe: 1.1.2
@@ -28949,7 +29445,7 @@ snapshots:
       ufo: 1.6.1
       unctx: 2.4.1
       unenv: 1.10.0
-      unstorage: 1.17.4(db0@0.3.4)(ioredis@5.8.2)
+      unstorage: 1.17.4(aws4fetch@1.0.20)(db0@0.3.4)(ioredis@5.8.2)
       vite: 6.4.2(@types/node@24.10.3)(jiti@2.6.1)(less@4.6.6)(lightningcss@1.30.2)(sass@1.101.0)(terser@5.44.1)(tsx@4.21.0)(yaml@2.8.2)
       zod: 3.25.76
     transitivePeerDependencies:
@@ -29535,6 +30031,8 @@ snapshots:
 
   xmlchars@2.2.0: {}
 
+  xtend@4.0.2: {}
+
   y18n@5.0.8: {}
 
   yallist@3.1.1: {}
diff --git a/pnpm-workspace.yaml b/pnpm-workspace.yaml
index bf7160b83..a333d6a7b 100644
--- a/pnpm-workspace.yaml
+++ b/pnpm-workspace.yaml
@@ -40,3 +40,8 @@ allowBuilds:
   unrs-resolver: false
   workerd: false
   lmdb: true
+  # dockerode (@tanstack/ai-sandbox-docker) pulls these in only for SSH-based
+  # Docker connections. The provider talks to the local socket, and ssh2 falls
+  # back to pure JS without its native addon, so these builds are not required.
+  cpu-features: false
+  ssh2: false
diff --git a/testing/e2e/README.md b/testing/e2e/README.md
index ab0f13479..288fd1924 100644
--- a/testing/e2e/README.md
+++ b/testing/e2e/README.md
@@ -6,6 +6,8 @@ End-to-end tests for TanStack AI using Playwright and [aimock](https://github.co
 
 **Providers tested:** openai, anthropic, gemini, ollama, groq, grok, openrouter
 
+> **Claude Code (`@tanstack/ai-claude-code`) is excluded from the standard matrix.** It's a harness adapter that spawns the Claude Code runtime as a subprocess, so aimock's per-test `X-Test-Id` header isolation can't be injected into its requests. It's covered by unit tests in the package plus a gated live smoke test in `tests/claude-code.spec.ts` — run it with `CLAUDE_CODE_E2E=1` and an `ANTHROPIC_API_KEY` (or a local `claude login`).
+
 ## What's tested
 
 ### Provider-coverage tests
diff --git a/testing/e2e/package.json b/testing/e2e/package.json
index 68381f527..bcbe281b0 100644
--- a/testing/e2e/package.json
+++ b/testing/e2e/package.json
@@ -18,6 +18,7 @@
     "@tailwindcss/vite": "^4.1.18",
     "@tanstack/ai": "workspace:*",
     "@tanstack/ai-anthropic": "workspace:*",
+    "@tanstack/ai-claude-code": "workspace:*",
     "@tanstack/ai-client": "workspace:*",
     "@tanstack/ai-elevenlabs": "workspace:*",
     "@tanstack/ai-gemini": "workspace:*",
diff --git a/testing/e2e/tests/claude-code.spec.ts b/testing/e2e/tests/claude-code.spec.ts
new file mode 100644
index 000000000..0a842f1b3
--- /dev/null
+++ b/testing/e2e/tests/claude-code.spec.ts
@@ -0,0 +1,72 @@
+/**
+ * Gated live smoke test for the Claude Code harness adapter.
+ *
+ * The standard e2e matrix mocks providers with aimock via per-test
+ * `X-Test-Id` header isolation. Claude Code spawns its bundled runtime as a
+ * subprocess, so that isolation can't be injected — this adapter is excluded
+ * from the matrix and covered here instead, gated behind CLAUDE_CODE_E2E.
+ *
+ * Run with:
+ *   CLAUDE_CODE_E2E=1 ANTHROPIC_API_KEY=sk-... \
+ *     pnpm --filter @tanstack/ai-e2e test:e2e -- --grep "claude-code"
+ *
+ * (A local `claude login` works in place of ANTHROPIC_API_KEY.)
+ */
+import { expect, test } from '@playwright/test'
+import { chat } from '@tanstack/ai'
+import { claudeCodeText } from '@tanstack/ai-claude-code'
+import type { StreamChunk } from '@tanstack/ai'
+
+test.describe('claude-code harness (gated live smoke)', () => {
+  test.skip(
+    !process.env.CLAUDE_CODE_E2E, // unset or empty skips; any non-empty value (even "0") runs
+    'Set CLAUDE_CODE_E2E=1 (plus ANTHROPIC_API_KEY or a local Claude login) to run the Claude Code live smoke test',
+  )
+
+  test('streams a full harness turn with session id and stop finish', async () => {
+    test.setTimeout(180_000) // 3 minutes: this is a live run, not a mocked one
+
+    const chunks: Array<StreamChunk> = [] // every chunk the stream yields, in order
+    const stream = chat({
+      adapter: claudeCodeText('haiku', {
+        maxTurns: 2,
+        // Read-only smoke: the default permission policy denies anything
+        // that would prompt, and no tools are bridged.
+        disallowedTools: ['Bash', 'Write', 'Edit'],
+      }),
+      messages: [
+        {
+          role: 'user',
+          content: 'Reply with exactly the word: pong',
+        },
+      ],
+    })
+
+    for await (const chunk of stream) {
+      chunks.push(chunk) // drain the whole stream before asserting
+    }
+
+    const types = chunks.map((chunk) => chunk.type as string)
+    expect(types[0]).toBe('RUN_STARTED') // the very first chunk must open the run
+
+    const sessionEvent = chunks.find(
+      (chunk) =>
+        chunk.type === 'CUSTOM' &&
+        (chunk as { name?: string }).name === 'claude-code.session-id',
+    )
+    expect(sessionEvent).toBeDefined()
+    expect(
+      (sessionEvent as { value: { sessionId: string } }).value.sessionId,
+    ).toMatch(/.+/) // only checks that the id is non-empty
+
+    const finished = chunks.find((chunk) => chunk.type === 'RUN_FINISHED')
+    expect(finished).toBeDefined()
+    expect((finished as { finishReason?: string }).finishReason).toBe('stop')
+
+    const text = chunks // concatenate all streamed text deltas into one string
+      .filter((chunk) => chunk.type === 'TEXT_MESSAGE_CONTENT')
+      .map((chunk) => (chunk as { delta?: string }).delta ?? '')
+      .join('')
+    expect(text.toLowerCase()).toContain('pong') // case-insensitive substring match
+  })
+})