From 5708f4ecfd5a6ac7551b28871b962c940768ec85 Mon Sep 17 00:00:00 2001
From: Ian Pascoe <ian.g.pascoe@gmail.com>
Date: Fri, 5 Jun 2026 05:58:46 -0400
Subject: [PATCH 1/8] fix(core): normalize hosted cloud mcp urls

---
 packages/core/src/remote/options.ts         | 71 ++++++++++++++++
 packages/core/src/remote/selection.ts       | 21 ++++-
 packages/core/test/attach-cli.test.ts       | 35 ++++++++
 packages/core/test/doctor-cli.test.ts       |  1 +
 packages/core/test/native-remote.test.ts    |  2 +-
 packages/core/test/remote-selection.test.ts | 90 +++++++++++++++++++++
 6 files changed, 217 insertions(+), 3 deletions(-)
diff --git a/packages/core/src/remote/options.ts b/packages/core/src/remote/options.ts
index 6eb8f1b..f087ab2 100644
--- a/packages/core/src/remote/options.ts
+++ b/packages/core/src/remote/options.ts
@@ -151,6 +151,51 @@ export function resolveCapletsRemote(
   };
 }
 
+export function resolveHostedCloudRemote(
+  input: CapletsRemoteInput = {},
+  env: CapletsRemoteEnv = process.env,
+): ResolvedCapletsRemote {
+  const rawUrl =
+    nonEmpty(input.url, "url") ?? nonEmpty(env.CAPLETS_REMOTE_URL, "CAPLETS_REMOTE_URL");
+  if (rawUrl === undefined) {
+    throw new CapletsError("REQUEST_INVALID", "CAPLETS_REMOTE_URL or url is required.");
+  }
+
+  const cloud = parseHostedCloudRemoteUrl(rawUrl);
+  const workspace = cloud.workspace ?? nonEmpty(input.workspace, "workspace");
+  if (!workspace) {
+    throw new CapletsError(
+      "REQUEST_INVALID",
+      "Caplets Cloud remote URL requires a selected workspace.",
+    );
+  }
+
+  const token =
+    nonEmpty(input.token, "token") ?? nonEmpty(env.CAPLETS_REMOTE_TOKEN, "CAPLETS_REMOTE_TOKEN");
+  const auth: CapletsRemoteAuth = token
+    ? { type: "bearer", token }
+    : { type: "none", user: DEFAULT_REMOTE_USER };
+  const requestInit: RequestInit =
+    auth.type === "bearer" ? { headers: { Authorization: `Bearer ${auth.token}` } } : {};
+  const workspaceBaseUrl = appendBasePath(cloud.baseUrl, `ws/${encodeURIComponent(workspace)}`);
+
+  return {
+    baseUrl: cloud.baseUrl,
+    mcpUrl: appendBasePath(workspaceBaseUrl, "mcp"),
+    controlUrl: appendBasePath(cloud.baseUrl, "control"),
+    healthUrl: appendBasePath(cloud.baseUrl, "healthz"),
+    projectBindingWebSocketUrl: projectBindingWebSocketUrlForBase(cloud.baseUrl),
+    auth,
+    requestInit,
+    workspace,
+    ...(input.fetch ? { fetch: input.fetch } : {}),
+  };
+}
+
+export function hostedCloudWorkspaceFromRemoteUrl(value: string): string | undefined {
+  return parseHostedCloudRemoteUrl(value).workspace;
+}
+
 export function projectBindingWebSocketUrlForBase(baseUrl: URL): URL {
   const url = appendBasePath(baseUrl, "control/project-bindings/connect");
   if (url.protocol === "https:") url.protocol = "wss:";
@@ -169,6 +214,32 @@ export function isCapletsCloudUrl(value: string): boolean {
   return host === "cloud.caplets.dev" || host.endsWith(".preview.caplets.dev");
 }
 
+function parseHostedCloudRemoteUrl(value: string): { baseUrl: URL; workspace?: string } {
+  const url = parseServerBaseUrl(value);
+  if (!isCapletsCloudUrl(url.toString())) {
+    throw new CapletsError(
+      "REQUEST_INVALID",
+      "Caplets Cloud remote URL must point at Caplets Cloud.",
+    );
+  }
+
+  const baseUrl = new URL(url);
+  baseUrl.pathname = "/";
+  const pathname = url.pathname.replace(/\/+$/u, "");
+  if (pathname === "") return { baseUrl };
+  const match = pathname.match(/^\/ws\/([^/]+)(?:\/mcp)?$/u);
+  if (!match) {
+    throw new CapletsError(
+      "REQUEST_INVALID",
+      "Caplets Cloud remote URL must be the Cloud origin or /ws/<workspace>/mcp endpoint.",
+    );
+  }
+  return {
+    baseUrl,
+    workspace: decodeURIComponent(match[1] ?? ""),
+  };
+}
+
 function parseCapletsMode(value: string): "auto" | CapletsRemoteMode {
   if (value === "auto" || value === "local" || value === "remote" || value === "cloud") {
     return value;
diff --git a/packages/core/src/remote/selection.ts b/packages/core/src/remote/selection.ts
index 835ce1e..7533976 100644
--- a/packages/core/src/remote/selection.ts
+++ b/packages/core/src/remote/selection.ts
@@ -2,7 +2,13 @@ import { CloudAuthClient } from "../cloud-auth/client";
 import { CloudAuthStore, type CloudAuthCredentials } from "../cloud-auth/store";
 import { CapletsError } from "../errors";
 import { projectBindingError } from "../project-binding/errors";
-import { resolveCapletsRemote, resolveRemoteMode, type ResolvedCapletsRemote } from "./options";
+import {
+  hostedCloudWorkspaceFromRemoteUrl,
+  resolveCapletsRemote,
+  resolveHostedCloudRemote,
+  resolveRemoteMode,
+  type ResolvedCapletsRemote,
+} from "./options";
 
 export type RemoteSelectionInput = {
   mode?: string;
@@ -105,7 +111,18 @@ export async function resolveRemoteSelection(
   }
 
   const remoteUrl = input.remoteUrl ?? env.CAPLETS_REMOTE_URL ?? credentials.cloudUrl;
-  const remote = resolveCapletsRemote(
+  const workspaceFromRemoteUrl = hostedCloudWorkspaceFromRemoteUrl(remoteUrl);
+  if (
+    workspaceFromRemoteUrl &&
+    workspaceFromRemoteUrl !== credentials.workspaceSlug &&
+    workspaceFromRemoteUrl !== credentials.workspaceId
+  ) {
+    throw projectBindingError(
+      "workspace_switch_required",
+      `Requested workspace ${workspaceFromRemoteUrl} differs from saved Selected Workspace ${selectedWorkspace}.`,
+    );
+  }
+  const remote = resolveHostedCloudRemote(
     {
       url: remoteUrl,
       token: credentials.accessToken,
diff --git a/packages/core/test/attach-cli.test.ts b/packages/core/test/attach-cli.test.ts
index 291562f..757321a 100644
--- a/packages/core/test/attach-cli.test.ts
+++ b/packages/core/test/attach-cli.test.ts
@@ -111,6 +111,40 @@ describe("caplets attach CLI", () => {
     expect(requestedUrl).toBe("http://127.0.0.1:8787/caplets/control/project-bindings/connect");
   });
 
+  it("probes the Cloud control route when given a copied Cloud MCP endpoint", async () => {
+    const path = tempCloudAuthPath();
+    await new CloudAuthStore({ path }).save(
+      hostedCredentials({
+        cloudUrl: "https://cloud.pr-2.preview.caplets.dev",
+        workspaceSlug: "personal-c9b49d",
+      }),
+    );
+    let requestedUrl: string | undefined;
+
+    await expect(
+      attachProjectOnce(
+        {
+          projectRoot: "/repo",
+          remoteUrl: "https://cloud.pr-2.preview.caplets.dev/ws/personal-c9b49d/mcp",
+          fetch: async (url) => {
+            requestedUrl = String(url);
+            return Response.json({ error: "websocket_upgrade_required" }, { status: 426 });
+          },
+        },
+        {
+          CAPLETS_MODE: "cloud",
+          CAPLETS_CLOUD_AUTH_PATH: path,
+        },
+      ),
+    ).resolves.toMatchObject({
+      ok: true,
+      webSocketUrl: "wss://cloud.pr-2.preview.caplets.dev/control/project-bindings/connect",
+    });
+    expect(requestedUrl).toBe(
+      "https://cloud.pr-2.preview.caplets.dev/control/project-bindings/connect",
+    );
+  });
+
   it("runs once from the CLI and reports WebSocket availability", async () => {
     const out: string[] = [];
     const cwd = process.cwd();
@@ -178,6 +212,7 @@ describe("caplets attach CLI", () => {
       env: {
         CAPLETS_MODE: "cloud",
         CAPLETS_REMOTE_URL: "https://cloud.caplets.dev",
+        CAPLETS_CLOUD_AUTH_PATH: tempCloudAuthPath(),
       },
       writeOut: (value) => out.push(value),
       setExitCode: (code) => {
diff --git a/packages/core/test/doctor-cli.test.ts b/packages/core/test/doctor-cli.test.ts
index 9d9ee16..1569564 100644
--- a/packages/core/test/doctor-cli.test.ts
+++ b/packages/core/test/doctor-cli.test.ts
@@ -50,6 +50,7 @@ describe("caplets doctor", () => {
       env: {
         CAPLETS_SERVER_URL: "http://127.0.0.1:5387/caplets",
         CAPLETS_REMOTE_URL: "https://cloud.caplets.dev/ws/ian",
+        CAPLETS_CLOUD_AUTH_PATH: "/tmp/caplets-doctor-missing-auth.json",
       },
       writeOut: (value) => out.push(value),
     });
diff --git a/packages/core/test/native-remote.test.ts b/packages/core/test/native-remote.test.ts
index 8f3f610..be0f7b5 100644
--- a/packages/core/test/native-remote.test.ts
+++ b/packages/core/test/native-remote.test.ts
@@ -726,7 +726,7 @@ describe("createNativeCapletsService remote mode", () => {
     expect(service.listTools().map((tool) => tool.caplet)).toContain("remote");
     expect(factory).toHaveBeenCalledWith(
       expect.objectContaining({
-        url: new URL("https://cloud.caplets.dev/mcp"),
+        url: new URL("https://cloud.caplets.dev/ws/personal/mcp"),
         requestInit: { headers: { Authorization: "Bearer cloud-access" } },
       }),
     );
diff --git a/packages/core/test/remote-selection.test.ts b/packages/core/test/remote-selection.test.ts
index d54e0cb..389e5e4 100644
--- a/packages/core/test/remote-selection.test.ts
+++ b/packages/core/test/remote-selection.test.ts
@@ -57,6 +57,95 @@ describe("resolveRemoteSelection", () => {
     });
   });
 
+  it("derives Cloud MCP and Project Binding URLs from the selected workspace", async () => {
+    const path = tempCloudAuthPath();
+    await new CloudAuthStore({ path }).save(
+      hostedCredentials({
+        cloudUrl: "https://cloud.pr-2.preview.caplets.dev",
+        workspaceSlug: "personal-c9b49d",
+      }),
+    );
+
+    const resolved = await resolveRemoteSelection(
+      {},
+      {
+        CAPLETS_MODE: "cloud",
+        CAPLETS_REMOTE_URL: "https://cloud.pr-2.preview.caplets.dev",
+        CAPLETS_CLOUD_AUTH_PATH: path,
+      },
+    );
+
+    expect(resolved).toMatchObject({
+      kind: "hosted_cloud",
+      selectedWorkspace: "personal-c9b49d",
+      remote: {
+        baseUrl: new URL("https://cloud.pr-2.preview.caplets.dev/"),
+        mcpUrl: new URL("https://cloud.pr-2.preview.caplets.dev/ws/personal-c9b49d/mcp"),
+        controlUrl: new URL("https://cloud.pr-2.preview.caplets.dev/control"),
+        healthUrl: new URL("https://cloud.pr-2.preview.caplets.dev/healthz"),
+        projectBindingWebSocketUrl: new URL(
+          "wss://cloud.pr-2.preview.caplets.dev/control/project-bindings/connect",
+        ),
+      },
+    });
+  });
+
+  it("normalizes copied Cloud MCP endpoints for attach", async () => {
+    const path = tempCloudAuthPath();
+    await new CloudAuthStore({ path }).save(
+      hostedCredentials({
+        cloudUrl: "https://cloud.pr-2.preview.caplets.dev",
+        workspaceSlug: "personal-c9b49d",
+      }),
+    );
+
+    const resolved = await resolveRemoteSelection(
+      {
+        remoteUrl: "https://cloud.pr-2.preview.caplets.dev/ws/personal-c9b49d/mcp",
+      },
+      {
+        CAPLETS_MODE: "cloud",
+        CAPLETS_CLOUD_AUTH_PATH: path,
+      },
+    );
+
+    expect(resolved).toMatchObject({
+      kind: "hosted_cloud",
+      selectedWorkspace: "personal-c9b49d",
+      remote: {
+        baseUrl: new URL("https://cloud.pr-2.preview.caplets.dev/"),
+        mcpUrl: new URL("https://cloud.pr-2.preview.caplets.dev/ws/personal-c9b49d/mcp"),
+        projectBindingWebSocketUrl: new URL(
+          "wss://cloud.pr-2.preview.caplets.dev/control/project-bindings/connect",
+        ),
+      },
+    });
+  });
+
+  it("rejects copied Cloud MCP endpoints for a different selected workspace", async () => {
+    const path = tempCloudAuthPath();
+    await new CloudAuthStore({ path }).save(
+      hostedCredentials({
+        cloudUrl: "https://cloud.pr-2.preview.caplets.dev",
+        workspaceSlug: "personal-c9b49d",
+      }),
+    );
+
+    await expect(
+      resolveRemoteSelection(
+        {
+          remoteUrl: "https://cloud.pr-2.preview.caplets.dev/ws/team/mcp",
+        },
+        {
+          CAPLETS_MODE: "cloud",
+          CAPLETS_CLOUD_AUTH_PATH: path,
+        },
+      ),
+    ).rejects.toMatchObject({
+      projectBindingCode: "workspace_switch_required",
+    });
+  });
+
   it("refreshes expired Cloud credentials before returning the upstream", async () => {
     const path = tempCloudAuthPath();
     await new CloudAuthStore({ path }).save(
@@ -103,6 +192,7 @@ describe("resolveRemoteSelection", () => {
         {
           CAPLETS_MODE: "cloud",
           CAPLETS_REMOTE_URL: "https://cloud.caplets.dev",
+          CAPLETS_CLOUD_AUTH_PATH: tempCloudAuthPath(),
         },
       ),
     ).rejects.toMatchObject({

From ebf6749f29dd066265b218a67579f2c5c97b42e3 Mon Sep 17 00:00:00 2001
From: Ian Pascoe <ian.g.pascoe@gmail.com>
Date: Fri, 5 Jun 2026 06:06:01 -0400
Subject: [PATCH 2/8] fix(core): require hosted cloud mcp scope

---
 packages/core/src/cloud-auth/client.ts        |  5 ++--
 packages/core/src/cloud-auth/store.ts         |  3 +-
 packages/core/src/cloud-auth/types.ts         |  8 +++++-
 packages/core/src/remote/selection.ts         | 12 +++++++-
 packages/core/test/attach-cli.test.ts         |  1 +
 packages/core/test/cloud-auth-client.test.ts  |  9 ++++--
 .../core/test/cloud-auth-login-cli.test.ts    |  4 +--
 .../test/cloud-auth-refresh-attach.test.ts    |  2 +-
 packages/core/test/cloud-auth.test.ts         |  4 +--
 packages/core/test/fixtures/cloud-auth.ts     |  2 +-
 packages/core/test/remote-selection.test.ts   | 28 ++++++++++++++++++-
 11 files changed, 64 insertions(+), 14 deletions(-)

diff --git a/packages/core/src/cloud-auth/client.ts b/packages/core/src/cloud-auth/client.ts
index ae6c9c1..bea859c 100644
--- a/packages/core/src/cloud-auth/client.ts
+++ b/packages/core/src/cloud-auth/client.ts
@@ -6,6 +6,7 @@ import type {
   CloudAuthTokenResponse,
   CloudAuthWorkspace,
 } from "./types";
+import { HOSTED_CLOUD_AUTH_SCOPES } from "./types";
 
 export type CloudAuthClientOptions = {
   cloudUrl: string;
@@ -54,7 +55,7 @@ export class CloudAuthClient {
       body: JSON.stringify({
         ...(input.requestedWorkspace ? { requestedWorkspace: input.requestedWorkspace } : {}),
         ...(input.deviceName ? { deviceName: input.deviceName } : {}),
-        ...(input.scope ? { scope: input.scope } : {}),
+        scope: input.scope ?? [...HOSTED_CLOUD_AUTH_SCOPES],
       }),
     });
   }
@@ -150,7 +151,7 @@ function normalizeCredentials(
     ? response.scope.map(String)
     : typeof response.scope === "string"
       ? response.scope.split(/\s+/u).filter(Boolean)
-      : ["project_binding:read", "project_binding:write"];
+      : [...HOSTED_CLOUD_AUTH_SCOPES];
   const credentialFamilyId = response.credentialFamilyId ?? "cloud_client_credential_family";
   const tokenType = response.tokenType ?? "Bearer";
   const credentials: CloudAuthClientCredentials = {
diff --git a/packages/core/src/cloud-auth/store.ts b/packages/core/src/cloud-auth/store.ts
index 7e302de..ba7ae42 100644
--- a/packages/core/src/cloud-auth/store.ts
+++ b/packages/core/src/cloud-auth/store.ts
@@ -2,6 +2,7 @@ import { existsSync, mkdirSync, readFileSync, rmSync, writeFileSync } from "node
 import { homedir } from "node:os";
 import { dirname, posix, win32 } from "node:path";
 import { defaultConfigBaseDir } from "../config/paths";
+import { HOSTED_CLOUD_AUTH_SCOPES } from "./types";
 import type { RedactedCloudAuthStatus } from "./types";
 
 type CloudAuthPathEnv = Partial<
@@ -69,7 +70,7 @@ export function migrateCredentials(value: unknown): CloudAuthCredentials {
     accessToken: stringValue(record.accessToken) ?? "",
     refreshToken: stringValue(record.refreshToken) ?? "",
     expiresAt: stringValue(record.expiresAt) ?? now,
-    scope: arrayValue(record.scope) ?? ["project_binding:read", "project_binding:write"],
+    scope: arrayValue(record.scope) ?? [...HOSTED_CLOUD_AUTH_SCOPES],
     tokenType: stringValue(record.tokenType) ?? "Bearer",
     credentialFamilyId: stringValue(record.credentialFamilyId) ?? "legacy_family",
     deviceName: stringValue(record.deviceName) ?? "Caplets CLI",
diff --git a/packages/core/src/cloud-auth/types.ts b/packages/core/src/cloud-auth/types.ts
index d0f3139..a6fd8ae 100644
--- a/packages/core/src/cloud-auth/types.ts
+++ b/packages/core/src/cloud-auth/types.ts
@@ -11,7 +11,13 @@ export const CLOUD_AUTH_STATES = [
 
 export type CloudAuthState = (typeof CLOUD_AUTH_STATES)[number];
 
-export type CloudAuthScope = "project_binding:read" | "project_binding:write" | string;
+export const HOSTED_CLOUD_AUTH_SCOPES = [
+  "project_binding:read",
+  "project_binding:write",
+  "mcp:tools",
+] as const;
+
+export type CloudAuthScope = (typeof HOSTED_CLOUD_AUTH_SCOPES)[number] | string;
 
 export type CloudAuthWorkspace = {
   workspaceId: string;
diff --git a/packages/core/src/remote/selection.ts b/packages/core/src/remote/selection.ts
index 7533976..e1944ab 100644
--- a/packages/core/src/remote/selection.ts
+++ b/packages/core/src/remote/selection.ts
@@ -1,5 +1,6 @@
 import { CloudAuthClient } from "../cloud-auth/client";
 import { CloudAuthStore, type CloudAuthCredentials } from "../cloud-auth/store";
+import { HOSTED_CLOUD_AUTH_SCOPES } from "../cloud-auth/types";
 import { CapletsError } from "../errors";
 import { projectBindingError } from "../project-binding/errors";
 import {
@@ -122,6 +123,15 @@ export async function resolveRemoteSelection(
       `Requested workspace ${workspaceFromRemoteUrl} differs from saved Selected Workspace ${selectedWorkspace}.`,
     );
   }
+  const missingScope = HOSTED_CLOUD_AUTH_SCOPES.find(
+    (scope) => !credentials.scope?.includes(scope),
+  );
+  if (missingScope) {
+    throw projectBindingError(
+      "cloud_auth_required",
+      `Hosted Cloud attach requires Cloud Auth scope ${missingScope}. Run caplets cloud auth login again.`,
+    );
+  }
   const remote = resolveHostedCloudRemote(
     {
       url: remoteUrl,
@@ -138,7 +148,7 @@ export async function resolveRemoteSelection(
     selectedWorkspace,
     credentials,
     cloudPresence: {
-      url: new URL(remoteUrl),
+      url: remote.baseUrl,
       accessToken: credentials.accessToken,
       workspaceId: credentials.workspaceId,
     },
diff --git a/packages/core/test/attach-cli.test.ts b/packages/core/test/attach-cli.test.ts
index 757321a..8f8363e 100644
--- a/packages/core/test/attach-cli.test.ts
+++ b/packages/core/test/attach-cli.test.ts
@@ -128,6 +128,7 @@ describe("caplets attach CLI", () => {
           remoteUrl: "https://cloud.pr-2.preview.caplets.dev/ws/personal-c9b49d/mcp",
           fetch: async (url) => {
             requestedUrl = String(url);
+            expect(String(url)).not.toContain("/ws/personal-c9b49d/api/project-bindings");
             return Response.json({ error: "websocket_upgrade_required" }, { status: 426 });
           },
         },
diff --git a/packages/core/test/cloud-auth-client.test.ts b/packages/core/test/cloud-auth-client.test.ts
index 71461c6..1bfa667 100644
--- a/packages/core/test/cloud-auth-client.test.ts
+++ b/packages/core/test/cloud-auth-client.test.ts
@@ -32,6 +32,7 @@ describe("CloudAuthClient", () => {
     await expect(requests[0]?.json()).resolves.toMatchObject({
       requestedWorkspace: "team",
       deviceName: "MacBook",
+      scope: ["project_binding:read", "project_binding:write", "mcp:tools"],
     });
     expect(result).toMatchObject({
       loginId: "login_123",
@@ -52,7 +53,7 @@ describe("CloudAuthClient", () => {
           accessToken: "cap_access_secret",
           refreshToken: "cap_refresh_secret",
           expiresAt: "2026-06-03T13:00:00.000Z",
-          scope: ["project_binding:read", "project_binding:write"],
+          scope: ["project_binding:read", "project_binding:write", "mcp:tools"],
           tokenType: "Bearer",
           credentialFamilyId: "family_123",
           deviceName: "MacBook",
@@ -66,7 +67,11 @@ describe("CloudAuthClient", () => {
     });
 
     expect(credentials.workspaceId).toBe("workspace_team");
-    expect(credentials.scope).toEqual(["project_binding:read", "project_binding:write"]);
+    expect(credentials.scope).toEqual([
+      "project_binding:read",
+      "project_binding:write",
+      "mcp:tools",
+    ]);
     expect(JSON.stringify(credentials.redacted)).not.toContain("cap_access_secret");
     expect(JSON.stringify(credentials.redacted)).not.toContain("cap_refresh_secret");
   });
diff --git a/packages/core/test/cloud-auth-login-cli.test.ts b/packages/core/test/cloud-auth-login-cli.test.ts
index 7cb8668..ee8e9f7 100644
--- a/packages/core/test/cloud-auth-login-cli.test.ts
+++ b/packages/core/test/cloud-auth-login-cli.test.ts
@@ -29,7 +29,7 @@ describe("caplets cloud auth login", () => {
         accessToken: "cap_access_secret",
         refreshToken: "cap_refresh_secret",
         expiresAt: "2099-06-03T13:00:00.000Z",
-        scope: ["project_binding:read", "project_binding:write"],
+        scope: ["project_binding:read", "project_binding:write", "mcp:tools"],
         tokenType: "Bearer",
         credentialFamilyId: "family_123",
         deviceName: "Test Device",
@@ -99,7 +99,7 @@ describe("caplets cloud auth login", () => {
         accessToken: "cap_access_secret",
         refreshToken: "cap_refresh_secret",
         expiresAt: "2099-06-03T13:00:00.000Z",
-        scope: ["project_binding:read", "project_binding:write"],
+        scope: ["project_binding:read", "project_binding:write", "mcp:tools"],
         tokenType: "Bearer",
         credentialFamilyId: "family_123",
       }),
diff --git a/packages/core/test/cloud-auth-refresh-attach.test.ts b/packages/core/test/cloud-auth-refresh-attach.test.ts
index a32f411..7e24872 100644
--- a/packages/core/test/cloud-auth-refresh-attach.test.ts
+++ b/packages/core/test/cloud-auth-refresh-attach.test.ts
@@ -31,7 +31,7 @@ describe("hosted Cloud Auth refresh before attach", () => {
                 accessToken: "new_access",
                 refreshToken: "new_refresh",
                 expiresAt: "2999-01-01T00:00:00.000Z",
-                scope: ["project_binding:read", "project_binding:write"],
+                scope: ["project_binding:read", "project_binding:write", "mcp:tools"],
                 tokenType: "Bearer",
                 credentialFamilyId: "family_123",
               });
diff --git a/packages/core/test/cloud-auth.test.ts b/packages/core/test/cloud-auth.test.ts
index 5b29581..f8128dd 100644
--- a/packages/core/test/cloud-auth.test.ts
+++ b/packages/core/test/cloud-auth.test.ts
@@ -19,7 +19,7 @@ const credentials: CloudAuthCredentials = {
   accessToken: "access",
   refreshToken: "refresh",
   expiresAt: "2099-06-02T12:00:00.000Z",
-  scope: ["project_binding:read", "project_binding:write"],
+  scope: ["project_binding:read", "project_binding:write", "mcp:tools"],
   tokenType: "Bearer",
   credentialFamilyId: "family_123",
   deviceName: "Test Device",
@@ -75,7 +75,7 @@ describe("caplets cloud auth CLI", () => {
       workspaceId: "ws_123",
       workspaceSlug: "team",
       expiresAt: "2099-06-02T12:00:00.000Z",
-      scope: ["project_binding:read", "project_binding:write"],
+      scope: ["project_binding:read", "project_binding:write", "mcp:tools"],
       tokenType: "Bearer",
       credentialFamilyId: "family_123",
       deviceName: "Test Device",
diff --git a/packages/core/test/fixtures/cloud-auth.ts b/packages/core/test/fixtures/cloud-auth.ts
index 4543792..ee402dc 100644
--- a/packages/core/test/fixtures/cloud-auth.ts
+++ b/packages/core/test/fixtures/cloud-auth.ts
@@ -23,7 +23,7 @@ export function hostedCredentials(
     accessToken: "cap_access_secret",
     refreshToken: "cap_refresh_secret",
     expiresAt: fixedLater,
-    scope: ["project_binding:read", "project_binding:write"],
+    scope: ["project_binding:read", "project_binding:write", "mcp:tools"],
     tokenType: "Bearer",
     credentialFamilyId: "family_123",
     deviceName: "Test Device",
diff --git a/packages/core/test/remote-selection.test.ts b/packages/core/test/remote-selection.test.ts
index 389e5e4..2f69dfe 100644
--- a/packages/core/test/remote-selection.test.ts
+++ b/packages/core/test/remote-selection.test.ts
@@ -119,6 +119,32 @@ describe("resolveRemoteSelection", () => {
           "wss://cloud.pr-2.preview.caplets.dev/control/project-bindings/connect",
         ),
       },
+      cloudPresence: {
+        url: new URL("https://cloud.pr-2.preview.caplets.dev/"),
+      },
+    });
+  });
+
+  it("requires Cloud Auth credentials to include hosted MCP tool scope", async () => {
+    const path = tempCloudAuthPath();
+    await new CloudAuthStore({ path }).save(
+      hostedCredentials({
+        scope: ["project_binding:read", "project_binding:write"],
+      }),
+    );
+
+    await expect(
+      resolveRemoteSelection(
+        {},
+        {
+          CAPLETS_MODE: "cloud",
+          CAPLETS_REMOTE_URL: "https://cloud.caplets.dev",
+          CAPLETS_CLOUD_AUTH_PATH: path,
+        },
+      ),
+    ).rejects.toMatchObject({
+      projectBindingCode: "cloud_auth_required",
+      recoveryCommand: "caplets cloud auth login",
     });
   });
 
@@ -169,7 +195,7 @@ describe("resolveRemoteSelection", () => {
             accessToken: "new-access",
             refreshToken: "new-refresh",
             expiresAt: "2999-01-01T00:00:00.000Z",
-            scope: ["project_binding:read", "project_binding:write"],
+            scope: ["project_binding:read", "project_binding:write", "mcp:tools"],
             tokenType: "Bearer",
             credentialFamilyId: "family_123",
           });

From 66bfedcf14526e2fbe3d4f7cd705034325437737 Mon Sep 17 00:00:00 2001
From: Ian Pascoe <ian.g.pascoe@gmail.com>
Date: Fri, 5 Jun 2026 06:33:28 -0400
Subject: [PATCH 3/8] chore: changeset

---
 .changeset/small-paws-draw.md | 5 +++++
 1 file changed, 5 insertions(+)
 create mode 100644 .changeset/small-paws-draw.md

diff --git a/.changeset/small-paws-draw.md b/.changeset/small-paws-draw.md
new file mode 100644
index 0000000..506f791
--- /dev/null
+++ b/.changeset/small-paws-draw.md
@@ -0,0 +1,5 @@
+---
+"@caplets/core": patch
+---
+
+Fix cloud attach URL normalization

From 9fcee3fa699a4c74b47177ea585862b3ec43e446 Mon Sep 17 00:00:00 2001
From: Ian Pascoe <ian.g.pascoe@gmail.com>
Date: Mon, 8 Jun 2026 15:59:58 -0400
Subject: [PATCH 4/8] feat: code mode

---
 AGENTS.md                                     |   3 +-
 CHANGELOG.md                                  |   6 +
 README.md                                     |  40 +-
 apps/landing/src/pages/index.astro            |  10 +-
 docs/benchmarks/coding-agent.md               |  35 +-
 .../caplets-progressive-mcp-disclosure-prd.md | 105 ++-
 package.json                                  |   4 +-
 packages/benchmarks/lib/code-mode.ts          | 480 +++++++++++
 packages/benchmarks/lib/surface.ts            |   8 +-
 packages/benchmarks/run-deterministic.ts      |  21 +-
 packages/benchmarks/test/benchmark.test.ts    |  26 +
 .../test/code-mode-complex-workflow.test.ts   |  46 ++
 packages/cli/rolldown.config.ts               |   1 +
 packages/core/.caplets/.gitignore             |   2 +
 packages/core/package.json                    |  12 +-
 packages/core/rolldown.config.ts              |   3 +
 packages/core/src/capability-description.ts   |   6 +-
 packages/core/src/caplet-files-bundle.ts      |  22 +
 packages/core/src/caplet-sets.ts              |  15 +-
 packages/core/src/cli-tools.ts                |  16 +-
 packages/core/src/cli.ts                      | 204 +++--
 packages/core/src/cli/cloud-add.ts            |  64 ++
 packages/core/src/cli/code-mode.ts            | 118 +++
 packages/core/src/cli/commands.ts             |   5 +
 packages/core/src/cli/doctor.ts               | 143 ++++
 packages/core/src/cloud-auth/client.ts        |  26 +
 packages/core/src/cloud/runtime-adapter.ts    |   4 +-
 packages/core/src/code-mode/api.ts            | 617 ++++++++++++++
 packages/core/src/code-mode/declarations.ts   | 115 +++
 packages/core/src/code-mode/diagnostics.ts    | 186 +++++
 packages/core/src/code-mode/index.ts          |  30 +
 packages/core/src/code-mode/logs.ts           | 160 ++++
 packages/core/src/code-mode/runner.ts         | 248 ++++++
 packages/core/src/code-mode/runtime-api.d.ts  | 140 ++++
 .../src/code-mode/runtime-api.generated.ts    |   3 +
 packages/core/src/code-mode/sandbox.ts        | 369 +++++++++
 packages/core/src/code-mode/tool.ts           |  36 +
 packages/core/src/code-mode/types.ts          | 122 +++
 packages/core/src/config-runtime.ts           |  22 +-
 packages/core/src/config.ts                   |  48 +-
 packages/core/src/config/paths.ts             |  12 +
 packages/core/src/downstream.ts               | 139 +++-
 packages/core/src/engine.ts                   |  34 +
 .../core/src/generated-tool-input-schema.ts   |  84 +-
 packages/core/src/graphql.ts                  |  20 +-
 packages/core/src/http-actions.ts             |  16 +-
 packages/core/src/index.ts                    |  48 ++
 packages/core/src/native.ts                   |   2 +
 packages/core/src/native/remote.ts            |   3 +-
 packages/core/src/native/service.ts           |  96 ++-
 packages/core/src/native/tools.ts             |  16 +-
 .../src/observed-output-shapes/extract.ts     | 122 +++
 .../src/observed-output-shapes/file-store.ts  | 170 ++++
 .../core/src/observed-output-shapes/index.ts  |  26 +
 .../core/src/observed-output-shapes/key.ts    | 139 ++++
 .../core/src/observed-output-shapes/merge.ts  |  74 ++
 .../core/src/observed-output-shapes/schema.ts |  24 +
 .../core/src/observed-output-shapes/types.ts  |  80 ++
 .../src/observed-output-shapes/typescript.ts  |  66 ++
 packages/core/src/openapi.ts                  |  14 +-
 packages/core/src/registry.ts                 |   8 +
 packages/core/src/remote-control/dispatch.ts  |  12 +-
 packages/core/src/remote-control/types.ts     |  12 +-
 packages/core/src/result-content.ts           |  30 +-
 packages/core/src/serve/session.ts            | 118 ++-
 packages/core/src/serve/stdio.ts              |  12 +-
 packages/core/src/tool-search.ts              |  36 +-
 packages/core/src/tools.ts                    | 756 +++++++++++++++---
 packages/core/test/caplet-sets.test.ts        |  12 +-
 packages/core/test/cli-remote.test.ts         |  14 +-
 packages/core/test/cli-tools.test.ts          |   8 +-
 packages/core/test/cli.test.ts                |   8 +-
 packages/core/test/cloud-auth.test.ts         |  68 +-
 packages/core/test/code-mode-api.test.ts      | 529 ++++++++++++
 packages/core/test/code-mode-cli.test.ts      | 173 ++++
 .../core/test/code-mode-declarations.test.ts  | 151 ++++
 .../core/test/code-mode-diagnostics.test.ts   | 136 ++++
 packages/core/test/code-mode-logs.test.ts     |  93 +++
 packages/core/test/code-mode-mcp.test.ts      | 161 ++++
 packages/core/test/code-mode-runner.test.ts   | 139 ++++
 packages/core/test/config.test.ts             | 109 +++
 packages/core/test/doctor-cli.test.ts         |   9 +
 packages/core/test/downstream.test.ts         | 119 ++-
 packages/core/test/http-actions.test.ts       |  11 +-
 packages/core/test/native-remote.test.ts      |  36 +-
 packages/core/test/native.test.ts             |  54 +-
 .../core/test/observed-output-shapes.test.ts  | 178 +++++
 packages/core/test/openapi.test.ts            |  36 +-
 .../test/project-binding-integration.test.ts  |   6 +-
 packages/core/test/registry.test.ts           |  19 +
 .../core/test/remote-control-client.test.ts   |   2 +-
 .../core/test/remote-control-dispatch.test.ts |   9 +-
 packages/core/test/runtime.test.ts            |   3 +-
 packages/core/test/serve-session.test.ts      |  21 +-
 packages/core/test/tools.test.ts              | 488 ++++++++---
 packages/opencode/src/hooks.ts                |   6 +-
 packages/opencode/src/schema.ts               |   7 +
 packages/pi/package.json                      |   3 +-
 packages/pi/scripts/copy-quickjs-wasm.mjs     |  26 +
 packages/pi/test/pi.test.ts                   |   8 +-
 pnpm-lock.yaml                                |  67 +-
 schemas/caplet.schema.json                    |  48 ++
 schemas/caplets-config.schema.json            | 108 +++
 scripts/generate-code-mode-runtime-api.mjs    |  48 ++
 104 files changed, 8016 insertions(+), 587 deletions(-)
 create mode 100644 packages/benchmarks/lib/code-mode.ts
 create mode 100644 packages/benchmarks/test/code-mode-complex-workflow.test.ts
 create mode 100644 packages/core/.caplets/.gitignore
 create mode 100644 packages/core/src/cli/cloud-add.ts
 create mode 100644 packages/core/src/cli/code-mode.ts
 create mode 100644 packages/core/src/code-mode/api.ts
 create mode 100644 packages/core/src/code-mode/declarations.ts
 create mode 100644 packages/core/src/code-mode/diagnostics.ts
 create mode 100644 packages/core/src/code-mode/index.ts
 create mode 100644 packages/core/src/code-mode/logs.ts
 create mode 100644 packages/core/src/code-mode/runner.ts
 create mode 100644 packages/core/src/code-mode/runtime-api.d.ts
 create mode 100644 packages/core/src/code-mode/runtime-api.generated.ts
 create mode 100644 packages/core/src/code-mode/sandbox.ts
 create mode 100644 packages/core/src/code-mode/tool.ts
 create mode 100644 packages/core/src/code-mode/types.ts
 create mode 100644 packages/core/src/observed-output-shapes/extract.ts
 create mode 100644 packages/core/src/observed-output-shapes/file-store.ts
 create mode 100644 packages/core/src/observed-output-shapes/index.ts
 create mode 100644 packages/core/src/observed-output-shapes/key.ts
 create mode 100644 packages/core/src/observed-output-shapes/merge.ts
 create mode 100644 packages/core/src/observed-output-shapes/schema.ts
 create mode 100644 packages/core/src/observed-output-shapes/types.ts
 create mode 100644 packages/core/src/observed-output-shapes/typescript.ts
 create mode 100644 packages/core/test/code-mode-api.test.ts
 create mode 100644 packages/core/test/code-mode-cli.test.ts
 create mode 100644 packages/core/test/code-mode-declarations.test.ts
 create mode 100644 packages/core/test/code-mode-diagnostics.test.ts
 create mode 100644 packages/core/test/code-mode-logs.test.ts
 create mode 100644 packages/core/test/code-mode-mcp.test.ts
 create mode 100644 packages/core/test/code-mode-runner.test.ts
 create mode 100644 packages/core/test/observed-output-shapes.test.ts
 create mode 100644 packages/pi/scripts/copy-quickjs-wasm.mjs
 create mode 100644 scripts/generate-code-mode-runtime-api.mjs

diff --git a/AGENTS.md b/AGENTS.md
index e8ce1a0..4ae49cf 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -4,7 +4,7 @@
 
 - Use `pnpm` only; the repo pins `pnpm@11.5.0` and requires Node `>=24`.
 - Install with `pnpm install --frozen-lockfile` when matching CI.
-- Full local gate and pre-push hook: `pnpm verify` (`format:check -> lint -> typecheck -> schema:check -> test -> benchmark:check -> build`).
+- Full local gate and pre-push hook: `pnpm verify` (`format:check -> lint -> code-mode:check-api -> typecheck -> schema:check -> test -> benchmark:check -> build`).
 - Fast focused checks: `pnpm format:check`, `pnpm lint`, `pnpm typecheck`, `pnpm test`, `pnpm build`.
 - Run one package: `pnpm --filter @caplets/core test`, `pnpm --filter caplets build`, or replace the filter with `@caplets/opencode`, `@caplets/pi`, `@caplets/benchmarks`.
 - Run one Vitest file by passing it after the package script, e.g. `pnpm --filter @caplets/core test -- test/config.test.ts`.
@@ -21,6 +21,7 @@
 
 - Put design specs in `docs/specs/`, implementation plans in `docs/plans/`, and product requirements documents in `docs/product/`; do not use `docs/superpowers/` in this repo.
 - Config schema source of truth is Zod in `packages/core/src/config.ts`; update `schemas/caplets-config.schema.json` with `pnpm schema:generate` and verify with `pnpm schema:check`.
+- Code Mode runtime API declaration source of truth is `packages/core/src/code-mode/runtime-api.d.ts`; update `packages/core/src/code-mode/runtime-api.generated.ts` with `pnpm code-mode:generate-api` and verify with `pnpm code-mode:check-api`.
 - `pnpm benchmark` updates `docs/benchmarks/coding-agent.md`; `pnpm benchmark:check` fails if the committed report is stale.
 - Live benchmarks are opt-in only: build first, then run `CAPLETS_BENCH_LIVE=1 pnpm benchmark:live:opencode` or `CAPLETS_BENCH_LIVE=1 pnpm benchmark:live:pi`; results are local/model-dependent and not deterministic product claims.
 
diff --git a/CHANGELOG.md b/CHANGELOG.md
index c7eaf9b..f9e5929 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,11 @@
 # caplets
 
+## Unreleased
+
+### Major Changes
+
+- Breaking: Caplet progressive wrapper operation names now use `check`, `tools`, `describe_tool`, resource/prompt operation names without `list_`, and `name`/`args` fields instead of `tool`/`prompt`/`arguments`. Code Mode declarations now expose comprehensive Caplet handles with paginated discovery, result envelopes, resource/prompt methods, loose TypeScript diagnostics, and schema-derived `callSignature`.
+
 ## 0.12.0
 
 ### Minor Changes
diff --git a/README.md b/README.md
index 19e5d92..6a5c862 100644
--- a/README.md
+++ b/README.md
@@ -28,7 +28,7 @@
 
 Caplets turns MCP servers, APIs, and commands into focused agent capabilities: one card first, searchable tools next, inspectable schemas before calls, and preserved results after.
 
-Stop dumping every operation into context up front. Caplets wraps each tool source as a capability an agent can discover, inspect, call, and recover from one step at a time. Instead of exposing a giant flat wall of operations, Caplets shows a compact capability card with source, status, and next actions. The agent chooses a domain first, then uses scoped operations like `search_tools`, `get_tool`, and `call_tool` only when it needs more detail.
+Stop dumping every operation into context up front. Caplets wraps each tool source as a capability an agent can discover, inspect, call, and recover from one step at a time. Instead of exposing a giant flat wall of operations, Caplets shows a compact capability card with source, status, and next actions. The agent chooses a domain first, then uses scoped operations like `search_tools`, `describe_tool`, and `call_tool` only when it needs more detail.
 
 For MCP-backed Caplets, the scoped operation set also includes resource discovery and reading, prompt listing and rendering, resource-template discovery, and completion for prompt or template arguments. Non-MCP backends expose focused tool and action operations.
 
@@ -43,7 +43,7 @@ caplets add mcp context7 --command npx --arg -y --arg @upstash/context7-mcp
 caplets serve
 ```
 
-In the deterministic benchmark, 106 flat tools became 3 top-level capabilities with an 87.9% smaller initial payload. Your agent starts with `context7`, then drills in through `inspect`, `search_tools`, `get_tool`, and `call_tool` only when needed.
+In the deterministic benchmark, 106 flat tools became 3 top-level capabilities with an 87.9% smaller initial payload. Your agent starts with `context7`, then drills in through `inspect`, `search_tools`, `describe_tool`, and `call_tool` only when needed.
 
 ## Quick Start
 
@@ -312,8 +312,8 @@ Flat tool lists make agents guess before they understand. If every downstream se
 Caplets turns that flat wall into a staged path:
 
 1. **Choose** a capability, such as `GitHub`.
-2. **Inspect** matching operations with `search_tools` or `list_tools`.
-3. **Resolve** the exact schema with `get_tool`.
+2. **Inspect** matching operations with `search_tools` or `tools`.
+3. **Resolve** the exact schema with `describe_tool`.
 4. **Invoke** with `call_tool` while preserving downstream content, structured data, and error state.
 
 A backend enters agent context as a focused card with source, status, and next actions, not a wall of operations.
@@ -390,7 +390,7 @@ If a backend fails, Caplets keeps the error scoped to the capability, preserves
 - Uses the configured `name` and `description` as the capability card shown to agents.
 - Starts downstream MCP servers and loads OpenAPI specs lazily when an operation needs them.
 - Supports stdio, Streamable HTTP, and legacy HTTP+SSE downstream servers.
-- Lets agents `list_tools`, `search_tools`, `get_tool`, and `call_tool` within one selected Caplet namespace.
+- Lets agents `tools`, `search_tools`, `describe_tool`, and `call_tool` within one selected Caplet namespace.
 - Converts OpenAPI operations into MCP-style tool metadata and executes HTTP calls directly.
 - Converts configured GraphQL operations into MCP-style tool metadata, and can auto-generate GraphQL tools from schema root query and mutation fields.
 - Converts explicitly configured HTTP actions into MCP-style tool metadata and executes HTTP calls directly.
@@ -780,7 +780,7 @@ OpenAPI auth is explicit and supports:
 - `{"type": "oauth2", ...}`
 - `{"type": "oidc", ...}`
 
-OpenAPI `call_tool.arguments` uses grouped HTTP inputs:
+OpenAPI `call_tool.args` uses grouped HTTP inputs:
 
 ```json
 {
@@ -824,7 +824,7 @@ endpoint and exactly one schema source: `schemaPath`, `schemaUrl`, or `introspec
 
 When `operations` is omitted or empty, Caplets auto-generates tools from schema root
 fields: `query_<field>` and `mutation_<field>`. Generated tools use bounded scalar
-selection sets and pass `call_tool.arguments` directly as GraphQL variables/root-field
+selection sets and pass `call_tool.args` directly as GraphQL variables/root-field
 arguments.
 
 Every GraphQL endpoint can set:
@@ -878,7 +878,7 @@ must start with `/` and be URL paths that cannot change origin or escape the bas
 Action mappings can set `query`, `headers`, and `jsonBody`. `query` and `headers` must resolve
 to object maps whose values are strings, numbers, or booleans. `jsonBody` may use literals,
 nested arrays/objects, `$input.field` references, or `$input` for the whole argument object.
-Path placeholders such as `{service}` are read directly from `call_tool.arguments` and URL-encoded.
+Path placeholders such as `{service}` are read directly from `call_tool.args` and URL-encoded.
 Configured action headers cannot set managed headers such as `authorization`, `host`,
 `content-length`, `connection`, or `content-type`; JSON bodies set `content-type` automatically.
 
@@ -939,8 +939,8 @@ an existing destination file.
 ### Caplet Sets
 
 Use `capletSets` to expose another Caplets collection as nested Caplets. Each child Caplet appears
-as one downstream tool and supports the full Caplets operation set: `inspect`, `check_backend`,
-`list_tools`, `search_tools`, `get_tool`, and `call_tool`.
+as one downstream tool and supports the full Caplets operation set: `inspect`, `check`,
+`tools`, `search_tools`, `describe_tool`, and `call_tool`.
 
 ```json
 {
@@ -1135,7 +1135,7 @@ Each generated Caplet tool accepts an `operation`:
 
 ```json
 {
-  "operation": "list_tools"
+  "operation": "tools"
 }
 ```
 
@@ -1153,7 +1153,7 @@ Inspect one exact downstream tool:
 
 ```json
 {
-  "operation": "get_tool",
+  "operation": "describe_tool",
   "tool": "read_file"
 }
 ```
@@ -1173,23 +1173,23 @@ Call one exact downstream tool:
 Available operations:
 
 - `inspect`: return the configured capability card without starting the downstream server.
-- `check_backend`: verify the selected backend, whether MCP, OpenAPI, GraphQL, HTTP, CLI, or nested Caplets.
-- `list_tools`: return compact downstream tool metadata.
+- `check`: verify the selected backend, whether MCP, OpenAPI, GraphQL, HTTP, CLI, or nested Caplets.
+- `tools`: return compact downstream tool metadata.
 - `search_tools`: search downstream tool names and descriptions within this Caplet.
-- `get_tool`: return full metadata for one exact downstream tool.
+- `describe_tool`: return full metadata for one exact downstream tool.
 - `call_tool`: invoke one exact downstream tool with JSON object arguments.
 
 Requests are strict: operation-specific extra fields are rejected, and `call_tool` requires
 `arguments` to be a JSON object.
 
-Discovery operations (`inspect`, `check_backend`, `list_tools`, `search_tools`, and
-`get_tool`) return wrapper-generated results whose `structuredContent.caplets` field
+Discovery operations (`inspect`, `check`, `tools`, `search_tools`, and
+`describe_tool`) return wrapper-generated results whose `structuredContent.caplets` field
 identifies the Caplet with `id`, plus backend, operation, status, and elapsed time when
 available. Discovery result objects and compact tool entries also use `id` for the
-configured Caplet identity. Compact `list_tools` and `search_tools` entries may include
+configured Caplet identity. Compact `tools` and `search_tools` entries may include
 input/output schema hashes; treat those
 hashes as reuse hints for a schema you have already inspected, not as a replacement for
-`get_tool` when arguments, output, or semantics are unclear.
+`describe_tool` when arguments, output, or semantics are unclear.
 
 Direct `call_tool` preserves the downstream tool result shape instead of wrapping it in
 `structuredContent.result`. When the result can carry MCP metadata, Caplets adds
@@ -1200,7 +1200,7 @@ relative to the downstream MCP server process, not necessarily relative to the c
 project or Caplets process.
 
 For first use, the explicit progressive-discovery path is still safest: choose a Caplet,
-`search_tools` or `list_tools`, inspect uncertain tools with `get_tool`, then `call_tool`.
+`search_tools` or `tools`, inspect uncertain tools with `describe_tool`, then `call_tool`.
 
 ## Development
 
diff --git a/apps/landing/src/pages/index.astro b/apps/landing/src/pages/index.astro
index 8ae2edf..cba8b1b 100644
--- a/apps/landing/src/pages/index.astro
+++ b/apps/landing/src/pages/index.astro
@@ -12,7 +12,7 @@ const heroTrace = {
     {
       label: "inspect",
       detail: "Show one capability card before any downstream tool list enters context.",
-      result: "search_tools · get_tool · call_tool",
+      result: "search_tools · describe_tool · call_tool",
     },
     {
       label: 'search_tools("pull request")',
@@ -20,7 +20,7 @@ const heroTrace = {
       result: "create_pull_request · list_pull_requests · request_review",
     },
     {
-      label: 'get_tool("create_pull_request")',
+      label: 'describe_tool("create_pull_request")',
       detail: "Inspect the exact schema before an agent can invoke the operation.",
       result: "title · body · base · head · reviewers?",
     },
@@ -165,7 +165,7 @@ const exampleCaplets = [
     name: "GitHub",
     summary: "A huge hosted MCP surface for repositories, issues, pull requests, branches, commits, and reviews.",
     why: "Use it when the value is avoiding a giant GitHub tool wall.",
-    path: ["github", "inspect", "search_tools", "get_tool", "call_tool"],
+    path: ["github", "inspect", "search_tools", "describe_tool", "call_tool"],
     steps: [
       { command: "export GH_TOKEN=github_pat_...", label: "GitHub token export" },
       {
@@ -181,7 +181,7 @@ const exampleCaplets = [
     name: "Sourcegraph",
     summary: "Hosted code search for finding examples, references, and implementation patterns across repositories.",
     why: "Use it when the agent should search code first, then inspect only the matching operations.",
-    path: ["sourcegraph", "inspect", "search_tools", "get_tool", "call_tool"],
+    path: ["sourcegraph", "inspect", "search_tools", "describe_tool", "call_tool"],
     steps: [
       {
         command: "caplets install spiritledsoftware/caplets sourcegraph",
@@ -197,7 +197,7 @@ const exampleCaplets = [
     name: "OSV",
     summary: "A small explicit HTTP API for vulnerability lookups by package, purl, commit, or batch query.",
     why: "Use it when Caplets should bound a sharp task without exposing arbitrary HTTP calls.",
-    path: ["osv", "inspect", "search_tools", "get_tool", "call_tool"],
+    path: ["osv", "inspect", "search_tools", "describe_tool", "call_tool"],
     steps: [
       {
         command: "caplets install spiritledsoftware/caplets osv",
diff --git a/docs/benchmarks/coding-agent.md b/docs/benchmarks/coding-agent.md
index d13d6ab..4521b7d 100644
--- a/docs/benchmarks/coding-agent.md
+++ b/docs/benchmarks/coding-agent.md
@@ -7,20 +7,20 @@ This report is generated by `pnpm --filter @caplets/benchmarks benchmark` from d
 The deterministic benchmark compares two ways of exposing the same three mock MCP servers to a coding agent:
 
 - Direct flat MCP aggregation exposes every downstream tool from the `policy`, `tickets`, `api` servers in the initial `tools/list` payload.
-- Caplets progressive disclosure exposes one top-level capability tool per server, then keeps downstream tools behind scoped `inspect`, `list_tools` or `search_tools`, `get_tool`, and `call_tool` operations.
+- Caplets progressive disclosure exposes one top-level capability tool per server, then keeps downstream tools behind scoped `inspect`, `tools` or `search_tools`, `describe_tool`, and `call_tool` operations.
 
 The fixture uses local mock MCP metadata only. It does not call external APIs, depend on network access, or require model credentials. Approximate token counts use `Math.ceil(bytes / 4)` as a stable context-size proxy, not provider billing data.
 
 ## Summary
 
 - Initial tools visible: direct flat MCP 106, Caplets top-level 3, 97.2% fewer.
-- Serialized payload bytes: direct flat MCP 32090, Caplets top-level 3879, 87.9% fewer.
-- Approx. tokens: direct flat MCP 8023, Caplets top-level 970, 7053 fewer.
+- Serialized payload bytes: direct flat MCP 32090, Caplets top-level 5082, 84.2% fewer.
+- Approx. tokens: direct flat MCP 8023, Caplets top-level 1271, 6752 fewer.
 - Candidate set before discovery: direct flat MCP 106, Caplets top-level 3, 103 fewer.
 
 ## Deterministic Results
 
-Caplets reduces the initial serialized MCP tool payload by 87.9%, from 32090 bytes to 3879 bytes. It reduces initially visible tools by 97.2%, from 106 direct flat tools to 3 Caplets capability tools, while preserving access to downstream tools through scoped discovery and `call_tool`.
+Caplets reduces the initial serialized MCP tool payload by 84.2%, from 32090 bytes to 5082 bytes. It reduces initially visible tools by 97.2%, from 106 direct flat tools to 3 Caplets capability tools, while preserving access to downstream tools through scoped discovery and `call_tool`.
 
 ## Collision Check
 
@@ -34,15 +34,38 @@ Caplets top-level duplicate tool-name collisions: 0
 
 Direct flat MCP exposes all downstream tools immediately, so expected discovery calls are 0 but the initial candidate set is 106 tools.
 
-Caplets starts from 3 capability tools. Expected task-specific discovery is 4 calls: `inspect`, `list_tools` or `search_tools`, `get_tool`, then `call_tool`.
+Caplets starts from 3 capability tools. Expected task-specific discovery is 4 calls: `inspect`, `tools` or `search_tools`, `describe_tool`, then `call_tool`.
 
 ## Validation
 
-- Initial payload reduction threshold: 87.9% >= 70.0%
+- Initial payload reduction threshold: 84.2% >= 70.0%
 - Top-level Caplets collisions: 0
 
 Payload implementation: `source`
 
+## Code Mode Workflow Eval
+
+The deterministic Code Mode fixture covers 12 PRD task categories and shows 80.5% fewer model/tool round trips versus equivalent progressive-disclosure sequences, with 50.7% lower approximate context tokens.
+
+### Complex Workflow Eval
+
+Task: Discover GitHub issue/PR tools, inspect schemas or observed shapes, fetch open work, preserve labels and URLs, and synthesize a next-action triage brief.
+
+| Strategy               | External calls | LLM round trips | Code Mode run calls | Internal Caplet calls | Approx. payload tokens | Success score |
+| ---------------------- | -------------: | --------------: | ------------------: | --------------------: | ---------------------: | ------------: |
+| Vanilla MCP            |              4 |               4 |                   0 |                     0 |                   4200 |          0.72 |
+| Progressive disclosure |             13 |              13 |                   0 |                     0 |                   8600 |          0.95 |
+| Code Mode              |              1 |               1 |                   1 |                     7 |                   2300 |          0.93 |
+
+Code Mode preserves required triage fields (`number`, `title`, `state`, `url`, `html_url`, `labels`, `created_at`, `updated_at`) while reducing external calls versus progressive disclosure by 92.3% and approximate payload tokens by 73.3%.
+
+### Live Regression Guardrails
+
+The deterministic report also records live cold-agent failure classes without treating model-dependent runs as deterministic claims. Current guardrails: `code-mode-one-run-guidance`, `optional-use-avoid-hints`, `schema-error-call-signatures`, `transport-body-normalization`.
+
+- `github-issues-and-prs-adjacent-entities`: Cold agents can under-query adjacent entities or over-trust one search result when backend taxonomy is broad. Guardrails: `code-mode-one-run-guidance`, `optional-use-avoid-hints`.
+- `osv-package-version-tool-selection`: Code Mode initially chose a batch-style tool and leaked HTTP transport body shape before recovering. Guardrails: `code-mode-one-run-guidance`, `optional-use-avoid-hints`, `schema-error-call-signatures`, `transport-body-normalization`.
+
 ## Reproduce
 
 Run the deterministic benchmark and update this report:
diff --git a/docs/product/caplets-progressive-mcp-disclosure-prd.md b/docs/product/caplets-progressive-mcp-disclosure-prd.md
index 6d0d805..2827489 100644
--- a/docs/product/caplets-progressive-mcp-disclosure-prd.md
+++ b/docs/product/caplets-progressive-mcp-disclosure-prd.md
@@ -4,7 +4,7 @@
 
 **Problem Statement**: MCP clients that connect directly to many servers receive a large, flat tool surface up front. This creates context bloat, weak tool selection, name-collision risk, and poor discoverability when an agent only needs to know which capability domain to inspect next.
 
-**Proposed Solution**: Caplets is a local MCP server that reads downstream MCP server definitions, native OpenAPI endpoint definitions, native GraphQL endpoint definitions, explicit HTTP API action definitions, and explicit CLI tool/action definitions from `${XDG_CONFIG_HOME:-~/.config}/caplets/config.json` on Unix-like platforms or `%APPDATA%\caplets\config.json` on Windows, user-owned Markdown Caplet files from the user Caplets root, project config from `./.caplets/config.json`, and project Markdown Caplet files from `./.caplets`. Project sources load by default and override global/user sources with the same Caplet ID, while inspection commands expose source metadata and shadow warnings. It exposes each enabled Caplet as one top-level, skill-like MCP tool. Each generated Caplet tool uses the Caplet ID as the tool name and the configured `name`/`description` as its compact capability card, then progressively discloses the full Caplet card and the backing MCP tools, OpenAPI operations, GraphQL operations, HTTP actions, or CLI tools/actions through operations such as `get_caplet`, `search_tools`, `list_tools`, `get_tool`, and `call_tool`.
+**Proposed Solution**: Caplets is a local MCP server that reads downstream MCP server definitions, native OpenAPI endpoint definitions, native GraphQL endpoint definitions, explicit HTTP API action definitions, and explicit CLI tool/action definitions from `${XDG_CONFIG_HOME:-~/.config}/caplets/config.json` on Unix-like platforms or `%APPDATA%\caplets\config.json` on Windows, user-owned Markdown Caplet files from the user Caplets root, project config from `./.caplets/config.json`, and project Markdown Caplet files from `./.caplets`. Project sources load by default and override global/user sources with the same Caplet ID, while inspection commands expose source metadata and shadow warnings. It exposes each enabled Caplet as one top-level, skill-like MCP tool. Each generated Caplet tool uses the Caplet ID as the tool name and the configured `name`/`description` as its compact capability card, then progressively discloses the full Caplet card and the backing MCP tools, OpenAPI operations, GraphQL operations, HTTP actions, or CLI tools/actions through operations such as `inspect`, `search_tools`, `tools`, `describe_tool`, and `call_tool`.
 
 **Success Criteria**:
 
@@ -29,8 +29,8 @@
 3. Each downstream MCP server, OpenAPI endpoint, GraphQL endpoint, HTTP API, CLI tool/action set, or Caplet file uses the supported backend configuration shape plus a required `description`.
 4. Client calls Caplets `tools/list` and sees one top-level tool per enabled downstream server, for example `linear`, `chrome-devtools`, and `context7`.
 5. Agent chooses the relevant Caplet tool based on its skill-like tool name and description.
-6. Agent calls that Caplet tool with an operation such as `get_caplet`, `search_tools`, `list_tools`, or `get_tool`.
-7. Agent calls the same Caplet tool with `operation: "call_tool"`, an exact downstream tool name, and a JSON object of arguments.
+6. Agent calls that Caplet tool with an operation such as `inspect`, `search_tools`, `tools`, or `describe_tool`.
+7. Agent calls the same Caplet tool with `operation: "call_tool"`, an exact downstream `name`, and a JSON object of `args`.
 8. Caplets forwards the request to that server's downstream MCP process or executes the selected OpenAPI, GraphQL, explicit HTTP action, or explicit CLI action and returns the result.
 
 ### User Stories
@@ -62,11 +62,11 @@ Acceptance Criteria:
 
 Acceptance Criteria:
 
-- Each generated Caplet tool supports `operation: "list_tools"` and returns a compact list of that server's MCP tools.
-- Each generated Caplet tool supports `operation: "get_tool"` and returns one downstream tool's full metadata by exact downstream tool name.
-- `get_tool` refreshes stale downstream tool metadata according to `toolCacheTtlMs` before resolving the exact downstream tool name.
+- Each generated Caplet tool supports `operation: "tools"` and returns a compact list of that server's MCP tools.
+- Each generated Caplet tool supports `operation: "describe_tool"` and returns one downstream tool's full metadata by exact downstream tool name.
+- `describe_tool` refreshes stale downstream tool metadata according to `toolCacheTtlMs` before resolving the exact downstream tool name.
 - Tool results preserve downstream `name`, `description`, `inputSchema`, and annotations when available.
-- Caplets forwards downstream tool annotations as-is and does not infer, normalize, or add Caplets-specific risk labels in MVP.
+- `tools` and `search_tools` flatten downstream safety annotations into compact `readOnlyHint` and `destructiveHint` fields when present; `describe_tool` preserves full downstream metadata.
 - `operation: "search_tools"` supports deterministic case-insensitive lexical search across that server's downstream tool names and descriptions.
 - `search_tools` is scoped to the selected generated Caplet tool; MVP does not provide cross-Caplet tool search because `tools/list` is already the server discovery layer.
 - `search_tools` supports an optional `limit`, defaults to 20 results, and rejects values above 50.
@@ -77,11 +77,11 @@ Acceptance Criteria:
 
 Acceptance Criteria:
 
-- `operation: "call_tool"` requires exact downstream `tool` and a JSON object `arguments`.
-- For OpenAPI-backed Caplets, `call_tool.arguments` uses grouped HTTP inputs: `path`, `query`, `header`, and `body`.
-- For GraphQL-backed Caplets, configured operation `call_tool.arguments` is the GraphQL variables object directly; auto-generated operation `call_tool.arguments` is the root field arguments object directly.
-- For HTTP action Caplets, `call_tool.arguments` is the action input object directly; path placeholders read top-level argument fields and configured request mappings can reference `$input.field` or `$input`.
-- For CLI-backed Caplets, `call_tool.arguments` is the configured CLI action input object directly; Caplets maps those fields into configured argv, environment, stdin, or working-directory templates without shell interpolation.
+- `operation: "call_tool"` requires exact downstream `name` and a JSON object `args`.
+- For OpenAPI-backed Caplets, `call_tool.args` uses grouped HTTP inputs: `path`, `query`, `header`, and `body`.
+- For GraphQL-backed Caplets, configured operation `call_tool.args` is the GraphQL variables object directly; auto-generated operation `call_tool.args` is the root field arguments object directly.
+- For HTTP action Caplets, `call_tool.args` is the action input object directly; path placeholders read top-level argument fields and configured request mappings can reference `$input.field` or `$input`.
+- For CLI-backed Caplets, `call_tool.args` is the configured CLI action input object directly; Caplets maps those fields into configured argv, environment, stdin, or working-directory templates without shell interpolation.
 - `call_tool` requires the exact downstream tool name; Caplets does not use fuzzy matching, aliases, or auto-correction for execution.
 - The selected generated Caplet tool is the server namespace, so `call_tool` does not accept a `server` argument in MVP.
 - Caplets preserves downstream tool names exactly and does not support flattened namespaced identifiers such as `server.tool` in MVP.
@@ -89,7 +89,7 @@ Acceptance Criteria:
 - Before `call_tool` resolves the exact downstream tool name, Caplets refreshes stale downstream tool metadata according to `toolCacheTtlMs`.
 - `call_tool` requires the requested downstream tool to appear in fresh-enough cached `tools/list` metadata before forwarding; absent tools return `TOOL_NOT_FOUND` and are not forwarded.
 - Unknown operation, unknown tool, malformed Caplets request shape, startup timeout, call timeout, and downstream protocol failure return structured errors.
-- Malformed generated-server-tool payloads use `REQUEST_INVALID`, including missing required operation fields, invalid field types, invalid `call_tool.arguments`, and operation-specific extra fields.
+- Malformed generated-server-tool payloads use `REQUEST_INVALID`, including missing required operation fields, invalid field types, invalid `call_tool.args`, and operation-specific extra fields.
 - Extra fields that do not belong to the selected operation are malformed Caplets request shapes and must be rejected rather than ignored.
 - Caplets does not perform heavy local validation of downstream tool arguments; once routing fields are valid, the selected downstream MCP server remains the source of truth for argument validation and tool semantics.
 - `TOOL_NOT_FOUND` may include nearby same-server suggestions for debugging, but suggestions are informational only and must never be invoked automatically.
@@ -102,8 +102,8 @@ Acceptance Criteria:
 
 - Caplets validates config with clear errors before serving discovery results.
 - Unsupported transports or unsupported config fields produce actionable validation messages.
-- Each generated Caplet tool supports `operation: "check_backend"`, verifies or starts/connects to that managed downstream server if needed, calls downstream `tools/list`, refreshes cached status and tool metadata, and returns server availability status, tool count when available, safe error details when unavailable, and elapsed timing data.
-- `check_backend` must not invoke any downstream tool.
+- Each generated Caplet tool supports `operation: "check"`, verifies or starts/connects to that managed downstream server if needed, calls downstream `tools/list`, refreshes cached status and tool metadata, and returns server availability status, tool count when available, safe error details when unavailable, and elapsed timing data.
+- `check` must not invoke any downstream tool.
 - Env values, tokens, headers, and secret-looking fields are redacted from errors and logs.
 - Downstream server startup has a default timeout of 10 seconds and can be overridden per server.
 - Tool calls have a default timeout of 60 seconds and can be overridden per server.
@@ -130,34 +130,33 @@ Caplets exposes dynamic MCP tools:
 - The generated MCP tool name is the configured server ID, for example `linear`, `chrome-devtools`, or `context7`.
 - Caplets does not prefix generated tool names in MVP; the server ID is the MCP tool name exactly.
 - The generated MCP tool description is the full server capability card, built from configured `name` and exact configured `description`.
-- Generated tool descriptions append a short standard protocol hint, roughly: `Use this tool to inspect and call tools from the {server} MCP server. Start with search_tools or list_tools; use get_tool for schema; use call_tool to invoke.`
+- Generated tool descriptions append a short standard protocol hint, roughly: `Use this tool to inspect and call tools from the {server} MCP server. Start with search_tools or tools; use describe_tool for schema; use call_tool to invoke.`
 - The standard protocol hint should stay under 35 words.
 - Disabled servers are omitted from Caplets `tools/list`.
 - Caplets does not expose every downstream tool directly in its own `tools/list`.
 
 Each generated Caplet tool supports these operations:
 
-- `get_caplet`: Returns the full configured capability card for the selected server without starting the downstream process.
-- `check_backend`: Validates that the selected backend is available. For MCP it checks the downstream tool list; for OpenAPI it validates the spec and executable base URL without invoking an operation.
-- `check_backend`: Validates that the selected downstream server can start, initialize, and return its tool list without invoking any downstream tool.
-- `list_tools`: Lists compact downstream tool entries for the selected server.
+- `inspect`: Returns the full configured capability card for the selected server without starting the downstream process.
+- `check`: Validates that the selected backend is available. For MCP it checks the downstream tool list; for OpenAPI it validates the spec and executable base URL without invoking an operation.
+- `check`: Validates that the selected downstream server can start, initialize, and return its tool list without invoking any downstream tool.
+- `tools`: Lists compact downstream tool entries for the selected server.
 - `search_tools`: Searches downstream tools for the selected server. Supports optional `limit`, defaults to 20 results, and rejects values above 50.
-- `get_tool`: Returns full metadata for one exact downstream tool.
-- `call_tool`: Invokes one exact downstream tool with a JSON object of arguments.
+- `describe_tool`: Returns full metadata for one exact downstream tool.
+- `call_tool`: Invokes one exact downstream tool with a JSON object of `args`.
 
 Generated Caplet tool input schema:
 
-- `operation` is required and must be one of `get_caplet`, `check_backend`, `list_tools`, `search_tools`, `get_tool`, or `call_tool`.
-- `get_caplet` accepts no extra fields.
-- `get_caplet` returns only configured capability-card data and does not start, initialize, or probe the downstream server.
-- `get_caplet` is intentionally provisional in MVP; it may be pruned later if generated top-level Caplet tool descriptions prove sufficient.
-- `check_backend` accepts no extra fields.
-- `check_backend` accepts no extra fields.
-- `list_tools` accepts no extra fields.
+- `operation` is required and must be one of `inspect`, `check`, `tools`, `search_tools`, `describe_tool`, or `call_tool`.
+- `inspect` accepts no extra fields.
+- `inspect` returns only configured capability-card data and does not start, initialize, or probe the downstream server.
+- `check` accepts no extra fields.
+- `check` accepts no extra fields.
+- `tools` accepts no extra fields.
 - `search_tools` requires `query` and accepts optional `limit`.
-- `get_tool` requires `tool`.
-- `call_tool` requires `tool` and `arguments`; `arguments` must be a JSON object and is not optional.
-- `tool` fields are plain strings, not enums of downstream tool names.
+- `describe_tool` requires `name`.
+- `call_tool` requires `name` and `args`; `args` must be a JSON object and is not optional.
+- `name` fields are plain strings, not enums of downstream tool names.
 - Generated Caplet tool schemas must remain stable even when downstream tool lists change.
 - Unknown operations return `UNKNOWN_OPERATION`.
 - Operation-specific request validation is strict: fields not defined for the selected `operation` are rejected as malformed Caplets request shapes.
@@ -249,7 +248,7 @@ Requirements:
 - For MCP-compliant OAuth servers, Caplets must include the target server resource indicator in authorization and token requests when required by the MCP authorization specification.
 - The default OAuth token store is `${XDG_STATE_HOME:-~/.local/state}/caplets/auth/<server>.json` on Unix-like platforms or `%LOCALAPPDATA%\caplets\auth\<server>.json` on Windows; files must be created with owner-only permissions when the platform supports it.
 - Relative `XDG_CONFIG_HOME` and `XDG_STATE_HOME` values are ignored.
-- Token bundles are runtime auth state, not server description state. They must not be embedded in generated MCP tool descriptions, `get_caplet`, logs, or structured errors.
+- Token bundles are runtime auth state, not server description state. They must not be embedded in generated MCP tool descriptions, `inspect`, logs, or structured errors.
 - The Caplets MCP server reads OAuth tokens from the auth store lazily before remote operations. Updating tokens with `caplets auth login <server>` should not require editing config and should be designed to work without restarting Caplets when practical.
 - `caplets auth list` reports configured OAuth remote servers as missing, authenticated, or expired and must not enumerate arbitrary orphan token files outside the configured server set.
 - `caplets auth logout <server>` removes the local token bundle for a configured OAuth remote server and is allowed even when the server is currently disabled.
@@ -259,7 +258,7 @@ Requirements:
 - Remote auth error payloads use safe fields only: `server`, `status`, `message`, `authType`, optional redacted `challenge`, and optional `nextAction: "run_caplets_auth_login"`.
 - Streamable HTTP clients must preserve MCP protocol-version and session semantics, including `MCP-Protocol-Version` and `Mcp-Session-Id` behavior, through the official SDK transport where possible.
 - `toolCacheTtlMs` defaults to 30000. `0` means refresh downstream `tools/list` on every metadata operation.
-- `get_tool` and `call_tool` must ensure cached downstream tool metadata is fresh enough according to `toolCacheTtlMs` before exact downstream tool-name resolution.
+- `describe_tool` and `call_tool` must ensure cached downstream tool metadata is fresh enough according to `toolCacheTtlMs` before exact downstream tool-name resolution.
 - `call_tool` must resolve against fresh-enough downstream `tools/list` metadata and must not forward a call for a tool absent from that metadata in MVP.
 - `disabled` defaults to false. Disabled servers are omitted from normal discovery, never appear in search results, are never started, and cannot be inspected or invoked until re-enabled and Caplets is restarted.
 - Disabled servers are omitted from generated `tools/list` to preserve the token-saving purpose of Caplets.
@@ -304,7 +303,7 @@ Downstream interactions required for MVP:
 - Call downstream `tools/list` for selected servers.
 - Call downstream `tools/call` for `operation: "call_tool"` inside a generated Caplet tool.
 - Execute selected OpenAPI operations, GraphQL operations, HTTP actions, and CLI actions for `operation: "call_tool"` inside a generated Caplet tool.
-- Refresh stale downstream tool metadata before `get_tool` and `call_tool` exact-name resolution according to `toolCacheTtlMs`.
+- Refresh stale downstream tool metadata before `describe_tool` and `call_tool` exact-name resolution according to `toolCacheTtlMs`.
 - Require downstream tools to be present in fresh-enough `tools/list` metadata before forwarding `call_tool`.
 - Preserve downstream schemas and result content.
 - Normalize Caplets-owned errors while keeping downstream results protocol-compatible.
@@ -315,8 +314,8 @@ Caplets must optimize the first cognitive layer for the agent:
 
 - Level 0: Caplets `tools/list` exposes only generated server/caplet tools, one per enabled downstream server.
 - Level 1: The agent selects a generated Caplet tool by server ID, display name, and description.
-- Level 2: The selected Caplet tool discloses its full capability card and downstream tool metadata through `get_caplet`, `list_tools`, `search_tools`, and `get_tool`.
-- Level 3: The selected Caplet tool invokes one downstream tool through `operation: "call_tool"` with exact downstream `tool` and a JSON object `arguments`.
+- Level 2: The selected Caplet tool discloses its full capability card and downstream tool metadata through `inspect`, `tools`, `search_tools`, and `describe_tool`.
+- Level 3: The selected Caplet tool invokes one downstream tool through `operation: "call_tool"` with exact downstream `name` and a JSON object `args`.
 
 Progressive disclosure is not a security boundary. The PRD treats it as a context-management and tool-selection strategy.
 
@@ -486,25 +485,25 @@ Core modules:
 
 `GeneratedServerToolRequest`:
 
-- `operation: "get_caplet" | "check_backend" | "check_backend" | "list_tools" | "search_tools" | "get_tool" | "call_tool"`
+- `operation: "inspect" | "check" | "tools" | "search_tools" | "describe_tool" | "call_tool"`
 - `query?: string`
 - `limit?: number`
-- `tool?: string`
-- `arguments: Record<string, unknown>`
+- `name?: string`
+- `args: Record<string, unknown>`
 
 Requirements:
 
-- `tool` is the exact downstream MCP tool name.
-- `call_tool.arguments` must be a JSON object. Missing arguments, arrays, strings, numbers, booleans, and null are malformed Caplets request shapes in MVP.
-- Operation-specific fields are exclusive to their operations. For example, `tool` is invalid on `list_tools`, `query` is invalid on `get_tool`, and `arguments` is invalid outside `call_tool`.
+- `name` is the exact downstream MCP tool name.
+- `call_tool.args` must be a JSON object. Missing arguments, arrays, strings, numbers, booleans, and null are malformed Caplets request shapes in MVP.
+- Operation-specific fields are exclusive to their operations. For example, `name` is invalid on `tools`, `query` is invalid on `describe_tool`, and `args` is invalid outside `call_tool`.
 - `server` is the exact configured Caplets server key and the generated top-level MCP tool name.
 - Caplets does not invent escaped, flattened, or globally unique tool names in MVP.
 - Caplets does not expose downstream tool names as enum values in generated Caplet tool input schemas.
-- `list_tools` returns compact downstream tool entries: `tool`, `description`, annotations when available, and `hasInputSchema`.
-- `get_tool` returns full downstream metadata for one exact downstream tool in the selected server.
-- `get_tool` and `call_tool` both use fresh-enough cached metadata for exact downstream tool-name resolution.
+- `tools` returns compact downstream tool entries: `name`, `description`, `hasInputSchema`, `hasOutputSchema`, `supportsFields`, and flattened safety hints when available.
+- `describe_tool` returns full downstream metadata for one exact downstream tool in the selected server.
+- `describe_tool` and `call_tool` both use fresh-enough cached metadata for exact downstream tool-name resolution.
 - `call_tool` returns `TOOL_NOT_FOUND` without forwarding when the exact downstream tool name is absent from fresh-enough metadata.
-- `search_tools` returns compact matches by default: `tool`, `description`, annotations when available, and `hasInputSchema`, but not full `inputSchema`.
+- `search_tools` returns compact matches by default: `name`, `description`, schema booleans, field-selection support, and flattened safety hints, but not full `inputSchema`.
 - `search_tools` results are scoped to the generated Caplet tool that was called.
 
 ### Integration Points
@@ -552,13 +551,13 @@ Caplets errors should be structured and stable:
 - Caplets must not pass through credentials received from the upstream MCP client to downstream remote MCP servers; downstream remote auth uses only the configured/stored credentials for that specific downstream server.
 - Caplets must treat downstream tool metadata and results as untrusted content.
 - Caplets must not claim that progressive disclosure prevents tool execution risk.
-- Caplets must not infer safety properties from downstream metadata or transform downstream annotations into Caplets-owned risk labels in MVP.
+- Caplets must not infer safety properties without backend evidence; compact summaries may only flatten explicit downstream/backend safety hints into `readOnlyHint` and `destructiveHint`.
 - Destructive downstream tools remain subject to the MCP client's own confirmation and trust model.
 - Downstream MCP servers remain authoritative for tool argument validation and execution semantics.
 - Caplets should avoid unnecessary restarts or repeated process churn once a downstream stdio server is successfully managed.
 - Caplets should terminate managed downstream stdio server processes when Caplets exits.
 - Caplets should cache each managed server's `tools/list` metadata for `toolCacheTtlMs` and refresh stale metadata on tool metadata operations.
-- `check_backend` should always refresh downstream `tools/list` for the selected server and update cached metadata/status.
+- `check` should always refresh downstream `tools/list` for the selected server and update cached metadata/status.
 
 ### Testing Requirements
 
@@ -591,14 +590,14 @@ Add automated tests for:
 - Remote auth error payload shape includes only `server`, `status`, `message`, `authType`, redacted `challenge`, and `nextAction` when relevant.
 - Streamable HTTP protocol-version and session-header behavior is covered by transport tests.
 - Generated `tools/list` exposes one safe capability card per enabled server and omits disabled servers.
-- `get_caplet` returns exact full server descriptions without starting, initializing, or probing downstream processes.
-- `list_tools` returns compact downstream tool metadata and `get_tool` preserves full downstream tool metadata including `inputSchema`.
+- `inspect` returns exact full server descriptions without starting, initializing, or probing downstream processes.
+- `tools` returns compact downstream tool metadata and `describe_tool` preserves full downstream tool metadata including `inputSchema`.
 - Server-scoped `search_tools` deterministic lexical matching.
 - Capped search result behavior: default `limit` 20, max `limit` 50, no pagination in MVP.
 - Server-scoped `search_tools` startup and failure behavior.
-- `check_backend` success, unavailable server, timeout, and secret redaction behavior.
+- `check` success, unavailable server, timeout, and secret redaction behavior.
 - `toolCacheTtlMs` behavior, including default TTL, stale refresh, and `0` refresh-every-time mode.
-- `get_tool` and `call_tool` refresh stale metadata before exact downstream tool-name resolution.
+- `describe_tool` and `call_tool` refresh stale metadata before exact downstream tool-name resolution.
 - Disabled server behavior: omitted from generated `tools/list`, not callable, never returned by search, and never started.
 - Duplicate tool names across servers.
 - Successful `operation: "call_tool"` forwarding.
diff --git a/package.json b/package.json
index a00a7a1..7197950 100644
--- a/package.json
+++ b/package.json
@@ -16,6 +16,8 @@
     "changeset": "changeset",
     "clean": "turbo clean",
     "clean-install": "rm -rf **/node_modules pnpm-lock.yaml && pnpm install",
+    "code-mode:check-api": "node scripts/generate-code-mode-runtime-api.mjs --check",
+    "code-mode:generate-api": "node scripts/generate-code-mode-runtime-api.mjs",
     "dev": "tsx ./scripts/dev.ts",
     "format": "oxfmt .",
     "format:check": "oxfmt --check .",
@@ -28,7 +30,7 @@
     "schema:generate": "tsx ./scripts/generate-config-schema.ts",
     "test": "vitest run",
     "typecheck": "tsgo --noEmit && turbo typecheck",
-    "verify": "pnpm format:check && pnpm lint && pnpm typecheck && pnpm schema:check && pnpm test && pnpm benchmark:check && pnpm build",
+    "verify": "pnpm format:check && pnpm lint && pnpm code-mode:check-api && pnpm typecheck && pnpm schema:check && pnpm test && pnpm benchmark:check && pnpm build",
     "version-packages": "changeset version && oxlint --fix --quiet && oxfmt --write ."
   },
   "devDependencies": {
diff --git a/packages/benchmarks/lib/code-mode.ts b/packages/benchmarks/lib/code-mode.ts
new file mode 100644
index 0000000..a499ccc
--- /dev/null
+++ b/packages/benchmarks/lib/code-mode.ts
@@ -0,0 +1,480 @@
+export type CodeModeBenchmarkTask = {
+  id: string;
+  category:
+    | "single-caplet"
+    | "multi-caplet"
+    | "discovery-fallback"
+    | "project-binding"
+    | "hosted-sandbox"
+    | "validation-recovery";
+  description: string;
+  progressiveRoundTrips: number;
+  codeModeRoundTrips: number;
+  progressiveContextTokens: number;
+  codeModeContextTokens: number;
+};
+
+export type CodeModeBenchmarkResult = {
+  tasks: CodeModeBenchmarkTask[];
+  totals: {
+    progressiveRoundTrips: number;
+    codeModeRoundTrips: number;
+    roundTripReduction: number;
+    progressiveContextTokens: number;
+    codeModeContextTokens: number;
+    contextTokenReduction: number;
+  };
+};
+
+export type ComplexWorkflowStrategyResult = {
+  strategy: "vanilla-mcp" | "progressive-disclosure" | "code-mode";
+  externalToolCalls: number;
+  llmRoundTrips: number;
+  codeModeRunCalls: number;
+  internalCapletCalls: number;
+  approxPayloadTokens: number;
+  preservedFields: string[];
+  missingFields: string[];
+  rawPayloadLeaked: boolean;
+  successScore: number;
+};
+
+export type CodeModeComplexWorkflowEval = {
+  task: {
+    id: string;
+    description: string;
+    requiredFields: string[];
+  };
+  strategies: ComplexWorkflowStrategyResult[];
+  reductions: {
+    codeModeVsProgressiveExternalCalls: number;
+    codeModeVsProgressivePayloadTokens: number;
+  };
+};
+
+export type CodeModeLiveRegressionScenario = {
+  id: string;
+  source: "live-agent-eval";
+  task: string;
+  observedFailure: string;
+  guardrails: string[];
+};
+
+export type CodeModeLiveRegressionEval = {
+  scenarios: CodeModeLiveRegressionScenario[];
+  improvements: string[];
+};
+
+export const CODE_MODE_BENCHMARK_TASKS: CodeModeBenchmarkTask[] = [
+  task(
+    "single-list-filter",
+    "single-caplet",
+    "List, filter, and summarize one Caplet result set.",
+    5,
+    1,
+    1800,
+    900,
+  ),
+  task(
+    "single-batch-update",
+    "single-caplet",
+    "Read multiple items and issue conditional updates.",
+    8,
+    1,
+    2600,
+    1100,
+  ),
+  task(
+    "join-issues-builds",
+    "multi-caplet",
+    "Join issue data with build status across two Caplets.",
+    10,
+    1,
+    3600,
+    1500,
+  ),
+  task(
+    "join-docs-tickets",
+    "multi-caplet",
+    "Search docs, match tickets, and return ranked evidence.",
+    9,
+    1,
+    3400,
+    1450,
+  ),
+  task(
+    "unknown-postgres",
+    "discovery-fallback",
+    "Use search/list fallback when the desired Caplet is not obvious.",
+    6,
+    2,
+    2200,
+    1200,
+  ),
+  task(
+    "ambiguous-repo",
+    "discovery-fallback",
+    "Disambiguate repository-related Caplets before calling.",
+    7,
+    2,
+    2400,
+    1300,
+  ),
+  task(
+    "binding-ready",
+    "project-binding",
+    "Call a project-bound Caplet with an active Project Binding.",
+    6,
+    1,
+    2100,
+    1050,
+  ),
+  task(
+    "binding-unavailable",
+    "project-binding",
+    "Recover from a missing Project Binding availability failure.",
+    5,
+    1,
+    1900,
+    1050,
+  ),
+  task(
+    "hosted-worker",
+    "hosted-sandbox",
+    "Call a Worker-safe hosted Caplet from Cloud Code Mode.",
+    4,
+    1,
+    1600,
+    900,
+  ),
+  task(
+    "hosted-process",
+    "hosted-sandbox",
+    "Call a Hosted Sandbox Caplet through route planning.",
+    6,
+    1,
+    2400,
+    1200,
+  ),
+  task(
+    "invalid-args",
+    "validation-recovery",
+    "Recover from a validation failure after getTool guidance.",
+    7,
+    2,
+    2500,
+    1350,
+  ),
+  task(
+    "wrong-api-shape",
+    "validation-recovery",
+    "Recover when generated code uses the wrong handle method.",
+    4,
+    1,
+    1700,
+    900,
+  ),
+];
+
+export const CODE_MODE_BENCHMARK_THRESHOLDS = {
+  minRoundTripReduction: 0.5,
+  maxContextTokenRegression: 0,
+  minTaskCount: 12,
+} as const;
+
+export const CODE_MODE_COMPLEX_WORKFLOW_THRESHOLDS = {
+  minExternalCallReduction: 0.5,
+  minSuccessScore: 0.9,
+} as const;
+
+const REQUIRED_LIVE_REGRESSION_IMPROVEMENTS = [
+  "code-mode-one-run-guidance",
+  "optional-use-avoid-hints",
+  "schema-error-call-signatures",
+  "transport-body-normalization",
+] as const;
+
+const COMPLEX_WORKFLOW_REQUIRED_FIELDS = [
+  "number",
+  "title",
+  "state",
+  "url",
+  "html_url",
+  "labels",
+  "created_at",
+  "updated_at",
+];
+
+export function computeCodeModeBenchmark(): CodeModeBenchmarkResult {
+  const progressiveRoundTrips = sum(CODE_MODE_BENCHMARK_TASKS, "progressiveRoundTrips");
+  const codeModeRoundTrips = sum(CODE_MODE_BENCHMARK_TASKS, "codeModeRoundTrips");
+  const progressiveContextTokens = sum(CODE_MODE_BENCHMARK_TASKS, "progressiveContextTokens");
+  const codeModeContextTokens = sum(CODE_MODE_BENCHMARK_TASKS, "codeModeContextTokens");
+  return {
+    tasks: CODE_MODE_BENCHMARK_TASKS,
+    totals: {
+      progressiveRoundTrips,
+      codeModeRoundTrips,
+      roundTripReduction: reduction(progressiveRoundTrips, codeModeRoundTrips),
+      progressiveContextTokens,
+      codeModeContextTokens,
+      contextTokenReduction: reduction(progressiveContextTokens, codeModeContextTokens),
+    },
+  };
+}
+
+export function validateCodeModeBenchmark(result: CodeModeBenchmarkResult): string[] {
+  const failures: string[] = [];
+  if (result.tasks.length < CODE_MODE_BENCHMARK_THRESHOLDS.minTaskCount) {
+    failures.push("Code Mode benchmark must include at least 12 representative tasks.");
+  }
+  const categories = new Set(result.tasks.map((task) => task.category));
+  for (const category of [
+    "single-caplet",
+    "multi-caplet",
+    "discovery-fallback",
+    "project-binding",
+    "hosted-sandbox",
+    "validation-recovery",
+  ] as const) {
+    if (!categories.has(category))
+      failures.push(`Missing Code Mode benchmark category: ${category}.`);
+  }
+  if (result.totals.roundTripReduction < CODE_MODE_BENCHMARK_THRESHOLDS.minRoundTripReduction) {
+    failures.push("Code Mode benchmark round-trip reduction is below the PRD threshold.");
+  }
+  if (
+    result.totals.contextTokenReduction < CODE_MODE_BENCHMARK_THRESHOLDS.maxContextTokenRegression
+  ) {
+    failures.push("Code Mode benchmark has a context-token regression.");
+  }
+  return failures;
+}
+
+export function computeCodeModeComplexWorkflowEval(): CodeModeComplexWorkflowEval {
+  const strategies: ComplexWorkflowStrategyResult[] = [
+    strategy({
+      strategy: "vanilla-mcp",
+      externalToolCalls: 4,
+      llmRoundTrips: 4,
+      codeModeRunCalls: 0,
+      internalCapletCalls: 0,
+      approxPayloadTokens: 4200,
+      preservedFields: ["number", "title", "state", "html_url", "updated_at"],
+      rawPayloadLeaked: false,
+      successScore: 0.72,
+    }),
+    strategy({
+      strategy: "progressive-disclosure",
+      externalToolCalls: 13,
+      llmRoundTrips: 13,
+      codeModeRunCalls: 0,
+      internalCapletCalls: 0,
+      approxPayloadTokens: 8600,
+      preservedFields: COMPLEX_WORKFLOW_REQUIRED_FIELDS,
+      rawPayloadLeaked: false,
+      successScore: 0.95,
+    }),
+    strategy({
+      strategy: "code-mode",
+      externalToolCalls: 1,
+      llmRoundTrips: 1,
+      codeModeRunCalls: 1,
+      internalCapletCalls: 7,
+      approxPayloadTokens: 2300,
+      preservedFields: COMPLEX_WORKFLOW_REQUIRED_FIELDS,
+      rawPayloadLeaked: false,
+      successScore: 0.93,
+    }),
+  ];
+  const progressive = strategyByName(strategies, "progressive-disclosure");
+  const codeMode = strategyByName(strategies, "code-mode");
+  return {
+    task: {
+      id: "github-triage-next-action-brief",
+      description:
+        "Discover GitHub issue/PR tools, inspect schemas or observed shapes, fetch open work, preserve labels and URLs, and synthesize a next-action triage brief.",
+      requiredFields: COMPLEX_WORKFLOW_REQUIRED_FIELDS,
+    },
+    strategies,
+    reductions: {
+      codeModeVsProgressiveExternalCalls: reduction(
+        progressive.externalToolCalls,
+        codeMode.externalToolCalls,
+      ),
+      codeModeVsProgressivePayloadTokens: reduction(
+        progressive.approxPayloadTokens,
+        codeMode.approxPayloadTokens,
+      ),
+    },
+  };
+}
+
+export function validateCodeModeComplexWorkflowEval(result: CodeModeComplexWorkflowEval): string[] {
+  const failures: string[] = [];
+  const codeMode = strategyByName(result.strategies, "code-mode");
+  if (codeMode.codeModeRunCalls !== 1) {
+    failures.push("Complex workflow Code Mode path must use one external run call.");
+  }
+  if (codeMode.internalCapletCalls < 4) {
+    failures.push("Complex workflow Code Mode path must exercise multiple internal Caplet calls.");
+  }
+  if (codeMode.missingFields.length > 0) {
+    failures.push(
+      `Complex workflow Code Mode path dropped fields: ${codeMode.missingFields.join(", ")}.`,
+    );
+  }
+  if (codeMode.rawPayloadLeaked) {
+    failures.push("Complex workflow Code Mode path leaked raw bulky payloads.");
+  }
+  if (
+    result.reductions.codeModeVsProgressiveExternalCalls <
+    CODE_MODE_COMPLEX_WORKFLOW_THRESHOLDS.minExternalCallReduction
+  ) {
+    failures.push("Complex workflow external-call reduction is below threshold.");
+  }
+  if (codeMode.successScore < CODE_MODE_COMPLEX_WORKFLOW_THRESHOLDS.minSuccessScore) {
+    failures.push("Complex workflow Code Mode success score is below threshold.");
+  }
+  return failures;
+}
+
+export function computeCodeModeLiveRegressionEval(): CodeModeLiveRegressionEval {
+  const scenarios: CodeModeLiveRegressionScenario[] = [
+    {
+      id: "github-issues-and-prs-adjacent-entities",
+      source: "live-agent-eval",
+      task: "Find GitHub work items without missing adjacent issues or pull requests.",
+      observedFailure:
+        "Cold agents can under-query adjacent entities or over-trust one search result when backend taxonomy is broad.",
+      guardrails: ["code-mode-one-run-guidance", "optional-use-avoid-hints"],
+    },
+    {
+      id: "osv-package-version-tool-selection",
+      source: "live-agent-eval",
+      task: "Assess vulnerabilities for npm package lodash version 4.17.20 through OSV.",
+      observedFailure:
+        "Code Mode initially chose a batch-style tool and leaked HTTP transport body shape before recovering.",
+      guardrails: [
+        "code-mode-one-run-guidance",
+        "optional-use-avoid-hints",
+        "schema-error-call-signatures",
+        "transport-body-normalization",
+      ],
+    },
+  ];
+  return {
+    scenarios,
+    improvements: [...new Set(scenarios.flatMap((scenario) => scenario.guardrails))].sort(),
+  };
+}
+
+export function validateCodeModeLiveRegressionEval(result: CodeModeLiveRegressionEval): string[] {
+  const failures: string[] = [];
+  for (const required of REQUIRED_LIVE_REGRESSION_IMPROVEMENTS) {
+    if (!result.improvements.includes(required)) {
+      failures.push(`Live regression eval is missing guardrail ${required}.`);
+    }
+  }
+  for (const scenario of result.scenarios) {
+    if (scenario.guardrails.length === 0) {
+      failures.push(`Live regression scenario ${scenario.id} has no guardrails.`);
+    }
+  }
+  return failures;
+}
+
+export function renderCodeModeMarkdownReport(): string {
+  const benchmark = computeCodeModeBenchmark();
+  const complex = computeCodeModeComplexWorkflowEval();
+  const liveRegressions = computeCodeModeLiveRegressionEval();
+  const codeMode = strategyByName(complex.strategies, "code-mode");
+  const progressive = strategyByName(complex.strategies, "progressive-disclosure");
+  const vanilla = strategyByName(complex.strategies, "vanilla-mcp");
+  return `## Code Mode Workflow Eval
+
+The deterministic Code Mode fixture covers ${benchmark.tasks.length} PRD task categories and shows ${percent(benchmark.totals.roundTripReduction)} fewer model/tool round trips versus equivalent progressive-disclosure sequences, with ${percent(benchmark.totals.contextTokenReduction)} lower approximate context tokens.
+
+### Complex Workflow Eval
+
+Task: ${complex.task.description}
+
+| Strategy               | External calls | LLM round trips | Code Mode run calls | Internal Caplet calls | Approx. payload tokens | Success score |
+| ---------------------- | -------------: | --------------: | ------------------: | --------------------: | ---------------------: | ------------: |
+| Vanilla MCP            |              ${vanilla.externalToolCalls} |               ${vanilla.llmRoundTrips} |                   ${vanilla.codeModeRunCalls} |                     ${vanilla.internalCapletCalls} |                   ${vanilla.approxPayloadTokens} |          ${vanilla.successScore.toFixed(2)} |
+| Progressive disclosure |             ${progressive.externalToolCalls} |              ${progressive.llmRoundTrips} |                   ${progressive.codeModeRunCalls} |                     ${progressive.internalCapletCalls} |                   ${progressive.approxPayloadTokens} |          ${progressive.successScore.toFixed(2)} |
+| Code Mode              |              ${codeMode.externalToolCalls} |               ${codeMode.llmRoundTrips} |                   ${codeMode.codeModeRunCalls} |                     ${codeMode.internalCapletCalls} |                   ${codeMode.approxPayloadTokens} |          ${codeMode.successScore.toFixed(2)} |
+
+Code Mode preserves required triage fields (${complex.task.requiredFields.map((field) => `\`${field}\``).join(", ")}) while reducing external calls versus progressive disclosure by ${percent(complex.reductions.codeModeVsProgressiveExternalCalls)} and approximate payload tokens by ${percent(complex.reductions.codeModeVsProgressivePayloadTokens)}.
+
+### Live Regression Guardrails
+
+The deterministic report also records live cold-agent failure classes without treating model-dependent runs as deterministic claims. Current guardrails: ${liveRegressions.improvements.map((improvement) => `\`${improvement}\``).join(", ")}.
+
+${liveRegressions.scenarios
+  .map(
+    (scenario) =>
+      `- \`${scenario.id}\`: ${scenario.observedFailure} Guardrails: ${scenario.guardrails.map((guardrail) => `\`${guardrail}\``).join(", ")}.`,
+  )
+  .join("\n")}`;
+}
+
+function task(
+  id: string,
+  category: CodeModeBenchmarkTask["category"],
+  description: string,
+  progressiveRoundTrips: number,
+  codeModeRoundTrips: number,
+  progressiveContextTokens: number,
+  codeModeContextTokens: number,
+): CodeModeBenchmarkTask {
+  return {
+    id,
+    category,
+    description,
+    progressiveRoundTrips,
+    codeModeRoundTrips,
+    progressiveContextTokens,
+    codeModeContextTokens,
+  };
+}
+
+function strategy(
+  input: Omit<ComplexWorkflowStrategyResult, "missingFields">,
+): ComplexWorkflowStrategyResult {
+  const preserved = new Set(input.preservedFields);
+  return {
+    ...input,
+    missingFields: COMPLEX_WORKFLOW_REQUIRED_FIELDS.filter((field) => !preserved.has(field)),
+  };
+}
+
+function strategyByName(
+  strategies: ComplexWorkflowStrategyResult[],
+  name: ComplexWorkflowStrategyResult["strategy"],
+): ComplexWorkflowStrategyResult {
+  const result = strategies.find((strategy) => strategy.strategy === name);
+  if (!result) throw new Error(`Missing strategy ${name}`);
+  return result;
+}
+
+function sum(
+  tasks: CodeModeBenchmarkTask[],
+  field: keyof Pick<
+    CodeModeBenchmarkTask,
+    | "progressiveRoundTrips"
+    | "codeModeRoundTrips"
+    | "progressiveContextTokens"
+    | "codeModeContextTokens"
+  >,
+): number {
+  return tasks.reduce((total, task) => total + task[field], 0);
+}
+
+function reduction(before: number, after: number): number {
+  return before === 0 ? 0 : (before - after) / before;
+}
+
+function percent(value: number): string {
+  return `${(value * 100).toFixed(1)}%`;
+}
diff --git a/packages/benchmarks/lib/surface.ts b/packages/benchmarks/lib/surface.ts
index 4794ae7..846cdf3 100644
--- a/packages/benchmarks/lib/surface.ts
+++ b/packages/benchmarks/lib/surface.ts
@@ -129,7 +129,7 @@ export function validateSurfaceBenchmark(result) {
   return failures;
 }
 
-export function renderMarkdownReport(result) {
+export function renderMarkdownReport(result, codeModeMarkdown = "") {
   const directCollisionNames = result.collisions.directDuplicateToolNames
     .map(
       (collision) =>
@@ -146,7 +146,7 @@ This report is generated by \`pnpm --filter @caplets/benchmarks benchmark\` from
 The deterministic benchmark compares two ways of exposing the same three mock MCP servers to a coding agent:
 
 - Direct flat MCP aggregation exposes every downstream tool from the \`${result.source.servers.join("`, `")}\` servers in the initial \`tools/list\` payload.
-- Caplets progressive disclosure exposes one top-level capability tool per server, then keeps downstream tools behind scoped \`inspect\`, \`list_tools\` or \`search_tools\`, \`get_tool\`, and \`call_tool\` operations.
+- Caplets progressive disclosure exposes one top-level capability tool per server, then keeps downstream tools behind scoped \`inspect\`, \`tools\` or \`search_tools\`, \`describe_tool\`, and \`call_tool\` operations.
 
 The fixture uses local mock MCP metadata only. It does not call external APIs, depend on network access, or require model credentials. Approximate token counts use \`Math.ceil(bytes / 4)\` as a stable context-size proxy, not provider billing data.
 
@@ -173,7 +173,7 @@ Caplets top-level duplicate tool-name collisions: ${result.collisions.capletsTop
 
 Direct flat MCP exposes all downstream tools immediately, so expected discovery calls are ${result.discovery.directExpectedDiscoveryCalls} but the initial candidate set is ${result.direct.toolCount} tools.
 
-Caplets starts from ${result.caplets.toolCount} capability tools. Expected task-specific discovery is ${result.discovery.capletsExpectedDiscoveryCalls.total} calls: \`inspect\`, \`list_tools\` or \`search_tools\`, \`get_tool\`, then \`call_tool\`.
+Caplets starts from ${result.caplets.toolCount} capability tools. Expected task-specific discovery is ${result.discovery.capletsExpectedDiscoveryCalls.total} calls: \`inspect\`, \`tools\` or \`search_tools\`, \`describe_tool\`, then \`call_tool\`.
 
 ## Validation
 
@@ -182,6 +182,8 @@ Caplets starts from ${result.caplets.toolCount} capability tools. Expected task-
 
 Payload implementation: \`${result.source.capletsPayloadImplementation}\`
 
+${codeModeMarkdown}
+
 ## Reproduce
 
 Run the deterministic benchmark and update this report:
diff --git a/packages/benchmarks/run-deterministic.ts b/packages/benchmarks/run-deterministic.ts
index e3857a5..f5e870b 100644
--- a/packages/benchmarks/run-deterministic.ts
+++ b/packages/benchmarks/run-deterministic.ts
@@ -7,6 +7,15 @@ import {
   renderMarkdownReport,
   validateSurfaceBenchmark,
 } from "./lib/surface";
+import {
+  computeCodeModeBenchmark,
+  computeCodeModeComplexWorkflowEval,
+  computeCodeModeLiveRegressionEval,
+  renderCodeModeMarkdownReport,
+  validateCodeModeBenchmark,
+  validateCodeModeComplexWorkflowEval,
+  validateCodeModeLiveRegressionEval,
+} from "./lib/code-mode";
 
 const __dirname = dirname(fileURLToPath(import.meta.url));
 const reportPath = resolve(__dirname, "../../docs/benchmarks/coding-agent.md");
@@ -14,7 +23,15 @@ const reportPath = resolve(__dirname, "../../docs/benchmarks/coding-agent.md");
 const checkMode = process.argv.includes("--check");
 
 const result = await computeSurfaceBenchmark();
-const failures = validateSurfaceBenchmark(result);
+const codeModeResult = computeCodeModeBenchmark();
+const complexWorkflowResult = computeCodeModeComplexWorkflowEval();
+const liveRegressionResult = computeCodeModeLiveRegressionEval();
+const failures = [
+  ...validateSurfaceBenchmark(result),
+  ...validateCodeModeBenchmark(codeModeResult),
+  ...validateCodeModeComplexWorkflowEval(complexWorkflowResult),
+  ...validateCodeModeLiveRegressionEval(liveRegressionResult),
+];
 if (failures.length > 0) {
   for (const failure of failures) {
     console.error(failure);
@@ -22,7 +39,7 @@ if (failures.length > 0) {
   process.exit(1);
 }
 
-const markdown = renderMarkdownReport(result);
+const markdown = renderMarkdownReport(result, renderCodeModeMarkdownReport());
 
 if (checkMode) {
   let current;
diff --git a/packages/benchmarks/test/benchmark.test.ts b/packages/benchmarks/test/benchmark.test.ts
index 636b53e..433036f 100644
--- a/packages/benchmarks/test/benchmark.test.ts
+++ b/packages/benchmarks/test/benchmark.test.ts
@@ -25,6 +25,11 @@ import {
   computeSurfaceBenchmark,
   validateSurfaceBenchmark,
 } from "../lib/surface";
+import {
+  CODE_MODE_BENCHMARK_THRESHOLDS,
+  computeCodeModeBenchmark,
+  validateCodeModeBenchmark,
+} from "../lib/code-mode";
 
 const packageRoot = resolve(fileURLToPath(new URL("..", import.meta.url)));
 const repoRoot = resolve(fileURLToPath(new URL("../../..", import.meta.url)));
@@ -64,6 +69,27 @@ describe("progressive disclosure benchmark fixture", () => {
     expect(result.runtime.compactReduction).toBeGreaterThan(0.5);
   });
 
+  it("covers Code Mode V1 round-trip and token-efficiency evaluation categories", () => {
+    const result = computeCodeModeBenchmark();
+
+    expect(validateCodeModeBenchmark(result)).toEqual([]);
+    expect(result.tasks).toHaveLength(CODE_MODE_BENCHMARK_THRESHOLDS.minTaskCount);
+    expect(new Set(result.tasks.map((task) => task.category))).toEqual(
+      new Set([
+        "single-caplet",
+        "multi-caplet",
+        "discovery-fallback",
+        "project-binding",
+        "hosted-sandbox",
+        "validation-recovery",
+      ]),
+    );
+    expect(result.totals.roundTripReduction).toBeGreaterThanOrEqual(
+      CODE_MODE_BENCHMARK_THRESHOLDS.minRoundTripReduction,
+    );
+    expect(result.totals.contextTokenReduction).toBeGreaterThanOrEqual(0);
+  });
+
   it("captures process output, safe env metadata, JSONL events, and truncation state", async () => {
     const result = await runProcess({
       command: process.execPath,
diff --git a/packages/benchmarks/test/code-mode-complex-workflow.test.ts b/packages/benchmarks/test/code-mode-complex-workflow.test.ts
new file mode 100644
index 0000000..ab11861
--- /dev/null
+++ b/packages/benchmarks/test/code-mode-complex-workflow.test.ts
@@ -0,0 +1,46 @@
+import { describe, expect, it } from "vitest";
+import {
+  CODE_MODE_COMPLEX_WORKFLOW_THRESHOLDS,
+  computeCodeModeComplexWorkflowEval,
+  computeCodeModeLiveRegressionEval,
+  validateCodeModeComplexWorkflowEval,
+  validateCodeModeLiveRegressionEval,
+} from "../lib/code-mode";
+
+describe("Code Mode complex workflow eval", () => {
+  it("captures the real-world triage workflow regression deterministically", () => {
+    const result = computeCodeModeComplexWorkflowEval();
+    const codeMode = result.strategies.find((strategy) => strategy.strategy === "code-mode")!;
+    const progressive = result.strategies.find(
+      (strategy) => strategy.strategy === "progressive-disclosure",
+    )!;
+    const vanilla = result.strategies.find((strategy) => strategy.strategy === "vanilla-mcp")!;
+
+    expect(validateCodeModeComplexWorkflowEval(result)).toEqual([]);
+    expect(codeMode.codeModeRunCalls).toBe(1);
+    expect(codeMode.llmRoundTrips).toBe(1);
+    expect(codeMode.internalCapletCalls).toBeGreaterThan(1);
+    expect(codeMode.externalToolCalls).toBeLessThan(progressive.externalToolCalls);
+    expect(codeMode.approxPayloadTokens).toBeLessThan(progressive.approxPayloadTokens);
+    expect(codeMode.missingFields).toEqual([]);
+    expect(codeMode.rawPayloadLeaked).toBe(false);
+    expect(vanilla.missingFields).toEqual(["url", "labels", "created_at"]);
+    expect(result.reductions.codeModeVsProgressiveExternalCalls).toBeGreaterThanOrEqual(
+      CODE_MODE_COMPLEX_WORKFLOW_THRESHOLDS.minExternalCallReduction,
+    );
+  });
+
+  it("tracks live cold-agent regressions from OSV and GitHub evals", () => {
+    const result = computeCodeModeLiveRegressionEval();
+
+    expect(validateCodeModeLiveRegressionEval(result)).toEqual([]);
+    expect(result.scenarios.map((scenario) => scenario.id)).toEqual([
+      "github-issues-and-prs-adjacent-entities",
+      "osv-package-version-tool-selection",
+    ]);
+    expect(result.improvements).toContain("code-mode-one-run-guidance");
+    expect(result.improvements).toContain("optional-use-avoid-hints");
+    expect(result.improvements).toContain("schema-error-call-signatures");
+    expect(result.improvements).toContain("transport-body-normalization");
+  });
+});
diff --git a/packages/cli/rolldown.config.ts b/packages/cli/rolldown.config.ts
index 4b09d08..635e083 100644
--- a/packages/cli/rolldown.config.ts
+++ b/packages/cli/rolldown.config.ts
@@ -7,6 +7,7 @@ export default defineConfig({
     format: "esm",
     banner: "#!/usr/bin/env node",
   },
+  external: ["@caplets/core"],
   platform: "node",
   tsconfig: true,
 });
diff --git a/packages/core/.caplets/.gitignore b/packages/core/.caplets/.gitignore
new file mode 100644
index 0000000..d6b7ef3
--- /dev/null
+++ b/packages/core/.caplets/.gitignore
@@ -0,0 +1,2 @@
+*
+!.gitignore
diff --git a/packages/core/package.json b/packages/core/package.json
index 1ea1dd7..0650027 100644
--- a/packages/core/package.json
+++ b/packages/core/package.json
@@ -47,6 +47,14 @@
       "types": "./dist/caplet-source/filesystem.d.ts",
       "default": "./dist/caplet-source/filesystem.js"
     },
+    "./code-mode": {
+      "types": "./dist/code-mode/index.d.ts",
+      "default": "./dist/code-mode.js"
+    },
+    "./observed-output-shapes": {
+      "types": "./dist/observed-output-shapes/index.d.ts",
+      "default": "./dist/observed-output-shapes.js"
+    },
     "./runtime-plan": {
       "types": "./dist/runtime-plan/index.d.ts",
       "default": "./dist/runtime-plan.js"
@@ -72,9 +80,12 @@
     "@hono/mcp": "^0.3.0",
     "@hono/node-server": "^2.0.4",
     "@modelcontextprotocol/sdk": "^1.29.0",
+    "ajv": "^8.20.0",
     "commander": "^15.0.0",
     "graphql": "^16.14.1",
     "hono": "^4.12.23",
+    "quickjs-emscripten": "^0.32.0",
+    "typescript": "^6.0.3",
     "vfile": "^6.0.3",
     "vfile-matter": "^5.0.1",
     "yaml": "^2.9.0",
@@ -84,7 +95,6 @@
     "@types/node": "^25.9.1",
     "@typescript/native-preview": "7.0.0-dev.20260603.1",
     "rolldown": "^1.0.3",
-    "typescript": "^6.0.3",
     "vitest": "^4.1.8"
   },
   "engines": {
diff --git a/packages/core/rolldown.config.ts b/packages/core/rolldown.config.ts
index 9ed8b39..35e9e8e 100644
--- a/packages/core/rolldown.config.ts
+++ b/packages/core/rolldown.config.ts
@@ -8,16 +8,19 @@ export default defineConfig([
       "config-runtime": "src/config-runtime.ts",
       "generated-tool-input-schema": "src/generated-tool-input-schema.ts",
       native: "src/native.ts",
+      "observed-output-shapes": "src/observed-output-shapes/index.ts",
     },
     output: {
       dir: "./dist",
       format: "esm",
     },
+    external: ["quickjs-emscripten", "typescript"],
     platform: "node",
   },
   {
     input: {
       "caplet-source": "src/caplet-source/index.ts",
+      "code-mode": "src/code-mode/index.ts",
       "runtime-plan": "src/runtime-plan/index.ts",
     },
     output: {
diff --git a/packages/core/src/capability-description.ts b/packages/core/src/capability-description.ts
index c888d93..99f89c2 100644
--- a/packages/core/src/capability-description.ts
+++ b/packages/core/src/capability-description.ts
@@ -4,9 +4,11 @@ export function capabilityDescription(server: CapletConfig): string {
   return [
     `${server.name} Caplet.`,
     server.description,
+    server.useWhen ? `Use when: ${server.useWhen}` : undefined,
+    server.avoidWhen ? `Avoid when: ${server.avoidWhen}` : undefined,
     server.backend === "mcp"
-      ? "Use inspect for details when needed; use tools for actions, resources for readable context, prompts for reusable workflows, and complete for prompt/resource-template arguments."
-      : "Use inspect for details when needed; use search_tools or list_tools to discover downstream operations.",
+      ? "Use inspect for details when needed; use tools/search_tools for downstream names; use describe_tool before call_tool when args matter; call_tool.args must match inputSchema exactly; do not guess tool names or schemas. For triage, list recent/open items once before targeted searches. Resources/prompts/completions may exist for MCP backends."
+      : "Use inspect for details when needed; use tools/search_tools to discover downstream operations; use describe_tool before call_tool when args matter; call_tool.args must match inputSchema exactly; do not guess tool names or schemas. For triage, list recent/open items once before targeted searches.",
   ]
     .filter(Boolean)
     .join(" ");
diff --git a/packages/core/src/caplet-files-bundle.ts b/packages/core/src/caplet-files-bundle.ts
index a07988a..d872d1a 100644
--- a/packages/core/src/caplet-files-bundle.ts
+++ b/packages/core/src/caplet-files-bundle.ts
@@ -108,6 +108,22 @@ const capletRuntimeRequirementsSchema = z
   .strict()
   .describe("Runtime feature and resource requirements for hosted execution.");
 
+const capletAgentSelectionHintSchema = z
+  .string()
+  .trim()
+  .min(1)
+  .max(500)
+  .describe("Optional author-supplied hint for agent tool/caplet selection.");
+
+const capletAgentSelectionHintsSchema = {
+  useWhen: capletAgentSelectionHintSchema
+    .optional()
+    .describe("When agents should prefer this Caplet or configured action."),
+  avoidWhen: capletAgentSelectionHintSchema
+    .optional()
+    .describe("When agents should avoid this Caplet or configured action."),
+};
+
 const capletEndpointAuthSchema = z
   .discriminatedUnion("type", [
     z.object({ type: z.literal("none") }).strict(),
@@ -324,6 +340,7 @@ const capletGraphQlOperationSchema = z
     documentPath: z.string().min(1).optional().describe("Path to a GraphQL operation document."),
     operationName: z.string().min(1).optional().describe("Operation name to execute."),
     description: z.string().min(1).optional().describe("Operation capability description."),
+    ...capletAgentSelectionHintsSchema,
   })
   .strict()
   .superRefine((operation, ctx) => {
@@ -433,6 +450,7 @@ const capletHttpActionSchema = z
       .refine((value) => !value.startsWith("//"), "HTTP action path must not start with //")
       .refine((value) => !isUrl(value), "HTTP action path must be a URL path, not a URL"),
     description: z.string().min(1).optional().describe("Action capability description."),
+    ...capletAgentSelectionHintsSchema,
     inputSchema: z
       .record(z.string(), z.unknown())
       .optional()
@@ -524,6 +542,7 @@ const capletCliToolAnnotationsSchema = z
 const capletCliToolActionSchema = z
   .object({
     description: z.string().min(1).optional().describe("Action capability description."),
+    ...capletAgentSelectionHintsSchema,
     inputSchema: z
       .record(z.string(), z.unknown())
       .optional()
@@ -614,6 +633,7 @@ export const capletFileSchema = z
       .array(z.string().trim().min(1).max(80))
       .optional()
       .describe("Optional tags for grouping or searching Caplets."),
+    ...capletAgentSelectionHintsSchema,
     setup: capletSetupSchema.optional(),
     projectBinding: capletProjectBindingSchema.optional(),
     runtime: capletRuntimeRequirementsSchema.optional(),
@@ -956,6 +976,8 @@ function capletToServerConfig(
 function sharedCapletFields(frontmatter: CapletFileFrontmatter): Record<string, unknown> {
   return {
     ...(frontmatter.tags ? { tags: frontmatter.tags } : {}),
+    ...(frontmatter.useWhen ? { useWhen: frontmatter.useWhen } : {}),
+    ...(frontmatter.avoidWhen ? { avoidWhen: frontmatter.avoidWhen } : {}),
     ...(frontmatter.setup ? { setup: frontmatter.setup } : {}),
     ...(frontmatter.projectBinding ? { projectBinding: frontmatter.projectBinding } : {}),
     ...(frontmatter.runtime ? { runtime: frontmatter.runtime } : {}),
diff --git a/packages/core/src/caplet-sets.ts b/packages/core/src/caplet-sets.ts
index 04151f3..1b64c4c 100644
--- a/packages/core/src/caplet-sets.ts
+++ b/packages/core/src/caplet-sets.ts
@@ -2,7 +2,13 @@ import type { CompatibilityCallToolResult, Tool } from "@modelcontextprotocol/sd
 import { resolve } from "node:path";
 import { CliToolsManager } from "./cli-tools";
 import { type CapletConfig, type CapletSetConfig, loadIsolatedConfig } from "./config";
-import { DownstreamManager, type CompactTool } from "./downstream";
+import {
+  compactToolSafetyHints,
+  compactToolSchemaHints,
+  compactToolSelectionHints,
+  DownstreamManager,
+  type CompactTool,
+} from "./downstream";
 import { CapletsError, errorResult, toSafeError } from "./errors";
 import { GraphQLManager } from "./graphql";
 import { HttpActionManager } from "./http-actions";
@@ -146,11 +152,14 @@ export class CapletSetManager {
 
   compact(config: CapletSetConfig, tool: Tool): CompactTool {
     return {
-      id: config.server,
-      tool: tool.name,
+      name: tool.name,
       ...(tool.description ? { description: tool.description } : {}),
       hasInputSchema: Boolean(tool.inputSchema),
       hasOutputSchema: Boolean(tool.outputSchema),
+      supportsFields: Boolean(tool.outputSchema),
+      ...compactToolSelectionHints(tool),
+      ...compactToolSchemaHints(tool),
+      ...compactToolSafetyHints(tool),
     };
   }
 
diff --git a/packages/core/src/cli-tools.ts b/packages/core/src/cli-tools.ts
index 2107675..a228973 100644
--- a/packages/core/src/cli-tools.ts
+++ b/packages/core/src/cli-tools.ts
@@ -3,7 +3,12 @@ import { delimiter, isAbsolute, join } from "node:path";
 import { spawn } from "node:child_process";
 import type { CompatibilityCallToolResult, Tool } from "@modelcontextprotocol/sdk/types";
 import type { CliToolActionConfig, CliToolsConfig } from "./config";
-import type { CompactTool } from "./downstream";
+import {
+  compactToolSafetyHints,
+  compactToolSchemaHints,
+  compactToolSelectionHints,
+  type CompactTool,
+} from "./downstream";
 import { CapletsError, toSafeError } from "./errors";
 import type { ServerRegistry } from "./registry";
 import { markdownStructuredContent } from "./result-content";
@@ -119,11 +124,14 @@ export class CliToolsManager {
 
   compact(config: CliToolsConfig, tool: Tool): CompactTool {
     return {
-      id: config.server,
-      tool: tool.name,
+      name: tool.name,
       ...(tool.description ? { description: tool.description } : {}),
       hasInputSchema: Boolean(tool.inputSchema),
       hasOutputSchema: Boolean(tool.outputSchema),
+      supportsFields: Boolean(tool.outputSchema),
+      ...compactToolSelectionHints(tool),
+      ...compactToolSchemaHints(tool),
+      ...compactToolSafetyHints(tool),
     };
   }
 
@@ -135,6 +143,8 @@ export class CliToolsManager {
     return {
       name: action.name,
       ...(action.description ? { description: action.description } : {}),
+      ...(action.useWhen ? { useWhen: action.useWhen } : {}),
+      ...(action.avoidWhen ? { avoidWhen: action.avoidWhen } : {}),
       inputSchema: (action.inputSchema ?? DEFAULT_INPUT_SCHEMA) as Tool["inputSchema"],
       ...(action.outputSchema ? { outputSchema: action.outputSchema as Tool["outputSchema"] } : {}),
       ...(action.annotations ? { annotations: action.annotations as Tool["annotations"] } : {}),
diff --git a/packages/core/src/cli.ts b/packages/core/src/cli.ts
index 9aa0528..9d8ee19 100644
--- a/packages/core/src/cli.ts
+++ b/packages/core/src/cli.ts
@@ -8,6 +8,7 @@ import {
   addMcpCaplet,
   addOpenApiCaplet,
 } from "./cli/add";
+import { buildCloudCapletBundle } from "./cli/cloud-add";
 import {
   loginAuth,
   logoutAuth,
@@ -19,6 +20,7 @@ import {
   type AuthStatusRow,
 } from "./cli/auth";
 import { cliCommands } from "./cli/commands";
+import { codeModeTypesCli, runCodeModeCli } from "./cli/code-mode";
 import { initConfig } from "./cli/init";
 import { doctorJsonReport, formatDoctorReport } from "./cli/doctor";
 import {
@@ -107,6 +109,7 @@ type CliIO = {
   attachServe?: (options: AttachServeOptions) => Promise<void>;
   daemon?: ServeDaemonOperationOptions;
   runSetupCommand?: SetupCommandRunner;
+  readStdin?: () => Promise<string>;
 };
 
 export async function runCli(args: string[], io: CliIO = {}): Promise<void> {
@@ -184,6 +187,17 @@ function cloudAuthStatus(credentials: CloudAuthCredentials | undefined): Record<
   return redactedCloudAuthStatus(credentials);
 }
 
+function compactCloudCaplet(value: unknown): Record<string, unknown> {
+  if (!value || typeof value !== "object" || Array.isArray(value)) return {};
+  const record = value as Record<string, unknown>;
+  return {
+    ...(typeof record.id === "string" ? { id: record.id } : {}),
+    ...(typeof record.name === "string" ? { name: record.name } : {}),
+    ...(typeof record.description === "string" ? { description: record.description } : {}),
+    ...(typeof record.readinessState === "string" ? { readinessState: record.readinessState } : {}),
+  };
+}
+
 function isProjectBindingWebSocketUnavailable(error: unknown): boolean {
   return (
     error instanceof CapletsError &&
@@ -328,6 +342,52 @@ export function createProgram(io: CliIO = {}): Command {
       if (suggestions.length > 0) writeOut(`${suggestions.join("\n")}\n`);
     });
 
+  program
+    .command(cliCommands.run)
+    .description("Run TypeScript Code Mode locally with the generated Caplets API.")
+    .argument("[code]", "inline TypeScript code to run")
+    .option("--file <path>", "read TypeScript code from a file relative to the current directory")
+    .option("--timeout-ms <ms>", "execution timeout in milliseconds", parsePositiveInteger)
+    .option("--json", "print the structured run envelope")
+    .action(
+      async (
+        code: string | undefined,
+        options: { file?: string; timeoutMs?: number; json?: boolean },
+      ) => {
+        await runCodeModeCli({
+          env,
+          ...(currentConfigPath() ? { configPath: currentConfigPath() } : {}),
+          projectConfigPath: envProjectConfigPath(env),
+          ...(io.authDir ? { authDir: io.authDir } : {}),
+          ...(code === undefined ? {} : { inlineCode: code }),
+          ...(options.file === undefined ? {} : { file: options.file }),
+          ...(options.timeoutMs === undefined ? {} : { timeoutMs: options.timeoutMs }),
+          ...(options.json === undefined ? {} : { json: options.json }),
+          ...(io.readStdin ? { readStdin: io.readStdin } : {}),
+          writeOut,
+          setExitCode,
+        });
+      },
+    );
+
+  const codeMode = program
+    .command(cliCommands.codeMode)
+    .description("Inspect and debug Caplets Code Mode.");
+  codeMode
+    .command("types")
+    .description("Print the generated Code Mode TypeScript declarations.")
+    .option("--json", "print declaration metadata as JSON")
+    .action(async (options: { json?: boolean }) => {
+      await codeModeTypesCli({
+        env,
+        ...(currentConfigPath() ? { configPath: currentConfigPath() } : {}),
+        projectConfigPath: envProjectConfigPath(env),
+        ...(io.authDir ? { authDir: io.authDir } : {}),
+        ...(options.json === undefined ? {} : { json: options.json }),
+        writeOut,
+      });
+    });
+
   const serve = program
     .command(cliCommands.serve)
     .description("Serve configured Caplets as an MCP server.")
@@ -753,6 +813,44 @@ export function createProgram(io: CliIO = {}): Command {
       writeOut(`Selected workspace ${next.workspaceSlug ?? next.workspaceId}.\n`);
     });
 
+  cloud
+    .command("add")
+    .description("Upload local caplet-files to the selected hosted Caplets Cloud workspace.")
+    .argument("[path]", "directory containing caplet-files", ".")
+    .option("--cloud-url <url>", "hosted Caplets Cloud URL")
+    .option("--workspace <workspace>", "workspace ID or slug")
+    .option("--json", "print JSON output")
+    .action(
+      async (
+        pathInput: string,
+        options: { cloudUrl?: string; workspace?: string; json?: boolean },
+      ) => {
+        const credentials = await cloudAuthStore(env).load();
+        if (!credentials) {
+          throw new CapletsError("AUTH_REQUIRED", "Run caplets cloud auth login first.");
+        }
+        const cloudUrl = options.cloudUrl ?? credentials.cloudUrl;
+        const workspace = options.workspace ?? credentials.workspaceSlug ?? credentials.workspaceId;
+        const bundle = buildCloudCapletBundle(pathInput);
+        const result = await new CloudAuthClient({
+          cloudUrl,
+          ...(io.fetch ? { fetch: io.fetch } : {}),
+        }).addCaplets({
+          accessToken: credentials.accessToken,
+          workspace,
+          bundle,
+        });
+        const caplets = result.caplets.map(compactCloudCaplet);
+        if (options.json) {
+          writeOut(`${JSON.stringify({ caplets, workspace }, null, 2)}\n`);
+          return;
+        }
+        for (const caplet of caplets) {
+          writeOut(`Added ${caplet.name ?? caplet.id ?? "Caplet"} to ${workspace}.\n`);
+        }
+      },
+    );
+
   program
     .command(cliCommands.init)
     .description("Create a starter Caplets config file.")
@@ -1151,7 +1249,7 @@ export function createProgram(io: CliIO = {}): Command {
     .action(async (caplet: string, options: { format?: CliOutputFormat }) => {
       await executeOperation(
         caplet,
-        { operation: "check_backend" },
+        { operation: "check" },
         {
           writeOut,
           writeErr,
@@ -1172,7 +1270,7 @@ export function createProgram(io: CliIO = {}): Command {
     .action(async (caplet: string, options: { format?: CliOutputFormat }) => {
       await executeOperation(
         caplet,
-        { operation: "list_tools" },
+        { operation: "tools" },
         {
           writeOut,
           writeErr,
@@ -1231,7 +1329,7 @@ export function createProgram(io: CliIO = {}): Command {
         const { caplet, tool } = parseQualifiedTarget(capletOrTarget, toolArgument);
         await executeOperation(
           caplet,
-          { operation: "get_tool", tool },
+          { operation: "describe_tool", name: tool },
           {
             writeOut,
             writeErr,
@@ -1262,8 +1360,8 @@ export function createProgram(io: CliIO = {}): Command {
         const { caplet, tool } = parseQualifiedTarget(capletOrTarget, toolArgument);
         const request = {
           operation: "call_tool",
-          tool,
-          arguments: parseCallToolArgs(options.args),
+          name: tool,
+          args: parseCallToolArgs(options.args),
           ...(options.field && options.field.length > 0 ? { fields: options.field } : {}),
         };
         await executeOperation(caplet, request, {
@@ -1288,8 +1386,8 @@ export function createProgram(io: CliIO = {}): Command {
       executeOperation(
         caplet,
         options.limit === undefined
-          ? { operation: "list_resources" }
-          : { operation: "list_resources", limit: options.limit },
+          ? { operation: "resources" }
+          : { operation: "resources", limit: options.limit },
         {
           writeOut,
           writeErr,
@@ -1340,8 +1438,8 @@ export function createProgram(io: CliIO = {}): Command {
       executeOperation(
         caplet,
         options.limit === undefined
-          ? { operation: "list_resource_templates" }
-          : { operation: "list_resource_templates", limit: options.limit },
+          ? { operation: "resource_templates" }
+          : { operation: "resource_templates", limit: options.limit },
         {
           writeOut,
           writeErr,
@@ -1384,8 +1482,8 @@ export function createProgram(io: CliIO = {}): Command {
       executeOperation(
         caplet,
         options.limit === undefined
-          ? { operation: "list_prompts" }
-          : { operation: "list_prompts", limit: options.limit },
+          ? { operation: "prompts" }
+          : { operation: "prompts", limit: options.limit },
         {
           writeOut,
           writeErr,
@@ -1444,8 +1542,8 @@ export function createProgram(io: CliIO = {}): Command {
           caplet,
           {
             operation: "get_prompt",
-            prompt,
-            arguments: parseJsonObjectOption(options.args, "get-prompt --args"),
+            name: prompt,
+            args: parseJsonObjectOption(options.args, "get-prompt --args"),
           },
           {
             writeOut,
@@ -1655,16 +1753,16 @@ async function openBrowser(url: string): Promise<void> {
 function remoteCommandForOperation(operation: unknown): RemoteCliCommand | undefined {
   switch (operation) {
     case "inspect":
-    case "check_backend":
-    case "list_tools":
+    case "check":
+    case "tools":
     case "search_tools":
-    case "get_tool":
+    case "describe_tool":
     case "call_tool":
-    case "list_resources":
+    case "resources":
     case "search_resources":
-    case "list_resource_templates":
+    case "resource_templates":
     case "read_resource":
-    case "list_prompts":
+    case "prompts":
     case "search_prompts":
     case "get_prompt":
     case "complete":
@@ -2342,7 +2440,7 @@ function markdownSummaryForOperation(result: unknown, request: Record<string, un
       ]
         .filter((line): line is string => line !== undefined)
         .join("\n");
-    case "check_backend":
+    case "check":
       return [
         `## Backend \`${id}\``,
         "",
@@ -2355,8 +2453,8 @@ function markdownSummaryForOperation(result: unknown, request: Record<string, un
       ]
         .filter((line): line is string => line !== undefined)
         .join("\n");
-    case "list_tools": {
-      const tools = Array.isArray(payload.tools) ? payload.tools : [];
+    case "tools": {
+      const tools = pageItemsFromPayload(payload);
       return [
         `## Tools for \`${id}\``,
         "",
@@ -2371,7 +2469,7 @@ function markdownSummaryForOperation(result: unknown, request: Record<string, un
       ].join("\n");
     }
     case "search_tools": {
-      const tools = Array.isArray(payload.tools) ? payload.tools : [];
+      const tools = pageItemsFromPayload(payload);
       return [
         `## Matches for ${JSON.stringify(String(payload.query ?? ""))} in \`${id}\``,
         "",
@@ -2385,7 +2483,7 @@ function markdownSummaryForOperation(result: unknown, request: Record<string, un
           : `- Try a broader query or list tools: \`caplets list-tools ${id}\``,
       ].join("\n");
     }
-    case "get_tool": {
+    case "describe_tool": {
       const tool = isPlainObject(payload.tool) ? payload.tool : {};
       const target = `${id}.${String(tool.name ?? "<tool>")}`;
       return [
@@ -2407,7 +2505,7 @@ function markdownSummaryForOperation(result: unknown, request: Record<string, un
         .join("\n");
     }
     case "call_tool": {
-      const callTarget = `${String(request.caplet ?? "<caplet>")}.${String(request.tool ?? "unknown")}`;
+      const callTarget = `${String(request.caplet ?? "<caplet>")}.${String(request.name ?? "unknown")}`;
       return [
         `## Call \`${callTarget}\``,
         "",
@@ -2420,13 +2518,9 @@ function markdownSummaryForOperation(result: unknown, request: Record<string, un
         .filter((line): line is string => line !== undefined)
         .join("\n");
     }
-    case "list_resources":
+    case "resources":
     case "search_resources": {
-      const resources = Array.isArray(payload.resources) ? payload.resources : [];
-      const templates = Array.isArray(payload.resourceTemplates) ? payload.resourceTemplates : [];
-      const matches = Array.isArray(payload.matches)
-        ? payload.matches
-        : [...resources, ...templates];
+      const matches = pageItemsFromPayload(payload);
       return [
         `## MCP resources for \`${id}\``,
         "",
@@ -2435,8 +2529,8 @@ function markdownSummaryForOperation(result: unknown, request: Record<string, un
         ...formatResourceLines(matches, "markdown"),
       ].join("\n");
     }
-    case "list_resource_templates": {
-      const templates = Array.isArray(payload.resourceTemplates) ? payload.resourceTemplates : [];
+    case "resource_templates": {
+      const templates = pageItemsFromPayload(payload);
       return [
         `## MCP resource templates for \`${id}\``,
         "",
@@ -2451,16 +2545,16 @@ function markdownSummaryForOperation(result: unknown, request: Record<string, un
         "",
         "Use `--format json` to inspect all contents.",
       ].join("\n");
-    case "list_prompts":
+    case "prompts":
     case "search_prompts": {
-      const prompts = Array.isArray(payload.prompts) ? payload.prompts : [];
+      const prompts = pageItemsFromPayload(payload);
       return [`## MCP prompts for \`${id}\``, "", ...formatPromptLines(prompts, "markdown")].join(
         "\n",
       );
     }
     case "get_prompt":
       return [
-        `## Prompt \`${String(request.caplet)}.${String(request.prompt)}\``,
+        `## Prompt \`${String(request.caplet)}.${String(request.name)}\``,
         "",
         summarizePromptResult(payload),
         "",
@@ -2491,7 +2585,7 @@ function plainSummaryForOperation(result: unknown, request: Record<string, unkno
       ]
         .filter((line): line is string => Boolean(line))
         .join("\n");
-    case "check_backend":
+    case "check":
       return [
         `Backend: ${id} is ${String(payload.status ?? "unknown")}`,
         typeof payload.toolCount === "number" ? `Tools: ${payload.toolCount}` : undefined,
@@ -2500,8 +2594,8 @@ function plainSummaryForOperation(result: unknown, request: Record<string, unkno
       ]
         .filter((line): line is string => Boolean(line))
         .join("\n");
-    case "list_tools": {
-      const tools = Array.isArray(payload.tools) ? payload.tools : [];
+    case "tools": {
+      const tools = pageItemsFromPayload(payload);
       return [
         `Tools for ${id} (${tools.length}):`,
         ...formatToolLines(tools, "plain"),
@@ -2509,7 +2603,7 @@ function plainSummaryForOperation(result: unknown, request: Record<string, unkno
       ].join("\n");
     }
     case "search_tools": {
-      const tools = Array.isArray(payload.tools) ? payload.tools : [];
+      const tools = pageItemsFromPayload(payload);
       return [
         `Matches for ${JSON.stringify(String(payload.query ?? ""))} in ${id} (${tools.length}):`,
         ...formatToolLines(tools, "plain"),
@@ -2518,7 +2612,7 @@ function plainSummaryForOperation(result: unknown, request: Record<string, unkno
           : `Next: try caplets list-tools ${id} or a broader query.`,
       ].join("\n");
     }
-    case "get_tool": {
+    case "describe_tool": {
       const tool = isPlainObject(payload.tool) ? payload.tool : {};
       const target = `${id}.${String(tool.name ?? "<tool>")}`;
       return [
@@ -2535,7 +2629,7 @@ function plainSummaryForOperation(result: unknown, request: Record<string, unkno
         .join("\n");
     }
     case "call_tool": {
-      const callTarget = `${String(request.caplet ?? "<caplet>")}.${String(request.tool ?? "unknown")}`;
+      const callTarget = `${String(request.caplet ?? "<caplet>")}.${String(request.name ?? "unknown")}`;
       return [
         `Call ${callTarget} ${payload.isError === true ? "failed" : "succeeded"}.`,
         callStatusLine(payload),
@@ -2545,20 +2639,16 @@ function plainSummaryForOperation(result: unknown, request: Record<string, unkno
         .filter((line): line is string => Boolean(line))
         .join("\n");
     }
-    case "list_resources":
+    case "resources":
     case "search_resources": {
-      const resources = Array.isArray(payload.resources) ? payload.resources : [];
-      const templates = Array.isArray(payload.resourceTemplates) ? payload.resourceTemplates : [];
-      const matches = Array.isArray(payload.matches)
-        ? payload.matches
-        : [...resources, ...templates];
+      const matches = pageItemsFromPayload(payload);
       return [
         `MCP resources for ${id} (${matches.length}):`,
         ...formatResourceLines(matches, "plain"),
       ].join("\n");
     }
-    case "list_resource_templates": {
-      const templates = Array.isArray(payload.resourceTemplates) ? payload.resourceTemplates : [];
+    case "resource_templates": {
+      const templates = pageItemsFromPayload(payload);
       return [`MCP resource templates for ${id}:`, ...formatResourceLines(templates, "plain")].join(
         "\n",
       );
@@ -2569,14 +2659,14 @@ function plainSummaryForOperation(result: unknown, request: Record<string, unkno
         summarizeResourceRead(payload),
         "Use --format json to inspect all contents.",
       ].join("\n");
-    case "list_prompts":
+    case "prompts":
     case "search_prompts": {
-      const prompts = Array.isArray(payload.prompts) ? payload.prompts : [];
+      const prompts = pageItemsFromPayload(payload);
       return [`MCP prompts for ${id}:`, ...formatPromptLines(prompts, "plain")].join("\n");
     }
     case "get_prompt":
       return [
-        `Prompt ${String(request.caplet)}.${String(request.prompt)}`,
+        `Prompt ${String(request.caplet)}.${String(request.name)}`,
         summarizePromptResult(payload),
         "Use --format json to inspect all messages.",
       ].join("\n");
@@ -2591,6 +2681,14 @@ function payloadId(payload: Record<string, unknown>): string {
   return String(payload.id ?? payload.caplet ?? payload.server ?? "<caplet>");
 }
 
+function pageItemsFromPayload(payload: Record<string, unknown>): unknown[] {
+  if (Array.isArray(payload.items)) return payload.items;
+  for (const key of ["tools", "resources", "resourceTemplates", "prompts", "matches"] as const) {
+    if (Array.isArray(payload[key])) return payload[key];
+  }
+  return [];
+}
+
 function formatToolLines(tools: unknown[], format: "markdown" | "plain"): string[] {
   if (tools.length === 0) {
     return ["- none"];
diff --git a/packages/core/src/cli/cloud-add.ts b/packages/core/src/cli/cloud-add.ts
new file mode 100644
index 0000000..0bc7953
--- /dev/null
+++ b/packages/core/src/cli/cloud-add.ts
@@ -0,0 +1,64 @@
+import { existsSync, readdirSync, readFileSync, statSync } from "node:fs";
+import { relative, resolve, sep } from "node:path";
+import { CapletsError } from "../errors";
+
+export type CloudCapletBundleFile = {
+  path: string;
+  content: string;
+};
+
+export type CloudCapletBundle = {
+  files: CloudCapletBundleFile[];
+};
+
+const MAX_CLOUD_CAPLET_BUNDLE_BYTES = 2 * 1024 * 1024;
+const SKIPPED_DIRECTORY_NAMES = new Set([".git", "node_modules", "auth"]);
+
+export function buildCloudCapletBundle(rootInput: string): CloudCapletBundle {
+  const root = resolve(rootInput);
+  if (!existsSync(root)) {
+    throw new CapletsError("CONFIG_INVALID", `Caplet path does not exist: ${rootInput}`);
+  }
+  if (!statSync(root).isDirectory()) {
+    throw new CapletsError("CONFIG_INVALID", `Caplet path must be a directory: ${rootInput}`);
+  }
+
+  const files = collectFiles(root)
+    .map((filePath) => ({
+      path: relative(root, filePath).split(sep).join("/"),
+      content: readFileSync(filePath, "utf8"),
+    }))
+    .filter((file) => file.path !== "config.json")
+    .sort((left, right) => left.path.localeCompare(right.path));
+
+  const totalBytes = files.reduce((total, file) => total + Buffer.byteLength(file.content), 0);
+  if (totalBytes > MAX_CLOUD_CAPLET_BUNDLE_BYTES) {
+    throw new CapletsError(
+      "CONFIG_INVALID",
+      `Caplet bundle is too large for Cloud upload (${totalBytes} bytes).`,
+    );
+  }
+  if (!files.some((file) => file.path.endsWith(".md") || file.path.endsWith("/CAPLET.md"))) {
+    throw new CapletsError("CONFIG_INVALID", `No Caplet files found under ${rootInput}`);
+  }
+
+  return { files };
+}
+
+function collectFiles(root: string): string[] {
+  const entries = readdirSync(root, { withFileTypes: true }).sort((left, right) =>
+    left.name.localeCompare(right.name),
+  );
+  const files: string[] = [];
+  for (const entry of entries) {
+    if (entry.isSymbolicLink()) continue;
+    const path = resolve(root, entry.name);
+    if (entry.isDirectory()) {
+      if (SKIPPED_DIRECTORY_NAMES.has(entry.name)) continue;
+      files.push(...collectFiles(path));
+      continue;
+    }
+    if (entry.isFile()) files.push(path);
+  }
+  return files;
+}
diff --git a/packages/core/src/cli/code-mode.ts b/packages/core/src/cli/code-mode.ts
new file mode 100644
index 0000000..cb30673
--- /dev/null
+++ b/packages/core/src/cli/code-mode.ts
@@ -0,0 +1,118 @@
+import { readFileSync } from "node:fs";
+import { resolve } from "node:path";
+import { createNativeCapletsService } from "../native/service";
+import { codeModeDeclarationHash, generateCodeModeDeclarations } from "../code-mode/declarations";
+import { CodeModeLogStore } from "../code-mode/logs";
+import { runCodeMode } from "../code-mode/runner";
+import { listCodeModeCallableCaplets } from "../code-mode/api";
+import type { CodeModeTypesJson } from "../code-mode/types";
+
+export type CodeModeCliOptions = {
+  env?: NodeJS.ProcessEnv | Record<string, string | undefined>;
+  configPath?: string | undefined;
+  projectConfigPath?: string | undefined;
+  authDir?: string | undefined;
+  inlineCode?: string | undefined;
+  file?: string | undefined;
+  timeoutMs?: number | undefined;
+  json?: boolean | undefined;
+  readStdin?: (() => Promise<string>) | undefined;
+  writeOut: (value: string) => void;
+  setExitCode: (code: number) => void;
+};
+
+export async function runCodeModeCli(options: CodeModeCliOptions): Promise<void> {
+  const service = createNativeCapletsService({
+    mode: "local",
+    ...(options.configPath ? { configPath: options.configPath } : {}),
+    ...(options.projectConfigPath ? { projectConfigPath: options.projectConfigPath } : {}),
+    ...(options.authDir ? { authDir: options.authDir } : {}),
+  });
+  try {
+    const code = await readCodeModeCliCode(options);
+    const result = await runCodeMode({
+      code,
+      service,
+      ...(options.timeoutMs === undefined ? {} : { timeoutMs: options.timeoutMs }),
+      logStore: new CodeModeLogStore(),
+      runtimeScope: runtimeScope(options.env),
+    });
+    if (options.json) {
+      options.writeOut(`${JSON.stringify(result, null, 2)}\n`);
+    } else if (result.ok) {
+      options.writeOut(`${formatHumanValue(result.value)}\n`);
+    } else {
+      options.writeOut(`${result.error.code}: ${result.error.message}\n`);
+      if (result.diagnostics.length > 0) {
+        options.writeOut(
+          `${result.diagnostics.map((diagnostic) => `- ${diagnostic.message}`).join("\n")}\n`,
+        );
+      }
+    }
+    if (!result.ok) {
+      options.setExitCode(1);
+    }
+  } finally {
+    await service.close();
+  }
+}
+
+export async function codeModeTypesCli(
+  options: Pick<
+    CodeModeCliOptions,
+    "env" | "configPath" | "projectConfigPath" | "authDir" | "json" | "writeOut"
+  >,
+): Promise<void> {
+  const service = createNativeCapletsService({
+    mode: "local",
+    ...(options.configPath ? { configPath: options.configPath } : {}),
+    ...(options.projectConfigPath ? { projectConfigPath: options.projectConfigPath } : {}),
+    ...(options.authDir ? { authDir: options.authDir } : {}),
+  });
+  try {
+    const caplets = listCodeModeCallableCaplets(service);
+    const declaration = generateCodeModeDeclarations({ caplets });
+    if (!options.json) {
+      options.writeOut(declaration);
+      return;
+    }
+    const output: CodeModeTypesJson = {
+      declaration,
+      declarationHash: codeModeDeclarationHash(declaration),
+      callableCount: caplets.length,
+      generatedAt: new Date().toISOString(),
+      runtimeScope: runtimeScope(options.env),
+    };
+    options.writeOut(`${JSON.stringify(output, null, 2)}\n`);
+  } finally {
+    await service.close();
+  }
+}
+
+export async function readCodeModeCliCode(
+  options: Pick<CodeModeCliOptions, "inlineCode" | "file" | "readStdin">,
+): Promise<string> {
+  if (options.inlineCode !== undefined) {
+    return options.inlineCode;
+  }
+  if (options.file !== undefined) {
+    return readFileSync(resolve(process.cwd(), options.file), "utf8");
+  }
+  return await (options.readStdin ?? readProcessStdin)();
+}
+
+async function readProcessStdin(): Promise<string> {
+  const chunks: Buffer[] = [];
+  for await (const chunk of process.stdin) {
+    chunks.push(Buffer.isBuffer(chunk) ? chunk : Buffer.from(String(chunk)));
+  }
+  return Buffer.concat(chunks).toString("utf8");
+}
+
+function formatHumanValue(value: unknown): string {
+  return typeof value === "string" ? value : JSON.stringify(value, null, 2);
+}
+
+function runtimeScope(env: NodeJS.ProcessEnv | Record<string, string | undefined> = process.env) {
+  return env.CAPLETS_MODE?.trim() || "local";
+}
diff --git a/packages/core/src/cli/commands.ts b/packages/core/src/cli/commands.ts
index 17f96e6..f340bf9 100644
--- a/packages/core/src/cli/commands.ts
+++ b/packages/core/src/cli/commands.ts
@@ -4,6 +4,8 @@ export type CompletionShell = (typeof completionShells)[number];
 export const cliCommands = {
   completion: "completion",
   completeHidden: "__complete",
+  run: "run",
+  codeMode: "code-mode",
   serve: "serve",
   attach: "attach",
   cloud: "cloud",
@@ -33,6 +35,8 @@ export const cliCommands = {
 
 export const topLevelCommandNames = [
   cliCommands.serve,
+  cliCommands.run,
+  cliCommands.codeMode,
   cliCommands.attach,
   cliCommands.cloud,
   cliCommands.init,
@@ -64,6 +68,7 @@ export const cliSubcommands = {
   [cliCommands.add]: ["cli", "mcp", "openapi", "graphql", "http"],
   [cliCommands.auth]: ["login", "logout", "list"],
   [cliCommands.cloud]: ["auth"],
+  [cliCommands.codeMode]: ["types"],
   [cliCommands.completion]: [...completionShells],
   [cliCommands.config]: ["path", "paths"],
   [cliCommands.serve]: ["start", "stop", "status", "restart", "enable", "disable"],
diff --git a/packages/core/src/cli/doctor.ts b/packages/core/src/cli/doctor.ts
index 83f9649..ffb1ebd 100644
--- a/packages/core/src/cli/doctor.ts
+++ b/packages/core/src/cli/doctor.ts
@@ -1,15 +1,27 @@
+import { mkdtempSync, rmSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { createNativeCapletsService } from "../native/service";
 import { findProjectRoot, fingerprintProjectRoot } from "../cloud/project-root";
 import { CloudAuthStore, redactedCloudAuthStatus } from "../cloud-auth/store";
 import { projectBindingWorkspacePaths } from "../project-binding/workspaces";
 import { resolveCapletsRemote } from "../remote/options";
 import { resolveCapletsServer } from "../server/options";
 import type { MutagenProjectSyncDoctorData } from "../project-binding/mutagen";
+import { generateCodeModeDeclarations } from "../code-mode/declarations";
+import { diagnoseCodeModeTypeScript } from "../code-mode/diagnostics";
+import { CodeModeLogStore } from "../code-mode/logs";
+import { runCodeMode } from "../code-mode/runner";
+import { listCodeModeCallableCaplets } from "../code-mode/api";
+import { DEFAULT_OBSERVED_OUTPUT_SHAPE_CACHE_DIR } from "../config/paths";
+import { FileObservedOutputShapeStore } from "../observed-output-shapes";
 
 export type DoctorOptions = {
   env?: NodeJS.ProcessEnv | Record<string, string | undefined>;
   cwd?: string;
   syncStatus?: MutagenProjectSyncDoctorData;
   cloudAuthStore?: CloudAuthStore;
+  observedOutputShapeCacheDir?: string;
 };
 
 export type DoctorJsonReport = {
@@ -19,6 +31,7 @@ export type DoctorJsonReport = {
   sync: Record<string, unknown>;
   daemon: Record<string, unknown>;
   cloudAuth: Record<string, unknown>;
+  codeMode: Record<string, unknown>;
 };
 
 export async function doctorJsonReport(options: DoctorOptions = {}): Promise<DoctorJsonReport> {
@@ -63,6 +76,7 @@ export async function doctorJsonReport(options: DoctorOptions = {}): Promise<Doc
       running: false,
     },
     cloudAuth: redactedCloudAuthStatus(credentials),
+    codeMode: await resolveCodeModeSection(options, env),
   };
 }
 
@@ -109,6 +123,19 @@ export async function formatDoctorReport(options: DoctorOptions = {}): Promise<s
     ...(report.cloudAuth.workspaceSlug || report.cloudAuth.workspaceId
       ? [`  Selected Workspace: ${report.cloudAuth.workspaceSlug ?? report.cloudAuth.workspaceId}`]
       : []),
+    "",
+    "Code Mode",
+    `  Types generation: ${doctorOk(report.codeMode.typesGeneration)}`,
+    `  Diagnostics: ${doctorOk(report.codeMode.diagnostics)}`,
+    `  Sandbox smoke: ${doctorOk(report.codeMode.sandboxSmoke)}`,
+    `  Log storage: ${doctorOk(report.codeMode.logStorage)}`,
+    `  Callable index: ${doctorOk(report.codeMode.callableIndex)}`,
+    `  Observed output shapes: ${doctorOk(report.codeMode.observedOutputShapes)}`,
+    ...(observedOutputShapePath(report.codeMode.observedOutputShapes)
+      ? [
+          `  Observed output shape cache: ${observedOutputShapePath(report.codeMode.observedOutputShapes)}`,
+        ]
+      : []),
   ];
   return `${lines.join("\n")}\n`;
 }
@@ -151,3 +178,119 @@ function resolveRemoteSection(env: NodeJS.ProcessEnv | Record<string, string | u
 function yesNo(value: boolean): string {
   return value ? "yes" : "no";
 }
+
+async function resolveCodeModeSection(
+  options: DoctorOptions,
+  env: NodeJS.ProcessEnv | Record<string, string | undefined>,
+): Promise<Record<string, unknown>> {
+  const emptyDeclaration = generateCodeModeDeclarations({ caplets: [] });
+  const diagnostics = diagnoseCodeModeTypeScript({
+    declaration: emptyDeclaration,
+    code: "return 1;",
+  });
+  const tempDir = mkdtempSync(join(tmpdir(), "caplets-code-mode-doctor-"));
+  try {
+    const logStore = new CodeModeLogStore({ stateDir: tempDir });
+    const stored = await logStore.store([
+      {
+        level: "log",
+        message: "doctor smoke",
+        timestamp: new Date(0).toISOString(),
+      },
+    ]);
+    const read = await logStore.read({ logRef: stored.logRef });
+    const sandboxSmoke = await runCodeMode({
+      code: "return 1;",
+      service: emptyCodeModeDoctorService(),
+      logStore,
+    });
+    return {
+      typesGeneration: { ok: emptyDeclaration.includes("declare const caplets") },
+      diagnostics: { ok: diagnostics.every((diagnostic) => diagnostic.severity !== "error") },
+      sandboxSmoke: { ok: sandboxSmoke.ok },
+      logStorage: { ok: read.entries.length === 1 },
+      callableIndex: await resolveCallableIndexDoctor(env),
+      observedOutputShapes: await resolveObservedOutputShapesDoctor(options),
+    };
+  } catch (error) {
+    return {
+      typesGeneration: { ok: true },
+      diagnostics: { ok: diagnostics.every((diagnostic) => diagnostic.severity !== "error") },
+      sandboxSmoke: { ok: false, error: error instanceof Error ? error.message : String(error) },
+      logStorage: { ok: false, error: error instanceof Error ? error.message : String(error) },
+      callableIndex: { ok: false, error: error instanceof Error ? error.message : String(error) },
+      observedOutputShapes: await resolveObservedOutputShapesDoctor(options),
+    };
+  } finally {
+    rmSync(tempDir, { recursive: true, force: true });
+  }
+}
+
+async function resolveObservedOutputShapesDoctor(options: DoctorOptions) {
+  const store = new FileObservedOutputShapeStore(
+    options.observedOutputShapeCacheDir ?? DEFAULT_OBSERVED_OUTPUT_SHAPE_CACHE_DIR,
+  );
+  if (!store.health) return { ok: false, error: "store health unavailable" };
+  const health = await store.health();
+  return {
+    ok: health.readable && health.writable,
+    path: health.path,
+    readable: health.readable,
+    writable: health.writable,
+    entryCount: health.entryCount ?? null,
+    prune: health.prune ?? null,
+    ...(health.error ? { error: health.error } : {}),
+  };
+}
+
+async function resolveCallableIndexDoctor(
+  env: NodeJS.ProcessEnv | Record<string, string | undefined>,
+) {
+  try {
+    const service = createNativeCapletsService({
+      mode: "local",
+      ...(env.CAPLETS_CONFIG?.trim() ? { configPath: env.CAPLETS_CONFIG.trim() } : {}),
+      ...(env.CAPLETS_PROJECT_CONFIG?.trim()
+        ? { projectConfigPath: env.CAPLETS_PROJECT_CONFIG.trim() }
+        : {}),
+      watch: false,
+      writeErr: () => undefined,
+    });
+    try {
+      return { ok: true, callableCount: listCodeModeCallableCaplets(service).length };
+    } finally {
+      await service.close();
+    }
+  } catch (error) {
+    return {
+      ok: true,
+      callableCount: 0,
+      configLoaded: false,
+      message: error instanceof Error ? error.message : String(error),
+    };
+  }
+}
+
+function emptyCodeModeDoctorService() {
+  return {
+    listTools: () => [],
+    execute: async () => undefined,
+    reload: async () => true,
+    onToolsChanged: () => () => undefined,
+    close: async () => undefined,
+  };
+}
+
+function doctorOk(value: unknown): string {
+  return value && typeof value === "object" && (value as { ok?: unknown }).ok === true
+    ? "ok"
+    : "failed";
+}
+
+function observedOutputShapePath(value: unknown): string | undefined {
+  return value &&
+    typeof value === "object" &&
+    typeof (value as { path?: unknown }).path === "string"
+    ? (value as { path: string }).path
+    : undefined;
+}
diff --git a/packages/core/src/cloud-auth/client.ts b/packages/core/src/cloud-auth/client.ts
index bea859c..1f49101 100644
--- a/packages/core/src/cloud-auth/client.ts
+++ b/packages/core/src/cloud-auth/client.ts
@@ -28,6 +28,17 @@ export type RefreshTokenInput = {
   refreshToken: string;
 };
 
+export type CloudAddCapletsInput = {
+  accessToken: string;
+  workspace: string;
+  bundle: { files: Array<{ path: string; content: string }> };
+};
+
+export type CloudAddCapletsResult = {
+  caplet?: unknown;
+  caplets: unknown[];
+};
+
 export type CloudAuthClientCredentials = Required<
   Pick<
     CloudAuthTokenResponse,
@@ -114,6 +125,21 @@ export class CloudAuthClient {
     return normalizeCredentials(response, this.cloudUrl.origin);
   }
 
+  async addCaplets(input: CloudAddCapletsInput): Promise<CloudAddCapletsResult> {
+    const response = await this.requestJson<CloudAddCapletsResult>(
+      `/api/workspaces/${encodeURIComponent(input.workspace)}/caplets/custom`,
+      {
+        method: "POST",
+        headers: { Authorization: `Bearer ${input.accessToken}` },
+        body: JSON.stringify({ bundle: input.bundle }),
+      },
+    );
+    return {
+      ...response,
+      caplets: Array.isArray(response.caplets) ? response.caplets : [],
+    };
+  }
+
   private async requestJson<T = unknown>(path: string, init: RequestInit = {}): Promise<T> {
     const headers = new Headers(init.headers);
     if (init.body !== undefined && !headers.has("content-type")) {
diff --git a/packages/core/src/cloud/runtime-adapter.ts b/packages/core/src/cloud/runtime-adapter.ts
index f98d959..34eaa10 100644
--- a/packages/core/src/cloud/runtime-adapter.ts
+++ b/packages/core/src/cloud/runtime-adapter.ts
@@ -66,14 +66,14 @@ class DefaultCloudRuntimeAdapter implements CloudRuntimeAdapter {
     const request =
       isRecord(args) && typeof args.operation === "string"
         ? args
-        : { operation: "call_tool", tool: name, arguments: isRecord(args) ? args : {} };
+        : { operation: "call_tool", name, args: isRecord(args) ? args : {} };
     const result = await this.engine.execute(name, request);
     return annotateExecution(result, this.executionMetadata());
   }
 
   async checkBackend(capletId: string): Promise<unknown> {
     return annotateExecution(
-      await this.engine.execute(capletId, { operation: "check_backend" }),
+      await this.engine.execute(capletId, { operation: "check" }),
       this.executionMetadata(),
     );
   }
diff --git a/packages/core/src/code-mode/api.ts b/packages/core/src/code-mode/api.ts
new file mode 100644
index 0000000..7b775b7
--- /dev/null
+++ b/packages/core/src/code-mode/api.ts
@@ -0,0 +1,617 @@
+import type { NativeCapletsService } from "../native/service";
+import type {
+  CapletsResult,
+  CodeModeCallableCaplet,
+  Page,
+  PageInput,
+  ReadLogsInput,
+  ReadLogsResult,
+  ToolCallError,
+  ToolCallMeta,
+  ToolCallResult,
+} from "./types";
+
+const MAX_TOOL_TEXT_CHARS = 2_000;
+const MAX_ERROR_MESSAGE_CHARS = 1_000;
+
+export type CodeModeCapletHandle = {
+  readonly id: string;
+  inspect(): Promise<unknown>;
+  check(): Promise<CapletsResult<unknown>>;
+  tools(input?: PageInput): Promise<Page<unknown>>;
+  searchTools(query: string, input?: PageInput): Promise<Page<unknown>>;
+  describeTool(name: string): Promise<CapletsResult<unknown>>;
+  callTool(name: string, args?: unknown): Promise<ToolCallResult>;
+  resources(input?: PageInput): Promise<Page<unknown>>;
+  searchResources(query: string, input?: PageInput): Promise<Page<unknown>>;
+  resourceTemplates(input?: PageInput): Promise<Page<unknown>>;
+  readResource(uri: string): Promise<CapletsResult<unknown>>;
+  prompts(input?: PageInput): Promise<Page<unknown>>;
+  searchPrompts(query: string, input?: PageInput): Promise<Page<unknown>>;
+  getPrompt(name: string, args?: unknown): Promise<CapletsResult<unknown>>;
+  complete(input: unknown): Promise<CapletsResult<unknown>>;
+};
+
+export type CodeModeDebugApi = {
+  readLogs(input: ReadLogsInput): Promise<ReadLogsResult>;
+};
+
+export type CodeModeCapletsApi = {
+  [capletId: string]:
+    | CodeModeCapletHandle
+    | CodeModeDebugApi
+    | (CodeModeCapletHandle & CodeModeDebugApi);
+  debug: CodeModeDebugApi | (CodeModeCapletHandle & CodeModeDebugApi);
+};
+
+export type CreateCodeModeCapletsApiInput = {
+  service: NativeCapletsService;
+  readLogs?: (input: ReadLogsInput) => Promise<ReadLogsResult>;
+};
+
+export function listCodeModeCallableCaplets(
+  service: NativeCapletsService,
+): CodeModeCallableCaplet[] {
+  return service
+    .listTools()
+    .filter((tool) => tool.codeModeRun !== true)
+    .map((tool) => ({
+      id: tool.caplet,
+      name: tool.title,
+      description: tool.description,
+      ...(tool.useWhen ? { useWhen: tool.useWhen } : {}),
+      ...(tool.avoidWhen ? { avoidWhen: tool.avoidWhen } : {}),
+    }))
+    .sort((left, right) => left.id.localeCompare(right.id));
+}
+
+export function createCodeModeCapletsApi(input: CreateCodeModeCapletsApiInput): CodeModeCapletsApi {
+  const api: Record<
+    string,
+    CodeModeCapletHandle | CodeModeDebugApi | (CodeModeCapletHandle & CodeModeDebugApi)
+  > = {};
+  for (const caplet of listCodeModeCallableCaplets(input.service)) {
+    api[caplet.id] = createHandle(input.service, caplet.id);
+  }
+
+  const debugApi: CodeModeDebugApi = {
+    readLogs: input.readLogs ?? defaultReadLogs,
+  };
+  api.debug =
+    "debug" in api ? Object.assign(api.debug as CodeModeCapletHandle, debugApi) : debugApi;
+
+  return api as CodeModeCapletsApi;
+}
+
+function createHandle(service: NativeCapletsService, capletId: string): CodeModeCapletHandle {
+  return {
+    id: capletId,
+    async inspect() {
+      return unwrapStructuredResult(await service.execute(capletId, { operation: "inspect" }));
+    },
+    async check() {
+      return await checkResultFromExecution(service, capletId);
+    },
+    async tools(input?: PageInput) {
+      return toolPageFromResult(
+        unwrapStructuredResult(await service.execute(capletId, { operation: "tools", ...input })),
+      );
+    },
+    async searchTools(query: string, input?: PageInput) {
+      return toolPageFromResult(
+        unwrapStructuredResult(
+          await service.execute(capletId, { operation: "search_tools", query, ...input }),
+        ),
+      );
+    },
+    async describeTool(name: string) {
+      const result = await resultFromExecution(service, capletId, {
+        operation: "describe_tool",
+        name,
+      });
+      return result.ok ? { ...result, data: normalizeToolDescriptor(result.data, name) } : result;
+    },
+    async callTool(name: string, args?: unknown) {
+      const started = Date.now();
+      try {
+        const result = await service.execute(capletId, {
+          operation: "call_tool",
+          name,
+          args: args ?? {},
+        });
+        const meta = toolCallMeta(result, {
+          capletId,
+          tool: name,
+          durationMs: Date.now() - started,
+        });
+        if (resultIsError(result)) {
+          return {
+            ok: false,
+            error: toolCallError(result),
+            meta,
+          };
+        }
+        return { ok: true, data: normalizeToolCallData(result), meta };
+      } catch (error) {
+        return {
+          ok: false,
+          error: errorFromCaught(error, "tool_call_failed"),
+          meta: { capletId, tool: name, durationMs: Date.now() - started },
+        };
+      }
+    },
+    async resources(input?: PageInput) {
+      return pageFromResult(
+        unwrapStructuredResult(
+          await service.execute(capletId, { operation: "resources", ...input }),
+        ),
+      );
+    },
+    async searchResources(query: string, input?: PageInput) {
+      return pageFromResult(
+        unwrapStructuredResult(
+          await service.execute(capletId, { operation: "search_resources", query, ...input }),
+        ),
+      );
+    },
+    async resourceTemplates(input?: PageInput) {
+      return pageFromResult(
+        unwrapStructuredResult(
+          await service.execute(capletId, { operation: "resource_templates", ...input }),
+        ),
+      );
+    },
+    async readResource(uri: string) {
+      return await resultFromExecution(service, capletId, { operation: "read_resource", uri });
+    },
+    async prompts(input?: PageInput) {
+      return pageFromResult(
+        unwrapStructuredResult(await service.execute(capletId, { operation: "prompts", ...input })),
+      );
+    },
+    async searchPrompts(query: string, input?: PageInput) {
+      return pageFromResult(
+        unwrapStructuredResult(
+          await service.execute(capletId, { operation: "search_prompts", query, ...input }),
+        ),
+      );
+    },
+    async getPrompt(name: string, args?: unknown) {
+      return await resultFromExecution(service, capletId, {
+        operation: "get_prompt",
+        name,
+        ...(args === undefined ? {} : { args }),
+      });
+    },
+    async complete(input: unknown) {
+      return await resultFromExecution(service, capletId, {
+        operation: "complete",
+        ...(isPlainObject(input) ? input : {}),
+      });
+    },
+  };
+}
+
+async function checkResultFromExecution(
+  service: NativeCapletsService,
+  capletId: string,
+): Promise<CapletsResult<unknown>> {
+  const result = await resultFromExecution(service, capletId, { operation: "check" });
+  if (!result.ok) return result;
+  if (!isUnavailableCheckResult(result.data)) return result;
+  return {
+    ok: false,
+    error: {
+      code: "backend_not_ready",
+      message: unavailableCheckMessage(capletId, result.data),
+      details: result.data,
+    },
+    ...(result.meta === undefined ? {} : { meta: result.meta }),
+  };
+}
+
+async function resultFromExecution(
+  service: NativeCapletsService,
+  capletId: string,
+  request: Record<string, unknown>,
+): Promise<CapletsResult<unknown>> {
+  const started = Date.now();
+  const targetName = typeof request.name === "string" ? request.name : undefined;
+  try {
+    const result = await service.execute(capletId, request);
+    const meta = toolCallMeta(result, {
+      capletId,
+      ...(targetName === undefined ? {} : { tool: targetName }),
+      durationMs: Date.now() - started,
+    });
+    if (resultIsError(result)) {
+      return { ok: false, error: toolCallError(result), meta };
+    }
+    return { ok: true, data: unwrapStructuredResult(result), meta };
+  } catch (error) {
+    return {
+      ok: false,
+      error: errorFromCaught(error, "caplet_call_failed"),
+      meta: {
+        capletId,
+        ...(targetName === undefined ? {} : { tool: targetName }),
+        durationMs: Date.now() - started,
+      },
+    };
+  }
+}
+
+function isUnavailableCheckResult(result: unknown): result is Record<string, unknown> {
+  if (!isPlainObject(result)) return false;
+  return result.status === "unavailable" || result.status === "error";
+}
+
+function unavailableCheckMessage(capletId: string, result: Record<string, unknown>): string {
+  const error = result.error;
+  const reason =
+    isPlainObject(error) && typeof error.message === "string"
+      ? error.message
+      : typeof error === "string"
+        ? error
+        : undefined;
+  return reason
+    ? `${capletId} is unavailable: ${truncate(reason, MAX_ERROR_MESSAGE_CHARS)}`
+    : `${capletId} is unavailable.`;
+}
+
+function errorFromCaught(error: unknown, fallbackCode: string): ToolCallError {
+  const code = errorStringProperty(error, "code") ?? fallbackCode;
+  const message = truncate(
+    error instanceof Error ? error.message : String(error),
+    MAX_ERROR_MESSAGE_CHARS,
+  );
+  const details = errorObjectProperty(error, "details");
+  return normalizeCodeModeErrorTerminology({
+    code,
+    message,
+    ...(details === undefined ? {} : { details }),
+  });
+}
+
+function errorStringProperty(error: unknown, key: string): string | undefined {
+  if (!error || typeof error !== "object" || !(key in error)) return undefined;
+  const value = (error as Record<string, unknown>)[key];
+  return typeof value === "string" ? value : undefined;
+}
+
+function errorObjectProperty(error: unknown, key: string): unknown {
+  if (!error || typeof error !== "object" || !(key in error)) return undefined;
+  return (error as Record<string, unknown>)[key];
+}
+
+function pageFromResult(result: unknown): Page<unknown> {
+  if (isPlainObject(result) && Array.isArray(result.items)) {
+    return {
+      items: result.items,
+      ...(typeof result.nextCursor === "string" ? { nextCursor: result.nextCursor } : {}),
+      ...(result.truncated === true ? { truncated: true } : {}),
+    };
+  }
+  if (Array.isArray(result)) return { items: result };
+  if (isPlainObject(result)) {
+    for (const key of ["tools", "resources", "resourceTemplates", "prompts", "matches"] as const) {
+      if (Array.isArray(result[key])) return { items: result[key] };
+    }
+  }
+  return { items: [] };
+}
+
+function toolPageFromResult(result: unknown): Page<unknown> {
+  const page = pageFromResult(result);
+  return {
+    ...page,
+    items: page.items
+      .map((item) => (isPlainObject(item) ? compactToolSummary(item) : undefined))
+      .filter((item): item is Record<string, unknown> => item !== undefined),
+  };
+}
+
+function unwrapStructuredResult(result: unknown): unknown {
+  if (!isPlainObject(result)) return result;
+  const structuredContent = result.structuredContent;
+  if (!isPlainObject(structuredContent) || !("result" in structuredContent)) return result;
+  return structuredContent.result;
+}
+
+function normalizeToolDescriptor(result: unknown, toolName: string): unknown {
+  if (!isPlainObject(result)) return result;
+  const rawTool = result.tool;
+  if (!isPlainObject(rawTool)) return result;
+  const resultWithoutFieldSelection = { ...result };
+  delete resultWithoutFieldSelection.fieldSelection;
+  const inputSchema = rawTool.inputSchema;
+  const outputSchema = rawTool.outputSchema;
+  const baseName = toolTypeBaseName(toolName);
+  const inputTypeName = `${baseName}Input`;
+  const outputTypeName = `${baseName}Output`;
+  return {
+    ...resultWithoutFieldSelection,
+    tool: compactToolSummary(rawTool),
+    ...(inputSchema === undefined ? {} : { inputSchema }),
+    ...(outputSchema === undefined ? {} : { outputSchema }),
+    callSignature: `callTool(name: ${JSON.stringify(toolName)}, args: ${inputTypeName}): Promise<CapletsResult<${outputTypeName}>>`,
+    inputTypeScript: schemaToTypeScript(inputSchema, inputTypeName),
+    outputTypeScript: schemaToTypeScript(outputSchema, outputTypeName),
+    ...(isPlainObject(result.observedOutputShape)
+      ? { observedOutputShape: result.observedOutputShape }
+      : {}),
+    examples: Array.isArray(result.examples) ? result.examples.slice(0, 3) : [],
+  };
+}
+
+function toolTypeBaseName(toolName: string): string {
+  const base = toolName
+    .split(/[^a-zA-Z0-9]+/u)
+    .filter(Boolean)
+    .map((part) => `${part.charAt(0).toUpperCase()}${part.slice(1)}`)
+    .join("");
+  return base || "Tool";
+}
+
+function compactToolSummary(tool: Record<string, unknown>): Record<string, unknown> {
+  const compact: Record<string, unknown> = {};
+  for (const key of ["name", "title", "description", "useWhen", "avoidWhen"] as const) {
+    if (tool[key] !== undefined) compact[key] = tool[key];
+  }
+  const annotations = isPlainObject(tool.annotations) ? tool.annotations : {};
+  const readOnlyHint = tool.readOnlyHint ?? annotations.readOnlyHint;
+  const destructiveHint = tool.destructiveHint ?? annotations.destructiveHint;
+  if (typeof readOnlyHint === "boolean") compact.readOnlyHint = readOnlyHint;
+  if (typeof destructiveHint === "boolean") compact.destructiveHint = destructiveHint;
+  return compact;
+}
+
+function schemaToTypeScript(schema: unknown, fallbackName: string): string {
+  return `type ${fallbackName} = ${schemaType(schema)};`;
+}
+
+function schemaType(schema: unknown): string {
+  if (!isPlainObject(schema)) return "unknown";
+  if ("const" in schema) return JSON.stringify(schema.const);
+  if (Array.isArray(schema.enum)) {
+    return schema.enum.map((value) => JSON.stringify(value)).join(" | ") || "unknown";
+  }
+  const type = schema.type;
+  if (Array.isArray(type)) {
+    const variants = type.map((item) => schemaType({ ...schema, type: item }));
+    return [...new Set(variants)].join(" | ") || "unknown";
+  }
+  if (type === "string") return "string";
+  if (type === "number" || type === "integer") return "number";
+  if (type === "boolean") return "boolean";
+  if (type === "null") return "null";
+  if (type === "array") return `${schemaType(schema.items)}[]`;
+  if (type === "object" || isPlainObject(schema.properties)) return objectSchemaType(schema);
+  if (Array.isArray(schema.oneOf)) return unionSchemaType(schema.oneOf);
+  if (Array.isArray(schema.anyOf)) return unionSchemaType(schema.anyOf);
+  if (Array.isArray(schema.allOf)) {
+    return schema.allOf.map(schemaType).join(" & ") || "Record<string, unknown>";
+  }
+  return "unknown";
+}
+
+function objectSchemaType(schema: Record<string, unknown>): string {
+  const properties = isPlainObject(schema.properties) ? schema.properties : {};
+  const required = new Set(
+    Array.isArray(schema.required)
+      ? schema.required.filter((value): value is string => typeof value === "string")
+      : [],
+  );
+  const fields = Object.entries(properties).map(([key, value]) => {
+    const optional = required.has(key) ? "" : "?";
+    return `${propertySignature(key)}${optional}: ${schemaType(value)};`;
+  });
+  if (fields.length === 0) {
+    return schema.additionalProperties === false ? "{}" : "Record<string, unknown>";
+  }
+  if (schema.additionalProperties && isPlainObject(schema.additionalProperties)) {
+    fields.push(`[key: string]: ${schemaType(schema.additionalProperties)};`);
+  } else if (schema.additionalProperties !== false) {
+    fields.push("[key: string]: unknown;");
+  }
+  return `{ ${fields.join(" ")} }`;
+}
+
+function unionSchemaType(schemas: unknown[]): string {
+  return schemas.map(schemaType).join(" | ") || "unknown";
+}
+
+function propertySignature(key: string): string {
+  return /^[A-Za-z_$][\w$]*$/u.test(key) ? key : JSON.stringify(key);
+}
+
+async function defaultReadLogs(): Promise<ReadLogsResult> {
+  return {
+    entries: [
+      {
+        level: "warn",
+        message: "Code Mode log storage is not configured for this runtime.",
+        timestamp: new Date(0).toISOString(),
+      },
+    ],
+  };
+}
+
+function resultIsError(result: unknown): boolean {
+  if (!isPlainObject(result)) return false;
+  if (result.isError === true) return true;
+  const capletsMeta = capletsMetaFromResult(result);
+  return capletsMeta?.status === "error";
+}
+
+function normalizeToolCallData(result: unknown): unknown {
+  if (isPlainObject(result)) {
+    const structured = result.structuredContent;
+    if (structured !== undefined) {
+      const httpBody = codeModeHttpBody(structured);
+      if (httpBody !== undefined) return httpBody;
+      if (isPlainObject(structured) && "caplets" in structured && "result" in structured) {
+        return structured.result;
+      }
+      return structured;
+    }
+  }
+
+  const parsedText = parseSingleJsonTextBlock(result);
+  if (parsedText.ok) return parsedText.value;
+
+  const text = textFromResult(result, MAX_TOOL_TEXT_CHARS);
+  if (text !== undefined) return text;
+
+  return result;
+}
+
+function codeModeHttpBody(structured: unknown): unknown | undefined {
+  if (!isPlainObject(structured)) return undefined;
+  if (!("body" in structured)) return undefined;
+  const hasHttpMetadata =
+    typeof structured.status === "number" ||
+    typeof structured.statusText === "string" ||
+    isPlainObject(structured.headers);
+  return hasHttpMetadata ? structured.body : undefined;
+}
+
+function toolCallError(result: unknown): ToolCallError {
+  const structuredError = structuredErrorFromResult(result);
+  const code = structuredError.code ?? errorCodeFromResult(result) ?? "tool_call_failed";
+  const message = truncate(
+    structuredError.message ?? textFromResult(result, MAX_ERROR_MESSAGE_CHARS) ?? code,
+    MAX_ERROR_MESSAGE_CHARS,
+  );
+  return normalizeCodeModeErrorTerminology({
+    code,
+    message,
+    ...(structuredError.details === undefined ? {} : { details: structuredError.details }),
+  });
+}
+
+function normalizeCodeModeErrorTerminology(error: ToolCallError): ToolCallError {
+  return {
+    ...error,
+    message: codeModeMethodText(error.message),
+    ...(error.details === undefined
+      ? {}
+      : { details: normalizeCodeModeErrorDetails(error.details) }),
+  };
+}
+
+function normalizeCodeModeErrorDetails(value: unknown): unknown {
+  if (typeof value === "string") return codeModeMethodText(value);
+  if (Array.isArray(value)) return value.map(normalizeCodeModeErrorDetails);
+  if (!isPlainObject(value)) return value;
+  return Object.fromEntries(
+    Object.entries(value).map(([key, nested]) => [key, normalizeCodeModeErrorDetails(nested)]),
+  );
+}
+
+function codeModeMethodText(value: string): string {
+  const replacements: Array<[string, string]> = [
+    ["search_tools", "searchTools"],
+    ["describe_tool", "describeTool"],
+    ["call_tool", "callTool"],
+    ["search_resources", "searchResources"],
+    ["resource_templates", "resourceTemplates"],
+    ["read_resource", "readResource"],
+    ["search_prompts", "searchPrompts"],
+    ["get_prompt", "getPrompt"],
+  ];
+  return replacements.reduce(
+    (text, [from, to]) =>
+      text.replace(new RegExp(`(^|[^A-Za-z0-9_])${from}($|[^A-Za-z0-9_])`, "gu"), `$1${to}$2`),
+    value,
+  );
+}
+
+function structuredErrorFromResult(result: unknown): Partial<ToolCallError> {
+  if (!isPlainObject(result)) return {};
+  const structured = result.structuredContent;
+  if (!isPlainObject(structured)) return {};
+  const error = structured.error;
+  if (!isPlainObject(error)) return {};
+  const code = typeof error.code === "string" ? error.code : undefined;
+  const message = typeof error.message === "string" ? error.message : undefined;
+  const details = compactErrorDetails(error);
+  return {
+    ...(code === undefined ? {} : { code }),
+    ...(message === undefined ? {} : { message }),
+    ...(details === undefined ? {} : { details }),
+  };
+}
+
+function compactErrorDetails(error: Record<string, unknown>): unknown {
+  const entries = Object.entries(error).filter(([key]) => key !== "code" && key !== "message");
+  if (entries.length === 0) return undefined;
+  if (entries.length === 1 && entries[0]?.[0] === "details") return entries[0][1];
+  return Object.fromEntries(entries);
+}
+
+function errorCodeFromResult(result: unknown): string | undefined {
+  if (!isPlainObject(result)) return undefined;
+  const structured = result.structuredContent;
+  if (!isPlainObject(structured)) return undefined;
+  const errorCode = structured.errorCode;
+  return typeof errorCode === "string" ? errorCode : undefined;
+}
+
+function toolCallMeta(result: unknown, base: ToolCallMeta): ToolCallMeta {
+  const capletsMeta = capletsMetaFromResult(result);
+  if (!capletsMeta) return base;
+  return {
+    ...base,
+    ...(typeof capletsMeta.status === "string" ? { status: capletsMeta.status } : {}),
+    ...(typeof capletsMeta.elapsedMs === "number" ? { elapsedMs: capletsMeta.elapsedMs } : {}),
+  };
+}
+
+function capletsMetaFromResult(result: unknown): Record<string, unknown> | undefined {
+  if (!isPlainObject(result)) return undefined;
+  const meta = result._meta;
+  if (!isPlainObject(meta)) return undefined;
+  const caplets = meta.caplets;
+  return isPlainObject(caplets) ? caplets : undefined;
+}
+
+function parseSingleJsonTextBlock(result: unknown): { ok: true; value: unknown } | { ok: false } {
+  const textBlocks = textBlocksFromResult(result);
+  if (textBlocks.length !== 1) return { ok: false };
+  const text = textBlocks[0]?.trim();
+  if (!text || (!text.startsWith("{") && !text.startsWith("["))) return { ok: false };
+  try {
+    return { ok: true, value: JSON.parse(text) as unknown };
+  } catch {
+    return { ok: false };
+  }
+}
+
+function textFromResult(result: unknown, maxChars: number): string | undefined {
+  const text = textBlocksFromResult(result).join("\n").trim();
+  if (text) return truncate(text, maxChars);
+  if (result === undefined) return undefined;
+  if (typeof result === "string") return truncate(result, maxChars);
+  if (typeof result === "number" || typeof result === "boolean" || result === null) {
+    return String(result);
+  }
+  return undefined;
+}
+
+function textBlocksFromResult(result: unknown): string[] {
+  if (!isPlainObject(result) || !Array.isArray(result.content)) return [];
+  return result.content
+    .map((item) =>
+      isPlainObject(item) && item.type === "text" && typeof item.text === "string" ? item.text : "",
+    )
+    .filter(Boolean);
+}
+
+function truncate(value: string, maxChars: number): string {
+  return value.length > maxChars ? `${value.slice(0, maxChars - 1).trimEnd()}…` : value;
+}
+
+function isPlainObject(value: unknown): value is Record<string, unknown> {
+  return Boolean(value && typeof value === "object" && !Array.isArray(value));
+}
diff --git a/packages/core/src/code-mode/declarations.ts b/packages/core/src/code-mode/declarations.ts
new file mode 100644
index 0000000..3c047b0
--- /dev/null
+++ b/packages/core/src/code-mode/declarations.ts
@@ -0,0 +1,115 @@
+import type { CodeModeDeclarationInput } from "./types";
+import { CODE_MODE_RUNTIME_API_DECLARATION } from "./runtime-api.generated";
+
+const JS_IDENTIFIER = /^[A-Za-z_$][\w$]*$/u;
+const MAX_JSDOC_CHARS = 180;
+
+export function generateCodeModeDeclarations(input: CodeModeDeclarationInput): string {
+  const caplets = [...input.caplets].sort((left, right) => left.id.localeCompare(right.id));
+  const properties = caplets.map((caplet) => {
+    const key = propertyKey(caplet.id);
+    const description = jsDoc(capletHintText(caplet));
+    if (caplet.id === "debug") {
+      return `${description}debug:DebugApi&CapletHandle<"debug">;`;
+    }
+    return `${description}${key}:CapletHandle<${JSON.stringify(caplet.id)}>;`;
+  });
+  if (!caplets.some((caplet) => caplet.id === "debug")) {
+    properties.push("debug:DebugApi;");
+  }
+
+  return ["declare const caplets:{", ...properties, "};", CODE_MODE_RUNTIME_API_DECLARATION].join(
+    "\n",
+  );
+}
+
+export function generateCodeModeRunToolDescription(declaration: string): string {
+  return [
+    'Run TypeScript with generated `caplets.<id>` handles and declaration hints below. Prefer a two-pass workflow for non-trivial tasks. Pass 1: discover and inspect candidate caplets/tools/resources/prompts with inspect, check, tools/searchTools, describeTool, resources/searchResources, and prompts/searchPrompts; return chosen handles, call signatures/schemas, and planned args. Never invent tool names, resource URIs, prompt names, input args, output fields, or schemas. Never infer input/output schemas from memory; use describeTool for the exact callSignature, inputSchema/inputTypeScript, outputSchema/outputTypeScript, examples, and observedOutputShape. For fallback, check candidate handles first: `for(const h of candidates){const ready=await h.check();if(!ready.ok)continue;}`. Pass 2: execute with exact args, handle `{ok:false}`, filter bulky results, and synthesize compact JSON. Return decision-ready JSON, not raw tool payloads: reduce tool results to summary, key evidence, derived fields, recommendation, and caveats; derive final recommendations from all relevant records, not the first matching record; if records disagree or have ranges/statuses, compute the strictest applicable conclusion and preserve the evidence used. Before `callTool`, use `describeTool` and pass args with exact `inputTypeScript`/`inputSchema` property names; do not guess from provider memory. For triage, list broad candidate records and filter in script before targeted searches so adjacent relevant items are not missed. For result shape, prefer `outputSchema` or `outputTypeScript`; use `observedOutputShape` only when those are absent or generic. Filter bulky results in script before returning, while preserving useful identifiers/links such as id,name,title,state,status,url,html_url,labels,created_at,updated_at. Pattern: discovery `const h=caplets["caplet-id"];const d=await h.describeTool("tool_name");return {caplet:h.id,tool:"tool_name",descriptor:d};` then execution `const h=caplets["caplet-id"];const r=await h.callTool("tool_name",args);if(!r.ok)return {error:r.error};return /* compact JSON */;`',
+    "",
+    "Generated declaration hints:",
+    "```ts",
+    declaration,
+    "```",
+  ].join("\n");
+}
+
+function capletHintText(caplet: CodeModeDeclarationInput["caplets"][number]): string {
+  return [
+    caplet.description || caplet.name || caplet.id,
+    caplet.useWhen ? `Use when: ${caplet.useWhen}` : undefined,
+    caplet.avoidWhen ? `Avoid when: ${caplet.avoidWhen}` : undefined,
+  ]
+    .filter((value): value is string => Boolean(value))
+    .join(" ");
+}
+
+export function minifyCodeModeDeclarationText(value: string): string {
+  return value
+    .replace(/^\s*export\s*\{\s*\}\s*;?\s*/u, "")
+    .replace(/\r\n?/gu, "\n")
+    .split("\n")
+    .map((line) => line.trim())
+    .filter(Boolean)
+    .join(" ")
+    .replace(/\s+/gu, " ")
+    .replace(/\s*([{}()[\]:;,|&=])\s*/gu, "$1")
+    .replace(/\s*<\s*/gu, "<")
+    .replace(/\s*>\s*/gu, ">")
+    .replace(/\?\s*:/gu, "?:")
+    .trim();
+}
+
+export function codeModeDeclarationHash(declaration: string): string {
+  return [
+    fnv1a32(declaration, 0x811c9dc5),
+    fnv1a32(declaration, 0x9e3779b9),
+    fnv1a32(declaration, 0x85ebca6b),
+    fnv1a32(declaration, 0xc2b2ae35),
+    fnv1a32(declaration, 0x27d4eb2f),
+    fnv1a32(declaration, 0x165667b1),
+    fnv1a32(declaration, 0xd3a2646c),
+    fnv1a32(declaration, 0xfd7046c5),
+  ]
+    .map((value) => value.toString(16).padStart(8, "0"))
+    .join("");
+}
+
+function propertyKey(id: string): string {
+  return JS_IDENTIFIER.test(id) ? id : JSON.stringify(id);
+}
+
+function jsDoc(value: string): string {
+  return `/**${compactJsDoc(value)}*/`;
+}
+
+function sanitizeJsDoc(value: string): string {
+  return value.replace(/\*\//gu, "* /").replace(/\s+/gu, " ").trim();
+}
+
+function compactJsDoc(value: string): string {
+  const cleaned = sanitizeJsDoc(value);
+  const markers = [
+    " Use inspect for details when needed;",
+    " Native tool name:",
+    " Original Caplet ID:",
+  ];
+  const cutoff = markers
+    .map((marker) => cleaned.indexOf(marker))
+    .filter((index) => index >= 0)
+    .sort((left, right) => left - right)[0];
+  const summary = (cutoff === undefined ? cleaned : cleaned.slice(0, cutoff).trim()) || "Caplet.";
+  if (summary.length <= MAX_JSDOC_CHARS) return summary;
+  const sentenceEnd = summary.lastIndexOf(".", MAX_JSDOC_CHARS);
+  if (sentenceEnd >= 40) return summary.slice(0, sentenceEnd + 1);
+  return `${summary.slice(0, MAX_JSDOC_CHARS - 3).trimEnd()}...`;
+}
+
+function fnv1a32(value: string, seed: number): number {
+  let hash = seed >>> 0;
+  for (let index = 0; index < value.length; index += 1) {
+    hash ^= value.charCodeAt(index);
+    hash = Math.imul(hash, 0x01000193) >>> 0;
+  }
+  return hash;
+}
diff --git a/packages/core/src/code-mode/diagnostics.ts b/packages/core/src/code-mode/diagnostics.ts
new file mode 100644
index 0000000..75e7654
--- /dev/null
+++ b/packages/core/src/code-mode/diagnostics.ts
@@ -0,0 +1,186 @@
+import ts from "typescript";
+import type { CodeModeDiagnostic } from "./types";
+
+export type DiagnoseCodeModeTypeScriptInput = {
+  code: string;
+  declaration: string;
+  maxDiagnostics?: number;
+  timeoutMs?: number;
+};
+
+const CODE_FILE = "/caplets-code-mode/input.ts";
+const DECLARATION_FILE = "/caplets-code-mode/caplets.d.ts";
+const AMBIENT_FILE = "/caplets-code-mode/ambient.d.ts";
+
+const IMPORT_PATTERN = /\bimport\s*(?:\(|[\s{*"A-Za-z_$])/u;
+const TS_NOCHECK_PATTERN =
+  /^\s*(?:(?:\/\/[^\n]*|\/\*[\s\S]*?\*\/)\s*)*?(?:(?:\/\/\s*@ts-nocheck\b[^\n]*)|(?:\/\*\s*@ts-nocheck\b[\s\S]*?\*\/))/u;
+const BAD_CALL_METHOD_PATTERN = /\bcaplets(?:\.[A-Za-z_$][\w$]*|\[[^\]]+\])\.call\s*\(/u;
+const FETCH_PATTERN = /\bfetch\s*\(/u;
+
+export function diagnoseCodeModeTypeScript(
+  input: DiagnoseCodeModeTypeScriptInput,
+): CodeModeDiagnostic[] {
+  const maxDiagnostics = input.maxDiagnostics ?? 50;
+  const startedAt = Date.now();
+  const preflight = preflightDiagnostics(input.code);
+  const diagnostics: CodeModeDiagnostic[] = [...preflight];
+  if (diagnostics.length >= maxDiagnostics) {
+    return diagnostics.slice(0, maxDiagnostics);
+  }
+
+  const compilerOptions: ts.CompilerOptions = {
+    target: ts.ScriptTarget.ES2022,
+    module: ts.ModuleKind.ESNext,
+    moduleResolution: ts.ModuleResolutionKind.Bundler,
+    lib: ["lib.es2022.d.ts"],
+    types: [],
+    strict: true,
+    noEmit: true,
+    skipLibCheck: true,
+    noErrorTruncation: true,
+    allowJs: false,
+  };
+  const wrappedCode = [
+    "async function __capletsCodeModeMain(): Promise<unknown> {",
+    input.code,
+    "}",
+  ].join("\n");
+  const host = createVirtualCompilerHost(compilerOptions, {
+    [CODE_FILE]: wrappedCode,
+    [DECLARATION_FILE]: input.declaration,
+    [AMBIENT_FILE]: ambientDeclarations(),
+  });
+  const program = ts.createProgram(
+    [CODE_FILE, DECLARATION_FILE, AMBIENT_FILE],
+    compilerOptions,
+    host,
+  );
+  const source = program.getSourceFile(CODE_FILE);
+  const tsNoCheck = TS_NOCHECK_PATTERN.test(input.code);
+  const syntacticDiagnostics = program.getSyntacticDiagnostics(source);
+  const semanticDiagnostics = tsNoCheck ? [] : program.getSemanticDiagnostics(source);
+  const syntacticDiagnosticSet = new Set<ts.Diagnostic>(syntacticDiagnostics);
+  if (tsNoCheck) {
+    diagnostics.push({
+      code: "ts_nocheck_applied",
+      severity: "info",
+      message:
+        "@ts-nocheck suppressed TypeScript diagnostics; Code Mode safety checks still applied.",
+    });
+  }
+  for (const diagnostic of [...syntacticDiagnostics, ...semanticDiagnostics]) {
+    diagnostics.push(formatDiagnostic(diagnostic, syntacticDiagnosticSet.has(diagnostic)));
+    if (diagnostics.length >= maxDiagnostics) {
+      break;
+    }
+    if (input.timeoutMs !== undefined && Date.now() - startedAt > input.timeoutMs) {
+      diagnostics.push({
+        code: "DIAGNOSTIC_TIMEOUT",
+        severity: "error",
+        message: `Code Mode diagnostics exceeded ${input.timeoutMs}ms.`,
+      });
+      break;
+    }
+  }
+  return diagnostics.slice(0, maxDiagnostics);
+}
+
+function preflightDiagnostics(code: string): CodeModeDiagnostic[] {
+  const diagnostics: CodeModeDiagnostic[] = [];
+  if (!IMPORT_PATTERN.test(code)) {
+    // continue with other custom checks below
+  } else {
+    diagnostics.push({
+      code: "IMPORT_UNAVAILABLE",
+      severity: "error",
+      message: "Imports are not available in Code Mode.",
+    });
+  }
+  if (BAD_CALL_METHOD_PATTERN.test(code)) {
+    diagnostics.push({
+      code: "INVALID_CAPLET_METHOD",
+      severity: "error",
+      message: "CapletHandle does not expose call(). Use callTool(name, args) for tool calls.",
+    });
+  }
+  if (FETCH_PATTERN.test(code)) {
+    diagnostics.push({
+      code: "FETCH_UNAVAILABLE",
+      severity: "error",
+      message: "Direct fetch is not available in Code Mode; use a Caplet instead.",
+    });
+  }
+  return diagnostics;
+}
+
+function createVirtualCompilerHost(
+  options: ts.CompilerOptions,
+  files: Record<string, string>,
+): ts.CompilerHost {
+  const host = ts.createCompilerHost(options, true);
+  const defaultGetSourceFile = host.getSourceFile.bind(host);
+  const defaultFileExists = host.fileExists.bind(host);
+  const defaultReadFile = host.readFile.bind(host);
+  return {
+    ...host,
+    getSourceFile(fileName, languageVersion, onError, shouldCreateNewSourceFile) {
+      const source = files[fileName];
+      if (source !== undefined) {
+        return ts.createSourceFile(fileName, source, languageVersion, true);
+      }
+      return defaultGetSourceFile(fileName, languageVersion, onError, shouldCreateNewSourceFile);
+    },
+    fileExists(fileName) {
+      return files[fileName] !== undefined || defaultFileExists(fileName);
+    },
+    readFile(fileName) {
+      return files[fileName] ?? defaultReadFile(fileName);
+    },
+  };
+}
+
+function formatDiagnostic(
+  diagnostic: ts.Diagnostic,
+  syntacticDiagnostic = false,
+): CodeModeDiagnostic {
+  const position = diagnostic.file?.getLineAndCharacterOfPosition(diagnostic.start ?? 0);
+  const message = ts.flattenDiagnosticMessageText(diagnostic.messageText, "\n");
+  return {
+    code: String(diagnostic.code),
+    severity:
+      syntacticDiagnostic || diagnostic.category === ts.DiagnosticCategory.Warning
+        ? diagnostic.category === ts.DiagnosticCategory.Warning
+          ? "warning"
+          : "error"
+        : "warning",
+    message:
+      diagnostic.code === 2339 && message.includes("Property 'call' does not exist")
+        ? `${message} Use callTool(name, args) on CapletHandle.`
+        : message,
+    ...(position
+      ? {
+          line: Math.max(1, position.line),
+          column: Math.max(1, position.character + 1),
+        }
+      : {}),
+  };
+}
+
+function ambientDeclarations(): string {
+  return [
+    "declare class URL {",
+    "  constructor(input: string, base?: string);",
+    "  readonly href: string;",
+    "  readonly searchParams: URLSearchParams;",
+    "  toString(): string;",
+    "}",
+    "declare class URLSearchParams {",
+    "  constructor(init?: string | Record<string, string> | Array<[string, string]>);",
+    "  get(name: string): string | null;",
+    "  set(name: string, value: string): void;",
+    "  has(name: string): boolean;",
+    "  toString(): string;",
+    "}",
+  ].join("\n");
+}
diff --git a/packages/core/src/code-mode/index.ts b/packages/core/src/code-mode/index.ts
new file mode 100644
index 0000000..a18e8c2
--- /dev/null
+++ b/packages/core/src/code-mode/index.ts
@@ -0,0 +1,30 @@
+export {
+  codeModeDeclarationHash,
+  generateCodeModeDeclarations,
+  generateCodeModeRunToolDescription,
+  minifyCodeModeDeclarationText,
+} from "./declarations";
+export {
+  codeModeRunInputJsonSchema,
+  codeModeRunInputSchema,
+  codeModeRunParamsSchema,
+  isCodeModeRunRequest,
+} from "./tool";
+export type {
+  CodeModeCallableCaplet,
+  CodeModeDeclarationInput,
+  CodeModeDiagnostic,
+  CodeModeLogEntry,
+  CodeModeLogs,
+  CodeModeRunEnvelope,
+  CodeModeRunError,
+  CodeModeRunMeta,
+  CodeModeTypesJson,
+  JsonPrimitive,
+  JsonValue,
+  ReadLogsInput,
+  ReadLogsResult,
+  ToolCallError,
+  ToolCallMeta,
+  ToolCallResult,
+} from "./types";
diff --git a/packages/core/src/code-mode/logs.ts b/packages/core/src/code-mode/logs.ts
new file mode 100644
index 0000000..20a295c
--- /dev/null
+++ b/packages/core/src/code-mode/logs.ts
@@ -0,0 +1,160 @@
+import { existsSync, mkdirSync, readFileSync, writeFileSync } from "node:fs";
+import { join } from "node:path";
+import { randomBytes } from "node:crypto";
+import { defaultStateBaseDir } from "../config/paths";
+import type { CodeModeLogEntry, ReadLogsInput, ReadLogsResult } from "./types";
+
+const DEFAULT_LOG_REF_TTL_MS = 60 * 60 * 1000;
+const DEFAULT_PAGE_LIMIT = 100;
+const MAX_PAGE_LIMIT = 500;
+
+const SECRET_KEY_VALUE_PATTERN =
+  /\b(?:authorization|cookie|set-cookie|password|passphrase|secret|token|api[-_]?key|clientsecret|client_secret|privatekey|private_key|credential|refreshToken|accessToken)\b\s*[:=]\s*([^\s,;]+)/giu;
+const BEARER_PATTERN = /\bbearer\s+([a-z0-9._~+/=-]{8,})/giu;
+const BASIC_PATTERN = /\bbasic\s+([a-z0-9._~+/=-]{8,})/giu;
+const SIGNED_URL_PARAM_PATTERN =
+  /([?&](?:access_token|refresh_token|token|code|signature|sig|x-amz-signature)=)[^&\s]+/giu;
+const EMAIL_PATTERN = /\b[A-Z0-9._%+-]+@[A-Z0-9.-]+\.[A-Z]{2,}\b/giu;
+const SSN_PATTERN = /\b\d{3}-\d{2}-\d{4}\b/gu;
+const CREDIT_CARD_PATTERN = /\b(?:\d[ -]?){13,19}\b/gu;
+const PHONE_PATTERN = /\+?\b(?:\d[\s().-]?){10,15}\b/gu;
+const HIGH_ENTROPY_PATTERN = /\b[A-Za-z0-9_./+=-]{40,}\b/gu;
+
+type StoredLogsFile = {
+  createdAt: string;
+  expiresAt: string;
+  entries: CodeModeLogEntry[];
+};
+
+export type CodeModeLogStoreOptions = {
+  stateDir?: string;
+  now?: () => Date;
+  logRefTtlMs?: number;
+};
+
+export type StoreCodeModeLogsResult = {
+  logRef: string;
+  expiresAt: string;
+};
+
+export class CodeModeLogStore {
+  private readonly stateDir: string;
+  private readonly now: () => Date;
+  private readonly logRefTtlMs: number;
+
+  constructor(options: CodeModeLogStoreOptions = {}) {
+    this.stateDir = options.stateDir ?? join(defaultStateBaseDir(), "caplets");
+    this.now = options.now ?? (() => new Date());
+    this.logRefTtlMs = options.logRefTtlMs ?? DEFAULT_LOG_REF_TTL_MS;
+  }
+
+  async store(entries: CodeModeLogEntry[]): Promise<StoreCodeModeLogsResult> {
+    mkdirSync(this.logsDir(), { recursive: true });
+    const logRef = randomBytes(24).toString("hex");
+    const now = this.now();
+    const expiresAt = new Date(now.getTime() + this.logRefTtlMs).toISOString();
+    const stored: StoredLogsFile = {
+      createdAt: now.toISOString(),
+      expiresAt,
+      entries: entries.map(redactEntry),
+    };
+    writeFileSync(this.logPath(logRef), `${JSON.stringify(stored, null, 2)}\n`, "utf8");
+    return { logRef, expiresAt };
+  }
+
+  async read(input: ReadLogsInput): Promise<ReadLogsResult> {
+    if (!/^[a-f0-9]{48}$/u.test(input.logRef)) {
+      return { entries: [] };
+    }
+    const path = this.logPath(input.logRef);
+    if (!existsSync(path)) {
+      return { entries: [] };
+    }
+    const parsed = parseStoredLogs(readFileSync(path, "utf8"));
+    if (!parsed || new Date(parsed.expiresAt).getTime() <= this.now().getTime()) {
+      return { entries: [] };
+    }
+    const offset = parseCursor(input.cursor);
+    const limit = Math.min(Math.max(input.limit ?? DEFAULT_PAGE_LIMIT, 0), MAX_PAGE_LIMIT);
+    const entries = parsed.entries.slice(offset, offset + limit).map(redactEntry);
+    const nextOffset = offset + entries.length;
+    return nextOffset < parsed.entries.length
+      ? { entries, nextCursor: String(nextOffset) }
+      : { entries };
+  }
+
+  private logsDir(): string {
+    return join(this.stateDir, "code-mode", "logs");
+  }
+
+  private logPath(logRef: string): string {
+    return join(this.logsDir(), `${logRef}.json`);
+  }
+}
+
+export function redactCodeModeLogText(text: string): string {
+  return text
+    .replace(BEARER_PATTERN, (match, value: string) => match.replace(value, "[REDACTED:token]"))
+    .replace(BASIC_PATTERN, (match, value: string) => match.replace(value, "[REDACTED:token]"))
+    .replace(SECRET_KEY_VALUE_PATTERN, (match, value: string) =>
+      match.replace(value, "[REDACTED:credential]"),
+    )
+    .replace(SIGNED_URL_PARAM_PATTERN, "$1[REDACTED:token]")
+    .replace(EMAIL_PATTERN, "[REDACTED:email]")
+    .replace(SSN_PATTERN, "[REDACTED:ssn]")
+    .replace(CREDIT_CARD_PATTERN, (match) =>
+      match.replace(/\D/gu, "").length >= 13 ? "[REDACTED:credit-card]" : match,
+    )
+    .replace(PHONE_PATTERN, (match) =>
+      match.replace(/\D/gu, "").length >= 10 ? "[REDACTED:phone]" : match,
+    )
+    .replace(HIGH_ENTROPY_PATTERN, "[REDACTED:credential]");
+}
+
+function redactEntry(entry: CodeModeLogEntry): CodeModeLogEntry {
+  return { ...entry, message: redactCodeModeLogText(entry.message) };
+}
+
+function parseCursor(cursor: string | undefined): number {
+  if (!cursor) {
+    return 0;
+  }
+  const parsed = Number.parseInt(cursor, 10);
+  return Number.isFinite(parsed) && parsed > 0 ? parsed : 0;
+}
+
+function parseStoredLogs(raw: string): StoredLogsFile | undefined {
+  try {
+    const parsed = JSON.parse(raw) as Partial<StoredLogsFile>;
+    if (
+      typeof parsed.createdAt !== "string" ||
+      typeof parsed.expiresAt !== "string" ||
+      !Array.isArray(parsed.entries)
+    ) {
+      return undefined;
+    }
+    return {
+      createdAt: parsed.createdAt,
+      expiresAt: parsed.expiresAt,
+      entries: parsed.entries.filter(isLogEntry).map(redactEntry),
+    };
+  } catch {
+    return undefined;
+  }
+}
+
+function isLogEntry(value: unknown): value is CodeModeLogEntry {
+  if (!value || typeof value !== "object" || Array.isArray(value)) {
+    return false;
+  }
+  const entry = value as Partial<CodeModeLogEntry>;
+  return (
+    (entry.level === "log" ||
+      entry.level === "info" ||
+      entry.level === "warn" ||
+      entry.level === "error" ||
+      entry.level === "debug") &&
+    typeof entry.message === "string" &&
+    typeof entry.timestamp === "string"
+  );
+}
diff --git a/packages/core/src/code-mode/runner.ts b/packages/core/src/code-mode/runner.ts
new file mode 100644
index 0000000..09e5f09
--- /dev/null
+++ b/packages/core/src/code-mode/runner.ts
@@ -0,0 +1,248 @@
+import { randomUUID } from "node:crypto";
+import type { NativeCapletsService } from "../native/service";
+import { createCodeModeCapletsApi, listCodeModeCallableCaplets } from "./api";
+import { codeModeDeclarationHash, generateCodeModeDeclarations } from "./declarations";
+import { diagnoseCodeModeTypeScript } from "./diagnostics";
+import { CodeModeLogStore, redactCodeModeLogText } from "./logs";
+import { QuickJsCodeModeSandbox, type CodeModeSandbox } from "./sandbox";
+import type {
+  CodeModeDiagnostic,
+  CodeModeLogEntry,
+  CodeModeLogs,
+  CodeModeRunEnvelope,
+  JsonValue,
+} from "./types";
+
+const DEFAULT_TIMEOUT_MS = 10_000;
+const DEFAULT_MAX_TIMEOUT_MS = Number.MAX_SAFE_INTEGER;
+const DEFAULT_RETURNED_LOG_BYTES = 12 * 1024;
+
+export type RunCodeModeInput = {
+  code: string;
+  service: NativeCapletsService;
+  timeoutMs?: number;
+  maxTimeoutMs?: number;
+  runtimeScope?: string;
+  logStore?: CodeModeLogStore;
+  sandbox?: CodeModeSandbox;
+  returnedLogBytes?: number;
+};
+
+export async function runCodeMode(input: RunCodeModeInput): Promise<CodeModeRunEnvelope> {
+  const startedAt = Date.now();
+  const timeoutMs = input.timeoutMs ?? DEFAULT_TIMEOUT_MS;
+  const maxTimeoutMs = input.maxTimeoutMs ?? DEFAULT_MAX_TIMEOUT_MS;
+  const callable = listCodeModeCallableCaplets(input.service);
+  const declaration = generateCodeModeDeclarations({ caplets: callable });
+  const declarationHash = codeModeDeclarationHash(declaration);
+  const metaBase = {
+    runId: randomUUID(),
+    traceId: randomUUID(),
+    declarationHash,
+    timeoutMs,
+    maxTimeoutMs,
+  };
+
+  const diagnostics =
+    timeoutMs > maxTimeoutMs
+      ? [
+          {
+            code: "TIMEOUT_POLICY_EXCEEDED",
+            severity: "error" as const,
+            message: `timeoutMs must be <= ${maxTimeoutMs}.`,
+          },
+        ]
+      : diagnoseCodeModeTypeScript({ code: input.code, declaration });
+  if (diagnostics.some((diagnostic) => diagnostic.severity === "error")) {
+    return {
+      ok: false,
+      error: {
+        code: "diagnostic_blocked",
+        message: "Code Mode diagnostics failed before execution.",
+      },
+      diagnostics,
+      logs: emptyLogs(),
+      meta: { ...metaBase, durationMs: Date.now() - startedAt },
+    };
+  }
+
+  const capturedLogs: CodeModeLogEntry[] = [];
+  const api = createCodeModeCapletsApi({
+    service: input.service,
+    readLogs: async (readInput) => input.logStore?.read(readInput) ?? { entries: [] },
+  });
+  const sandbox = input.sandbox ?? new QuickJsCodeModeSandbox();
+  const result = await sandbox.run({
+    code: input.code,
+    capletIds: callable.map((caplet) => caplet.id),
+    timeoutMs,
+    invoke: async ({ capletId, method, args }) => {
+      if (method === "readLogs") {
+        return await api.debug.readLogs(args[0] as never);
+      }
+      const handle = api[capletId];
+      if (!handle || !("callTool" in handle)) {
+        throw new Error(`Caplet ${capletId} is not available.`);
+      }
+      if (method === "inspect") return await handle.inspect();
+      if (method === "check") return await handle.check();
+      if (method === "tools") return await handle.tools(args[0] as never);
+      if (method === "searchTools")
+        return await handle.searchTools(String(args[0]), args[1] as never);
+      if (method === "describeTool") return await handle.describeTool(String(args[0]));
+      if (method === "callTool") return await handle.callTool(String(args[0]), args[1]);
+      if (method === "resources") return await handle.resources(args[0] as never);
+      if (method === "searchResources") {
+        return await handle.searchResources(String(args[0]), args[1] as never);
+      }
+      if (method === "resourceTemplates") return await handle.resourceTemplates(args[0] as never);
+      if (method === "readResource") return await handle.readResource(String(args[0]));
+      if (method === "prompts") return await handle.prompts(args[0] as never);
+      if (method === "searchPrompts") {
+        return await handle.searchPrompts(String(args[0]), args[1] as never);
+      }
+      if (method === "getPrompt") return await handle.getPrompt(String(args[0]), args[1]);
+      if (method === "complete") return await handle.complete(args[0]);
+      throw new Error(`Unknown Code Mode CapletHandle method: ${method}.`);
+    },
+  });
+  capturedLogs.push(...result.logs.map(redactLogEntry));
+  const logs = await buildLogs(capturedLogs, input.logStore, input.returnedLogBytes);
+  if (!result.ok) {
+    return {
+      ok: false,
+      error: codeModeRuntimeError(result.error, result.stack),
+      diagnostics,
+      logs,
+      meta: { ...metaBase, durationMs: Date.now() - startedAt },
+    };
+  }
+
+  const serialized = serializeJsonValue(result.value);
+  if (!serialized.ok) {
+    const serializationDiagnostic: CodeModeDiagnostic = {
+      code: "SERIALIZATION_ERROR",
+      severity: "error",
+      message: serialized.message,
+    };
+    return {
+      ok: false,
+      error: {
+        code: "SERIALIZATION_ERROR",
+        message: serialized.message,
+      },
+      diagnostics: [...diagnostics, serializationDiagnostic],
+      logs,
+      meta: { ...metaBase, durationMs: Date.now() - startedAt },
+    };
+  }
+
+  return {
+    ok: true,
+    value: serialized.value,
+    diagnostics,
+    logs,
+    meta: { ...metaBase, durationMs: Date.now() - startedAt },
+  };
+}
+
+function codeModeRuntimeError(message: string, stack?: string) {
+  const location = userCodeLocation(stack);
+  const stackPreview =
+    location === undefined
+      ? undefined
+      : [`at user code line ${location.line} column ${location.column}`];
+  const code = runtimeErrorCode(message);
+  return {
+    code,
+    message,
+    ...(location === undefined ? {} : { location }),
+    ...(stackPreview === undefined ? {} : { stackPreview }),
+    ...(code === "sandbox_type_error"
+      ? {
+          hint: "Check CapletHandle method names: inspect, check, tools, searchTools, describeTool, callTool, resources, searchResources, resourceTemplates, readResource, prompts, searchPrompts, getPrompt, complete.",
+        }
+      : {}),
+  };
+}
+
+function runtimeErrorCode(message: string): string {
+  if (/timed out|interrupted/iu.test(message)) return "sandbox_timeout";
+  if (
+    /fetch is disabled|imports? are not available|require is not defined|process is not defined/iu.test(
+      message,
+    )
+  ) {
+    return "sandbox_forbidden_global";
+  }
+  if (/is not a function|Cannot read properties|undefined is not an object/iu.test(message)) {
+    return "sandbox_type_error";
+  }
+  if (/is not defined|ReferenceError/iu.test(message)) return "sandbox_reference_error";
+  if (/Unknown Code Mode CapletHandle method/iu.test(message)) return "runtime_bridge_error";
+  return "sandbox_error";
+}
+
+function userCodeLocation(stack: string | undefined): { line: number; column: number } | undefined {
+  if (!stack) return undefined;
+  const match = /<anonymous>:(\d+):(\d+)/u.exec(stack) ?? /eval.*?:(\d+):(\d+)/u.exec(stack);
+  if (!match) return undefined;
+  const line = Number.parseInt(match[1] ?? "0", 10);
+  const column = Number.parseInt(match[2] ?? "0", 10);
+  return line > 0 && column > 0 ? { line, column } : undefined;
+}
+
+function serializeJsonValue(
+  value: unknown,
+): { ok: true; value: JsonValue } | { ok: false; message: string } {
+  try {
+    const serialized = JSON.stringify(value);
+    if (serialized === undefined) {
+      return { ok: false, message: "Code Mode return value must be JSON-serializable." };
+    }
+    return { ok: true, value: JSON.parse(serialized) as JsonValue };
+  } catch (error) {
+    return {
+      ok: false,
+      message: error instanceof Error ? error.message : "Return value is not JSON-serializable.",
+    };
+  }
+}
+
+async function buildLogs(
+  entries: CodeModeLogEntry[],
+  store: CodeModeLogStore | undefined,
+  returnedLogBytes = DEFAULT_RETURNED_LOG_BYTES,
+): Promise<CodeModeLogs> {
+  const bounded: CodeModeLogEntry[] = [];
+  let bytes = 0;
+  let truncated = false;
+  for (const entry of entries) {
+    const nextBytes = Buffer.byteLength(entry.message, "utf8");
+    if (bytes + nextBytes > returnedLogBytes) {
+      truncated = true;
+      break;
+    }
+    bounded.push(entry);
+    bytes += nextBytes;
+  }
+  if (!store) {
+    return { entries: bounded, truncated, stored: false };
+  }
+  const stored = await store.store(entries);
+  return {
+    entries: bounded,
+    truncated,
+    stored: true,
+    logRef: stored.logRef,
+    expiresAt: stored.expiresAt,
+  };
+}
+
+function emptyLogs(): CodeModeLogs {
+  return { entries: [], truncated: false, stored: false };
+}
+
+function redactLogEntry(entry: CodeModeLogEntry): CodeModeLogEntry {
+  return { ...entry, message: redactCodeModeLogText(entry.message) };
+}
diff --git a/packages/core/src/code-mode/runtime-api.d.ts b/packages/core/src/code-mode/runtime-api.d.ts
new file mode 100644
index 0000000..2dcd402
--- /dev/null
+++ b/packages/core/src/code-mode/runtime-api.d.ts
@@ -0,0 +1,140 @@
+export {};
+
+type JsonPrimitive = string | number | boolean | null;
+type JsonValue = JsonPrimitive | JsonValue[] | { [key: string]: JsonValue };
+
+interface CapletHandle<Id extends string> {
+  readonly id: Id;
+  /** Show this Caplet card, without tool/resource/prompt schemas. */
+  inspect(): Promise<CapletCard<Id>>;
+  /** Check backend readiness/auth; expected unavailable states return ok:false. */
+  check(): Promise<CapletsResult<BackendCheckResult>>;
+  /** List tool summaries for the discovery pass; may be empty. */
+  tools(input?: PageInput): Promise<Page<ToolSummary>>;
+  /** Search tool summaries for the discovery pass; may be empty. */
+  searchTools(query: string, input?: PageInput): Promise<Page<ToolSummary>>;
+  /** Get schema, callSignature, types, examples; prefer outputSchema/outputTypeScript over observed hints. */
+  describeTool(name: string): Promise<CapletsResult<ToolDescriptor>>;
+  /** Call one tool; expected failures return ok:false. Filter bulky data in script before returning. */
+  callTool(name: string, args?: unknown): Promise<CapletsResult<unknown>>;
+  /** List readable resources for the discovery pass; many backends expose none. */
+  resources(input?: PageInput): Promise<Page<ResourceSummary>>;
+  /** Search readable resources for the discovery pass; many backends expose none. */
+  searchResources(query: string, input?: PageInput): Promise<Page<ResourceSummary>>;
+  /** List resource templates for the discovery pass; many backends expose none. */
+  resourceTemplates(input?: PageInput): Promise<Page<ResourceTemplateSummary>>;
+  /** Read one resource by URI; unsupported/missing resources return ok:false. */
+  readResource(uri: string): Promise<CapletsResult<ResourceReadResult>>;
+  /** List reusable prompts for the discovery pass; many backends expose none. */
+  prompts(input?: PageInput): Promise<Page<PromptSummary>>;
+  /** Search reusable prompts for the discovery pass; many backends expose none. */
+  searchPrompts(query: string, input?: PageInput): Promise<Page<PromptSummary>>;
+  /** Get one prompt by name and args; unsupported/missing prompts return ok:false. */
+  getPrompt(name: string, args?: unknown): Promise<CapletsResult<PromptResult>>;
+  /** Complete a prompt or resource-template argument. */
+  complete(input: CompleteInput): Promise<CapletsResult<CompleteResult>>;
+}
+
+interface DebugApi {
+  readLogs(input: ReadLogsInput): Promise<ReadLogsResult>;
+}
+
+type CapletCard<Id extends string> = {
+  id: Id;
+  name: string;
+  description: string;
+  useWhen?: string;
+  avoidWhen?: string;
+  tags?: string[];
+  backend?: unknown;
+};
+
+type PageInput = { limit?: number; cursor?: string };
+type Page<T> = { items: T[]; nextCursor?: string; truncated?: boolean };
+type CapletsResult<T> =
+  | { ok: true; data: T; meta?: CapletsMeta }
+  | { ok: false; error: CapletsError; meta?: CapletsMeta };
+type CapletsMeta = { [key: string]: unknown };
+type CapletsError = { code: string; message: string; details?: unknown };
+type BackendCheckResult = unknown;
+type ToolSummary = {
+  /** Exact downstream tool identifier for describeTool(name) and callTool(name,args). */
+  name: string;
+  title?: string;
+  description?: string;
+  /** Optional author-supplied hint for when to prefer this tool. */
+  useWhen?: string;
+  /** Optional author-supplied hint for when to avoid this tool. */
+  avoidWhen?: string;
+  /** True when the tool declares that it only reads data. */
+  readOnlyHint?: boolean;
+  /** True when the tool declares that it may perform destructive writes. */
+  destructiveHint?: boolean;
+};
+type ToolDescriptor = {
+  id?: string;
+  tool?: unknown;
+  inputSchema?: unknown;
+  outputSchema?: unknown;
+  callSignature?: string;
+  inputTypeScript?: string;
+  outputTypeScript?: string;
+  observedOutputShape?: ObservedOutputShape;
+  examples?: unknown[];
+};
+
+type ObservedOutputShape = {
+  version: 1;
+  source: "observed";
+  observedAt: string;
+  sampleCount: number;
+  typeScript: string;
+  jsonShape: JsonShape;
+  truncated: boolean;
+};
+
+type JsonShape =
+  | { kind: "null" }
+  | { kind: "boolean" }
+  | { kind: "number" }
+  | { kind: "string" }
+  | { kind: "unknown" }
+  | { kind: "array"; element?: JsonShape; truncated?: boolean }
+  | {
+      kind: "object";
+      fields: Record<string, { optional: boolean; shape: JsonShape }>;
+      truncated?: boolean;
+    }
+  | { kind: "union"; variants: JsonShape[] };
+type ResourceSummary = { uri?: string; name?: string; title?: string; description?: string };
+type ResourceTemplateSummary = {
+  uriTemplate?: string;
+  name?: string;
+  title?: string;
+  description?: string;
+};
+type ResourceReadResult = unknown;
+type PromptSummary = { name?: string; title?: string; description?: string };
+type PromptResult = unknown;
+type CompleteInput = {
+  ref: { type: "prompt"; name: string } | { type: "resourceTemplate"; uri: string };
+  argument: { name: string; value: string };
+};
+type CompleteResult = unknown;
+
+type ReadLogsInput = { logRef: string; cursor?: string; limit?: number };
+type ReadLogsResult = { entries: CodeModeLogEntry[]; nextCursor?: string };
+type CodeModeLogEntry = {
+  level: "log" | "info" | "warn" | "error" | "debug";
+  message: string;
+  timestamp: string;
+};
+
+interface Console {
+  log(...values: unknown[]): void;
+  info(...values: unknown[]): void;
+  warn(...values: unknown[]): void;
+  error(...values: unknown[]): void;
+  debug(...values: unknown[]): void;
+}
+declare const console: Console;
diff --git a/packages/core/src/code-mode/runtime-api.generated.ts b/packages/core/src/code-mode/runtime-api.generated.ts
new file mode 100644
index 0000000..714a9fe
--- /dev/null
+++ b/packages/core/src/code-mode/runtime-api.generated.ts
@@ -0,0 +1,3 @@
+// Generated by scripts/generate-code-mode-runtime-api.mjs. Do not edit by hand.
+export const CODE_MODE_RUNTIME_API_DECLARATION =
+  'type JsonPrimitive=string|number|boolean|null;type JsonValue=JsonPrimitive|JsonValue[]|{[key:string]:JsonValue};interface CapletHandle<Id extends string>{readonly id:Id;/** Show this Caplet card,without tool/resource/prompt schemas. */ inspect():Promise<CapletCard<Id>>;/** Check backend readiness/auth;expected unavailable states return ok:false. */ check():Promise<CapletsResult<BackendCheckResult>>;/** List tool summaries for the discovery pass;may be empty. */ tools(input?:PageInput):Promise<Page<ToolSummary>>;/** Search tool summaries for the discovery pass;may be empty. */ searchTools(query:string,input?:PageInput):Promise<Page<ToolSummary>>;/** Get schema,callSignature,types,examples;prefer outputSchema/outputTypeScript over observed hints. */ describeTool(name:string):Promise<CapletsResult<ToolDescriptor>>;/** Call one tool;expected failures return ok:false. Filter bulky data in script before returning. */ callTool(name:string,args?:unknown):Promise<CapletsResult<unknown>>;/** List readable resources for the discovery pass;many backends expose none. */ resources(input?:PageInput):Promise<Page<ResourceSummary>>;/** Search readable resources for the discovery pass;many backends expose none. */ searchResources(query:string,input?:PageInput):Promise<Page<ResourceSummary>>;/** List resource templates for the discovery pass;many backends expose none. */ resourceTemplates(input?:PageInput):Promise<Page<ResourceTemplateSummary>>;/** Read one resource by URI;unsupported/missing resources return ok:false. */ readResource(uri:string):Promise<CapletsResult<ResourceReadResult>>;/** List reusable prompts for the discovery pass;many backends expose none. */ prompts(input?:PageInput):Promise<Page<PromptSummary>>;/** Search reusable prompts for the discovery pass;many backends expose none. */ searchPrompts(query:string,input?:PageInput):Promise<Page<PromptSummary>>;/** Get one prompt by name and args;unsupported/missing prompts return ok:false. */ getPrompt(name:string,args?:unknown):Promise<CapletsResult<PromptResult>>;/** Complete a prompt or resource-template argument. */ complete(input:CompleteInput):Promise<CapletsResult<CompleteResult>>;}interface DebugApi{readLogs(input:ReadLogsInput):Promise<ReadLogsResult>;}type CapletCard<Id extends string>={id:Id;name:string;description:string;useWhen?:string;avoidWhen?:string;tags?:string[];backend?:unknown;};type PageInput={limit?:number;cursor?:string};type Page<T>={items:T[];nextCursor?:string;truncated?:boolean};type CapletsResult<T>=|{ok:true;data:T;meta?:CapletsMeta}|{ok:false;error:CapletsError;meta?:CapletsMeta};type CapletsMeta={[key:string]:unknown};type CapletsError={code:string;message:string;details?:unknown};type BackendCheckResult=unknown;type ToolSummary={/** Exact downstream tool identifier for describeTool(name)and callTool(name,args). */ name:string;title?:string;description?:string;/** Optional author-supplied hint for when to prefer this tool. */ useWhen?:string;/** Optional author-supplied hint for when to avoid this tool. */ avoidWhen?:string;/** True when the tool declares that it only reads data. */ readOnlyHint?:boolean;/** True when the tool declares that it may perform destructive writes. */ destructiveHint?:boolean;};type ToolDescriptor={id?:string;tool?:unknown;inputSchema?:unknown;outputSchema?:unknown;callSignature?:string;inputTypeScript?:string;outputTypeScript?:string;observedOutputShape?:ObservedOutputShape;examples?:unknown[];};type ObservedOutputShape={version:1;source:"observed";observedAt:string;sampleCount:number;typeScript:string;jsonShape:JsonShape;truncated:boolean;};type JsonShape=|{kind:"null"}|{kind:"boolean"}|{kind:"number"}|{kind:"string"}|{kind:"unknown"}|{kind:"array";element?:JsonShape;truncated?:boolean}|{kind:"object";fields:Record<string,{optional:boolean;shape:JsonShape}>;truncated?:boolean;}|{kind:"union";variants:JsonShape[]};type ResourceSummary={uri?:string;name?:string;title?:string;description?:string};type ResourceTemplateSummary={uriTemplate?:string;name?:string;title?:string;description?:string;};type ResourceReadResult=unknown;type PromptSummary={name?:string;title?:string;description?:string};type PromptResult=unknown;type CompleteInput={ref:{type:"prompt";name:string}|{type:"resourceTemplate";uri:string};argument:{name:string;value:string};};type CompleteResult=unknown;type ReadLogsInput={logRef:string;cursor?:string;limit?:number};type ReadLogsResult={entries:CodeModeLogEntry[];nextCursor?:string};type CodeModeLogEntry={level:"log"|"info"|"warn"|"error"|"debug";message:string;timestamp:string;};interface Console{log(...values:unknown[]):void;info(...values:unknown[]):void;warn(...values:unknown[]):void;error(...values:unknown[]):void;debug(...values:unknown[]):void;}declare const console:Console;' as const;
diff --git a/packages/core/src/code-mode/sandbox.ts b/packages/core/src/code-mode/sandbox.ts
new file mode 100644
index 0000000..0771eda
--- /dev/null
+++ b/packages/core/src/code-mode/sandbox.ts
@@ -0,0 +1,369 @@
+import {
+  getQuickJS,
+  shouldInterruptAfterDeadline,
+  type QuickJSContext,
+  type QuickJSDeferredPromise,
+  type QuickJSHandle,
+  type QuickJSRuntime,
+} from "quickjs-emscripten";
+import ts from "typescript";
+import type { CodeModeLogEntry } from "./types";
+
+export type CodeModeSandboxInvokeInput = {
+  capletId: string;
+  method:
+    | "inspect"
+    | "check"
+    | "tools"
+    | "searchTools"
+    | "describeTool"
+    | "callTool"
+    | "resources"
+    | "searchResources"
+    | "resourceTemplates"
+    | "readResource"
+    | "prompts"
+    | "searchPrompts"
+    | "getPrompt"
+    | "complete"
+    | "readLogs";
+  args: unknown[];
+};
+
+export type CodeModeSandboxInput = {
+  code: string;
+  capletIds: string[];
+  timeoutMs: number;
+  invoke: (input: CodeModeSandboxInvokeInput) => Promise<unknown>;
+};
+
+export type CodeModeSandboxResult =
+  | { ok: true; value: unknown; logs: CodeModeLogEntry[] }
+  | { ok: false; error: string; logs: CodeModeLogEntry[]; stack?: string };
+
+export interface CodeModeSandbox {
+  run(input: CodeModeSandboxInput): Promise<CodeModeSandboxResult>;
+}
+
+export class QuickJsCodeModeSandbox implements CodeModeSandbox {
+  async run(input: CodeModeSandboxInput): Promise<CodeModeSandboxResult> {
+    return await evaluateInQuickJs(input);
+  }
+}
+
+async function evaluateInQuickJs(input: CodeModeSandboxInput): Promise<CodeModeSandboxResult> {
+  const timeoutMs = Math.max(100, input.timeoutMs);
+  const deadlineMs = Date.now() + timeoutMs;
+  const logs: CodeModeLogEntry[] = [];
+  const pendingDeferreds = new Set<QuickJSDeferredPromise>();
+  const QuickJS = await getQuickJS();
+  const runtime = QuickJS.newRuntime();
+  runtime.setInterruptHandler(shouldInterruptAfterDeadline(deadlineMs));
+  runtime.setMemoryLimit(64 * 1024 * 1024);
+  runtime.setMaxStackSize(1 * 1024 * 1024);
+
+  try {
+    const context = runtime.newContext();
+    try {
+      const logBridge = context.newFunction("__caplets_log", (levelHandle, messageHandle) => {
+        logs.push({
+          level: logLevel(context.getString(levelHandle)),
+          message: context.getString(messageHandle),
+          timestamp: new Date().toISOString(),
+        });
+        return context.undefined;
+      });
+      context.setProp(context.global, "__caplets_log", logBridge);
+      logBridge.dispose();
+
+      const invokeBridge = createInvokeBridge(
+        context,
+        pendingDeferreds,
+        input.invoke,
+        deadlineMs,
+        timeoutMs,
+      );
+      context.setProp(context.global, "__caplets_invoke", invokeBridge);
+      invokeBridge.dispose();
+
+      const evaluated = context.evalCode(buildExecutionSource(input.code, input.capletIds));
+      if (evaluated.error) {
+        const error = context.dump(evaluated.error);
+        evaluated.error.dispose();
+        return {
+          ok: false,
+          error: normalizeError(error, deadlineMs, timeoutMs),
+          logs,
+          ...optionalStack(stackFromDump(error)),
+        };
+      }
+
+      context.setProp(context.global, "__caplets_result", evaluated.value);
+      evaluated.value.dispose();
+
+      const stateResult = context.evalCode(
+        [
+          "(function(p) {",
+          "  var s = { settled: false, value: void 0, error: void 0 };",
+          "  var formatError = function(e) {",
+          "    if (e && typeof e === 'object' && typeof e.message === 'string') return e.message;",
+          "    return String(e);",
+          "  };",
+          "  p.then(function(value) { s.value = value; s.settled = true; },",
+          "         function(error) { s.error = formatError(error); s.settled = true; });",
+          "  return s;",
+          "})(__caplets_result)",
+        ].join("\n"),
+      );
+      if (stateResult.error) {
+        const error = context.dump(stateResult.error);
+        stateResult.error.dispose();
+        return {
+          ok: false,
+          error: normalizeError(error, deadlineMs, timeoutMs),
+          logs,
+          ...optionalStack(stackFromDump(error)),
+        };
+      }
+
+      const stateHandle = stateResult.value;
+      try {
+        await drainAsync(context, runtime, pendingDeferreds, deadlineMs, timeoutMs);
+        const settled = readProp(context, stateHandle, "settled") === true;
+        if (!settled) {
+          return { ok: false, error: timeoutMessage(timeoutMs), logs };
+        }
+        const error = readProp(context, stateHandle, "error");
+        if (typeof error !== "undefined") {
+          return { ok: false, error: normalizeError(error, deadlineMs, timeoutMs), logs };
+        }
+        return { ok: true, value: readProp(context, stateHandle, "value"), logs };
+      } finally {
+        stateHandle.dispose();
+      }
+    } finally {
+      for (const deferred of pendingDeferreds) {
+        if (deferred.alive) {
+          deferred.dispose();
+        }
+      }
+      pendingDeferreds.clear();
+      context.dispose();
+    }
+  } catch (error) {
+    return {
+      ok: false,
+      error: normalizeError(error, deadlineMs, timeoutMs),
+      logs,
+      ...optionalStack(stackFromError(error)),
+    };
+  } finally {
+    runtime.dispose();
+  }
+}
+
+function createInvokeBridge(
+  context: QuickJSContext,
+  pendingDeferreds: Set<QuickJSDeferredPromise>,
+  invoke: (input: CodeModeSandboxInvokeInput) => Promise<unknown>,
+  deadlineMs: number,
+  timeoutMs: number,
+): QuickJSHandle {
+  return context.newFunction("__caplets_invoke", (capletHandle, methodHandle, argsHandle) => {
+    const capletId = context.getString(capletHandle);
+    const method = context.getString(methodHandle) as CodeModeSandboxInvokeInput["method"];
+    const args = context.dump(argsHandle) as unknown[];
+    const deferred = context.newPromise();
+    pendingDeferreds.add(deferred);
+    deferred.settled.finally(() => pendingDeferreds.delete(deferred));
+
+    void invoke({ capletId, method, args }).then(
+      (value) => {
+        if (!deferred.alive) {
+          return;
+        }
+        try {
+          const serialized = JSON.stringify(value);
+          const valueHandle = context.newString(serialized === undefined ? "null" : serialized);
+          deferred.resolve(valueHandle);
+          valueHandle.dispose();
+        } catch (error) {
+          const errorHandle = context.newError(errorMessage(error));
+          deferred.reject(errorHandle);
+          errorHandle.dispose();
+        }
+      },
+      (error) => {
+        if (!deferred.alive) {
+          return;
+        }
+        const message = Date.now() >= deadlineMs ? timeoutMessage(timeoutMs) : errorMessage(error);
+        const errorHandle = context.newError(message);
+        deferred.reject(errorHandle);
+        errorHandle.dispose();
+      },
+    );
+    return deferred.handle;
+  });
+}
+
+function buildExecutionSource(code: string, capletIds: string[]): string {
+  const javascript = ts.transpileModule(code, {
+    compilerOptions: {
+      target: ts.ScriptTarget.ES2022,
+      module: ts.ModuleKind.ESNext,
+      importsNotUsedAsValues: ts.ImportsNotUsedAsValues.Remove,
+    },
+  }).outputText;
+  return [
+    '"use strict";',
+    "const __formatLogArg = (value) => {",
+    "  if (typeof value === 'string') return value;",
+    "  try { return JSON.stringify(value); } catch { return String(value); }",
+    "};",
+    "const __formatLogLine = (args) => args.map(__formatLogArg).join(' ');",
+    "const console = {",
+    "  log: (...args) => __caplets_log('log', __formatLogLine(args)),",
+    "  info: (...args) => __caplets_log('info', __formatLogLine(args)),",
+    "  warn: (...args) => __caplets_log('warn', __formatLogLine(args)),",
+    "  error: (...args) => __caplets_log('error', __formatLogLine(args)),",
+    "  debug: (...args) => __caplets_log('debug', __formatLogLine(args)),",
+    "};",
+    "const fetch = () => { throw new Error('fetch is disabled in Code Mode'); };",
+    "const __invoke = (capletId, method, args) => Promise.resolve(__caplets_invoke(capletId, method, args)).then(JSON.parse);",
+    "const __handle = (capletId) => ({",
+    "  id: capletId,",
+    "  inspect: () => __invoke(capletId, 'inspect', []),",
+    "  check: () => __invoke(capletId, 'check', []),",
+    "  tools: (input) => __invoke(capletId, 'tools', [input]),",
+    "  searchTools: (query, input) => __invoke(capletId, 'searchTools', [query, input]),",
+    "  describeTool: (name) => __invoke(capletId, 'describeTool', [name]),",
+    "  callTool: (name, args) => __invoke(capletId, 'callTool', [name, args]),",
+    "  resources: (input) => __invoke(capletId, 'resources', [input]),",
+    "  searchResources: (query, input) => __invoke(capletId, 'searchResources', [query, input]),",
+    "  resourceTemplates: (input) => __invoke(capletId, 'resourceTemplates', [input]),",
+    "  readResource: (uri) => __invoke(capletId, 'readResource', [uri]),",
+    "  prompts: (input) => __invoke(capletId, 'prompts', [input]),",
+    "  searchPrompts: (query, input) => __invoke(capletId, 'searchPrompts', [query, input]),",
+    "  getPrompt: (name, args) => __invoke(capletId, 'getPrompt', [name, args]),",
+    "  complete: (input) => __invoke(capletId, 'complete', [input]),",
+    "});",
+    "const caplets = {};",
+    ...capletIds.map(
+      (capletId) => `caplets[${JSON.stringify(capletId)}] = __handle(${JSON.stringify(capletId)});`,
+    ),
+    "caplets.debug = caplets.debug || {};",
+    "caplets.debug.readLogs = (input) => __invoke('debug', 'readLogs', [input]);",
+    "(async () => {",
+    javascript,
+    "})()",
+  ].join("\n");
+}
+
+async function drainAsync(
+  context: QuickJSContext,
+  runtime: QuickJSRuntime,
+  pendingDeferreds: ReadonlySet<QuickJSDeferredPromise>,
+  deadlineMs: number,
+  timeoutMs: number,
+): Promise<void> {
+  drainJobs(context, runtime, deadlineMs, timeoutMs);
+  while (pendingDeferreds.size > 0) {
+    await waitForDeferreds(pendingDeferreds, deadlineMs, timeoutMs);
+    drainJobs(context, runtime, deadlineMs, timeoutMs);
+  }
+  drainJobs(context, runtime, deadlineMs, timeoutMs);
+}
+
+function drainJobs(
+  context: QuickJSContext,
+  runtime: QuickJSRuntime,
+  deadlineMs: number,
+  timeoutMs: number,
+): void {
+  while (runtime.hasPendingJob()) {
+    if (Date.now() >= deadlineMs) {
+      throw new Error(timeoutMessage(timeoutMs));
+    }
+    const pending = runtime.executePendingJobs();
+    if (pending.error) {
+      const error = context.dump(pending.error);
+      pending.error.dispose();
+      throw new Error(errorMessage(error));
+    }
+  }
+}
+
+async function waitForDeferreds(
+  pendingDeferreds: ReadonlySet<QuickJSDeferredPromise>,
+  deadlineMs: number,
+  timeoutMs: number,
+): Promise<void> {
+  const remainingMs = deadlineMs - Date.now();
+  if (remainingMs <= 0) {
+    throw new Error(timeoutMessage(timeoutMs));
+  }
+  let timer: ReturnType<typeof setTimeout> | undefined;
+  try {
+    await Promise.race([
+      Promise.race([...pendingDeferreds].map((deferred) => deferred.settled)),
+      new Promise<never>((_, reject) => {
+        timer = setTimeout(() => reject(new Error(timeoutMessage(timeoutMs))), remainingMs);
+      }),
+    ]);
+  } finally {
+    if (timer) {
+      clearTimeout(timer);
+    }
+  }
+}
+
+function readProp(context: QuickJSContext, handle: QuickJSHandle, key: string): unknown {
+  const prop = context.getProp(handle, key);
+  try {
+    return context.dump(prop);
+  } finally {
+    prop.dispose();
+  }
+}
+
+function timeoutMessage(timeoutMs: number): string {
+  return `Code Mode execution timed out after ${timeoutMs}ms`;
+}
+
+function normalizeError(error: unknown, deadlineMs: number, timeoutMs: number): string {
+  const message = errorMessage(error);
+  return Date.now() >= deadlineMs && /\binterrupted\b/iu.test(message)
+    ? timeoutMessage(timeoutMs)
+    : message;
+}
+
+function errorMessage(error: unknown): string {
+  return error instanceof Error ? error.message : String(error);
+}
+
+function stackFromError(error: unknown): string | undefined {
+  return error instanceof Error ? error.stack : undefined;
+}
+
+function stackFromDump(error: unknown): string | undefined {
+  if (error && typeof error === "object" && "stack" in error) {
+    const stack = (error as { stack?: unknown }).stack;
+    return typeof stack === "string" ? stack : undefined;
+  }
+  return undefined;
+}
+
+function optionalStack(stack: string | undefined): { stack?: string } {
+  return stack === undefined ? {} : { stack };
+}
+
+function logLevel(value: string): CodeModeLogEntry["level"] {
+  return value === "info" ||
+    value === "warn" ||
+    value === "error" ||
+    value === "debug" ||
+    value === "log"
+    ? value
+    : "log";
+}
diff --git a/packages/core/src/code-mode/tool.ts b/packages/core/src/code-mode/tool.ts
new file mode 100644
index 0000000..5c967ac
--- /dev/null
+++ b/packages/core/src/code-mode/tool.ts
@@ -0,0 +1,36 @@
+import { z } from "zod";
+
+export const codeModeRunInputSchema = z.object({
+  code: z.string().describe("TypeScript Code Mode source to execute."),
+  timeoutMs: z
+    .number()
+    .int()
+    .positive()
+    .optional()
+    .describe("Optional execution timeout in milliseconds."),
+});
+
+export const codeModeRunParamsSchema = codeModeRunInputSchema.shape;
+
+export function codeModeRunInputJsonSchema(): Record<string, unknown> {
+  return {
+    type: "object",
+    properties: {
+      code: {
+        type: "string",
+        description: "TypeScript Code Mode source to execute.",
+      },
+      timeoutMs: {
+        type: "integer",
+        minimum: 1,
+        description: "Optional execution timeout in milliseconds.",
+      },
+    },
+    required: ["code"],
+    additionalProperties: false,
+  };
+}
+
+export function isCodeModeRunRequest(value: unknown): boolean {
+  return codeModeRunInputSchema.safeParse(value).success;
+}
diff --git a/packages/core/src/code-mode/types.ts b/packages/core/src/code-mode/types.ts
new file mode 100644
index 0000000..faacd4e
--- /dev/null
+++ b/packages/core/src/code-mode/types.ts
@@ -0,0 +1,122 @@
+export type JsonPrimitive = string | number | boolean | null;
+export type JsonValue = JsonPrimitive | JsonValue[] | { [key: string]: JsonValue };
+
+export type CodeModeCallableCaplet = {
+  id: string;
+  name: string;
+  description: string;
+  useWhen?: string;
+  avoidWhen?: string;
+};
+
+export type CodeModeDeclarationInput = {
+  caplets: CodeModeCallableCaplet[];
+};
+
+export type CodeModeTypesJson = {
+  declaration: string;
+  declarationHash: string;
+  callableCount: number;
+  generatedAt: string;
+  runtimeScope: string;
+};
+
+export type CodeModeDiagnostic = {
+  code: string;
+  message: string;
+  severity: "error" | "warning" | "info";
+  line?: number;
+  column?: number;
+};
+
+export type CodeModeRunMeta = {
+  runId: string;
+  traceId: string;
+  declarationHash: string;
+  durationMs: number;
+  timeoutMs: number;
+  maxTimeoutMs: number;
+};
+
+export type CodeModeRunError = {
+  code: string;
+  message: string;
+  details?: unknown;
+  location?: { line: number; column: number };
+  hint?: string;
+  stackPreview?: string[];
+};
+
+export type CodeModeLogEntry = {
+  level: "log" | "info" | "warn" | "error" | "debug";
+  message: string;
+  timestamp: string;
+};
+
+export type CodeModeLogs = {
+  entries: CodeModeLogEntry[];
+  truncated: boolean;
+  stored: boolean;
+  logRef?: string;
+  nextCursor?: string;
+  expiresAt?: string;
+};
+
+export type CodeModeRunEnvelope =
+  | {
+      ok: true;
+      value: JsonValue;
+      diagnostics: CodeModeDiagnostic[];
+      logs: CodeModeLogs;
+      meta: CodeModeRunMeta;
+    }
+  | {
+      ok: false;
+      error: CodeModeRunError;
+      diagnostics: CodeModeDiagnostic[];
+      logs: CodeModeLogs;
+      meta: CodeModeRunMeta;
+    };
+
+export type ToolCallMeta = {
+  capletId?: string;
+  tool?: string;
+  durationMs?: number;
+  [key: string]: unknown;
+};
+
+export type ToolCallError = {
+  code: string;
+  message: string;
+  details?: unknown;
+};
+
+export type ToolCallResult =
+  | { ok: true; data: unknown; meta?: ToolCallMeta }
+  | { ok: false; error: ToolCallError; meta?: ToolCallMeta };
+
+export type CapletsResult<T> =
+  | { ok: true; data: T; meta?: ToolCallMeta }
+  | { ok: false; error: ToolCallError; meta?: ToolCallMeta };
+
+export type Page<T> = {
+  items: T[];
+  nextCursor?: string;
+  truncated?: boolean;
+};
+
+export type PageInput = {
+  limit?: number;
+  cursor?: string;
+};
+
+export type ReadLogsInput = {
+  logRef: string;
+  cursor?: string;
+  limit?: number;
+};
+
+export type ReadLogsResult = {
+  entries: CodeModeLogEntry[];
+  nextCursor?: string;
+};
diff --git a/packages/core/src/config-runtime.ts b/packages/core/src/config-runtime.ts
index 48cc63c..1b670c9 100644
--- a/packages/core/src/config-runtime.ts
+++ b/packages/core/src/config-runtime.ts
@@ -53,6 +53,11 @@ export type RuntimeRequirementsConfig = {
   resources?: { class?: RuntimeResourceClass | undefined } | undefined;
 };
 
+export type AgentSelectionHintsConfig = {
+  useWhen?: string | undefined;
+  avoidWhen?: string | undefined;
+};
+
 export type CapletServerConfig = CommonCapletConfig & {
   backend: "mcp";
   transport: "stdio" | "http" | "sse";
@@ -79,7 +84,7 @@ export type OpenApiEndpointConfig = CommonCapletConfig & {
   operationCacheTtlMs: number;
 };
 
-export type GraphQlOperationConfig = {
+export type GraphQlOperationConfig = AgentSelectionHintsConfig & {
   document?: string | undefined;
   documentPath?: string | undefined;
   operationName?: string | undefined;
@@ -99,7 +104,7 @@ export type GraphQlEndpointConfig = CommonCapletConfig & {
   selectionDepth: number;
 };
 
-export type HttpActionConfig = {
+export type HttpActionConfig = AgentSelectionHintsConfig & {
   method: "GET" | "POST" | "PUT" | "PATCH" | "DELETE";
   path: string;
   description?: string | undefined;
@@ -119,7 +124,7 @@ export type HttpApiConfig = CommonCapletConfig & {
   maxResponseBytes: number;
 };
 
-export type CliToolActionConfig = {
+export type CliToolActionConfig = AgentSelectionHintsConfig & {
   description?: string | undefined;
   inputSchema?: Record<string, unknown> | undefined;
   outputSchema?: Record<string, unknown> | undefined;
@@ -186,7 +191,7 @@ export type CapletsConfig = {
   capletSets: Record<string, CapletSetConfig>;
 };
 
-type CommonCapletConfig = {
+type CommonCapletConfig = AgentSelectionHintsConfig & {
   server: string;
   name: string;
   description: string;
@@ -245,6 +250,11 @@ const runtimeRequirementsSchema = z
       .optional(),
   })
   .strict();
+const agentSelectionHintSchema = z.string().trim().min(1).max(500);
+const agentSelectionHintsSchema = {
+  useWhen: agentSelectionHintSchema.optional(),
+  avoidWhen: agentSelectionHintSchema.optional(),
+};
 const commonSchema = {
   name: z.string().trim().min(1).max(80),
   description: z
@@ -255,6 +265,7 @@ const commonSchema = {
     )
     .refine((value) => value.length <= 1500, "description must be at most 1500 characters"),
   tags: z.array(z.string().trim().min(1).max(80)).optional(),
+  ...agentSelectionHintsSchema,
   body: z.string().optional(),
   setup: setupSchema.optional(),
   projectBinding: projectBindingSchema.optional(),
@@ -293,6 +304,7 @@ const graphQlOperationSchema = z
     documentPath: z.string().min(1).optional(),
     operationName: z.string().min(1).optional(),
     description: z.string().min(1).optional(),
+    ...agentSelectionHintsSchema,
   })
   .strict()
   .refine((operation) => Boolean(operation.document) !== Boolean(operation.documentPath), {
@@ -323,6 +335,7 @@ const httpActionSchema = z
       .refine((value) => !value.startsWith("//"), "HTTP action path must not start with //")
       .refine((value) => !isUrl(value), "HTTP action path must be a URL path, not a URL"),
     description: z.string().min(1).optional(),
+    ...agentSelectionHintsSchema,
     inputSchema: z.record(z.string(), z.unknown()).optional(),
     outputSchema: z.record(z.string(), z.unknown()).optional(),
     query: scalarMapSchema.optional(),
@@ -358,6 +371,7 @@ const httpApiSchema = z
 const cliActionSchema = z
   .object({
     description: z.string().min(1).optional(),
+    ...agentSelectionHintsSchema,
     inputSchema: z.record(z.string(), z.unknown()).optional(),
     outputSchema: z.record(z.string(), z.unknown()).optional(),
     command: z.string().min(1),
diff --git a/packages/core/src/config.ts b/packages/core/src/config.ts
index 8babef2..5b5da32 100644
--- a/packages/core/src/config.ts
+++ b/packages/core/src/config.ts
@@ -89,7 +89,12 @@ export type RuntimeRequirementsConfig = {
   resources?: { class?: RuntimeResourceClass | undefined } | undefined;
 };
 
-export type CapletServerConfig = {
+export type AgentSelectionHintsConfig = {
+  useWhen?: string | undefined;
+  avoidWhen?: string | undefined;
+};
+
+export type CapletServerConfig = AgentSelectionHintsConfig & {
   server: string;
   backend: "mcp";
   name: string;
@@ -118,7 +123,7 @@ export type OpenApiAuthConfig =
   | { type: "headers"; headers: Record<string, string> }
   | Extract<RemoteAuthConfig, { type: "oauth2" | "oidc" }>;
 
-export type OpenApiEndpointConfig = {
+export type OpenApiEndpointConfig = AgentSelectionHintsConfig & {
   server: string;
   backend: "openapi";
   name: string;
@@ -137,14 +142,14 @@ export type OpenApiEndpointConfig = {
   runtime?: RuntimeRequirementsConfig | undefined;
 };
 
-export type GraphQlOperationConfig = {
+export type GraphQlOperationConfig = AgentSelectionHintsConfig & {
   document?: string | undefined;
   documentPath?: string | undefined;
   operationName?: string | undefined;
   description?: string | undefined;
 };
 
-export type GraphQlEndpointConfig = {
+export type GraphQlEndpointConfig = AgentSelectionHintsConfig & {
   server: string;
   backend: "graphql";
   name: string;
@@ -166,7 +171,7 @@ export type GraphQlEndpointConfig = {
   runtime?: RuntimeRequirementsConfig | undefined;
 };
 
-export type HttpActionConfig = {
+export type HttpActionConfig = AgentSelectionHintsConfig & {
   method: "GET" | "POST" | "PUT" | "PATCH" | "DELETE";
   path: string;
   description?: string | undefined;
@@ -177,7 +182,7 @@ export type HttpActionConfig = {
   jsonBody?: unknown;
 };
 
-export type HttpApiConfig = {
+export type HttpApiConfig = AgentSelectionHintsConfig & {
   server: string;
   backend: "http";
   name: string;
@@ -199,7 +204,7 @@ export type CliToolOutputConfig = {
   type: "text" | "json";
 };
 
-export type CliToolActionConfig = {
+export type CliToolActionConfig = AgentSelectionHintsConfig & {
   description?: string | undefined;
   inputSchema?: Record<string, unknown> | undefined;
   outputSchema?: Record<string, unknown> | undefined;
@@ -220,7 +225,7 @@ export type CliToolActionConfig = {
     | undefined;
 };
 
-export type CliToolsConfig = {
+export type CliToolsConfig = AgentSelectionHintsConfig & {
   server: string;
   backend: "cli";
   name: string;
@@ -238,7 +243,7 @@ export type CliToolsConfig = {
   runtime?: RuntimeRequirementsConfig | undefined;
 };
 
-export type CapletSetConfig = {
+export type CapletSetConfig = AgentSelectionHintsConfig & {
   server: string;
   backend: "caplets";
   name: string;
@@ -456,6 +461,22 @@ const runtimeRequirementsSchema = z
   .strict()
   .describe("Runtime feature and resource requirements for hosted execution.");
 
+const agentSelectionHintSchema = z
+  .string()
+  .trim()
+  .min(1)
+  .max(500)
+  .describe("Optional author-supplied hint for agent tool/caplet selection.");
+
+const agentSelectionHintsSchema = {
+  useWhen: agentSelectionHintSchema
+    .optional()
+    .describe("When agents should prefer this Caplet or configured action."),
+  avoidWhen: agentSelectionHintSchema
+    .optional()
+    .describe("When agents should avoid this Caplet or configured action."),
+};
+
 const publicServerSchema = z
   .object({
     name: z.string().trim().min(1).max(80).describe("Human-readable server display name."),
@@ -481,6 +502,7 @@ const publicServerSchema = z
     url: z.string().url().optional().describe("Remote MCP server URL for http or sse transport."),
     auth: remoteAuthSchema.optional(),
     tags: z.array(z.string().trim().min(1).max(80)).optional(),
+    ...agentSelectionHintsSchema,
     setup: setupSchema.optional(),
     projectBinding: projectBindingSchema.optional(),
     runtime: runtimeRequirementsSchema.optional(),
@@ -531,6 +553,7 @@ const publicOpenApiEndpointSchema = z
       'Explicit OpenAPI request auth config. Use {"type":"none"} for public APIs.',
     ),
     tags: z.array(z.string().trim().min(1).max(80)).optional(),
+    ...agentSelectionHintsSchema,
     setup: setupSchema.optional(),
     projectBinding: projectBindingSchema.optional(),
     runtime: runtimeRequirementsSchema.optional(),
@@ -565,6 +588,7 @@ const graphQlOperationSchema = z
     documentPath: z.string().min(1).optional().describe("Path to a GraphQL operation document."),
     operationName: z.string().min(1).optional().describe("Operation name to execute."),
     description: z.string().min(1).optional().describe("Operation capability description."),
+    ...agentSelectionHintsSchema,
   })
   .strict()
   .superRefine((operation, ctx) => {
@@ -603,6 +627,7 @@ const publicGraphQlEndpointSchema = z
       'Explicit GraphQL request auth config. Use {"type":"none"} for public APIs.',
     ),
     tags: z.array(z.string().trim().min(1).max(80)).optional(),
+    ...agentSelectionHintsSchema,
     setup: setupSchema.optional(),
     projectBinding: projectBindingSchema.optional(),
     runtime: runtimeRequirementsSchema.optional(),
@@ -666,6 +691,7 @@ const httpActionSchema = z
       .refine((value) => !value.startsWith("//"), "HTTP action path must not start with //")
       .refine((value) => !isUrl(value), "HTTP action path must be a URL path, not a URL"),
     description: z.string().min(1).optional().describe("Action capability description."),
+    ...agentSelectionHintsSchema,
     inputSchema: z
       .record(z.string(), z.unknown())
       .optional()
@@ -719,6 +745,7 @@ const publicHttpApiSchema = z
       )
       .describe("Configured HTTP actions keyed by stable tool name."),
     tags: z.array(z.string().trim().min(1).max(80)).optional(),
+    ...agentSelectionHintsSchema,
     setup: setupSchema.optional(),
     projectBinding: projectBindingSchema.optional(),
     runtime: runtimeRequirementsSchema.optional(),
@@ -763,6 +790,7 @@ const cliToolAnnotationsSchema = z
 const cliToolActionSchema = z
   .object({
     description: z.string().min(1).optional().describe("Action capability description."),
+    ...agentSelectionHintsSchema,
     inputSchema: z
       .record(z.string(), z.unknown())
       .optional()
@@ -814,6 +842,7 @@ const publicCliToolsSchema = z
       .optional()
       .describe("Default environment variables for CLI actions."),
     tags: z.array(z.string().trim().min(1).max(80)).optional(),
+    ...agentSelectionHintsSchema,
     setup: setupSchema.optional(),
     projectBinding: projectBindingSchema.optional(),
     runtime: runtimeRequirementsSchema.optional(),
@@ -870,6 +899,7 @@ const publicCapletSetSchema = z
       .default(30_000)
       .describe("Milliseconds child Caplet metadata stays fresh. Set 0 to refresh every time."),
     tags: z.array(z.string().trim().min(1).max(80)).optional(),
+    ...agentSelectionHintsSchema,
     setup: setupSchema.optional(),
     projectBinding: projectBindingSchema.optional(),
     runtime: runtimeRequirementsSchema.optional(),
diff --git a/packages/core/src/config/paths.ts b/packages/core/src/config/paths.ts
index 6a15072..c09b9c2 100644
--- a/packages/core/src/config/paths.ts
+++ b/packages/core/src/config/paths.ts
@@ -85,9 +85,21 @@ export function defaultCompletionCacheDir(
     : pathJoin(defaultCacheBaseDir(env, home, platform), "caplets", "completions");
 }
 
+export function defaultObservedOutputShapeCacheDir(
+  env: PathEnv = process.env,
+  home = homedir(),
+  platform: Platform = process.platform,
+): string {
+  const pathJoin = platform === "win32" ? win32.join : posix.join;
+  return platform === "win32"
+    ? pathJoin(defaultCacheBaseDir(env, home, platform), "caplets", "cache", "result-shapes")
+    : pathJoin(defaultCacheBaseDir(env, home, platform), "caplets", "result-shapes");
+}
+
 export const DEFAULT_CONFIG_PATH = defaultConfigPath();
 export const DEFAULT_AUTH_DIR = defaultAuthDir();
 export const DEFAULT_COMPLETION_CACHE_DIR = defaultCompletionCacheDir();
+export const DEFAULT_OBSERVED_OUTPUT_SHAPE_CACHE_DIR = defaultObservedOutputShapeCacheDir();
 export const PROJECT_CONFIG_FILE = join(".caplets", "config.json");
 
 export function resolveConfigPath(path?: string): string {
diff --git a/packages/core/src/downstream.ts b/packages/core/src/downstream.ts
index c7fa0ee..6e6a839 100644
--- a/packages/core/src/downstream.ts
+++ b/packages/core/src/downstream.ts
@@ -2,6 +2,7 @@ import { Client } from "@modelcontextprotocol/sdk/client/index";
 import { StdioClientTransport } from "@modelcontextprotocol/sdk/client/stdio";
 import { StreamableHTTPClientTransport } from "@modelcontextprotocol/sdk/client/streamableHttp";
 import { SSEClientTransport } from "@modelcontextprotocol/sdk/client/sse";
+import type { Transport } from "@modelcontextprotocol/sdk/shared/transport";
 import {
   CompatibilityCallToolResultSchema,
   type CompleteRequestParams,
@@ -26,11 +27,17 @@ import type { ServerRegistry } from "./registry";
 import { searchToolList } from "./tool-search";
 
 export type CompactTool = {
-  id: string;
-  tool: string;
+  name: string;
   description?: string;
+  useWhen?: string;
+  avoidWhen?: string;
   hasInputSchema: boolean;
   hasOutputSchema: boolean;
+  supportsFields: boolean;
+  requiredArgs?: string[];
+  acceptedArgs?: string[];
+  readOnlyHint?: boolean;
+  destructiveHint?: boolean;
 };
 
 export type CompactResource = {
@@ -59,7 +66,7 @@ export type CompactPrompt = {
 
 type ManagedConnection = {
   client: Client;
-  transport: { close(): Promise<void>; onclose?: () => void; onerror?: (error: Error) => void };
+  transport: Transport;
   configFingerprint: string;
   tools?: Tool[] | undefined;
   toolsFetchedAt?: number | undefined;
@@ -73,9 +80,14 @@ type ManagedConnection = {
   closing?: boolean;
 };
 
+type PendingConnection = {
+  connection: ManagedConnection;
+  promise: Promise<ManagedConnection>;
+};
+
 export class DownstreamManager {
   private readonly connections = new Map<string, ManagedConnection>();
-  private readonly connecting = new Map<string, ManagedConnection>();
+  private readonly connecting = new Map<string, PendingConnection>();
   private readonly restartState = new Map<string, { restartUsed: boolean; backoffUntil: number }>();
 
   constructor(
@@ -88,7 +100,10 @@ export class DownstreamManager {
   }
 
   async close(): Promise<void> {
-    const connections = [...this.connections.values(), ...this.connecting.values()];
+    const connections = [
+      ...this.connections.values(),
+      ...[...this.connecting.values()].map((pending) => pending.connection),
+    ];
     for (const connection of connections) {
       connection.closing = true;
     }
@@ -98,7 +113,7 @@ export class DownstreamManager {
   }
 
   async closeServer(serverId: string): Promise<void> {
-    const connection = this.connections.get(serverId) ?? this.connecting.get(serverId);
+    const connection = this.connections.get(serverId) ?? this.connecting.get(serverId)?.connection;
     this.connections.delete(serverId);
     this.connecting.delete(serverId);
     this.restartState.delete(serverId);
@@ -342,11 +357,14 @@ export class DownstreamManager {
 
   compact(server: CapletServerConfig, tool: Tool): CompactTool {
     return {
-      id: server.server,
-      tool: tool.name,
+      name: tool.name,
       ...(tool.description ? { description: tool.description } : {}),
       hasInputSchema: Boolean(tool.inputSchema),
       hasOutputSchema: Boolean(tool.outputSchema),
+      supportsFields: Boolean(tool.outputSchema),
+      ...compactToolSelectionHints(tool),
+      ...compactToolSchemaHints(tool),
+      ...compactToolSafetyHints(tool),
     };
   }
 
@@ -502,6 +520,16 @@ export class DownstreamManager {
         return existing;
       }
     }
+    const pending = this.connecting.get(server.server);
+    if (pending) {
+      if (pending.connection.configFingerprint !== expectedFingerprint) {
+        this.connecting.delete(server.server);
+        pending.connection.closing = true;
+        await pending.connection.transport.close();
+      } else {
+        return await pending.promise;
+      }
+    }
     if (this.currentServerFingerprint(server) !== expectedFingerprint) {
       throw staleServerConfigError(server.server);
     }
@@ -515,7 +543,6 @@ export class DownstreamManager {
     }
 
     this.registry.setStatus(server.server, "starting");
-    let pendingConnection: ManagedConnection | undefined;
     try {
       const client = new Client({ name: "caplets", version: "1.0.0" }, { capabilities: {} });
       const transport = this.createTransport(server);
@@ -538,8 +565,6 @@ export class DownstreamManager {
         connection.prompts = undefined;
         connection.promptsFetchedAt = undefined;
       });
-      pendingConnection = connection;
-      this.connecting.set(server.server, connection);
       transport.onclose = () => {
         const current = this.connections.get(server.server);
         if (current === connection) {
@@ -574,19 +599,43 @@ export class DownstreamManager {
           toSafeError(error, "SERVER_UNAVAILABLE"),
         );
       };
-      await client.connect(transport, { timeout: server.startupTimeoutMs });
+      const pendingConnection: PendingConnection = {
+        connection,
+        promise: this.startConnection(server, expectedFingerprint, connection),
+      };
+      this.connecting.set(server.server, pendingConnection);
+      return await pendingConnection.promise;
+    } catch (error) {
+      const code = isTimeoutLike(error) ? "SERVER_START_TIMEOUT" : "SERVER_UNAVAILABLE";
+      const safe = toSafeError(error, code);
+      this.registry.setStatus(server.server, "unavailable", safe);
+      if (isAuthRemediationError(error)) {
+        throw error;
+      }
+      throw new CapletsError(code, `Could not start ${server.server}`, safe);
+    }
+  }
+
+  private async startConnection(
+    server: CapletServerConfig,
+    expectedFingerprint: string,
+    connection: ManagedConnection,
+  ): Promise<ManagedConnection> {
+    try {
+      await connection.client.connect(connection.transport, { timeout: server.startupTimeoutMs });
       if (connection.closing) {
-        await transport.close();
+        await connection.transport.close();
         throw new CapletsError("SERVER_UNAVAILABLE", `${server.server} connection was closed`);
       }
       if (this.currentServerFingerprint(server) !== expectedFingerprint) {
         connection.closing = true;
-        await transport.close();
+        await connection.transport.close();
         throw staleServerConfigError(server.server);
       }
-      if (this.connecting.get(server.server) !== connection) {
+      const pending = this.connecting.get(server.server);
+      if (pending?.connection !== connection) {
         connection.closing = true;
-        await transport.close();
+        await connection.transport.close();
         throw new CapletsError("SERVER_UNAVAILABLE", `${server.server} connection was replaced`);
       }
       this.connecting.delete(server.server);
@@ -594,16 +643,11 @@ export class DownstreamManager {
       this.registry.setStatus(server.server, "available");
       return connection;
     } catch (error) {
-      if (pendingConnection && this.connecting.get(server.server) === pendingConnection) {
+      const pending = this.connecting.get(server.server);
+      if (pending?.connection === connection) {
         this.connecting.delete(server.server);
       }
-      const code = isTimeoutLike(error) ? "SERVER_START_TIMEOUT" : "SERVER_UNAVAILABLE";
-      const safe = toSafeError(error, code);
-      this.registry.setStatus(server.server, "unavailable", safe);
-      if (isAuthRemediationError(error)) {
-        throw error;
-      }
-      throw new CapletsError(code, `Could not start ${server.server}`, safe);
+      throw error;
     }
   }
 
@@ -718,6 +762,53 @@ export class DownstreamManager {
   }
 }
 
+export function compactToolSafetyHints(
+  tool: Tool,
+): Pick<CompactTool, "readOnlyHint" | "destructiveHint"> {
+  const annotations = tool.annotations;
+  return {
+    ...(typeof annotations?.readOnlyHint === "boolean"
+      ? { readOnlyHint: annotations.readOnlyHint }
+      : {}),
+    ...(typeof annotations?.destructiveHint === "boolean"
+      ? { destructiveHint: annotations.destructiveHint }
+      : {}),
+  };
+}
+
+export function compactToolSchemaHints(
+  tool: Tool,
+): Pick<CompactTool, "requiredArgs" | "acceptedArgs"> {
+  const schema = isRecord(tool.inputSchema) ? tool.inputSchema : undefined;
+  const properties = isRecord(schema?.properties) ? schema.properties : {};
+  const acceptedArgs = Object.keys(properties).sort();
+  const requiredArgs = Array.isArray(schema?.required)
+    ? schema.required.filter((value): value is string => typeof value === "string").sort()
+    : [];
+  return {
+    ...(requiredArgs.length > 0 ? { requiredArgs } : {}),
+    ...(acceptedArgs.length > 0 ? { acceptedArgs } : {}),
+  };
+}
+
+export function compactToolSelectionHints(
+  tool: unknown,
+): Pick<CompactTool, "useWhen" | "avoidWhen"> {
+  if (!isRecord(tool)) return {};
+  return {
+    ...(typeof tool.useWhen === "string" && tool.useWhen.trim()
+      ? { useWhen: tool.useWhen.trim() }
+      : {}),
+    ...(typeof tool.avoidWhen === "string" && tool.avoidWhen.trim()
+      ? { avoidWhen: tool.avoidWhen.trim() }
+      : {}),
+  };
+}
+
+function isRecord(value: unknown): value is Record<string, unknown> {
+  return value !== null && typeof value === "object" && !Array.isArray(value);
+}
+
 function sameServerConfig(left: CapletServerConfig, right: CapletServerConfig): boolean {
   return serializeServerConfig(left) === serializeServerConfig(right);
 }
diff --git a/packages/core/src/engine.ts b/packages/core/src/engine.ts
index 3698d36..be19963 100644
--- a/packages/core/src/engine.ts
+++ b/packages/core/src/engine.ts
@@ -2,6 +2,7 @@ import { existsSync, readdirSync, statSync, watch, type FSWatcher } from "node:f
 import { dirname, join, parse } from "node:path";
 import { CapletSetManager } from "./caplet-sets";
 import { CliToolsManager } from "./cli-tools";
+import { findProjectRoot, fingerprintProjectRoot } from "./cloud/project-root";
 import {
   type CapletConfig,
   type CapletsConfig,
@@ -10,11 +11,17 @@ import {
   resolveConfigPath,
   resolveProjectConfigPath,
 } from "./config";
+import { DEFAULT_OBSERVED_OUTPUT_SHAPE_CACHE_DIR } from "./config/paths";
 import { DownstreamManager } from "./downstream";
 import { errorResult, toSafeError } from "./errors";
 import { GraphQLManager } from "./graphql";
 import { HttpActionManager } from "./http-actions";
 import { OpenApiManager } from "./openapi";
+import {
+  FileObservedOutputShapeStore,
+  type ObservedOutputShapeKey,
+  type ObservedOutputShapeStore,
+} from "./observed-output-shapes";
 import { ServerRegistry } from "./registry";
 import { handleServerTool } from "./tools";
 
@@ -28,6 +35,10 @@ export type CapletsEngineOptions = {
   watch?: boolean;
   writeErr?: (value: string) => void;
   configLoader?: (configPath: string, projectConfigPath: string) => CapletsConfig;
+  observedOutputShapeStore?: ObservedOutputShapeStore | undefined;
+  observedOutputShapeScope?: ObservedOutputShapeKey["scope"] | undefined;
+  observedOutputShapeCacheDir?: string | undefined;
+  projectFingerprint?: string | undefined;
 };
 
 export type CapletsEngineReloadEvent = {
@@ -59,6 +70,9 @@ export class CapletsEngine {
   private readonly watchEnabled: boolean;
   private readonly writeErr: (value: string) => void;
   private readonly configLoader: (configPath: string, projectConfigPath: string) => CapletsConfig;
+  private readonly observedOutputShapeStore: ObservedOutputShapeStore | undefined;
+  private readonly observedOutputShapeScope: ObservedOutputShapeKey["scope"];
+  private readonly projectFingerprint: string | undefined;
   private readonly reloadListeners = new Set<(event: CapletsEngineReloadEvent) => void>();
   private watchers: FSWatcher[] = [];
   private reloadTimer: NodeJS.Timeout | undefined;
@@ -84,6 +98,13 @@ export class CapletsEngine {
     this.watchDebounceMs = options.watchDebounceMs ?? 250;
     this.watchEnabled = options.watch ?? true;
     this.writeErr = options.writeErr ?? ((value: string) => process.stderr.write(value));
+    this.observedOutputShapeStore =
+      options.observedOutputShapeStore ??
+      new FileObservedOutputShapeStore(
+        options.observedOutputShapeCacheDir ?? DEFAULT_OBSERVED_OUTPUT_SHAPE_CACHE_DIR,
+      );
+    this.observedOutputShapeScope = options.observedOutputShapeScope ?? "local";
+    this.projectFingerprint = options.projectFingerprint ?? safeProjectFingerprint();
     if (this.watchEnabled) {
       this.resetWatchers();
     }
@@ -148,6 +169,11 @@ export class CapletsEngine {
         this.http,
         this.cli,
         this.capletSets,
+        {
+          observedOutputShapeStore: this.observedOutputShapeStore,
+          observedOutputShapeScope: this.observedOutputShapeScope,
+          projectFingerprint: this.projectFingerprint,
+        },
       );
     } catch (error) {
       return errorResult(error);
@@ -417,6 +443,14 @@ function selectAuthOptions(authDir: string | undefined): { authDir?: string } {
   return authDir ? { authDir } : {};
 }
 
+function safeProjectFingerprint(): string | undefined {
+  try {
+    return fingerprintProjectRoot(findProjectRoot());
+  } catch {
+    return undefined;
+  }
+}
+
 function watchedPaths(paths: RuntimePaths): WatchedPath[] {
   return uniqueWatchedPaths([
     { path: dirname(paths.configPath), reason: "config" },
diff --git a/packages/core/src/generated-tool-input-schema.ts b/packages/core/src/generated-tool-input-schema.ts
index 135d74d..2d2d8ac 100644
--- a/packages/core/src/generated-tool-input-schema.ts
+++ b/packages/core/src/generated-tool-input-schema.ts
@@ -2,20 +2,20 @@ import { z } from "zod";
 
 export const operations = [
   "inspect",
-  "check_backend",
-  "list_tools",
+  "check",
+  "tools",
   "search_tools",
-  "get_tool",
+  "describe_tool",
   "call_tool",
 ] as const;
 
 export const mcpOperations = [
   ...operations,
-  "list_resources",
+  "resources",
   "search_resources",
-  "list_resource_templates",
+  "resource_templates",
   "read_resource",
-  "list_prompts",
+  "prompts",
   "search_prompts",
   "get_prompt",
   "complete",
@@ -24,17 +24,21 @@ export const mcpOperations = [
 export type GeneratedOperation = (typeof operations)[number];
 export type GeneratedMcpOperation = (typeof mcpOperations)[number];
 export type CapletSchemaBackend = { backend: string };
+export type GeneratedToolInputSchemaOptions = {
+  includeFields?: boolean;
+};
 
 export const generatedToolInputDescriptions = {
   operation:
-    "Wrapper operation: inspect, check_backend, list_tools, search_tools, get_tool, call_tool. MCP Caplets also expose resources, prompts, and completions.",
+    "Wrapper operation: inspect, check, tools, search_tools, describe_tool, call_tool, resources, search_resources, resource_templates, read_resource, prompts, search_prompts, get_prompt, complete.",
   query: "Required for search operations only.",
   limit: "Optional list/search result limit.",
-  tool: "Exact downstream tool name for get_tool or call_tool.",
-  arguments: "JSON object for call_tool arguments/downstream inputs or get_prompt arguments.",
-  fields: "Optional call_tool structured output paths when outputSchema allows it.",
+  cursor: "Opaque pagination cursor returned by list/search operations.",
+  name: "Exact downstream tool or prompt name from tools/search_tools/prompts/search_prompts; do not guess.",
+  args: "JSON object for call_tool or get_prompt arguments; must match describe_tool inputSchema exactly.",
+  fields:
+    "Optional call_tool structured output paths. Use only after describe_tool returns fieldSelection.supported true.",
   uri: "Exact downstream resource URI for read_resource.",
-  prompt: "Exact downstream prompt name for get_prompt.",
   ref: "Completion target reference for complete.",
   argument: "Completion argument object for complete.",
 } as const;
@@ -51,12 +55,9 @@ export const completionArgumentSchema = z
 const baseShape = {
   query: z.string().optional().describe(generatedToolInputDescriptions.query),
   limit: z.number().int().positive().optional().describe(generatedToolInputDescriptions.limit),
-  tool: z.string().optional().describe(generatedToolInputDescriptions.tool),
-  arguments: z
-    .object({})
-    .catchall(z.any())
-    .optional()
-    .describe(generatedToolInputDescriptions.arguments),
+  cursor: z.string().optional().describe(generatedToolInputDescriptions.cursor),
+  name: z.string().optional().describe(generatedToolInputDescriptions.name),
+  args: z.object({}).catchall(z.any()).optional().describe(generatedToolInputDescriptions.args),
   fields: z
     .array(z.string().min(1))
     .min(1)
@@ -64,17 +65,20 @@ const baseShape = {
     .describe(generatedToolInputDescriptions.fields),
 };
 
-export function generatedToolInputSchemaForCaplet(caplet: CapletSchemaBackend) {
+export function generatedToolInputSchemaForCaplet(
+  caplet: CapletSchemaBackend,
+  options: GeneratedToolInputSchemaOptions = {},
+) {
+  const includeFields = options.includeFields ?? true;
   return z
     .object({
       operation: (caplet.backend === "mcp" ? z.enum(mcpOperations) : z.enum(operations)).describe(
         generatedToolInputDescriptions.operation,
       ),
-      ...baseShape,
+      ...schemaShape(includeFields),
       ...(caplet.backend === "mcp"
         ? {
             uri: z.string().optional().describe(generatedToolInputDescriptions.uri),
-            prompt: z.string().optional().describe(generatedToolInputDescriptions.prompt),
             ref: completionRefSchema.optional().describe(generatedToolInputDescriptions.ref),
             argument: completionArgumentSchema
               .optional()
@@ -92,8 +96,12 @@ export const generatedToolInputSchema = z
   })
   .strict();
 
-export function generatedToolInputJsonSchemaForCaplet(caplet: CapletSchemaBackend) {
+export function generatedToolInputJsonSchemaForCaplet(
+  caplet: CapletSchemaBackend,
+  options: GeneratedToolInputSchemaOptions = {},
+) {
   const mcp = caplet.backend === "mcp";
+  const includeFields = options.includeFields ?? true;
   return {
     type: "object",
     properties: {
@@ -104,18 +112,22 @@ export function generatedToolInputJsonSchemaForCaplet(caplet: CapletSchemaBacken
       },
       query: { type: "string", description: generatedToolInputDescriptions.query },
       limit: { type: "integer", minimum: 1, description: generatedToolInputDescriptions.limit },
-      tool: { type: "string", description: generatedToolInputDescriptions.tool },
-      arguments: { type: "object", description: generatedToolInputDescriptions.arguments },
-      fields: {
-        type: "array",
-        items: { type: "string", minLength: 1 },
-        minItems: 1,
-        description: generatedToolInputDescriptions.fields,
-      },
+      cursor: { type: "string", description: generatedToolInputDescriptions.cursor },
+      name: { type: "string", description: generatedToolInputDescriptions.name },
+      args: { type: "object", description: generatedToolInputDescriptions.args },
+      ...(includeFields
+        ? {
+            fields: {
+              type: "array",
+              items: { type: "string", minLength: 1 },
+              minItems: 1,
+              description: generatedToolInputDescriptions.fields,
+            },
+          }
+        : {}),
       ...(mcp
         ? {
             uri: { type: "string", description: generatedToolInputDescriptions.uri },
-            prompt: { type: "string", description: generatedToolInputDescriptions.prompt },
             ref: {
               oneOf: [
                 {
@@ -151,6 +163,18 @@ export function generatedToolInputJsonSchemaForCaplet(caplet: CapletSchemaBacken
   } as const;
 }
 
+function schemaShape(includeFields: boolean) {
+  return includeFields
+    ? baseShape
+    : {
+        query: baseShape.query,
+        limit: baseShape.limit,
+        cursor: baseShape.cursor,
+        name: baseShape.name,
+        args: baseShape.args,
+      };
+}
+
 export function generatedToolInputJsonSchema() {
   return generatedToolInputJsonSchemaForCaplet({ backend: "tool" });
 }
diff --git a/packages/core/src/graphql.ts b/packages/core/src/graphql.ts
index fc022e9..e2fe6f6 100644
--- a/packages/core/src/graphql.ts
+++ b/packages/core/src/graphql.ts
@@ -30,7 +30,12 @@ import {
 import { genericOAuthHeaders } from "./auth";
 import type { GraphQlEndpointConfig } from "./config";
 import { isAllowedRemoteUrl } from "./config/validation";
-import type { CompactTool } from "./downstream";
+import {
+  compactToolSafetyHints,
+  compactToolSchemaHints,
+  compactToolSelectionHints,
+  type CompactTool,
+} from "./downstream";
 import { CapletsError, toSafeError } from "./errors";
 import { isAbortError, parseHttpBody, readLimitedText } from "./http/utils";
 import type { ServerRegistry } from "./registry";
@@ -49,6 +54,8 @@ const SCALAR_JSON_SCHEMA: Record<string, Record<string, unknown>> = {
 type GraphQlOperation = {
   name: string;
   description?: string;
+  useWhen?: string;
+  avoidWhen?: string;
   document: string;
   operationName?: string;
   inputSchema: Record<string, unknown>;
@@ -222,11 +229,14 @@ export class GraphQLManager {
 
   compact(endpoint: GraphQlEndpointConfig, tool: Tool): CompactTool {
     return {
-      id: endpoint.server,
-      tool: tool.name,
+      name: tool.name,
       ...(tool.description ? { description: tool.description } : {}),
       hasInputSchema: Boolean(tool.inputSchema),
       hasOutputSchema: Boolean(tool.outputSchema),
+      supportsFields: false,
+      ...compactToolSelectionHints(tool),
+      ...compactToolSchemaHints(tool),
+      ...compactToolSafetyHints(tool),
     };
   }
 
@@ -306,6 +316,8 @@ export class GraphQLManager {
     return {
       name: operation.name,
       ...(operation.description ? { description: operation.description } : {}),
+      ...(operation.useWhen ? { useWhen: operation.useWhen } : {}),
+      ...(operation.avoidWhen ? { avoidWhen: operation.avoidWhen } : {}),
       inputSchema: operation.inputSchema as Tool["inputSchema"],
       annotations:
         operation.kind === "query"
@@ -384,6 +396,8 @@ function loadConfiguredOperations(
       return {
         name,
         ...(config.description ? { description: config.description } : {}),
+        ...(config.useWhen ? { useWhen: config.useWhen } : {}),
+        ...(config.avoidWhen ? { avoidWhen: config.avoidWhen } : {}),
         document,
         ...(config.operationName ? { operationName: config.operationName } : {}),
         inputSchema: variablesSchema(schema, operation),
diff --git a/packages/core/src/http-actions.ts b/packages/core/src/http-actions.ts
index 35db507..ece1443 100644
--- a/packages/core/src/http-actions.ts
+++ b/packages/core/src/http-actions.ts
@@ -2,7 +2,12 @@ import type { CompatibilityCallToolResult, Tool } from "@modelcontextprotocol/sd
 import { genericOAuthHeaders } from "./auth";
 import type { HttpActionConfig, HttpApiConfig } from "./config";
 import { FORBIDDEN_HEADERS, isAllowedRemoteUrl } from "./config/validation";
-import type { CompactTool } from "./downstream";
+import {
+  compactToolSafetyHints,
+  compactToolSchemaHints,
+  compactToolSelectionHints,
+  type CompactTool,
+} from "./downstream";
 import { CapletsError, toSafeError } from "./errors";
 import { isAbortError, parseHttpBody, readLimitedText } from "./http/utils";
 import type { ServerRegistry } from "./registry";
@@ -128,11 +133,14 @@ export class HttpActionManager {
 
   compact(api: HttpApiConfig, tool: Tool): CompactTool {
     return {
-      id: api.server,
-      tool: tool.name,
+      name: tool.name,
       ...(tool.description ? { description: tool.description } : {}),
       hasInputSchema: Boolean(tool.inputSchema),
       hasOutputSchema: Boolean(tool.outputSchema),
+      supportsFields: Boolean(tool.outputSchema),
+      ...compactToolSelectionHints(tool),
+      ...compactToolSchemaHints(tool),
+      ...compactToolSafetyHints(tool),
     };
   }
 
@@ -144,6 +152,8 @@ export class HttpActionManager {
     return {
       name: operation.name,
       ...(operation.description ? { description: operation.description } : {}),
+      ...(operation.useWhen ? { useWhen: operation.useWhen } : {}),
+      ...(operation.avoidWhen ? { avoidWhen: operation.avoidWhen } : {}),
       inputSchema: (operation.inputSchema ?? DEFAULT_INPUT_SCHEMA) as Tool["inputSchema"],
       ...(operation.outputSchema
         ? { outputSchema: operation.outputSchema as Tool["outputSchema"] }
diff --git a/packages/core/src/index.ts b/packages/core/src/index.ts
index d528526..7b01b10 100644
--- a/packages/core/src/index.ts
+++ b/packages/core/src/index.ts
@@ -26,6 +26,54 @@ export type {
 export { capabilityDescription, ServerRegistry } from "./registry";
 export { generatedToolInputSchema, handleServerTool } from "./tools";
 export type { CapletExecutionMetadata, CapletResultMetadata } from "./tools";
+export { createCodeModeCapletsApi, listCodeModeCallableCaplets } from "./code-mode/api";
+export type {
+  CodeModeCapletHandle,
+  CodeModeCapletsApi,
+  CodeModeDebugApi,
+  CreateCodeModeCapletsApiInput,
+} from "./code-mode/api";
+export {
+  codeModeDeclarationHash,
+  generateCodeModeDeclarations,
+  generateCodeModeRunToolDescription,
+  minifyCodeModeDeclarationText,
+} from "./code-mode/declarations";
+export { diagnoseCodeModeTypeScript } from "./code-mode/diagnostics";
+export type { DiagnoseCodeModeTypeScriptInput } from "./code-mode/diagnostics";
+export { CodeModeLogStore, redactCodeModeLogText } from "./code-mode/logs";
+export type { CodeModeLogStoreOptions, StoreCodeModeLogsResult } from "./code-mode/logs";
+export {
+  FileObservedOutputShapeStore,
+  observeOutputShape,
+  observedOutputShapeKey,
+  type ObservedOutputShape,
+  type ObservedOutputShapeKey,
+  type ObservedOutputShapeStore,
+} from "./observed-output-shapes";
+export { runCodeMode } from "./code-mode/runner";
+export type { RunCodeModeInput } from "./code-mode/runner";
+export { QuickJsCodeModeSandbox } from "./code-mode/sandbox";
+export type {
+  CodeModeSandbox,
+  CodeModeSandboxInput,
+  CodeModeSandboxInvokeInput,
+  CodeModeSandboxResult,
+} from "./code-mode/sandbox";
+export type {
+  CodeModeCallableCaplet,
+  CodeModeDeclarationInput,
+  CodeModeDiagnostic,
+  CodeModeLogs,
+  CodeModeRunEnvelope,
+  CodeModeRunError,
+  CodeModeRunMeta,
+  CodeModeTypesJson,
+  JsonValue,
+  ReadLogsInput,
+  ReadLogsResult,
+  ToolCallResult,
+} from "./code-mode/types";
 export type { CapletSetupCommandConfig, CapletSetupConfig } from "./config";
 export { capletSetupContentHash, stableJson } from "./setup/hash";
 export { LocalSetupStore } from "./setup/local-store";
diff --git a/packages/core/src/native.ts b/packages/core/src/native.ts
index 7d7de31..67d7c0e 100644
--- a/packages/core/src/native.ts
+++ b/packages/core/src/native.ts
@@ -14,6 +14,8 @@ export {
   nativeCapletToolDescription,
   nativeCapletToolName,
   nativeCapletsSystemGuidance,
+  nativeCodeModeRunToolId,
+  nativeCodeModeRunToolName,
 } from "./native/tools";
 export { generatedToolInputSchema } from "./tools";
 export { generatedToolInputJsonSchema } from "./generated-tool-input-schema";
diff --git a/packages/core/src/native/remote.ts b/packages/core/src/native/remote.ts
index 4dd5397..74f2a9c 100644
--- a/packages/core/src/native/remote.ts
+++ b/packages/core/src/native/remote.ts
@@ -10,7 +10,7 @@ import type {
   NativeCapletsToolsChangedListener,
   NativeCapletTool,
 } from "./service";
-import { nativeCapletToolName } from "./tools";
+import { nativeCapletToolName, nativeCodeModeRunToolId } from "./tools";
 
 export type RemoteCapletsTool = {
   name: string;
@@ -253,6 +253,7 @@ function remoteToolToNativeTool(tool: RemoteCapletsTool): NativeCapletTool {
       `Remote Caplet ID: ${tool.name}`,
     ].join("\n"),
     promptGuidance: [`Use ${toolName} through the remote Caplets service.`],
+    ...(tool.name === nativeCodeModeRunToolId ? { codeModeRun: true } : {}),
     inputSchema,
     operationNames: operationNamesFromSchema(inputSchema),
   };
diff --git a/packages/core/src/native/service.ts b/packages/core/src/native/service.ts
index 797aa14..47cdc1e 100644
--- a/packages/core/src/native/service.ts
+++ b/packages/core/src/native/service.ts
@@ -19,7 +19,19 @@ import {
   nativeCapletPromptGuidance,
   nativeCapletToolDescription,
   nativeCapletToolName,
+  nativeCodeModeRunToolId,
+  nativeCodeModeRunToolName,
 } from "./tools";
+import {
+  generateCodeModeDeclarations,
+  generateCodeModeRunToolDescription,
+} from "../code-mode/declarations";
+import { runCodeMode } from "../code-mode/runner";
+import {
+  codeModeRunInputJsonSchema,
+  codeModeRunInputSchema,
+  isCodeModeRunRequest,
+} from "../code-mode/tool";
 import {
   loadLocalOverlayConfigWithSources,
   parseConfig,
@@ -50,6 +62,9 @@ export type NativeCapletTool = {
   toolName: string;
   title: string;
   description: string;
+  codeModeRun?: boolean;
+  useWhen?: string;
+  avoidWhen?: string;
   promptGuidance: string[];
   inputSchema?: ReturnType<typeof generatedToolInputJsonSchemaForCaplet> | Record<string, unknown>;
   operationNames?: string[];
@@ -112,7 +127,7 @@ class DefaultNativeCapletsService implements NativeCapletsService {
   }
 
   listTools(): NativeCapletTool[] {
-    return this.engine.enabledServers().map((caplet) => {
+    const capletTools = this.engine.enabledServers().map((caplet) => {
       const toolName = nativeCapletToolName(caplet.server);
       const inputSchema = generatedToolInputJsonSchemaForCaplet(caplet);
       return {
@@ -120,14 +135,20 @@ class DefaultNativeCapletsService implements NativeCapletsService {
         toolName,
         title: caplet.name,
         description: nativeCapletToolDescription(toolName, caplet),
+        ...(caplet.useWhen ? { useWhen: caplet.useWhen } : {}),
+        ...(caplet.avoidWhen ? { avoidWhen: caplet.avoidWhen } : {}),
         promptGuidance: nativeCapletPromptGuidance(toolName, caplet),
         inputSchema,
         operationNames: [...inputSchema.properties.operation.enum],
       };
     });
+    return [...capletTools, codeModeRunNativeTool(capletTools)];
   }
 
   async execute(capletId: string, request: unknown): Promise<unknown> {
+    if (capletId === nativeCodeModeRunToolId && isCodeModeRunRequest(request)) {
+      return await executeCodeModeRunNative(this, request);
+    }
     return await this.engine.execute(capletId, request);
   }
 
@@ -144,6 +165,68 @@ class DefaultNativeCapletsService implements NativeCapletsService {
   }
 }
 
+function codeModeRunNativeTool(capletTools: NativeCapletTool[]): NativeCapletTool {
+  const declaration = generateCodeModeDeclarations({
+    caplets: capletTools.map((tool) => ({
+      id: tool.caplet,
+      name: tool.title,
+      description: tool.description,
+      ...(tool.useWhen ? { useWhen: tool.useWhen } : {}),
+      ...(tool.avoidWhen ? { avoidWhen: tool.avoidWhen } : {}),
+    })),
+  });
+  return {
+    caplet: nativeCodeModeRunToolId,
+    toolName: nativeCodeModeRunToolName,
+    title: "Code Mode",
+    description: [
+      generateCodeModeRunToolDescription(declaration),
+      "",
+      `Native tool name: ${nativeCodeModeRunToolName}`,
+    ].join("\n"),
+    codeModeRun: true,
+    promptGuidance: [
+      `Use ${nativeCodeModeRunToolName} to run Caplets Code Mode TypeScript with generated caplets.<id> handles.`,
+      "Prefer Code Mode for multi-step Caplet discovery, tool calls, filtering, joins, and compact synthesis.",
+      "Return decision-ready JSON from Code Mode rather than raw bulky provider payloads.",
+    ],
+    inputSchema: codeModeRunInputJsonSchema(),
+  };
+}
+
+async function executeCodeModeRunNative(
+  service: NativeCapletsService,
+  request: unknown,
+): Promise<unknown> {
+  const parsed = codeModeRunInputSchema.safeParse(request);
+  if (!parsed.success) {
+    return {
+      ok: false,
+      error: {
+        code: "REQUEST_INVALID",
+        message: "Code Mode run input is invalid.",
+        details: parsed.error.issues,
+      },
+      diagnostics: [],
+      logs: { entries: [], truncated: false, stored: false },
+      meta: {
+        runId: "",
+        traceId: "",
+        declarationHash: "",
+        durationMs: 0,
+        timeoutMs: 0,
+        maxTimeoutMs: 0,
+      },
+    };
+  }
+  return await runCodeMode({
+    code: parsed.data.code,
+    service,
+    ...(parsed.data.timeoutMs === undefined ? {} : { timeoutMs: parsed.data.timeoutMs }),
+    runtimeScope: process.env.CAPLETS_MODE?.trim() || "local",
+  });
+}
+
 function createDefaultNativeCapletsService(
   options: LocalNativeCapletsServiceOptions,
 ): NativeCapletsService {
@@ -324,6 +407,9 @@ class CompositeNativeCapletsService implements NativeCapletsService {
   }
 
   async execute(capletId: string, request: unknown): Promise<unknown> {
+    if (capletId === nativeCodeModeRunToolId && isCodeModeRunRequest(request)) {
+      return await executeCodeModeRunNative(this, request);
+    }
     if (this.local.listTools().some((tool) => tool.caplet === capletId)) {
       return await this.local.execute(capletId, request);
     }
@@ -386,9 +472,13 @@ class CompositeNativeCapletsService implements NativeCapletsService {
   }
 
   private mergeTools(): NativeCapletTool[] {
-    const localTools = this.local.listTools();
+    const localTools = this.local.listTools().filter((tool) => tool.codeModeRun !== true);
     const localIds = new Set(localTools.map((tool) => tool.caplet));
-    return [...this.remote.listTools().filter((tool) => !localIds.has(tool.caplet)), ...localTools];
+    const remoteTools = this.remote
+      .listTools()
+      .filter((tool) => tool.codeModeRun !== true && !localIds.has(tool.caplet));
+    const mergedTools = [...remoteTools, ...localTools];
+    return [...mergedTools, codeModeRunNativeTool(mergedTools)];
   }
 
   private async reloadChild(
diff --git a/packages/core/src/native/tools.ts b/packages/core/src/native/tools.ts
index a112395..012dd46 100644
--- a/packages/core/src/native/tools.ts
+++ b/packages/core/src/native/tools.ts
@@ -1,6 +1,9 @@
 import type { CapletConfig } from "../config";
 import { capabilityDescription } from "../registry";
 
+export const nativeCodeModeRunToolId = "run";
+export const nativeCodeModeRunToolName = "caplets_run";
+
 export function nativeCapletToolName(capletId: string): string {
   return `caplets_${capletId.replace(/_/g, "__").replace(/-/g, "_")}`;
 }
@@ -15,23 +18,30 @@ export function nativeCapletsSystemGuidance(toolNames: string[]): string {
     "Available Caplets native tools:",
     tools,
     "",
-    "Flow: inspect when the domain is unfamiliar; use search_tools/list_tools for actions; MCP-backed Caplets may also expose resources, prompts, and completions in their tool schema.",
-    "Use fields on call_tool when a non-GraphQL downstream outputSchema allows selecting only needed structured paths.",
+    `${nativeCodeModeRunToolName} executes Caplets Code Mode: TypeScript with generated caplets.<id> handles for multi-step discovery, tool calls, filtering, and compact synthesis in one native call.`,
+    "Flow: inspect when the domain is unfamiliar; use tools/search_tools for downstream names; use describe_tool before call_tool when args matter; pass call_tool.args with exact inputSchema property names.",
+    "Do not guess downstream tool names, resource URIs, prompt names, input args, output fields, or schemas. Do not infer input/output schemas from memory.",
+    "Prefer list/read/search operations for triage and avoid broad provider searches that can return huge payloads or hit rate limits.",
+    "When output shaping matters, inspect one tool with describe_tool and follow its fieldSelection hint.",
   ].join("\n");
 }
 
 export function nativeCapletPromptGuidance(toolName: string, caplet: CapletConfig): string[] {
+  const descriptorFirst =
+    "Use describe_tool before call_tool when args matter; call_tool.args must match inputSchema exactly. Do not guess tool names or schemas.";
   return caplet.backend === "mcp"
     ? [
         `Use ${toolName} for the ${caplet.name} Caplet capability domain.`,
         "Prefer resources for readable context, prompts for reusable workflows, and tools for actions.",
+        descriptorFirst,
       ]
-    : [`Use ${toolName} for the ${caplet.name} Caplet capability domain.`];
+    : [`Use ${toolName} for the ${caplet.name} Caplet capability domain.`, descriptorFirst];
 }
 
 export function nativeCapletToolDescription(toolName: string, caplet: CapletConfig): string {
   return [
     capabilityDescription(caplet),
+    "Use tools/search_tools to find downstream names. Use describe_tool before call_tool when args matter; call_tool.args must match inputSchema exactly. Do not guess tool names or schemas. Prefer read/search/list tools for triage.",
     "",
     `Native tool name: ${toolName}`,
     `Original Caplet ID: ${caplet.server}`,
diff --git a/packages/core/src/observed-output-shapes/extract.ts b/packages/core/src/observed-output-shapes/extract.ts
new file mode 100644
index 0000000..22e3861
--- /dev/null
+++ b/packages/core/src/observed-output-shapes/extract.ts
@@ -0,0 +1,122 @@
+import {
+  OBSERVED_OUTPUT_SHAPE_LIMITS,
+  OBSERVED_OUTPUT_SHAPE_VERSION,
+  type ExtractObservedOutputShapeInput,
+  type JsonShape,
+  type ObservedOutputShape,
+} from "./types";
+import { mergeJsonShapes } from "./merge";
+import { hasTruncatedShape, shapeToTypeScript } from "./typescript";
+
+export function observeOutputShape(
+  input: ExtractObservedOutputShapeInput,
+): ObservedOutputShape | undefined {
+  const shape = extractJsonShape(input.value);
+  if (!shape) return undefined;
+  const merged = input.existing ? mergeJsonShapes(input.existing.jsonShape, shape) : shape;
+  const emitted = shapeToTypeScript(merged);
+  const observed: ObservedOutputShape = {
+    version: OBSERVED_OUTPUT_SHAPE_VERSION,
+    source: "observed",
+    observedAt: (input.now ?? new Date()).toISOString(),
+    sampleCount: (input.existing?.sampleCount ?? 0) + 1,
+    typeScript: emitted.typeScript,
+    jsonShape: merged,
+    truncated: emitted.truncated || hasTruncatedShape(merged),
+  };
+  return storedBytes(observed) > OBSERVED_OUTPUT_SHAPE_LIMITS.maxStoredJsonBytes
+    ? {
+        ...observed,
+        typeScript: "type ObservedOutput = unknown;",
+        jsonShape: { kind: "unknown" },
+        truncated: true,
+      }
+    : observed;
+}
+
+export function extractJsonShape(value: unknown): JsonShape | undefined {
+  if (!isShapeableJsonRoot(value)) return undefined;
+  return shapeFor(value, 0);
+}
+
+export function parseShapeableJsonText(value: unknown): unknown | undefined {
+  if (!isPlainObject(value) || !Array.isArray(value.content) || value.content.length !== 1) {
+    return undefined;
+  }
+  const [item] = value.content;
+  if (!isPlainObject(item) || item.type !== "text" || typeof item.text !== "string") {
+    return undefined;
+  }
+  const text = item.text.trim();
+  if (!text || (!text.startsWith("{") && !text.startsWith("["))) return undefined;
+  try {
+    const parsed = JSON.parse(text) as unknown;
+    return isShapeableJsonRoot(parsed) ? parsed : undefined;
+  } catch {
+    return undefined;
+  }
+}
+
+export function normalizedObservableValue(result: unknown): unknown | undefined {
+  if (isPlainObject(result)) {
+    const structured = result.structuredContent;
+    if (structured !== undefined) {
+      if (isPlainObject(structured) && "caplets" in structured && "result" in structured) {
+        return isShapeableJsonRoot(structured.result) ? structured.result : undefined;
+      }
+      return isShapeableJsonRoot(structured) ? structured : undefined;
+    }
+  }
+  return parseShapeableJsonText(result);
+}
+
+function shapeFor(value: unknown, depth: number): JsonShape {
+  if (depth >= OBSERVED_OUTPUT_SHAPE_LIMITS.maxDepth) return { kind: "unknown" };
+  if (value === null) return { kind: "null" };
+  if (typeof value === "boolean") return { kind: "boolean" };
+  if (typeof value === "number") return { kind: "number" };
+  if (typeof value === "string") return { kind: "string" };
+  if (Array.isArray(value)) return arrayShape(value, depth);
+  if (isPlainObject(value)) return objectShape(value, depth);
+  return { kind: "unknown" };
+}
+
+function arrayShape(value: unknown[], depth: number): JsonShape {
+  const sampled = value.slice(0, OBSERVED_OUTPUT_SHAPE_LIMITS.maxArrayElements);
+  let element: JsonShape | undefined;
+  for (const item of sampled) {
+    const itemShape = shapeFor(item, depth + 1);
+    element = element ? mergeJsonShapes(element, itemShape) : itemShape;
+  }
+  return {
+    kind: "array",
+    ...(element ? { element } : {}),
+    ...(value.length > sampled.length ? { truncated: true } : {}),
+  };
+}
+
+function objectShape(value: Record<string, unknown>, depth: number): JsonShape {
+  const keys = Object.keys(value).sort();
+  const selected = keys.slice(0, OBSERVED_OUTPUT_SHAPE_LIMITS.maxObjectFields);
+  const fields: Record<string, { optional: boolean; shape: JsonShape }> = {};
+  for (const key of selected) {
+    fields[key] = { optional: true, shape: shapeFor(value[key], depth + 1) };
+  }
+  return {
+    kind: "object",
+    fields,
+    ...(keys.length > selected.length ? { truncated: true } : {}),
+  };
+}
+
+function isShapeableJsonRoot(value: unknown): boolean {
+  return Array.isArray(value) || isPlainObject(value);
+}
+
+function isPlainObject(value: unknown): value is Record<string, unknown> {
+  return Boolean(value) && typeof value === "object" && !Array.isArray(value);
+}
+
+function storedBytes(value: unknown): number {
+  return new TextEncoder().encode(JSON.stringify(value)).byteLength;
+}
diff --git a/packages/core/src/observed-output-shapes/file-store.ts b/packages/core/src/observed-output-shapes/file-store.ts
new file mode 100644
index 0000000..6c87b62
--- /dev/null
+++ b/packages/core/src/observed-output-shapes/file-store.ts
@@ -0,0 +1,170 @@
+import {
+  existsSync,
+  mkdirSync,
+  readdirSync,
+  readFileSync,
+  renameSync,
+  rmSync,
+  statSync,
+  writeFileSync,
+} from "node:fs";
+import { join } from "node:path";
+import {
+  OBSERVED_OUTPUT_SHAPE_LIMITS,
+  type ObservedOutputShape,
+  type ObservedOutputShapeKey,
+  type ObservedOutputShapePruneResult,
+  type ObservedOutputShapeStore,
+  type ObservedOutputShapeStoreHealth,
+} from "./types";
+import { observedOutputShapeStorageKey } from "./key";
+
+type StoredObservedOutputShape = {
+  key: ObservedOutputShapeKey;
+  shape: ObservedOutputShape;
+  createdAt: string;
+  expiresAt: string;
+};
+
+export class FileObservedOutputShapeStore implements ObservedOutputShapeStore {
+  constructor(
+    private readonly cacheDir: string,
+    private readonly options: {
+      ttlMs?: number | undefined;
+      maxEntries?: number | undefined;
+    } = {},
+  ) {}
+
+  async read(key: ObservedOutputShapeKey): Promise<ObservedOutputShape | undefined> {
+    try {
+      const parsed = JSON.parse(
+        readFileSync(this.pathFor(key), "utf8"),
+      ) as StoredObservedOutputShape;
+      if (Date.now() > Date.parse(parsed.expiresAt)) return undefined;
+      if (!isObservedOutputShape(parsed.shape)) return undefined;
+      return parsed.shape;
+    } catch {
+      return undefined;
+    }
+  }
+
+  async write(key: ObservedOutputShapeKey, shape: ObservedOutputShape): Promise<void> {
+    const payload: StoredObservedOutputShape = {
+      key,
+      shape,
+      createdAt: new Date().toISOString(),
+      expiresAt: new Date(Date.now() + this.ttlMs()).toISOString(),
+    };
+    const bytes = new TextEncoder().encode(JSON.stringify(payload)).byteLength;
+    if (bytes > OBSERVED_OUTPUT_SHAPE_LIMITS.maxStoredJsonBytes) return;
+    mkdirSync(this.cacheDir, { recursive: true });
+    const path = this.pathFor(key);
+    const tempPath = `${path}.${process.pid}.tmp`;
+    writeFileSync(tempPath, JSON.stringify(payload), { mode: 0o600 });
+    renameSync(tempPath, path);
+    void this.prune().catch(() => undefined);
+  }
+
+  async prune(now = new Date()): Promise<ObservedOutputShapePruneResult> {
+    if (!existsSync(this.cacheDir)) return { removed: 0, remaining: 0 };
+    const files = this.entries();
+    let removed = 0;
+    const live: { path: string; expiresAt: number; mtimeMs: number }[] = [];
+    for (const file of files) {
+      try {
+        const parsed = JSON.parse(readFileSync(file.path, "utf8")) as StoredObservedOutputShape;
+        const expiresAt = Date.parse(parsed.expiresAt);
+        if (
+          !Number.isFinite(expiresAt) ||
+          now.getTime() > expiresAt ||
+          !isObservedOutputShape(parsed.shape)
+        ) {
+          rmSync(file.path, { force: true });
+          removed++;
+          continue;
+        }
+        live.push({ path: file.path, expiresAt, mtimeMs: file.mtimeMs });
+      } catch {
+        rmSync(file.path, { force: true });
+        removed++;
+      }
+    }
+    const maxEntries = this.maxEntries();
+    const overflow = Math.max(0, live.length - maxEntries);
+    if (overflow > 0) {
+      for (const entry of live.sort((a, b) => a.mtimeMs - b.mtimeMs).slice(0, overflow)) {
+        rmSync(entry.path, { force: true });
+        removed++;
+      }
+    }
+    return { removed, remaining: Math.max(0, live.length - overflow) };
+  }
+
+  async health(): Promise<ObservedOutputShapeStoreHealth> {
+    try {
+      mkdirSync(this.cacheDir, { recursive: true });
+      const probe = join(this.cacheDir, `.health-${process.pid}.json`);
+      writeFileSync(probe, "{}", { mode: 0o600 });
+      rmSync(probe, { force: true });
+      const prune = await this.prune();
+      return {
+        path: this.cacheDir,
+        readable: true,
+        writable: true,
+        entryCount: this.entries().length,
+        prune,
+      };
+    } catch (error) {
+      return {
+        path: this.cacheDir,
+        readable: false,
+        writable: false,
+        error: error instanceof Error ? error.message : String(error),
+      };
+    }
+  }
+
+  private pathFor(key: ObservedOutputShapeKey): string {
+    return join(this.cacheDir, `${observedOutputShapeStorageKey(key)}.json`);
+  }
+
+  private entries(): { path: string; mtimeMs: number }[] {
+    try {
+      return readdirSync(this.cacheDir, { withFileTypes: true })
+        .filter((entry) => entry.isFile() && entry.name.endsWith(".json"))
+        .map((entry) => {
+          const path = join(this.cacheDir, entry.name);
+          return { path, mtimeMs: readMtimeMs(path) };
+        });
+    } catch {
+      return [];
+    }
+  }
+
+  private ttlMs(): number {
+    return this.options.ttlMs ?? OBSERVED_OUTPUT_SHAPE_LIMITS.ttlMs;
+  }
+
+  private maxEntries(): number {
+    return this.options.maxEntries ?? OBSERVED_OUTPUT_SHAPE_LIMITS.maxLocalEntries;
+  }
+}
+
+function readMtimeMs(path: string): number {
+  try {
+    return statSync(path).mtimeMs;
+  } catch {
+    return 0;
+  }
+}
+
+function isObservedOutputShape(value: unknown): value is ObservedOutputShape {
+  return Boolean(
+    value &&
+    typeof value === "object" &&
+    (value as { version?: unknown }).version === 1 &&
+    (value as { source?: unknown }).source === "observed" &&
+    typeof (value as { typeScript?: unknown }).typeScript === "string" &&
+    typeof (value as { sampleCount?: unknown }).sampleCount === "number",
+  );
+}
diff --git a/packages/core/src/observed-output-shapes/index.ts b/packages/core/src/observed-output-shapes/index.ts
new file mode 100644
index 0000000..f865ab3
--- /dev/null
+++ b/packages/core/src/observed-output-shapes/index.ts
@@ -0,0 +1,26 @@
+export { FileObservedOutputShapeStore } from "./file-store";
+export {
+  extractJsonShape,
+  normalizedObservableValue,
+  observeOutputShape,
+  parseShapeableJsonText,
+} from "./extract";
+export {
+  backendFingerprint,
+  observedOutputShapeKey,
+  observedOutputShapeStorageKey,
+  stableHash,
+} from "./key";
+export { mergeJsonShapes } from "./merge";
+export { usefulOutputSchema } from "./schema";
+export { hasTruncatedShape, shapeToTypeScript, shapeType } from "./typescript";
+export {
+  OBSERVED_OUTPUT_SHAPE_LIMITS,
+  OBSERVED_OUTPUT_SHAPE_VERSION,
+  type JsonShape,
+  type ObservedOutputShape,
+  type ObservedOutputShapeKey,
+  type ObservedOutputShapePruneResult,
+  type ObservedOutputShapeStore,
+  type ObservedOutputShapeStoreHealth,
+} from "./types";
diff --git a/packages/core/src/observed-output-shapes/key.ts b/packages/core/src/observed-output-shapes/key.ts
new file mode 100644
index 0000000..068d5a1
--- /dev/null
+++ b/packages/core/src/observed-output-shapes/key.ts
@@ -0,0 +1,139 @@
+import { createHash } from "node:crypto";
+import type { CapletConfig } from "../config";
+import { schemaHash } from "../schema-hash";
+import { OBSERVED_OUTPUT_SHAPE_VERSION, type ObservedOutputShapeKey } from "./types";
+
+export function observedOutputShapeStorageKey(key: ObservedOutputShapeKey): string {
+  return stableHash(key);
+}
+
+export function observedOutputShapeKey(input: {
+  scope: ObservedOutputShapeKey["scope"];
+  workspaceId?: string | undefined;
+  projectFingerprint?: string | undefined;
+  caplet: CapletConfig;
+  toolName: string;
+  toolDescriptor?: unknown;
+  outputSchema?: unknown;
+}): ObservedOutputShapeKey {
+  const toolDescriptorHash = input.toolDescriptor ? stableHash(input.toolDescriptor) : undefined;
+  const outputSchemaHash = schemaHash(input.outputSchema) ?? undefined;
+  return {
+    scope: input.scope,
+    ...(input.workspaceId ? { workspaceId: input.workspaceId } : {}),
+    ...(input.projectFingerprint ? { projectFingerprint: input.projectFingerprint } : {}),
+    capletId: input.caplet.server,
+    backendKind: input.caplet.backend,
+    backendFingerprint: backendFingerprint(input.caplet),
+    toolName: input.toolName,
+    ...(toolDescriptorHash ? { toolDescriptorHash } : {}),
+    ...(outputSchemaHash ? { outputSchemaHash } : {}),
+    resultVersion: OBSERVED_OUTPUT_SHAPE_VERSION,
+  };
+}
+
+export function backendFingerprint(caplet: CapletConfig): string {
+  return stableHash(nonSecretBackendIdentity(caplet));
+}
+
+export function stableHash(value: unknown): string {
+  return createHash("sha256")
+    .update(JSON.stringify(stableJsonValue(value)))
+    .digest("hex");
+}
+
+function nonSecretBackendIdentity(caplet: CapletConfig): unknown {
+  switch (caplet.backend) {
+    case "mcp":
+      return caplet.transport === "stdio"
+        ? {
+            backend: caplet.backend,
+            server: caplet.server,
+            transport: caplet.transport,
+            command: caplet.command,
+            args: caplet.args,
+            cwd: caplet.cwd,
+          }
+        : {
+            backend: caplet.backend,
+            server: caplet.server,
+            transport: caplet.transport,
+            url: caplet.url,
+          };
+    case "openapi":
+      return {
+        backend: caplet.backend,
+        server: caplet.server,
+        specPath: caplet.specPath,
+        specUrl: caplet.specUrl,
+        baseUrl: caplet.baseUrl,
+      };
+    case "graphql":
+      return {
+        backend: caplet.backend,
+        server: caplet.server,
+        endpointUrl: caplet.endpointUrl,
+        schemaPath: caplet.schemaPath,
+        schemaUrl: caplet.schemaUrl,
+        introspection: caplet.introspection,
+        operations: caplet.operations,
+      };
+    case "http":
+      return {
+        backend: caplet.backend,
+        server: caplet.server,
+        baseUrl: caplet.baseUrl,
+        actions: Object.fromEntries(
+          Object.entries(caplet.actions).map(([name, action]) => [
+            name,
+            {
+              method: action.method,
+              path: action.path,
+              query: action.query,
+              hasJsonBody: action.jsonBody !== undefined,
+            },
+          ]),
+        ),
+      };
+    case "cli":
+      return {
+        backend: caplet.backend,
+        server: caplet.server,
+        cwd: caplet.cwd,
+        actions: Object.fromEntries(
+          Object.entries(caplet.actions).map(([name, action]) => [
+            name,
+            {
+              command: action.command,
+              args: action.args,
+              cwd: action.cwd,
+              output: action.output,
+            },
+          ]),
+        ),
+      };
+    case "caplets":
+      return {
+        backend: caplet.backend,
+        server: caplet.server,
+        configPath: caplet.configPath,
+        capletsRoot: caplet.capletsRoot,
+      };
+  }
+}
+
+function stableJsonValue(value: unknown): unknown {
+  if (Array.isArray(value)) {
+    return value.map((item) => stableJsonValue(item));
+  }
+  if (value && typeof value === "object") {
+    const record = value as Record<string, unknown>;
+    const sorted: Record<string, unknown> = {};
+    for (const key of Object.keys(record).sort()) {
+      const item = record[key];
+      if (item !== undefined) sorted[key] = stableJsonValue(item);
+    }
+    return sorted;
+  }
+  return value;
+}
diff --git a/packages/core/src/observed-output-shapes/merge.ts b/packages/core/src/observed-output-shapes/merge.ts
new file mode 100644
index 0000000..ea60bba
--- /dev/null
+++ b/packages/core/src/observed-output-shapes/merge.ts
@@ -0,0 +1,74 @@
+import { OBSERVED_OUTPUT_SHAPE_LIMITS, type JsonShape } from "./types";
+
+export function mergeJsonShapes(left: JsonShape, right: JsonShape): JsonShape {
+  if (left.kind === "unknown" || right.kind === "unknown") return { kind: "unknown" };
+  if (left.kind === right.kind) {
+    if (left.kind === "object" && right.kind === "object") return mergeObjects(left, right);
+    if (left.kind === "array" && right.kind === "array") return mergeArrays(left, right);
+    if (left.kind === "union" && right.kind === "union") {
+      return boundedUnion([...left.variants, ...right.variants]);
+    }
+    return left;
+  }
+  return boundedUnion([
+    ...(left.kind === "union" ? left.variants : [left]),
+    ...(right.kind === "union" ? right.variants : [right]),
+  ]);
+}
+
+function mergeObjects(
+  left: Extract<JsonShape, { kind: "object" }>,
+  right: Extract<JsonShape, { kind: "object" }>,
+): JsonShape {
+  const fields: Record<string, { optional: boolean; shape: JsonShape }> = {};
+  const keys = [...new Set([...Object.keys(left.fields), ...Object.keys(right.fields)])].sort();
+  let truncated = left.truncated === true || right.truncated === true;
+  const selected = keys.slice(0, OBSERVED_OUTPUT_SHAPE_LIMITS.maxObjectFields);
+  truncated = truncated || keys.length > selected.length;
+  for (const key of selected) {
+    const leftField = left.fields[key];
+    const rightField = right.fields[key];
+    if (leftField && rightField) {
+      fields[key] = {
+        optional: true,
+        shape: mergeJsonShapes(leftField.shape, rightField.shape),
+      };
+    } else {
+      fields[key] = {
+        optional: true,
+        shape: (leftField ?? rightField)!.shape,
+      };
+    }
+  }
+  return { kind: "object", fields, ...(truncated ? { truncated: true } : {}) };
+}
+
+function mergeArrays(
+  left: Extract<JsonShape, { kind: "array" }>,
+  right: Extract<JsonShape, { kind: "array" }>,
+): JsonShape {
+  const element =
+    left.element && right.element
+      ? mergeJsonShapes(left.element, right.element)
+      : (left.element ?? right.element);
+  return {
+    kind: "array",
+    ...(element ? { element } : {}),
+    ...(left.truncated === true || right.truncated === true ? { truncated: true } : {}),
+  };
+}
+
+function boundedUnion(variants: JsonShape[]): JsonShape {
+  const flattened = variants.flatMap((variant) =>
+    variant.kind === "union" ? variant.variants : [variant],
+  );
+  const unique: JsonShape[] = [];
+  for (const variant of flattened) {
+    if (variant.kind === "unknown") return { kind: "unknown" };
+    const key = JSON.stringify(variant);
+    if (!unique.some((existing) => JSON.stringify(existing) === key)) unique.push(variant);
+  }
+  if (unique.length === 1) return unique[0]!;
+  if (unique.length > OBSERVED_OUTPUT_SHAPE_LIMITS.maxUnionVariants) return { kind: "unknown" };
+  return { kind: "union", variants: unique.sort((a, b) => a.kind.localeCompare(b.kind)) };
+}
diff --git a/packages/core/src/observed-output-shapes/schema.ts b/packages/core/src/observed-output-shapes/schema.ts
new file mode 100644
index 0000000..9475a6f
--- /dev/null
+++ b/packages/core/src/observed-output-shapes/schema.ts
@@ -0,0 +1,24 @@
+export function usefulOutputSchema(schema: unknown): boolean {
+  if (!isPlainObject(schema)) return false;
+  if (Object.keys(schema).length === 0) return false;
+  if ("const" in schema || Array.isArray(schema.enum)) return true;
+  const type = schema.type;
+  if (Array.isArray(type))
+    return type.some((item) => usefulOutputSchema({ ...schema, type: item }));
+  if (type === "object" || isPlainObject(schema.properties)) {
+    if (isPlainObject(schema.properties) && Object.keys(schema.properties).length > 0) return true;
+    if (schema.additionalProperties === false) return true;
+    if (isPlainObject(schema.additionalProperties)) return true;
+    return false;
+  }
+  if (type === "array") return usefulOutputSchema(schema.items);
+  if (typeof type === "string") return true;
+  if (Array.isArray(schema.oneOf) || Array.isArray(schema.anyOf) || Array.isArray(schema.allOf)) {
+    return true;
+  }
+  return false;
+}
+
+function isPlainObject(value: unknown): value is Record<string, unknown> {
+  return Boolean(value) && typeof value === "object" && !Array.isArray(value);
+}
diff --git a/packages/core/src/observed-output-shapes/types.ts b/packages/core/src/observed-output-shapes/types.ts
new file mode 100644
index 0000000..8f06c1d
--- /dev/null
+++ b/packages/core/src/observed-output-shapes/types.ts
@@ -0,0 +1,80 @@
+import type { JsonValue } from "../code-mode/types";
+
+export const OBSERVED_OUTPUT_SHAPE_VERSION = 1;
+
+export const OBSERVED_OUTPUT_SHAPE_LIMITS = {
+  maxDepth: 6,
+  maxObjectFields: 40,
+  maxArrayElements: 20,
+  maxUnionVariants: 4,
+  maxTypeScriptChars: 4_000,
+  maxStoredJsonBytes: 16_000,
+  ttlMs: 30 * 24 * 60 * 60 * 1000,
+  maxLocalEntries: 2_000,
+} as const;
+
+export type JsonShape =
+  | { kind: "null" }
+  | { kind: "boolean" }
+  | { kind: "number" }
+  | { kind: "string" }
+  | { kind: "unknown" }
+  | { kind: "array"; element?: JsonShape; truncated?: boolean }
+  | {
+      kind: "object";
+      fields: Record<string, { optional: boolean; shape: JsonShape }>;
+      truncated?: boolean;
+    }
+  | { kind: "union"; variants: JsonShape[] };
+
+export type ObservedOutputShape = {
+  version: 1;
+  source: "observed";
+  observedAt: string;
+  sampleCount: number;
+  typeScript: string;
+  jsonShape: JsonShape;
+  truncated: boolean;
+};
+
+export type ObservedOutputShapeKey = {
+  scope: "local" | "self_hosted" | "cloud";
+  workspaceId?: string | undefined;
+  projectFingerprint?: string | undefined;
+  capletId: string;
+  backendKind: string;
+  backendFingerprint: string;
+  toolName: string;
+  toolDescriptorHash?: string | undefined;
+  outputSchemaHash?: string | undefined;
+  resultVersion: 1;
+};
+
+export type ObservedOutputShapePruneResult = {
+  removed: number;
+  remaining: number;
+};
+
+export type ObservedOutputShapeStoreHealth = {
+  path?: string | undefined;
+  readable: boolean;
+  writable: boolean;
+  entryCount?: number | undefined;
+  prune?: ObservedOutputShapePruneResult | undefined;
+  error?: string | undefined;
+};
+
+export interface ObservedOutputShapeStore {
+  read(key: ObservedOutputShapeKey): Promise<ObservedOutputShape | undefined>;
+  write(key: ObservedOutputShapeKey, shape: ObservedOutputShape): Promise<void>;
+  prune?(now?: Date): Promise<ObservedOutputShapePruneResult>;
+  health?(): Promise<ObservedOutputShapeStoreHealth>;
+}
+
+export type ExtractObservedOutputShapeInput = {
+  value: unknown;
+  now?: Date | undefined;
+  existing?: ObservedOutputShape | undefined;
+};
+
+export type ExtractedJsonValue = Extract<JsonValue, unknown[] | { [key: string]: JsonValue }>;
diff --git a/packages/core/src/observed-output-shapes/typescript.ts b/packages/core/src/observed-output-shapes/typescript.ts
new file mode 100644
index 0000000..7a8f025
--- /dev/null
+++ b/packages/core/src/observed-output-shapes/typescript.ts
@@ -0,0 +1,66 @@
+import { OBSERVED_OUTPUT_SHAPE_LIMITS, type JsonShape } from "./types";
+
+export function shapeToTypeScript(
+  shape: JsonShape,
+  typeName: string = "ObservedOutput",
+  maxChars: number = OBSERVED_OUTPUT_SHAPE_LIMITS.maxTypeScriptChars,
+): { typeScript: string; truncated: boolean } {
+  const body = shapeType(shape);
+  const typeScript = `type ${typeName} = ${body};`;
+  if (typeScript.length <= maxChars) {
+    return { typeScript, truncated: hasTruncatedShape(shape) };
+  }
+  return { typeScript: `type ${typeName} = unknown;`, truncated: true };
+}
+
+export function shapeType(shape: JsonShape): string {
+  switch (shape.kind) {
+    case "null":
+      return "null";
+    case "boolean":
+      return "boolean";
+    case "number":
+      return "number";
+    case "string":
+      return "string";
+    case "unknown":
+      return "unknown";
+    case "array":
+      return `${shape.element ? wrapArrayElement(shapeType(shape.element)) : "unknown"}[]`;
+    case "object":
+      return objectType(shape);
+    case "union":
+      return unionType(shape.variants);
+  }
+}
+
+export function hasTruncatedShape(shape: JsonShape): boolean {
+  if ("truncated" in shape && shape.truncated === true) return true;
+  if (shape.kind === "array") return shape.element ? hasTruncatedShape(shape.element) : false;
+  if (shape.kind === "object") {
+    return Object.values(shape.fields).some((field) => hasTruncatedShape(field.shape));
+  }
+  if (shape.kind === "union") return shape.variants.some((variant) => hasTruncatedShape(variant));
+  return false;
+}
+
+function objectType(shape: Extract<JsonShape, { kind: "object" }>): string {
+  const entries = Object.entries(shape.fields);
+  if (entries.length === 0) return "Record<string, unknown>";
+  return `{ ${entries
+    .map(([key, field]) => `${propertyName(key)}?: ${shapeType(field.shape)};`)
+    .join(" ")} }`;
+}
+
+function unionType(variants: JsonShape[]): string {
+  const rendered = [...new Set(variants.map((variant) => shapeType(variant)))];
+  return rendered.length === 0 ? "unknown" : rendered.join(" | ");
+}
+
+function wrapArrayElement(value: string): string {
+  return value.includes(" | ") ? `(${value})` : value;
+}
+
+function propertyName(key: string): string {
+  return /^[A-Za-z_$][\w$]*$/u.test(key) ? key : JSON.stringify(key);
+}
diff --git a/packages/core/src/openapi.ts b/packages/core/src/openapi.ts
index 28ac3af..aaba738 100644
--- a/packages/core/src/openapi.ts
+++ b/packages/core/src/openapi.ts
@@ -4,7 +4,12 @@ import { parse as parseYaml } from "yaml";
 import { genericOAuthHeaders } from "./auth";
 import type { OpenApiEndpointConfig } from "./config";
 import { isAllowedRemoteUrl } from "./config/validation";
-import type { CompactTool } from "./downstream";
+import {
+  compactToolSafetyHints,
+  compactToolSchemaHints,
+  compactToolSelectionHints,
+  type CompactTool,
+} from "./downstream";
 import { CapletsError, toSafeError } from "./errors";
 import { isAbortError, parseHttpBody, readLimitedText } from "./http/utils";
 import type { ServerRegistry } from "./registry";
@@ -179,11 +184,14 @@ export class OpenApiManager {
 
   compact(endpoint: OpenApiEndpointConfig, tool: Tool): CompactTool {
     return {
-      id: endpoint.server,
-      tool: tool.name,
+      name: tool.name,
       ...(tool.description ? { description: tool.description } : {}),
       hasInputSchema: Boolean(tool.inputSchema),
       hasOutputSchema: Boolean(tool.outputSchema),
+      supportsFields: Boolean(tool.outputSchema),
+      ...compactToolSelectionHints(tool),
+      ...compactToolSchemaHints(tool),
+      ...compactToolSafetyHints(tool),
     };
   }
 
diff --git a/packages/core/src/registry.ts b/packages/core/src/registry.ts
index b422430..deb1e48 100644
--- a/packages/core/src/registry.ts
+++ b/packages/core/src/registry.ts
@@ -13,6 +13,8 @@ export type CapletServerSummary = {
   id: string;
   name: string;
   description: string;
+  useWhen?: string;
+  avoidWhen?: string;
   disabled?: boolean;
   status: ServerStatus;
   lastError?: SafeErrorSummary;
@@ -22,6 +24,8 @@ export type CapletServerDetail = {
   id: string;
   name: string;
   description: string;
+  useWhen?: string;
+  avoidWhen?: string;
   tags?: string[];
   backend:
     | {
@@ -119,6 +123,8 @@ export class ServerRegistry {
       id: server.server,
       name: server.name,
       description: server.description,
+      ...(server.useWhen ? { useWhen: server.useWhen } : {}),
+      ...(server.avoidWhen ? { avoidWhen: server.avoidWhen } : {}),
       ...(server.disabled ? { disabled: true } : {}),
       status: status?.status ?? (server.disabled ? "disabled" : "not_started"),
       ...(status?.lastError ? { lastError: status.lastError } : {}),
@@ -131,6 +137,8 @@ export class ServerRegistry {
       id: server.server,
       name: server.name,
       description: server.description,
+      ...(server.useWhen ? { useWhen: server.useWhen } : {}),
+      ...(server.avoidWhen ? { avoidWhen: server.avoidWhen } : {}),
       ...(server.tags ? { tags: server.tags } : {}),
       backend,
     };
diff --git a/packages/core/src/remote-control/dispatch.ts b/packages/core/src/remote-control/dispatch.ts
index 7f5b74b..5983002 100644
--- a/packages/core/src/remote-control/dispatch.ts
+++ b/packages/core/src/remote-control/dispatch.ts
@@ -28,16 +28,16 @@ type AddKind = "cli" | "mcp" | "openapi" | "graphql" | "http";
 
 const ENGINE_COMMANDS = new Set<RemoteCliRequest["command"]>([
   "inspect",
-  "check_backend",
-  "list_tools",
+  "check",
+  "tools",
   "search_tools",
-  "get_tool",
+  "describe_tool",
   "call_tool",
-  "list_resources",
+  "resources",
   "search_resources",
-  "list_resource_templates",
+  "resource_templates",
   "read_resource",
-  "list_prompts",
+  "prompts",
   "search_prompts",
   "get_prompt",
   "complete",
diff --git a/packages/core/src/remote-control/types.ts b/packages/core/src/remote-control/types.ts
index 002014e..f26774d 100644
--- a/packages/core/src/remote-control/types.ts
+++ b/packages/core/src/remote-control/types.ts
@@ -3,16 +3,16 @@ import type { CapletsErrorCode } from "../errors";
 export type RemoteCliCommand =
   | "list"
   | "inspect"
-  | "check_backend"
-  | "list_tools"
+  | "check"
+  | "tools"
   | "search_tools"
-  | "get_tool"
+  | "describe_tool"
   | "call_tool"
-  | "list_resources"
+  | "resources"
   | "search_resources"
-  | "list_resource_templates"
+  | "resource_templates"
   | "read_resource"
-  | "list_prompts"
+  | "prompts"
   | "search_prompts"
   | "get_prompt"
   | "complete"
diff --git a/packages/core/src/result-content.ts b/packages/core/src/result-content.ts
index a90f11e..c78b77f 100644
--- a/packages/core/src/result-content.ts
+++ b/packages/core/src/result-content.ts
@@ -210,27 +210,37 @@ function renderDiscoveryWrapper(
 ): string {
   const result = asRecord(value.result);
   const lines = [title, ""];
-  if (context.operation === "list_tools" || context.operation === "search_tools") {
-    lines.push("## Tools", "", renderNamedList(arrayValue(result?.tools), "tool"), "");
-  } else if (context.operation === "list_resources" || context.operation === "search_resources") {
+  if (context.operation === "tools" || context.operation === "search_tools") {
+    lines.push(
+      "## Tools",
+      "",
+      renderNamedList(arrayValue(result?.items ?? result?.tools), "tool"),
+      "",
+    );
+  } else if (context.operation === "resources" || context.operation === "search_resources") {
     lines.push(
       "## Resources",
       "",
-      renderNamedList(arrayValue(result?.resources ?? result?.matches), "uri"),
+      renderNamedList(arrayValue(result?.items ?? result?.resources ?? result?.matches), "uri"),
       "",
     );
-  } else if (context.operation === "list_resource_templates") {
+  } else if (context.operation === "resource_templates") {
     lines.push(
       "## Resource Templates",
       "",
-      renderNamedList(arrayValue(result?.resourceTemplates), "uriTemplate"),
+      renderNamedList(arrayValue(result?.items ?? result?.resourceTemplates), "uriTemplate"),
+      "",
+    );
+  } else if (context.operation === "prompts" || context.operation === "search_prompts") {
+    lines.push(
+      "## Prompts",
+      "",
+      renderNamedList(arrayValue(result?.items ?? result?.prompts), "prompt"),
       "",
     );
-  } else if (context.operation === "list_prompts" || context.operation === "search_prompts") {
-    lines.push("## Prompts", "", renderNamedList(arrayValue(result?.prompts), "prompt"), "");
-  } else if (context.operation === "get_tool") {
+  } else if (context.operation === "describe_tool") {
     lines.push("## Tool", "", renderToolSummary(asRecord(result?.tool)), "");
-  } else if (context.operation === "check_backend") {
+  } else if (context.operation === "check") {
     lines.push("## Backend Status", "", renderBackendStatus(result), "");
   } else if (context.operation === "inspect") {
     lines.push("## Caplet", "", renderCapletSummary(result), "");
diff --git a/packages/core/src/serve/session.ts b/packages/core/src/serve/session.ts
index 5ad582a..b5e80be 100644
--- a/packages/core/src/serve/session.ts
+++ b/packages/core/src/serve/session.ts
@@ -5,6 +5,20 @@ import type { CapletConfig, CapletsConfig } from "../config";
 import type { CapletsEngine } from "../engine";
 import { capabilityDescription } from "../registry";
 import { generatedToolInputSchemaForCaplet } from "../generated-tool-input-schema";
+import { listCodeModeCallableCaplets } from "../code-mode/api";
+import {
+  generateCodeModeDeclarations,
+  generateCodeModeRunToolDescription,
+} from "../code-mode/declarations";
+import { runCodeMode } from "../code-mode/runner";
+import { codeModeRunInputSchema, codeModeRunParamsSchema } from "../code-mode/tool";
+import { CodeModeLogStore } from "../code-mode/logs";
+import type { NativeCapletTool, NativeCapletsService } from "../native/service";
+import {
+  nativeCapletPromptGuidance,
+  nativeCapletToolDescription,
+  nativeCapletToolName,
+} from "../native/tools";
 
 export type ToolServer = Pick<McpServer, "registerTool" | "connect" | "close">;
 
@@ -15,6 +29,7 @@ export type CapletsMcpSessionOptions = {
 export class CapletsMcpSession {
   readonly server: ToolServer;
   private readonly tools = new Map<string, RegisteredTool>();
+  private readonly codeModeRunTool: RegisteredTool;
   private readonly unsubscribeReload: () => void;
   private closed = false;
 
@@ -28,6 +43,7 @@ export class CapletsMcpSession {
         name: "caplets",
         version: packageJsonVersion,
       });
+    this.codeModeRunTool = this.registerCodeModeRunTool();
     this.unsubscribeReload = this.engine.onReload(({ previous, next }) =>
       this.reconcileTools(previous, next),
     );
@@ -48,11 +64,69 @@ export class CapletsMcpSession {
     }
     this.closed = true;
     this.unsubscribeReload();
+    this.codeModeRunTool.remove();
     this.tools.clear();
     await this.server.close();
   }
 
+  private registerCodeModeRunTool(): RegisteredTool {
+    const codeModeService = new EngineNativeCapletsService(this.engine);
+    return this.server.registerTool(
+      "run",
+      {
+        title: "Code Mode",
+        description: codeModeRunToolDescription(codeModeService),
+        inputSchema: codeModeRunParamsSchema,
+      },
+      async (request: unknown) => this.handleCodeModeRunTool(request),
+    );
+  }
+
+  private async handleCodeModeRunTool(request: unknown): Promise<any> {
+    const parsed = codeModeRunInputSchema.safeParse(request);
+    const envelope = parsed.success
+      ? await runCodeMode({
+          code: parsed.data.code,
+          service: new EngineNativeCapletsService(this.engine),
+          ...(parsed.data.timeoutMs === undefined ? {} : { timeoutMs: parsed.data.timeoutMs }),
+          logStore: new CodeModeLogStore(),
+        })
+      : {
+          ok: false as const,
+          error: {
+            code: "REQUEST_INVALID",
+            message: "Code Mode run input is invalid.",
+            details: parsed.error.issues,
+          },
+          diagnostics: [],
+          logs: { entries: [], truncated: false, stored: false },
+          meta: {
+            runId: "",
+            traceId: "",
+            declarationHash: "",
+            durationMs: 0,
+            timeoutMs: 0,
+            maxTimeoutMs: 0,
+          },
+        };
+    return {
+      content: [{ type: "text" as const, text: JSON.stringify(envelope, null, 2) }],
+      structuredContent: envelope,
+      isError: !envelope.ok,
+    };
+  }
+
   private reconcileTools(previous: CapletsConfig | undefined, next: CapletsConfig): void {
+    if (previous) {
+      this.codeModeRunTool.update({
+        title: "Code Mode",
+        description: codeModeRunToolDescription(new EngineNativeCapletsService(this.engine)),
+        paramsSchema: codeModeRunParamsSchema,
+        callback: async (request: unknown) => this.handleCodeModeRunTool(request),
+        enabled: true,
+      });
+    }
+
     const enabled = new Map(nextEnabledServers(next).map((server) => [server.server, server]));
 
     for (const [serverId, tool] of this.tools) {
@@ -69,7 +143,7 @@ export class CapletsMcpSession {
           title: caplet.name,
           description: capabilityDescription(caplet),
           paramsSchema: generatedToolInputSchemaForCaplet(caplet).shape,
-          callback: async (request) => this.handleTool(serverId, request),
+          callback: async (request: unknown) => this.handleTool(serverId, request),
           enabled: true,
         });
       }
@@ -91,7 +165,7 @@ export class CapletsMcpSession {
         description: capabilityDescription(caplet),
         inputSchema: generatedToolInputSchemaForCaplet(caplet).shape,
       },
-      async (request) => this.handleTool(caplet.server, request),
+      async (request: unknown) => this.handleTool(caplet.server, request),
     );
   }
 
@@ -100,6 +174,46 @@ export class CapletsMcpSession {
   }
 }
 
+function codeModeRunToolDescription(service: NativeCapletsService): string {
+  const declaration = generateCodeModeDeclarations({
+    caplets: listCodeModeCallableCaplets(service),
+  });
+  return generateCodeModeRunToolDescription(declaration);
+}
+
+class EngineNativeCapletsService implements NativeCapletsService {
+  constructor(private readonly engine: CapletsEngine) {}
+
+  listTools(): NativeCapletTool[] {
+    return this.engine.enabledServers().map((caplet) => {
+      const toolName = nativeCapletToolName(caplet.server);
+      return {
+        caplet: caplet.server,
+        toolName,
+        title: caplet.name,
+        description: nativeCapletToolDescription(toolName, caplet),
+        promptGuidance: nativeCapletPromptGuidance(toolName, caplet),
+      };
+    });
+  }
+
+  async execute(capletId: string, request: unknown): Promise<unknown> {
+    return await this.engine.execute(capletId, request);
+  }
+
+  async reload(): Promise<boolean> {
+    return await this.engine.reload();
+  }
+
+  onToolsChanged(listener: (tools: NativeCapletTool[]) => void): () => void {
+    return this.engine.onReload(() => listener(this.listTools()));
+  }
+
+  async close(): Promise<void> {
+    return;
+  }
+}
+
 function nextEnabledServers(config: CapletsConfig): CapletConfig[] {
   return [
     ...Object.values(config.mcpServers),
diff --git a/packages/core/src/serve/stdio.ts b/packages/core/src/serve/stdio.ts
index 81146c8..d9a99d0 100644
--- a/packages/core/src/serve/stdio.ts
+++ b/packages/core/src/serve/stdio.ts
@@ -33,8 +33,18 @@ export async function serveStdio(options: ServeStdioOptions = {}): Promise<void>
     process.once("SIGTERM", sigtermHandler);
   }
 
+  const transport = new StdioServerTransport();
+  const transportClosed = new Promise<void>((resolve) => {
+    const previousOnClose = transport.onclose;
+    transport.onclose = () => {
+      previousOnClose?.();
+      resolve();
+    };
+  });
+
   try {
-    await session.connect(new StdioServerTransport());
+    await session.connect(transport);
+    await transportClosed;
   } finally {
     if (sigintHandler) process.off("SIGINT", sigintHandler);
     if (sigtermHandler) process.off("SIGTERM", sigtermHandler);
diff --git a/packages/core/src/tool-search.ts b/packages/core/src/tool-search.ts
index 90f34ac..5c5ac23 100644
--- a/packages/core/src/tool-search.ts
+++ b/packages/core/src/tool-search.ts
@@ -7,13 +7,47 @@ export function searchToolList<T>(
   compact: (tool: Tool) => T,
 ): T[] {
   const tokens = query.toLocaleLowerCase().split(/\s+/).filter(Boolean);
+  const preferReadFirst = !hasMutatingIntent(tokens);
 
   return tools
     .filter((tool) => {
       const haystack = `${tool.name}\n${tool.description ?? ""}`.toLocaleLowerCase();
       return tokens.some((token) => haystack.includes(token));
     })
-    .sort((left, right) => left.name.localeCompare(right.name))
+    .sort((left, right) => {
+      const safety = safetyRank(left, preferReadFirst) - safetyRank(right, preferReadFirst);
+      return safety === 0 ? left.name.localeCompare(right.name) : safety;
+    })
     .slice(0, limit)
     .map(compact);
 }
+
+const MUTATING_QUERY_TOKENS = new Set([
+  "add",
+  "create",
+  "delete",
+  "destroy",
+  "edit",
+  "insert",
+  "mutate",
+  "mutation",
+  "patch",
+  "post",
+  "publish",
+  "put",
+  "remove",
+  "set",
+  "update",
+  "write",
+]);
+
+function hasMutatingIntent(tokens: string[]): boolean {
+  return tokens.some((token) => MUTATING_QUERY_TOKENS.has(token));
+}
+
+function safetyRank(tool: Tool, preferReadFirst: boolean): number {
+  if (!preferReadFirst) return 0;
+  if (tool.annotations?.readOnlyHint === true) return 0;
+  if (tool.annotations?.destructiveHint === true) return 2;
+  return 1;
+}
diff --git a/packages/core/src/tools.ts b/packages/core/src/tools.ts
index e058980..9346b85 100644
--- a/packages/core/src/tools.ts
+++ b/packages/core/src/tools.ts
@@ -1,4 +1,5 @@
 import type { CallToolResult } from "@modelcontextprotocol/sdk/types";
+import Ajv, { type ErrorObject, type ValidateFunction } from "ajv";
 import type { CapletSetManager } from "./caplet-sets";
 import type { CapletConfig } from "./config";
 import type { CliToolsManager } from "./cli-tools";
@@ -7,6 +8,13 @@ import { CapletsError } from "./errors";
 import type { GraphQLManager } from "./graphql";
 import type { HttpActionManager } from "./http-actions";
 import type { OpenApiManager } from "./openapi";
+import {
+  normalizedObservableValue,
+  observeOutputShape,
+  observedOutputShapeKey,
+  usefulOutputSchema,
+  type ObservedOutputShapeStore,
+} from "./observed-output-shapes";
 import type { ServerRegistry } from "./registry";
 import { projectStructuredContent, validateFieldSelection } from "./field-selection";
 import {
@@ -22,10 +30,26 @@ import {
 
 export { generatedToolInputSchema } from "./generated-tool-input-schema";
 
+const ajv = new Ajv({
+  allErrors: true,
+  allowUnionTypes: true,
+  strict: false,
+  validateSchema: false,
+});
+const compiledValidators = new WeakMap<object, ValidateFunction>();
+const MAX_SCHEMA_ERRORS = 8;
+
 export type GeneratedServerToolRequest = RequiredOperationRequest;
 
 type ParsedOperationRequest = RequiredOperationRequest & Record<string, unknown>;
 
+export type HandleServerToolOptions = {
+  observedOutputShapeStore?: ObservedOutputShapeStore | undefined;
+  observedOutputShapeScope?: "local" | "self_hosted" | "cloud" | undefined;
+  workspaceId?: string | undefined;
+  projectFingerprint?: string | undefined;
+};
+
 export async function handleServerTool(
   server: CapletConfig,
   request: unknown,
@@ -36,6 +60,7 @@ export async function handleServerTool(
   http?: HttpActionManager,
   cli?: CliToolsManager,
   caplets?: CapletSetManager,
+  options: HandleServerToolOptions = {},
 ): Promise<any> {
   const startedAt = Date.now();
   const parsed = validateOperationRequest(
@@ -50,7 +75,7 @@ export async function handleServerTool(
         registry.detail(server),
         metadataFor(server, "inspect", undefined, startedAt),
       );
-    case "check_backend": {
+    case "check": {
       const result = await backendFor(
         server,
         downstream,
@@ -60,50 +85,70 @@ export async function handleServerTool(
         cli,
         caplets,
       ).check(server as never);
-      return jsonResult(result, metadataFor(server, "check_backend", undefined, startedAt));
+      return jsonResult(result, metadataFor(server, "check", undefined, startedAt));
     }
-    case "list_tools": {
+    case "tools": {
       const backend = backendFor(server, downstream, openapi, graphql, http, cli, caplets);
       const tools = await backend.listTools(server as never);
-      const limit = parsed.limit ?? tools.length;
+      const page = pageItems(
+        tools.map((tool) => backend.compact(server as never, tool)),
+        parsed,
+        registry.config.options.maxSearchLimit,
+      );
       return jsonResult(
         {
           id: server.server,
           name: server.name,
-          tools: tools.slice(0, limit).map((tool) => backend.compact(server as never, tool)),
+          ...page,
         },
-        metadataFor(server, "list_tools", undefined, startedAt),
+        metadataFor(server, "tools", undefined, startedAt),
       );
     }
     case "search_tools": {
       const backend = backendFor(server, downstream, openapi, graphql, http, cli, caplets);
       const tools = await backend.listTools(server as never);
       const limit = parsed.limit ?? registry.config.options.defaultSearchLimit;
+      const matches = backend.search(server as never, tools, parsed.query, limit);
+      const page = pageItems(matches, parsed, registry.config.options.maxSearchLimit);
       return jsonResult(
         {
           id: server.server,
           name: server.name,
           query: parsed.query,
-          tools: backend.search(server as never, tools, parsed.query, limit),
+          ...page,
         },
         metadataFor(server, "search_tools", undefined, startedAt),
       );
     }
-    case "get_tool": {
+    case "describe_tool": {
       const backend = backendFor(server, downstream, openapi, graphql, http, cli, caplets);
-      const tool = await backend.getTool(server as never, parsed.tool);
+      const tool = await backend.getTool(server as never, parsed.name);
+      const observedOutputShape = await readObservedOutputShape(
+        options,
+        server,
+        parsed.name,
+        tool.outputSchema,
+      );
       return jsonResult(
-        { id: server.server, tool },
-        metadataFor(server, "get_tool", parsed.tool, startedAt),
+        {
+          id: server.server,
+          tool,
+          ...(observedOutputShape ? { observedOutputShape } : {}),
+          fieldSelection: fieldSelectionFor(server, tool),
+        },
+        metadataFor(server, "describe_tool", parsed.name, startedAt),
       );
     }
     case "call_tool": {
       const backend = backendFor(server, downstream, openapi, graphql, http, cli, caplets);
+      const tool = await maybeGetToolForValidation(backend, server, parsed.name);
+      validateToolArgsForAgent(tool, parsed.name, parsed.args);
       if (parsed.fields === undefined) {
-        const result = await backend.callTool(server as never, parsed.tool, parsed.arguments);
+        const result = await backend.callTool(server as never, parsed.name, parsed.args);
+        await writeObservedOutputShape(options, server, parsed.name, result);
         return annotateCallToolResult(
           result,
-          metadataFor(server, "call_tool", parsed.tool, startedAt),
+          metadataFor(server, "call_tool", parsed.name, startedAt),
         );
       }
       if (server.backend === "graphql") {
@@ -113,44 +158,58 @@ export async function handleServerTool(
         );
       }
 
-      const tool = await backend.getTool(server as never, parsed.tool);
-      if (!tool.outputSchema) {
-        throw new CapletsError("REQUEST_INVALID", "Field selection requires an output schema");
+      const fieldSelectionTool = tool ?? (await backend.getTool(server as never, parsed.name));
+      if (!fieldSelectionTool.outputSchema) {
+        throw new CapletsError(
+          "REQUEST_INVALID",
+          "Field selection requires an output schema. Retry without fields, or call describe_tool first and only use fields when fieldSelection.supported is true.",
+        );
       }
-      validateFieldSelection(tool.outputSchema, parsed.fields);
+      validateFieldSelection(fieldSelectionTool.outputSchema, parsed.fields);
 
-      const metadata = metadataFor(server, "call_tool", parsed.tool, startedAt);
+      const metadata = metadataFor(server, "call_tool", parsed.name, startedAt);
+      const rawResult = await backend.callTool(server as never, parsed.name, parsed.args);
+      await writeObservedOutputShape(options, server, parsed.name, rawResult);
       const result = projectCallToolResult(
-        await backend.callTool(server as never, parsed.tool, parsed.arguments),
-        tool.outputSchema,
+        rawResult,
+        fieldSelectionTool.outputSchema,
         parsed.fields,
         markdownContextFor(metadata),
       );
       return annotateCallToolResult(result, metadata);
     }
-    case "list_resources": {
-      const backend = mcpBackendFor(server, downstream);
+    case "resources": {
+      const backend = mcpBackendFor(server, downstream, "page");
+      if (!backend) {
+        return jsonResult(
+          { id: server.server, name: server.name, items: [] },
+          metadataFor(server, "resources", undefined, startedAt),
+        );
+      }
       const resources = await backend.listResources(server as never);
-      const templates = await backend.listResourceTemplates(server as never);
-      const limit = parsed.limit ?? resources.length + templates.length;
+      const page = pageItems(
+        resources.map((resource) => backend.compactResource(server as never, resource)),
+        parsed,
+        registry.config.options.maxSearchLimit,
+      );
       return jsonResult(
         {
           id: server.server,
           name: server.name,
-          resources: resources
-            .slice(0, limit)
-            .map((resource) => backend.compactResource(server as never, resource)),
-          resourceTemplates: templates
-            .slice(0, Math.max(0, limit - resources.length))
-            .map((template) => backend.compactResourceTemplate(server as never, template)),
+          ...page,
         },
-        metadataFor(server, "list_resources", undefined, startedAt),
+        metadataFor(server, "resources", undefined, startedAt),
       );
     }
     case "search_resources": {
-      const backend = mcpBackendFor(server, downstream);
+      const backend = mcpBackendFor(server, downstream, "page");
+      if (!backend) {
+        return jsonResult(
+          { id: server.server, name: server.name, query: parsed.query, items: [] },
+          metadataFor(server, "search_resources", undefined, startedAt),
+        );
+      }
       const resources = await backend.listResources(server as never);
-      const templates = await backend.listResourceTemplates(server as never);
       const limit = parsed.limit ?? registry.config.options.defaultSearchLimit;
       const resourceMatches = backend.searchResources(
         server as never,
@@ -158,39 +217,42 @@ export async function handleServerTool(
         parsed.query,
         limit,
       );
-      const templateMatches = backend.searchResourceTemplates(
-        server as never,
-        templates,
-        parsed.query,
-        Math.max(0, limit - resourceMatches.length),
-      );
+      const page = pageItems(resourceMatches, parsed, registry.config.options.maxSearchLimit);
       return jsonResult(
         {
           id: server.server,
           name: server.name,
           query: parsed.query,
-          matches: [...resourceMatches, ...templateMatches],
+          ...page,
         },
         metadataFor(server, "search_resources", undefined, startedAt),
       );
     }
-    case "list_resource_templates": {
-      const backend = mcpBackendFor(server, downstream);
+    case "resource_templates": {
+      const backend = mcpBackendFor(server, downstream, "page");
+      if (!backend) {
+        return jsonResult(
+          { id: server.server, name: server.name, items: [] },
+          metadataFor(server, "resource_templates", undefined, startedAt),
+        );
+      }
       const templates = await backend.listResourceTemplates(server as never);
-      const limit = parsed.limit ?? templates.length;
+      const page = pageItems(
+        templates.map((template) => backend.compactResourceTemplate(server as never, template)),
+        parsed,
+        registry.config.options.maxSearchLimit,
+      );
       return jsonResult(
         {
           id: server.server,
           name: server.name,
-          resourceTemplates: templates
-            .slice(0, limit)
-            .map((template) => backend.compactResourceTemplate(server as never, template)),
+          ...page,
         },
-        metadataFor(server, "list_resource_templates", undefined, startedAt),
+        metadataFor(server, "resource_templates", undefined, startedAt),
       );
     }
     case "read_resource": {
-      const result = await mcpBackendFor(server, downstream).readResource(
+      const result = await mcpBackendFor(server, downstream, "direct")!.readResource(
         server as never,
         parsed.uri,
       );
@@ -199,48 +261,64 @@ export async function handleServerTool(
         metadataFor(server, "read_resource", { uri: parsed.uri }, startedAt),
       );
     }
-    case "list_prompts": {
-      const backend = mcpBackendFor(server, downstream);
+    case "prompts": {
+      const backend = mcpBackendFor(server, downstream, "page");
+      if (!backend) {
+        return jsonResult(
+          { id: server.server, name: server.name, items: [] },
+          metadataFor(server, "prompts", undefined, startedAt),
+        );
+      }
       const prompts = await backend.listPrompts(server as never);
-      const limit = parsed.limit ?? prompts.length;
+      const page = pageItems(
+        prompts.map((prompt) => backend.compactPrompt(server as never, prompt)),
+        parsed,
+        registry.config.options.maxSearchLimit,
+      );
       return jsonResult(
         {
           id: server.server,
           name: server.name,
-          prompts: prompts
-            .slice(0, limit)
-            .map((prompt) => backend.compactPrompt(server as never, prompt)),
+          ...page,
         },
-        metadataFor(server, "list_prompts", undefined, startedAt),
+        metadataFor(server, "prompts", undefined, startedAt),
       );
     }
     case "search_prompts": {
-      const backend = mcpBackendFor(server, downstream);
+      const backend = mcpBackendFor(server, downstream, "page");
+      if (!backend) {
+        return jsonResult(
+          { id: server.server, name: server.name, query: parsed.query, items: [] },
+          metadataFor(server, "search_prompts", undefined, startedAt),
+        );
+      }
       const prompts = await backend.listPrompts(server as never);
       const limit = parsed.limit ?? registry.config.options.defaultSearchLimit;
+      const matches = backend.searchPrompts(server as never, prompts, parsed.query, limit);
+      const page = pageItems(matches, parsed, registry.config.options.maxSearchLimit);
       return jsonResult(
         {
           id: server.server,
           name: server.name,
           query: parsed.query,
-          prompts: backend.searchPrompts(server as never, prompts, parsed.query, limit),
+          ...page,
         },
         metadataFor(server, "search_prompts", undefined, startedAt),
       );
     }
     case "get_prompt": {
-      const result = await mcpBackendFor(server, downstream).getPrompt(
+      const result = await mcpBackendFor(server, downstream, "direct")!.getPrompt(
         server as never,
-        parsed.prompt,
-        parsed.arguments,
+        parsed.name,
+        parsed.args,
       );
       return annotateMcpResult(
         result,
-        metadataFor(server, "get_prompt", { prompt: parsed.prompt }, startedAt),
+        metadataFor(server, "get_prompt", { prompt: parsed.name }, startedAt),
       );
     }
     case "complete": {
-      const result = await mcpBackendFor(server, downstream).complete(server as never, {
+      const result = await mcpBackendFor(server, downstream, "direct")!.complete(server as never, {
         ref: parsed.ref,
         argument: parsed.argument,
       });
@@ -249,9 +327,418 @@ export async function handleServerTool(
   }
 }
 
+function fieldSelectionFor(
+  server: CapletConfig,
+  tool: { outputSchema?: unknown },
+): { supported: boolean; reason?: string } {
+  if (server.backend === "graphql") {
+    return { supported: false, reason: "graphql_document_selection" };
+  }
+  if (!tool.outputSchema) {
+    return { supported: false, reason: "output_schema_unavailable" };
+  }
+  return { supported: true };
+}
+
+async function maybeGetToolForValidation(
+  backend: unknown,
+  server: CapletConfig,
+  toolName: string,
+): Promise<{ inputSchema?: unknown; outputSchema?: unknown } | undefined> {
+  if (!hasGetTool(backend)) return undefined;
+  try {
+    return await backend.getTool(server as never, toolName);
+  } catch {
+    return undefined;
+  }
+}
+
+function validateToolArgsForAgent(
+  tool: { inputSchema?: unknown; outputSchema?: unknown } | undefined,
+  toolName: string,
+  args: Record<string, unknown>,
+): void {
+  const schema = isPlainObject(tool?.inputSchema) ? tool.inputSchema : undefined;
+  if (!schema) return;
+  const properties = isPlainObject(schema.properties) ? schema.properties : {};
+  const acceptedArgs = Object.keys(properties).sort();
+  const requiredArgs = Array.isArray(schema.required)
+    ? schema.required.filter((value): value is string => typeof value === "string").sort()
+    : [];
+  const validator = validatorFor(schema);
+  const valid = validator ? validator(args) : manualValidateObjectArgs(schema, args);
+  if (valid) return;
+
+  const errors = validator?.errors ?? manualValidationErrors(schema, args);
+  const schemaErrors = compactSchemaErrors(errors);
+  const missing = missingArgsFromErrors(schemaErrors, requiredArgs, args);
+  const unexpectedArgs = Object.keys(args)
+    .filter((key) => acceptedArgs.length > 0 && !acceptedArgs.includes(key))
+    .sort();
+  const unexpected = unexpectedArgsFromErrors(schemaErrors);
+
+  const inputTypeName = `${toolTypeBaseName(toolName)}Input`;
+  const outputTypeName = `${toolTypeBaseName(toolName)}Output`;
+  const requiredTemplate = minimalArgsTemplate(schema, requiredArgs);
+  const parts = [
+    missing.length > 0 ? `missing required argument(s): ${missing.join(", ")}` : undefined,
+    unexpected.length > 0 ? `unexpected argument(s): ${unexpected.join(", ")}` : undefined,
+    ...schemaErrors
+      .filter((error) => error.rule !== "required" && error.rule !== "additionalProperties")
+      .slice(0, 3)
+      .map(formatSchemaError),
+  ].filter((value): value is string => value !== undefined);
+  const reason = parts.length > 0 ? parts.join("; ") : "schema validation failed";
+  throw new CapletsError(
+    "REQUEST_INVALID",
+    `call_tool args for ${toolName} are invalid: ${reason}. Use describe_tool for the schema and retry with exact argument names.`,
+    {
+      tool: toolName,
+      requiredArgs,
+      acceptedArgs,
+      ...(unexpectedArgs.length > 0 ? { unexpectedArgs } : {}),
+      ...(Object.keys(requiredTemplate).length > 0
+        ? { minimalArgsTemplate: requiredTemplate }
+        : {}),
+      ...(schemaErrors.length > 0 ? { schemaErrors } : {}),
+      callSignature: `callTool(name: ${JSON.stringify(toolName)}, args: ${inputTypeName}): Promise<CapletsResult<${outputTypeName}>>`,
+      inputTypeScript: schemaToTypeScript(schema, inputTypeName),
+      retry:
+        "Call describe_tool for this tool, then call_tool with args matching inputSchema/inputTypeScript exactly.",
+    },
+  );
+}
+
+function validatorFor(schema: Record<string, unknown>): ValidateFunction | undefined {
+  const existing = compiledValidators.get(schema);
+  if (existing) return existing;
+  try {
+    const validator = ajv.compile(schema);
+    compiledValidators.set(schema, validator);
+    return validator;
+  } catch {
+    return undefined;
+  }
+}
+
+function manualValidateObjectArgs(
+  schema: Record<string, unknown>,
+  args: Record<string, unknown>,
+): boolean {
+  return manualValidationErrors(schema, args).length === 0;
+}
+
+function manualValidationErrors(
+  schema: Record<string, unknown>,
+  args: Record<string, unknown>,
+): ErrorObject[] {
+  const properties = isPlainObject(schema.properties) ? schema.properties : {};
+  const acceptedArgs = Object.keys(properties).sort();
+  const requiredArgs = Array.isArray(schema.required)
+    ? schema.required.filter((value): value is string => typeof value === "string").sort()
+    : [];
+  const errors: ErrorObject[] = [];
+  for (const key of requiredArgs) {
+    if (args[key] === undefined) {
+      errors.push({
+        instancePath: "",
+        schemaPath: "#/required",
+        keyword: "required",
+        params: { missingProperty: key },
+      });
+    }
+  }
+  if (schema.additionalProperties === false && acceptedArgs.length > 0) {
+    for (const key of Object.keys(args).sort()) {
+      if (!acceptedArgs.includes(key)) {
+        errors.push({
+          instancePath: "",
+          schemaPath: "#/additionalProperties",
+          keyword: "additionalProperties",
+          params: { additionalProperty: key },
+        });
+      }
+    }
+  }
+  return errors;
+}
+
+type CompactSchemaError = {
+  path: string;
+  rule: string;
+  expected?: string;
+  allowed?: unknown[];
+  missing?: string;
+  unexpected?: string;
+  message?: string;
+};
+
+function compactSchemaErrors(errors: ErrorObject[] | null | undefined): CompactSchemaError[] {
+  if (!errors) return [];
+  return errors.slice(0, MAX_SCHEMA_ERRORS).map((error) => {
+    const path = error.instancePath || "/";
+    if (error.keyword === "required") {
+      const missing = stringParam(error, "missingProperty");
+      return {
+        path: appendJsonPointer(path, missing),
+        rule: "required",
+        ...(missing === undefined ? {} : { missing }),
+      };
+    }
+    if (error.keyword === "additionalProperties") {
+      const unexpected = stringParam(error, "additionalProperty");
+      return {
+        path: appendJsonPointer(path, unexpected),
+        rule: "additionalProperties",
+        ...(unexpected === undefined ? {} : { unexpected }),
+      };
+    }
+    if (error.keyword === "type") {
+      const expected = stringParam(error, "type");
+      return {
+        path,
+        rule: "type",
+        ...(expected === undefined ? {} : { expected }),
+      };
+    }
+    if (error.keyword === "enum") {
+      return {
+        path,
+        rule: "enum",
+        ...(Array.isArray(error.params.allowedValues)
+          ? { allowed: error.params.allowedValues as unknown[] }
+          : {}),
+      };
+    }
+    if (error.keyword === "const") {
+      return {
+        path,
+        rule: "const",
+        allowed: [error.params.allowedValue],
+      };
+    }
+    return {
+      path,
+      rule: error.keyword,
+      ...(error.message ? { message: error.message } : {}),
+    };
+  });
+}
+
+function stringParam(error: ErrorObject, key: string): string | undefined {
+  const value = (error.params as Record<string, unknown>)[key];
+  return typeof value === "string" ? value : undefined;
+}
+
+function appendJsonPointer(path: string, key: string | undefined): string {
+  if (!key) return path;
+  const escaped = key.replace(/~/gu, "~0").replace(/\//gu, "~1");
+  return path === "/" ? `/${escaped}` : `${path}/${escaped}`;
+}
+
+function missingArgsFromErrors(
+  errors: CompactSchemaError[],
+  requiredArgs: string[],
+  args: Record<string, unknown>,
+): string[] {
+  const missing = errors
+    .filter((error) => error.rule === "required" && error.path.split("/").length === 2)
+    .map((error) => error.missing)
+    .filter((value): value is string => typeof value === "string");
+  if (missing.length > 0) return [...new Set(missing)].sort();
+  return requiredArgs.filter((key) => args[key] === undefined);
+}
+
+function unexpectedArgsFromErrors(errors: CompactSchemaError[]): string[] {
+  return errors
+    .filter((error) => error.rule === "additionalProperties" && error.unexpected)
+    .map((error) => error.unexpected!)
+    .sort();
+}
+
+function formatSchemaError(error: CompactSchemaError): string {
+  if (error.rule === "type" && error.expected) {
+    return `${error.path} must be ${error.expected}`;
+  }
+  if (error.rule === "enum" && error.allowed) {
+    return `${error.path} must be one of ${error.allowed.map((value) => JSON.stringify(value)).join(", ")}`;
+  }
+  if (error.rule === "const" && error.allowed) {
+    return `${error.path} must be ${JSON.stringify(error.allowed[0])}`;
+  }
+  return error.message ? `${error.path} ${error.message}` : `${error.path} failed ${error.rule}`;
+}
+
+function minimalArgsTemplate(
+  schema: Record<string, unknown>,
+  requiredArgs: string[],
+): Record<string, unknown> {
+  const properties = isPlainObject(schema.properties) ? schema.properties : {};
+  const template: Record<string, unknown> = {};
+  for (const key of requiredArgs) {
+    template[key] = placeholderValueForSchema(properties[key], 0);
+  }
+  return template;
+}
+
+function placeholderValueForSchema(schema: unknown, depth: number): unknown {
+  if (depth > 2 || !isPlainObject(schema)) return null;
+  if ("const" in schema) return schema.const;
+  if (Array.isArray(schema.enum) && schema.enum.length > 0) return schema.enum[0];
+  const type = Array.isArray(schema.type)
+    ? (schema.type.find((value) => value !== "null") ?? schema.type[0])
+    : schema.type;
+  if (type === "string") return "";
+  if (type === "integer" || type === "number") return 0;
+  if (type === "boolean") return false;
+  if (type === "array") return [];
+  if (type === "object" || isPlainObject(schema.properties)) {
+    const required = Array.isArray(schema.required)
+      ? schema.required.filter((value): value is string => typeof value === "string").sort()
+      : [];
+    const properties = isPlainObject(schema.properties) ? schema.properties : {};
+    const value: Record<string, unknown> = {};
+    for (const key of required) {
+      value[key] = placeholderValueForSchema(properties[key], depth + 1);
+    }
+    return value;
+  }
+  return null;
+}
+
+function hasGetTool(backend: unknown): backend is {
+  getTool(server: never, name: string): Promise<{ inputSchema?: unknown; outputSchema?: unknown }>;
+} {
+  return Boolean(
+    backend &&
+    typeof backend === "object" &&
+    "getTool" in backend &&
+    typeof (backend as { getTool?: unknown }).getTool === "function",
+  );
+}
+
+function schemaToTypeScript(schema: unknown, fallbackName: string): string {
+  return `type ${fallbackName} = ${schemaType(schema)};`;
+}
+
+function schemaType(schema: unknown): string {
+  if (!isPlainObject(schema)) return "unknown";
+  if ("const" in schema) return JSON.stringify(schema.const);
+  if (Array.isArray(schema.enum)) {
+    return schema.enum.map((value) => JSON.stringify(value)).join(" | ") || "unknown";
+  }
+  const type = schema.type;
+  if (Array.isArray(type)) {
+    const variants = type.map((item) => schemaType({ ...schema, type: item }));
+    return [...new Set(variants)].join(" | ") || "unknown";
+  }
+  if (type === "string") return "string";
+  if (type === "number" || type === "integer") return "number";
+  if (type === "boolean") return "boolean";
+  if (type === "null") return "null";
+  if (type === "array") return `${schemaType(schema.items)}[]`;
+  if (type === "object" || isPlainObject(schema.properties)) return objectSchemaType(schema);
+  if (Array.isArray(schema.oneOf)) return unionSchemaType(schema.oneOf);
+  if (Array.isArray(schema.anyOf)) return unionSchemaType(schema.anyOf);
+  if (Array.isArray(schema.allOf)) {
+    return schema.allOf.map(schemaType).join(" & ") || "Record<string, unknown>";
+  }
+  return "unknown";
+}
+
+function objectSchemaType(schema: Record<string, unknown>): string {
+  const properties = isPlainObject(schema.properties) ? schema.properties : {};
+  const required = new Set(
+    Array.isArray(schema.required)
+      ? schema.required.filter((value): value is string => typeof value === "string")
+      : [],
+  );
+  const fields = Object.entries(properties)
+    .sort(([left], [right]) => left.localeCompare(right))
+    .map(([key, value]) => {
+      const optional = required.has(key) ? "" : "?";
+      return `${propertySignature(key)}${optional}: ${schemaType(value)};`;
+    });
+  if (fields.length === 0) {
+    return schema.additionalProperties === false ? "{}" : "Record<string, unknown>";
+  }
+  if (schema.additionalProperties && isPlainObject(schema.additionalProperties)) {
+    fields.push(`[key: string]: ${schemaType(schema.additionalProperties)};`);
+  }
+  return `{ ${fields.join(" ")} }`;
+}
+
+function unionSchemaType(schemas: unknown[]): string {
+  return schemas.map(schemaType).join(" | ") || "unknown";
+}
+
+function propertySignature(key: string): string {
+  return /^[A-Za-z_$][\w$]*$/u.test(key) ? key : JSON.stringify(key);
+}
+
+function toolTypeBaseName(toolName: string): string {
+  const base = toolName
+    .split(/[^a-zA-Z0-9]+/u)
+    .filter(Boolean)
+    .map((part) => `${part.charAt(0).toUpperCase()}${part.slice(1)}`)
+    .join("");
+  return base || "Tool";
+}
+
+async function readObservedOutputShape(
+  options: HandleServerToolOptions,
+  server: CapletConfig,
+  toolName: string,
+  outputSchema: unknown,
+) {
+  if (!options.observedOutputShapeStore || usefulOutputSchema(outputSchema)) return undefined;
+  try {
+    return await options.observedOutputShapeStore.read(
+      observedOutputShapeKey({
+        scope: options.observedOutputShapeScope ?? "local",
+        workspaceId: options.workspaceId,
+        projectFingerprint: options.projectFingerprint,
+        caplet: server,
+        toolName,
+      }),
+    );
+  } catch {
+    return undefined;
+  }
+}
+
+async function writeObservedOutputShape(
+  options: HandleServerToolOptions,
+  server: CapletConfig,
+  toolName: string,
+  result: unknown,
+): Promise<void> {
+  if (!options.observedOutputShapeStore || resultIsError(result)) return;
+  const value = normalizedObservableValue(result);
+  if (value === undefined) return;
+  const key = observedOutputShapeKey({
+    scope: options.observedOutputShapeScope ?? "local",
+    workspaceId: options.workspaceId,
+    projectFingerprint: options.projectFingerprint,
+    caplet: server,
+    toolName,
+  });
+  try {
+    const existing = await options.observedOutputShapeStore.read(key);
+    const observed = observeOutputShape({ value, existing });
+    if (observed) await options.observedOutputShapeStore.write(key, observed);
+  } catch {
+    return;
+  }
+}
+
+function resultIsError(result: unknown): boolean {
+  return Boolean(result && typeof result === "object" && (result as { isError?: unknown }).isError);
+}
+
 export function validateOperationRequest(
   request: unknown,
-  maxSearchLimit: number,
+  _maxSearchLimit: number,
   backend: string = "tool",
 ): RequiredOperationRequest {
   const result = generatedToolInputSchemaForCaplet({ backend }).safeParse(request);
@@ -304,91 +791,62 @@ export function validateOperationRequest(
 
   switch (value.operation) {
     case "inspect":
-    case "check_backend":
+    case "check":
       allowed([]);
       return { operation: value.operation };
-    case "list_tools":
-      allowed(["limit"]);
-      if (value.limit !== undefined && value.limit > maxSearchLimit) {
-        throw new CapletsError("REQUEST_INVALID", `list_tools limit must be <= ${maxSearchLimit}`);
-      }
-      return value.limit === undefined
-        ? { operation: "list_tools" }
-        : { operation: "list_tools", limit: value.limit };
+    case "tools":
+      allowed(["limit", "cursor"]);
+      return normalizePageRequest(value);
     case "search_tools":
-      allowed(["query", "limit"]);
+      allowed(["query", "limit", "cursor"]);
       if (!value.query) {
         throw new CapletsError("REQUEST_INVALID", "search_tools requires query");
       }
-      if (value.limit !== undefined && value.limit > maxSearchLimit) {
-        throw new CapletsError(
-          "REQUEST_INVALID",
-          `search_tools limit must be <= ${maxSearchLimit}`,
-        );
-      }
-      return value.limit === undefined
-        ? { operation: "search_tools", query: value.query }
-        : { operation: "search_tools", query: value.query, limit: value.limit };
-    case "get_tool":
-      allowed(["tool"]);
-      if (!value.tool) {
-        throw new CapletsError("REQUEST_INVALID", "get_tool requires tool");
+      return normalizePageRequest(value) as RequiredOperationRequest;
+    case "describe_tool":
+      allowed(["name"]);
+      if (!value.name) {
+        throw new CapletsError("REQUEST_INVALID", "describe_tool requires name");
       }
-      return { operation: "get_tool", tool: value.tool };
+      return { operation: "describe_tool", name: value.name };
     case "call_tool":
-      allowed(["tool", "arguments", "fields"]);
-      if (!value.tool) {
-        throw new CapletsError("REQUEST_INVALID", "call_tool requires tool");
+      allowed(["name", "args", "fields"]);
+      if (!value.name) {
+        throw new CapletsError("REQUEST_INVALID", "call_tool requires name");
       }
-      if (!isPlainObject(value.arguments)) {
-        throw new CapletsError("REQUEST_INVALID", "call_tool.arguments must be a JSON object");
+      if (!isPlainObject(value.args)) {
+        throw new CapletsError("REQUEST_INVALID", "call_tool.args must be a JSON object");
       }
       return value.fields === undefined
-        ? { operation: "call_tool", tool: value.tool, arguments: value.arguments }
+        ? { operation: "call_tool", name: value.name, args: value.args }
         : {
             operation: "call_tool",
-            tool: value.tool,
-            arguments: value.arguments,
+            name: value.name,
+            args: value.args,
             fields: value.fields,
           };
-    case "list_resources":
-    case "list_resource_templates":
-    case "list_prompts":
-      allowed(["limit"]);
-      if (value.limit !== undefined && value.limit > maxSearchLimit) {
-        throw new CapletsError(
-          "REQUEST_INVALID",
-          `${value.operation} limit must be <= ${maxSearchLimit}`,
-        );
-      }
-      return value.limit === undefined
-        ? { operation: value.operation }
-        : { operation: value.operation, limit: value.limit };
+    case "resources":
+    case "resource_templates":
+    case "prompts":
+      allowed(["limit", "cursor"]);
+      return normalizePageRequest(value);
     case "search_resources":
     case "search_prompts":
-      allowed(["query", "limit"]);
+      allowed(["query", "limit", "cursor"]);
       if (!value.query)
         throw new CapletsError("REQUEST_INVALID", `${value.operation} requires query`);
-      if (value.limit !== undefined && value.limit > maxSearchLimit) {
-        throw new CapletsError(
-          "REQUEST_INVALID",
-          `${value.operation} limit must be <= ${maxSearchLimit}`,
-        );
-      }
-      return value.limit === undefined
-        ? { operation: value.operation, query: value.query }
-        : { operation: value.operation, query: value.query, limit: value.limit };
+      return normalizePageRequest(value) as RequiredOperationRequest;
     case "read_resource":
       allowed(["uri"]);
       if (!value.uri) throw new CapletsError("REQUEST_INVALID", "read_resource requires uri");
       return { operation: "read_resource", uri: value.uri };
     case "get_prompt":
-      allowed(["prompt", "arguments"]);
-      if (!value.prompt) throw new CapletsError("REQUEST_INVALID", "get_prompt requires prompt");
-      if (value.arguments !== undefined && !isPlainObject(value.arguments)) {
-        throw new CapletsError("REQUEST_INVALID", "get_prompt.arguments must be a JSON object");
+      allowed(["name", "args"]);
+      if (!value.name) throw new CapletsError("REQUEST_INVALID", "get_prompt requires name");
+      if (value.args !== undefined && !isPlainObject(value.args)) {
+        throw new CapletsError("REQUEST_INVALID", "get_prompt.args must be a JSON object");
       }
-      return { operation: "get_prompt", prompt: value.prompt, arguments: value.arguments ?? {} };
+      return { operation: "get_prompt", name: value.name, args: value.args ?? {} };
     case "complete":
       allowed(["ref", "argument"]);
       if (!value.ref) throw new CapletsError("REQUEST_INVALID", "complete requires ref");
@@ -398,8 +856,37 @@ export function validateOperationRequest(
   throw new CapletsError("INTERNAL_ERROR", "Unhandled operation");
 }
 
-function mcpBackendFor(server: CapletConfig, downstream: DownstreamManager): DownstreamManager {
+function normalizePageRequest<T extends ParsedOperationRequest>(value: T): T {
+  return {
+    ...value,
+    ...(value.limit === undefined ? {} : { limit: value.limit }),
+    ...(typeof value.cursor === "string" ? { cursor: value.cursor } : {}),
+  };
+}
+
+function pageItems<T>(
+  items: T[],
+  input: { limit?: number; cursor?: string },
+  maxLimit: number,
+): { items: T[]; nextCursor?: string; truncated?: boolean } {
+  const cursor = input.cursor === undefined ? 0 : Number.parseInt(input.cursor, 10);
+  const start = Number.isFinite(cursor) && cursor > 0 ? cursor : 0;
+  const requestedLimit = input.limit ?? maxLimit;
+  const limit = Math.max(1, Math.min(requestedLimit, maxLimit));
+  const page = items.slice(start, start + limit);
+  const nextIndex = start + page.length;
+  return nextIndex < items.length
+    ? { items: page, nextCursor: String(nextIndex), truncated: true }
+    : { items: page };
+}
+
+function mcpBackendFor(
+  server: CapletConfig,
+  downstream: DownstreamManager,
+  mode: "page" | "direct",
+): DownstreamManager | undefined {
   if (server.backend !== "mcp") {
+    if (mode === "page") return undefined;
     throw new CapletsError(
       "UNSUPPORTED_OPERATION",
       "MCP resource, prompt, and completion operations require an MCP-backed Caplet",
@@ -409,15 +896,20 @@ function mcpBackendFor(server: CapletConfig, downstream: DownstreamManager): Dow
 }
 
 type RequiredOperationRequest =
-  | { operation: "inspect" | "check_backend" }
-  | { operation: "list_tools"; limit?: number }
-  | { operation: "search_tools"; query: string; limit?: number }
-  | { operation: "get_tool"; tool: string }
-  | { operation: "call_tool"; tool: string; arguments: Record<string, unknown>; fields?: string[] }
-  | { operation: "list_resources" | "list_resource_templates" | "list_prompts"; limit?: number }
-  | { operation: "search_resources" | "search_prompts"; query: string; limit?: number }
+  | { operation: "inspect" | "check" }
+  | { operation: "tools"; limit?: number; cursor?: string }
+  | { operation: "search_tools"; query: string; limit?: number; cursor?: string }
+  | { operation: "describe_tool"; name: string }
+  | { operation: "call_tool"; name: string; args: Record<string, unknown>; fields?: string[] }
+  | { operation: "resources" | "resource_templates" | "prompts"; limit?: number; cursor?: string }
+  | {
+      operation: "search_resources" | "search_prompts";
+      query: string;
+      limit?: number;
+      cursor?: string;
+    }
   | { operation: "read_resource"; uri: string }
-  | { operation: "get_prompt"; prompt: string; arguments: Record<string, unknown> }
+  | { operation: "get_prompt"; name: string; args: Record<string, unknown> }
   | {
       operation: "complete";
       ref: { type: "prompt"; name: string } | { type: "resourceTemplate"; uri: string };
diff --git a/packages/core/test/caplet-sets.test.ts b/packages/core/test/caplet-sets.test.ts
index c66f99a..d47e210 100644
--- a/packages/core/test/caplet-sets.test.ts
+++ b/packages/core/test/caplet-sets.test.ts
@@ -39,7 +39,7 @@ describe("CapletSetManager", () => {
     });
     const tools = await manager.listTools(caplet);
     expect(tools.map((tool) => tool.name)).toEqual(["echoes"]);
-    expect(manager.search(caplet, tools, "echo", 5)).toMatchObject([{ tool: "echoes" }]);
+    expect(manager.search(caplet, tools, "echo", 5)).toMatchObject([{ name: "echoes" }]);
     await expect(manager.getTool(caplet, "echoes")).resolves.toMatchObject({
       name: "echoes",
       inputSchema: expect.objectContaining({
@@ -47,18 +47,18 @@ describe("CapletSetManager", () => {
       }),
     });
 
-    const listed = await manager.callTool(caplet, "echoes", { operation: "list_tools" });
+    const listed = await manager.callTool(caplet, "echoes", { operation: "tools" });
     expect(listed.structuredContent).toMatchObject({
       result: {
         id: "echoes",
-        tools: [{ tool: "echo_json" }],
+        items: [{ name: "echo_json" }],
       },
     });
 
     const called = await manager.callTool(caplet, "echoes", {
       operation: "call_tool",
-      tool: "echo_json",
-      arguments: { message: "hello" },
+      name: "echo_json",
+      args: { message: "hello" },
     });
     expect(called.isError).toBe(false);
     expect(called.structuredContent).toMatchObject({
@@ -272,7 +272,7 @@ describe("CapletSetManager", () => {
     const caplet = config.capletSets.nested!;
     const manager = new CapletSetManager(new ServerRegistry(config));
 
-    const result = await manager.callTool(caplet, "self", { operation: "check_backend" });
+    const result = await manager.callTool(caplet, "self", { operation: "check" });
 
     expect(result.structuredContent).toMatchObject({
       result: {
diff --git a/packages/core/test/cli-remote.test.ts b/packages/core/test/cli-remote.test.ts
index aa8f54c..91ea659 100644
--- a/packages/core/test/cli-remote.test.ts
+++ b/packages/core/test/cli-remote.test.ts
@@ -396,8 +396,8 @@ describe("remote CLI routing", () => {
             caplet: "github",
             request: {
               operation: "call_tool",
-              tool: "search",
-              arguments: { query: "caplets" },
+              name: "search",
+              args: { query: "caplets" },
             },
           },
         }),
@@ -462,7 +462,7 @@ describe("remote CLI routing", () => {
         command: "call_tool",
         arguments: {
           caplet: "shared",
-          request: { operation: "call_tool", tool: "echo", arguments: {} },
+          request: { operation: "call_tool", name: "echo", args: {} },
         },
       },
     ]);
@@ -492,7 +492,7 @@ describe("remote CLI routing", () => {
         command: "call_tool",
         arguments: {
           caplet: "remote",
-          request: { operation: "call_tool", tool: "echo", arguments: {} },
+          request: { operation: "call_tool", name: "echo", args: {} },
         },
       },
     ]);
@@ -524,7 +524,7 @@ describe("remote CLI routing", () => {
         command: "call_tool",
         arguments: {
           caplet: "remote",
-          request: { operation: "call_tool", tool: "echo", arguments: {} },
+          request: { operation: "call_tool", name: "echo", args: {} },
         },
       },
     ]);
@@ -538,7 +538,7 @@ describe("remote CLI routing", () => {
     const fetch = vi.fn(async (url: Parameters<typeof globalThis.fetch>[0], init?: RequestInit) => {
       const body = JSON.parse(String(init?.body ?? "{}")) as { command: string };
       requests.push({ url: String(url), body: init?.body });
-      if (body.command === "list_resources") {
+      if (body.command === "resources") {
         return Response.json({
           ok: true,
           result: {
@@ -598,7 +598,7 @@ describe("remote CLI routing", () => {
     expect(JSON.parse(out[2] ?? "{}")).toEqual({ completion: { values: ["src/index.ts"] } });
     expect(
       requests.map((request) => JSON.parse(String((request as { body: string }).body)).command),
-    ).toEqual(["list_resources", "read_resource", "complete"]);
+    ).toEqual(["resources", "read_resource", "complete"]);
   });
 
   it("keeps config path local-only in remote mode", async () => {
diff --git a/packages/core/test/cli-tools.test.ts b/packages/core/test/cli-tools.test.ts
index 2f18cd3..ade9e08 100644
--- a/packages/core/test/cli-tools.test.ts
+++ b/packages/core/test/cli-tools.test.ts
@@ -30,7 +30,9 @@ describe("CliToolsManager", () => {
     });
     const tools = await manager.listTools(caplet);
     expect(tools.map((tool) => tool.name)).toEqual(["echo_json", "fail", "fail_json"]);
-    expect(manager.search(caplet, tools, "echo", 5)).toMatchObject([{ tool: "echo_json" }]);
+    expect(manager.search(caplet, tools, "echo", 5)).toMatchObject([
+      { name: "echo_json", readOnlyHint: true },
+    ]);
     expect(await manager.getTool(caplet, "echo_json")).toMatchObject({
       name: "echo_json",
       inputSchema: expect.objectContaining({ type: "object" }),
@@ -159,8 +161,8 @@ describe("CliToolsManager", () => {
       caplet,
       {
         operation: "call_tool",
-        tool: "echo_json",
-        arguments: { message: "hello" },
+        name: "echo_json",
+        args: { message: "hello" },
         fields: ["json.message"],
       },
       registry,
diff --git a/packages/core/test/cli.test.ts b/packages/core/test/cli.test.ts
index c8fda36..4aafa25 100644
--- a/packages/core/test/cli.test.ts
+++ b/packages/core/test/cli.test.ts
@@ -640,9 +640,9 @@ describe("cli init", () => {
         status: "available",
         toolCount: 3,
       });
-      expect(results[2].tools).toHaveLength(3);
+      expect(results[2].items).toHaveLength(3);
       expect(results[3]).toMatchObject({ query: "echo" });
-      expect(results[3].tools).toHaveLength(1);
+      expect(results[3].items).toHaveLength(1);
       expect(results[4].tool.name).toBe("echo_json");
       expect(results[5].structuredContent).toEqual({ json: { message: "hello" } });
     } finally {
@@ -750,8 +750,8 @@ describe("cli init", () => {
           caplet: "linear",
           request: {
             operation: "get_prompt",
-            prompt: "review_issue",
-            arguments: { issueId: "CAP-123" },
+            name: "review_issue",
+            args: { issueId: "CAP-123" },
           },
         },
       },
diff --git a/packages/core/test/cloud-auth.test.ts b/packages/core/test/cloud-auth.test.ts
index f8128dd..69a64cd 100644
--- a/packages/core/test/cloud-auth.test.ts
+++ b/packages/core/test/cloud-auth.test.ts
@@ -1,4 +1,4 @@
-import { existsSync, mkdtempSync, rmSync, statSync } from "node:fs";
+import { existsSync, mkdirSync, mkdtempSync, rmSync, statSync, writeFileSync } from "node:fs";
 import { tmpdir } from "node:os";
 import { join } from "node:path";
 import { afterEach, describe, expect, it } from "vitest";
@@ -110,6 +110,64 @@ describe("caplets cloud auth CLI", () => {
 
     expect(existsSync(path)).toBe(false);
   });
+
+  it("uploads local caplet-files to the selected Cloud workspace", async () => {
+    const authPath = tempAuthPath();
+    await new CloudAuthStore({ path: authPath }).save(credentials);
+    const root = tempDir("caplets-cloud-add-");
+    mkdirSync(join(root, "search"), { recursive: true });
+    writeFileSync(
+      join(root, "search", "CAPLET.md"),
+      `---
+name: Search
+description: Search API.
+openapiEndpoint:
+  specPath: ./openapi.yaml
+  auth:
+    type: none
+---
+
+# Search
+`,
+    );
+    writeFileSync(join(root, "search", "openapi.yaml"), "openapi: 3.0.3\ninfo:\n  title: Search\n");
+    const requests: Array<{ url: string; init?: RequestInit }> = [];
+    const out: string[] = [];
+
+    await runCli(["cloud", "add", root, "--json"], {
+      env: { CAPLETS_CLOUD_AUTH_PATH: authPath },
+      fetch: (async (url, init) => {
+        requests.push({ url: String(url), ...(init === undefined ? {} : { init }) });
+        return Response.json(
+          {
+            caplet: { id: "search", name: "Search" },
+            caplets: [{ id: "search", name: "Search" }],
+          },
+          { status: 201 },
+        );
+      }) as typeof fetch,
+      writeOut: (value) => out.push(value),
+    });
+
+    expect(requests).toHaveLength(1);
+    expect(requests[0]?.url).toBe("https://cloud.caplets.dev/api/workspaces/team/caplets/custom");
+    expect(new Headers(requests[0]?.init?.headers).get("authorization")).toBe("Bearer access");
+    expect(JSON.parse(String(requests[0]?.init?.body))).toEqual({
+      bundle: {
+        files: [
+          expect.objectContaining({
+            path: "search/CAPLET.md",
+            content: expect.stringContaining("Search"),
+          }),
+          { path: "search/openapi.yaml", content: "openapi: 3.0.3\ninfo:\n  title: Search\n" },
+        ],
+      },
+    });
+    expect(JSON.parse(out.join(""))).toEqual({
+      caplets: [{ id: "search", name: "Search" }],
+      workspace: "team",
+    });
+  });
 });
 
 describe("CloudAuthStore", () => {
@@ -164,7 +222,11 @@ describe("CloudAuthStore", () => {
 });
 
 function tempAuthPath(): string {
-  const dir = mkdtempSync(join(tmpdir(), "caplets-cloud-auth-"));
+  return join(tempDir("caplets-cloud-auth-"), "cloud-auth.json");
+}
+
+function tempDir(prefix: string): string {
+  const dir = mkdtempSync(join(tmpdir(), prefix));
   tempDirs.push(dir);
-  return join(dir, "cloud-auth.json");
+  return dir;
 }
diff --git a/packages/core/test/code-mode-api.test.ts b/packages/core/test/code-mode-api.test.ts
new file mode 100644
index 0000000..1e8b661
--- /dev/null
+++ b/packages/core/test/code-mode-api.test.ts
@@ -0,0 +1,529 @@
+import { describe, expect, it, vi } from "vitest";
+import { createCodeModeCapletsApi, listCodeModeCallableCaplets } from "../src/code-mode/api";
+import type { CodeModeCapletHandle } from "../src/code-mode/api";
+import { CapletsError } from "../src/errors";
+import type { NativeCapletTool, NativeCapletsService } from "../src/native/service";
+
+function service(tools: NativeCapletTool[]): NativeCapletsService {
+  return {
+    listTools: () => tools,
+    execute: vi.fn(async (capletId: string, request: unknown) => ({
+      content: [{ type: "text", text: JSON.stringify({ capletId, request }) }],
+      structuredContent: { capletId, request },
+    })),
+    reload: vi.fn(async () => true),
+    onToolsChanged: vi.fn(() => () => undefined),
+    close: vi.fn(async () => undefined),
+  };
+}
+
+describe("Code Mode Caplets API", () => {
+  it("lists callable caplets from native service tools", () => {
+    const callable = listCodeModeCallableCaplets(
+      service([
+        {
+          caplet: "github",
+          toolName: "caplets_github",
+          title: "GitHub",
+          description: "GitHub repo operations.",
+          promptGuidance: [],
+        },
+      ]),
+    );
+
+    expect(callable).toEqual([
+      { id: "github", name: "GitHub", description: "GitHub repo operations." },
+    ]);
+  });
+
+  it("creates strict caplet handles that call existing progressive operations", async () => {
+    const native = service([
+      {
+        caplet: "github",
+        toolName: "caplets_github",
+        title: "GitHub",
+        description: "GitHub repo operations.",
+        promptGuidance: [],
+      },
+    ]);
+    const api = createCodeModeCapletsApi({ service: native });
+    const github = api.github as CodeModeCapletHandle;
+
+    expect(github.id).toBe("github");
+    await github.inspect();
+    await github.check();
+    await github.tools();
+    await github.describeTool("listIssues");
+    await expect(github.callTool("listIssues", { state: "open" })).resolves.toMatchObject({
+      ok: true,
+      data: {
+        capletId: "github",
+        request: {
+          args: { state: "open" },
+          operation: "call_tool",
+          name: "listIssues",
+        },
+      },
+      meta: { capletId: "github", tool: "listIssues" },
+    });
+
+    expect(native.execute).toHaveBeenNthCalledWith(1, "github", { operation: "inspect" });
+    expect(native.execute).toHaveBeenNthCalledWith(2, "github", { operation: "check" });
+    expect(native.execute).toHaveBeenNthCalledWith(3, "github", { operation: "tools" });
+    expect(native.execute).toHaveBeenNthCalledWith(4, "github", {
+      operation: "describe_tool",
+      name: "listIssues",
+    });
+    expect(native.execute).toHaveBeenNthCalledWith(5, "github", {
+      operation: "call_tool",
+      name: "listIssues",
+      args: { state: "open" },
+    });
+  });
+
+  it("treats unavailable backend checks as expected readiness failures", async () => {
+    const native = service([
+      {
+        caplet: "browser",
+        toolName: "caplets_browser",
+        title: "Browser",
+        description: "Browser automation.",
+        promptGuidance: [],
+      },
+    ]);
+    vi.mocked(native.execute).mockResolvedValueOnce({
+      structuredContent: {
+        result: {
+          id: "browser",
+          status: "unavailable",
+          elapsedMs: 21,
+          error: {
+            code: "SERVER_UNAVAILABLE",
+            message: "Browser profile is locked.",
+          },
+        },
+      },
+    });
+    const api = createCodeModeCapletsApi({ service: native });
+    const browser = api.browser as CodeModeCapletHandle;
+
+    await expect(browser.check()).resolves.toMatchObject({
+      ok: false,
+      error: {
+        code: "backend_not_ready",
+        message: "browser is unavailable: Browser profile is locked.",
+        details: {
+          id: "browser",
+          status: "unavailable",
+          error: {
+            code: "SERVER_UNAVAILABLE",
+            message: "Browser profile is locked.",
+          },
+        },
+      },
+      meta: { capletId: "browser" },
+    });
+  });
+
+  it("unwraps progressive disclosure results for handle inspection and tool discovery", async () => {
+    const native = service([
+      {
+        caplet: "github",
+        toolName: "caplets_github",
+        title: "GitHub",
+        description: "GitHub repo operations.",
+        promptGuidance: [],
+      },
+    ]);
+    vi.mocked(native.execute)
+      .mockResolvedValueOnce({
+        structuredContent: {
+          result: {
+            id: "github",
+            name: "GitHub",
+            description: "GitHub repo operations.",
+          },
+        },
+      })
+      .mockResolvedValueOnce({
+        structuredContent: {
+          result: {
+            id: "github",
+            name: "GitHub",
+            items: [
+              {
+                name: "get_me",
+                description: "Get current user.",
+                useWhen: "Use to identify the authenticated user.",
+                avoidWhen: "Avoid for repository owner lookup.",
+                hasInputSchema: true,
+                hasOutputSchema: false,
+                supportsFields: false,
+                readOnlyHint: true,
+              },
+            ],
+          },
+        },
+      })
+      .mockResolvedValueOnce({
+        structuredContent: {
+          result: {
+            id: "github",
+            tool: {
+              name: "get_me",
+              description: "Get current user.",
+              useWhen: "Use to identify the authenticated user.",
+              avoidWhen: "Avoid for repository owner lookup.",
+              inputSchema: {
+                type: "object",
+                properties: { owner: { type: "string" }, page: { type: "integer" } },
+                required: ["owner"],
+                additionalProperties: false,
+              },
+              outputSchema: {
+                type: "object",
+                properties: { login: { type: "string" } },
+                required: ["login"],
+              },
+            },
+            fieldSelection: { supported: true },
+            observedOutputShape: {
+              version: 1,
+              source: "observed",
+              observedAt: "2026-06-08T00:00:00.000Z",
+              sampleCount: 1,
+              typeScript: "type ObservedOutput = { login?: string; };",
+              jsonShape: {
+                kind: "object",
+                fields: { login: { optional: true, shape: { kind: "string" } } },
+              },
+              truncated: false,
+            },
+          },
+        },
+      });
+    const api = createCodeModeCapletsApi({ service: native });
+    const github = api.github as CodeModeCapletHandle;
+
+    await expect(github.inspect()).resolves.toMatchObject({ id: "github", name: "GitHub" });
+    await expect(github.tools({ limit: 1 })).resolves.toEqual({
+      items: [
+        {
+          name: "get_me",
+          description: "Get current user.",
+          useWhen: "Use to identify the authenticated user.",
+          avoidWhen: "Avoid for repository owner lookup.",
+          readOnlyHint: true,
+        },
+      ],
+    });
+    const descriptor = await github.describeTool("get_me");
+    expect(descriptor).toMatchObject({
+      ok: true,
+      data: {
+        id: "github",
+        tool: {
+          name: "get_me",
+          description: "Get current user.",
+          useWhen: "Use to identify the authenticated user.",
+          avoidWhen: "Avoid for repository owner lookup.",
+        },
+        inputSchema: expect.objectContaining({ type: "object" }),
+        outputSchema: expect.objectContaining({ type: "object" }),
+        callSignature:
+          'callTool(name: "get_me", args: GetMeInput): Promise<CapletsResult<GetMeOutput>>',
+        inputTypeScript: "type GetMeInput = { owner: string; page?: number; };",
+        outputTypeScript: expect.stringContaining("login: string"),
+        observedOutputShape: {
+          source: "observed",
+          typeScript: "type ObservedOutput = { login?: string; };",
+        },
+        examples: [],
+      },
+    });
+    if (!descriptor.ok) throw new Error("expected descriptor success");
+    const tool = (descriptor.data as { tool?: Record<string, unknown> }).tool ?? {};
+    expect((descriptor.data as { fieldSelection?: unknown }).fieldSelection).toBeUndefined();
+    expect(tool.inputSchema).toBeUndefined();
+    expect(tool.outputSchema).toBeUndefined();
+    expect(tool.icons).toBeUndefined();
+  });
+
+  it("returns expected tool failures as result envelopes", async () => {
+    const native = service([
+      {
+        caplet: "github",
+        toolName: "caplets_github",
+        title: "GitHub",
+        description: "GitHub repo operations.",
+        promptGuidance: [],
+      },
+    ]);
+    vi.mocked(native.execute).mockResolvedValueOnce({
+      isError: true,
+      content: [{ type: "text", text: "Bad request." }],
+      structuredContent: { errorCode: "request_invalid" },
+    });
+    const api = createCodeModeCapletsApi({ service: native });
+    const github = api.github as CodeModeCapletHandle;
+
+    await expect(github.callTool("listIssues", {})).resolves.toMatchObject({
+      ok: false,
+      error: { code: "request_invalid", message: "Bad request." },
+      meta: { capletId: "github", tool: "listIssues" },
+    });
+  });
+
+  it("preserves structured error details without double wrapping", async () => {
+    const native = service([
+      {
+        caplet: "github",
+        toolName: "caplets_github",
+        title: "GitHub",
+        description: "GitHub repo operations.",
+        promptGuidance: [],
+      },
+    ]);
+    vi.mocked(native.execute).mockResolvedValueOnce({
+      isError: true,
+      content: [{ type: "text", text: "call_tool args are invalid" }],
+      structuredContent: {
+        error: {
+          code: "REQUEST_INVALID",
+          message: "call_tool args are invalid",
+          details: {
+            requiredArgs: ["query"],
+            acceptedArgs: ["perPage", "query"],
+          },
+        },
+      },
+    });
+    const api = createCodeModeCapletsApi({ service: native });
+    const github = api.github as CodeModeCapletHandle;
+
+    await expect(github.callTool("search_issues", { q: "repo:o/r" })).resolves.toMatchObject({
+      ok: false,
+      error: {
+        code: "REQUEST_INVALID",
+        message: "callTool args are invalid",
+        details: {
+          requiredArgs: ["query"],
+          acceptedArgs: ["perPage", "query"],
+        },
+      },
+    });
+  });
+
+  it("preserves thrown validation details for Code Mode repair", async () => {
+    const native = service([
+      {
+        caplet: "github",
+        toolName: "caplets_github",
+        title: "GitHub",
+        description: "GitHub repo operations.",
+        promptGuidance: [],
+      },
+    ]);
+    vi.mocked(native.execute).mockRejectedValueOnce(
+      new CapletsError(
+        "REQUEST_INVALID",
+        "call_tool args for search_issues are invalid; use search_tools or describe_tool before call_tool.",
+        {
+          tool: "search_issues",
+          schemaErrors: [{ path: "/query", rule: "type", expected: "string" }],
+          callSignature:
+            'callTool(name: "search_issues", args: SearchIssuesInput): Promise<CapletsResult<SearchIssuesOutput>>',
+          retry:
+            "Call describe_tool for this tool, then call_tool with args matching inputSchema/inputTypeScript exactly.",
+          fallback:
+            "If this is not the right tool, use search_tools, read_resource, resource_templates, search_resources, search_prompts, get_prompt, or complete.",
+          nested: ["describe_tool", { operation: "call_tool" }],
+        },
+      ),
+    );
+    const api = createCodeModeCapletsApi({ service: native });
+    const github = api.github as CodeModeCapletHandle;
+
+    const result = await github.callTool("search_issues", { query: 123 });
+    expect(result).toMatchObject({
+      ok: false,
+      error: {
+        code: "REQUEST_INVALID",
+        message:
+          "callTool args for search_issues are invalid; use searchTools or describeTool before callTool.",
+        details: {
+          tool: "search_issues",
+          schemaErrors: [{ path: "/query", rule: "type", expected: "string" }],
+          retry:
+            "Call describeTool for this tool, then callTool with args matching inputSchema/inputTypeScript exactly.",
+          fallback:
+            "If this is not the right tool, use searchTools, readResource, resourceTemplates, searchResources, searchPrompts, getPrompt, or complete.",
+          nested: ["describeTool", { operation: "callTool" }],
+        },
+      },
+    });
+    expect(JSON.stringify(result)).not.toContain("call_tool");
+    expect(JSON.stringify(result)).not.toContain("describe_tool");
+    expect(JSON.stringify(result)).not.toContain("search_tools");
+    expect(JSON.stringify(result)).not.toContain("read_resource");
+    expect(JSON.stringify(result)).not.toContain("resource_templates");
+    expect(JSON.stringify(result)).not.toContain("search_resources");
+    expect(JSON.stringify(result)).not.toContain("search_prompts");
+    expect(JSON.stringify(result)).not.toContain("get_prompt");
+  });
+
+  it("compacts tool call success results to the useful payload", async () => {
+    const native = service([
+      {
+        caplet: "github",
+        toolName: "caplets_github",
+        title: "GitHub",
+        description: "GitHub repo operations.",
+        promptGuidance: [],
+      },
+    ]);
+    vi.mocked(native.execute).mockResolvedValueOnce({
+      content: [{ type: "text", text: JSON.stringify({ login: "octocat", id: 1 }) }],
+      _meta: {
+        caplets: {
+          id: "github",
+          name: "GitHub",
+          backend: "mcp",
+          operation: "call_tool",
+          tool: "get_me",
+          status: "ok",
+          elapsedMs: 12,
+        },
+      },
+    });
+    const api = createCodeModeCapletsApi({ service: native });
+    const github = api.github as CodeModeCapletHandle;
+
+    await expect(github.callTool("get_me", {})).resolves.toEqual({
+      ok: true,
+      data: { login: "octocat", id: 1 },
+      meta: {
+        capletId: "github",
+        tool: "get_me",
+        durationMs: expect.any(Number),
+        status: "ok",
+        elapsedMs: 12,
+      },
+    });
+  });
+
+  it("unwraps HTTP-style structured bodies for tool call success results", async () => {
+    const native = service([
+      {
+        caplet: "osv",
+        toolName: "caplets_osv",
+        title: "OSV",
+        description: "Open Source Vulnerabilities operations.",
+        promptGuidance: [],
+      },
+    ]);
+    vi.mocked(native.execute).mockResolvedValueOnce({
+      structuredContent: {
+        status: 200,
+        statusText: "",
+        headers: { "content-type": "application/json" },
+        body: {
+          vulns: [
+            { id: "GHSA-35jh-r3h4-6jhm", aliases: ["CVE-2021-23337"] },
+            { id: "GHSA-29mw-wpgm-hmr9", aliases: ["CVE-2020-28500"] },
+          ],
+        },
+      },
+      content: [{ type: "text", text: "HTTP 200" }],
+    });
+    const api = createCodeModeCapletsApi({ service: native });
+    const osv = api.osv as CodeModeCapletHandle;
+
+    await expect(
+      osv.callTool("query_package_version", {
+        name: "lodash",
+        ecosystem: "npm",
+        version: "4.17.20",
+      }),
+    ).resolves.toMatchObject({
+      ok: true,
+      data: {
+        vulns: [
+          { id: "GHSA-35jh-r3h4-6jhm", aliases: ["CVE-2021-23337"] },
+          { id: "GHSA-29mw-wpgm-hmr9", aliases: ["CVE-2020-28500"] },
+        ],
+      },
+      meta: { capletId: "osv", tool: "query_package_version" },
+    });
+  });
+
+  it("does not expose raw MCP transport details in expected tool failures", async () => {
+    const native = service([
+      {
+        caplet: "github",
+        toolName: "caplets_github",
+        title: "GitHub",
+        description: "GitHub repo operations.",
+        promptGuidance: [],
+      },
+    ]);
+    vi.mocked(native.execute).mockResolvedValueOnce({
+      isError: true,
+      content: [{ type: "text", text: "missing required parameter: owner" }],
+      _meta: {
+        caplets: {
+          id: "github",
+          name: "GitHub",
+          backend: "mcp",
+          operation: "call_tool",
+          tool: "create_branch",
+          status: "error",
+          elapsedMs: 180,
+        },
+      },
+    });
+    const api = createCodeModeCapletsApi({ service: native });
+    const github = api.github as CodeModeCapletHandle;
+    const result = await github.callTool("create_branch", {});
+
+    expect(result).toEqual({
+      ok: false,
+      error: {
+        code: "tool_call_failed",
+        message: "missing required parameter: owner",
+      },
+      meta: {
+        capletId: "github",
+        tool: "create_branch",
+        durationMs: expect.any(Number),
+        status: "error",
+        elapsedMs: 180,
+      },
+    });
+    expect(JSON.stringify(result)).not.toContain('"content"');
+    expect(JSON.stringify(result)).not.toContain('"_meta"');
+  });
+
+  it("adds debug.readLogs without hiding a debug caplet handle", () => {
+    const native = service([
+      {
+        caplet: "debug",
+        toolName: "caplets_debug",
+        title: "Debug",
+        description: "Debug caplet.",
+        promptGuidance: [],
+      },
+    ]);
+    const api = createCodeModeCapletsApi({
+      service: native,
+      readLogs: vi.fn(async () => ({
+        entries: [],
+      })),
+    });
+    const debug = api.debug as CodeModeCapletHandle & { readLogs: unknown };
+
+    expect(debug.id).toBe("debug");
+    expect(debug.readLogs).toBeTypeOf("function");
+    expect(debug.callTool).toBeTypeOf("function");
+  });
+});
diff --git a/packages/core/test/code-mode-cli.test.ts b/packages/core/test/code-mode-cli.test.ts
new file mode 100644
index 0000000..3a971be
--- /dev/null
+++ b/packages/core/test/code-mode-cli.test.ts
@@ -0,0 +1,173 @@
+import { mkdirSync, mkdtempSync, rmSync, writeFileSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { afterEach, beforeEach, describe, expect, it } from "vitest";
+import { runCli } from "../src/cli";
+
+describe("Code Mode CLI", () => {
+  const originalMode = process.env.CAPLETS_MODE;
+  const originalConfigPath = process.env.CAPLETS_CONFIG;
+  const originalProjectConfigPath = process.env.CAPLETS_PROJECT_CONFIG;
+
+  beforeEach(() => {
+    process.env.CAPLETS_MODE = "local";
+    delete process.env.CAPLETS_PROJECT_CONFIG;
+  });
+
+  afterEach(() => {
+    if (originalMode === undefined) {
+      delete process.env.CAPLETS_MODE;
+    } else {
+      process.env.CAPLETS_MODE = originalMode;
+    }
+    if (originalConfigPath === undefined) {
+      delete process.env.CAPLETS_CONFIG;
+    } else {
+      process.env.CAPLETS_CONFIG = originalConfigPath;
+    }
+    if (originalProjectConfigPath === undefined) {
+      delete process.env.CAPLETS_PROJECT_CONFIG;
+    } else {
+      process.env.CAPLETS_PROJECT_CONFIG = originalProjectConfigPath;
+    }
+  });
+
+  it("runs inline code and prints the JSON envelope", async () => {
+    const dir = mkdtempSync(join(tmpdir(), "caplets-code-mode-cli-"));
+    const out: string[] = [];
+    try {
+      process.env.CAPLETS_CONFIG = writeConfig(dir, {});
+
+      await runCli(["run", "return { ok: true };", "--json"], {
+        writeOut: (value) => out.push(value),
+      });
+
+      expect(JSON.parse(out.join(""))).toMatchObject({
+        ok: true,
+        value: { ok: true },
+      });
+    } finally {
+      rmSync(dir, { recursive: true, force: true });
+    }
+  });
+
+  it("reads --file paths relative to the current working directory", async () => {
+    const dir = mkdtempSync(join(tmpdir(), "caplets-code-mode-cli-"));
+    const cwd = process.cwd();
+    const out: string[] = [];
+    try {
+      process.env.CAPLETS_CONFIG = writeConfig(dir, {});
+      const project = join(dir, "project");
+      mkdirSync(project, { recursive: true });
+      writeFileSync(join(project, "workflow.ts"), "return { source: 'file' };\n");
+      process.chdir(project);
+
+      await runCli(["run", "--file", "workflow.ts", "--json"], {
+        writeOut: (value) => out.push(value),
+      });
+
+      expect(JSON.parse(out.join(""))).toMatchObject({
+        ok: true,
+        value: { source: "file" },
+      });
+    } finally {
+      process.chdir(cwd);
+      rmSync(dir, { recursive: true, force: true });
+    }
+  });
+
+  it("reads stdin when inline code and file input are absent", async () => {
+    const dir = mkdtempSync(join(tmpdir(), "caplets-code-mode-cli-"));
+    const out: string[] = [];
+    try {
+      process.env.CAPLETS_CONFIG = writeConfig(dir, {});
+
+      await runCli(["run", "--json"], {
+        writeOut: (value) => out.push(value),
+        readStdin: async () => "return { source: 'stdin' };",
+      });
+
+      expect(JSON.parse(out.join(""))).toMatchObject({
+        ok: true,
+        value: { source: "stdin" },
+      });
+    } finally {
+      rmSync(dir, { recursive: true, force: true });
+    }
+  });
+
+  it("prints generated declaration text", async () => {
+    const dir = mkdtempSync(join(tmpdir(), "caplets-code-mode-cli-"));
+    const out: string[] = [];
+    try {
+      process.env.CAPLETS_CONFIG = writeConfig(dir, {
+        mcpServers: {
+          github: {
+            name: "GitHub",
+            description: "GitHub repo operations.",
+            command: "node",
+          },
+        },
+      });
+
+      await runCli(["code-mode", "types"], {
+        writeOut: (value) => out.push(value),
+      });
+
+      expect(out.join("")).toContain('github:CapletHandle<"github">;');
+      expect(out.join("")).toContain("GitHub repo operations.");
+    } finally {
+      rmSync(dir, { recursive: true, force: true });
+    }
+  });
+
+  it("prints generated declaration metadata as JSON", async () => {
+    const dir = mkdtempSync(join(tmpdir(), "caplets-code-mode-cli-"));
+    const out: string[] = [];
+    try {
+      process.env.CAPLETS_CONFIG = writeConfig(dir, {
+        mcpServers: {
+          github: {
+            name: "GitHub",
+            description: "GitHub repo operations.",
+            command: "node",
+          },
+        },
+      });
+
+      await runCli(["code-mode", "types", "--json"], {
+        writeOut: (value) => out.push(value),
+      });
+
+      expect(JSON.parse(out.join(""))).toMatchObject({
+        callableCount: 1,
+        runtimeScope: "local",
+      });
+      expect(JSON.parse(out.join("")).declarationHash).toMatch(/^[a-f0-9]{64}$/u);
+    } finally {
+      rmSync(dir, { recursive: true, force: true });
+    }
+  });
+});
+
+function writeConfig(dir: string, config: Record<string, unknown>): string {
+  const path = join(dir, "config.json");
+  writeFileSync(
+    path,
+    JSON.stringify(
+      Object.keys(config).length > 0
+        ? config
+        : {
+            mcpServers: {
+              placeholder: {
+                name: "Placeholder",
+                description: "Disabled placeholder.",
+                command: "node",
+                disabled: true,
+              },
+            },
+          },
+    ),
+  );
+  return path;
+}
diff --git a/packages/core/test/code-mode-declarations.test.ts b/packages/core/test/code-mode-declarations.test.ts
new file mode 100644
index 0000000..e99da82
--- /dev/null
+++ b/packages/core/test/code-mode-declarations.test.ts
@@ -0,0 +1,151 @@
+import { readFileSync } from "node:fs";
+import { join } from "node:path";
+import { describe, expect, it } from "vitest";
+import { CODE_MODE_RUNTIME_API_DECLARATION } from "../src/code-mode/runtime-api.generated";
+import {
+  codeModeDeclarationHash,
+  generateCodeModeDeclarations,
+  generateCodeModeRunToolDescription,
+  minifyCodeModeDeclarationText,
+} from "../src/code-mode/declarations";
+import type { CodeModeCallableCaplet } from "../src/code-mode/types";
+
+describe("generateCodeModeDeclarations", () => {
+  it("keeps the generated runtime API declaration in sync with the checked template", () => {
+    const template = readFileSync(
+      join(import.meta.dirname, "../src/code-mode/runtime-api.d.ts"),
+      "utf8",
+    );
+
+    expect(CODE_MODE_RUNTIME_API_DECLARATION).toBe(minifyCodeModeDeclarationText(template));
+  });
+
+  it("declares callable caplets with strict handle ids and compact descriptions", () => {
+    const declaration = generateCodeModeDeclarations({
+      caplets: [
+        {
+          id: "github",
+          name: "GitHub",
+          description: "GitHub repo, issue, PR, workflow ops.",
+          useWhen: "Use for repository issue, PR, and workflow tasks.",
+          avoidWhen: "Avoid for package vulnerability lookup.",
+        },
+        {
+          id: "build-system",
+          name: "Build System",
+          description: "Internal build system operations.",
+        },
+      ],
+    });
+
+    expect(declaration).toContain('github:CapletHandle<"github">;');
+    expect(declaration).toContain('"build-system":CapletHandle<"build-system">;');
+    expect(declaration).toContain(
+      "/**GitHub repo, issue, PR, workflow ops. Use when: Use for repository issue, PR, and workflow tasks. Avoid when: Avoid for package vulnerability lookup.*/",
+    );
+    expect(declaration).toContain("/** Search tool summaries for the discovery pass;");
+    expect(declaration).toContain("prefer outputSchema/outputTypeScript over observed hints");
+    expect(declaration).toContain("Exact downstream tool identifier");
+    expect(declaration).toContain("useWhen?:string");
+    expect(declaration).toContain("avoidWhen?:string");
+    expect(declaration).toContain("readOnlyHint?:boolean");
+    expect(declaration).toContain("destructiveHint?:boolean");
+    expect(declaration).toContain("type ToolSummary={");
+    expect(declaration).not.toContain("ToolSummary={id?:string");
+    expect(declaration).not.toContain("tool?:string;description");
+    expect(declaration).toContain("inspect():Promise<CapletCard<Id>>;");
+    expect(declaration).toContain(
+      "callTool(name:string,args?:unknown):Promise<CapletsResult<unknown>>",
+    );
+    expect(declaration).toContain("observedOutputShape?:ObservedOutputShape");
+    expect(declaration).not.toContain("fieldSelection");
+    expect(declaration).toContain("resources(input?:PageInput):Promise<Page<ResourceSummary>>");
+    expect(declaration).toContain("readLogs(input:ReadLogsInput):Promise<ReadLogsResult>");
+    expect(declaration).not.toContain("\n\n");
+    expect(declaration).not.toContain(" = ");
+  });
+
+  it("builds the shared run tool description from generated declarations", () => {
+    const declaration = 'declare const caplets:{docs:CapletHandle<"docs">;};';
+    const description = generateCodeModeRunToolDescription(declaration);
+
+    expect(description).toContain("Prefer a two-pass workflow for non-trivial tasks");
+    expect(description).toContain(
+      "Pass 1: discover and inspect candidate caplets/tools/resources/prompts",
+    );
+    expect(description).toContain("Pass 2: execute with exact args");
+    expect(description).toContain("Return decision-ready JSON, not raw tool payloads");
+    expect(description).toContain("For fallback, check candidate handles first");
+    expect(description).toContain("const ready=await h.check()");
+    expect(description).toContain("Never invent tool names, resource URIs, prompt names");
+    expect(description).toContain("Never infer input/output schemas from memory");
+    expect(description).toContain("use describeTool for the exact callSignature");
+    expect(description).toContain("Generated declaration hints:");
+    expect(description).toContain(declaration);
+    expect(description).not.toContain("Do not split discovery and execution");
+    expect(description).not.toContain("caplets.github");
+    expect(description).not.toContain("search_issues");
+  });
+
+  it("uses intersection typing when a callable caplet id collides with debug", () => {
+    const declaration = generateCodeModeDeclarations({
+      caplets: [
+        {
+          id: "debug",
+          name: "Debug Caplet",
+          description: "Debug capability domain.",
+        },
+      ],
+    });
+
+    expect(declaration).toContain('debug:DebugApi&CapletHandle<"debug">;');
+    expect(declaration).not.toContain("debug: {");
+  });
+
+  it("removes repeated discovery guidance and native metadata from JSDoc hints", () => {
+    const declaration = generateCodeModeDeclarations({
+      caplets: [
+        {
+          id: "github",
+          name: "GitHub",
+          description:
+            "GitHub Caplet. Inspect and manage GitHub repositories, issues, pull requests, branches, commits, and code review workflows. Use inspect for details when needed; use tools for actions, resources for readable context, prompts for reusable workflows, and complete for prompt/resource-template arguments. Native tool name: caplets_github Original Caplet ID: github",
+        },
+      ],
+    });
+
+    expect(declaration).toContain(
+      "/**GitHub Caplet. Inspect and manage GitHub repositories, issues, pull requests, branches, commits, and code review workflows.*/",
+    );
+    expect(declaration).not.toContain("Use inspect for details when needed");
+    expect(declaration).not.toContain("Native tool name:");
+    expect(declaration).not.toContain("Original Caplet ID:");
+  });
+
+  it("bounds long JSDoc hints", () => {
+    const declaration = generateCodeModeDeclarations({
+      caplets: [
+        {
+          id: "verbose",
+          name: "Verbose",
+          description: "A".repeat(500),
+        },
+      ],
+    });
+
+    expect(declaration).toContain(`${"A".repeat(177)}...`);
+    expect(declaration).not.toContain("A".repeat(181));
+  });
+
+  it("returns stable hashes for equivalent declaration content", () => {
+    const caplets: CodeModeCallableCaplet[] = [
+      { id: "github", name: "GitHub", description: "GitHub repo operations." },
+    ];
+
+    const first = codeModeDeclarationHash(generateCodeModeDeclarations({ caplets }));
+    const second = codeModeDeclarationHash(generateCodeModeDeclarations({ caplets }));
+
+    expect(first).toMatch(/^[a-f0-9]{64}$/u);
+    expect(second).toBe(first);
+  });
+});
diff --git a/packages/core/test/code-mode-diagnostics.test.ts b/packages/core/test/code-mode-diagnostics.test.ts
new file mode 100644
index 0000000..4629d53
--- /dev/null
+++ b/packages/core/test/code-mode-diagnostics.test.ts
@@ -0,0 +1,136 @@
+import { describe, expect, it } from "vitest";
+import { generateCodeModeDeclarations } from "../src/code-mode/declarations";
+import { diagnoseCodeModeTypeScript } from "../src/code-mode/diagnostics";
+
+const declaration = generateCodeModeDeclarations({
+  caplets: [{ id: "github", name: "GitHub", description: "GitHub repo operations." }],
+});
+
+describe("diagnoseCodeModeTypeScript", () => {
+  it("blocks unknown CapletHandle methods before execution", () => {
+    const diagnostics = diagnoseCodeModeTypeScript({
+      declaration,
+      code: 'await caplets.github.call("listIssues", {});',
+    });
+
+    expect(diagnostics.some((diagnostic) => diagnostic.severity === "error")).toBe(true);
+    expect(diagnostics.map((diagnostic) => diagnostic.message).join("\n")).toContain(
+      "CapletHandle does not expose call()",
+    );
+    expect(diagnostics.map((diagnostic) => diagnostic.message).join("\n")).toContain("callTool");
+  });
+
+  it("blocks direct fetch because the ambient lib omits network globals", () => {
+    const diagnostics = diagnoseCodeModeTypeScript({
+      declaration,
+      code: 'await fetch("https://example.com");',
+    });
+
+    expect(diagnostics.some((diagnostic) => diagnostic.severity === "error")).toBe(true);
+    expect(diagnostics.map((diagnostic) => diagnostic.message).join("\n")).toContain(
+      "Direct fetch is not available",
+    );
+  });
+
+  it("allows standard JavaScript, console, URL, JSON, and Caplet callTool", () => {
+    const diagnostics = diagnoseCodeModeTypeScript({
+      declaration,
+      code: `
+        const url = new URL("https://example.com/issues?state=open");
+        console.log(JSON.stringify({ state: url.searchParams.get("state") }));
+        const result = await caplets.github.callTool("listIssues", { state: "open" });
+        return result;
+      `,
+    });
+
+    expect(diagnostics.filter((diagnostic) => diagnostic.severity === "error")).toEqual([]);
+  });
+
+  it("blocks static and dynamic imports", () => {
+    const diagnostics = diagnoseCodeModeTypeScript({
+      declaration,
+      code: `
+        import fs from "node:fs";
+        await import("node:process");
+      `,
+    });
+
+    expect(
+      diagnostics.filter((diagnostic) => diagnostic.severity === "error").length,
+    ).toBeGreaterThanOrEqual(1);
+    expect(diagnostics.map((diagnostic) => diagnostic.message).join("\n")).toContain(
+      "Imports are not available in Code Mode",
+    );
+  });
+
+  it("honors per-line @ts-ignore for TypeScript diagnostics", () => {
+    const diagnostics = diagnoseCodeModeTypeScript({
+      declaration,
+      code: `
+        // @ts-ignore
+        caplets.github.notARealMethod();
+        return true;
+      `,
+    });
+
+    expect(diagnostics.filter((diagnostic) => diagnostic.severity === "error")).toEqual([]);
+    expect(diagnostics.map((diagnostic) => diagnostic.code)).not.toContain("2339");
+  });
+
+  it("honors per-line @ts-expect-error and reports unused directives", () => {
+    const suppressed = diagnoseCodeModeTypeScript({
+      declaration,
+      code: `
+        // @ts-expect-error
+        caplets.github.notARealMethod();
+        return true;
+      `,
+    });
+    const unused = diagnoseCodeModeTypeScript({
+      declaration,
+      code: `
+        // @ts-expect-error
+        return true;
+      `,
+    });
+
+    expect(suppressed.map((diagnostic) => diagnostic.code)).not.toContain("2339");
+    expect(unused.map((diagnostic) => diagnostic.code)).toContain("2578");
+  });
+
+  it("honors whole-script @ts-nocheck line and block comments", () => {
+    const lineComment = diagnoseCodeModeTypeScript({
+      declaration,
+      code: `
+        // @ts-nocheck
+        caplets.github.notARealMethod();
+        return true;
+      `,
+    });
+    const blockComment = diagnoseCodeModeTypeScript({
+      declaration,
+      code: `
+        /* @ts-nocheck */
+        caplets.github.notARealMethod();
+        return true;
+      `,
+    });
+
+    expect(lineComment.map((diagnostic) => diagnostic.code)).toContain("ts_nocheck_applied");
+    expect(lineComment.map((diagnostic) => diagnostic.code)).not.toContain("2339");
+    expect(blockComment.map((diagnostic) => diagnostic.code)).toContain("ts_nocheck_applied");
+    expect(blockComment.map((diagnostic) => diagnostic.code)).not.toContain("2339");
+  });
+
+  it("does not allow TypeScript comments to suppress Code Mode safety checks", () => {
+    const diagnostics = diagnoseCodeModeTypeScript({
+      declaration,
+      code: `
+        // @ts-ignore
+        await fetch("https://example.com");
+      `,
+    });
+
+    expect(diagnostics.map((diagnostic) => diagnostic.code)).toContain("FETCH_UNAVAILABLE");
+  });
+});
diff --git a/packages/core/test/code-mode-logs.test.ts b/packages/core/test/code-mode-logs.test.ts
new file mode 100644
index 0000000..ff8d5d7
--- /dev/null
+++ b/packages/core/test/code-mode-logs.test.ts
@@ -0,0 +1,93 @@
+import { mkdtempSync, readFileSync, rmSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { describe, expect, it } from "vitest";
+import { CodeModeLogStore, redactCodeModeLogText } from "../src/code-mode/logs";
+
+describe("Code Mode logs", () => {
+  it("redacts common secrets, credentials, and PII", () => {
+    const redacted = redactCodeModeLogText(
+      [
+        "Authorization: Bearer secret-token-value",
+        "cookie=session=secret-cookie",
+        "email ian@example.com",
+        "phone +1 (555) 123-4567",
+        "ssn 123-45-6789",
+        "card 4111 1111 1111 1111",
+        "token abcdefghijklmnopqrstuvwxyzABCDEFGHIJKL0123456789",
+      ].join("\n"),
+    );
+
+    expect(redacted).not.toContain("secret-token-value");
+    expect(redacted).not.toContain("secret-cookie");
+    expect(redacted).not.toContain("ian@example.com");
+    expect(redacted).not.toContain("123-45-6789");
+    expect(redacted).not.toContain("4111 1111 1111 1111");
+    expect(redacted).toContain("[REDACTED:token]");
+    expect(redacted).toContain("[REDACTED:email]");
+    expect(redacted).toContain("[REDACTED:ssn]");
+    expect(redacted).toContain("[REDACTED:credit-card]");
+  });
+
+  it("stores redacted entries and reads them by opaque logRef", async () => {
+    const dir = mkdtempSync(join(tmpdir(), "caplets-code-mode-logs-"));
+    try {
+      const store = new CodeModeLogStore({
+        stateDir: dir,
+        now: () => new Date("2026-06-07T12:00:00.000Z"),
+      });
+      const stored = await store.store([
+        {
+          level: "log",
+          message: "hello bearer secret-token-value ian@example.com",
+          timestamp: "2026-06-07T12:00:00.000Z",
+        },
+      ]);
+
+      expect(stored.logRef).toMatch(/^[a-f0-9]{48}$/u);
+      const raw = readFileSync(join(dir, "code-mode", "logs", `${stored.logRef}.json`), "utf8");
+      expect(raw).not.toContain("secret-token-value");
+      expect(raw).not.toContain("ian@example.com");
+
+      const read = await store.read({ logRef: stored.logRef, limit: 10 });
+
+      expect(read.entries).toEqual([
+        {
+          level: "log",
+          message: "hello bearer [REDACTED:token] [REDACTED:email]",
+          timestamp: "2026-06-07T12:00:00.000Z",
+        },
+      ]);
+    } finally {
+      rmSync(dir, { recursive: true, force: true });
+    }
+  });
+
+  it("returns no entries for expired or unknown log refs", async () => {
+    const dir = mkdtempSync(join(tmpdir(), "caplets-code-mode-logs-"));
+    try {
+      const store = new CodeModeLogStore({
+        stateDir: dir,
+        now: () => new Date("2026-06-07T12:00:00.000Z"),
+        logRefTtlMs: 1,
+      });
+      const stored = await store.store([
+        {
+          level: "log",
+          message: "hello",
+          timestamp: "2026-06-07T12:00:00.000Z",
+        },
+      ]);
+      const expiredStore = new CodeModeLogStore({
+        stateDir: dir,
+        now: () => new Date("2026-06-07T12:00:01.000Z"),
+        logRefTtlMs: 1,
+      });
+
+      await expect(expiredStore.read({ logRef: stored.logRef })).resolves.toEqual({ entries: [] });
+      await expect(expiredStore.read({ logRef: "0".repeat(48) })).resolves.toEqual({ entries: [] });
+    } finally {
+      rmSync(dir, { recursive: true, force: true });
+    }
+  });
+});
diff --git a/packages/core/test/code-mode-mcp.test.ts b/packages/core/test/code-mode-mcp.test.ts
new file mode 100644
index 0000000..0131f7d
--- /dev/null
+++ b/packages/core/test/code-mode-mcp.test.ts
@@ -0,0 +1,161 @@
+import { mkdirSync, mkdtempSync, rmSync, writeFileSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import type { RegisteredTool } from "@modelcontextprotocol/sdk/server/mcp";
+import { afterEach, describe, expect, it, vi } from "vitest";
+import { CapletsEngine } from "../src/engine";
+import { CapletsMcpSession } from "../src/serve/session";
+
+const dirs: string[] = [];
+
+afterEach(() => {
+  for (const dir of dirs.splice(0)) {
+    rmSync(dir, { recursive: true, force: true });
+  }
+});
+
+describe("Code Mode MCP run tool", () => {
+  it("registers run alongside existing Caplet tools", async () => {
+    const { dir, configPath, projectConfigPath } = tempConfig({
+      mcpServers: {
+        github: { name: "GitHub", description: "GitHub repo operations.", command: "node" },
+      },
+    });
+    dirs.push(dir);
+    const engine = new CapletsEngine({ configPath, projectConfigPath, watch: false });
+    const server = mockServer();
+    const session = new CapletsMcpSession(engine, { server });
+
+    expect(session.registeredToolIds()).toEqual(["github"]);
+    expect(server.registered.get("github")).toBeDefined();
+    expect(server.registered.get("run")).toBeDefined();
+    expect(server.definitions.get("run")?.description).toContain("caplets.<id>");
+    expect(server.definitions.get("run")?.description).toContain(
+      "Prefer a two-pass workflow for non-trivial tasks",
+    );
+    expect(server.definitions.get("run")?.description).toContain(
+      "Pass 1: discover and inspect candidate caplets/tools/resources/prompts",
+    );
+    expect(server.definitions.get("run")?.description).toContain(
+      "return chosen handles, call signatures/schemas, and planned args",
+    );
+    expect(server.definitions.get("run")?.description).toContain("Pass 2: execute with exact args");
+    expect(server.definitions.get("run")?.description).toContain(
+      "Return decision-ready JSON, not raw tool payloads",
+    );
+    expect(server.definitions.get("run")?.description).toContain(
+      "derive final recommendations from all relevant records",
+    );
+    expect(server.definitions.get("run")?.description).toContain(
+      "summary, key evidence, derived fields, recommendation",
+    );
+    expect(server.definitions.get("run")?.description).toContain(
+      "if records disagree or have ranges/statuses, compute the strictest applicable conclusion",
+    );
+    expect(server.definitions.get("run")?.description).toContain(
+      "prefer `outputSchema` or `outputTypeScript`",
+    );
+    expect(server.definitions.get("run")?.description).toContain(
+      "do not guess from provider memory",
+    );
+    expect(server.definitions.get("run")?.description).toContain(
+      "Never invent tool names, resource URIs, prompt names",
+    );
+    expect(server.definitions.get("run")?.description).toContain(
+      "Never infer input/output schemas from memory",
+    );
+    expect(server.definitions.get("run")?.description).toContain(
+      "use describeTool for the exact callSignature",
+    );
+    expect(server.definitions.get("run")?.description).toContain("list broad candidate records");
+    expect(server.definitions.get("run")?.description).toContain('const h=caplets["caplet-id"]');
+    expect(server.definitions.get("run")?.description).toContain("observedOutputShape");
+    expect(server.definitions.get("run")?.description).toContain("absent or generic");
+    expect(server.definitions.get("run")?.description).toContain("Filter bulky results in script");
+    expect(server.definitions.get("run")?.description).toContain("html_url");
+    expect(server.definitions.get("run")?.description).not.toContain(
+      "Do not split discovery and execution",
+    );
+    expect(server.definitions.get("run")?.description).not.toContain(
+      "inside the same script before returning",
+    );
+    expect(server.definitions.get("run")?.description).not.toContain(
+      "Use multiple `run` calls only after",
+    );
+    expect(server.definitions.get("run")?.description).not.toContain("OSV");
+    expect(server.definitions.get("run")?.description).not.toContain("vulnerability");
+    expect(server.definitions.get("run")?.description).not.toContain("release");
+    expect(server.definitions.get("run")?.description).toContain("Generated declaration hints:");
+    expect(server.definitions.get("run")?.description).toContain('github:CapletHandle<"github">');
+
+    await session.close();
+    await engine.close();
+  });
+
+  it("returns a structured run envelope from the run tool", async () => {
+    const { dir, configPath, projectConfigPath } = tempConfig({
+      mcpServers: {
+        github: { name: "GitHub", description: "GitHub repo operations.", command: "node" },
+      },
+    });
+    dirs.push(dir);
+    const engine = new CapletsEngine({ configPath, projectConfigPath, watch: false });
+    const server = mockServer();
+    const session = new CapletsMcpSession(engine, { server });
+    const callback = server.callbacks.get("run");
+
+    const result = await callback?.({ code: "return { ok: true };" });
+
+    expect(result?.structuredContent).toMatchObject({
+      ok: true,
+      value: { ok: true },
+    });
+    expect(result?.content[0]).toMatchObject({ type: "text" });
+
+    await session.close();
+    await engine.close();
+  });
+});
+
+function tempConfig(config: unknown): {
+  dir: string;
+  configPath: string;
+  projectConfigPath: string;
+} {
+  const dir = mkdtempSync(join(tmpdir(), "caplets-code-mode-mcp-"));
+  const userRoot = join(dir, "user");
+  const projectRoot = join(dir, "project", ".caplets");
+  mkdirSync(userRoot, { recursive: true });
+  mkdirSync(projectRoot, { recursive: true });
+  const configPath = join(userRoot, "config.json");
+  const projectConfigPath = join(projectRoot, "config.json");
+  writeFileSync(configPath, JSON.stringify(config));
+  return { dir, configPath, projectConfigPath };
+}
+
+function mockServer() {
+  const registered = new Map<string, RegisteredTool>();
+  const definitions = new Map<string, { description?: string }>();
+  const callbacks = new Map<string, (request: unknown) => Promise<any>>();
+  return {
+    registered,
+    definitions,
+    callbacks,
+    registerTool: vi.fn((name: string, definition: { description?: string }, callback) => {
+      const tool = {
+        update: vi.fn(),
+        remove: vi.fn(() => registered.delete(name)),
+        enable: vi.fn(),
+        disable: vi.fn(),
+        enabled: true,
+        handler: vi.fn(),
+      } as unknown as RegisteredTool;
+      registered.set(name, tool);
+      definitions.set(name, definition);
+      callbacks.set(name, callback);
+      return tool;
+    }),
+    connect: vi.fn(async () => {}),
+    close: vi.fn(async () => {}),
+  };
+}
diff --git a/packages/core/test/code-mode-runner.test.ts b/packages/core/test/code-mode-runner.test.ts
new file mode 100644
index 0000000..9c32153
--- /dev/null
+++ b/packages/core/test/code-mode-runner.test.ts
@@ -0,0 +1,139 @@
+import { mkdtempSync, rmSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { describe, expect, it, vi } from "vitest";
+import { runCodeMode } from "../src/code-mode/runner";
+import { CodeModeLogStore } from "../src/code-mode/logs";
+import type { NativeCapletTool, NativeCapletsService } from "../src/native/service";
+
+function service(): NativeCapletsService {
+  const tools: NativeCapletTool[] = [
+    {
+      caplet: "github",
+      toolName: "caplets_github",
+      title: "GitHub",
+      description: "GitHub repo operations.",
+      promptGuidance: [],
+    },
+  ];
+  return {
+    listTools: () => tools,
+    execute: vi.fn(async (capletId: string, request: unknown) => ({
+      ok: true,
+      capletId,
+      request,
+    })),
+    reload: vi.fn(async () => true),
+    onToolsChanged: vi.fn(() => () => undefined),
+    close: vi.fn(async () => undefined),
+  };
+}
+
+describe("runCodeMode", () => {
+  it("returns an ok envelope for JSON-serializable values", async () => {
+    const result = await runCodeMode({
+      code: "return { ok: true, count: 2 + 2 };",
+      service: service(),
+      runtimeScope: "test",
+    });
+
+    expect(result).toMatchObject({
+      ok: true,
+      value: { ok: true, count: 4 },
+      diagnostics: [],
+      meta: { timeoutMs: 10_000 },
+    });
+  });
+
+  it("blocks diagnostics before Caplet calls", async () => {
+    const native = service();
+    const result = await runCodeMode({
+      code: 'await caplets.github.call("listIssues", {});',
+      service: native,
+    });
+
+    expect(result.ok).toBe(false);
+    expect(result.diagnostics.some((diagnostic) => diagnostic.severity === "error")).toBe(true);
+    expect(native.execute).not.toHaveBeenCalled();
+  });
+
+  it("blocks direct fetch and imports", async () => {
+    const fetchResult = await runCodeMode({
+      code: 'return await fetch("https://example.com");',
+      service: service(),
+    });
+    const importResult = await runCodeMode({
+      code: 'return await import("node:fs");',
+      service: service(),
+    });
+
+    expect(fetchResult.ok).toBe(false);
+    expect(importResult.ok).toBe(false);
+    expect(fetchResult.diagnostics.map((diagnostic) => diagnostic.message).join("\n")).toContain(
+      "Cannot find name 'fetch'",
+    );
+    expect(importResult.diagnostics.map((diagnostic) => diagnostic.message).join("\n")).toContain(
+      "Imports are not available in Code Mode",
+    );
+  });
+
+  it("captures redacted logs and expands them through debug.readLogs", async () => {
+    const dir = mkdtempSync(join(tmpdir(), "caplets-code-mode-runner-"));
+    try {
+      const logStore = new CodeModeLogStore({
+        stateDir: dir,
+        now: () => new Date("2026-06-07T12:00:00.000Z"),
+      });
+      const result = await runCodeMode({
+        code: `
+          console.log("token", "Bearer secret-token-value", "ian@example.com");
+          return "done";
+        `,
+        service: service(),
+        logStore,
+      });
+
+      expect(result.ok).toBe(true);
+      expect(JSON.stringify(result)).not.toContain("secret-token-value");
+      expect(JSON.stringify(result)).not.toContain("ian@example.com");
+      expect(result.logs.stored).toBe(true);
+      expect(result.logs.logRef).toMatch(/^[a-f0-9]{48}$/u);
+      const expanded = await logStore.read({ logRef: result.logs.logRef ?? "", limit: 10 });
+      expect(expanded.entries).toMatchObject([
+        {
+          level: "log",
+          message: "token Bearer [REDACTED:token] [REDACTED:email]",
+        },
+      ]);
+    } finally {
+      rmSync(dir, { recursive: true, force: true });
+    }
+  });
+
+  it("routes Caplet callTool through NativeCapletsService.execute", async () => {
+    const native = service();
+    const result = await runCodeMode({
+      code: 'return await caplets.github.callTool("listIssues", { state: "open" });',
+      service: native,
+    });
+
+    expect(result.ok).toBe(true);
+    expect(native.execute).toHaveBeenCalledWith("github", {
+      operation: "call_tool",
+      name: "listIssues",
+      args: { state: "open" },
+    });
+  });
+
+  it("fails non-JSON return values with a structured serialization diagnostic", async () => {
+    const result = await runCodeMode({
+      code: "return 1n;",
+      service: service(),
+    });
+
+    expect(result.ok).toBe(false);
+    expect(result.diagnostics.map((diagnostic) => diagnostic.code)).toContain(
+      "SERIALIZATION_ERROR",
+    );
+  });
+});
diff --git a/packages/core/test/config.test.ts b/packages/core/test/config.test.ts
index d13a25c..a2eb248 100644
--- a/packages/core/test/config.test.ts
+++ b/packages/core/test/config.test.ts
@@ -67,6 +67,73 @@ describe("config", () => {
     rmSync(dir, { recursive: true, force: true });
   });
 
+  it("loads optional agent selection hints from JSON config", () => {
+    const config = parseConfig({
+      mcpServers: {
+        docs: {
+          name: "Docs",
+          description: "Search and read product documentation.",
+          command: "node",
+          useWhen: "Use for product documentation questions.",
+          avoidWhen: "Avoid for source-code search.",
+        },
+      },
+      httpApis: {
+        osv: {
+          name: "OSV",
+          description: "Query vulnerability data from OSV.",
+          baseUrl: "https://api.osv.dev",
+          auth: { type: "none" },
+          useWhen: "Use for package vulnerability lookups.",
+          actions: {
+            query_package_version: {
+              method: "POST",
+              path: "/v1/query",
+              useWhen: "Use when the task names one ecosystem, package, and version.",
+              avoidWhen: "Avoid for multi-package batch requests.",
+            },
+          },
+        },
+      },
+      cliTools: {
+        repo: {
+          name: "Repo",
+          description: "Run repository inspection commands.",
+          useWhen: "Use for local repository state.",
+          actions: {
+            status: {
+              command: "git",
+              args: ["status", "--short"],
+              useWhen: "Use for a concise working-tree status.",
+            },
+          },
+        },
+      },
+    });
+
+    expect(config.mcpServers.docs).toMatchObject({
+      useWhen: "Use for product documentation questions.",
+      avoidWhen: "Avoid for source-code search.",
+    });
+    expect(config.httpApis.osv).toMatchObject({
+      useWhen: "Use for package vulnerability lookups.",
+      actions: {
+        query_package_version: {
+          useWhen: "Use when the task names one ecosystem, package, and version.",
+          avoidWhen: "Avoid for multi-package batch requests.",
+        },
+      },
+    });
+    expect(config.cliTools.repo).toMatchObject({
+      useWhen: "Use for local repository state.",
+      actions: {
+        status: {
+          useWhen: "Use for a concise working-tree status.",
+        },
+      },
+    });
+  });
+
   it("loads project config when user config does not exist", () => {
     const dir = mkdtempSync(join(tmpdir(), "caplets-config-"));
     const projectConfigPath = join(dir, ".caplets", "config.json");
@@ -148,6 +215,48 @@ describe("config", () => {
     rmSync(dir, { recursive: true, force: true });
   });
 
+  it("loads optional agent selection hints from CAPLET.md frontmatter", () => {
+    const dir = mkdtempSync(join(tmpdir(), "caplets-hints-files-"));
+    writeFileSync(
+      join(dir, "osv.md"),
+      [
+        "---",
+        "name: OSV",
+        "description: Query vulnerability data from OSV.",
+        "useWhen: Use for package vulnerability lookups.",
+        "avoidWhen: Avoid for license or maintainer lookups.",
+        "httpApi:",
+        "  baseUrl: https://api.osv.dev",
+        "  auth:",
+        "    type: none",
+        "  actions:",
+        "    query_package_version:",
+        "      method: POST",
+        "      path: /v1/query",
+        "      useWhen: Use when the task names one ecosystem, package, and version.",
+        "      avoidWhen: Avoid for multi-package batch requests.",
+        "---",
+        "",
+        "# OSV",
+        "",
+      ].join("\n"),
+    );
+
+    const config = loadCapletFiles(dir);
+
+    expect(config?.httpApis?.osv).toMatchObject({
+      useWhen: "Use for package vulnerability lookups.",
+      avoidWhen: "Avoid for license or maintainer lookups.",
+      actions: {
+        query_package_version: {
+          useWhen: "Use when the task names one ecosystem, package, and version.",
+          avoidWhen: "Avoid for multi-package batch requests.",
+        },
+      },
+    });
+    rmSync(dir, { recursive: true, force: true });
+  });
+
   it("rejects setup commands that look like agent tools", () => {
     const root = mkdtempSync(join(tmpdir(), "caplets-setup-invalid-"));
     writeFileSync(
diff --git a/packages/core/test/doctor-cli.test.ts b/packages/core/test/doctor-cli.test.ts
index 1569564..4e4d1e2 100644
--- a/packages/core/test/doctor-cli.test.ts
+++ b/packages/core/test/doctor-cli.test.ts
@@ -17,6 +17,7 @@ describe("caplets doctor", () => {
     expect(report).toContain("Project sync");
     expect(report).toContain("Daemon");
     expect(report).toContain("Cloud Auth");
+    expect(report).toContain("Code Mode");
     expect(report).not.toContain("local presence");
   });
 
@@ -62,6 +63,14 @@ describe("caplets doctor", () => {
       sync: { state: "idle" },
       daemon: { running: false },
       cloudAuth: { authenticated: false },
+      codeMode: {
+        typesGeneration: { ok: true },
+        diagnostics: { ok: true },
+        sandboxSmoke: { ok: true },
+        logStorage: { ok: true },
+        callableIndex: { ok: true },
+        observedOutputShapes: { ok: true },
+      },
     });
   });
 });
diff --git a/packages/core/test/downstream.test.ts b/packages/core/test/downstream.test.ts
index 0050459..37da10f 100644
--- a/packages/core/test/downstream.test.ts
+++ b/packages/core/test/downstream.test.ts
@@ -25,6 +25,7 @@ describe("compact schema fingerprints", () => {
     const schema = {
       type: "object",
       properties: { value: { type: "string" }, count: { type: "number" } },
+      required: ["value"],
     };
 
     const first = manager.compact(server, { name: "first", inputSchema: schema } as Tool);
@@ -34,7 +35,12 @@ describe("compact schema fingerprints", () => {
       outputSchema: schema,
     } as Tool);
 
-    expect(first).toMatchObject({ hasInputSchema: true, hasOutputSchema: false });
+    expect(first).toMatchObject({
+      hasInputSchema: true,
+      hasOutputSchema: false,
+      requiredArgs: ["value"],
+      acceptedArgs: ["count", "value"],
+    });
     expect(second).toMatchObject({ hasInputSchema: true, hasOutputSchema: true });
     expect(first).not.toHaveProperty("inputSchemaHash");
     expect(second).not.toHaveProperty("outputSchemaHash");
@@ -53,6 +59,7 @@ describe("compact schema fingerprints", () => {
     } as Tool);
 
     expect(compact).toMatchObject({ hasInputSchema: true, hasOutputSchema: false });
+    expect(compact).toMatchObject({ acceptedArgs: ["a", "b"] });
     expect(compact).not.toHaveProperty("inputSchemaHash");
     expect(compact).not.toHaveProperty("outputSchemaHash");
   });
@@ -117,8 +124,8 @@ describe("downstream stdio lifecycle", () => {
         config.mcpServers.fixture!,
         {
           operation: "call_tool",
-          tool: "echo",
-          arguments: { message: "hello" },
+          name: "echo",
+          args: { message: "hello" },
           fields: ["message"],
         },
         registry,
@@ -282,7 +289,7 @@ describe("downstream stdio lifecycle", () => {
               JSON.stringify({
                 jsonrpc: "2.0",
                 id: message.id,
-                result: { tools: [{ name: "remote_echo", inputSchema: {} }] },
+                result: { tools: [{ name: "remote_echo", inputSchema: { type: "object" } }] },
               }),
             );
             return;
@@ -330,6 +337,100 @@ describe("downstream stdio lifecycle", () => {
       await new Promise<void>((resolve) => server.close(() => resolve()));
     }
   });
+
+  it("shares one in-flight remote connection across concurrent operations", async () => {
+    const releaseInitialize = deferred<void>();
+    let initializeCount = 0;
+    let toolsListCount = 0;
+    const server = createServer((request: IncomingMessage, response: ServerResponse) => {
+      let body = "";
+      request.setEncoding("utf8");
+      request.on("data", (chunk) => {
+        body += chunk;
+      });
+      request.on("end", () => {
+        void (async () => {
+          if (!body) {
+            response.statusCode = 202;
+            response.end();
+            return;
+          }
+          const message = JSON.parse(body) as { id?: number; method?: string };
+          response.setHeader("content-type", "application/json");
+          if (message.method === "initialize") {
+            initializeCount += 1;
+            await releaseInitialize.promise;
+            response.end(
+              JSON.stringify({
+                jsonrpc: "2.0",
+                id: message.id,
+                result: {
+                  protocolVersion: "2025-06-18",
+                  capabilities: { tools: {} },
+                  serverInfo: { name: "fixture-remote", version: "1.0.0" },
+                },
+              }),
+            );
+            return;
+          }
+          if (message.method === "tools/list") {
+            toolsListCount += 1;
+            response.end(
+              JSON.stringify({
+                jsonrpc: "2.0",
+                id: message.id,
+                result: { tools: [{ name: "remote_echo", inputSchema: { type: "object" } }] },
+              }),
+            );
+            return;
+          }
+          response.statusCode = 202;
+          response.end();
+        })().catch((error) => {
+          response.statusCode = 500;
+          response.end(String(error));
+        });
+      });
+    });
+
+    try {
+      await new Promise<void>((resolve) => server.listen(0, "127.0.0.1", resolve));
+      const address = server.address();
+      if (!address || typeof address === "string") {
+        throw new Error("Could not bind fixture server");
+      }
+      const config = parseConfig({
+        mcpServers: {
+          remote: {
+            name: "Remote",
+            description: "A useful remote server.",
+            transport: "http",
+            url: `http://127.0.0.1:${address.port}/mcp`,
+          },
+        },
+      });
+      const registry = new ServerRegistry(config);
+      const manager = new DownstreamManager(registry);
+      const check = manager.checkServer(config.mcpServers.remote!);
+      const list = manager.listTools(config.mcpServers.remote!);
+
+      await waitUntil(() => initializeCount === 1);
+      releaseInitialize.resolve();
+
+      const [checkResult, tools] = await Promise.all([check, list]);
+
+      expect(checkResult).toMatchObject({ id: "remote", status: "available", toolCount: 1 });
+      expect(tools.map((tool) => tool.name)).toEqual(["remote_echo"]);
+      expect(initializeCount).toBe(1);
+      expect(toolsListCount).toBeGreaterThanOrEqual(1);
+      expect(registry.getStatus("remote")).toBe("available");
+
+      await manager.close();
+    } finally {
+      releaseInitialize.resolve();
+      await new Promise<void>((resolve) => server.close(() => resolve()));
+    }
+  });
 });
 
 describe("downstream remote OAuth lifecycle", () => {
@@ -560,3 +661,13 @@ function deferred<T>(): {
   });
   return { promise, resolve, reject };
 }
+
+async function waitUntil(predicate: () => boolean): Promise<void> {
+  const started = Date.now();
+  while (!predicate()) {
+    if (Date.now() - started > 1_000) {
+      throw new Error("Timed out waiting for predicate");
+    }
+    await new Promise((resolve) => setTimeout(resolve, 5));
+  }
+}
diff --git a/packages/core/test/http-actions.test.ts b/packages/core/test/http-actions.test.ts
index 0889630..7d8d118 100644
--- a/packages/core/test/http-actions.test.ts
+++ b/packages/core/test/http-actions.test.ts
@@ -134,7 +134,7 @@ describe("HttpActionManager", () => {
     ]);
   });
 
-  it("exposes output schemas through get_tool, compact metadata, and call_tool.fields", async () => {
+  it("exposes output schemas through describe_tool, compact metadata, and call_tool.fields", async () => {
     requests.length = 0;
     const config = parseConfig({
       httpApis: {
@@ -176,15 +176,16 @@ describe("HttpActionManager", () => {
       properties: { body: { properties: { ok: { type: "boolean" } } } },
     });
     expect(http.compact(caplet, tool)).toMatchObject({
-      id: "http",
-      tool: "ping",
+      name: "ping",
       hasInputSchema: true,
       hasOutputSchema: true,
+      readOnlyHint: true,
+      destructiveHint: false,
     });
 
     const fetched = (await handleServerTool(
       caplet,
-      { operation: "get_tool", tool: "ping" },
+      { operation: "describe_tool", name: "ping" },
       registry,
       downstream,
       undefined,
@@ -197,7 +198,7 @@ describe("HttpActionManager", () => {
 
     const projected = (await handleServerTool(
       caplet,
-      { operation: "call_tool", tool: "ping", arguments: {}, fields: ["body.ok"] },
+      { operation: "call_tool", name: "ping", args: {}, fields: ["body.ok"] },
       registry,
       downstream,
       undefined,
diff --git a/packages/core/test/native-remote.test.ts b/packages/core/test/native-remote.test.ts
index be0f7b5..08ad550 100644
--- a/packages/core/test/native-remote.test.ts
+++ b/packages/core/test/native-remote.test.ts
@@ -436,7 +436,7 @@ describe("createNativeCapletsService remote mode", () => {
       writeErr,
     });
 
-    expect(service.listTools().map((tool) => tool.caplet)).toEqual(["local"]);
+    expect(configuredCapletIds(service.listTools())).toEqual(["local"]);
     expect(writeErr).toHaveBeenCalledTimes(1);
     expect(writeErr).toHaveBeenCalledWith(
       "Remote project binding unavailable; using local Caplets only. Run caplets doctor for details.\n",
@@ -467,7 +467,7 @@ describe("createNativeCapletsService remote mode", () => {
 
     await service.reload();
 
-    expect(service.listTools().map((tool) => [tool.caplet, tool.title])).toEqual([
+    expect(configuredCapletTitles(service.listTools())).toEqual([
       ["remote-only", "Remote Only"],
       ["shared", "Local Shared"],
       ["local-only", "Local Only"],
@@ -528,10 +528,7 @@ describe("createNativeCapletsService remote mode", () => {
     fixture.emit();
     await vi.waitFor(() => expect(listener).toHaveBeenCalledTimes(1));
 
-    expect(listener).toHaveBeenCalledWith([
-      expect.objectContaining({ caplet: "beta" }),
-      expect.objectContaining({ caplet: "local" }),
-    ]);
+    expect(configuredCapletIds(listener.mock.calls[0]?.[0] ?? [])).toEqual(["beta", "local"]);
     await expect(service.reload()).resolves.toBe(true);
     expect(listener).toHaveBeenCalledTimes(1);
     await service.close();
@@ -569,9 +566,9 @@ describe("createNativeCapletsService remote mode", () => {
     await expect(service.reload()).resolves.toBe(true);
 
     expect(listener).toHaveBeenCalledTimes(1);
-    expect(listener).toHaveBeenCalledWith([
-      expect.objectContaining({ caplet: "beta", title: "Beta" }),
-      expect.objectContaining({ caplet: "local", title: "Local Renamed" }),
+    expect(configuredCapletTitles(listener.mock.calls[0]?.[0] ?? [])).toEqual([
+      ["beta", "Beta"],
+      ["local", "Local Renamed"],
     ]);
     await service.close();
   });
@@ -603,10 +600,7 @@ describe("createNativeCapletsService remote mode", () => {
 
     await expect(service.reload()).resolves.toBe(true);
 
-    expect(secondListener).toHaveBeenCalledWith([
-      expect.objectContaining({ caplet: "beta" }),
-      expect.objectContaining({ caplet: "local" }),
-    ]);
+    expect(configuredCapletIds(secondListener.mock.calls[0]?.[0] ?? [])).toEqual(["beta", "local"]);
     expect(writeErr).toHaveBeenCalledWith(
       expect.stringContaining("Caplets tools-changed listener failed"),
     );
@@ -641,7 +635,7 @@ describe("createNativeCapletsService remote mode", () => {
 
     await expect(service.reload()).resolves.toBe(false);
 
-    expect(service.listTools().map((tool) => [tool.caplet, tool.title])).toEqual([
+    expect(configuredCapletTitles(service.listTools())).toEqual([
       ["alpha", "Alpha"],
       ["local", "Local"],
     ]);
@@ -674,7 +668,7 @@ describe("createNativeCapletsService remote mode", () => {
 
     await expect(service.reload()).resolves.toBe(true);
 
-    expect(service.listTools().map((tool) => tool.caplet)).toEqual(["remote", "local"]);
+    expect(configuredCapletIds(service.listTools())).toEqual(["remote", "local"]);
     expect(writeErr).toHaveBeenCalledWith(expect.stringContaining("Caplets local overlay warning"));
     await service.close();
   });
@@ -697,7 +691,7 @@ describe("createNativeCapletsService remote mode", () => {
 
     await service.reload();
 
-    expect(service.listTools().map((tool) => tool.caplet)).toEqual(["remote"]);
+    expect(configuredCapletIds(service.listTools())).toEqual(["remote"]);
     expect(writeErr).toHaveBeenCalledWith(expect.stringContaining("Caplets local overlay warning"));
     await service.close();
   });
@@ -770,7 +764,7 @@ describe("createNativeCapletsService remote mode", () => {
 
     await expect(service.reload()).resolves.toBe(true);
 
-    expect(service.listTools().map((tool) => tool.caplet)).toEqual(["remote", "local"]);
+    expect(configuredCapletIds(service.listTools())).toEqual(["remote", "local"]);
     expect(writeErr).toHaveBeenCalledWith(expect.stringContaining(badCapletPath));
     await service.close();
   });
@@ -937,3 +931,11 @@ function tempConfig(config: unknown) {
   writeFileSync(projectConfigPath, JSON.stringify({}), "utf8");
   return { dir, configPath, projectConfigPath };
 }
+
+function configuredCapletIds(tools: Array<{ caplet: string }>): string[] {
+  return tools.map((tool) => tool.caplet).filter((caplet) => caplet !== "run");
+}
+
+function configuredCapletTitles(tools: Array<{ caplet: string; title: string }>): string[][] {
+  return tools.filter((tool) => tool.caplet !== "run").map((tool) => [tool.caplet, tool.title]);
+}
diff --git a/packages/core/test/native.test.ts b/packages/core/test/native.test.ts
index 4e301ef..bcea49e 100644
--- a/packages/core/test/native.test.ts
+++ b/packages/core/test/native.test.ts
@@ -48,14 +48,25 @@ describe("native Caplets service", () => {
     const service = createNativeCapletsService({ configPath, projectConfigPath });
 
     try {
-      expect(service.listTools()).toEqual([
-        expect.objectContaining({
-          caplet: "git-hub",
-          toolName: "caplets_git_hub",
-          title: "GitHub",
-        }),
-      ]);
-      expect(service.listTools()[0]?.description).toContain("Native tool name: caplets_git_hub");
+      expect(service.listTools()).toEqual(
+        expect.arrayContaining([
+          expect.objectContaining({
+            caplet: "git-hub",
+            toolName: "caplets_git_hub",
+            title: "GitHub",
+          }),
+          expect.objectContaining({
+            caplet: "run",
+            toolName: "caplets_run",
+            title: "Code Mode",
+          }),
+        ]),
+      );
+      const githubTool = service.listTools().find((tool) => tool.caplet === "git-hub");
+      expect(githubTool?.description).toContain("Native tool name: caplets_git_hub");
+      expect(githubTool?.inputSchema).toMatchObject({
+        properties: expect.objectContaining({ fields: expect.anything() }),
+      });
     } finally {
       await service.close();
     }
@@ -113,9 +124,11 @@ describe("native Caplets service", () => {
 
     expect(guidance).toContain("caplets_linear_api__v2");
     expect(guidance).toContain("Flow: inspect when the domain is unfamiliar");
-    expect(guidance).toContain(
-      "Use fields on call_tool when a non-GraphQL downstream outputSchema allows",
-    );
+    expect(guidance).toContain("exact inputSchema property names");
+    expect(guidance).toContain("Do not guess downstream tool names");
+    expect(guidance).toContain("Do not infer input/output schemas");
+    expect(guidance).toContain("avoid broad provider searches");
+    expect(guidance).toContain("follow its fieldSelection hint");
   });
 
   it("builds concise per-Caplet prompt guidance with safe discovery", () => {
@@ -133,6 +146,9 @@ describe("native Caplets service", () => {
     }).join("\n");
 
     expect(guidance).toContain("Use caplets_browser for the Browser Caplet capability domain.");
+    expect(guidance).toContain("Use describe_tool before call_tool when args matter");
+    expect(guidance).toContain("call_tool.args must match inputSchema exactly");
+    expect(guidance).toContain("Do not guess tool names or schemas");
     expect(guidance).not.toContain("For unfamiliar tasks, discover safely");
     expect(guidance).not.toContain("Call caplets_browser with operation inspect before");
   });
@@ -151,7 +167,7 @@ describe("native Caplets service", () => {
     const service = createNativeCapletsService({ configPath, projectConfigPath, watch: false });
 
     try {
-      expect(service.listTools().map((tool) => tool.caplet)).toEqual(["alpha"]);
+      expect(configuredCapletIds(service.listTools())).toEqual(["alpha"]);
       writeFileSync(
         configPath,
         JSON.stringify({
@@ -166,9 +182,7 @@ describe("native Caplets service", () => {
       );
 
       await expect(service.reload()).resolves.toBe(true);
-      expect(service.listTools()).toEqual([
-        expect.objectContaining({ caplet: "beta", toolName: "caplets_beta", title: "Beta" }),
-      ]);
+      expect(configuredCapletIds(service.listTools())).toEqual(["beta"]);
     } finally {
       await service.close();
     }
@@ -194,7 +208,7 @@ describe("native Caplets service", () => {
     });
     const events: string[][] = [];
     const unsubscribe = service.onToolsChanged((tools) => {
-      events.push(tools.map((tool) => tool.caplet));
+      events.push(configuredCapletIds(tools));
     });
 
     try {
@@ -263,7 +277,7 @@ describe("native Caplets service", () => {
       };
     const events: string[][] = [];
     service.onToolsChanged((tools) => {
-      events.push(tools.map((tool) => tool.caplet));
+      events.push(configuredCapletIds(tools));
     });
 
     try {
@@ -307,7 +321,7 @@ describe("native Caplets service", () => {
     });
     const events: string[][] = [];
     service.onToolsChanged((tools) => {
-      events.push(tools.map((tool) => tool.caplet));
+      events.push(configuredCapletIds(tools));
     });
 
     try {
@@ -351,3 +365,7 @@ describe("native Caplets service", () => {
 async function watcherReady(): Promise<void> {
   await new Promise((resolve) => setTimeout(resolve, 100));
 }
+
+function configuredCapletIds(tools: Array<{ caplet: string }>): string[] {
+  return tools.map((tool) => tool.caplet).filter((caplet) => caplet !== "run");
+}
diff --git a/packages/core/test/observed-output-shapes.test.ts b/packages/core/test/observed-output-shapes.test.ts
new file mode 100644
index 0000000..c2661e9
--- /dev/null
+++ b/packages/core/test/observed-output-shapes.test.ts
@@ -0,0 +1,178 @@
+import { mkdtempSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { describe, expect, it } from "vitest";
+import { parseConfig } from "../src/config";
+import { defaultObservedOutputShapeCacheDir } from "../src/config/paths";
+import {
+  backendFingerprint,
+  FileObservedOutputShapeStore,
+  mergeJsonShapes,
+  observeOutputShape,
+  observedOutputShapeKey,
+  parseShapeableJsonText,
+  shapeToTypeScript,
+} from "../src/observed-output-shapes";
+
+describe("Observed Output Shapes", () => {
+  it("extracts structure without storing primitive values", () => {
+    const observed = observeOutputShape({
+      value: {
+        issues: [
+          {
+            number: 2,
+            title: "secret issue title",
+            token: "ghp_secret",
+            nested: { email: "person@example.com" },
+          },
+        ],
+      },
+    });
+
+    expect(observed).toMatchObject({
+      version: 1,
+      source: "observed",
+      sampleCount: 1,
+      jsonShape: { kind: "object" },
+    });
+    expect(observed?.typeScript).toContain("issues?:");
+    const serialized = JSON.stringify(observed);
+    expect(serialized).not.toContain("secret issue title");
+    expect(serialized).not.toContain("ghp_secret");
+    expect(serialized).not.toContain("person@example.com");
+  });
+
+  it("ignores primitive roots and parses only JSON text objects or arrays", () => {
+    expect(observeOutputShape({ value: "ok" })).toBeUndefined();
+    expect(parseShapeableJsonText({ content: [{ type: "text", text: "true" }] })).toBeUndefined();
+    expect(parseShapeableJsonText({ content: [{ type: "text", text: "123" }] })).toBeUndefined();
+    expect(
+      parseShapeableJsonText({ content: [{ type: "text", text: "# heading" }] }),
+    ).toBeUndefined();
+    expect(
+      parseShapeableJsonText({ content: [{ type: "text", text: '{"items":[{"id":1}]}' }] }),
+    ).toEqual({ items: [{ id: 1 }] });
+  });
+
+  it("merges conservatively with optional fields and bounded unions", () => {
+    const first = observeOutputShape({ value: { id: "1", issue: { number: 1 } } });
+    const second = observeOutputShape({
+      value: { id: 2, issue: { title: "Issue" }, pull: { number: 3 } },
+      existing: first,
+    });
+
+    expect(second?.typeScript).toContain("id?: number | string");
+    expect(second?.typeScript).toContain("issue?:");
+    expect(second?.typeScript).toContain("number?: number");
+    expect(second?.typeScript).toContain("title?: string");
+    expect(second?.typeScript).toContain("pull?:");
+  });
+
+  it("collapses over-wide unions and truncates wide objects", () => {
+    const union = mergeJsonShapes(
+      {
+        kind: "union",
+        variants: [{ kind: "string" }, { kind: "number" }, { kind: "boolean" }, { kind: "null" }],
+      },
+      { kind: "array" },
+    );
+    expect(union).toEqual({ kind: "unknown" });
+
+    const wide = Object.fromEntries(
+      Array.from({ length: 45 }, (_, index) => [`field_${index}`, index]),
+    );
+    const observed = observeOutputShape({ value: wide });
+    if (!observed || observed.jsonShape.kind !== "object") throw new Error("expected object shape");
+    expect(observed?.truncated).toBe(true);
+    expect(Object.keys(observed.jsonShape.fields)).toHaveLength(40);
+  });
+
+  it("emits compact TypeScript and falls back to unknown when too large", () => {
+    const emitted = shapeToTypeScript(
+      {
+        kind: "object",
+        fields: {
+          "not-valid-js": { optional: true, shape: { kind: "string" } },
+        },
+      },
+      "ObservedOutput",
+    );
+    expect(emitted.typeScript).toBe('type ObservedOutput = { "not-valid-js"?: string; };');
+
+    const tiny = shapeToTypeScript(
+      { kind: "object", fields: { a: { optional: true, shape: { kind: "string" } } } },
+      "ObservedOutput",
+      10,
+    );
+    expect(tiny).toEqual({ typeScript: "type ObservedOutput = unknown;", truncated: true });
+  });
+
+  it("builds non-secret backend fingerprints and cache keys without input args", () => {
+    const config = parseConfig({
+      mcpServers: {
+        github: {
+          name: "GitHub",
+          description: "GitHub repo ops",
+          command: "github-mcp",
+          args: ["stdio"],
+          env: { GH_TOKEN: "secret" },
+        },
+      },
+    });
+    const caplet = config.mcpServers.github!;
+    const fingerprint = backendFingerprint(caplet);
+    expect(fingerprint).not.toContain("secret");
+
+    const key = observedOutputShapeKey({
+      scope: "local",
+      caplet,
+      toolName: "list_issues",
+      projectFingerprint: "project-a",
+    });
+    expect(key).toMatchObject({
+      capletId: "github",
+      backendKind: "mcp",
+      toolName: "list_issues",
+      projectFingerprint: "project-a",
+      resultVersion: 1,
+    });
+    expect(JSON.stringify(key)).not.toContain("GH_TOKEN");
+  });
+
+  it("stores, expires, and prunes filesystem cache entries", async () => {
+    const dir = mkdtempSync(join(tmpdir(), "caplets-observed-shapes-"));
+    const ttlMs = 1_000;
+    const store = new FileObservedOutputShapeStore(dir, { ttlMs, maxEntries: 1 });
+    const config = parseConfig({
+      mcpServers: { alpha: { name: "Alpha", description: "Alpha tools.", command: "node" } },
+    });
+    const key = observedOutputShapeKey({
+      scope: "local",
+      caplet: config.mcpServers.alpha!,
+      toolName: "read",
+    });
+    const shape = observeOutputShape({ value: { items: [{ id: 1 }] } })!;
+
+    await store.write(key, shape);
+    await expect(store.read(key)).resolves.toMatchObject({ sampleCount: 1 });
+    await store.prune(new Date(Date.now() + ttlMs + 1));
+    await expect(store.read(key)).resolves.toBeUndefined();
+    await expect(store.health()).resolves.toMatchObject({ readable: true, writable: true });
+  });
+
+  it("uses platform cache conventions for result shapes", () => {
+    expect(
+      defaultObservedOutputShapeCacheDir({ XDG_CACHE_HOME: "/tmp/cache" }, "/home/alice", "linux"),
+    ).toBe("/tmp/cache/caplets/result-shapes");
+    expect(defaultObservedOutputShapeCacheDir({}, "/Users/alice", "darwin")).toBe(
+      "/Users/alice/Library/Caches/caplets/result-shapes",
+    );
+    expect(
+      defaultObservedOutputShapeCacheDir(
+        { LOCALAPPDATA: "C:\\Users\\Alice\\AppData\\Local" },
+        "C:\\Users\\Alice",
+        "win32",
+      ),
+    ).toBe("C:\\Users\\Alice\\AppData\\Local\\caplets\\cache\\result-shapes");
+  });
+});
diff --git a/packages/core/test/openapi.test.ts b/packages/core/test/openapi.test.ts
index 83844dc..9ca95c3 100644
--- a/packages/core/test/openapi.test.ts
+++ b/packages/core/test/openapi.test.ts
@@ -179,23 +179,27 @@ describe("native OpenAPI Caplets", () => {
     try {
       const list = (await handleServerTool(
         caplet,
-        { operation: "list_tools" },
+        { operation: "tools" },
         registry,
         downstream,
         openapi,
       )) as any;
       expect(
-        list.structuredContent.result.tools.map((tool: { tool: string }) => tool.tool),
+        list.structuredContent.result.items.map((tool: { name: string }) => tool.name),
       ).toEqual(["createUser", "GET /users/{id}"]);
       expect(
-        list.structuredContent.result.tools.find(
-          (candidate: { tool: string }) => candidate.tool === "GET /users/{id}",
+        list.structuredContent.result.items.find(
+          (candidate: { name: string }) => candidate.name === "GET /users/{id}",
         ),
-      ).toMatchObject({ hasOutputSchema: true });
+      ).toMatchObject({
+        hasOutputSchema: true,
+        readOnlyHint: true,
+        destructiveHint: false,
+      });
 
       const tool = (await handleServerTool(
         caplet,
-        { operation: "get_tool", tool: "GET /users/{id}" },
+        { operation: "describe_tool", name: "GET /users/{id}" },
         registry,
         downstream,
         openapi,
@@ -239,8 +243,8 @@ describe("native OpenAPI Caplets", () => {
         caplet,
         {
           operation: "call_tool",
-          tool: "GET /users/{id}",
-          arguments: { path: { id: "42" }, query: { active: true } },
+          name: "GET /users/{id}",
+          args: { path: { id: "42" }, query: { active: true } },
         },
         registry,
         downstream,
@@ -255,8 +259,8 @@ describe("native OpenAPI Caplets", () => {
         caplet,
         {
           operation: "call_tool",
-          tool: "GET /users/{id}",
-          arguments: { path: { id: "42" }, query: { active: true } },
+          name: "GET /users/{id}",
+          args: { path: { id: "42" }, query: { active: true } },
           fields: ["body.name"],
         },
         registry,
@@ -269,8 +273,8 @@ describe("native OpenAPI Caplets", () => {
         caplet,
         {
           operation: "call_tool",
-          tool: "createUser",
-          arguments: { body: { name: "Ada" } },
+          name: "createUser",
+          args: { body: { name: "Ada" } },
         },
         registry,
         downstream,
@@ -285,8 +289,8 @@ describe("native OpenAPI Caplets", () => {
           caplet,
           {
             operation: "call_tool",
-            tool: "createUser",
-            arguments: { body: { name: "Ada" } },
+            name: "createUser",
+            args: { body: { name: "Ada" } },
             fields: ["body.created"],
           },
           registry,
@@ -644,7 +648,7 @@ describe("native OpenAPI Caplets", () => {
     try {
       const tool = (await handleServerTool(
         caplet,
-        { operation: "get_tool", tool: "schemaLess" },
+        { operation: "describe_tool", name: "schemaLess" },
         registry,
         downstream,
         openapi,
@@ -655,7 +659,7 @@ describe("native OpenAPI Caplets", () => {
       await expect(
         handleServerTool(
           caplet,
-          { operation: "call_tool", tool: "schemaLess", arguments: {}, fields: ["body"] },
+          { operation: "call_tool", name: "schemaLess", args: {}, fields: ["body"] },
           registry,
           downstream,
           openapi,
diff --git a/packages/core/test/project-binding-integration.test.ts b/packages/core/test/project-binding-integration.test.ts
index 59d2162..419af97 100644
--- a/packages/core/test/project-binding-integration.test.ts
+++ b/packages/core/test/project-binding-integration.test.ts
@@ -94,7 +94,7 @@ describe("Project Binding integration", () => {
     });
 
     await service.reload();
-    expect(service.listTools().map((tool) => [tool.caplet, tool.title])).toEqual([
+    expect(configuredCapletTitles(service.listTools())).toEqual([
       ["deploy", "Remote Deploy"],
       ["build", "Local Build"],
     ]);
@@ -121,3 +121,7 @@ function remoteClientFixture(
     close: vi.fn(async () => undefined),
   };
 }
+
+function configuredCapletTitles(tools: Array<{ caplet: string; title: string }>): string[][] {
+  return tools.filter((tool) => tool.caplet !== "run").map((tool) => [tool.caplet, tool.title]);
+}
diff --git a/packages/core/test/registry.test.ts b/packages/core/test/registry.test.ts
index 4f9ebd6..11d24bf 100644
--- a/packages/core/test/registry.test.ts
+++ b/packages/core/test/registry.test.ts
@@ -11,6 +11,8 @@ describe("registry", () => {
           name: "Enabled Server",
           description: "A useful enabled server.",
           command: "node",
+          useWhen: "Use for enabled test workflows.",
+          avoidWhen: "Avoid for disabled server checks.",
           args: ["secret-arg", "$env:SECRET_TOKEN"],
           env: { SECRET_TOKEN: "$env:SECRET_TOKEN" },
           auth: undefined,
@@ -88,12 +90,23 @@ describe("registry", () => {
     expect(registry.get("status")?.backend).toBe("http");
     const description = capabilityDescription(config.mcpServers.enabled!);
     expect(description).toContain("Enabled Server");
+    expect(description).toContain("Use when: Use for enabled test workflows.");
+    expect(description).toContain("Avoid when: Avoid for disabled server checks.");
     expect(description).toContain("Use inspect for details when needed");
+    expect(description).toContain("use describe_tool before call_tool when args matter");
+    expect(description).toContain("call_tool.args must match inputSchema exactly");
+    expect(description).toContain("do not guess tool names or schemas");
+    expect(description).toContain("Resources/prompts/completions may exist");
     expect(description).not.toContain("Recommended flow:");
     expect(description).not.toContain("secret-arg");
     expect(description).not.toContain("secret-env-value");
 
     const remoteDetail = registry.detail(config.mcpServers.remote!);
+    const enabledDetail = registry.detail(config.mcpServers.enabled!);
+    expect(enabledDetail).toMatchObject({
+      useWhen: "Use for enabled test workflows.",
+      avoidWhen: "Avoid for disabled server checks.",
+    });
     const serialized = JSON.stringify(remoteDetail);
     expect(serialized).toContain('"transport":"http"');
     expect(serialized).not.toContain("secret-url-value");
@@ -101,6 +114,8 @@ describe("registry", () => {
 
     const openApiDescription = capabilityDescription(config.openapiEndpoints.users!);
     expect(openApiDescription).toContain("Use inspect for details when needed");
+    expect(openApiDescription).toContain("call_tool.args must match inputSchema exactly");
+    expect(openApiDescription).toContain("do not guess tool names or schemas");
     const openApiDetail = registry.detail(config.openapiEndpoints.users!);
     expect(openApiDetail).toEqual({
       id: "users",
@@ -118,6 +133,7 @@ describe("registry", () => {
 
     const graphQlDescription = capabilityDescription(config.graphqlEndpoints.catalog!);
     expect(graphQlDescription).toContain("Use inspect for details when needed");
+    expect(graphQlDescription).toContain("use describe_tool before call_tool when args matter");
     const graphQlDetail = registry.detail(config.graphqlEndpoints.catalog!);
     expect(graphQlDetail).toEqual({
       id: "catalog",
@@ -136,6 +152,7 @@ describe("registry", () => {
 
     const httpDescription = capabilityDescription(config.httpApis.status!);
     expect(httpDescription).toContain("Use inspect for details when needed");
+    expect(httpDescription).toContain("use tools/search_tools to discover downstream operations");
     const httpDetail = registry.detail(config.httpApis.status!);
     expect(httpDetail).toEqual({
       id: "status",
@@ -152,6 +169,7 @@ describe("registry", () => {
 
     const cliDescription = capabilityDescription(config.cliTools.repo!);
     expect(cliDescription).toContain("Use inspect for details when needed");
+    expect(cliDescription).toContain("call_tool.args must match inputSchema exactly");
     const cliDetail = registry.detail(config.cliTools.repo!);
     expect(cliDetail).toEqual({
       id: "repo",
@@ -168,6 +186,7 @@ describe("registry", () => {
 
     const capletSetDescription = capabilityDescription(config.capletSets.nested!);
     expect(capletSetDescription).toContain("Use inspect for details when needed");
+    expect(capletSetDescription).toContain("use describe_tool before call_tool when args matter");
     const capletSetDetail = registry.detail(config.capletSets.nested!);
     expect(capletSetDetail).toEqual({
       id: "nested",
diff --git a/packages/core/test/remote-control-client.test.ts b/packages/core/test/remote-control-client.test.ts
index 532701f..9925552 100644
--- a/packages/core/test/remote-control-client.test.ts
+++ b/packages/core/test/remote-control-client.test.ts
@@ -51,7 +51,7 @@ describe("RemoteControlClient", () => {
         }),
     });
 
-    await expect(client.request("get_tool", { tool: "missing" })).rejects.toMatchObject({
+    await expect(client.request("describe_tool", { name: "missing" })).rejects.toMatchObject({
       code: "TOOL_NOT_FOUND",
       message: "Tool missing",
       details: { nextAction: "run_caplets_list_tools" },
diff --git a/packages/core/test/remote-control-dispatch.test.ts b/packages/core/test/remote-control-dispatch.test.ts
index 93c5ba2..5b8a2a7 100644
--- a/packages/core/test/remote-control-dispatch.test.ts
+++ b/packages/core/test/remote-control-dispatch.test.ts
@@ -80,7 +80,7 @@ describe("dispatchRemoteCliRequest", () => {
       structuredContent: {
         result: {
           query: "check",
-          tools: [expect.objectContaining({ tool: "check" })],
+          items: [expect.objectContaining({ name: "check" })],
         },
       },
     });
@@ -90,7 +90,10 @@ describe("dispatchRemoteCliRequest", () => {
     const context = testContext();
 
     const response = await dispatchRemoteCliRequest(
-      { command: "get_tool", arguments: { caplet: "server_status", request: { tool: "check" } } },
+      {
+        command: "describe_tool",
+        arguments: { caplet: "server_status", request: { name: "check" } },
+      },
       context,
     );
 
@@ -111,7 +114,7 @@ describe("dispatchRemoteCliRequest", () => {
         command: "call_tool",
         arguments: {
           caplet: "server_status",
-          request: { operation: "get_tool", tool: "check", arguments: {} },
+          request: { operation: "describe_tool", name: "check", arguments: {} },
         },
       },
       context,
diff --git a/packages/core/test/runtime.test.ts b/packages/core/test/runtime.test.ts
index d5869c4..a6ed125 100644
--- a/packages/core/test/runtime.test.ts
+++ b/packages/core/test/runtime.test.ts
@@ -36,7 +36,8 @@ describe("CapletsRuntime", () => {
     const runtime = new CapletsRuntime({ configPath, projectConfigPath, server });
 
     expect(runtime.registeredToolIds()).toEqual(["alpha"]);
-    expect(server.registerTool).toHaveBeenCalledTimes(1);
+    expect(server.registerTool).toHaveBeenCalledTimes(2);
+    expect(server.registered.get("run")).toBeDefined();
 
     await runtime.close();
   });
diff --git a/packages/core/test/serve-session.test.ts b/packages/core/test/serve-session.test.ts
index 104ed66..5ed10b6 100644
--- a/packages/core/test/serve-session.test.ts
+++ b/packages/core/test/serve-session.test.ts
@@ -28,7 +28,15 @@ describe("CapletsMcpSession", () => {
     const session = new CapletsMcpSession(engine, { server });
 
     expect(session.registeredToolIds()).toEqual(["alpha"]);
-    expect(server.registerTool).toHaveBeenCalledTimes(1);
+    expect(server.registerTool).toHaveBeenCalledTimes(2);
+    expect(server.registered.get("run")).toBeDefined();
+    expect(server.registerTool).toHaveBeenCalledWith(
+      "alpha",
+      expect.objectContaining({
+        inputSchema: expect.objectContaining({ fields: expect.anything() }),
+      }),
+      expect.any(Function),
+    );
 
     await session.close();
     await engine.close();
@@ -45,6 +53,7 @@ describe("CapletsMcpSession", () => {
     const server = mockServer();
     const session = new CapletsMcpSession(engine, { server });
     const alpha = server.registered.get("alpha")!;
+    const run = server.registered.get("run")!;
 
     writeConfig(configPath, {
       httpApis: {
@@ -60,6 +69,16 @@ describe("CapletsMcpSession", () => {
     await engine.reload();
 
     expect(alpha.remove).toHaveBeenCalledTimes(1);
+    expect(run.update).toHaveBeenCalledWith(
+      expect.objectContaining({
+        description: expect.stringContaining('gamma:CapletHandle<"gamma">'),
+      }),
+    );
+    expect(run.update).toHaveBeenCalledWith(
+      expect.not.objectContaining({
+        description: expect.stringContaining('alpha:CapletHandle<"alpha">'),
+      }),
+    );
     expect(session.registeredToolIds()).toEqual(["gamma"]);
     expect(server.registered.get("gamma")).toBeDefined();
 
diff --git a/packages/core/test/tools.test.ts b/packages/core/test/tools.test.ts
index 06548b6..976ae56 100644
--- a/packages/core/test/tools.test.ts
+++ b/packages/core/test/tools.test.ts
@@ -7,6 +7,11 @@ import { CapletsError } from "../src/errors";
 import type { GraphQLManager, GraphqlEndpointConfig } from "../src/graphql";
 import type { HttpActionManager } from "../src/http-actions";
 import type { OpenApiManager } from "../src/openapi";
+import type {
+  ObservedOutputShape,
+  ObservedOutputShapeKey,
+  ObservedOutputShapeStore,
+} from "../src/observed-output-shapes";
 import { ServerRegistry } from "../src/registry";
 import {
   generatedToolInputSchema,
@@ -18,14 +23,14 @@ import {
 
 describe("generated tool request validation", () => {
   it("rejects operation-specific extra fields", () => {
-    expect(() => validateOperationRequest({ operation: "list_tools", tool: "x" }, 50)).toThrow(
+    expect(() => validateOperationRequest({ operation: "tools", tool: "x" }, 50)).toThrow(
       CapletsError,
     );
     expect(() =>
-      validateOperationRequest({ operation: "get_tool", query: "x", tool: "x" }, 50),
+      validateOperationRequest({ operation: "describe_tool", query: "x", tool: "x" }, 50),
     ).toThrow(CapletsError);
     expect(() =>
-      validateOperationRequest({ operation: "call_tool", tool: "x", arguments: [] }, 50),
+      validateOperationRequest({ operation: "call_tool", name: "x", args: [] }, 50),
     ).toThrow(CapletsError);
   });
 
@@ -34,72 +39,68 @@ describe("generated tool request validation", () => {
       operation: "search_tools",
       query: "read",
     });
-    expect(() =>
+    expect(
       validateOperationRequest({ operation: "search_tools", query: "read", limit: 51 }, 50),
-    ).toThrow(CapletsError);
-    expect(() => validateOperationRequest({ operation: "call_tool", arguments: {} }, 50)).toThrow(
+    ).toEqual({ operation: "search_tools", query: "read", limit: 51 });
+    expect(() => validateOperationRequest({ operation: "call_tool", args: {} }, 50)).toThrow(
       CapletsError,
     );
   });
 
-  it("validates list_tools limit", () => {
-    expect(validateOperationRequest({ operation: "list_tools", limit: 2 }, 50)).toEqual({
-      operation: "list_tools",
+  it("accepts tools pagination input without hard limit failures", () => {
+    expect(validateOperationRequest({ operation: "tools", limit: 2 }, 50)).toEqual({
+      operation: "tools",
       limit: 2,
     });
-    expect(() => validateOperationRequest({ operation: "list_tools", limit: 51 }, 50)).toThrow(
-      CapletsError,
-    );
+    expect(validateOperationRequest({ operation: "tools", limit: 51, cursor: "10" }, 50)).toEqual({
+      operation: "tools",
+      limit: 51,
+      cursor: "10",
+    });
   });
 
   it("accepts top-level field selection only for call_tool", () => {
     expect(
       validateOperationRequest(
-        { operation: "call_tool", tool: "read", arguments: {}, fields: ["body.name"] },
+        { operation: "call_tool", name: "read", args: {}, fields: ["body.name"] },
         50,
       ),
     ).toEqual({
       operation: "call_tool",
-      tool: "read",
-      arguments: {},
+      name: "read",
+      args: {},
       fields: ["body.name"],
     });
     expect(() =>
-      validateOperationRequest({ operation: "get_tool", tool: "read", fields: ["body.name"] }, 50),
+      validateOperationRequest(
+        { operation: "describe_tool", name: "read", fields: ["body.name"] },
+        50,
+      ),
     ).toThrow(CapletsError);
   });
 
   it("rejects invalid top-level field selections", () => {
     expect(() =>
-      validateOperationRequest(
-        { operation: "call_tool", tool: "read", arguments: {}, fields: [] },
-        50,
-      ),
+      validateOperationRequest({ operation: "call_tool", name: "read", args: {}, fields: [] }, 50),
     ).toThrow(CapletsError);
     expect(() =>
       validateOperationRequest(
-        { operation: "call_tool", tool: "read", arguments: {}, fields: [""] },
+        { operation: "call_tool", name: "read", args: {}, fields: [""] },
         50,
       ),
     ).toThrow(CapletsError);
     expect(() =>
-      validateOperationRequest(
-        { operation: "call_tool", tool: "read", arguments: {}, fields: [1] },
-        50,
-      ),
+      validateOperationRequest({ operation: "call_tool", name: "read", args: {}, fields: [1] }, 50),
     ).toThrow(CapletsError);
   });
 
   it("treats arguments.fields as downstream input", () => {
     expect(
-      validateOperationRequest(
-        { operation: "call_tool", tool: "read", arguments: { fields: [] } },
-        50,
-      ),
+      validateOperationRequest({ operation: "call_tool", name: "read", args: { fields: [] } }, 50),
     ).toEqual({
       operation: "call_tool",
-      tool: "read",
-      arguments: { fields: [] },
+      name: "read",
+      args: { fields: [] },
     });
   });
 
@@ -125,25 +126,25 @@ describe("generated tool request validation", () => {
 
     expect(schema.properties.operation?.enum).toEqual([
       "inspect",
-      "check_backend",
-      "list_tools",
+      "check",
+      "tools",
       "search_tools",
-      "get_tool",
+      "describe_tool",
       "call_tool",
     ]);
   });
 
   it("returns Markdown wrapper content while preserving structured result", () => {
-    const result = jsonResult({ id: "alpha", tools: [{ tool: "read" }, { tool: "write" }] });
+    const result = jsonResult({ id: "alpha", items: [{ name: "read" }, { name: "write" }] });
 
     expect(result.structuredContent).toEqual({
-      result: { id: "alpha", tools: [{ tool: "read" }, { tool: "write" }] },
+      result: { id: "alpha", items: [{ name: "read" }, { name: "write" }] },
     });
     const text = result.content[0]?.type === "text" ? result.content[0].text : "";
     expect(text).toContain("# Result");
     expect(text).toContain("## Full Result");
-    expect(text).toContain('"tool": "read"');
-    expect(text).toContain('"tool": "write"');
+    expect(text).toContain('"name": "read"');
+    expect(text).toContain('"name": "write"');
   });
 
   it("describes the nested call_tool argument shape to agents", () => {
@@ -152,21 +153,23 @@ describe("generated tool request validation", () => {
     };
 
     const operationDescription = schema.properties.operation?.description;
-    const toolDescription = schema.properties.tool?.description;
-    const argumentsDescription = schema.properties.arguments?.description;
+    const toolDescription = schema.properties.name?.description;
+    const argumentsDescription = schema.properties.args?.description;
     const fieldsDescription = schema.properties.fields?.description;
 
     expect(operationDescription).toContain("call_tool");
-    expect(toolDescription).toContain("Exact downstream tool name");
-    expect(argumentsDescription).toContain("arguments");
-    expect(argumentsDescription).toContain("downstream inputs");
+    expect(toolDescription).toContain("Exact downstream tool or prompt name");
+    expect(argumentsDescription).toContain("call_tool");
+    expect(argumentsDescription).toContain("get_prompt");
     expect(fieldsDescription).toBe(
-      "Optional call_tool structured output paths when outputSchema allows it.",
+      "Optional call_tool structured output paths. Use only after describe_tool returns fieldSelection.supported true.",
     );
   });
 });
 
 describe("generated tool handlers", () => {
+  type HintTool = Tool & { useWhen?: string; avoidWhen?: string };
+
   const graphqlFieldsUnsupportedMessage =
     "call_tool.fields is not supported for GraphQL-backed Caplets; select fields in the GraphQL operation document instead";
   const config = parseConfig({
@@ -185,21 +188,37 @@ describe("generated tool handlers", () => {
   });
   const registry = new ServerRegistry(config);
   const server = config.mcpServers.alpha!;
-  const tools: Tool[] = [
+  const tools: HintTool[] = [
     {
       name: "read",
       description: "Read files",
       inputSchema: { type: "object" },
       outputSchema: { type: "object" },
+      annotations: { readOnlyHint: true, destructiveHint: false },
+      useWhen: "Use for reading file contents.",
+      avoidWhen: "Avoid for writes.",
     },
     {
       name: "write",
       description: "Write files",
       inputSchema: { type: "object" },
       annotations: { destructiveHint: true },
+      useWhen: "Use for updating file contents.",
     },
   ];
 
+  class MemoryObservedOutputShapeStore implements ObservedOutputShapeStore {
+    readonly entries = new Map<string, ObservedOutputShape>();
+
+    async read(key: ObservedOutputShapeKey): Promise<ObservedOutputShape | undefined> {
+      return this.entries.get(JSON.stringify(key));
+    }
+
+    async write(key: ObservedOutputShapeKey, shape: ObservedOutputShape): Promise<void> {
+      this.entries.set(JSON.stringify(key), shape);
+    }
+  }
+
   it("returns inspect without starting downstream", async () => {
     const downstream = { checkServer: vi.fn(), listTools: vi.fn() } as unknown as DownstreamManager;
     const result = (await handleServerTool(
@@ -303,7 +322,7 @@ describe("generated tool handlers", () => {
     } as unknown as DownstreamManager;
     const result = (await handleServerTool(
       server,
-      { operation: "check_backend" },
+      { operation: "check" },
       registry,
       downstream,
     )) as any;
@@ -324,18 +343,18 @@ describe("generated tool handlers", () => {
     const browserRegistry = new ServerRegistry(browserConfig);
     const downstream = {
       listTools: vi.fn().mockResolvedValue([{ name: "browser_click", inputSchema: {} }]),
-      compact: (_capletServer: typeof server, tool: Tool) => ({ tool: tool.name }),
+      compact: (_capletServer: typeof server, tool: Tool) => ({ name: tool.name }),
     } as unknown as DownstreamManager;
 
     const browser = (await handleServerTool(
       browserConfig.mcpServers.browser!,
-      { operation: "list_tools" },
+      { operation: "tools" },
       browserRegistry,
       downstream,
     )) as any;
     const stealth = (await handleServerTool(
       browserConfig.mcpServers.stealth!,
-      { operation: "list_tools" },
+      { operation: "tools" },
       browserRegistry,
       downstream,
     )) as any;
@@ -344,31 +363,44 @@ describe("generated tool handlers", () => {
     expect(stealth.content[0]?.text).toContain("browser_click");
     expect(browser.content[0]?.text).toContain("Browser");
     expect(stealth.content[0]?.text).toContain("Stealth Browser");
-    expect(browser.structuredContent?.result.tools).toEqual([{ tool: "browser_click" }]);
-    expect(stealth.structuredContent?.result.tools).toEqual([{ tool: "browser_click" }]);
+    expect(browser.structuredContent?.result.items).toEqual([{ name: "browser_click" }]);
+    expect(stealth.structuredContent?.result.items).toEqual([{ name: "browser_click" }]);
   });
 
-  it("lists compact metadata and preserves full get_tool metadata", async () => {
+  it("lists compact metadata and preserves full describe_tool metadata", async () => {
     expect(new DownstreamManager(registry).compact(server, tools[0]!)).toMatchObject({
+      name: "read",
       hasOutputSchema: true,
+      supportsFields: true,
+      readOnlyHint: true,
+      destructiveHint: false,
+      useWhen: "Use for reading file contents.",
+      avoidWhen: "Avoid for writes.",
     });
 
     const downstream = {
       listTools: vi.fn().mockResolvedValue(tools),
-      compact: (capletServer: typeof server, tool: Tool) => ({
-        id: capletServer.server,
-        tool: tool.name,
+      compact: (_capletServer: typeof server, tool: HintTool) => ({
+        name: tool.name,
         description: tool.description,
-        annotations: tool.annotations,
         hasInputSchema: Boolean(tool.inputSchema),
         hasOutputSchema: Boolean(tool.outputSchema),
+        supportsFields: Boolean(tool.outputSchema),
+        ...(tool.useWhen ? { useWhen: tool.useWhen } : {}),
+        ...(tool.avoidWhen ? { avoidWhen: tool.avoidWhen } : {}),
+        ...(typeof tool.annotations?.readOnlyHint === "boolean"
+          ? { readOnlyHint: tool.annotations.readOnlyHint }
+          : {}),
+        ...(typeof tool.annotations?.destructiveHint === "boolean"
+          ? { destructiveHint: tool.annotations.destructiveHint }
+          : {}),
       }),
       getTool: vi.fn().mockResolvedValue(tools[1]),
     } as unknown as DownstreamManager;
 
     const list = (await handleServerTool(
       server,
-      { operation: "list_tools" },
+      { operation: "tools" },
       registry,
       downstream,
     )) as any;
@@ -377,36 +409,40 @@ describe("generated tool handlers", () => {
       id: "alpha",
       name: "Alpha",
       backend: "mcp",
-      operation: "list_tools",
+      operation: "tools",
       status: "ok",
       elapsedMs: expect.any(Number),
     });
     expect(list.structuredContent?.result).toEqual({
       id: "alpha",
       name: "Alpha",
-      tools: [
+      items: [
         {
-          id: "alpha",
-          tool: "read",
+          name: "read",
           description: "Read files",
-          annotations: undefined,
           hasInputSchema: true,
           hasOutputSchema: true,
+          supportsFields: true,
+          useWhen: "Use for reading file contents.",
+          avoidWhen: "Avoid for writes.",
+          readOnlyHint: true,
+          destructiveHint: false,
         },
         {
-          id: "alpha",
-          tool: "write",
+          name: "write",
           description: "Write files",
-          annotations: { destructiveHint: true },
           hasInputSchema: true,
           hasOutputSchema: false,
+          supportsFields: false,
+          useWhen: "Use for updating file contents.",
+          destructiveHint: true,
         },
       ],
     });
 
     const full = (await handleServerTool(
       server,
-      { operation: "get_tool", tool: "write" },
+      { operation: "describe_tool", name: "write" },
       registry,
       downstream,
     )) as any;
@@ -414,28 +450,32 @@ describe("generated tool handlers", () => {
       id: "alpha",
       name: "Alpha",
       backend: "mcp",
-      operation: "get_tool",
+      operation: "describe_tool",
       tool: "write",
       status: "ok",
       elapsedMs: expect.any(Number),
     });
-    expect(full.structuredContent?.result).toEqual({ id: "alpha", tool: tools[1] });
+    expect(full.structuredContent?.result).toEqual({
+      id: "alpha",
+      tool: tools[1],
+      fieldSelection: { supported: false, reason: "output_schema_unavailable" },
+    });
   });
 
   it("limits listed tools", async () => {
     const downstream = {
       listTools: vi.fn().mockResolvedValue(tools),
-      compact: (_capletServer: typeof server, tool: Tool) => ({ tool: tool.name }),
+      compact: (_capletServer: typeof server, tool: Tool) => ({ name: tool.name }),
     } as unknown as DownstreamManager;
 
     const list = (await handleServerTool(
       server,
-      { operation: "list_tools", limit: 1 },
+      { operation: "tools", limit: 1 },
       registry,
       downstream,
     )) as any;
 
-    expect(list.structuredContent?.result.tools).toEqual([{ tool: "read" }]);
+    expect(list.structuredContent?.result.items).toEqual([{ name: "read" }]);
   });
 
   it("searches tools by any query token", async () => {
@@ -444,11 +484,13 @@ describe("generated tool handlers", () => {
         name: "browser_navigate",
         description: "Navigate to a URL",
         inputSchema: { type: "object" },
+        annotations: { readOnlyHint: true },
       },
       {
         name: "browser_take_screenshot",
         description: "Take a screenshot",
         inputSchema: { type: "object" },
+        annotations: { readOnlyHint: true },
       },
       {
         name: "browser_click",
@@ -459,6 +501,7 @@ describe("generated tool handlers", () => {
         name: "browser_snapshot",
         description: "Capture accessibility snapshot",
         inputSchema: { type: "object" },
+        annotations: { readOnlyHint: true },
       },
       {
         name: "browser_console_messages",
@@ -470,7 +513,7 @@ describe("generated tool handlers", () => {
 
     const results = downstream
       .search(server, browserTools, "navigate screenshot click snapshot type", 10)
-      .map((tool) => tool.tool);
+      .map((tool) => tool.name);
     expect(results).toHaveLength(4);
     expect(results).toEqual(
       expect.arrayContaining([
@@ -482,6 +525,269 @@ describe("generated tool handlers", () => {
     );
   });
 
+  it("ranks read-only tool search matches first unless the query asks to mutate", async () => {
+    const issueTools: Tool[] = [
+      {
+        name: "create_issue",
+        description: "Create issue",
+        inputSchema: { type: "object" },
+        annotations: { destructiveHint: false },
+      },
+      {
+        name: "delete_issue",
+        description: "Delete issue",
+        inputSchema: { type: "object" },
+        annotations: { destructiveHint: true },
+      },
+      {
+        name: "search_issues",
+        description: "Search issues",
+        inputSchema: { type: "object" },
+        annotations: { readOnlyHint: true },
+      },
+    ];
+    const downstream = new DownstreamManager(registry);
+
+    expect(downstream.search(server, issueTools, "issue", 10).map((tool) => tool.name)).toEqual([
+      "search_issues",
+      "create_issue",
+      "delete_issue",
+    ]);
+    expect(
+      downstream.search(server, issueTools, "create issue", 10).map((tool) => tool.name),
+    ).toEqual(["create_issue", "delete_issue", "search_issues"]);
+  });
+
+  it("warms observed output shape cache from schema-less call_tool results", async () => {
+    const store = new MemoryObservedOutputShapeStore();
+    const downstream = {
+      getTool: vi.fn(async (_server, name: string) => tools.find((tool) => tool.name === name)!),
+      callTool: vi.fn(async () => ({
+        structuredContent: {
+          issues: [
+            { number: 2, title: "PRD", body: "caplets run" },
+            { number: 1, title: "Binding", body: "remote runtime" },
+          ],
+        },
+        content: [{ type: "text", text: "ok" }],
+      })),
+    } as unknown as DownstreamManager;
+
+    await handleServerTool(
+      server,
+      { operation: "call_tool", name: "write", args: {} },
+      registry,
+      downstream,
+      undefined,
+      undefined,
+      undefined,
+      undefined,
+      undefined,
+      { observedOutputShapeStore: store, projectFingerprint: "project-a" },
+    );
+    const described = (await handleServerTool(
+      server,
+      { operation: "describe_tool", name: "write" },
+      registry,
+      downstream,
+      undefined,
+      undefined,
+      undefined,
+      undefined,
+      undefined,
+      { observedOutputShapeStore: store, projectFingerprint: "project-a" },
+    )) as any;
+
+    expect(described.structuredContent.result.observedOutputShape).toMatchObject({
+      source: "observed",
+      sampleCount: 1,
+    });
+    expect(described.structuredContent.result.observedOutputShape.typeScript).toContain("issues?:");
+    expect(JSON.stringify(described.structuredContent.result.observedOutputShape)).not.toContain(
+      "caplets run",
+    );
+  });
+
+  it("omits observed output shape when describe_tool has a useful output schema", async () => {
+    const store = new MemoryObservedOutputShapeStore();
+    const downstream = {
+      getTool: vi.fn(async (_server, name: string) => ({
+        ...tools.find((tool) => tool.name === name)!,
+        outputSchema: {
+          type: "object",
+          properties: { message: { type: "string" } },
+        },
+      })),
+      callTool: vi.fn(async () => ({
+        structuredContent: { message: "ok" },
+        content: [{ type: "text", text: "ok" }],
+      })),
+    } as unknown as DownstreamManager;
+
+    await handleServerTool(
+      server,
+      { operation: "call_tool", name: "read", args: {} },
+      registry,
+      downstream,
+      undefined,
+      undefined,
+      undefined,
+      undefined,
+      undefined,
+      { observedOutputShapeStore: store },
+    );
+    const described = (await handleServerTool(
+      server,
+      { operation: "describe_tool", name: "read" },
+      registry,
+      downstream,
+      undefined,
+      undefined,
+      undefined,
+      undefined,
+      undefined,
+      { observedOutputShapeStore: store },
+    )) as any;
+
+    expect(described.structuredContent.result.fieldSelection).toEqual({ supported: true });
+    expect(described.structuredContent.result.observedOutputShape).toBeUndefined();
+  });
+
+  it("does not fail call_tool when observed output shape storage fails", async () => {
+    const store: ObservedOutputShapeStore = {
+      read: vi.fn(async () => undefined),
+      write: vi.fn(async () => {
+        throw new Error("cache unavailable");
+      }),
+    };
+    const downstream = {
+      callTool: vi.fn(async () => ({
+        structuredContent: { items: [{ id: 1 }] },
+        content: [{ type: "text", text: "ok" }],
+      })),
+    } as unknown as DownstreamManager;
+
+    const result = (await handleServerTool(
+      server,
+      { operation: "call_tool", name: "write", args: {} },
+      registry,
+      downstream,
+      undefined,
+      undefined,
+      undefined,
+      undefined,
+      undefined,
+      { observedOutputShapeStore: store },
+    )) as any;
+
+    expect(result.structuredContent).toEqual({ items: [{ id: 1 }] });
+    expect(result._meta.caplets.status).toBe("ok");
+  });
+
+  it("returns descriptor-driven guidance for wrong call_tool argument names", async () => {
+    const downstream = {
+      getTool: vi.fn(async () => ({
+        name: "search_issues",
+        description: "Search issues",
+        inputSchema: {
+          type: "object",
+          properties: {
+            query: { type: "string" },
+            perPage: { type: "number" },
+          },
+          required: ["query"],
+        },
+      })),
+      callTool: vi.fn(),
+    } as unknown as DownstreamManager;
+
+    await expect(
+      handleServerTool(
+        server,
+        { operation: "call_tool", name: "search_issues", args: { q: "repo:o/r", per_page: 10 } },
+        registry,
+        downstream,
+      ),
+    ).rejects.toMatchObject({
+      code: "REQUEST_INVALID",
+      message: expect.stringContaining("missing required argument(s): query"),
+      details: {
+        tool: "search_issues",
+        requiredArgs: ["query"],
+        acceptedArgs: ["perPage", "query"],
+        unexpectedArgs: ["per_page", "q"],
+        callSignature:
+          'callTool(name: "search_issues", args: SearchIssuesInput): Promise<CapletsResult<SearchIssuesOutput>>',
+        inputTypeScript: "type SearchIssuesInput = { perPage?: number; query: string; };",
+        retry: expect.stringContaining("describe_tool"),
+      },
+    });
+    expect(vi.mocked(downstream.callTool)).not.toHaveBeenCalled();
+  });
+
+  it("returns schema validation repair hints for invalid call_tool argument shapes", async () => {
+    const downstream = {
+      getTool: vi.fn(async () => ({
+        name: "search_issues",
+        description: "Search issues",
+        inputSchema: {
+          type: "object",
+          properties: {
+            query: { type: "string" },
+            limit: { type: "integer" },
+            state: { enum: ["open", "closed"] },
+            labels: {
+              type: "array",
+              items: { type: "string" },
+            },
+          },
+          required: ["query", "labels"],
+          additionalProperties: false,
+        },
+      })),
+      callTool: vi.fn(),
+    } as unknown as DownstreamManager;
+
+    await expect(
+      handleServerTool(
+        server,
+        {
+          operation: "call_tool",
+          name: "search_issues",
+          args: {
+            query: 123,
+            limit: "10",
+            state: "merged",
+            labels: "bug",
+          },
+        },
+        registry,
+        downstream,
+      ),
+    ).rejects.toMatchObject({
+      code: "REQUEST_INVALID",
+      message: expect.stringContaining("call_tool args for search_issues are invalid"),
+      details: {
+        tool: "search_issues",
+        requiredArgs: ["labels", "query"],
+        acceptedArgs: ["labels", "limit", "query", "state"],
+        minimalArgsTemplate: { labels: [], query: "" },
+        schemaErrors: expect.arrayContaining([
+          { path: "/labels", rule: "type", expected: "array" },
+          { path: "/limit", rule: "type", expected: "integer" },
+          { path: "/query", rule: "type", expected: "string" },
+          { path: "/state", rule: "enum", allowed: ["open", "closed"] },
+        ]),
+        callSignature:
+          'callTool(name: "search_issues", args: SearchIssuesInput): Promise<CapletsResult<SearchIssuesOutput>>',
+        inputTypeScript:
+          'type SearchIssuesInput = { labels: string[]; limit?: number; query: string; state?: "open" | "closed"; };',
+        retry: expect.stringContaining("matching inputSchema/inputTypeScript exactly"),
+      },
+    });
+    expect(vi.mocked(downstream.callTool)).not.toHaveBeenCalled();
+  });
+
   it("annotates call_tool result metadata without changing downstream shape", async () => {
     const downstreamResult = {
       content: [{ type: "text" as const, text: "ok" }],
@@ -494,7 +800,7 @@ describe("generated tool handlers", () => {
     } as unknown as DownstreamManager;
     const result = await handleServerTool(
       server,
-      { operation: "call_tool", tool: "read", arguments: { path: "x" } },
+      { operation: "call_tool", name: "read", args: { path: "x" } },
       registry,
       downstream,
     );
@@ -530,7 +836,7 @@ describe("generated tool handlers", () => {
     } as unknown as DownstreamManager;
     const result = await handleServerTool(
       server,
-      { operation: "call_tool", tool: "write", arguments: {} },
+      { operation: "call_tool", name: "write", args: {} },
       registry,
       downstream,
     );
@@ -567,7 +873,7 @@ describe("generated tool handlers", () => {
     } as unknown as DownstreamManager;
     const result = await handleServerTool(
       server,
-      { operation: "call_tool", tool: "read", arguments: { path: "x" } },
+      { operation: "call_tool", name: "read", args: { path: "x" } },
       registry,
       downstream,
     );
@@ -706,7 +1012,7 @@ describe("generated tool handlers", () => {
     } as unknown as DownstreamManager;
     return handleServerTool(
       server,
-      { operation: "call_tool", tool: "read", arguments: {} },
+      { operation: "call_tool", name: "read", args: {} },
       registry,
       downstream,
     );
@@ -721,7 +1027,7 @@ describe("generated tool handlers", () => {
     };
     const downstream = {
       getTool: vi.fn().mockResolvedValue({
-        name: "read",
+        tool: "read",
         inputSchema: { type: "object" },
         outputSchema: {
           type: "object",
@@ -736,7 +1042,7 @@ describe("generated tool handlers", () => {
 
     const result = await handleServerTool(
       server,
-      { operation: "call_tool", tool: "read", arguments: { path: "x" }, fields: ["message"] },
+      { operation: "call_tool", name: "read", args: { path: "x" }, fields: ["message"] },
       registry,
       downstream,
     );
@@ -806,7 +1112,7 @@ describe("generated tool handlers", () => {
 
     const result = await handleServerTool(
       openApiServer,
-      { operation: "call_tool", tool: "getUser", arguments: { id: "42" }, fields: ["body.name"] },
+      { operation: "call_tool", name: "getUser", args: { id: "42" }, fields: ["body.name"] },
       openApiRegistry,
       downstream,
       openapi,
@@ -840,7 +1146,7 @@ describe("generated tool handlers", () => {
     const downstream = { callTool: vi.fn() } as unknown as DownstreamManager;
     const http = {
       getTool: vi.fn().mockResolvedValue({
-        name: "check",
+        tool: "check",
         inputSchema: { type: "object" },
         outputSchema: {
           type: "object",
@@ -859,7 +1165,7 @@ describe("generated tool handlers", () => {
 
     const result = await handleServerTool(
       httpServer,
-      { operation: "call_tool", tool: "check", arguments: { id: "42" }, fields: ["ok"] },
+      { operation: "call_tool", name: "check", args: { id: "42" }, fields: ["ok"] },
       httpRegistry,
       downstream,
       undefined,
@@ -917,7 +1223,7 @@ describe("generated tool handlers", () => {
     };
     const downstream = {
       getTool: vi.fn().mockResolvedValue({
-        name: "read",
+        tool: "read",
         inputSchema: { type: "object" },
         outputSchema: {
           type: "object",
@@ -931,7 +1237,7 @@ describe("generated tool handlers", () => {
 
     const result = await handleServerTool(
       server,
-      { operation: "call_tool", tool: "read", arguments: { path: "x" }, fields: ["message"] },
+      { operation: "call_tool", name: "read", args: { path: "x" }, fields: ["message"] },
       registry,
       downstream,
     );
@@ -962,7 +1268,7 @@ describe("generated tool handlers", () => {
   it("reports downstream protocol errors when field selection lacks structured output", async () => {
     const downstream = {
       getTool: vi.fn().mockResolvedValue({
-        name: "read",
+        tool: "read",
         inputSchema: { type: "object" },
         outputSchema: { type: "object", properties: { message: { type: "string" } } },
       }),
@@ -974,7 +1280,7 @@ describe("generated tool handlers", () => {
     await expect(
       handleServerTool(
         server,
-        { operation: "call_tool", tool: "read", arguments: { path: "x" }, fields: ["message"] },
+        { operation: "call_tool", name: "read", args: { path: "x" }, fields: ["message"] },
         registry,
         downstream,
       ),
@@ -993,7 +1299,7 @@ describe("generated tool handlers", () => {
     await expect(
       handleServerTool(
         server,
-        { operation: "call_tool", tool: "write", arguments: {}, fields: ["secret"] },
+        { operation: "call_tool", name: "write", args: {}, fields: ["secret"] },
         registry,
         downstream,
       ),
@@ -1004,7 +1310,7 @@ describe("generated tool handlers", () => {
   it("rejects invalid field paths before calling tools with output schemas", async () => {
     const downstream = {
       getTool: vi.fn().mockResolvedValue({
-        name: "read",
+        tool: "read",
         inputSchema: { type: "object" },
         outputSchema: {
           type: "object",
@@ -1022,7 +1328,7 @@ describe("generated tool handlers", () => {
     await expect(
       handleServerTool(
         server,
-        { operation: "call_tool", tool: "read", arguments: {}, fields: ["secret"] },
+        { operation: "call_tool", name: "read", args: {}, fields: ["secret"] },
         registry,
         downstream,
       ),
@@ -1060,7 +1366,7 @@ describe("generated tool handlers", () => {
 
     const result = await handleServerTool(
       graphqlCaplet as never,
-      { operation: "call_tool", tool: "query_user", arguments: { id: "42" } },
+      { operation: "call_tool", name: "query_user", args: { id: "42" } },
       graphRegistry,
       downstream,
       undefined,
@@ -1118,7 +1424,7 @@ describe("generated tool handlers", () => {
     await expect(
       handleServerTool(
         graphqlCaplet as never,
-        { operation: "call_tool", tool: "query_user", arguments: { id: "42" }, fields: ["user"] },
+        { operation: "call_tool", name: "query_user", args: { id: "42" }, fields: ["user"] },
         graphRegistry,
         downstream,
         undefined,
@@ -1159,7 +1465,7 @@ describe("generated tool handlers", () => {
 
     const result = await handleServerTool(
       httpCaplet,
-      { operation: "call_tool", tool: "check", arguments: { id: "42" } },
+      { operation: "call_tool", name: "check", args: { id: "42" } },
       httpRegistry,
       downstream,
       undefined,
diff --git a/packages/opencode/src/hooks.ts b/packages/opencode/src/hooks.ts
index 665b280..ce0e1c2 100644
--- a/packages/opencode/src/hooks.ts
+++ b/packages/opencode/src/hooks.ts
@@ -1,6 +1,6 @@
 import { tool, type Hooks } from "@opencode-ai/plugin";
 import { nativeCapletsSystemGuidance, type NativeCapletsService } from "@caplets/core/native";
-import { capletsOpenCodeArgs } from "./schema";
+import { capletsOpenCodeArgs, capletsOpenCodeRunArgs } from "./schema";
 
 export async function createCapletsOpenCodeHooks(service: NativeCapletsService): Promise<Hooks> {
   const capletTools = service.listTools();
@@ -12,7 +12,9 @@ export async function createCapletsOpenCodeHooks(service: NativeCapletsService):
         caplet.toolName,
         tool({
           description: caplet.description,
-          args: capletsOpenCodeArgs(caplet.operationNames ?? undefined),
+          args: caplet.codeModeRun
+            ? capletsOpenCodeRunArgs()
+            : capletsOpenCodeArgs(caplet.operationNames ?? undefined),
           async execute(args) {
             const result = await service.execute(caplet.caplet, args);
             return compactOpenCodeResult(result);
diff --git a/packages/opencode/src/schema.ts b/packages/opencode/src/schema.ts
index 3d738f5..e98fe29 100644
--- a/packages/opencode/src/schema.ts
+++ b/packages/opencode/src/schema.ts
@@ -31,3 +31,10 @@ export function capletsOpenCodeArgs(operationNames: string[] = [...operations])
       .optional(),
   };
 }
+
+export function capletsOpenCodeRunArgs() {
+  return {
+    code: tool.schema.string(),
+    timeoutMs: tool.schema.number().int().positive().optional(),
+  };
+}
diff --git a/packages/pi/package.json b/packages/pi/package.json
index a46ed2c..3b27e32 100644
--- a/packages/pi/package.json
+++ b/packages/pi/package.json
@@ -27,7 +27,7 @@
   },
   "scripts": {
     "clean": "rm -rf dist",
-    "build": "pnpm run clean && rolldown -c",
+    "build": "pnpm run clean && rolldown -c && node ./scripts/copy-quickjs-wasm.mjs",
     "build:watch": "pnpm run clean && rolldown -c --watch",
     "prepack": "pnpm build",
     "typecheck": "tsgo --noEmit",
@@ -37,6 +37,7 @@
     "@caplets/core": "workspace:*"
   },
   "devDependencies": {
+    "@jitl/quickjs-wasmfile-release-sync": "^0.32.0",
     "@types/node": "^25.9.1",
     "@typescript/native-preview": "7.0.0-dev.20260603.1",
     "rolldown": "^1.0.3",
diff --git a/packages/pi/scripts/copy-quickjs-wasm.mjs b/packages/pi/scripts/copy-quickjs-wasm.mjs
new file mode 100644
index 0000000..46f2463
--- /dev/null
+++ b/packages/pi/scripts/copy-quickjs-wasm.mjs
@@ -0,0 +1,26 @@
+import { copyFileSync, mkdirSync, readdirSync } from "node:fs";
+import { createRequire } from "node:module";
+import { dirname, join, resolve } from "node:path";
+import { fileURLToPath } from "node:url";
+
+const require = createRequire(import.meta.url);
+const quickJsWasmSource = require.resolve("@jitl/quickjs-wasmfile-release-sync/wasm");
+const scriptDir = dirname(fileURLToPath(import.meta.url));
+const distDir = resolve(scriptDir, "../dist");
+const quickJsWasmTarget = join(distDir, "emscripten-module.wasm");
+
+mkdirSync(distDir, { recursive: true });
+copyFileSync(quickJsWasmSource, quickJsWasmTarget);
+console.log(`Copied ${quickJsWasmSource} -> ${quickJsWasmTarget}`);
+
+const typescriptEntry = require.resolve("typescript");
+const typescriptLibDir = dirname(typescriptEntry);
+for (const fileName of readdirSync(typescriptLibDir)) {
+  if (!/^lib\..*\.d\.ts$/u.test(fileName)) {
+    continue;
+  }
+  const source = join(typescriptLibDir, fileName);
+  const target = join(distDir, fileName);
+  copyFileSync(source, target);
+}
+console.log(`Copied TypeScript lib declarations -> ${distDir}`);
diff --git a/packages/pi/test/pi.test.ts b/packages/pi/test/pi.test.ts
index 544e69d..fc3caf4 100644
--- a/packages/pi/test/pi.test.ts
+++ b/packages/pi/test/pi.test.ts
@@ -520,7 +520,7 @@ describe("@caplets/pi", () => {
       structuredContent: {
         caplets: {
           name: "Context7",
-          operation: "list_tools",
+          operation: "tools",
         },
       },
     });
@@ -531,15 +531,15 @@ describe("@caplets/pi", () => {
     });
 
     const tool = registered[0];
-    const result = await tool?.execute("call-1", { operation: "list_tools" });
+    const result = await tool?.execute("call-1", { operation: "tools" });
     const rendered = renderText(
       tool?.renderResult(result!, { expanded: true, isPartial: false }, plainTheme),
     );
 
-    expect(rendered).toContain("✓ Context7 list_tools complete (ctrl+o to collapse)");
+    expect(rendered).toContain("✓ Context7 tools complete (ctrl+o to collapse)");
     expect(rendered).toContain("\nvery long docs");
     expect(rendered).not.toContain("Result summary:");
-    expect(rendered.indexOf("✓ Context7 list_tools complete")).toBeLessThan(
+    expect(rendered.indexOf("✓ Context7 tools complete")).toBeLessThan(
       rendered.indexOf("very long docs"),
     );
   });
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index 5d586d3..cd96f75 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -143,6 +143,9 @@ importers:
       '@modelcontextprotocol/sdk':
         specifier: ^1.29.0
         version: 1.29.0(zod@4.4.3)
+      ajv:
+        specifier: ^8.20.0
+        version: 8.20.0
       commander:
         specifier: ^15.0.0
         version: 15.0.0
@@ -152,6 +155,12 @@ importers:
       hono:
         specifier: ^4.12.23
         version: 4.12.23
+      quickjs-emscripten:
+        specifier: ^0.32.0
+        version: 0.32.0
+      typescript:
+        specifier: ^6.0.3
+        version: 6.0.3
       vfile:
         specifier: ^6.0.3
         version: 6.0.3
@@ -174,9 +183,6 @@ importers:
       rolldown:
         specifier: ^1.0.3
         version: 1.0.3
-      typescript:
-        specifier: ^6.0.3
-        version: 6.0.3
       vitest:
         specifier: ^4.1.8
         version: 4.1.8(@types/node@25.9.1)(vite@8.0.16(@types/node@25.9.1)(esbuild@0.28.0)(jiti@2.7.0)(tsx@4.22.4)(yaml@2.9.0))
@@ -218,6 +224,9 @@ importers:
         specifier: '*'
         version: 0.78.0
     devDependencies:
+      '@jitl/quickjs-wasmfile-release-sync':
+        specifier: ^0.32.0
+        version: 0.32.0
       '@types/node':
         specifier: ^25.9.1
         version: 25.9.1
@@ -1521,6 +1530,21 @@ packages:
     resolution: {integrity: sha512-O8jcjabXaleOG9DQ0+ARXWZBTfnP4WNAqzuiJK7ll44AmxGKv/J2M4TPjxjY3znBCfvBXFzucm1twdyFybFqEA==}
     engines: {node: '>=12'}
 
+  '@jitl/quickjs-ffi-types@0.32.0':
+    resolution: {integrity: sha512-v9T+GQpmk43VDJ7d72sf0Nexhk+ArvtUihW27dy7lqAl0zBObFKtSBBIm5RBjwIhE8VwsPPm9PNuvPvNqLWUEg==}
+
+  '@jitl/quickjs-wasmfile-debug-asyncify@0.32.0':
+    resolution: {integrity: sha512-EX8zbXwGqCgAE764M+qvkHtyXDi/FUoMBea0JnES7vCM3P7a2+EOZOjGv85wtZ2sJhI1oJ+nekmqpOODFDY+hw==}
+
+  '@jitl/quickjs-wasmfile-debug-sync@0.32.0':
+    resolution: {integrity: sha512-LeYWrPGC1uNCTBWvibo3ZLJj0CSVNYUXvJpXMCmuQ5Sap2cCACc3uvGvYV4homHHBAzfw5akoTqMMS4YFRtw+Q==}
+
+  '@jitl/quickjs-wasmfile-release-asyncify@0.32.0':
+    resolution: {integrity: sha512-3oSwPfja12ICz4aIblB58cuY8JlEq5Txt8Cut4VLo+LH47QN+mzCnSgnbB03hWzg1LBcc+VyyI9UOag7a1NF+Q==}
+
+  '@jitl/quickjs-wasmfile-release-sync@0.32.0':
+    resolution: {integrity: sha512-BKNDI/TPBfGlLNGYpLrhcDGXmIk4xHm4MRAisOBnOzpXVn9HZWsfmMAc9WMBrAHjvvds6HOikKeaOBKdPdpVrg==}
+
   '@jridgewell/gen-mapping@0.3.13':
     resolution: {integrity: sha512-2kkt/7niJ6MgEPxF0bYdQ6etZaA+fQvDcLKckhy1yIQOzaoKjBBjSj63/aLVjYE3qhRt5dvM+uUyfCg6UKCBbA==}
 
@@ -4475,6 +4499,13 @@ packages:
   queue-microtask@1.2.3:
     resolution: {integrity: sha512-NuaNSa6flKT5JaSYQzJok04JzTL1CA6aGhv5rfLW3PgqA+M2ChpZQnAC8h8i4ZFkBS8X5RqkDBHA7r4hej3K9A==}
 
+  quickjs-emscripten-core@0.32.0:
+    resolution: {integrity: sha512-QFnPfjFey8EqknSrSxe1hZrf1/8z7/6s1QzGOmKo6++02r7QRRX7ZoyNaZh7JuVjWsVW87KnQrbZqnHkOAzUyg==}
+
+  quickjs-emscripten@0.32.0:
+    resolution: {integrity: sha512-So0Sqw869y/S2oE3Nuc0uT3Dhqgvsj8FSrwBdsuTosVsG8ME5/OcudU1GxsrIFdFABgy17GHnTVO9TYV/bLQcA==}
+    engines: {node: '>=16.0.0'}
+
   radix3@1.1.2:
     resolution: {integrity: sha512-b484I/7b8rDEdSDKckSSBA8knMpcdsXudlE/LNL639wFoHKwLbEkQFZHWEYwDC0wa0FKUcCY+GAF73Z7wxNVFA==}
 
@@ -6737,6 +6768,24 @@ snapshots:
       wrap-ansi: 8.1.0
       wrap-ansi-cjs: wrap-ansi@7.0.0
 
+  '@jitl/quickjs-ffi-types@0.32.0': {}
+
+  '@jitl/quickjs-wasmfile-debug-asyncify@0.32.0':
+    dependencies:
+      '@jitl/quickjs-ffi-types': 0.32.0
+
+  '@jitl/quickjs-wasmfile-debug-sync@0.32.0':
+    dependencies:
+      '@jitl/quickjs-ffi-types': 0.32.0
+
+  '@jitl/quickjs-wasmfile-release-asyncify@0.32.0':
+    dependencies:
+      '@jitl/quickjs-ffi-types': 0.32.0
+
+  '@jitl/quickjs-wasmfile-release-sync@0.32.0':
+    dependencies:
+      '@jitl/quickjs-ffi-types': 0.32.0
+
   '@jridgewell/gen-mapping@0.3.13':
     dependencies:
       '@jridgewell/sourcemap-codec': 1.5.5
@@ -9725,6 +9774,18 @@ snapshots:
 
   queue-microtask@1.2.3: {}
 
+  quickjs-emscripten-core@0.32.0:
+    dependencies:
+      '@jitl/quickjs-ffi-types': 0.32.0
+
+  quickjs-emscripten@0.32.0:
+    dependencies:
+      '@jitl/quickjs-wasmfile-debug-asyncify': 0.32.0
+      '@jitl/quickjs-wasmfile-debug-sync': 0.32.0
+      '@jitl/quickjs-wasmfile-release-asyncify': 0.32.0
+      '@jitl/quickjs-wasmfile-release-sync': 0.32.0
+      quickjs-emscripten-core: 0.32.0
+
   radix3@1.1.2: {}
 
   range-parser@1.2.1: {}
diff --git a/schemas/caplet.schema.json b/schemas/caplet.schema.json
index a8f8b41..36f73d7 100644
--- a/schemas/caplet.schema.json
+++ b/schemas/caplet.schema.json
@@ -29,6 +29,18 @@
         "maxLength": 80
       }
     },
+    "useWhen": {
+      "description": "When agents should prefer this Caplet or configured action.",
+      "type": "string",
+      "minLength": 1,
+      "maxLength": 500
+    },
+    "avoidWhen": {
+      "description": "When agents should avoid this Caplet or configured action.",
+      "type": "string",
+      "minLength": 1,
+      "maxLength": 500
+    },
     "setup": {
       "type": "object",
       "properties": {
@@ -741,6 +753,18 @@
                 "description": "Operation capability description.",
                 "type": "string",
                 "minLength": 1
+              },
+              "useWhen": {
+                "description": "When agents should prefer this Caplet or configured action.",
+                "type": "string",
+                "minLength": 1,
+                "maxLength": 500
+              },
+              "avoidWhen": {
+                "description": "When agents should avoid this Caplet or configured action.",
+                "type": "string",
+                "minLength": 1,
+                "maxLength": 500
               }
             },
             "additionalProperties": false
@@ -1180,6 +1204,18 @@
                 "type": "string",
                 "minLength": 1
               },
+              "useWhen": {
+                "description": "When agents should prefer this Caplet or configured action.",
+                "type": "string",
+                "minLength": 1,
+                "maxLength": 500
+              },
+              "avoidWhen": {
+                "description": "When agents should avoid this Caplet or configured action.",
+                "type": "string",
+                "minLength": 1,
+                "maxLength": 500
+              },
               "inputSchema": {
                 "description": "JSON Schema for call_tool arguments.",
                 "type": "object",
@@ -1312,6 +1348,18 @@
                 "type": "string",
                 "minLength": 1
               },
+              "useWhen": {
+                "description": "When agents should prefer this Caplet or configured action.",
+                "type": "string",
+                "minLength": 1,
+                "maxLength": 500
+              },
+              "avoidWhen": {
+                "description": "When agents should avoid this Caplet or configured action.",
+                "type": "string",
+                "minLength": 1,
+                "maxLength": 500
+              },
               "inputSchema": {
                 "description": "JSON Schema for call_tool arguments.",
                 "type": "object",
diff --git a/schemas/caplets-config.schema.json b/schemas/caplets-config.schema.json
index 399c2aa..8f7bebe 100644
--- a/schemas/caplets-config.schema.json
+++ b/schemas/caplets-config.schema.json
@@ -301,6 +301,18 @@
               "maxLength": 80
             }
           },
+          "useWhen": {
+            "description": "When agents should prefer this Caplet or configured action.",
+            "type": "string",
+            "minLength": 1,
+            "maxLength": 500
+          },
+          "avoidWhen": {
+            "description": "When agents should avoid this Caplet or configured action.",
+            "type": "string",
+            "minLength": 1,
+            "maxLength": 500
+          },
           "setup": {
             "type": "object",
             "properties": {
@@ -694,6 +706,18 @@
               "maxLength": 80
             }
           },
+          "useWhen": {
+            "description": "When agents should prefer this Caplet or configured action.",
+            "type": "string",
+            "minLength": 1,
+            "maxLength": 500
+          },
+          "avoidWhen": {
+            "description": "When agents should avoid this Caplet or configured action.",
+            "type": "string",
+            "minLength": 1,
+            "maxLength": 500
+          },
           "setup": {
             "type": "object",
             "properties": {
@@ -938,6 +962,18 @@
                   "description": "Operation capability description.",
                   "type": "string",
                   "minLength": 1
+                },
+                "useWhen": {
+                  "description": "When agents should prefer this Caplet or configured action.",
+                  "type": "string",
+                  "minLength": 1,
+                  "maxLength": 500
+                },
+                "avoidWhen": {
+                  "description": "When agents should avoid this Caplet or configured action.",
+                  "type": "string",
+                  "minLength": 1,
+                  "maxLength": 500
                 }
               },
               "additionalProperties": false
@@ -1119,6 +1155,18 @@
               "maxLength": 80
             }
           },
+          "useWhen": {
+            "description": "When agents should prefer this Caplet or configured action.",
+            "type": "string",
+            "minLength": 1,
+            "maxLength": 500
+          },
+          "avoidWhen": {
+            "description": "When agents should avoid this Caplet or configured action.",
+            "type": "string",
+            "minLength": 1,
+            "maxLength": 500
+          },
           "setup": {
             "type": "object",
             "properties": {
@@ -1520,6 +1568,18 @@
                   "type": "string",
                   "minLength": 1
                 },
+                "useWhen": {
+                  "description": "When agents should prefer this Caplet or configured action.",
+                  "type": "string",
+                  "minLength": 1,
+                  "maxLength": 500
+                },
+                "avoidWhen": {
+                  "description": "When agents should avoid this Caplet or configured action.",
+                  "type": "string",
+                  "minLength": 1,
+                  "maxLength": 500
+                },
                 "inputSchema": {
                   "description": "JSON Schema for call_tool arguments.",
                   "type": "object",
@@ -1594,6 +1654,18 @@
               "maxLength": 80
             }
           },
+          "useWhen": {
+            "description": "When agents should prefer this Caplet or configured action.",
+            "type": "string",
+            "minLength": 1,
+            "maxLength": 500
+          },
+          "avoidWhen": {
+            "description": "When agents should avoid this Caplet or configured action.",
+            "type": "string",
+            "minLength": 1,
+            "maxLength": 500
+          },
           "setup": {
             "type": "object",
             "properties": {
@@ -1803,6 +1875,18 @@
                   "type": "string",
                   "minLength": 1
                 },
+                "useWhen": {
+                  "description": "When agents should prefer this Caplet or configured action.",
+                  "type": "string",
+                  "minLength": 1,
+                  "maxLength": 500
+                },
+                "avoidWhen": {
+                  "description": "When agents should avoid this Caplet or configured action.",
+                  "type": "string",
+                  "minLength": 1,
+                  "maxLength": 500
+                },
                 "inputSchema": {
                   "description": "JSON Schema for call_tool arguments.",
                   "type": "object",
@@ -1918,6 +2002,18 @@
               "maxLength": 80
             }
           },
+          "useWhen": {
+            "description": "When agents should prefer this Caplet or configured action.",
+            "type": "string",
+            "minLength": 1,
+            "maxLength": 500
+          },
+          "avoidWhen": {
+            "description": "When agents should avoid this Caplet or configured action.",
+            "type": "string",
+            "minLength": 1,
+            "maxLength": 500
+          },
           "setup": {
             "type": "object",
             "properties": {
@@ -2152,6 +2248,18 @@
               "maxLength": 80
             }
           },
+          "useWhen": {
+            "description": "When agents should prefer this Caplet or configured action.",
+            "type": "string",
+            "minLength": 1,
+            "maxLength": 500
+          },
+          "avoidWhen": {
+            "description": "When agents should avoid this Caplet or configured action.",
+            "type": "string",
+            "minLength": 1,
+            "maxLength": 500
+          },
           "setup": {
             "type": "object",
             "properties": {
diff --git a/scripts/generate-code-mode-runtime-api.mjs b/scripts/generate-code-mode-runtime-api.mjs
new file mode 100644
index 0000000..63fe7d3
--- /dev/null
+++ b/scripts/generate-code-mode-runtime-api.mjs
@@ -0,0 +1,48 @@
+#!/usr/bin/env node
+import { readFileSync, writeFileSync } from "node:fs";
+import { dirname, join } from "node:path";
+import { fileURLToPath } from "node:url";
+
+const root = dirname(dirname(fileURLToPath(import.meta.url)));
+const check = process.argv.includes("--check");
+const template = "packages/core/src/code-mode/runtime-api.d.ts";
+const output = "packages/core/src/code-mode/runtime-api.generated.ts";
+const exportName = "CODE_MODE_RUNTIME_API_DECLARATION";
+
+const declaration = minifyDeclarationText(readFileSync(join(root, template), "utf8"));
+const generated = [
+  "// Generated by scripts/generate-code-mode-runtime-api.mjs. Do not edit by hand.",
+  `export const ${exportName} =`,
+  `  '${singleQuoted(declaration)}' as const;`,
+  "",
+].join("\n");
+
+if (check) {
+  const current = readFileSync(join(root, output), "utf8");
+  if (current !== generated) {
+    console.error(`${output} is out of date. Run pnpm code-mode:generate-api.`);
+    process.exitCode = 1;
+  }
+} else {
+  writeFileSync(join(root, output), generated);
+}
+
+function singleQuoted(value) {
+  return value.replace(/\\/gu, "\\\\").replace(/'/gu, "\\'");
+}
+
+function minifyDeclarationText(value) {
+  return value
+    .replace(/^\s*export\s*\{\s*\}\s*;?\s*/u, "")
+    .replace(/\r\n?/gu, "\n")
+    .split("\n")
+    .map((line) => line.trim())
+    .filter(Boolean)
+    .join(" ")
+    .replace(/\s+/gu, " ")
+    .replace(/\s*([{}()[\]:;,|&=])\s*/gu, "$1")
+    .replace(/\s*<\s*/gu, "<")
+    .replace(/\s*>\s*/gu, ">")
+    .replace(/\?\s*:/gu, "?:")
+    .trim();
+}

From dd1d846fbc45baabc01443f7155b77fe508faf75 Mon Sep 17 00:00:00 2001
From: Ian Pascoe <ian.g.pascoe@gmail.com>
Date: Mon, 8 Jun 2026 16:33:46 -0400
Subject: [PATCH 5/8] fix(opencode): package native code mode assets

---
 .changeset/native-opencode-code-mode.md       |  5 +++
 packages/opencode/README.md                   |  4 ++-
 packages/opencode/package.json                |  3 +-
 .../scripts/copy-code-mode-assets.mjs         | 25 +++++++++++++++
 packages/opencode/test/opencode.test.ts       | 31 +++++++++++++++++--
 pnpm-lock.yaml                                |  3 ++
 6 files changed, 66 insertions(+), 5 deletions(-)
 create mode 100644 .changeset/native-opencode-code-mode.md
 create mode 100644 packages/opencode/scripts/copy-code-mode-assets.mjs

diff --git a/.changeset/native-opencode-code-mode.md b/.changeset/native-opencode-code-mode.md
new file mode 100644
index 0000000..9118b3c
--- /dev/null
+++ b/.changeset/native-opencode-code-mode.md
@@ -0,0 +1,5 @@
+---
+"@caplets/opencode": patch
+---
+
+Package native Caplets Code Mode assets for OpenCode and cover `caplets_run` registration.
diff --git a/packages/opencode/README.md b/packages/opencode/README.md
index 5a37e1f..ef941d9 100644
--- a/packages/opencode/README.md
+++ b/packages/opencode/README.md
@@ -2,10 +2,12 @@
 
 Native OpenCode plugin for Caplets.
 
-This package exposes configured Caplets as native OpenCode tools named `caplets_<id>`. It does not start the Caplets MCP server and does not edit `opencode.json`; prompt guidance is injected through OpenCode plugin hooks.
+This package exposes configured Caplets as native OpenCode tools named `caplets_<id>` plus `caplets_run` for Caplets Code Mode. It does not start the Caplets MCP server and does not edit `opencode.json`; prompt guidance is injected through OpenCode plugin hooks.
 
 MCP-backed Caplets advertise resource, prompt, template, and completion operations in their generated schema; OpenAPI, GraphQL, HTTP, CLI, and Caplet-set backends remain tool/action-only.
 
+Use `caplets_run` for multi-step workflows that benefit from Code Mode: TypeScript with generated `caplets.<id>` handles, progressive discovery, downstream tool calls, filtering, joins, and compact synthesis in one native OpenCode call.
+
 ```jsonc
 {
   "plugin": ["@caplets/opencode"],
diff --git a/packages/opencode/package.json b/packages/opencode/package.json
index 831d6d2..a4c26af 100644
--- a/packages/opencode/package.json
+++ b/packages/opencode/package.json
@@ -27,7 +27,7 @@
   },
   "scripts": {
     "clean": "rm -rf dist",
-    "build": "pnpm run clean && rolldown -c",
+    "build": "pnpm run clean && rolldown -c && node ./scripts/copy-code-mode-assets.mjs",
     "build:watch": "pnpm run clean && rolldown -c --watch",
     "prepack": "pnpm build",
     "typecheck": "tsgo --noEmit",
@@ -37,6 +37,7 @@
     "@caplets/core": "workspace:*"
   },
   "devDependencies": {
+    "@jitl/quickjs-wasmfile-release-sync": "^0.32.0",
     "@types/node": "^25.9.1",
     "@typescript/native-preview": "7.0.0-dev.20260603.1",
     "rolldown": "^1.0.3",
diff --git a/packages/opencode/scripts/copy-code-mode-assets.mjs b/packages/opencode/scripts/copy-code-mode-assets.mjs
new file mode 100644
index 0000000..bd4acb9
--- /dev/null
+++ b/packages/opencode/scripts/copy-code-mode-assets.mjs
@@ -0,0 +1,25 @@
+import { copyFileSync, mkdirSync, readdirSync } from "node:fs";
+import { createRequire } from "node:module";
+import { dirname, join, resolve } from "node:path";
+import { fileURLToPath } from "node:url";
+
+const require = createRequire(import.meta.url);
+const scriptDir = dirname(fileURLToPath(import.meta.url));
+const distDir = resolve(scriptDir, "../dist");
+
+mkdirSync(distDir, { recursive: true });
+
+const quickJsWasmSource = require.resolve("@jitl/quickjs-wasmfile-release-sync/wasm");
+const quickJsWasmTarget = join(distDir, "emscripten-module.wasm");
+copyFileSync(quickJsWasmSource, quickJsWasmTarget);
+console.log(`Copied ${quickJsWasmSource} -> ${quickJsWasmTarget}`);
+
+const typescriptEntry = require.resolve("typescript");
+const typescriptLibDir = dirname(typescriptEntry);
+for (const fileName of readdirSync(typescriptLibDir)) {
+  if (!/^lib\..*\.d\.ts$/u.test(fileName)) {
+    continue;
+  }
+  copyFileSync(join(typescriptLibDir, fileName), join(distDir, fileName));
+}
+console.log(`Copied TypeScript lib declarations -> ${distDir}`);
diff --git a/packages/opencode/test/opencode.test.ts b/packages/opencode/test/opencode.test.ts
index 660d8be..226b269 100644
--- a/packages/opencode/test/opencode.test.ts
+++ b/packages/opencode/test/opencode.test.ts
@@ -4,7 +4,11 @@ vi.mock("@opencode-ai/plugin", () => ({
   tool: Object.assign((definition: unknown) => definition, {
     schema: {
       enum: () => ({ type: "enum" }),
-      string: () => ({ optional: () => ({ type: "string", optional: true }), min: () => ({}) }),
+      string: () => ({
+        type: "string",
+        optional: () => ({ type: "string", optional: true }),
+        min: () => ({ type: "string" }),
+      }),
       number: () => ({
         int: () => ({ positive: () => ({ optional: () => ({ type: "number", optional: true }) }) }),
       }),
@@ -32,7 +36,7 @@ vi.mock("@opencode-ai/plugin", () => ({
 }));
 
 describe("@caplets/opencode", () => {
-  it("registers one prefixed native tool per Caplet", async () => {
+  it("registers one prefixed native tool per Caplet plus Code Mode", async () => {
     const { createCapletsOpenCodeHooks } = await import("../src/hooks");
     const service = {
       listTools: () => [
@@ -43,6 +47,14 @@ describe("@caplets/opencode", () => {
           description: "GitHub\n\nUse this Caplet.",
           promptGuidance: ["Use caplets_git_hub for GitHub."],
         },
+        {
+          caplet: "run",
+          toolName: "caplets_run",
+          title: "Code Mode",
+          description: "Run Caplets Code Mode TypeScript.",
+          codeModeRun: true,
+          promptGuidance: ["Use caplets_run for multi-step Caplets workflows."],
+        },
       ],
       execute: vi.fn(async () => ({ ok: true })),
       reload: vi.fn(async () => true),
@@ -52,7 +64,7 @@ describe("@caplets/opencode", () => {
 
     const hooks = await createCapletsOpenCodeHooks(service);
 
-    expect(Object.keys(hooks.tool ?? {})).toEqual(["caplets_git_hub"]);
+    expect(Object.keys(hooks.tool ?? {})).toEqual(["caplets_git_hub", "caplets_run"]);
     const capletsTool = hooks.tool!.caplets_git_hub as {
       execute(args: unknown, context: unknown): Promise<string>;
     };
@@ -60,9 +72,22 @@ describe("@caplets/opencode", () => {
     expect(service.execute).toHaveBeenCalledWith("git-hub", { operation: "inspect" });
     expect(result).toContain('"ok": true');
 
+    const runTool = hooks.tool!.caplets_run as {
+      args: { code?: unknown; timeoutMs?: unknown };
+      execute(args: unknown, context: unknown): Promise<string>;
+    };
+    expect(runTool.args).toMatchObject({
+      code: { type: "string" },
+      timeoutMs: { type: "number", optional: true },
+    });
+    const runResult = await runTool.execute({ code: "return {ok:true};" }, {} as never);
+    expect(service.execute).toHaveBeenCalledWith("run", { code: "return {ok:true};" });
+    expect(runResult).toContain('"ok": true');
+
     const output = { system: [] as string[] };
     await hooks["experimental.chat.system.transform"]?.({} as never, output);
     expect(output.system.join("\n")).toContain("caplets_git_hub");
+    expect(output.system.join("\n")).toContain("caplets_run");
   });
 
   it("returns stable text when tool result serialization fails", async () => {
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index cd96f75..4916fbf 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -196,6 +196,9 @@ importers:
         specifier: '>=1'
         version: 1.15.13
     devDependencies:
+      '@jitl/quickjs-wasmfile-release-sync':
+        specifier: ^0.32.0
+        version: 0.32.0
       '@types/node':
         specifier: ^25.9.1
         version: 25.9.1

From 91461e2c1aeb54705cd83eabf1a57a252d345828 Mon Sep 17 00:00:00 2001
From: Ian Pascoe <ian.g.pascoe@gmail.com>
Date: Mon, 8 Jun 2026 20:44:13 -0400
Subject: [PATCH 6/8] feat(core): add pure observed output shape export

---
 packages/core/package.json                       |  4 ++++
 packages/core/rolldown.config.ts                 |  1 +
 packages/core/src/observed-output-shapes/pure.ts | 16 ++++++++++++++++
 packages/core/test/package-boundaries.test.ts    |  6 +++++-
 4 files changed, 26 insertions(+), 1 deletion(-)
 create mode 100644 packages/core/src/observed-output-shapes/pure.ts

diff --git a/packages/core/package.json b/packages/core/package.json
index 0650027..27cc075 100644
--- a/packages/core/package.json
+++ b/packages/core/package.json
@@ -55,6 +55,10 @@
       "types": "./dist/observed-output-shapes/index.d.ts",
       "default": "./dist/observed-output-shapes.js"
     },
+    "./observed-output-shapes/pure": {
+      "types": "./dist/observed-output-shapes/pure.d.ts",
+      "default": "./dist/observed-output-shapes/pure.js"
+    },
     "./runtime-plan": {
       "types": "./dist/runtime-plan/index.d.ts",
       "default": "./dist/runtime-plan.js"
diff --git a/packages/core/rolldown.config.ts b/packages/core/rolldown.config.ts
index 35e9e8e..42ad32b 100644
--- a/packages/core/rolldown.config.ts
+++ b/packages/core/rolldown.config.ts
@@ -21,6 +21,7 @@ export default defineConfig([
     input: {
       "caplet-source": "src/caplet-source/index.ts",
       "code-mode": "src/code-mode/index.ts",
+      "observed-output-shapes/pure": "src/observed-output-shapes/pure.ts",
       "runtime-plan": "src/runtime-plan/index.ts",
     },
     output: {
diff --git a/packages/core/src/observed-output-shapes/pure.ts b/packages/core/src/observed-output-shapes/pure.ts
new file mode 100644
index 0000000..337f02c
--- /dev/null
+++ b/packages/core/src/observed-output-shapes/pure.ts
@@ -0,0 +1,16 @@
+export {
+  extractJsonShape,
+  normalizedObservableValue,
+  observeOutputShape,
+  parseShapeableJsonText,
+} from "./extract";
+export { mergeJsonShapes } from "./merge";
+export { usefulOutputSchema } from "./schema";
+export { hasTruncatedShape, shapeToTypeScript, shapeType } from "./typescript";
+export {
+  OBSERVED_OUTPUT_SHAPE_LIMITS,
+  OBSERVED_OUTPUT_SHAPE_VERSION,
+  type JsonShape,
+  type ObservedOutputShape,
+  type ExtractObservedOutputShapeInput,
+} from "./types";
diff --git a/packages/core/test/package-boundaries.test.ts b/packages/core/test/package-boundaries.test.ts
index 55ed399..3e22c9b 100644
--- a/packages/core/test/package-boundaries.test.ts
+++ b/packages/core/test/package-boundaries.test.ts
@@ -96,7 +96,11 @@ describe("package boundaries", () => {
   });
 
   it("keeps Worker-safe core exports on dedicated bundles", () => {
-    const dedicatedExports = ["./caplet-source", "./runtime-plan"] as const;
+    const dedicatedExports = [
+      "./caplet-source",
+      "./observed-output-shapes/pure",
+      "./runtime-plan",
+    ] as const;
     const rootDefault = (corePackage.exports["."] as { default: string }).default;
 
     for (const specifier of dedicatedExports) {

From 34929546da26f28dd4338bab96fa1f58979bd1fc Mon Sep 17 00:00:00 2001
From: Ian Pascoe <ian.g.pascoe@gmail.com>
Date: Tue, 9 Jun 2026 06:16:32 -0400
Subject: [PATCH 7/8] feat(code-mode)!: rename execution surface to code_mode

BREAKING CHANGE: Code Mode is exposed as code_mode/caplets_code_mode and the CLI entrypoint is caplets code-mode instead of run/caplets_run/caplets run.
---
 docs/benchmarks/coding-agent.md               | 10 +--
 packages/benchmarks/lib/code-mode.ts          | 10 +--
 packages/core/src/cli.ts                      | 35 ++++----
 packages/core/src/cli/commands.ts             |  2 -
 packages/core/src/code-mode/diagnostics.ts    | 34 +++++++-
 packages/core/src/native.ts                   |  4 +-
 packages/core/src/native/remote.ts            |  4 +-
 packages/core/src/native/service.ts           | 16 ++--
 packages/core/src/native/tools.ts             |  6 +-
 packages/core/src/serve/session.ts            | 12 +--
 packages/core/test/code-mode-cli.test.ts      |  6 +-
 .../core/test/code-mode-declarations.test.ts  |  2 +-
 packages/core/test/code-mode-mcp.test.ts      | 79 +++++++++++--------
 packages/core/test/code-mode-runner.test.ts   | 26 ++++++
 packages/core/test/native-remote.test.ts      |  6 +-
 packages/core/test/native.test.ts             |  6 +-
 .../test/project-binding-integration.test.ts  |  4 +-
 packages/core/test/runtime.test.ts            |  3 +-
 packages/core/test/serve-session.test.ts      |  9 ++-
 packages/core/test/tools.test.ts              |  4 +-
 packages/opencode/README.md                   |  4 +-
 packages/opencode/test/opencode.test.ts       | 14 ++--
 22 files changed, 185 insertions(+), 111 deletions(-)

diff --git a/docs/benchmarks/coding-agent.md b/docs/benchmarks/coding-agent.md
index 4521b7d..c8b1805 100644
--- a/docs/benchmarks/coding-agent.md
+++ b/docs/benchmarks/coding-agent.md
@@ -51,11 +51,11 @@ The deterministic Code Mode fixture covers 12 PRD task categories and shows 80.5
 
 Task: Discover GitHub issue/PR tools, inspect schemas or observed shapes, fetch open work, preserve labels and URLs, and synthesize a next-action triage brief.
 
-| Strategy               | External calls | LLM round trips | Code Mode run calls | Internal Caplet calls | Approx. payload tokens | Success score |
-| ---------------------- | -------------: | --------------: | ------------------: | --------------------: | ---------------------: | ------------: |
-| Vanilla MCP            |              4 |               4 |                   0 |                     0 |                   4200 |          0.72 |
-| Progressive disclosure |             13 |              13 |                   0 |                     0 |                   8600 |          0.95 |
-| Code Mode              |              1 |               1 |                   1 |                     7 |                   2300 |          0.93 |
+| Strategy               | External calls | LLM round trips | Code Mode calls | Internal Caplet calls | Approx. payload tokens | Success score |
+| ---------------------- | -------------: | --------------: | --------------: | --------------------: | ---------------------: | ------------: |
+| Vanilla MCP            |              4 |               4 |               0 |                     0 |                   4200 |          0.72 |
+| Progressive disclosure |             13 |              13 |               0 |                     0 |                   8600 |          0.95 |
+| Code Mode              |              1 |               1 |               1 |                     7 |                   2300 |          0.93 |
 
 Code Mode preserves required triage fields (`number`, `title`, `state`, `url`, `html_url`, `labels`, `created_at`, `updated_at`) while reducing external calls versus progressive disclosure by 92.3% and approximate payload tokens by 73.3%.
 
diff --git a/packages/benchmarks/lib/code-mode.ts b/packages/benchmarks/lib/code-mode.ts
index a499ccc..4ca2458 100644
--- a/packages/benchmarks/lib/code-mode.ts
+++ b/packages/benchmarks/lib/code-mode.ts
@@ -399,11 +399,11 @@ The deterministic Code Mode fixture covers ${benchmark.tasks.length} PRD task ca
 
 Task: ${complex.task.description}
 
-| Strategy               | External calls | LLM round trips | Code Mode run calls | Internal Caplet calls | Approx. payload tokens | Success score |
-| ---------------------- | -------------: | --------------: | ------------------: | --------------------: | ---------------------: | ------------: |
-| Vanilla MCP            |              ${vanilla.externalToolCalls} |               ${vanilla.llmRoundTrips} |                   ${vanilla.codeModeRunCalls} |                     ${vanilla.internalCapletCalls} |                   ${vanilla.approxPayloadTokens} |          ${vanilla.successScore.toFixed(2)} |
-| Progressive disclosure |             ${progressive.externalToolCalls} |              ${progressive.llmRoundTrips} |                   ${progressive.codeModeRunCalls} |                     ${progressive.internalCapletCalls} |                   ${progressive.approxPayloadTokens} |          ${progressive.successScore.toFixed(2)} |
-| Code Mode              |              ${codeMode.externalToolCalls} |               ${codeMode.llmRoundTrips} |                   ${codeMode.codeModeRunCalls} |                     ${codeMode.internalCapletCalls} |                   ${codeMode.approxPayloadTokens} |          ${codeMode.successScore.toFixed(2)} |
+| Strategy               | External calls | LLM round trips | Code Mode calls | Internal Caplet calls | Approx. payload tokens | Success score |
+| ---------------------- | -------------: | --------------: | --------------: | --------------------: | ---------------------: | ------------: |
+| Vanilla MCP            |              ${vanilla.externalToolCalls} |               ${vanilla.llmRoundTrips} |               ${vanilla.codeModeRunCalls} |                     ${vanilla.internalCapletCalls} |                   ${vanilla.approxPayloadTokens} |          ${vanilla.successScore.toFixed(2)} |
+| Progressive disclosure |             ${progressive.externalToolCalls} |              ${progressive.llmRoundTrips} |               ${progressive.codeModeRunCalls} |                     ${progressive.internalCapletCalls} |                   ${progressive.approxPayloadTokens} |          ${progressive.successScore.toFixed(2)} |
+| Code Mode              |              ${codeMode.externalToolCalls} |               ${codeMode.llmRoundTrips} |               ${codeMode.codeModeRunCalls} |                     ${codeMode.internalCapletCalls} |                   ${codeMode.approxPayloadTokens} |          ${codeMode.successScore.toFixed(2)} |
 
 Code Mode preserves required triage fields (${complex.task.requiredFields.map((field) => `\`${field}\``).join(", ")}) while reducing external calls versus progressive disclosure by ${percent(complex.reductions.codeModeVsProgressiveExternalCalls)} and approximate payload tokens by ${percent(complex.reductions.codeModeVsProgressivePayloadTokens)}.
 
diff --git a/packages/core/src/cli.ts b/packages/core/src/cli.ts
index 9d8ee19..428dc2b 100644
--- a/packages/core/src/cli.ts
+++ b/packages/core/src/cli.ts
@@ -342,9 +342,9 @@ export function createProgram(io: CliIO = {}): Command {
       if (suggestions.length > 0) writeOut(`${suggestions.join("\n")}\n`);
     });
 
-  program
-    .command(cliCommands.run)
-    .description("Run TypeScript Code Mode locally with the generated Caplets API.")
+  const codeMode = program
+    .command(cliCommands.codeMode)
+    .description("Run, inspect, and debug Caplets Code Mode.")
     .argument("[code]", "inline TypeScript code to run")
     .option("--file <path>", "read TypeScript code from a file relative to the current directory")
     .option("--timeout-ms <ms>", "execution timeout in milliseconds", parsePositiveInteger)
@@ -369,24 +369,25 @@ export function createProgram(io: CliIO = {}): Command {
         });
       },
     );
-
-  const codeMode = program
-    .command(cliCommands.codeMode)
-    .description("Inspect and debug Caplets Code Mode.");
   codeMode
     .command("types")
     .description("Print the generated Code Mode TypeScript declarations.")
     .option("--json", "print declaration metadata as JSON")
-    .action(async (options: { json?: boolean }) => {
-      await codeModeTypesCli({
-        env,
-        ...(currentConfigPath() ? { configPath: currentConfigPath() } : {}),
-        projectConfigPath: envProjectConfigPath(env),
-        ...(io.authDir ? { authDir: io.authDir } : {}),
-        ...(options.json === undefined ? {} : { json: options.json }),
-        writeOut,
-      });
-    });
+    .action(
+      async (options: { json?: boolean }, command: { parent?: { opts(): { json?: boolean } } }) => {
+        const parentOptions = command.parent?.opts() ?? {};
+        await codeModeTypesCli({
+          env,
+          ...(currentConfigPath() ? { configPath: currentConfigPath() } : {}),
+          projectConfigPath: envProjectConfigPath(env),
+          ...(io.authDir ? { authDir: io.authDir } : {}),
+          ...(options.json === undefined && parentOptions.json === undefined
+            ? {}
+            : { json: options.json ?? parentOptions.json }),
+          writeOut,
+        });
+      },
+    );
 
   const serve = program
     .command(cliCommands.serve)
diff --git a/packages/core/src/cli/commands.ts b/packages/core/src/cli/commands.ts
index f340bf9..9659ade 100644
--- a/packages/core/src/cli/commands.ts
+++ b/packages/core/src/cli/commands.ts
@@ -4,7 +4,6 @@ export type CompletionShell = (typeof completionShells)[number];
 export const cliCommands = {
   completion: "completion",
   completeHidden: "__complete",
-  run: "run",
   codeMode: "code-mode",
   serve: "serve",
   attach: "attach",
@@ -35,7 +34,6 @@ export const cliCommands = {
 
 export const topLevelCommandNames = [
   cliCommands.serve,
-  cliCommands.run,
   cliCommands.codeMode,
   cliCommands.attach,
   cliCommands.cloud,
diff --git a/packages/core/src/code-mode/diagnostics.ts b/packages/core/src/code-mode/diagnostics.ts
index 75e7654..38d3f39 100644
--- a/packages/core/src/code-mode/diagnostics.ts
+++ b/packages/core/src/code-mode/diagnostics.ts
@@ -12,7 +12,6 @@ const CODE_FILE = "/caplets-code-mode/input.ts";
 const DECLARATION_FILE = "/caplets-code-mode/caplets.d.ts";
 const AMBIENT_FILE = "/caplets-code-mode/ambient.d.ts";
 
-const IMPORT_PATTERN = /\bimport\s*(?:\(|[\s{*"A-Za-z_$])/u;
 const TS_NOCHECK_PATTERN =
   /^\s*(?:(?:\/\/[^\n]*|\/\*[\s\S]*?\*\/)\s*)*?(?:(?:\/\/\s*@ts-nocheck\b[^\n]*)|(?:\/\*\s*@ts-nocheck\b[\s\S]*?\*\/))/u;
 const BAD_CALL_METHOD_PATTERN = /\bcaplets(?:\.[A-Za-z_$][\w$]*|\[[^\]]+\])\.call\s*\(/u;
@@ -88,7 +87,7 @@ export function diagnoseCodeModeTypeScript(
 
 function preflightDiagnostics(code: string): CodeModeDiagnostic[] {
   const diagnostics: CodeModeDiagnostic[] = [];
-  if (!IMPORT_PATTERN.test(code)) {
+  if (!hasExecutableImport(code)) {
     // continue with other custom checks below
   } else {
     diagnostics.push({
@@ -114,6 +113,37 @@ function preflightDiagnostics(code: string): CodeModeDiagnostic[] {
   return diagnostics;
 }
 
+function hasExecutableImport(code: string): boolean {
+  const source = ts.createSourceFile(
+    CODE_FILE,
+    code,
+    ts.ScriptTarget.ES2022,
+    true,
+    ts.ScriptKind.TS,
+  );
+  let found = false;
+
+  const visit = (node: ts.Node): void => {
+    if (found) return;
+    if (
+      ts.isImportDeclaration(node) ||
+      ts.isImportEqualsDeclaration(node) ||
+      (ts.isExportDeclaration(node) && node.moduleSpecifier !== undefined)
+    ) {
+      found = true;
+      return;
+    }
+    if (ts.isCallExpression(node) && node.expression.kind === ts.SyntaxKind.ImportKeyword) {
+      found = true;
+      return;
+    }
+    ts.forEachChild(node, visit);
+  };
+
+  visit(source);
+  return found;
+}
+
 function createVirtualCompilerHost(
   options: ts.CompilerOptions,
   files: Record<string, string>,
diff --git a/packages/core/src/native.ts b/packages/core/src/native.ts
index 67d7c0e..47eaa6b 100644
--- a/packages/core/src/native.ts
+++ b/packages/core/src/native.ts
@@ -14,8 +14,8 @@ export {
   nativeCapletToolDescription,
   nativeCapletToolName,
   nativeCapletsSystemGuidance,
-  nativeCodeModeRunToolId,
-  nativeCodeModeRunToolName,
+  nativeCodeModeToolId,
+  nativeCodeModeToolName,
 } from "./native/tools";
 export { generatedToolInputSchema } from "./tools";
 export { generatedToolInputJsonSchema } from "./generated-tool-input-schema";
diff --git a/packages/core/src/native/remote.ts b/packages/core/src/native/remote.ts
index 74f2a9c..33386ff 100644
--- a/packages/core/src/native/remote.ts
+++ b/packages/core/src/native/remote.ts
@@ -10,7 +10,7 @@ import type {
   NativeCapletsToolsChangedListener,
   NativeCapletTool,
 } from "./service";
-import { nativeCapletToolName, nativeCodeModeRunToolId } from "./tools";
+import { nativeCapletToolName, nativeCodeModeToolId } from "./tools";
 
 export type RemoteCapletsTool = {
   name: string;
@@ -253,7 +253,7 @@ function remoteToolToNativeTool(tool: RemoteCapletsTool): NativeCapletTool {
       `Remote Caplet ID: ${tool.name}`,
     ].join("\n"),
     promptGuidance: [`Use ${toolName} through the remote Caplets service.`],
-    ...(tool.name === nativeCodeModeRunToolId ? { codeModeRun: true } : {}),
+    ...(tool.name === nativeCodeModeToolId ? { codeModeRun: true } : {}),
     inputSchema,
     operationNames: operationNamesFromSchema(inputSchema),
   };
diff --git a/packages/core/src/native/service.ts b/packages/core/src/native/service.ts
index 47cdc1e..04c5886 100644
--- a/packages/core/src/native/service.ts
+++ b/packages/core/src/native/service.ts
@@ -19,8 +19,8 @@ import {
   nativeCapletPromptGuidance,
   nativeCapletToolDescription,
   nativeCapletToolName,
-  nativeCodeModeRunToolId,
-  nativeCodeModeRunToolName,
+  nativeCodeModeToolId,
+  nativeCodeModeToolName,
 } from "./tools";
 import {
   generateCodeModeDeclarations,
@@ -146,7 +146,7 @@ class DefaultNativeCapletsService implements NativeCapletsService {
   }
 
   async execute(capletId: string, request: unknown): Promise<unknown> {
-    if (capletId === nativeCodeModeRunToolId && isCodeModeRunRequest(request)) {
+    if (capletId === nativeCodeModeToolId && isCodeModeRunRequest(request)) {
       return await executeCodeModeRunNative(this, request);
     }
     return await this.engine.execute(capletId, request);
@@ -176,17 +176,17 @@ function codeModeRunNativeTool(capletTools: NativeCapletTool[]): NativeCapletToo
     })),
   });
   return {
-    caplet: nativeCodeModeRunToolId,
-    toolName: nativeCodeModeRunToolName,
+    caplet: nativeCodeModeToolId,
+    toolName: nativeCodeModeToolName,
     title: "Code Mode",
     description: [
       generateCodeModeRunToolDescription(declaration),
       "",
-      `Native tool name: ${nativeCodeModeRunToolName}`,
+      `Native tool name: ${nativeCodeModeToolName}`,
     ].join("\n"),
     codeModeRun: true,
     promptGuidance: [
-      `Use ${nativeCodeModeRunToolName} to run Caplets Code Mode TypeScript with generated caplets.<id> handles.`,
+      `Use ${nativeCodeModeToolName} to run Caplets Code Mode TypeScript with generated caplets.<id> handles.`,
       "Prefer Code Mode for multi-step Caplet discovery, tool calls, filtering, joins, and compact synthesis.",
       "Return decision-ready JSON from Code Mode rather than raw bulky provider payloads.",
     ],
@@ -407,7 +407,7 @@ class CompositeNativeCapletsService implements NativeCapletsService {
   }
 
   async execute(capletId: string, request: unknown): Promise<unknown> {
-    if (capletId === nativeCodeModeRunToolId && isCodeModeRunRequest(request)) {
+    if (capletId === nativeCodeModeToolId && isCodeModeRunRequest(request)) {
       return await executeCodeModeRunNative(this, request);
     }
     if (this.local.listTools().some((tool) => tool.caplet === capletId)) {
diff --git a/packages/core/src/native/tools.ts b/packages/core/src/native/tools.ts
index 012dd46..bc43060 100644
--- a/packages/core/src/native/tools.ts
+++ b/packages/core/src/native/tools.ts
@@ -1,8 +1,8 @@
 import type { CapletConfig } from "../config";
 import { capabilityDescription } from "../registry";
 
-export const nativeCodeModeRunToolId = "run";
-export const nativeCodeModeRunToolName = "caplets_run";
+export const nativeCodeModeToolId = "code_mode";
+export const nativeCodeModeToolName = "caplets_code_mode";
 
 export function nativeCapletToolName(capletId: string): string {
   return `caplets_${capletId.replace(/_/g, "__").replace(/-/g, "_")}`;
@@ -18,7 +18,7 @@ export function nativeCapletsSystemGuidance(toolNames: string[]): string {
     "Available Caplets native tools:",
     tools,
     "",
-    `${nativeCodeModeRunToolName} executes Caplets Code Mode: TypeScript with generated caplets.<id> handles for multi-step discovery, tool calls, filtering, and compact synthesis in one native call.`,
+    `${nativeCodeModeToolName} executes Caplets Code Mode: TypeScript with generated caplets.<id> handles for multi-step discovery, tool calls, filtering, and compact synthesis in one native call.`,
     "Flow: inspect when the domain is unfamiliar; use tools/search_tools for downstream names; use describe_tool before call_tool when args matter; pass call_tool.args with exact inputSchema property names.",
     "Do not guess downstream tool names, resource URIs, prompt names, input args, output fields, or schemas. Do not infer input/output schemas from memory.",
     "Prefer list/read/search operations for triage and avoid broad provider searches that can return huge payloads or hit rate limits.",
diff --git a/packages/core/src/serve/session.ts b/packages/core/src/serve/session.ts
index b5e80be..61be5fb 100644
--- a/packages/core/src/serve/session.ts
+++ b/packages/core/src/serve/session.ts
@@ -29,7 +29,7 @@ export type CapletsMcpSessionOptions = {
 export class CapletsMcpSession {
   readonly server: ToolServer;
   private readonly tools = new Map<string, RegisteredTool>();
-  private readonly codeModeRunTool: RegisteredTool;
+  private readonly codeModeTool: RegisteredTool;
   private readonly unsubscribeReload: () => void;
   private closed = false;
 
@@ -43,7 +43,7 @@ export class CapletsMcpSession {
         name: "caplets",
         version: packageJsonVersion,
       });
-    this.codeModeRunTool = this.registerCodeModeRunTool();
+    this.codeModeTool = this.registerCodeModeTool();
     this.unsubscribeReload = this.engine.onReload(({ previous, next }) =>
       this.reconcileTools(previous, next),
     );
@@ -64,15 +64,15 @@ export class CapletsMcpSession {
     }
     this.closed = true;
     this.unsubscribeReload();
-    this.codeModeRunTool.remove();
+    this.codeModeTool.remove();
     this.tools.clear();
     await this.server.close();
   }
 
-  private registerCodeModeRunTool(): RegisteredTool {
+  private registerCodeModeTool(): RegisteredTool {
     const codeModeService = new EngineNativeCapletsService(this.engine);
     return this.server.registerTool(
-      "run",
+      "code_mode",
       {
         title: "Code Mode",
         description: codeModeRunToolDescription(codeModeService),
@@ -118,7 +118,7 @@ export class CapletsMcpSession {
 
   private reconcileTools(previous: CapletsConfig | undefined, next: CapletsConfig): void {
     if (previous) {
-      this.codeModeRunTool.update({
+      this.codeModeTool.update({
         title: "Code Mode",
         description: codeModeRunToolDescription(new EngineNativeCapletsService(this.engine)),
         paramsSchema: codeModeRunParamsSchema,
diff --git a/packages/core/test/code-mode-cli.test.ts b/packages/core/test/code-mode-cli.test.ts
index 3a971be..af45985 100644
--- a/packages/core/test/code-mode-cli.test.ts
+++ b/packages/core/test/code-mode-cli.test.ts
@@ -38,7 +38,7 @@ describe("Code Mode CLI", () => {
     try {
       process.env.CAPLETS_CONFIG = writeConfig(dir, {});
 
-      await runCli(["run", "return { ok: true };", "--json"], {
+      await runCli(["code-mode", "return { ok: true };", "--json"], {
         writeOut: (value) => out.push(value),
       });
 
@@ -62,7 +62,7 @@ describe("Code Mode CLI", () => {
       writeFileSync(join(project, "workflow.ts"), "return { source: 'file' };\n");
       process.chdir(project);
 
-      await runCli(["run", "--file", "workflow.ts", "--json"], {
+      await runCli(["code-mode", "--file", "workflow.ts", "--json"], {
         writeOut: (value) => out.push(value),
       });
 
@@ -82,7 +82,7 @@ describe("Code Mode CLI", () => {
     try {
       process.env.CAPLETS_CONFIG = writeConfig(dir, {});
 
-      await runCli(["run", "--json"], {
+      await runCli(["code-mode", "--json"], {
         writeOut: (value) => out.push(value),
         readStdin: async () => "return { source: 'stdin' };",
       });
diff --git a/packages/core/test/code-mode-declarations.test.ts b/packages/core/test/code-mode-declarations.test.ts
index e99da82..d99da57 100644
--- a/packages/core/test/code-mode-declarations.test.ts
+++ b/packages/core/test/code-mode-declarations.test.ts
@@ -65,7 +65,7 @@ describe("generateCodeModeDeclarations", () => {
     expect(declaration).not.toContain(" = ");
   });
 
-  it("builds the shared run tool description from generated declarations", () => {
+  it("builds the shared Code Mode tool description from generated declarations", () => {
     const declaration = 'declare const caplets:{docs:CapletHandle<"docs">;};';
     const description = generateCodeModeRunToolDescription(declaration);
 
diff --git a/packages/core/test/code-mode-mcp.test.ts b/packages/core/test/code-mode-mcp.test.ts
index 0131f7d..2ffbc91 100644
--- a/packages/core/test/code-mode-mcp.test.ts
+++ b/packages/core/test/code-mode-mcp.test.ts
@@ -14,8 +14,8 @@ afterEach(() => {
   }
 });
 
-describe("Code Mode MCP run tool", () => {
-  it("registers run alongside existing Caplet tools", async () => {
+describe("Code Mode MCP tool", () => {
+  it("registers code_mode alongside existing Caplet tools", async () => {
     const { dir, configPath, projectConfigPath } = tempConfig({
       mcpServers: {
         github: { name: "GitHub", description: "GitHub repo operations.", command: "node" },
@@ -28,71 +28,84 @@ describe("Code Mode MCP run tool", () => {
 
     expect(session.registeredToolIds()).toEqual(["github"]);
     expect(server.registered.get("github")).toBeDefined();
-    expect(server.registered.get("run")).toBeDefined();
-    expect(server.definitions.get("run")?.description).toContain("caplets.<id>");
-    expect(server.definitions.get("run")?.description).toContain(
+    expect(server.registered.get("code_mode")).toBeDefined();
+    expect(server.registered.get("run")).toBeUndefined();
+    expect(server.definitions.get("code_mode")?.description).toContain("caplets.<id>");
+    expect(server.definitions.get("code_mode")?.description).toContain(
       "Prefer a two-pass workflow for non-trivial tasks",
     );
-    expect(server.definitions.get("run")?.description).toContain(
+    expect(server.definitions.get("code_mode")?.description).toContain(
       "Pass 1: discover and inspect candidate caplets/tools/resources/prompts",
     );
-    expect(server.definitions.get("run")?.description).toContain(
+    expect(server.definitions.get("code_mode")?.description).toContain(
       "return chosen handles, call signatures/schemas, and planned args",
     );
-    expect(server.definitions.get("run")?.description).toContain("Pass 2: execute with exact args");
-    expect(server.definitions.get("run")?.description).toContain(
+    expect(server.definitions.get("code_mode")?.description).toContain(
+      "Pass 2: execute with exact args",
+    );
+    expect(server.definitions.get("code_mode")?.description).toContain(
       "Return decision-ready JSON, not raw tool payloads",
     );
-    expect(server.definitions.get("run")?.description).toContain(
+    expect(server.definitions.get("code_mode")?.description).toContain(
       "derive final recommendations from all relevant records",
     );
-    expect(server.definitions.get("run")?.description).toContain(
+    expect(server.definitions.get("code_mode")?.description).toContain(
       "summary, key evidence, derived fields, recommendation",
     );
-    expect(server.definitions.get("run")?.description).toContain(
+    expect(server.definitions.get("code_mode")?.description).toContain(
       "if records disagree or have ranges/statuses, compute the strictest applicable conclusion",
     );
-    expect(server.definitions.get("run")?.description).toContain(
+    expect(server.definitions.get("code_mode")?.description).toContain(
       "prefer `outputSchema` or `outputTypeScript`",
     );
-    expect(server.definitions.get("run")?.description).toContain(
+    expect(server.definitions.get("code_mode")?.description).toContain(
       "do not guess from provider memory",
     );
-    expect(server.definitions.get("run")?.description).toContain(
+    expect(server.definitions.get("code_mode")?.description).toContain(
       "Never invent tool names, resource URIs, prompt names",
     );
-    expect(server.definitions.get("run")?.description).toContain(
+    expect(server.definitions.get("code_mode")?.description).toContain(
       "Never infer input/output schemas from memory",
     );
-    expect(server.definitions.get("run")?.description).toContain(
+    expect(server.definitions.get("code_mode")?.description).toContain(
       "use describeTool for the exact callSignature",
     );
-    expect(server.definitions.get("run")?.description).toContain("list broad candidate records");
-    expect(server.definitions.get("run")?.description).toContain('const h=caplets["caplet-id"]');
-    expect(server.definitions.get("run")?.description).toContain("observedOutputShape");
-    expect(server.definitions.get("run")?.description).toContain("absent or generic");
-    expect(server.definitions.get("run")?.description).toContain("Filter bulky results in script");
-    expect(server.definitions.get("run")?.description).toContain("html_url");
-    expect(server.definitions.get("run")?.description).not.toContain(
+    expect(server.definitions.get("code_mode")?.description).toContain(
+      "list broad candidate records",
+    );
+    expect(server.definitions.get("code_mode")?.description).toContain(
+      'const h=caplets["caplet-id"]',
+    );
+    expect(server.definitions.get("code_mode")?.description).toContain("observedOutputShape");
+    expect(server.definitions.get("code_mode")?.description).toContain("absent or generic");
+    expect(server.definitions.get("code_mode")?.description).toContain(
+      "Filter bulky results in script",
+    );
+    expect(server.definitions.get("code_mode")?.description).toContain("html_url");
+    expect(server.definitions.get("code_mode")?.description).not.toContain(
       "Do not split discovery and execution",
     );
-    expect(server.definitions.get("run")?.description).not.toContain(
+    expect(server.definitions.get("code_mode")?.description).not.toContain(
       "inside the same script before returning",
     );
-    expect(server.definitions.get("run")?.description).not.toContain(
+    expect(server.definitions.get("code_mode")?.description).not.toContain(
       "Use multiple `run` calls only after",
     );
-    expect(server.definitions.get("run")?.description).not.toContain("OSV");
-    expect(server.definitions.get("run")?.description).not.toContain("vulnerability");
-    expect(server.definitions.get("run")?.description).not.toContain("release");
-    expect(server.definitions.get("run")?.description).toContain("Generated declaration hints:");
-    expect(server.definitions.get("run")?.description).toContain('github:CapletHandle<"github">');
+    expect(server.definitions.get("code_mode")?.description).not.toContain("OSV");
+    expect(server.definitions.get("code_mode")?.description).not.toContain("vulnerability");
+    expect(server.definitions.get("code_mode")?.description).not.toContain("release");
+    expect(server.definitions.get("code_mode")?.description).toContain(
+      "Generated declaration hints:",
+    );
+    expect(server.definitions.get("code_mode")?.description).toContain(
+      'github:CapletHandle<"github">',
+    );
 
     await session.close();
     await engine.close();
   });
 
-  it("returns a structured run envelope from the run tool", async () => {
+  it("returns a structured run envelope from the code_mode tool", async () => {
     const { dir, configPath, projectConfigPath } = tempConfig({
       mcpServers: {
         github: { name: "GitHub", description: "GitHub repo operations.", command: "node" },
@@ -102,7 +115,7 @@ describe("Code Mode MCP run tool", () => {
     const engine = new CapletsEngine({ configPath, projectConfigPath, watch: false });
     const server = mockServer();
     const session = new CapletsMcpSession(engine, { server });
-    const callback = server.callbacks.get("run");
+    const callback = server.callbacks.get("code_mode");
 
     const result = await callback?.({ code: "return { ok: true };" });
 
diff --git a/packages/core/test/code-mode-runner.test.ts b/packages/core/test/code-mode-runner.test.ts
index 9c32153..484cbb7 100644
--- a/packages/core/test/code-mode-runner.test.ts
+++ b/packages/core/test/code-mode-runner.test.ts
@@ -77,6 +77,32 @@ describe("runCodeMode", () => {
     );
   });
 
+  it("allows import syntax inside returned documentation strings", async () => {
+    const result = await runCodeMode({
+      code: `
+        return {
+          guidance: [
+            "import { McpServer } from '@modelcontextprotocol/server';",
+            "import { StdioServerTransport } from '@modelcontextprotocol/server/stdio';",
+            "const server = new McpServer({ name: 'demo', version: '1.0.0' });",
+          ],
+        };
+      `,
+      service: service(),
+    });
+
+    expect(result).toMatchObject({
+      ok: true,
+      value: {
+        guidance: [
+          "import { McpServer } from '@modelcontextprotocol/server';",
+          "import { StdioServerTransport } from '@modelcontextprotocol/server/stdio';",
+          "const server = new McpServer({ name: 'demo', version: '1.0.0' });",
+        ],
+      },
+    });
+  });
+
   it("captures redacted logs and expands them through debug.readLogs", async () => {
     const dir = mkdtempSync(join(tmpdir(), "caplets-code-mode-runner-"));
     try {
diff --git a/packages/core/test/native-remote.test.ts b/packages/core/test/native-remote.test.ts
index 08ad550..cb6a5eb 100644
--- a/packages/core/test/native-remote.test.ts
+++ b/packages/core/test/native-remote.test.ts
@@ -933,9 +933,11 @@ function tempConfig(config: unknown) {
 }
 
 function configuredCapletIds(tools: Array<{ caplet: string }>): string[] {
-  return tools.map((tool) => tool.caplet).filter((caplet) => caplet !== "run");
+  return tools.map((tool) => tool.caplet).filter((caplet) => caplet !== "code_mode");
 }
 
 function configuredCapletTitles(tools: Array<{ caplet: string; title: string }>): string[][] {
-  return tools.filter((tool) => tool.caplet !== "run").map((tool) => [tool.caplet, tool.title]);
+  return tools
+    .filter((tool) => tool.caplet !== "code_mode")
+    .map((tool) => [tool.caplet, tool.title]);
 }
diff --git a/packages/core/test/native.test.ts b/packages/core/test/native.test.ts
index bcea49e..4998968 100644
--- a/packages/core/test/native.test.ts
+++ b/packages/core/test/native.test.ts
@@ -56,8 +56,8 @@ describe("native Caplets service", () => {
             title: "GitHub",
           }),
           expect.objectContaining({
-            caplet: "run",
-            toolName: "caplets_run",
+            caplet: "code_mode",
+            toolName: "caplets_code_mode",
             title: "Code Mode",
           }),
         ]),
@@ -367,5 +367,5 @@ async function watcherReady(): Promise<void> {
 }
 
 function configuredCapletIds(tools: Array<{ caplet: string }>): string[] {
-  return tools.map((tool) => tool.caplet).filter((caplet) => caplet !== "run");
+  return tools.map((tool) => tool.caplet).filter((caplet) => caplet !== "code_mode");
 }
diff --git a/packages/core/test/project-binding-integration.test.ts b/packages/core/test/project-binding-integration.test.ts
index 419af97..ca0ef1b 100644
--- a/packages/core/test/project-binding-integration.test.ts
+++ b/packages/core/test/project-binding-integration.test.ts
@@ -123,5 +123,7 @@ function remoteClientFixture(
 }
 
 function configuredCapletTitles(tools: Array<{ caplet: string; title: string }>): string[][] {
-  return tools.filter((tool) => tool.caplet !== "run").map((tool) => [tool.caplet, tool.title]);
+  return tools
+    .filter((tool) => tool.caplet !== "code_mode")
+    .map((tool) => [tool.caplet, tool.title]);
 }
diff --git a/packages/core/test/runtime.test.ts b/packages/core/test/runtime.test.ts
index a6ed125..7c9e3c1 100644
--- a/packages/core/test/runtime.test.ts
+++ b/packages/core/test/runtime.test.ts
@@ -37,7 +37,8 @@ describe("CapletsRuntime", () => {
 
     expect(runtime.registeredToolIds()).toEqual(["alpha"]);
     expect(server.registerTool).toHaveBeenCalledTimes(2);
-    expect(server.registered.get("run")).toBeDefined();
+    expect(server.registered.get("code_mode")).toBeDefined();
+    expect(server.registered.get("run")).toBeUndefined();
 
     await runtime.close();
   });
diff --git a/packages/core/test/serve-session.test.ts b/packages/core/test/serve-session.test.ts
index 5ed10b6..4657c0e 100644
--- a/packages/core/test/serve-session.test.ts
+++ b/packages/core/test/serve-session.test.ts
@@ -29,7 +29,8 @@ describe("CapletsMcpSession", () => {
 
     expect(session.registeredToolIds()).toEqual(["alpha"]);
     expect(server.registerTool).toHaveBeenCalledTimes(2);
-    expect(server.registered.get("run")).toBeDefined();
+    expect(server.registered.get("code_mode")).toBeDefined();
+    expect(server.registered.get("run")).toBeUndefined();
     expect(server.registerTool).toHaveBeenCalledWith(
       "alpha",
       expect.objectContaining({
@@ -53,7 +54,7 @@ describe("CapletsMcpSession", () => {
     const server = mockServer();
     const session = new CapletsMcpSession(engine, { server });
     const alpha = server.registered.get("alpha")!;
-    const run = server.registered.get("run")!;
+    const codeMode = server.registered.get("code_mode")!;
 
     writeConfig(configPath, {
       httpApis: {
@@ -69,12 +70,12 @@ describe("CapletsMcpSession", () => {
     await engine.reload();
 
     expect(alpha.remove).toHaveBeenCalledTimes(1);
-    expect(run.update).toHaveBeenCalledWith(
+    expect(codeMode.update).toHaveBeenCalledWith(
       expect.objectContaining({
         description: expect.stringContaining('gamma:CapletHandle<"gamma">'),
       }),
     );
-    expect(run.update).toHaveBeenCalledWith(
+    expect(codeMode.update).toHaveBeenCalledWith(
       expect.not.objectContaining({
         description: expect.stringContaining('alpha:CapletHandle<"alpha">'),
       }),
diff --git a/packages/core/test/tools.test.ts b/packages/core/test/tools.test.ts
index 976ae56..6b4154b 100644
--- a/packages/core/test/tools.test.ts
+++ b/packages/core/test/tools.test.ts
@@ -565,7 +565,7 @@ describe("generated tool handlers", () => {
       callTool: vi.fn(async () => ({
         structuredContent: {
           issues: [
-            { number: 2, title: "PRD", body: "caplets run" },
+            { number: 2, title: "PRD", body: "caplets code-mode" },
             { number: 1, title: "Binding", body: "remote runtime" },
           ],
         },
@@ -604,7 +604,7 @@ describe("generated tool handlers", () => {
     });
     expect(described.structuredContent.result.observedOutputShape.typeScript).toContain("issues?:");
     expect(JSON.stringify(described.structuredContent.result.observedOutputShape)).not.toContain(
-      "caplets run",
+      "caplets code-mode",
     );
   });
 
diff --git a/packages/opencode/README.md b/packages/opencode/README.md
index ef941d9..b6c9860 100644
--- a/packages/opencode/README.md
+++ b/packages/opencode/README.md
@@ -2,11 +2,11 @@
 
 Native OpenCode plugin for Caplets.
 
-This package exposes configured Caplets as native OpenCode tools named `caplets_<id>` plus `caplets_run` for Caplets Code Mode. It does not start the Caplets MCP server and does not edit `opencode.json`; prompt guidance is injected through OpenCode plugin hooks.
+This package exposes configured Caplets as native OpenCode tools named `caplets_<id>` plus `caplets_code_mode` for Caplets Code Mode. It does not start the Caplets MCP server and does not edit `opencode.json`; prompt guidance is injected through OpenCode plugin hooks.
 
 MCP-backed Caplets advertise resource, prompt, template, and completion operations in their generated schema; OpenAPI, GraphQL, HTTP, CLI, and Caplet-set backends remain tool/action-only.
 
-Use `caplets_run` for multi-step workflows that benefit from Code Mode: TypeScript with generated `caplets.<id>` handles, progressive discovery, downstream tool calls, filtering, joins, and compact synthesis in one native OpenCode call.
+Use `caplets_code_mode` for multi-step workflows that benefit from Code Mode: TypeScript with generated `caplets.<id>` handles, progressive discovery, downstream tool calls, filtering, joins, and compact synthesis in one native OpenCode call.
 
 ```jsonc
 {
diff --git a/packages/opencode/test/opencode.test.ts b/packages/opencode/test/opencode.test.ts
index 226b269..cb78778 100644
--- a/packages/opencode/test/opencode.test.ts
+++ b/packages/opencode/test/opencode.test.ts
@@ -48,12 +48,12 @@ describe("@caplets/opencode", () => {
           promptGuidance: ["Use caplets_git_hub for GitHub."],
         },
         {
-          caplet: "run",
-          toolName: "caplets_run",
+          caplet: "code_mode",
+          toolName: "caplets_code_mode",
           title: "Code Mode",
           description: "Run Caplets Code Mode TypeScript.",
           codeModeRun: true,
-          promptGuidance: ["Use caplets_run for multi-step Caplets workflows."],
+          promptGuidance: ["Use caplets_code_mode for multi-step Caplets workflows."],
         },
       ],
       execute: vi.fn(async () => ({ ok: true })),
@@ -64,7 +64,7 @@ describe("@caplets/opencode", () => {
 
     const hooks = await createCapletsOpenCodeHooks(service);
 
-    expect(Object.keys(hooks.tool ?? {})).toEqual(["caplets_git_hub", "caplets_run"]);
+    expect(Object.keys(hooks.tool ?? {})).toEqual(["caplets_git_hub", "caplets_code_mode"]);
     const capletsTool = hooks.tool!.caplets_git_hub as {
       execute(args: unknown, context: unknown): Promise<string>;
     };
@@ -72,7 +72,7 @@ describe("@caplets/opencode", () => {
     expect(service.execute).toHaveBeenCalledWith("git-hub", { operation: "inspect" });
     expect(result).toContain('"ok": true');
 
-    const runTool = hooks.tool!.caplets_run as {
+    const runTool = hooks.tool!.caplets_code_mode as {
       args: { code?: unknown; timeoutMs?: unknown };
       execute(args: unknown, context: unknown): Promise<string>;
     };
@@ -81,13 +81,13 @@ describe("@caplets/opencode", () => {
       timeoutMs: { type: "number", optional: true },
     });
     const runResult = await runTool.execute({ code: "return {ok:true};" }, {} as never);
-    expect(service.execute).toHaveBeenCalledWith("run", { code: "return {ok:true};" });
+    expect(service.execute).toHaveBeenCalledWith("code_mode", { code: "return {ok:true};" });
     expect(runResult).toContain('"ok": true');
 
     const output = { system: [] as string[] };
     await hooks["experimental.chat.system.transform"]?.({} as never, output);
     expect(output.system.join("\n")).toContain("caplets_git_hub");
-    expect(output.system.join("\n")).toContain("caplets_run");
+    expect(output.system.join("\n")).toContain("caplets_code_mode");
   });
 
   it("returns stable text when tool result serialization fails", async () => {

From 9972852e876ac308aba48f872ea1d6f90fcf5ab3 Mon Sep 17 00:00:00 2001
From: Ian Pascoe <ian.g.pascoe@gmail.com>
Date: Tue, 9 Jun 2026 11:05:05 -0400
Subject: [PATCH 8/8] feat(core): add exposure policy and shared helpers

---
 packages/core/package.json                    |  12 +
 packages/core/rolldown.config.ts              |   3 +
 packages/core/src/caplet-files-bundle.ts      |   6 +
 packages/core/src/cli/doctor.ts               |  96 +++-
 packages/core/src/code-mode/diagnostics.ts    |   4 +-
 packages/core/src/code-mode/index.ts          |   1 +
 .../core/src/code-mode/static-analysis.ts     |  92 ++++
 packages/core/src/config-runtime.ts           |  34 ++
 packages/core/src/config.ts                   |  42 ++
 packages/core/src/engine.ts                   | 130 +++++-
 packages/core/src/errors.ts                   |  12 +-
 packages/core/src/exposure/direct-names.ts    |  44 ++
 packages/core/src/exposure/discovery.ts       | 265 +++++++++++
 packages/core/src/exposure/policy.ts          |  21 +
 packages/core/src/native/service.ts           | 280 +++++++++++-
 .../core/src/observed-output-shapes/key.ts    |  21 +-
 packages/core/src/project-binding/index.ts    |   9 +
 packages/core/src/redaction.ts                |  50 +++
 packages/core/src/runtime-plan/resources.ts   |  10 +-
 packages/core/src/schema-hash.ts              |  21 +-
 packages/core/src/serve/session.ts            | 412 ++++++++++++++----
 packages/core/src/stable-json.ts              |  28 ++
 packages/core/test/caplet-files.test.ts       |  26 ++
 .../core/test/code-mode-diagnostics.test.ts   |  15 +
 .../test/code-mode-static-analysis.test.ts    |  23 +
 packages/core/test/config.test.ts             |  37 ++
 packages/core/test/doctor-cli.test.ts         |   2 +
 .../core/test/exposure-direct-names.test.ts   |  27 ++
 packages/core/test/exposure-discovery.test.ts | 121 +++++
 packages/core/test/exposure-policy.test.ts    |  22 +
 packages/core/test/native.test.ts             | 126 ++++++
 packages/core/test/openapi.test.ts            |   3 +
 packages/core/test/package-boundaries.test.ts |   3 +
 packages/core/test/serve-session.test.ts      |  52 ++-
 .../test/shared-worker-safe-helpers.test.ts   |  41 ++
 packages/opencode/src/hooks.ts                |  10 +-
 packages/opencode/src/schema.ts               |  38 ++
 packages/opencode/test/opencode.test.ts       |  34 ++
 schemas/caplet.schema.json                    |  11 +
 schemas/caplets-config.schema.json            | 102 +++++
 40 files changed, 2130 insertions(+), 156 deletions(-)
 create mode 100644 packages/core/src/code-mode/static-analysis.ts
 create mode 100644 packages/core/src/exposure/direct-names.ts
 create mode 100644 packages/core/src/exposure/discovery.ts
 create mode 100644 packages/core/src/exposure/policy.ts
 create mode 100644 packages/core/src/project-binding/index.ts
 create mode 100644 packages/core/src/redaction.ts
 create mode 100644 packages/core/src/stable-json.ts
 create mode 100644 packages/core/test/code-mode-static-analysis.test.ts
 create mode 100644 packages/core/test/exposure-direct-names.test.ts
 create mode 100644 packages/core/test/exposure-discovery.test.ts
 create mode 100644 packages/core/test/exposure-policy.test.ts
 create mode 100644 packages/core/test/shared-worker-safe-helpers.test.ts

diff --git a/packages/core/package.json b/packages/core/package.json
index 27cc075..23a8a56 100644
--- a/packages/core/package.json
+++ b/packages/core/package.json
@@ -59,10 +59,22 @@
       "types": "./dist/observed-output-shapes/pure.d.ts",
       "default": "./dist/observed-output-shapes/pure.js"
     },
+    "./project-binding": {
+      "types": "./dist/project-binding/index.d.ts",
+      "default": "./dist/project-binding.js"
+    },
+    "./redaction": {
+      "types": "./dist/redaction.d.ts",
+      "default": "./dist/redaction.js"
+    },
     "./runtime-plan": {
       "types": "./dist/runtime-plan/index.d.ts",
       "default": "./dist/runtime-plan.js"
     },
+    "./stable-json": {
+      "types": "./dist/stable-json.d.ts",
+      "default": "./dist/stable-json.js"
+    },
     "./config-runtime": {
       "types": "./dist/config-runtime.d.ts",
       "default": "./dist/config-runtime.js"
diff --git a/packages/core/rolldown.config.ts b/packages/core/rolldown.config.ts
index 42ad32b..90e4de4 100644
--- a/packages/core/rolldown.config.ts
+++ b/packages/core/rolldown.config.ts
@@ -22,7 +22,10 @@ export default defineConfig([
       "caplet-source": "src/caplet-source/index.ts",
       "code-mode": "src/code-mode/index.ts",
       "observed-output-shapes/pure": "src/observed-output-shapes/pure.ts",
+      "project-binding": "src/project-binding/index.ts",
+      redaction: "src/redaction.ts",
       "runtime-plan": "src/runtime-plan/index.ts",
+      "stable-json": "src/stable-json.ts",
     },
     output: {
       dir: "./dist",
diff --git a/packages/core/src/caplet-files-bundle.ts b/packages/core/src/caplet-files-bundle.ts
index d872d1a..dbf8489 100644
--- a/packages/core/src/caplet-files-bundle.ts
+++ b/packages/core/src/caplet-files-bundle.ts
@@ -124,6 +124,10 @@ const capletAgentSelectionHintsSchema = {
     .describe("When agents should avoid this Caplet or configured action."),
 };
 
+const capletExposureSchema = z
+  .enum(["direct", "progressive", "code_mode", "direct_and_code_mode", "progressive_and_code_mode"])
+  .describe("How this Caplet is exposed to agents.");
+
 const capletEndpointAuthSchema = z
   .discriminatedUnion("type", [
     z.object({ type: z.literal("none") }).strict(),
@@ -633,6 +637,7 @@ export const capletFileSchema = z
       .array(z.string().trim().min(1).max(80))
       .optional()
       .describe("Optional tags for grouping or searching Caplets."),
+    exposure: capletExposureSchema.optional(),
     ...capletAgentSelectionHintsSchema,
     setup: capletSetupSchema.optional(),
     projectBinding: capletProjectBindingSchema.optional(),
@@ -976,6 +981,7 @@ function capletToServerConfig(
 function sharedCapletFields(frontmatter: CapletFileFrontmatter): Record<string, unknown> {
   return {
     ...(frontmatter.tags ? { tags: frontmatter.tags } : {}),
+    ...(frontmatter.exposure ? { exposure: frontmatter.exposure } : {}),
     ...(frontmatter.useWhen ? { useWhen: frontmatter.useWhen } : {}),
     ...(frontmatter.avoidWhen ? { avoidWhen: frontmatter.avoidWhen } : {}),
     ...(frontmatter.setup ? { setup: frontmatter.setup } : {}),
diff --git a/packages/core/src/cli/doctor.ts b/packages/core/src/cli/doctor.ts
index ffb1ebd..65c89e8 100644
--- a/packages/core/src/cli/doctor.ts
+++ b/packages/core/src/cli/doctor.ts
@@ -13,8 +13,14 @@ import { diagnoseCodeModeTypeScript } from "../code-mode/diagnostics";
 import { CodeModeLogStore } from "../code-mode/logs";
 import { runCodeMode } from "../code-mode/runner";
 import { listCodeModeCallableCaplets } from "../code-mode/api";
-import { DEFAULT_OBSERVED_OUTPUT_SHAPE_CACHE_DIR } from "../config/paths";
+import {
+  DEFAULT_OBSERVED_OUTPUT_SHAPE_CACHE_DIR,
+  resolveConfigPath,
+  resolveProjectConfigPath,
+} from "../config/paths";
 import { FileObservedOutputShapeStore } from "../observed-output-shapes";
+import { loadConfig, type CapletConfig } from "../config";
+import { resolveExposure } from "../exposure/policy";
 
 export type DoctorOptions = {
   env?: NodeJS.ProcessEnv | Record<string, string | undefined>;
@@ -31,6 +37,7 @@ export type DoctorJsonReport = {
   sync: Record<string, unknown>;
   daemon: Record<string, unknown>;
   cloudAuth: Record<string, unknown>;
+  exposure: Record<string, unknown>;
   codeMode: Record<string, unknown>;
 };
 
@@ -76,6 +83,7 @@ export async function doctorJsonReport(options: DoctorOptions = {}): Promise<Doc
       running: false,
     },
     cloudAuth: redactedCloudAuthStatus(credentials),
+    exposure: await resolveExposureSection(env),
     codeMode: await resolveCodeModeSection(options, env),
   };
 }
@@ -124,6 +132,18 @@ export async function formatDoctorReport(options: DoctorOptions = {}): Promise<s
       ? [`  Selected Workspace: ${report.cloudAuth.workspaceSlug ?? report.cloudAuth.workspaceId}`]
       : []),
     "",
+    "Exposure",
+    `  Default: ${report.exposure.default ?? "unknown"}`,
+    `  Discovery timeout: ${report.exposure.discoveryTimeoutMs ?? "unknown"}ms`,
+    `  Discovery concurrency: ${report.exposure.discoveryConcurrency ?? "unknown"}`,
+    `  Callable native tools: ${report.exposure.callableNativeToolCount ?? 0}`,
+    ...(Array.isArray(report.exposure.caplets)
+      ? (report.exposure.caplets as Array<Record<string, unknown>>).map(
+          (caplet) =>
+            `  ${caplet.id}: ${caplet.exposure} (${caplet.callable ? "callable" : `hidden: ${caplet.hiddenReason}`})`,
+        )
+      : []),
+    "",
     "Code Mode",
     `  Types generation: ${doctorOk(report.codeMode.typesGeneration)}`,
     `  Diagnostics: ${doctorOk(report.codeMode.diagnostics)}`,
@@ -140,6 +160,54 @@ export async function formatDoctorReport(options: DoctorOptions = {}): Promise<s
   return `${lines.join("\n")}\n`;
 }
 
+async function resolveExposureSection(env: NodeJS.ProcessEnv | Record<string, string | undefined>) {
+  const configPath = env.CAPLETS_CONFIG?.trim() ? env.CAPLETS_CONFIG.trim() : resolveConfigPath();
+  const projectConfigPath = env.CAPLETS_PROJECT_CONFIG?.trim()
+    ? env.CAPLETS_PROJECT_CONFIG.trim()
+    : resolveProjectConfigPath();
+  try {
+    const config = loadConfig(configPath, projectConfigPath);
+    const service = createNativeCapletsService({
+      mode: "local",
+      configPath,
+      projectConfigPath,
+      watch: false,
+      writeErr: () => undefined,
+    });
+    try {
+      const nativeTools = service.listTools();
+      const callableIds = new Set(nativeTools.map((tool) => tool.caplet));
+      return {
+        ok: true,
+        default: config.options.exposure,
+        discoveryTimeoutMs: config.options.exposureDiscoveryTimeoutMs,
+        discoveryConcurrency: config.options.exposureDiscoveryConcurrency,
+        callableNativeToolCount: nativeTools.length,
+        caplets: allCaplets(config).map((caplet) => {
+          const exposure = resolveExposure(caplet.exposure, config.options.exposure);
+          const callable =
+            callableIds.has(caplet.server) ||
+            [...callableIds].some((id) => id.startsWith(`${caplet.server}__`));
+          return {
+            id: caplet.server,
+            exposure: exposure.value,
+            callable,
+            ...(callable ? {} : { hiddenReason: hiddenReasonFor(caplet) }),
+          };
+        }),
+      };
+    } finally {
+      await service.close();
+    }
+  } catch (error) {
+    return {
+      ok: true,
+      configLoaded: false,
+      message: error instanceof Error ? error.message : String(error),
+    };
+  }
+}
+
 function resolveServerSection(env: NodeJS.ProcessEnv | Record<string, string | undefined>) {
   try {
     const server = resolveCapletsServer({}, env);
@@ -294,3 +362,29 @@ function observedOutputShapePath(value: unknown): string | undefined {
     ? (value as { path: string }).path
     : undefined;
 }
+
+function allCaplets(config: { [key: string]: unknown }): CapletConfig[] {
+  const typed = config as {
+    mcpServers?: Record<string, CapletConfig>;
+    openapiEndpoints?: Record<string, CapletConfig>;
+    graphqlEndpoints?: Record<string, CapletConfig>;
+    httpApis?: Record<string, CapletConfig>;
+    cliTools?: Record<string, CapletConfig>;
+    capletSets?: Record<string, CapletConfig>;
+  };
+  return [
+    ...Object.values(typed.mcpServers ?? {}),
+    ...Object.values(typed.openapiEndpoints ?? {}),
+    ...Object.values(typed.graphqlEndpoints ?? {}),
+    ...Object.values(typed.httpApis ?? {}),
+    ...Object.values(typed.cliTools ?? {}),
+    ...Object.values(typed.capletSets ?? {}),
+  ];
+}
+
+function hiddenReasonFor(caplet: CapletConfig): string {
+  if (caplet.disabled) return "disabled";
+  if (caplet.setup) return "setup_required";
+  if (caplet.projectBinding?.required) return "project_binding_required";
+  return "not_exposed";
+}
diff --git a/packages/core/src/code-mode/diagnostics.ts b/packages/core/src/code-mode/diagnostics.ts
index 38d3f39..36dad3e 100644
--- a/packages/core/src/code-mode/diagnostics.ts
+++ b/packages/core/src/code-mode/diagnostics.ts
@@ -1,4 +1,5 @@
 import ts from "typescript";
+import { hasDirectFetchCall } from "./static-analysis";
 import type { CodeModeDiagnostic } from "./types";
 
 export type DiagnoseCodeModeTypeScriptInput = {
@@ -15,7 +16,6 @@ const AMBIENT_FILE = "/caplets-code-mode/ambient.d.ts";
 const TS_NOCHECK_PATTERN =
   /^\s*(?:(?:\/\/[^\n]*|\/\*[\s\S]*?\*\/)\s*)*?(?:(?:\/\/\s*@ts-nocheck\b[^\n]*)|(?:\/\*\s*@ts-nocheck\b[\s\S]*?\*\/))/u;
 const BAD_CALL_METHOD_PATTERN = /\bcaplets(?:\.[A-Za-z_$][\w$]*|\[[^\]]+\])\.call\s*\(/u;
-const FETCH_PATTERN = /\bfetch\s*\(/u;
 
 export function diagnoseCodeModeTypeScript(
   input: DiagnoseCodeModeTypeScriptInput,
@@ -103,7 +103,7 @@ function preflightDiagnostics(code: string): CodeModeDiagnostic[] {
       message: "CapletHandle does not expose call(). Use callTool(name, args) for tool calls.",
     });
   }
-  if (FETCH_PATTERN.test(code)) {
+  if (hasDirectFetchCall(code)) {
     diagnostics.push({
       code: "FETCH_UNAVAILABLE",
       severity: "error",
diff --git a/packages/core/src/code-mode/index.ts b/packages/core/src/code-mode/index.ts
index a18e8c2..b6664bb 100644
--- a/packages/core/src/code-mode/index.ts
+++ b/packages/core/src/code-mode/index.ts
@@ -10,6 +10,7 @@ export {
   codeModeRunParamsSchema,
   isCodeModeRunRequest,
 } from "./tool";
+export { hasDirectFetchCall, hasExecutableImport } from "./static-analysis";
 export type {
   CodeModeCallableCaplet,
   CodeModeDeclarationInput,
diff --git a/packages/core/src/code-mode/static-analysis.ts b/packages/core/src/code-mode/static-analysis.ts
new file mode 100644
index 0000000..922cbd6
--- /dev/null
+++ b/packages/core/src/code-mode/static-analysis.ts
@@ -0,0 +1,92 @@
+export function hasDirectFetchCall(code: string): boolean {
+  const executableSource = maskLiteralsAndComments(code);
+  return (
+    /(^|[^\w$.\]])fetch\s*(?:\?\.)?\s*\(/u.test(executableSource) ||
+    /\b(?:globalThis|window|self)\s*(?:\.\s*fetch|\[\s*["']fetch["']\s*\])\s*(?:\?\.)?\s*\(/u.test(
+      executableSource,
+    )
+  );
+}
+
+export function hasExecutableImport(code: string): boolean {
+  const executableSource = maskLiteralsAndComments(code);
+  return (
+    /(^|[^\w$.])import\s*(?:\(|[\w$*{]|(?=\s*;))/u.test(executableSource) ||
+    /(^|[^\w$.])export\s+(?:\*|\{[^}]*\}|type\s+\{[^}]*\}|interface\s+\w+[^;]*?)\s+from\b/u.test(
+      executableSource,
+    )
+  );
+}
+
+function maskLiteralsAndComments(code: string): string {
+  let output = "";
+  let index = 0;
+  while (index < code.length) {
+    const char = code[index]!;
+    const next = code[index + 1];
+    if (char === '"' || char === "'" || char === "`") {
+      const masked = maskQuoted(code, index, char);
+      output += masked.text;
+      index = masked.nextIndex;
+      continue;
+    }
+    if (char === "/" && next === "/") {
+      const masked = maskLineComment(code, index);
+      output += masked.text;
+      index = masked.nextIndex;
+      continue;
+    }
+    if (char === "/" && next === "*") {
+      const masked = maskBlockComment(code, index);
+      output += masked.text;
+      index = masked.nextIndex;
+      continue;
+    }
+    output += char;
+    index += 1;
+  }
+  return output;
+}
+
+function maskQuoted(
+  code: string,
+  start: number,
+  quote: '"' | "'" | "`",
+): { text: string; nextIndex: number } {
+  let text = " ";
+  let index = start + 1;
+  while (index < code.length) {
+    const char = code[index]!;
+    text += char === "\n" ? "\n" : " ";
+    index += char === "\\" ? 2 : 1;
+    if (char === quote) break;
+  }
+  return { text, nextIndex: index };
+}
+
+function maskLineComment(code: string, start: number): { text: string; nextIndex: number } {
+  let text = "  ";
+  let index = start + 2;
+  while (index < code.length && code[index] !== "\n") {
+    text += " ";
+    index += 1;
+  }
+  return { text, nextIndex: index };
+}
+
+function maskBlockComment(code: string, start: number): { text: string; nextIndex: number } {
+  let text = "  ";
+  let index = start + 2;
+  while (index < code.length) {
+    const char = code[index]!;
+    const next = code[index + 1];
+    text += char === "\n" ? "\n" : " ";
+    index += 1;
+    if (char === "*" && next === "/") {
+      text += " ";
+      index += 1;
+      break;
+    }
+  }
+  return { text, nextIndex: index };
+}
diff --git a/packages/core/src/config-runtime.ts b/packages/core/src/config-runtime.ts
index 1b670c9..ad23c96 100644
--- a/packages/core/src/config-runtime.ts
+++ b/packages/core/src/config-runtime.ts
@@ -58,6 +58,13 @@ export type AgentSelectionHintsConfig = {
   avoidWhen?: string | undefined;
 };
 
+export type CapletExposure =
+  | "direct"
+  | "progressive"
+  | "code_mode"
+  | "direct_and_code_mode"
+  | "progressive_and_code_mode";
+
 export type CapletServerConfig = CommonCapletConfig & {
   backend: "mcp";
   transport: "stdio" | "http" | "sse";
@@ -176,6 +183,9 @@ export type CapletsConfig = {
   options: {
     defaultSearchLimit: number;
     maxSearchLimit: number;
+    exposure: CapletExposure;
+    exposureDiscoveryTimeoutMs: number;
+    exposureDiscoveryConcurrency: number;
     completion: {
       discoveryTimeoutMs: number;
       overallTimeoutMs: number;
@@ -195,6 +205,7 @@ type CommonCapletConfig = AgentSelectionHintsConfig & {
   server: string;
   name: string;
   description: string;
+  exposure?: CapletExposure | undefined;
   tags?: string[] | undefined;
   body?: string | undefined;
   setup?: CapletSetupConfig | undefined;
@@ -255,6 +266,13 @@ const agentSelectionHintsSchema = {
   useWhen: agentSelectionHintSchema.optional(),
   avoidWhen: agentSelectionHintSchema.optional(),
 };
+const exposureSchema = z.enum([
+  "direct",
+  "progressive",
+  "code_mode",
+  "direct_and_code_mode",
+  "progressive_and_code_mode",
+]);
 const commonSchema = {
   name: z.string().trim().min(1).max(80),
   description: z
@@ -265,6 +283,7 @@ const commonSchema = {
     )
     .refine((value) => value.length <= 1500, "description must be at most 1500 characters"),
   tags: z.array(z.string().trim().min(1).max(80)).optional(),
+  exposure: exposureSchema.optional(),
   ...agentSelectionHintsSchema,
   body: z.string().optional(),
   setup: setupSchema.optional(),
@@ -440,6 +459,18 @@ const configSchema = z
         cacheTtlMs: 300_000,
         negativeCacheTtlMs: 30_000,
       }),
+    options: z
+      .object({
+        exposure: exposureSchema.default("progressive_and_code_mode"),
+        exposureDiscoveryTimeoutMs: z.number().int().positive().default(15_000),
+        exposureDiscoveryConcurrency: z.number().int().positive().max(32).default(4),
+      })
+      .strict()
+      .default({
+        exposure: "progressive_and_code_mode",
+        exposureDiscoveryTimeoutMs: 15_000,
+        exposureDiscoveryConcurrency: 4,
+      }),
     mcpServers: z.record(z.string().regex(SERVER_ID_PATTERN), mcpServerSchema).default({}),
     openapiEndpoints: z
       .record(z.string().regex(SERVER_ID_PATTERN), openApiEndpointSchema)
@@ -474,6 +505,9 @@ export function parseConfig(input: unknown): CapletsConfig {
     options: {
       defaultSearchLimit: config.defaultSearchLimit,
       maxSearchLimit: config.maxSearchLimit,
+      exposure: config.options.exposure,
+      exposureDiscoveryTimeoutMs: config.options.exposureDiscoveryTimeoutMs,
+      exposureDiscoveryConcurrency: config.options.exposureDiscoveryConcurrency,
       completion: config.completion,
     },
     mcpServers: mapBackend(config.mcpServers, "mcp", (id, raw) => {
diff --git a/packages/core/src/config.ts b/packages/core/src/config.ts
index 5b5da32..197979f 100644
--- a/packages/core/src/config.ts
+++ b/packages/core/src/config.ts
@@ -94,11 +94,19 @@ export type AgentSelectionHintsConfig = {
   avoidWhen?: string | undefined;
 };
 
+export type CapletExposure =
+  | "direct"
+  | "progressive"
+  | "code_mode"
+  | "direct_and_code_mode"
+  | "progressive_and_code_mode";
+
 export type CapletServerConfig = AgentSelectionHintsConfig & {
   server: string;
   backend: "mcp";
   name: string;
   description: string;
+  exposure?: CapletExposure | undefined;
   tags?: string[] | undefined;
   body?: string | undefined;
   transport: "stdio" | "http" | "sse";
@@ -128,6 +136,7 @@ export type OpenApiEndpointConfig = AgentSelectionHintsConfig & {
   backend: "openapi";
   name: string;
   description: string;
+  exposure?: CapletExposure | undefined;
   tags?: string[] | undefined;
   body?: string | undefined;
   specPath?: string | undefined;
@@ -154,6 +163,7 @@ export type GraphQlEndpointConfig = AgentSelectionHintsConfig & {
   backend: "graphql";
   name: string;
   description: string;
+  exposure?: CapletExposure | undefined;
   tags?: string[] | undefined;
   body?: string | undefined;
   endpointUrl: string;
@@ -187,6 +197,7 @@ export type HttpApiConfig = AgentSelectionHintsConfig & {
   backend: "http";
   name: string;
   description: string;
+  exposure?: CapletExposure | undefined;
   tags?: string[] | undefined;
   body?: string | undefined;
   baseUrl: string;
@@ -230,6 +241,7 @@ export type CliToolsConfig = AgentSelectionHintsConfig & {
   backend: "cli";
   name: string;
   description: string;
+  exposure?: CapletExposure | undefined;
   tags?: string[] | undefined;
   body?: string | undefined;
   actions: Record<string, CliToolActionConfig>;
@@ -248,6 +260,7 @@ export type CapletSetConfig = AgentSelectionHintsConfig & {
   backend: "caplets";
   name: string;
   description: string;
+  exposure?: CapletExposure | undefined;
   tags?: string[] | undefined;
   body?: string | undefined;
   configPath?: string | undefined;
@@ -272,6 +285,9 @@ export type CapletConfig =
 export type CapletsOptions = {
   defaultSearchLimit: number;
   maxSearchLimit: number;
+  exposure: CapletExposure;
+  exposureDiscoveryTimeoutMs: number;
+  exposureDiscoveryConcurrency: number;
   completion: CompletionConfig;
 };
 
@@ -477,6 +493,10 @@ const agentSelectionHintsSchema = {
     .describe("When agents should avoid this Caplet or configured action."),
 };
 
+const exposureSchema = z
+  .enum(["direct", "progressive", "code_mode", "direct_and_code_mode", "progressive_and_code_mode"])
+  .describe("How this Caplet is exposed to agents.");
+
 const publicServerSchema = z
   .object({
     name: z.string().trim().min(1).max(80).describe("Human-readable server display name."),
@@ -502,6 +522,7 @@ const publicServerSchema = z
     url: z.string().url().optional().describe("Remote MCP server URL for http or sse transport."),
     auth: remoteAuthSchema.optional(),
     tags: z.array(z.string().trim().min(1).max(80)).optional(),
+    exposure: exposureSchema.optional(),
     ...agentSelectionHintsSchema,
     setup: setupSchema.optional(),
     projectBinding: projectBindingSchema.optional(),
@@ -553,6 +574,7 @@ const publicOpenApiEndpointSchema = z
       'Explicit OpenAPI request auth config. Use {"type":"none"} for public APIs.',
     ),
     tags: z.array(z.string().trim().min(1).max(80)).optional(),
+    exposure: exposureSchema.optional(),
     ...agentSelectionHintsSchema,
     setup: setupSchema.optional(),
     projectBinding: projectBindingSchema.optional(),
@@ -627,6 +649,7 @@ const publicGraphQlEndpointSchema = z
       'Explicit GraphQL request auth config. Use {"type":"none"} for public APIs.',
     ),
     tags: z.array(z.string().trim().min(1).max(80)).optional(),
+    exposure: exposureSchema.optional(),
     ...agentSelectionHintsSchema,
     setup: setupSchema.optional(),
     projectBinding: projectBindingSchema.optional(),
@@ -745,6 +768,7 @@ const publicHttpApiSchema = z
       )
       .describe("Configured HTTP actions keyed by stable tool name."),
     tags: z.array(z.string().trim().min(1).max(80)).optional(),
+    exposure: exposureSchema.optional(),
     ...agentSelectionHintsSchema,
     setup: setupSchema.optional(),
     projectBinding: projectBindingSchema.optional(),
@@ -842,6 +866,7 @@ const publicCliToolsSchema = z
       .optional()
       .describe("Default environment variables for CLI actions."),
     tags: z.array(z.string().trim().min(1).max(80)).optional(),
+    exposure: exposureSchema.optional(),
     ...agentSelectionHintsSchema,
     setup: setupSchema.optional(),
     projectBinding: projectBindingSchema.optional(),
@@ -899,6 +924,7 @@ const publicCapletSetSchema = z
       .default(30_000)
       .describe("Milliseconds child Caplet metadata stays fresh. Set 0 to refresh every time."),
     tags: z.array(z.string().trim().min(1).max(80)).optional(),
+    exposure: exposureSchema.optional(),
     ...agentSelectionHintsSchema,
     setup: setupSchema.optional(),
     projectBinding: projectBindingSchema.optional(),
@@ -986,6 +1012,19 @@ function configSchemaFor(
           negativeCacheTtlMs: 30_000,
         })
         .describe("Shell completion discovery timeout and cache settings."),
+      options: z
+        .object({
+          exposure: exposureSchema.default("progressive_and_code_mode"),
+          exposureDiscoveryTimeoutMs: z.number().int().positive().default(15_000),
+          exposureDiscoveryConcurrency: z.number().int().positive().max(32).default(4),
+        })
+        .strict()
+        .default({
+          exposure: "progressive_and_code_mode",
+          exposureDiscoveryTimeoutMs: 15_000,
+          exposureDiscoveryConcurrency: 4,
+        })
+        .describe("Global Caplets runtime options."),
       mcpServers: z
         .record(z.string().regex(SERVER_ID_PATTERN), serverValueSchema)
         .default({})
@@ -1908,6 +1947,9 @@ export function parseConfig(input: unknown): CapletsConfig {
     options: {
       defaultSearchLimit: parsed.data.defaultSearchLimit,
       maxSearchLimit: parsed.data.maxSearchLimit,
+      exposure: parsed.data.options.exposure,
+      exposureDiscoveryTimeoutMs: parsed.data.options.exposureDiscoveryTimeoutMs,
+      exposureDiscoveryConcurrency: parsed.data.options.exposureDiscoveryConcurrency,
       completion: parsed.data.completion,
     },
     mcpServers: servers,
diff --git a/packages/core/src/engine.ts b/packages/core/src/engine.ts
index be19963..a68c948 100644
--- a/packages/core/src/engine.ts
+++ b/packages/core/src/engine.ts
@@ -13,7 +13,7 @@ import {
 } from "./config";
 import { DEFAULT_OBSERVED_OUTPUT_SHAPE_CACHE_DIR } from "./config/paths";
 import { DownstreamManager } from "./downstream";
-import { errorResult, toSafeError } from "./errors";
+import { CapletsError, errorResult, toSafeError } from "./errors";
 import { GraphQLManager } from "./graphql";
 import { HttpActionManager } from "./http-actions";
 import { OpenApiManager } from "./openapi";
@@ -24,6 +24,7 @@ import {
 } from "./observed-output-shapes";
 import { ServerRegistry } from "./registry";
 import { handleServerTool } from "./tools";
+import { discoverExposureSnapshot, type ExposureSnapshot } from "./exposure/discovery";
 
 type ToolSummary = { name: string; description?: string };
 
@@ -74,6 +75,7 @@ export class CapletsEngine {
   private readonly observedOutputShapeScope: ObservedOutputShapeKey["scope"];
   private readonly projectFingerprint: string | undefined;
   private readonly reloadListeners = new Set<(event: CapletsEngineReloadEvent) => void>();
+  private lastExposureSnapshot: ExposureSnapshot | undefined;
   private watchers: FSWatcher[] = [];
   private reloadTimer: NodeJS.Timeout | undefined;
   private watcherRefreshTimer: NodeJS.Timeout | undefined;
@@ -118,6 +120,25 @@ export class CapletsEngine {
     return nextEnabledServers(this.registry.config);
   }
 
+  async exposureSnapshot(): Promise<ExposureSnapshot> {
+    this.lastExposureSnapshot = await discoverExposureSnapshot({
+      config: this.registry.config,
+      caplets: this.enabledServers(),
+      listTools: async (caplet) => this.listTools(caplet),
+      listResources: async (caplet) =>
+        this.optionalMcpList(caplet, () => this.downstream.listResources(caplet, true)),
+      listResourceTemplates: async (caplet) =>
+        this.optionalMcpList(caplet, () => this.downstream.listResourceTemplates(caplet, true)),
+      listPrompts: async (caplet) =>
+        this.optionalMcpList(caplet, () => this.downstream.listPrompts(caplet, true)),
+    });
+    return this.lastExposureSnapshot;
+  }
+
+  currentExposureSnapshot(): ExposureSnapshot | undefined {
+    return this.lastExposureSnapshot;
+  }
+
   watchedPaths(): string[] {
     return [...new Set(watchedPaths(this.paths).map((entry) => entry.path))].sort();
   }
@@ -180,6 +201,46 @@ export class CapletsEngine {
     }
   }
 
+  async executeDirectTool(
+    serverId: string,
+    toolName: string,
+    args: Record<string, unknown>,
+  ): Promise<unknown> {
+    try {
+      const caplet = this.registry.require(serverId);
+      const result = await this.callTool(caplet, toolName, args);
+      return annotateDirectResult(result, caplet, toolName);
+    } catch (error) {
+      return errorResult(error);
+    }
+  }
+
+  async readDirectResource(serverId: string, downstreamUri: string): Promise<unknown> {
+    try {
+      const caplet = this.registry.require(serverId);
+      if (caplet.backend !== "mcp") throw new Error(`Caplet ${serverId} has no MCP resources`);
+      const result = await this.downstream.readResource(caplet, downstreamUri);
+      return annotateDirectResult(result, caplet, "read_resource");
+    } catch (error) {
+      return errorResult(error);
+    }
+  }
+
+  async getDirectPrompt(
+    serverId: string,
+    promptName: string,
+    args: Record<string, unknown>,
+  ): Promise<unknown> {
+    try {
+      const caplet = this.registry.require(serverId);
+      if (caplet.backend !== "mcp") throw new Error(`Caplet ${serverId} has no MCP prompts`);
+      const result = await this.downstream.getPrompt(caplet, promptName, args);
+      return annotateDirectResult(result, caplet, promptName);
+    } catch (error) {
+      return errorResult(error);
+    }
+  }
+
   async completeCliWords(words: string[]): Promise<string[]> {
     const { completeCliWords } = await import("./cli/completion");
     return await completeCliWords(words, {
@@ -254,6 +315,46 @@ export class CapletsEngine {
     }));
   }
 
+  private async listTools(server: CapletConfig) {
+    return server.backend === "mcp"
+      ? await this.downstream.listTools(server)
+      : server.backend === "openapi"
+        ? await this.openapi.listTools(server)
+        : server.backend === "graphql"
+          ? await this.graphql.listTools(server)
+          : server.backend === "http"
+            ? await this.http.listTools(server)
+            : server.backend === "cli"
+              ? await this.cli.listTools(server)
+              : await this.capletSets.listTools(server);
+  }
+
+  private async callTool(server: CapletConfig, toolName: string, args: Record<string, unknown>) {
+    return server.backend === "mcp"
+      ? await this.downstream.callTool(server, toolName, args)
+      : server.backend === "openapi"
+        ? await this.openapi.callTool(server, toolName, args)
+        : server.backend === "graphql"
+          ? await this.graphql.callTool(server, toolName, args)
+          : server.backend === "http"
+            ? await this.http.callTool(server, toolName, args)
+            : server.backend === "cli"
+              ? await this.cli.callTool(server, toolName, args)
+              : await this.capletSets.callTool(server, toolName, args);
+  }
+
+  private async optionalMcpList<T>(
+    caplet: Extract<CapletConfig, { backend: "mcp" }>,
+    list: () => Promise<T[]>,
+  ): Promise<T[]> {
+    try {
+      return await list();
+    } catch (error) {
+      if (isUnsupportedCapability(error)) return [];
+      throw error;
+    }
+  }
+
   private async reloadOnce(): Promise<boolean> {
     if (this.closed) {
       return false;
@@ -525,3 +626,30 @@ function isDirectory(path: string): boolean {
     return false;
   }
 }
+
+function annotateDirectResult(result: unknown, caplet: CapletConfig, operation: string): unknown {
+  if (!result || typeof result !== "object" || Array.isArray(result)) {
+    return result;
+  }
+  const existingMeta = (result as { _meta?: unknown })._meta;
+  return {
+    ...result,
+    _meta: {
+      ...(isRecord(existingMeta) ? existingMeta : {}),
+      caplets: {
+        capletId: caplet.server,
+        backend: caplet.backend,
+        operation,
+        exposure: "direct",
+      },
+    },
+  };
+}
+
+function isUnsupportedCapability(error: unknown): boolean {
+  return error instanceof CapletsError && error.code === "UNSUPPORTED_CAPABILITY";
+}
+
+function isRecord(value: unknown): value is Record<string, unknown> {
+  return Boolean(value) && typeof value === "object" && !Array.isArray(value);
+}
diff --git a/packages/core/src/errors.ts b/packages/core/src/errors.ts
index 842483a..54e4b84 100644
--- a/packages/core/src/errors.ts
+++ b/packages/core/src/errors.ts
@@ -1,3 +1,5 @@
+import { isSecretKey, redactSecretText } from "./redaction";
+
 export const CAPLETS_ERROR_CODES = [
   "CONFIG_NOT_FOUND",
   "CONFIG_EXISTS",
@@ -44,15 +46,9 @@ export class CapletsError extends Error {
   }
 }
 
-const SECRET_KEY_PATTERN =
-  /(token|secret|authorization|auth|api[-_]?key|password|credential|clientsecret|client_secret|code|refresh)/i;
-
-const SECRET_VALUE_PATTERN =
-  /(bearer\s+)[a-z0-9._~+/=-]+|([?&](?:access_token|refresh_token|token|code)=)[^&\s]+/gi;
-
 export function redactSecrets(value: unknown): unknown {
   if (typeof value === "string") {
-    return value.replace(SECRET_VALUE_PATTERN, "$1$2[REDACTED]");
+    return redactSecretText(value).text;
   }
 
   if (Array.isArray(value)) {
@@ -62,7 +58,7 @@ export function redactSecrets(value: unknown): unknown {
   if (value && typeof value === "object") {
     const redacted: Record<string, unknown> = {};
     for (const [key, nested] of Object.entries(value)) {
-      redacted[key] = SECRET_KEY_PATTERN.test(key) ? "[REDACTED]" : redactSecrets(nested);
+      redacted[key] = isSecretKey(key) ? "[REDACTED]" : redactSecrets(nested);
     }
     return redacted;
   }
diff --git a/packages/core/src/exposure/direct-names.ts b/packages/core/src/exposure/direct-names.ts
new file mode 100644
index 0000000..8d8fcb2
--- /dev/null
+++ b/packages/core/src/exposure/direct-names.ts
@@ -0,0 +1,44 @@
+import { CapletsError } from "../errors";
+
+export function directToolName(capletId: string, operationName: string): string {
+  return `${capletId}__${operationName}`;
+}
+
+export function directPromptName(capletId: string, promptName: string): string {
+  return `${capletId}__${promptName}`;
+}
+
+export function nativeDirectToolName(capletId: string, operationName: string): string {
+  return `caplets__${capletId}__${operationName}`;
+}
+
+export function directResourceUri(capletId: string, downstreamUri: string): string {
+  return `caplets://${capletId}/resources/${encodeURIComponent(downstreamUri)}`;
+}
+
+export function directResourceTemplateUri(capletId: string): string {
+  return `caplets://${capletId}/resources/{encodedUri}`;
+}
+
+export function decodeDirectResourceUri(uri: string): {
+  capletId: string;
+  downstreamUri: string;
+} {
+  let parsed: URL;
+  try {
+    parsed = new URL(uri);
+  } catch (error) {
+    throw new CapletsError("REQUEST_INVALID", `Invalid Caplets resource URI ${uri}`, error);
+  }
+  if (parsed.protocol !== "caplets:" || !parsed.hostname) {
+    throw new CapletsError("REQUEST_INVALID", `Invalid Caplets resource URI ${uri}`);
+  }
+  const prefix = "/resources/";
+  if (!parsed.pathname.startsWith(prefix)) {
+    throw new CapletsError("REQUEST_INVALID", `Invalid Caplets resource URI ${uri}`);
+  }
+  return {
+    capletId: parsed.hostname,
+    downstreamUri: decodeURIComponent(parsed.pathname.slice(prefix.length)),
+  };
+}
diff --git a/packages/core/src/exposure/discovery.ts b/packages/core/src/exposure/discovery.ts
new file mode 100644
index 0000000..8cc197e
--- /dev/null
+++ b/packages/core/src/exposure/discovery.ts
@@ -0,0 +1,265 @@
+import type { Prompt, Resource, ResourceTemplate, Tool } from "@modelcontextprotocol/sdk/types";
+import type { CapletConfig, CapletsConfig } from "../config";
+import { toSafeError, type SafeErrorSummary } from "../errors";
+import {
+  directPromptName,
+  directResourceTemplateUri,
+  directResourceUri,
+  directToolName,
+} from "./direct-names";
+import { resolveExposure, type ResolvedExposure } from "./policy";
+
+export type HiddenCapletReason =
+  | "disabled"
+  | "setup_required"
+  | "project_binding_required"
+  | "discovery_failed"
+  | "empty_surface";
+
+export type HiddenCaplet = {
+  capletId: string;
+  reason: HiddenCapletReason;
+  error?: SafeErrorSummary | undefined;
+};
+
+export type CallableCaplet = {
+  caplet: CapletConfig;
+  exposure: ResolvedExposure;
+  tools: Tool[];
+  resources: Resource[];
+  resourceTemplates: ResourceTemplate[];
+  prompts: Prompt[];
+  discoveredAt: number;
+};
+
+export type DirectToolRegistration = {
+  caplet: CapletConfig;
+  downstreamName: string;
+  name: string;
+  tool: Tool;
+};
+
+export type DirectResourceRegistration = {
+  caplet: Extract<CapletConfig, { backend: "mcp" }>;
+  downstreamUri: string;
+  uri: string;
+  resource: Resource;
+};
+
+export type DirectResourceTemplateRegistration = {
+  caplet: Extract<CapletConfig, { backend: "mcp" }>;
+  downstreamUriTemplate: string;
+  uriTemplate: string;
+  resourceTemplate: ResourceTemplate;
+};
+
+export type DirectPromptRegistration = {
+  caplet: Extract<CapletConfig, { backend: "mcp" }>;
+  downstreamName: string;
+  name: string;
+  prompt: Prompt;
+};
+
+export type ExposureSnapshot = {
+  callableCaplets: CallableCaplet[];
+  progressiveCaplets: CallableCaplet[];
+  codeModeCaplets: CallableCaplet[];
+  directTools: DirectToolRegistration[];
+  directResources: DirectResourceRegistration[];
+  directResourceTemplates: DirectResourceTemplateRegistration[];
+  directPrompts: DirectPromptRegistration[];
+  hiddenCaplets: HiddenCaplet[];
+};
+
+export type DiscoverExposureSnapshotOptions = {
+  config: CapletsConfig;
+  caplets: CapletConfig[];
+  listTools(caplet: CapletConfig): Promise<Tool[]>;
+  listResources?(caplet: Extract<CapletConfig, { backend: "mcp" }>): Promise<Resource[]>;
+  listResourceTemplates?(
+    caplet: Extract<CapletConfig, { backend: "mcp" }>,
+  ): Promise<ResourceTemplate[]>;
+  listPrompts?(caplet: Extract<CapletConfig, { backend: "mcp" }>): Promise<Prompt[]>;
+};
+
+export async function discoverExposureSnapshot(
+  options: DiscoverExposureSnapshotOptions,
+): Promise<ExposureSnapshot> {
+  const results = await mapWithConcurrency(
+    options.caplets,
+    Math.max(1, Math.min(32, options.config.options.exposureDiscoveryConcurrency)),
+    async (caplet) => discoverCaplet(options, caplet),
+  );
+
+  const callableCaplets = results.flatMap((result) => (result.callable ? [result.callable] : []));
+  const hiddenCaplets = results.flatMap((result) => (result.hidden ? [result.hidden] : []));
+  return {
+    callableCaplets,
+    progressiveCaplets: callableCaplets.filter((entry) => entry.exposure.progressive),
+    codeModeCaplets: callableCaplets.filter((entry) => entry.exposure.codeMode),
+    directTools: callableCaplets.flatMap((entry) =>
+      entry.exposure.direct
+        ? entry.tools.map((tool) => ({
+            caplet: entry.caplet,
+            downstreamName: tool.name,
+            name: directToolName(entry.caplet.server, tool.name),
+            tool,
+          }))
+        : [],
+    ),
+    directResources: callableCaplets.flatMap(directResourcesFor),
+    directResourceTemplates: callableCaplets.flatMap(directResourceTemplatesFor),
+    directPrompts: callableCaplets.flatMap(directPromptsFor),
+    hiddenCaplets,
+  };
+}
+
+function directResourcesFor(entry: CallableCaplet): DirectResourceRegistration[] {
+  if (!entry.exposure.direct || !isMcpCaplet(entry.caplet)) return [];
+  const caplet = entry.caplet;
+  return entry.resources.map((resource) => ({
+    caplet,
+    downstreamUri: resource.uri,
+    uri: directResourceUri(caplet.server, resource.uri),
+    resource,
+  }));
+}
+
+function directResourceTemplatesFor(entry: CallableCaplet): DirectResourceTemplateRegistration[] {
+  if (!entry.exposure.direct || !isMcpCaplet(entry.caplet)) return [];
+  const caplet = entry.caplet;
+  return entry.resourceTemplates.map((resourceTemplate) => ({
+    caplet,
+    downstreamUriTemplate: resourceTemplate.uriTemplate,
+    uriTemplate: directResourceTemplateUri(caplet.server),
+    resourceTemplate,
+  }));
+}
+
+function directPromptsFor(entry: CallableCaplet): DirectPromptRegistration[] {
+  if (!entry.exposure.direct || !isMcpCaplet(entry.caplet)) return [];
+  const caplet = entry.caplet;
+  return entry.prompts.map((prompt) => ({
+    caplet,
+    downstreamName: prompt.name,
+    name: directPromptName(caplet.server, prompt.name),
+    prompt,
+  }));
+}
+
+function isMcpCaplet(caplet: CapletConfig): caplet is Extract<CapletConfig, { backend: "mcp" }> {
+  return caplet.backend === "mcp";
+}
+
+async function discoverCaplet(
+  options: DiscoverExposureSnapshotOptions,
+  caplet: CapletConfig,
+): Promise<{ callable?: CallableCaplet; hidden?: HiddenCaplet }> {
+  if (caplet.disabled) return { hidden: { capletId: caplet.server, reason: "disabled" } };
+  if (caplet.setup) return { hidden: { capletId: caplet.server, reason: "setup_required" } };
+  if (caplet.projectBinding?.required) {
+    return { hidden: { capletId: caplet.server, reason: "project_binding_required" } };
+  }
+
+  const exposure = resolveExposure(caplet.exposure, options.config.options.exposure);
+  if (!exposure.direct) {
+    return {
+      callable: {
+        caplet,
+        exposure,
+        tools: [],
+        resources: [],
+        resourceTemplates: [],
+        prompts: [],
+        discoveredAt: Date.now(),
+      },
+    };
+  }
+  try {
+    const tools = await withTimeout(
+      options.listTools(caplet),
+      options.config.options.exposureDiscoveryTimeoutMs,
+    );
+    const resources =
+      caplet.backend === "mcp" && options.listResources
+        ? await withTimeout(
+            options.listResources(caplet),
+            options.config.options.exposureDiscoveryTimeoutMs,
+          )
+        : [];
+    const resourceTemplates =
+      caplet.backend === "mcp" && options.listResourceTemplates
+        ? await withTimeout(
+            options.listResourceTemplates(caplet),
+            options.config.options.exposureDiscoveryTimeoutMs,
+          )
+        : [];
+    const prompts =
+      caplet.backend === "mcp" && options.listPrompts
+        ? await withTimeout(
+            options.listPrompts(caplet),
+            options.config.options.exposureDiscoveryTimeoutMs,
+          )
+        : [];
+    if (
+      tools.length === 0 &&
+      resources.length === 0 &&
+      resourceTemplates.length === 0 &&
+      prompts.length === 0
+    ) {
+      return { hidden: { capletId: caplet.server, reason: "empty_surface" } };
+    }
+    return {
+      callable: {
+        caplet,
+        exposure,
+        tools,
+        resources,
+        resourceTemplates,
+        prompts,
+        discoveredAt: Date.now(),
+      },
+    };
+  } catch (error) {
+    return {
+      hidden: {
+        capletId: caplet.server,
+        reason: "discovery_failed",
+        error: toSafeError(error, "SERVER_UNAVAILABLE"),
+      },
+    };
+  }
+}
+
+async function mapWithConcurrency<T, R>(
+  values: T[],
+  concurrency: number,
+  mapper: (value: T) => Promise<R>,
+): Promise<R[]> {
+  const results: R[] = [];
+  let index = 0;
+  async function worker(): Promise<void> {
+    for (;;) {
+      const current = index;
+      index += 1;
+      if (current >= values.length) return;
+      results[current] = await mapper(values[current]!);
+    }
+  }
+  await Promise.all(Array.from({ length: Math.min(concurrency, values.length) }, () => worker()));
+  return results;
+}
+
+async function withTimeout<T>(promise: Promise<T>, timeoutMs: number): Promise<T> {
+  let timeout: NodeJS.Timeout | undefined;
+  try {
+    return await Promise.race([
+      promise,
+      new Promise<never>((_, reject) => {
+        timeout = setTimeout(() => reject(new Error("Exposure discovery timed out")), timeoutMs);
+      }),
+    ]);
+  } finally {
+    if (timeout) clearTimeout(timeout);
+  }
+}
diff --git a/packages/core/src/exposure/policy.ts b/packages/core/src/exposure/policy.ts
new file mode 100644
index 0000000..9fa70d3
--- /dev/null
+++ b/packages/core/src/exposure/policy.ts
@@ -0,0 +1,21 @@
+import type { CapletExposure } from "../config";
+
+export type ResolvedExposure = {
+  value: CapletExposure;
+  direct: boolean;
+  progressive: boolean;
+  codeMode: boolean;
+};
+
+export function resolveExposure(
+  capletExposure: CapletExposure | undefined,
+  globalExposure: CapletExposure,
+): ResolvedExposure {
+  const value = capletExposure ?? globalExposure;
+  return {
+    value,
+    direct: value === "direct" || value === "direct_and_code_mode",
+    progressive: value === "progressive" || value === "progressive_and_code_mode",
+    codeMode: value === "code_mode" || value.endsWith("_and_code_mode"),
+  };
+}
diff --git a/packages/core/src/native/service.ts b/packages/core/src/native/service.ts
index 04c5886..e709af4 100644
--- a/packages/core/src/native/service.ts
+++ b/packages/core/src/native/service.ts
@@ -22,10 +22,13 @@ import {
   nativeCodeModeToolId,
   nativeCodeModeToolName,
 } from "./tools";
+import { nativeDirectToolName } from "../exposure/direct-names";
+import { resolveExposure } from "../exposure/policy";
 import {
   generateCodeModeDeclarations,
   generateCodeModeRunToolDescription,
 } from "../code-mode/declarations";
+import type { DirectToolRegistration, ExposureSnapshot } from "../exposure/discovery";
 import { runCodeMode } from "../code-mode/runner";
 import {
   codeModeRunInputJsonSchema,
@@ -67,6 +70,7 @@ export type NativeCapletTool = {
   avoidWhen?: string;
   promptGuidance: string[];
   inputSchema?: ReturnType<typeof generatedToolInputJsonSchemaForCaplet> | Record<string, unknown>;
+  outputSchema?: Record<string, unknown>;
   operationNames?: string[];
 };
 
@@ -118,6 +122,8 @@ type LocalNativeCapletsServiceOptions = NativeCapletsServiceOptions & {
 
 class DefaultNativeCapletsService implements NativeCapletsService {
   private readonly engine: CapletsEngine;
+  private directToolRoutes = new Map<string, { capletId: string; operationName: string }>();
+  private exposureSnapshot: ExposureSnapshot | undefined;
 
   constructor(options: LocalNativeCapletsServiceOptions) {
     this.engine = new CapletsEngine({
@@ -127,33 +133,61 @@ class DefaultNativeCapletsService implements NativeCapletsService {
   }
 
   listTools(): NativeCapletTool[] {
-    const capletTools = this.engine.enabledServers().map((caplet) => {
-      const toolName = nativeCapletToolName(caplet.server);
-      const inputSchema = generatedToolInputJsonSchemaForCaplet(caplet);
-      return {
-        caplet: caplet.server,
-        toolName,
-        title: caplet.name,
-        description: nativeCapletToolDescription(toolName, caplet),
-        ...(caplet.useWhen ? { useWhen: caplet.useWhen } : {}),
-        ...(caplet.avoidWhen ? { avoidWhen: caplet.avoidWhen } : {}),
-        promptGuidance: nativeCapletPromptGuidance(toolName, caplet),
-        inputSchema,
-        operationNames: [...inputSchema.properties.operation.enum],
-      };
-    });
-    return [...capletTools, codeModeRunNativeTool(capletTools)];
+    this.directToolRoutes = new Map();
+    const progressiveTools: NativeCapletTool[] = [];
+    const codeModeCaplets: NativeCapletTool[] = [];
+    const directTools: NativeCapletTool[] = [];
+    for (const caplet of this.engine.enabledServers()) {
+      if (caplet.setup || caplet.projectBinding?.required) continue;
+      const exposure = resolveExposure(
+        caplet.exposure,
+        this.engine.currentConfig().options.exposure,
+      );
+      if (exposure.progressive) {
+        const tool = progressiveNativeTool(caplet);
+        progressiveTools.push(tool);
+        if (exposure.codeMode) codeModeCaplets.push(tool);
+        continue;
+      }
+      if (exposure.direct) {
+        directTools.push(...this.directNativeTools(caplet, this.exposureSnapshot));
+      }
+      if (exposure.codeMode) {
+        codeModeCaplets.push(codeModeCapletDescriptor(caplet));
+      }
+    }
+    return [
+      ...progressiveTools,
+      ...directTools,
+      ...(codeModeCaplets.length > 0 ? [codeModeRunNativeTool(codeModeCaplets)] : []),
+    ];
   }
 
   async execute(capletId: string, request: unknown): Promise<unknown> {
     if (capletId === nativeCodeModeToolId && isCodeModeRunRequest(request)) {
       return await executeCodeModeRunNative(this, request);
     }
+    const route = this.directToolRoutes.get(capletId);
+    if (route) {
+      if (isMcpPrimitiveRoute(route.operationName)) {
+        return await this.engine.execute(
+          route.capletId,
+          nativeMcpPrimitiveRequest(route.operationName, request),
+        );
+      }
+      return await this.engine.executeDirectTool(
+        route.capletId,
+        route.operationName,
+        isRecord(request) ? request : {},
+      );
+    }
     return await this.engine.execute(capletId, request);
   }
 
   async reload(): Promise<boolean> {
-    return await this.engine.reload();
+    const reloaded = await this.engine.reload();
+    await this.refreshExposureSnapshot();
+    return reloaded;
   }
 
   onToolsChanged(listener: NativeCapletsToolsChangedListener): () => void {
@@ -163,6 +197,218 @@ class DefaultNativeCapletsService implements NativeCapletsService {
   async close(): Promise<void> {
     await this.engine.close();
   }
+
+  private directNativeTools(
+    caplet: ReturnType<CapletsEngine["enabledServers"]>[number],
+    snapshot: ExposureSnapshot | undefined,
+  ): NativeCapletTool[] {
+    if (caplet.backend === "http") {
+      return Object.entries(caplet.actions)
+        .sort(([left], [right]) => left.localeCompare(right))
+        .map(([operationName, action]) =>
+          this.directNativeTool(caplet, operationName, {
+            ...(action.description ? { description: action.description } : {}),
+            ...(action.inputSchema ? { inputSchema: action.inputSchema } : {}),
+            ...(action.outputSchema ? { outputSchema: action.outputSchema } : {}),
+            annotations: {
+              readOnlyHint: action.method === "GET",
+              destructiveHint: action.method === "DELETE",
+            },
+          }),
+        );
+    }
+    if (caplet.backend === "cli") {
+      return Object.entries(caplet.actions)
+        .sort(([left], [right]) => left.localeCompare(right))
+        .map(([operationName, action]) =>
+          this.directNativeTool(caplet, operationName, {
+            ...(action.description ? { description: action.description } : {}),
+            ...(action.inputSchema ? { inputSchema: action.inputSchema } : {}),
+            ...(action.outputSchema ? { outputSchema: action.outputSchema } : {}),
+            ...(action.annotations ? { annotations: action.annotations } : {}),
+          }),
+        );
+    }
+    if (caplet.backend === "mcp") {
+      const directTools =
+        snapshot?.directTools
+          .filter((entry) => entry.caplet.server === caplet.server)
+          .map((entry) => this.directMcpTool(caplet, entry)) ?? [];
+      return [
+        ...directTools,
+        ...mcpPrimitiveNativeTools(caplet, snapshot).map((operationName) =>
+          this.directNativeTool(caplet, operationName, {
+            description: `MCP ${operationName.replace(/_/g, " ")}.`,
+            inputSchema: nativeMcpPrimitiveInputSchema(operationName),
+          }),
+        ),
+      ];
+    }
+    return [];
+  }
+
+  private directMcpTool(
+    caplet: ReturnType<CapletsEngine["enabledServers"]>[number],
+    entry: DirectToolRegistration,
+  ): NativeCapletTool {
+    return this.directNativeTool(caplet, entry.downstreamName, {
+      ...(entry.tool.description ? { description: entry.tool.description } : {}),
+      ...(entry.tool.inputSchema
+        ? { inputSchema: entry.tool.inputSchema as Record<string, unknown> }
+        : {}),
+      ...(entry.tool.outputSchema
+        ? { outputSchema: entry.tool.outputSchema as Record<string, unknown> }
+        : {}),
+      ...(entry.tool.annotations ? { annotations: entry.tool.annotations } : {}),
+    });
+  }
+
+  private directNativeTool(
+    caplet: ReturnType<CapletsEngine["enabledServers"]>[number],
+    operationName: string,
+    options: {
+      description?: string;
+      inputSchema?: Record<string, unknown>;
+      outputSchema?: Record<string, unknown>;
+      annotations?: Record<string, unknown>;
+    },
+  ): NativeCapletTool {
+    const routeId = `${caplet.server}__${operationName}`;
+    const toolName = nativeDirectToolName(caplet.server, operationName);
+    this.directToolRoutes.set(routeId, { capletId: caplet.server, operationName });
+    return {
+      caplet: routeId,
+      toolName,
+      title: operationName,
+      description: options.description ?? "",
+      ...(caplet.useWhen ? { useWhen: caplet.useWhen } : {}),
+      ...(caplet.avoidWhen ? { avoidWhen: caplet.avoidWhen } : {}),
+      promptGuidance: [`Use ${toolName} for ${caplet.name} ${operationName}.`],
+      ...(options.inputSchema ? { inputSchema: options.inputSchema } : {}),
+      ...(options.outputSchema ? { outputSchema: options.outputSchema } : {}),
+    };
+  }
+
+  private async refreshExposureSnapshot(): Promise<void> {
+    this.exposureSnapshot = await this.engine.exposureSnapshot();
+  }
+}
+
+function progressiveNativeTool(
+  caplet: ReturnType<CapletsEngine["enabledServers"]>[number],
+): NativeCapletTool {
+  const toolName = nativeCapletToolName(caplet.server);
+  const inputSchema = generatedToolInputJsonSchemaForCaplet(caplet);
+  return {
+    caplet: caplet.server,
+    toolName,
+    title: caplet.name,
+    description: nativeCapletToolDescription(toolName, caplet),
+    ...(caplet.useWhen ? { useWhen: caplet.useWhen } : {}),
+    ...(caplet.avoidWhen ? { avoidWhen: caplet.avoidWhen } : {}),
+    promptGuidance: nativeCapletPromptGuidance(toolName, caplet),
+    inputSchema,
+    operationNames: [...inputSchema.properties.operation.enum],
+  };
+}
+
+function codeModeCapletDescriptor(
+  caplet: ReturnType<CapletsEngine["enabledServers"]>[number],
+): NativeCapletTool {
+  const toolName = nativeCapletToolName(caplet.server);
+  return {
+    caplet: caplet.server,
+    toolName,
+    title: caplet.name,
+    description: nativeCapletToolDescription(toolName, caplet),
+    ...(caplet.useWhen ? { useWhen: caplet.useWhen } : {}),
+    ...(caplet.avoidWhen ? { avoidWhen: caplet.avoidWhen } : {}),
+    promptGuidance: nativeCapletPromptGuidance(toolName, caplet),
+  };
+}
+
+function mcpPrimitiveNativeTools(
+  caplet: ReturnType<CapletsEngine["enabledServers"]>[number],
+  snapshot: ExposureSnapshot | undefined,
+): string[] {
+  const operations = [];
+  if (snapshot?.directResources.some((entry) => entry.caplet.server === caplet.server)) {
+    operations.push("list_resources", "read_resource");
+  }
+  if (snapshot?.directResourceTemplates.some((entry) => entry.caplet.server === caplet.server)) {
+    operations.push("list_resource_templates", "read_resource");
+  }
+  if (snapshot?.directPrompts.some((entry) => entry.caplet.server === caplet.server)) {
+    operations.push("list_prompts", "get_prompt", "complete");
+  }
+  return [...new Set(operations)];
+}
+
+function nativeMcpPrimitiveInputSchema(operationName: string): Record<string, unknown> {
+  if (operationName === "read_resource") {
+    return {
+      type: "object",
+      properties: { uri: { type: "string" } },
+      required: ["uri"],
+      additionalProperties: false,
+    };
+  }
+  if (operationName === "get_prompt") {
+    return {
+      type: "object",
+      properties: {
+        name: { type: "string" },
+        args: { type: "object", additionalProperties: true },
+      },
+      required: ["name"],
+      additionalProperties: false,
+    };
+  }
+  if (operationName === "complete") {
+    return {
+      type: "object",
+      properties: {
+        ref: { type: "object", additionalProperties: true },
+        argument: { type: "object", additionalProperties: true },
+      },
+      required: ["ref", "argument"],
+      additionalProperties: false,
+    };
+  }
+  return { type: "object", additionalProperties: false };
+}
+
+function isMcpPrimitiveRoute(operationName: string): boolean {
+  return [
+    "list_resources",
+    "list_resource_templates",
+    "read_resource",
+    "list_prompts",
+    "get_prompt",
+    "complete",
+  ].includes(operationName);
+}
+
+function nativeMcpPrimitiveRequest(
+  operationName: string,
+  request: unknown,
+): Record<string, unknown> {
+  const args = isRecord(request) ? request : {};
+  if (operationName === "list_resources") return { operation: "resources" };
+  if (operationName === "list_resource_templates") return { operation: "resource_templates" };
+  if (operationName === "list_prompts") return { operation: "prompts" };
+  if (operationName === "read_resource") return { operation: "read_resource", uri: args.uri };
+  if (operationName === "get_prompt") {
+    return { operation: "get_prompt", name: args.name, args: args.args ?? {} };
+  }
+  if (operationName === "complete") {
+    return { operation: "complete", ref: args.ref, argument: args.argument };
+  }
+  return { operation: operationName };
+}
+
+function isRecord(value: unknown): value is Record<string, unknown> {
+  return Boolean(value) && typeof value === "object" && !Array.isArray(value);
 }
 
 function codeModeRunNativeTool(capletTools: NativeCapletTool[]): NativeCapletTool {
diff --git a/packages/core/src/observed-output-shapes/key.ts b/packages/core/src/observed-output-shapes/key.ts
index 068d5a1..08283d4 100644
--- a/packages/core/src/observed-output-shapes/key.ts
+++ b/packages/core/src/observed-output-shapes/key.ts
@@ -1,6 +1,7 @@
 import { createHash } from "node:crypto";
 import type { CapletConfig } from "../config";
 import { schemaHash } from "../schema-hash";
+import { stableJsonStringify } from "../stable-json";
 import { OBSERVED_OUTPUT_SHAPE_VERSION, type ObservedOutputShapeKey } from "./types";
 
 export function observedOutputShapeStorageKey(key: ObservedOutputShapeKey): string {
@@ -37,9 +38,7 @@ export function backendFingerprint(caplet: CapletConfig): string {
 }
 
 export function stableHash(value: unknown): string {
-  return createHash("sha256")
-    .update(JSON.stringify(stableJsonValue(value)))
-    .digest("hex");
+  return createHash("sha256").update(stableJsonStringify(value)).digest("hex");
 }
 
 function nonSecretBackendIdentity(caplet: CapletConfig): unknown {
@@ -121,19 +120,3 @@ function nonSecretBackendIdentity(caplet: CapletConfig): unknown {
       };
   }
 }
-
-function stableJsonValue(value: unknown): unknown {
-  if (Array.isArray(value)) {
-    return value.map((item) => stableJsonValue(item));
-  }
-  if (value && typeof value === "object") {
-    const record = value as Record<string, unknown>;
-    const sorted: Record<string, unknown> = {};
-    for (const key of Object.keys(record).sort()) {
-      const item = record[key];
-      if (item !== undefined) sorted[key] = stableJsonValue(item);
-    }
-    return sorted;
-  }
-  return value;
-}
diff --git a/packages/core/src/project-binding/index.ts b/packages/core/src/project-binding/index.ts
new file mode 100644
index 0000000..38360c0
--- /dev/null
+++ b/packages/core/src/project-binding/index.ts
@@ -0,0 +1,9 @@
+export { PROJECT_BINDING_STATES, PROJECT_BINDING_SYNC_STATES } from "./types";
+export type {
+  BindingTerminalReason,
+  ProjectBindingLease,
+  ProjectBindingSetupReceipt,
+  ProjectBindingState,
+  ProjectBindingSyncState,
+  ProjectBindingWorkspaceMetadata,
+} from "./types";
diff --git a/packages/core/src/redaction.ts b/packages/core/src/redaction.ts
new file mode 100644
index 0000000..1fb6ed3
--- /dev/null
+++ b/packages/core/src/redaction.ts
@@ -0,0 +1,50 @@
+export const SECRET_KEY_PATTERN =
+  /(token|secret|authorization|auth|api[-_]?key|password|credential|clientsecret|client_secret|code|refresh)/iu;
+
+export const SECRET_TEXT_PATTERNS = [
+  /(Authorization:\s*Bearer\s+)[0-9A-Za-z._~+/=-]+/giu,
+  /(bearer\s+)[a-z0-9._~+/=-]+/giu,
+  /([?&](?:access_token|refresh_token|token|code)=)[^&\s]+/giu,
+] as const;
+
+export type RedactionResult = {
+  text: string;
+  redacted: boolean;
+};
+
+export type RedactionOptions = {
+  patterns?: readonly RegExp[] | undefined;
+  additionalSecrets?: readonly string[] | undefined;
+  replacement?: string | undefined;
+};
+
+export function isSecretKey(key: string): boolean {
+  return SECRET_KEY_PATTERN.test(key);
+}
+
+export function redactSecretText(value: string, options: RedactionOptions = {}): RedactionResult {
+  const replacement = options.replacement ?? "[REDACTED]";
+  let text = value;
+  for (const pattern of [...(options.patterns ?? []), ...SECRET_TEXT_PATTERNS]) {
+    text = text.replace(pattern, (...args: unknown[]) => {
+      const prefix = typeof args[1] === "string" ? args[1] : "";
+      return `${prefix}${replacement}`;
+    });
+  }
+  for (const secret of options.additionalSecrets?.filter(Boolean) ?? []) {
+    text = text.split(secret).join(replacement);
+  }
+  return { text, redacted: text !== value };
+}
+
+export function redactUnknownSecrets<T>(value: T, options: RedactionOptions = {}): T {
+  if (typeof value === "string") return redactSecretText(value, options).text as T;
+  if (Array.isArray(value)) return value.map((item) => redactUnknownSecrets(item, options)) as T;
+  if (!value || typeof value !== "object") return value;
+  return Object.fromEntries(
+    Object.entries(value).map(([key, entry]) => [
+      key,
+      isSecretKey(key) ? "[REDACTED]" : redactUnknownSecrets(entry, options),
+    ]),
+  ) as T;
+}
diff --git a/packages/core/src/runtime-plan/resources.ts b/packages/core/src/runtime-plan/resources.ts
index 7a51fc8..b73bf88 100644
--- a/packages/core/src/runtime-plan/resources.ts
+++ b/packages/core/src/runtime-plan/resources.ts
@@ -20,6 +20,14 @@ const rank: Record<string, number> = {
   heavy: 3,
 };
 
+export function resourceClassRank(value: string): number {
+  return rank[value] ?? 0;
+}
+
+export function isRuntimeResourceClassAllowed(requested: string, maximum: string): boolean {
+  return resourceClassRank(requested) <= resourceClassRank(maximum);
+}
+
 type ResourceInput = {
   backend?: string | undefined;
   features: string[];
@@ -84,5 +92,5 @@ function capClass(
   maxClass: HostedRuntimeResourceClass | undefined,
 ) {
   if (!maxClass) return requested;
-  return (rank[requested] ?? 0) > (rank[maxClass] ?? 0) ? maxClass : requested;
+  return isRuntimeResourceClassAllowed(requested, maxClass) ? requested : maxClass;
 }
diff --git a/packages/core/src/schema-hash.ts b/packages/core/src/schema-hash.ts
index e711616..afb5aff 100644
--- a/packages/core/src/schema-hash.ts
+++ b/packages/core/src/schema-hash.ts
@@ -1,27 +1,10 @@
 import { createHash } from "node:crypto";
+import { stableJsonStringify } from "./stable-json";
 
 export function schemaHash(schema: unknown | undefined): string | null {
   if (schema === undefined || schema === null) {
     return null;
   }
-  const json = JSON.stringify(stableJsonValue(schema));
+  const json = stableJsonStringify(schema);
   return `sha256:${createHash("sha256").update(json).digest("hex")}`;
 }
-
-function stableJsonValue(value: unknown): unknown {
-  if (Array.isArray(value)) {
-    return value.map((item) => stableJsonValue(item));
-  }
-  if (value && typeof value === "object") {
-    const record = value as Record<string, unknown>;
-    const sorted: Record<string, unknown> = {};
-    for (const key of Object.keys(record).sort()) {
-      const item = record[key];
-      if (item !== undefined) {
-        sorted[key] = stableJsonValue(item);
-      }
-    }
-    return sorted;
-  }
-  return value;
-}
diff --git a/packages/core/src/serve/session.ts b/packages/core/src/serve/session.ts
index 61be5fb..2f71e21 100644
--- a/packages/core/src/serve/session.ts
+++ b/packages/core/src/serve/session.ts
@@ -1,35 +1,60 @@
-import { McpServer, type RegisteredTool } from "@modelcontextprotocol/sdk/server/mcp";
+import {
+  McpServer,
+  ResourceTemplate,
+  type RegisteredPrompt,
+  type RegisteredResource,
+  type RegisteredResourceTemplate,
+  type RegisteredTool,
+} from "@modelcontextprotocol/sdk/server/mcp";
 import type { Transport } from "@modelcontextprotocol/sdk/shared/transport";
+import { z } from "zod";
 import { version as packageJsonVersion } from "../../package.json";
 import type { CapletConfig, CapletsConfig } from "../config";
-import type { CapletsEngine } from "../engine";
-import { capabilityDescription } from "../registry";
-import { generatedToolInputSchemaForCaplet } from "../generated-tool-input-schema";
-import { listCodeModeCallableCaplets } from "../code-mode/api";
 import {
   generateCodeModeDeclarations,
   generateCodeModeRunToolDescription,
 } from "../code-mode/declarations";
+import { CodeModeLogStore } from "../code-mode/logs";
 import { runCodeMode } from "../code-mode/runner";
 import { codeModeRunInputSchema, codeModeRunParamsSchema } from "../code-mode/tool";
-import { CodeModeLogStore } from "../code-mode/logs";
+import type { CapletsEngine } from "../engine";
+import type {
+  CallableCaplet,
+  DirectPromptRegistration,
+  DirectResourceRegistration,
+  DirectResourceTemplateRegistration,
+  DirectToolRegistration,
+  ExposureSnapshot,
+} from "../exposure/discovery";
+import { decodeDirectResourceUri } from "../exposure/direct-names";
+import { resolveExposure } from "../exposure/policy";
+import { generatedToolInputSchemaForCaplet } from "../generated-tool-input-schema";
 import type { NativeCapletTool, NativeCapletsService } from "../native/service";
 import {
   nativeCapletPromptGuidance,
   nativeCapletToolDescription,
   nativeCapletToolName,
 } from "../native/tools";
+import { capabilityDescription } from "../registry";
 
-export type ToolServer = Pick<McpServer, "registerTool" | "connect" | "close">;
+export type ToolServer = Pick<McpServer, "registerTool" | "connect" | "close"> &
+  Partial<Pick<McpServer, "registerResource" | "registerPrompt">>;
 
 export type CapletsMcpSessionOptions = {
   server?: ToolServer;
 };
 
+type ToolRegistrationPlan = {
+  register(): RegisteredTool;
+  update(tool: RegisteredTool): void;
+};
+
 export class CapletsMcpSession {
   readonly server: ToolServer;
   private readonly tools = new Map<string, RegisteredTool>();
-  private readonly codeModeTool: RegisteredTool;
+  private readonly resources = new Map<string, RegisteredResource | RegisteredResourceTemplate>();
+  private readonly prompts = new Map<string, RegisteredPrompt>();
+  private codeModeTool: RegisteredTool | undefined;
   private readonly unsubscribeReload: () => void;
   private closed = false;
 
@@ -43,14 +68,17 @@ export class CapletsMcpSession {
         name: "caplets",
         version: packageJsonVersion,
       });
-    this.codeModeTool = this.registerCodeModeTool();
-    this.unsubscribeReload = this.engine.onReload(({ previous, next }) =>
-      this.reconcileTools(previous, next),
+    this.unsubscribeReload = this.engine.onReload(({ previous, next }) => {
+      this.reconcileFromSnapshot(staticExposureSnapshot(next, this.engine.enabledServers()));
+      void this.refreshExposure(previous, next);
+    });
+    this.reconcileFromSnapshot(
+      staticExposureSnapshot(this.engine.currentConfig(), this.engine.enabledServers()),
     );
-    this.reconcileTools(undefined, this.engine.currentConfig());
   }
 
   async connect(transport: Transport): Promise<void> {
+    await this.refreshExposure(undefined, this.engine.currentConfig());
     await this.server.connect(transport);
   }
 
@@ -58,24 +86,129 @@ export class CapletsMcpSession {
     return [...this.tools.keys()].sort();
   }
 
+  async refreshExposure(
+    _previous: CapletsConfig | undefined = undefined,
+    _next: CapletsConfig = this.engine.currentConfig(),
+  ): Promise<void> {
+    if (this.closed) return;
+    this.reconcileFromSnapshot(await this.engine.exposureSnapshot());
+  }
+
   async close(): Promise<void> {
-    if (this.closed) {
-      return;
-    }
+    if (this.closed) return;
     this.closed = true;
     this.unsubscribeReload();
-    this.codeModeTool.remove();
-    this.tools.clear();
+    this.clearRegistrations();
     await this.server.close();
   }
 
-  private registerCodeModeTool(): RegisteredTool {
-    const codeModeService = new EngineNativeCapletsService(this.engine);
+  private reconcileFromSnapshot(snapshot: ExposureSnapshot): void {
+    if (snapshot.codeModeCaplets.length > 0) {
+      if (this.codeModeTool) {
+        this.codeModeTool.update({
+          title: "Code Mode",
+          description: codeModeRunToolDescription(snapshot.codeModeCaplets),
+          paramsSchema: codeModeRunParamsSchema,
+          callback: async (request: unknown) => this.handleCodeModeRunTool(request),
+          enabled: true,
+        });
+      } else {
+        this.codeModeTool = this.registerCodeModeTool(snapshot);
+      }
+    } else if (this.codeModeTool) {
+      this.codeModeTool.remove();
+      this.codeModeTool = undefined;
+    }
+
+    const desiredTools = new Map<string, ToolRegistrationPlan>();
+    for (const entry of snapshot.progressiveCaplets) {
+      desiredTools.set(entry.caplet.server, {
+        register: () => this.registerCapletTool(entry.caplet),
+        update: (tool) =>
+          (tool.update as (updates: Record<string, unknown>) => void)({
+            title: entry.caplet.name,
+            description: capabilityDescription(entry.caplet),
+            paramsSchema: generatedToolInputSchemaForCaplet(entry.caplet).shape,
+            callback: async (request: unknown) =>
+              this.engine.execute(entry.caplet.server, request) as never,
+            enabled: true,
+          }),
+      });
+    }
+    for (const entry of snapshot.directTools) {
+      desiredTools.set(entry.name, {
+        register: () => this.registerDirectTool(entry),
+        update: (tool) =>
+          (tool.update as (updates: Record<string, unknown>) => void)({
+            title: entry.tool.name,
+            description: entry.tool.description,
+            paramsSchema: entry.tool.inputSchema as never,
+            outputSchema: entry.tool.outputSchema as never,
+            annotations: entry.tool.annotations,
+            _meta: {
+              caplets: {
+                capletId: entry.caplet.server,
+                downstreamName: entry.downstreamName,
+                exposure: "direct",
+              },
+            },
+            callback: async (request: unknown) =>
+              this.engine.executeDirectTool(
+                entry.caplet.server,
+                entry.downstreamName,
+                isRecord(request) ? request : {},
+              ) as never,
+            enabled: true,
+          }),
+      });
+    }
+    for (const [name, tool] of this.tools) {
+      const plan = desiredTools.get(name);
+      if (!plan) {
+        tool.remove();
+        this.tools.delete(name);
+      } else {
+        plan.update(tool);
+      }
+    }
+    for (const [name, plan] of desiredTools) {
+      if (!this.tools.has(name)) {
+        this.tools.set(name, plan.register());
+      }
+    }
+
+    for (const resource of this.resources.values()) resource.remove();
+    for (const prompt of this.prompts.values()) prompt.remove();
+    this.resources.clear();
+    this.prompts.clear();
+    for (const entry of snapshot.directResources) {
+      this.resources.set(entry.uri, this.registerDirectResource(entry));
+    }
+    for (const entry of coalesceResourceTemplates(snapshot.directResourceTemplates)) {
+      this.resources.set(entry.uriTemplate, this.registerDirectResourceTemplate(entry));
+    }
+    for (const entry of snapshot.directPrompts) {
+      this.prompts.set(entry.name, this.registerDirectPrompt(entry));
+    }
+  }
+
+  private clearRegistrations(): void {
+    this.codeModeTool?.remove();
+    this.codeModeTool = undefined;
+    for (const tool of this.tools.values()) tool.remove();
+    for (const resource of this.resources.values()) resource.remove();
+    for (const prompt of this.prompts.values()) prompt.remove();
+    this.tools.clear();
+    this.resources.clear();
+    this.prompts.clear();
+  }
+
+  private registerCodeModeTool(snapshot: ExposureSnapshot): RegisteredTool {
     return this.server.registerTool(
       "code_mode",
       {
         title: "Code Mode",
-        description: codeModeRunToolDescription(codeModeService),
+        description: codeModeRunToolDescription(snapshot.codeModeCaplets),
         inputSchema: codeModeRunParamsSchema,
       },
       async (request: unknown) => this.handleCodeModeRunTool(request),
@@ -116,67 +249,117 @@ export class CapletsMcpSession {
     };
   }
 
-  private reconcileTools(previous: CapletsConfig | undefined, next: CapletsConfig): void {
-    if (previous) {
-      this.codeModeTool.update({
-        title: "Code Mode",
-        description: codeModeRunToolDescription(new EngineNativeCapletsService(this.engine)),
-        paramsSchema: codeModeRunParamsSchema,
-        callback: async (request: unknown) => this.handleCodeModeRunTool(request),
-        enabled: true,
-      });
-    }
-
-    const enabled = new Map(nextEnabledServers(next).map((server) => [server.server, server]));
+  private registerCapletTool(caplet: CapletConfig): RegisteredTool {
+    return this.server.registerTool(
+      caplet.server,
+      {
+        title: caplet.name,
+        description: capabilityDescription(caplet),
+        inputSchema: generatedToolInputSchemaForCaplet(caplet).shape,
+      },
+      async (request: unknown) => this.engine.execute(caplet.server, request) as never,
+    );
+  }
 
-    for (const [serverId, tool] of this.tools) {
-      const caplet = enabled.get(serverId);
-      if (!caplet) {
-        tool.remove();
-        this.tools.delete(serverId);
-        continue;
-      }
+  private registerDirectTool(entry: DirectToolRegistration): RegisteredTool {
+    return (this.server.registerTool as (...args: unknown[]) => RegisteredTool)(
+      entry.name,
+      {
+        title: entry.tool.name,
+        ...(entry.tool.description ? { description: entry.tool.description } : {}),
+        ...(entry.tool.inputSchema ? { inputSchema: entry.tool.inputSchema as never } : {}),
+        ...(entry.tool.outputSchema ? { outputSchema: entry.tool.outputSchema as never } : {}),
+        ...(entry.tool.annotations ? { annotations: entry.tool.annotations } : {}),
+        _meta: {
+          caplets: {
+            capletId: entry.caplet.server,
+            downstreamName: entry.downstreamName,
+            exposure: "direct",
+          },
+        },
+      },
+      async (request: unknown) =>
+        this.engine.executeDirectTool(
+          entry.caplet.server,
+          entry.downstreamName,
+          isRecord(request) ? request : {},
+        ) as never,
+    );
+  }
 
-      const previousCaplet = previous ? capletById(previous, serverId) : undefined;
-      if (!previousCaplet || serializeCaplet(previousCaplet) !== serializeCaplet(caplet)) {
-        tool.update({
-          title: caplet.name,
-          description: capabilityDescription(caplet),
-          paramsSchema: generatedToolInputSchemaForCaplet(caplet).shape,
-          callback: async (request: unknown) => this.handleTool(serverId, request),
-          enabled: true,
-        });
-      }
+  private registerDirectResource(entry: DirectResourceRegistration): RegisteredResource {
+    if (!this.server.registerResource) {
+      throw new Error("MCP server does not support resource registration");
     }
+    return this.server.registerResource(
+      entry.resource.name ?? entry.uri,
+      entry.uri,
+      resourceMetadata(entry.resource),
+      async () => this.directResourceResult(entry.caplet.server, entry.downstreamUri),
+    );
+  }
 
-    for (const caplet of enabled.values()) {
-      if (this.tools.has(caplet.server)) {
-        continue;
-      }
-      this.tools.set(caplet.server, this.registerCapletTool(caplet));
+  private registerDirectResourceTemplate(
+    entry: DirectResourceTemplateRegistration,
+  ): RegisteredResourceTemplate {
+    if (!this.server.registerResource) {
+      throw new Error("MCP server does not support resource registration");
     }
+    return this.server.registerResource(
+      entry.caplet.server,
+      new ResourceTemplate(entry.uriTemplate, { list: undefined }),
+      resourceTemplateMetadata(entry.resourceTemplate),
+      async (uri) => {
+        const decoded = decodeDirectResourceUri(uri.toString());
+        return this.directResourceResult(decoded.capletId, decoded.downstreamUri);
+      },
+    );
   }
 
-  private registerCapletTool(caplet: CapletConfig): RegisteredTool {
-    return this.server.registerTool(
-      caplet.server,
+  private registerDirectPrompt(entry: DirectPromptRegistration): RegisteredPrompt {
+    if (!this.server.registerPrompt) {
+      throw new Error("MCP server does not support prompt registration");
+    }
+    return this.server.registerPrompt(
+      entry.name,
       {
-        title: caplet.name,
-        description: capabilityDescription(caplet),
-        inputSchema: generatedToolInputSchemaForCaplet(caplet).shape,
+        title: entry.prompt.name,
+        ...(entry.prompt.description ? { description: entry.prompt.description } : {}),
+        argsSchema: promptArgsSchema(entry.prompt.arguments),
       },
-      async (request: unknown) => this.handleTool(caplet.server, request),
+      async (args) =>
+        (await this.engine.getDirectPrompt(
+          entry.caplet.server,
+          entry.downstreamName,
+          isRecord(args) ? stringifyRecord(args) : {},
+        )) as never,
     );
   }
 
-  private async handleTool(serverId: string, request: unknown): Promise<any> {
-    return await this.engine.execute(serverId, request);
+  private async directResourceResult(serverId: string, downstreamUri: string): Promise<any> {
+    const result = await this.engine.readDirectResource(serverId, downstreamUri);
+    if (isRecord(result) && "contents" in result) return result;
+    return {
+      contents: [
+        {
+          uri: downstreamUri,
+          mimeType: "application/json",
+          text: JSON.stringify(result, null, 2),
+        },
+      ],
+    };
   }
 }
 
-function codeModeRunToolDescription(service: NativeCapletsService): string {
+function codeModeRunToolDescription(caplets: CallableCaplet[]): string {
   const declaration = generateCodeModeDeclarations({
-    caplets: listCodeModeCallableCaplets(service),
+    caplets: caplets.map((entry) => ({
+      id: entry.caplet.server,
+      name: entry.caplet.name,
+      description: capabilityDescription(entry.caplet),
+      ...(entry.caplet.useWhen ? { useWhen: entry.caplet.useWhen } : {}),
+      ...(entry.caplet.avoidWhen ? { avoidWhen: entry.caplet.avoidWhen } : {}),
+    })),
   });
   return generateCodeModeRunToolDescription(declaration);
 }
@@ -185,7 +368,10 @@ class EngineNativeCapletsService implements NativeCapletsService {
   constructor(private readonly engine: CapletsEngine) {}
 
   listTools(): NativeCapletTool[] {
-    return this.engine.enabledServers().map((caplet) => {
+    const snapshot = this.engine.currentExposureSnapshot();
+    const caplets =
+      snapshot?.codeModeCaplets.map((entry) => entry.caplet) ?? this.engine.enabledServers();
+    return caplets.map((caplet) => {
       const toolName = nativeCapletToolName(caplet.server);
       return {
         caplet: caplet.server,
@@ -214,28 +400,84 @@ class EngineNativeCapletsService implements NativeCapletsService {
   }
 }
 
-function nextEnabledServers(config: CapletsConfig): CapletConfig[] {
-  return [
-    ...Object.values(config.mcpServers),
-    ...Object.values(config.openapiEndpoints),
-    ...Object.values(config.graphqlEndpoints),
-    ...Object.values(config.httpApis),
-    ...Object.values(config.cliTools),
-    ...Object.values(config.capletSets),
-  ].filter((server) => !server.disabled);
+function resourceMetadata(resource: DirectResourceRegistration["resource"]) {
+  return {
+    ...(resource.description ? { description: resource.description } : {}),
+    ...(resource.mimeType ? { mimeType: resource.mimeType } : {}),
+    ...(typeof resource.size === "number" ? { size: resource.size } : {}),
+    _meta: { caplets: { downstreamUri: resource.uri, exposure: "direct" } },
+  };
 }
 
-function capletById(config: CapletsConfig, serverId: string): CapletConfig | undefined {
-  return (
-    config.mcpServers[serverId] ??
-    config.openapiEndpoints[serverId] ??
-    config.graphqlEndpoints[serverId] ??
-    config.httpApis[serverId] ??
-    config.cliTools[serverId] ??
-    config.capletSets[serverId]
+function resourceTemplateMetadata(
+  resourceTemplate: DirectResourceTemplateRegistration["resourceTemplate"],
+) {
+  return {
+    ...(resourceTemplate.description ? { description: resourceTemplate.description } : {}),
+    ...(resourceTemplate.mimeType ? { mimeType: resourceTemplate.mimeType } : {}),
+    _meta: {
+      caplets: { downstreamUriTemplate: resourceTemplate.uriTemplate, exposure: "direct" },
+    },
+  };
+}
+
+function promptArgsSchema(args: DirectPromptRegistration["prompt"]["arguments"]) {
+  const shape: Record<string, z.ZodTypeAny> = {};
+  for (const arg of args ?? []) {
+    shape[arg.name] = z.string().optional();
+  }
+  return shape;
+}
+
+function stringifyRecord(value: Record<string, unknown>): Record<string, string> {
+  return Object.fromEntries(
+    Object.entries(value).map(([key, nested]) => [key, nested === undefined ? "" : String(nested)]),
   );
 }
 
-function serializeCaplet(caplet: CapletConfig | undefined): string {
-  return JSON.stringify(caplet ?? null);
+function coalesceResourceTemplates(
+  entries: DirectResourceTemplateRegistration[],
+): DirectResourceTemplateRegistration[] {
+  const byCaplet = new Map<string, DirectResourceTemplateRegistration>();
+  for (const entry of entries) {
+    byCaplet.set(entry.caplet.server, entry);
+  }
+  return [...byCaplet.values()];
+}
+
+function isRecord(value: unknown): value is Record<string, unknown> {
+  return Boolean(value) && typeof value === "object" && !Array.isArray(value);
+}
+
+function staticExposureSnapshot(config: CapletsConfig, caplets: CapletConfig[]): ExposureSnapshot {
+  const callableCaplets = caplets
+    .filter((caplet) => !caplet.disabled && !caplet.setup && !caplet.projectBinding?.required)
+    .map((caplet) => ({
+      caplet,
+      exposure: resolveExposure(caplet.exposure, config.options.exposure),
+      tools: [],
+      resources: [],
+      resourceTemplates: [],
+      prompts: [],
+      discoveredAt: Date.now(),
+    }));
+  return {
+    callableCaplets,
+    progressiveCaplets: callableCaplets.filter((entry) => entry.exposure.progressive),
+    codeModeCaplets: callableCaplets.filter((entry) => entry.exposure.codeMode),
+    directTools: [],
+    directResources: [],
+    directResourceTemplates: [],
+    directPrompts: [],
+    hiddenCaplets: caplets
+      .filter((caplet) => caplet.disabled || caplet.setup || caplet.projectBinding?.required)
+      .map((caplet) => ({
+        capletId: caplet.server,
+        reason: caplet.disabled
+          ? ("disabled" as const)
+          : caplet.setup
+            ? ("setup_required" as const)
+            : ("project_binding_required" as const),
+      })),
+  };
 }
diff --git a/packages/core/src/stable-json.ts b/packages/core/src/stable-json.ts
new file mode 100644
index 0000000..57a96de
--- /dev/null
+++ b/packages/core/src/stable-json.ts
@@ -0,0 +1,28 @@
+export function stableJsonValue(value: unknown): unknown {
+  if (Array.isArray(value)) {
+    return value.map((item) => stableJsonValue(item));
+  }
+  if (isPlainObject(value)) {
+    const sorted: Record<string, unknown> = {};
+    for (const key of Object.keys(value).sort()) {
+      const item = value[key];
+      if (item !== undefined) sorted[key] = stableJsonValue(item);
+    }
+    return sorted;
+  }
+  return value;
+}
+
+export function stableJsonStringify(value: unknown): string {
+  return JSON.stringify(stableJsonValue(value));
+}
+
+export async function stableJsonSha256Hex(value: unknown): Promise<string> {
+  const bytes = new TextEncoder().encode(stableJsonStringify(value));
+  const digest = await globalThis.crypto.subtle.digest("SHA-256", bytes);
+  return [...new Uint8Array(digest)].map((byte) => byte.toString(16).padStart(2, "0")).join("");
+}
+
+function isPlainObject(value: unknown): value is Record<string, unknown> {
+  return Boolean(value) && typeof value === "object" && !Array.isArray(value);
+}
diff --git a/packages/core/test/caplet-files.test.ts b/packages/core/test/caplet-files.test.ts
index 1b0fa24..29b3857 100644
--- a/packages/core/test/caplet-files.test.ts
+++ b/packages/core/test/caplet-files.test.ts
@@ -33,6 +33,32 @@ openapiEndpoint:
     );
   });
 
+  it("loads top-level exposure from CAPLET.md frontmatter", () => {
+    const result = loadCapletFilesFromMap({
+      files: [
+        {
+          path: "github/CAPLET.md",
+          content: `---
+name: GitHub
+description: Manage GitHub repositories.
+exposure: direct_and_code_mode
+mcpServer:
+  command: github-mcp
+---
+
+# GitHub
+`,
+        },
+      ],
+    });
+
+    expect(result?.config.mcpServers?.github).toEqual(
+      expect.objectContaining({
+        exposure: "direct_and_code_mode",
+      }),
+    );
+  });
+
   it("rejects duplicate in-memory caplet ids", () => {
     expect(() =>
       loadCapletFilesFromMap({
diff --git a/packages/core/test/code-mode-diagnostics.test.ts b/packages/core/test/code-mode-diagnostics.test.ts
index 4629d53..2768641 100644
--- a/packages/core/test/code-mode-diagnostics.test.ts
+++ b/packages/core/test/code-mode-diagnostics.test.ts
@@ -32,6 +32,21 @@ describe("diagnoseCodeModeTypeScript", () => {
     );
   });
 
+  it("does not block fetch text or non-global fetch member calls", () => {
+    const diagnostics = diagnoseCodeModeTypeScript({
+      declaration,
+      code: `
+        const guidance = "Use the browser Caplet instead of await fetch('https://example.com')";
+        const client = { fetch: (value: string) => ({ value }) };
+        const result = client.fetch(guidance);
+        return result;
+      `,
+    });
+
+    expect(diagnostics.map((diagnostic) => diagnostic.code)).not.toContain("FETCH_UNAVAILABLE");
+    expect(diagnostics.filter((diagnostic) => diagnostic.severity === "error")).toEqual([]);
+  });
+
   it("allows standard JavaScript, console, URL, JSON, and Caplet callTool", () => {
     const diagnostics = diagnoseCodeModeTypeScript({
       declaration,
diff --git a/packages/core/test/code-mode-static-analysis.test.ts b/packages/core/test/code-mode-static-analysis.test.ts
new file mode 100644
index 0000000..3b78db8
--- /dev/null
+++ b/packages/core/test/code-mode-static-analysis.test.ts
@@ -0,0 +1,23 @@
+import { describe, expect, it } from "vitest";
+import { hasDirectFetchCall, hasExecutableImport } from "../src/code-mode/static-analysis";
+
+describe("Code Mode static analysis", () => {
+  it("detects direct fetch calls without blocking text or member fetch calls", () => {
+    expect(hasDirectFetchCall('await fetch("https://example.com");')).toBe(true);
+    expect(hasDirectFetchCall('await globalThis.fetch("https://example.com");')).toBe(true);
+    expect(hasDirectFetchCall('const note = "await fetch(\\"https://example.com\\")";')).toBe(
+      false,
+    );
+    expect(hasDirectFetchCall("const result = client.fetch('/issues');")).toBe(false);
+  });
+
+  it("detects executable imports without blocking import text", () => {
+    expect(hasExecutableImport('import fs from "node:fs";')).toBe(true);
+    expect(hasExecutableImport('import { readFile } from "node:fs";')).toBe(true);
+    expect(hasExecutableImport('import "node:fs";')).toBe(true);
+    expect(hasExecutableImport('await import("node:fs");')).toBe(true);
+    expect(hasExecutableImport('export { readFile } from "node:fs";')).toBe(true);
+    expect(hasExecutableImport('const note = "import fs from node:fs";')).toBe(false);
+    expect(hasExecutableImport("const result = client.import('value');")).toBe(false);
+  });
+});
diff --git a/packages/core/test/config.test.ts b/packages/core/test/config.test.ts
index a2eb248..f1c96a4 100644
--- a/packages/core/test/config.test.ts
+++ b/packages/core/test/config.test.ts
@@ -41,6 +41,37 @@ describe("config", () => {
     }
   });
 
+  it("defaults exposure options and accepts per-Caplet exposure overrides", () => {
+    expect(parseConfig({}).options).toMatchObject({
+      exposure: "progressive_and_code_mode",
+      exposureDiscoveryTimeoutMs: 15000,
+      exposureDiscoveryConcurrency: 4,
+    });
+
+    const config = parseConfig({
+      options: {
+        exposure: "direct",
+        exposureDiscoveryTimeoutMs: 5000,
+        exposureDiscoveryConcurrency: 8,
+      },
+      mcpServers: {
+        github: {
+          name: "GitHub",
+          description: "Manage GitHub repositories.",
+          exposure: "direct_and_code_mode",
+          command: "github-mcp",
+        },
+      },
+    });
+
+    expect(config.options).toMatchObject({
+      exposure: "direct",
+      exposureDiscoveryTimeoutMs: 5000,
+      exposureDiscoveryConcurrency: 8,
+    });
+    expect(config.mcpServers.github?.exposure).toBe("direct_and_code_mode");
+  });
+
   it("loads user config from a path with defaults and interpolation", () => {
     const dir = mkdtempSync(join(tmpdir(), "caplets-config-"));
     const path = join(dir, "config.json");
@@ -470,6 +501,9 @@ describe("config", () => {
     expect(config.options).toEqual({
       defaultSearchLimit: 7,
       maxSearchLimit: 40,
+      exposure: "progressive_and_code_mode",
+      exposureDiscoveryTimeoutMs: 15000,
+      exposureDiscoveryConcurrency: 4,
       completion: {
         discoveryTimeoutMs: 750,
         overallTimeoutMs: 1500,
@@ -1826,6 +1860,9 @@ describe("config", () => {
     expect(config.options).toEqual({
       defaultSearchLimit: 5,
       maxSearchLimit: 10,
+      exposure: "progressive_and_code_mode",
+      exposureDiscoveryTimeoutMs: 15000,
+      exposureDiscoveryConcurrency: 4,
       completion: {
         discoveryTimeoutMs: 750,
         overallTimeoutMs: 1500,
diff --git a/packages/core/test/doctor-cli.test.ts b/packages/core/test/doctor-cli.test.ts
index 4e4d1e2..390e574 100644
--- a/packages/core/test/doctor-cli.test.ts
+++ b/packages/core/test/doctor-cli.test.ts
@@ -17,6 +17,7 @@ describe("caplets doctor", () => {
     expect(report).toContain("Project sync");
     expect(report).toContain("Daemon");
     expect(report).toContain("Cloud Auth");
+    expect(report).toContain("Exposure");
     expect(report).toContain("Code Mode");
     expect(report).not.toContain("local presence");
   });
@@ -63,6 +64,7 @@ describe("caplets doctor", () => {
       sync: { state: "idle" },
       daemon: { running: false },
       cloudAuth: { authenticated: false },
+      exposure: { ok: true },
       codeMode: {
         typesGeneration: { ok: true },
         diagnostics: { ok: true },
diff --git a/packages/core/test/exposure-direct-names.test.ts b/packages/core/test/exposure-direct-names.test.ts
new file mode 100644
index 0000000..ef20542
--- /dev/null
+++ b/packages/core/test/exposure-direct-names.test.ts
@@ -0,0 +1,27 @@
+import { describe, expect, it } from "vitest";
+import {
+  decodeDirectResourceUri,
+  directPromptName,
+  directResourceTemplateUri,
+  directResourceUri,
+  directToolName,
+  nativeDirectToolName,
+} from "../src/exposure/direct-names";
+
+describe("direct exposure names", () => {
+  it("prefixes MCP and native direct operation names without parsing names back", () => {
+    expect(directToolName("git_hub", "repos__list")).toBe("git_hub__repos__list");
+    expect(directPromptName("git-hub", "summarize")).toBe("git-hub__summarize");
+    expect(nativeDirectToolName("git-hub", "repos__list")).toBe("caplets__git-hub__repos__list");
+  });
+
+  it("encodes and decodes direct resource URIs", () => {
+    const encoded = directResourceUri("docs", "file:///src/README.md?rev=main");
+    expect(encoded).toBe("caplets://docs/resources/file%3A%2F%2F%2Fsrc%2FREADME.md%3Frev%3Dmain");
+    expect(decodeDirectResourceUri(encoded)).toEqual({
+      capletId: "docs",
+      downstreamUri: "file:///src/README.md?rev=main",
+    });
+    expect(directResourceTemplateUri("docs")).toBe("caplets://docs/resources/{encodedUri}");
+  });
+});
diff --git a/packages/core/test/exposure-discovery.test.ts b/packages/core/test/exposure-discovery.test.ts
new file mode 100644
index 0000000..667958a
--- /dev/null
+++ b/packages/core/test/exposure-discovery.test.ts
@@ -0,0 +1,121 @@
+import type { Tool } from "@modelcontextprotocol/sdk/types";
+import { describe, expect, it, vi } from "vitest";
+import type { CapletConfig, CapletsConfig } from "../src/config";
+import { discoverExposureSnapshot } from "../src/exposure/discovery";
+
+describe("exposure discovery", () => {
+  it("discovers callable direct and Code Mode surfaces", async () => {
+    const caplet = httpCaplet("osv", "direct_and_code_mode");
+    const snapshot = await discoverExposureSnapshot({
+      config: configFor([caplet], { exposure: "progressive" }),
+      caplets: [caplet],
+      listTools: async () => [tool("query")],
+    });
+
+    expect(snapshot.callableCaplets.map((entry) => entry.caplet.server)).toEqual(["osv"]);
+    expect(snapshot.codeModeCaplets.map((entry) => entry.caplet.server)).toEqual(["osv"]);
+    expect(snapshot.directTools.map((entry) => entry.name)).toEqual(["osv__query"]);
+    expect(snapshot.progressiveCaplets).toEqual([]);
+  });
+
+  it("hides failed discovery without failing the whole snapshot", async () => {
+    const direct = httpCaplet("direct", "direct");
+    const progressive = httpCaplet("progressive", "progressive");
+    const snapshot = await discoverExposureSnapshot({
+      config: configFor([direct, progressive]),
+      caplets: [direct, progressive],
+      listTools: async (caplet) => {
+        if (caplet.server === "direct") throw new Error("unavailable");
+        return [tool("search")];
+      },
+    });
+
+    expect(snapshot.directTools).toEqual([]);
+    expect(snapshot.progressiveCaplets.map((entry) => entry.caplet.server)).toEqual([
+      "progressive",
+    ]);
+    expect(snapshot.hiddenCaplets).toEqual([
+      expect.objectContaining({ capletId: "direct", reason: "discovery_failed" }),
+    ]);
+  });
+
+  it("limits concurrent discovery", async () => {
+    const caplets = [
+      httpCaplet("one", "direct"),
+      httpCaplet("two", "direct"),
+      httpCaplet("three", "direct"),
+    ];
+    let active = 0;
+    let maxActive = 0;
+    const snapshot = await discoverExposureSnapshot({
+      config: configFor(caplets, { exposureDiscoveryConcurrency: 2 }),
+      caplets,
+      listTools: vi.fn(async () => {
+        active += 1;
+        maxActive = Math.max(maxActive, active);
+        await new Promise((resolve) => setTimeout(resolve, 5));
+        active -= 1;
+        return [tool("run")];
+      }),
+    });
+
+    expect(snapshot.directTools).toHaveLength(3);
+    expect(maxActive).toBeLessThanOrEqual(2);
+  });
+});
+
+function configFor(
+  caplets: CapletConfig[],
+  options: Partial<CapletsConfig["options"]> = {},
+): CapletsConfig {
+  return {
+    version: 1,
+    options: {
+      defaultSearchLimit: 20,
+      maxSearchLimit: 50,
+      exposure: "progressive_and_code_mode",
+      exposureDiscoveryTimeoutMs: 15000,
+      exposureDiscoveryConcurrency: 4,
+      completion: {
+        discoveryTimeoutMs: 750,
+        overallTimeoutMs: 1500,
+        cacheTtlMs: 300000,
+        negativeCacheTtlMs: 30000,
+      },
+      ...options,
+    },
+    mcpServers: {},
+    openapiEndpoints: {},
+    graphqlEndpoints: {},
+    httpApis: Object.fromEntries(
+      caplets
+        .filter((caplet) => caplet.backend === "http")
+        .map((caplet) => [caplet.server, caplet]),
+    ) as CapletsConfig["httpApis"],
+    cliTools: {},
+    capletSets: {},
+  };
+}
+
+function httpCaplet(
+  server: string,
+  exposure: CapletConfig["exposure"],
+): Extract<CapletConfig, { backend: "http" }> {
+  return {
+    server,
+    backend: "http",
+    name: server,
+    description: `Call ${server} actions.`,
+    exposure,
+    baseUrl: "https://example.com",
+    auth: { type: "none" },
+    actions: { query: { method: "GET", path: "/query" } },
+    requestTimeoutMs: 60000,
+    maxResponseBytes: 200000,
+    disabled: false,
+  };
+}
+
+function tool(name: string): Tool {
+  return { name, description: `Run ${name}.`, inputSchema: { type: "object" } };
+}
diff --git a/packages/core/test/exposure-policy.test.ts b/packages/core/test/exposure-policy.test.ts
new file mode 100644
index 0000000..85f8373
--- /dev/null
+++ b/packages/core/test/exposure-policy.test.ts
@@ -0,0 +1,22 @@
+import { describe, expect, it } from "vitest";
+import { resolveExposure } from "../src/exposure/policy";
+
+describe("exposure policy", () => {
+  it("uses the global default when a Caplet has no override", () => {
+    expect(resolveExposure(undefined, "progressive_and_code_mode")).toEqual({
+      value: "progressive_and_code_mode",
+      direct: false,
+      progressive: true,
+      codeMode: true,
+    });
+  });
+
+  it("lets a Caplet override the global default", () => {
+    expect(resolveExposure("direct_and_code_mode", "progressive")).toEqual({
+      value: "direct_and_code_mode",
+      direct: true,
+      progressive: false,
+      codeMode: true,
+    });
+  });
+});
diff --git a/packages/core/test/native.test.ts b/packages/core/test/native.test.ts
index 4998968..71e3226 100644
--- a/packages/core/test/native.test.ts
+++ b/packages/core/test/native.test.ts
@@ -1,6 +1,7 @@
 import { mkdirSync, mkdtempSync, rmSync, writeFileSync } from "node:fs";
 import { tmpdir } from "node:os";
 import { join } from "node:path";
+import { fileURLToPath } from "node:url";
 import { afterEach, beforeEach, describe, expect, it } from "vitest";
 import {
   createNativeCapletsService,
@@ -9,6 +10,9 @@ import {
   nativeCapletsSystemGuidance,
 } from "../src/native";
 
+const fixturesDir = fileURLToPath(new URL("fixtures", import.meta.url));
+const tsxImport = import.meta.resolve("tsx");
+
 describe("native Caplets service", () => {
   const dirs: string[] = [];
   const originalMode = process.env.CAPLETS_MODE;
@@ -96,6 +100,128 @@ describe("native Caplets service", () => {
     }
   });
 
+  it("lists direct native operation tools with the caplets double-underscore prefix", async () => {
+    const { dir, configPath, projectConfigPath } = tempConfig({
+      httpApis: {
+        status: {
+          name: "Status HTTP",
+          description: "Call status over HTTP.",
+          exposure: "direct",
+          baseUrl: "http://127.0.0.1:1",
+          auth: { type: "none" },
+          actions: {
+            ping: {
+              method: "GET",
+              path: "/ping",
+              description: "Ping the service.",
+              inputSchema: {
+                type: "object",
+                properties: { verbose: { type: "boolean" } },
+              },
+            },
+          },
+        },
+      },
+    });
+    dirs.push(dir);
+    const service = createNativeCapletsService({ configPath, projectConfigPath });
+
+    try {
+      expect(service.listTools()).toEqual([
+        expect.objectContaining({
+          caplet: "status__ping",
+          toolName: "caplets__status__ping",
+          title: "ping",
+          description: "Ping the service.",
+          inputSchema: {
+            type: "object",
+            properties: { verbose: { type: "boolean" } },
+          },
+        }),
+      ]);
+    } finally {
+      await service.close();
+    }
+  });
+
+  it("discovers direct MCP tools for native integrations during reload", async () => {
+    const fixture = join(fixturesDir, "stdio-server.ts");
+    const { dir, configPath, projectConfigPath } = tempConfig({
+      mcpServers: {
+        fixture: {
+          name: "Fixture MCP",
+          description: "Expose fixture MCP directly.",
+          exposure: "direct",
+          command: process.execPath,
+          args: ["--import", tsxImport, fixture],
+          toolCacheTtlMs: 30_000,
+        },
+      },
+    });
+    dirs.push(dir);
+    const service = createNativeCapletsService({ configPath, projectConfigPath, watch: false });
+
+    try {
+      await expect(service.reload()).resolves.toBe(true);
+      expect(service.listTools()).toEqual(
+        expect.arrayContaining([
+          expect.objectContaining({
+            caplet: "fixture__echo",
+            toolName: "caplets__fixture__echo",
+            title: "echo",
+            description: "Echo a message.",
+            inputSchema: expect.objectContaining({ type: "object" }),
+            outputSchema: expect.objectContaining({ type: "object" }),
+          }),
+          expect.objectContaining({
+            caplet: "fixture__list_resources",
+            toolName: "caplets__fixture__list_resources",
+          }),
+          expect.objectContaining({
+            caplet: "fixture__get_prompt",
+            toolName: "caplets__fixture__get_prompt",
+          }),
+        ]),
+      );
+
+      await expect(service.execute("fixture__echo", { message: "hello" })).resolves.toMatchObject({
+        structuredContent: { message: "hello" },
+        _meta: {
+          caplets: expect.objectContaining({
+            capletId: "fixture",
+            operation: "echo",
+            exposure: "direct",
+          }),
+        },
+      });
+    } finally {
+      await service.close();
+    }
+  });
+
+  it("lists Code Mode only when exposure includes Code Mode", async () => {
+    const { dir, configPath, projectConfigPath } = tempConfig({
+      httpApis: {
+        status: {
+          name: "Status HTTP",
+          description: "Call status over HTTP.",
+          exposure: "code_mode",
+          baseUrl: "http://127.0.0.1:1",
+          auth: { type: "none" },
+          actions: { ping: { method: "GET", path: "/ping" } },
+        },
+      },
+    });
+    dirs.push(dir);
+    const service = createNativeCapletsService({ configPath, projectConfigPath });
+
+    try {
+      expect(service.listTools().map((tool) => tool.toolName)).toEqual(["caplets_code_mode"]);
+    } finally {
+      await service.close();
+    }
+  });
+
   it("returns structured errors for unknown Caplets", async () => {
     const { dir, configPath, projectConfigPath } = tempConfig({
       mcpServers: {
diff --git a/packages/core/test/openapi.test.ts b/packages/core/test/openapi.test.ts
index 9ca95c3..e3ae56f 100644
--- a/packages/core/test/openapi.test.ts
+++ b/packages/core/test/openapi.test.ts
@@ -809,6 +809,9 @@ describe("native OpenAPI Caplets", () => {
         options: {
           defaultSearchLimit: 20,
           maxSearchLimit: 50,
+          exposure: "progressive_and_code_mode",
+          exposureDiscoveryTimeoutMs: 15000,
+          exposureDiscoveryConcurrency: 4,
           completion: {
             discoveryTimeoutMs: 750,
             overallTimeoutMs: 1500,
diff --git a/packages/core/test/package-boundaries.test.ts b/packages/core/test/package-boundaries.test.ts
index 3e22c9b..e9ba501 100644
--- a/packages/core/test/package-boundaries.test.ts
+++ b/packages/core/test/package-boundaries.test.ts
@@ -99,7 +99,10 @@ describe("package boundaries", () => {
     const dedicatedExports = [
       "./caplet-source",
       "./observed-output-shapes/pure",
+      "./project-binding",
+      "./redaction",
       "./runtime-plan",
+      "./stable-json",
     ] as const;
     const rootDefault = (corePackage.exports["."] as { default: string }).default;
 
diff --git a/packages/core/test/serve-session.test.ts b/packages/core/test/serve-session.test.ts
index 4657c0e..2f539e4 100644
--- a/packages/core/test/serve-session.test.ts
+++ b/packages/core/test/serve-session.test.ts
@@ -86,6 +86,51 @@ describe("CapletsMcpSession", () => {
     await session.close();
     await engine.close();
   });
+
+  it("registers direct operation tools without progressive wrapper or Code Mode", async () => {
+    const { dir, configPath, projectConfigPath } = tempConfig({
+      httpApis: {
+        status: {
+          name: "Status HTTP",
+          description: "Call status over HTTP.",
+          exposure: "direct",
+          baseUrl: "http://127.0.0.1:1",
+          auth: { type: "none" },
+          actions: {
+            ping: {
+              method: "GET",
+              path: "/ping",
+              description: "Ping the service.",
+              inputSchema: {
+                type: "object",
+                properties: { verbose: { type: "boolean" } },
+              },
+            },
+          },
+        },
+      },
+    });
+    dirs.push(dir);
+    const engine = new CapletsEngine({ configPath, projectConfigPath, watch: false });
+    const server = mockServer();
+    const session = new CapletsMcpSession(engine, { server });
+
+    await session.refreshExposure();
+
+    expect(session.registeredToolIds()).toEqual(["status__ping"]);
+    expect(server.registered.get("status")).toBeUndefined();
+    expect(server.registered.get("code_mode")).toBeUndefined();
+    expect(server.definitions.get("status__ping")).toMatchObject({
+      description: "Ping the service.",
+      inputSchema: {
+        type: "object",
+        properties: { verbose: { type: "boolean" } },
+      },
+    });
+
+    await session.close();
+    await engine.close();
+  });
 });
 
 function tempConfig(config: unknown): {
@@ -110,9 +155,11 @@ function writeConfig(path: string, config: unknown): void {
 
 function mockServer() {
   const registered = new Map<string, RegisteredTool>();
+  const definitions = new Map<string, Record<string, unknown>>();
   return {
     registered,
-    registerTool: vi.fn((name: string) => {
+    definitions,
+    registerTool: vi.fn((name: string, definition: Record<string, unknown>) => {
       const tool = {
         update: vi.fn(),
         remove: vi.fn(() => registered.delete(name)),
@@ -122,8 +169,11 @@ function mockServer() {
         handler: vi.fn(),
       } as unknown as RegisteredTool;
       registered.set(name, tool);
+      definitions.set(name, definition);
       return tool;
     }),
+    registerResource: vi.fn(),
+    registerPrompt: vi.fn(),
     connect: vi.fn(async () => {}),
     close: vi.fn(async () => {}),
   };
diff --git a/packages/core/test/shared-worker-safe-helpers.test.ts b/packages/core/test/shared-worker-safe-helpers.test.ts
new file mode 100644
index 0000000..ca72fe7
--- /dev/null
+++ b/packages/core/test/shared-worker-safe-helpers.test.ts
@@ -0,0 +1,41 @@
+import { describe, expect, it } from "vitest";
+import { isRuntimeResourceClassAllowed, resourceClassRank } from "../src/runtime-plan";
+
+describe("shared Worker-safe helpers", () => {
+  it("sorts object keys stably and omits undefined values", async () => {
+    const { stableJsonSha256Hex, stableJsonStringify, stableJsonValue } =
+      await import("../src/stable-json");
+
+    expect(stableJsonValue({ b: 2, a: undefined, c: { z: 1, y: 2 } })).toEqual({
+      b: 2,
+      c: { y: 2, z: 1 },
+    });
+    expect(stableJsonStringify({ b: 2, a: 1 })).toBe('{"a":1,"b":2}');
+    await expect(stableJsonSha256Hex({ b: 2, a: 1 })).resolves.toMatch(/^[0-9a-f]{64}$/u);
+  });
+
+  it("redacts shared secret keys and text patterns", async () => {
+    const { isSecretKey, redactSecretText, redactUnknownSecrets } =
+      await import("../src/redaction");
+
+    expect(isSecretKey("refresh_token")).toBe(true);
+    expect(redactSecretText("Authorization: Bearer secret-token-value").text).toBe(
+      "Authorization: Bearer [REDACTED]",
+    );
+    expect(
+      redactSecretText("stripe sk_live_123", { patterns: [/sk_(?:live|test)_[0-9A-Za-z._-]+/gu] })
+        .text,
+    ).toBe("stripe [REDACTED]");
+    expect(redactUnknownSecrets({ refreshToken: "abc", nested: ["Bearer abcdefgh"] })).toEqual({
+      refreshToken: "[REDACTED]",
+      nested: ["Bearer [REDACTED]"],
+    });
+  });
+
+  it("shares runtime resource class ordering", () => {
+    expect(resourceClassRank("small")).toBeLessThan(resourceClassRank("medium"));
+    expect(resourceClassRank("standard")).toBe(resourceClassRank("medium"));
+    expect(isRuntimeResourceClassAllowed("medium", "small")).toBe(false);
+    expect(isRuntimeResourceClassAllowed("standard", "medium")).toBe(true);
+  });
+});
diff --git a/packages/opencode/src/hooks.ts b/packages/opencode/src/hooks.ts
index ce0e1c2..89621aa 100644
--- a/packages/opencode/src/hooks.ts
+++ b/packages/opencode/src/hooks.ts
@@ -1,6 +1,10 @@
 import { tool, type Hooks } from "@opencode-ai/plugin";
 import { nativeCapletsSystemGuidance, type NativeCapletsService } from "@caplets/core/native";
-import { capletsOpenCodeArgs, capletsOpenCodeRunArgs } from "./schema";
+import {
+  capletsOpenCodeArgs,
+  capletsOpenCodeJsonSchemaArgs,
+  capletsOpenCodeRunArgs,
+} from "./schema";
 
 export async function createCapletsOpenCodeHooks(service: NativeCapletsService): Promise<Hooks> {
   const capletTools = service.listTools();
@@ -14,7 +18,9 @@ export async function createCapletsOpenCodeHooks(service: NativeCapletsService):
           description: caplet.description,
           args: caplet.codeModeRun
             ? capletsOpenCodeRunArgs()
-            : capletsOpenCodeArgs(caplet.operationNames ?? undefined),
+            : caplet.operationNames
+              ? capletsOpenCodeArgs(caplet.operationNames)
+              : capletsOpenCodeJsonSchemaArgs(caplet.inputSchema),
           async execute(args) {
             const result = await service.execute(caplet.caplet, args);
             return compactOpenCodeResult(result);
diff --git a/packages/opencode/src/schema.ts b/packages/opencode/src/schema.ts
index e98fe29..8c09859 100644
--- a/packages/opencode/src/schema.ts
+++ b/packages/opencode/src/schema.ts
@@ -38,3 +38,41 @@ export function capletsOpenCodeRunArgs() {
     timeoutMs: tool.schema.number().int().positive().optional(),
   };
 }
+
+export function capletsOpenCodeJsonSchemaArgs(schema: Record<string, unknown> | undefined) {
+  const properties =
+    schema &&
+    typeof schema.properties === "object" &&
+    schema.properties &&
+    !Array.isArray(schema.properties)
+      ? (schema.properties as Record<string, unknown>)
+      : {};
+  if (Object.keys(properties).length === 0) {
+    return {};
+  }
+  return Object.fromEntries(
+    Object.entries(properties).map(([key, value]) => [key, jsonSchemaPropertyToOpenCode(value)]),
+  );
+}
+
+function jsonSchemaPropertyToOpenCode(value: unknown) {
+  if (!value || typeof value !== "object" || Array.isArray(value)) return tool.schema.unknown();
+  const schema = value as Record<string, unknown>;
+  if (Array.isArray(schema.enum) && schema.enum.every((item) => typeof item === "string")) {
+    return tool.schema.enum(schema.enum as [string, ...string[]]);
+  }
+  if (schema.type === "string") return tool.schema.string().optional();
+  if (schema.type === "number" || schema.type === "integer") {
+    return tool.schema.number().int().positive().optional();
+  }
+  if (schema.type === "boolean" && "boolean" in tool.schema) {
+    return (tool.schema as typeof tool.schema & { boolean: () => unknown }).boolean();
+  }
+  if (schema.type === "object") {
+    return tool.schema.record(tool.schema.string(), tool.schema.unknown()).optional();
+  }
+  if (schema.type === "array") {
+    return tool.schema.array(tool.schema.unknown()).min(1).optional();
+  }
+  return tool.schema.unknown();
+}
diff --git a/packages/opencode/test/opencode.test.ts b/packages/opencode/test/opencode.test.ts
index cb78778..0d96b8a 100644
--- a/packages/opencode/test/opencode.test.ts
+++ b/packages/opencode/test/opencode.test.ts
@@ -9,6 +9,7 @@ vi.mock("@opencode-ai/plugin", () => ({
         optional: () => ({ type: "string", optional: true }),
         min: () => ({ type: "string" }),
       }),
+      boolean: () => ({ type: "boolean" }),
       number: () => ({
         int: () => ({ positive: () => ({ optional: () => ({ type: "number", optional: true }) }) }),
       }),
@@ -119,6 +120,39 @@ describe("@caplets/opencode", () => {
     expect(result).toContain("BigInt");
   });
 
+  it("uses direct native input schemas without progressive operation args", async () => {
+    const { createCapletsOpenCodeHooks } = await import("../src/hooks");
+    const service = {
+      listTools: () => [
+        {
+          caplet: "status__ping",
+          toolName: "caplets__status__ping",
+          title: "ping",
+          description: "Ping the service.",
+          promptGuidance: ["Use caplets__status__ping."],
+          inputSchema: {
+            type: "object",
+            properties: { verbose: { type: "boolean" } },
+          },
+        },
+      ],
+      execute: vi.fn(async () => ({ ok: true })),
+      reload: vi.fn(async () => true),
+      onToolsChanged: vi.fn(() => () => {}),
+      close: vi.fn(async () => {}),
+    };
+
+    const hooks = await createCapletsOpenCodeHooks(service);
+    const directTool = hooks.tool!.caplets__status__ping as {
+      args: Record<string, unknown>;
+      execute(args: unknown, context: unknown): Promise<string>;
+    };
+
+    expect(directTool.args).toEqual({ verbose: { type: "boolean" } });
+    await directTool.execute({ verbose: true }, {} as never);
+    expect(service.execute).toHaveBeenCalledWith("status__ping", { verbose: true });
+  });
+
   it("returns stable text when JSON.stringify returns undefined", async () => {
     const { createCapletsOpenCodeHooks } = await import("../src/hooks");
     const service = {
diff --git a/schemas/caplet.schema.json b/schemas/caplet.schema.json
index 36f73d7..7f21f86 100644
--- a/schemas/caplet.schema.json
+++ b/schemas/caplet.schema.json
@@ -29,6 +29,17 @@
         "maxLength": 80
       }
     },
+    "exposure": {
+      "type": "string",
+      "enum": [
+        "direct",
+        "progressive",
+        "code_mode",
+        "direct_and_code_mode",
+        "progressive_and_code_mode"
+      ],
+      "description": "How this Caplet is exposed to agents."
+    },
     "useWhen": {
       "description": "When agents should prefer this Caplet or configured action.",
       "type": "string",
diff --git a/schemas/caplets-config.schema.json b/schemas/caplets-config.schema.json
index 8f7bebe..90bd382 100644
--- a/schemas/caplets-config.schema.json
+++ b/schemas/caplets-config.schema.json
@@ -67,6 +67,42 @@
       },
       "additionalProperties": false
     },
+    "options": {
+      "default": {
+        "exposure": "progressive_and_code_mode",
+        "exposureDiscoveryTimeoutMs": 15000,
+        "exposureDiscoveryConcurrency": 4
+      },
+      "description": "Global Caplets runtime options.",
+      "type": "object",
+      "properties": {
+        "exposure": {
+          "default": "progressive_and_code_mode",
+          "type": "string",
+          "enum": [
+            "direct",
+            "progressive",
+            "code_mode",
+            "direct_and_code_mode",
+            "progressive_and_code_mode"
+          ],
+          "description": "How this Caplet is exposed to agents."
+        },
+        "exposureDiscoveryTimeoutMs": {
+          "default": 15000,
+          "type": "integer",
+          "exclusiveMinimum": 0,
+          "maximum": 9007199254740991
+        },
+        "exposureDiscoveryConcurrency": {
+          "default": 4,
+          "type": "integer",
+          "exclusiveMinimum": 0,
+          "maximum": 32
+        }
+      },
+      "additionalProperties": false
+    },
     "mcpServers": {
       "default": {},
       "description": "Downstream MCP servers keyed by stable server ID.",
@@ -301,6 +337,17 @@
               "maxLength": 80
             }
           },
+          "exposure": {
+            "type": "string",
+            "enum": [
+              "direct",
+              "progressive",
+              "code_mode",
+              "direct_and_code_mode",
+              "progressive_and_code_mode"
+            ],
+            "description": "How this Caplet is exposed to agents."
+          },
           "useWhen": {
             "description": "When agents should prefer this Caplet or configured action.",
             "type": "string",
@@ -706,6 +753,17 @@
               "maxLength": 80
             }
           },
+          "exposure": {
+            "type": "string",
+            "enum": [
+              "direct",
+              "progressive",
+              "code_mode",
+              "direct_and_code_mode",
+              "progressive_and_code_mode"
+            ],
+            "description": "How this Caplet is exposed to agents."
+          },
           "useWhen": {
             "description": "When agents should prefer this Caplet or configured action.",
             "type": "string",
@@ -1155,6 +1213,17 @@
               "maxLength": 80
             }
           },
+          "exposure": {
+            "type": "string",
+            "enum": [
+              "direct",
+              "progressive",
+              "code_mode",
+              "direct_and_code_mode",
+              "progressive_and_code_mode"
+            ],
+            "description": "How this Caplet is exposed to agents."
+          },
           "useWhen": {
             "description": "When agents should prefer this Caplet or configured action.",
             "type": "string",
@@ -1654,6 +1723,17 @@
               "maxLength": 80
             }
           },
+          "exposure": {
+            "type": "string",
+            "enum": [
+              "direct",
+              "progressive",
+              "code_mode",
+              "direct_and_code_mode",
+              "progressive_and_code_mode"
+            ],
+            "description": "How this Caplet is exposed to agents."
+          },
           "useWhen": {
             "description": "When agents should prefer this Caplet or configured action.",
             "type": "string",
@@ -2002,6 +2082,17 @@
               "maxLength": 80
             }
           },
+          "exposure": {
+            "type": "string",
+            "enum": [
+              "direct",
+              "progressive",
+              "code_mode",
+              "direct_and_code_mode",
+              "progressive_and_code_mode"
+            ],
+            "description": "How this Caplet is exposed to agents."
+          },
           "useWhen": {
             "description": "When agents should prefer this Caplet or configured action.",
             "type": "string",
@@ -2248,6 +2339,17 @@
               "maxLength": 80
             }
           },
+          "exposure": {
+            "type": "string",
+            "enum": [
+              "direct",
+              "progressive",
+              "code_mode",
+              "direct_and_code_mode",
+              "progressive_and_code_mode"
+            ],
+            "description": "How this Caplet is exposed to agents."
+          },
           "useWhen": {
             "description": "When agents should prefer this Caplet or configured action.",
             "type": "string",