temporalio · lex00 · Apr 13, 2026 · Apr 13, 2026 · Apr 13, 2026
@@ -0,0 +1,247 @@
+# @temporalio/tool-registry
+
+LLM tool-calling primitives for Temporal activities — define tools once, use with
+Anthropic or OpenAI.
+
+## Before you start
+
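+A Temporal Activity is a function that Temporal monitors and retries automatically on failure. An activity can record its progress by sending heartbeats, and the details of the last heartbeat are handed to the next retry attempt — that's the mechanism `agenticSession` uses to resume a crashed LLM conversation from its last checkpointed turn instead of starting over.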
+
+`runToolLoop` works standalone in any async function — no Temporal server needed. Add `agenticSession` only when you need crash-safe resume inside a Temporal activity.
+
+`agenticSession` requires a running Temporal worker — it reads and writes heartbeat state from the active activity context. Use `runToolLoop` standalone for scripts, one-off jobs, or any code that runs outside a Temporal worker.
+
+New to Temporal? → https://docs.temporal.io/develop
+
+## Install
+
+```bash
+npm install @temporalio/tool-registry @anthropic-ai/sdk   # Anthropic
+npm install @temporalio/tool-registry openai              # OpenAI
+```
+
+## Quickstart
+
+Tool definitions use [JSON Schema](https://json-schema.org/understanding-json-schema/) for `input_schema`. The quickstart uses a single string field; for richer schemas refer to the JSON Schema docs.
+
+```typescript
+import { ToolRegistry, runToolLoop } from '@temporalio/tool-registry';
+
+export async function analyzeCode(prompt: string): Promise<string[]> {
+  const results: string[] = [];
+  const tools = new ToolRegistry();
+
+  tools.define(
+    {
+      name: 'flag_issue',
+      description: 'Flag a problem found in the analysis',
+      input_schema: {
+        type: 'object',
+        properties: { description: { type: 'string' } },
+        required: ['description'],
+      },
+    },
+    (inp: Record<string, unknown>) => {
+      results.push(inp['description'] as string);
+      return 'recorded'; // this string is sent back to the LLM as the tool result
+    }
+  );
+
+  await runToolLoop({
+    provider: 'anthropic', // reads ANTHROPIC_API_KEY from environment; or use 'openai'
+    system: 'You are a code reviewer. Call flag_issue for each problem you find.',
+    prompt,
+    tools,
+  });
+
+  return results;
+}
+```
+
+## Feature matrix
+
+| Feature | `@temporalio/tool-registry` | `@temporalio/ai-sdk` |
+|---|---|---|
+| Anthropic (claude-*) | ✓ | ✗ |
+| OpenAI (gpt-*) | ✓ | ✓ (via AI SDK) |
+| MCP tool wrapping | ✓ | ✓ |
+| Crash-safe heartbeat resume | ✓ (via `agenticSession`) | ✗ |
+| AI SDK provider abstraction | ✗ | ✓ |
+
+Use `@temporalio/ai-sdk` when you are already using the Vercel AI SDK and want each model call to be a separately observable, retryable Temporal activity.
+Use `@temporalio/tool-registry` for direct Anthropic support, crash-safe sessions that survive server-side session expiry, or when you need the same implementation pattern across all six Temporal SDKs (Go, Java, Ruby, .NET have no framework-level integrations).
+
+## Sandbox configuration
+
+You need this if you register both workflows and activities on the same `Worker` instance. If your activities run on a dedicated worker (no `workflowsPath`), skip this section.
+
+The Temporal workflow bundler excludes third-party packages. Use `ToolRegistryPlugin`
+so that activities using LLM libraries can run on the same worker as bundled workflows:
+
+```typescript
+import { Worker } from '@temporalio/worker';
+import { ToolRegistryPlugin } from '@temporalio/tool-registry';
+
+const worker = await Worker.create({
+  connection,
+  namespace: 'default',
+  taskQueue: 'my-queue',
+  plugins: [new ToolRegistryPlugin({ provider: 'anthropic' })],
+  workflowsPath: require.resolve('./workflows'),
+  activities,
+});
+```
+
+## MCP integration
+
+MCP tool wrapping is supported via `ToolRegistry.fromMcpTools()`. See the MCP integration guide for a complete example including server setup.
+
+## Selecting a model
+
+The default model is `"claude-sonnet-4-6"` (Anthropic) or `"gpt-4o"` (OpenAI). Pass `model` to `runToolLoop`:
+
+```typescript
+await runToolLoop({
+  provider: 'anthropic',
+  model: 'claude-3-5-sonnet-20241022',
+  system: '...',
+  prompt,
+  tools,
+});
+```
+
+Model IDs are defined by the provider — see Anthropic or OpenAI docs for current names.
+
+### OpenAI
+
+```typescript
+await runToolLoop({
+  provider: 'openai', // reads OPENAI_API_KEY from environment
+  system: '...',
+  prompt,
+  tools,
+});
+```
+
+## Crash-safe agentic sessions
+
+For multi-turn LLM conversations that must survive activity retries, use
+`agenticSession`. It saves conversation history via `activity.heartbeat()` on every
+turn and restores it automatically on retry.
+
+```typescript
+import { ToolRegistry, agenticSession } from '@temporalio/tool-registry';
+
+export async function longAnalysis(prompt: string): Promise<object[]> {
+  let results: object[] = [];
+  await agenticSession(async (session) => {
+    const tools = new ToolRegistry();
+    tools.define(
+      { name: 'flag', description: '...', input_schema: { type: 'object' } },
+      (inp: Record<string, unknown>) => {
+        session.results.push(inp);
+        return 'ok'; // this string is sent back to the LLM as the tool result
+      }
+    );
+    await session.runToolLoop({
+      registry: tools,
+      provider: 'anthropic', // reads ANTHROPIC_API_KEY from environment
+      system: '...',
+      prompt,
+    });
+    results = session.results; // capture after loop completes
+  });
+  return results;
+}
+```
+
+## Testing without an API key
+
+Use `MockProvider` and `ResponseBuilder` to test tool-calling logic without hitting a live API:
+
+```typescript
+import assert from 'node:assert';
+import { MockProvider, ResponseBuilder, ToolRegistry } from '@temporalio/tool-registry';
+
+const tools = new ToolRegistry();
+tools.define(
+  { name: 'flag', description: 'd', input_schema: { type: 'object' } },
+  (inp: Record<string, unknown>) => 'ok' // this string is sent back to the LLM as the tool result
+);
+
+const provider = new MockProvider([
+  ResponseBuilder.toolCall('flag', { description: 'stale API' }),
+  ResponseBuilder.done('done'),
+]);
+const messages = [{ role: 'user', content: 'analyze' }];
+await provider.runLoop(messages, tools);
+assert(messages.length > 2);
+```
+
+## Integration testing with real providers
+
+To run the integration tests against live Anthropic and OpenAI APIs:
+
+```bash
+RUN_INTEGRATION_TESTS=1 \
+  ANTHROPIC_API_KEY=sk-ant-... \
+  OPENAI_API_KEY=sk-proj-... \
+  npm test
+```
+
+Tests skip automatically when `RUN_INTEGRATION_TESTS` is unset. Real API calls
+incur billing — expect a few cents per full test run.
+
+## Storing application results
+
+`session.results` accumulates application-level results during the tool loop.
+Elements are serialized to JSON inside each heartbeat checkpoint — they must be
+plain objects with JSON-serializable values. A non-serializable value causes a
+non-retryable `ApplicationFailure` to be thrown at heartbeat time rather than
+silently losing data on the next retry.
+
+### Storing typed results
+
+Convert your domain type to a plain object at the tool-call site and back after
+the session:
+
+```typescript
+interface Finding { type: string; file: string; }
+
+// Inside tool handler:
+session.results.push({ type: 'smell', file: 'foo.ts' } satisfies Finding);
+
+// After session:
+const findings = session.results as Finding[];
+```
+
+## Per-turn LLM timeout
+
+Individual LLM calls inside the tool loop are unbounded by default. A hung HTTP
+connection holds the activity open until the activity's own timeout
+(`startToCloseTimeout` or `scheduleToCloseTimeout`) fires — potentially many
+minutes. Set a per-turn timeout on the provider client:
+
+```typescript
+import Anthropic from '@anthropic-ai/sdk';
+const client = new Anthropic({ apiKey: '...', timeout: 30_000 }); // ms
+await session.runToolLoop({ ..., client });
+```
+
+Recommended timeouts:
+
+| Model type | Recommended |
+|---|---|
+| Standard (Claude 3.x, GPT-4o) | 30 s |
+| Reasoning (o1, o3, extended thinking) | 300 s |
+
+### Activity-level timeout
+
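+Set `scheduleToCloseTimeout` in the activity options passed to `proxyActivities` in your workflow code to bound the entire conversation:
+
+```typescript
+import { proxyActivities } from '@temporalio/workflow';
+import type * as activities from './activities';
+
+const { longAnalysis } = proxyActivities<typeof activities>({
+  scheduleToCloseTimeout: '10m',
+});
+
+await longAnalysis(prompt);
+```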
+
+The per-turn client timeout and `scheduleToCloseTimeout` are complementary:
+- Per-turn timeout fires if one LLM call hangs (protects against a single stuck turn)
+- `scheduleToCloseTimeout` bounds the entire conversation including all retries (protects against runaway multi-turn loops)
@@ -0,0 +1,66 @@
+{
+  "name": "@temporalio/tool-registry",
+  "version": "1.15.0",
+  "description": "LLM tool-calling primitives for Temporal activities — define tools once, use with Anthropic or OpenAI",
+  "main": "lib/index.js",
+  "types": "./lib/index.d.ts",
+  "keywords": [
+    "temporal",
+    "workflow",
+    "llm",
+    "anthropic",
+    "openai",
+    "tool-use",
+    "agentic"
+  ],
+  "author": "Temporal Technologies Inc. <sdk@temporal.io>",
+  "license": "MIT",
+  "dependencies": {
+    "@temporalio/activity": "workspace:*",
+    "@temporalio/common": "workspace:*",
+    "@temporalio/plugin": "workspace:*"
+  },
+  "peerDependencies": {
+    "@anthropic-ai/sdk": ">=0.40.0",
+    "openai": ">=4.0.0"
+  },
+  "peerDependenciesMeta": {
+    "@anthropic-ai/sdk": {
+      "optional": true
+    },
+    "openai": {
+      "optional": true
+    }
+  },
+  "devDependencies": {
+    "@anthropic-ai/sdk": "^0.40.0",
+    "@types/mocha": "^10.0.10",
+    "@types/node": "^20.10.8",
+    "mocha": "^10.0.0",
+    "ts-node": "^10.9.0",
+    "typescript": "^5.0.0"
+  },
+  "scripts": {
+    "build": "tsc --build",
+    "test": "TS_NODE_PROJECT=tsconfig.test.json mocha --require ts-node/register --extension ts 'src/**/*.test.ts'"
+  },
+  "engines": {
+    "node": ">= 20.0.0"
+  },
+  "bugs": {
+    "url": "https://github.com/temporalio/sdk-typescript/issues"
+  },
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/temporalio/sdk-typescript.git",
+    "directory": "packages/tool-registry"
+  },
+  "homepage": "https://github.com/temporalio/sdk-typescript/tree/main/packages/tool-registry",
+  "publishConfig": {
+    "access": "public"
+  },
+  "files": [
+    "src",
+    "lib"
+  ]
+}
@@ -0,0 +1,43 @@
+/**
+ * @temporalio/tool-registry — LLM tool-calling primitives for Temporal activities.
+ *
+ * Define tools once with {@link ToolRegistry}, export provider-specific schemas
+ * for Anthropic or OpenAI, and run complete multi-turn tool-calling conversations
+ * with {@link runToolLoop}.
+ *
+ * For crash-safe multi-turn sessions that survive activity retries, use
+ * {@link agenticSession} (exported from `./session`).
+ *
+ * @example
+ * ```typescript
+ * import { ToolRegistry, runToolLoop } from '@temporalio/tool-registry';
+ *
+ * const tools = new ToolRegistry();
+ * const issues: string[] = [];
+ *
+ * tools.define(
+ *   { name: 'flag', description: 'Flag an issue', input_schema: { ... } },
+ *   (inp) => { issues.push(inp.description as string); return 'recorded'; }
+ * );
+ *
+ * await runToolLoop({
+ *   provider: 'anthropic',
+ *   system: 'You are a code reviewer...',
+ *   prompt: 'Review this code...',
+ *   tools,
+ * });
+ * ```
+ */
+
+export { ToolRegistry } from './registry';
+export type { ToolDefinition, ToolHandler, McpToolDescriptor } from './registry';
+export { AnthropicProvider, OpenAIProvider, runToolLoop } from './providers';
+export type { Message, RunToolLoopOptions as ProviderRunLoopOptions } from './providers';
+export { ToolRegistryPlugin } from './plugin';
+export type { ToolRegistryPluginOptions } from './plugin';
+export { registryFromMcpTools } from './mcp';
+export type { McpTool } from './mcp';
+export { AgenticSession, agenticSession } from './session';
+export type { RunToolLoopOptions } from './session';
+export { ResponseBuilder, MockProvider, FakeToolRegistry, MockAgenticSession, CrashAfterTurns } from './testing';
+export type { MockResponse } from './testing';
@@ -0,0 +1,36 @@
+/**
+ * MCP (Model Context Protocol) integration for ToolRegistry.
+ *
+ * Provides utilities for wrapping MCP tool definitions in a {@link ToolRegistry},
+ * enabling use of MCP-sourced tools with Anthropic or OpenAI providers.
+ */
+
+import { ToolRegistry } from './registry';
+
+/**
+ * MCP-compatible tool descriptor, the element type accepted by
+ * {@link registryFromMcpTools}.
+ *
+ * - `name` — tool identifier; the only required field.
+ * - `description` — optional free-text description of the tool.
+ * - `inputSchema` — optional schema object for the tool's input.
+ *   NOTE(review): presumably a JSON Schema document, as in the MCP tool
+ *   listing format — confirm against `ToolRegistry.fromMcpTools`.
+ */
+export interface McpTool {
+  name: string;
+  description?: string;
+  inputSchema?: Record<string, unknown>;
+}
+
+/**
+ * Build a {@link ToolRegistry} from a list of MCP tool descriptors.
+ *
+ * This is a thin convenience wrapper: it forwards `tools` unchanged to
+ * `ToolRegistry.fromMcpTools` and returns whatever that call returns.
+ *
+ * Each MCP tool is registered with a no-op handler (returns empty string).
+ * Replace handlers by calling {@link ToolRegistry.define} with the same name
+ * after construction.
+ * NOTE(review): the no-op handler and the override-by-name behavior are
+ * implemented in `./registry`, not in this file — confirm there.
+ *
+ * @param tools - MCP tool descriptors to register.
+ * @returns The registry produced by `ToolRegistry.fromMcpTools(tools)`.
+ *
+ * @example
+ * ```typescript
+ * const registry = registryFromMcpTools(mcpServer.listTools());
+ * // Override the handler for a specific tool:
+ * registry.define(
+ *   { name: 'read_file', description: '...', input_schema: { ... } },
+ *   (inp) => mcpServer.callTool('read_file', inp)
+ * );
+ * ```
+ */
+export function registryFromMcpTools(tools: McpTool[]): ToolRegistry {
+  return ToolRegistry.fromMcpTools(tools);
+}