diff --git a/.gitignore b/.gitignore index 3cf0bc4..cdf8daf 100644 --- a/.gitignore +++ b/.gitignore @@ -8,4 +8,5 @@ __pycache__/ *.pb.go *_pb2.py .superpowers/ +docs/superpowers/ sdk/rust/target/ diff --git a/LICENSE b/LICENSE new file mode 100644 index 0000000..935d8e3 --- /dev/null +++ b/LICENSE @@ -0,0 +1,21 @@ +MIT License + +Copyright (c) 2026 Max Silverblatt + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. diff --git a/README.md b/README.md index 2d53df2..0d0f1ec 100644 --- a/README.md +++ b/README.md @@ -21,6 +21,8 @@ protomcp is a language-agnostic MCP runtime. Write your server logic in Python, pmcp uses the [official MCP Go SDK](https://github.com/modelcontextprotocol/go-sdk) for full spec compliance. Your code registers tools, resources, and prompts through a simple protobuf protocol over a unix socket. pmcp handles everything else — protocol negotiation, transport, pagination, session management, and hot reload. 
+The unix socket + protobuf layer adds ~0.5ms of overhead per tool call. + ## Quick Start ### Install @@ -29,6 +31,22 @@ pmcp uses the [official MCP Go SDK](https://github.com/modelcontextprotocol/go-s brew install msilverblatt/tap/protomcp ``` +### Install SDK + +```sh +# Python +pip install protomcp + +# TypeScript +npm install protomcp + +# Go +go get github.com/msilverblatt/protomcp/sdk/go/protomcp + +# Rust +# Add to Cargo.toml: protomcp = "0.1" +``` + ### Python ```python @@ -346,7 +364,7 @@ See the [full documentation](https://msilverblatt.github.io/protomcp/) for detai protomcp is not a replacement for the official MCP SDKs — it's built on top of the [official Go SDK](https://github.com/modelcontextprotocol/go-sdk). Use protomcp when: -- **You want one server in multiple languages** — write tools in Python, prompts in TypeScript, resources in Go, all served by a single MCP server +- **You want the same API across languages** — switch between Python, TypeScript, Go, and Rust with identical concepts and patterns - **You want zero-config hot reload** — save a file, everything reloads instantly - **You don't want to learn MCP internals** — no JSON-RPC, no transport wiring, no session management - **You want a single binary** — `pmcp` is a single Go binary, no runtime dependencies for the server itself diff --git a/docs/superpowers/plans/2026-03-12-protomcp-v1.1.md b/docs/superpowers/plans/2026-03-12-protomcp-v1.1.md deleted file mode 100644 index a5d1c0a..0000000 --- a/docs/superpowers/plans/2026-03-12-protomcp-v1.1.md +++ /dev/null @@ -1,2751 +0,0 @@ -# protomcp v1.1 Implementation Plan - -> **For agentic workers:** REQUIRED: Use superpowers:subagent-driven-development (if subagents available) or superpowers:executing-plans to implement this plan. Steps use checkbox (`- [ ]`) syntax for tracking. - -**Goal:** Expand protomcp with Go and Rust SDKs, custom and auth middleware, build-time validation, CI/publishing pipelines, and comprehensive documentation. 
- -**Architecture:** Builds on v1.0's Go binary + protobuf-over-unix-socket architecture. Adds two new SDK implementations (Go, Rust) following the same module structure as Python/TypeScript SDKs. Extends the protobuf protocol with four new middleware messages (field numbers 24-27). Adds a `validate` subcommand and `--auth` flag to the CLI. CI/CD via GitHub Actions. - -**Tech Stack:** Go 1.25+, Rust (stable, prost, tokio), Protocol Buffers 3, GitHub Actions, GoReleaser - -**Spec:** `docs/superpowers/specs/2026-03-12-protomcp-v1.1-design.md` - ---- - -## File Structure - -``` -# New files -sdk/go/ -├── go.mod -├── protomcp/ -│ ├── tool.go # Tool() registration with functional options -│ ├── tool_test.go -│ ├── result.go # ToolResult struct -│ ├── result_test.go -│ ├── context.go # ToolContext (progress, cancellation) -│ ├── context_test.go -│ ├── manager.go # ToolManager for dynamic enable/disable -│ ├── manager_test.go -│ ├── log.go # Server logging (8 levels) -│ ├── log_test.go -│ ├── transport.go # Unix socket + envelope framing -│ ├── transport_test.go -│ └── runner.go # Main loop: connect, handshake, dispatch -│ └── runner_test.go - -sdk/rust/ -├── Cargo.toml -├── build.rs # prost-build for protobuf generation -├── src/ -│ ├── lib.rs # Public API exports -│ ├── tool.rs # Builder pattern registration -│ ├── result.rs # ToolResult struct -│ ├── context.rs # ToolContext (progress, cancellation) -│ ├── manager.rs # ToolManager for dynamic enable/disable -│ ├── log.rs # Server logging -│ ├── transport.rs # Unix socket + envelope framing -│ └── runner.rs # Main async loop -├── tests/ -│ ├── tool_test.rs -│ ├── result_test.rs -│ ├── transport_test.rs -│ └── integration_test.rs - -internal/middleware/ -├── auth.go # NEW: built-in auth middleware -├── auth_test.go # NEW -├── custom.go # NEW: user-registered middleware dispatch -├── custom_test.go # NEW - -internal/validate/ -├── validate.go # NEW: tool definition validation -├── validate_test.go # NEW - 
-.github/workflows/ -├── ci.yml # NEW: CI pipeline -├── release.yml # NEW: release/publishing pipeline - -examples/go/ -├── basic.go -├── real_world.go -├── full_showcase.go - -examples/rust/ -├── basic/Cargo.toml + src/main.rs -├── real_world/Cargo.toml + src/main.rs -├── full_showcase/Cargo.toml + src/main.rs - -docs/src/content/docs/guides/ -├── writing-tools-go.mdx # NEW -├── writing-tools-rust.mdx # NEW -├── middleware.mdx # NEW -├── auth.mdx # NEW -├── writing-a-language-library.mdx # NEW - -# Modified files -proto/protomcp.proto # Add middleware messages (fields 24-27) -gen/proto/protomcp/protomcp.pb.go # Regenerated -sdk/python/gen/protomcp_pb2.py # Regenerated -sdk/typescript/gen/ # Regenerated -cmd/protomcp/main.go # Add validate command, --auth flag -internal/config/config.go # Add Auth, Strict, Format fields; validate command; fix Rust runtime -internal/config/config_test.go # Tests for new fields -internal/process/manager.go # Extended handshake for middleware registration -internal/process/manager_test.go # Tests for extended handshake -internal/middleware/chain.go # Priority-based ordering with custom middleware -sdk/python/src/protomcp/runner.py # Middleware registration support -sdk/python/src/protomcp/__init__.py # Export middleware -sdk/typescript/src/runner.ts # Middleware registration support -sdk/typescript/src/index.ts # Export middleware -README.md # Badges, Go/Rust examples, features -docs/src/content/docs/index.mdx # Add Go/Rust cards -docs/src/content/docs/getting-started/quick-start.mdx # Go/Rust snippets -docs/src/content/docs/getting-started/installation.mdx # Go/Rust install -docs/src/content/docs/reference/cli.mdx # validate, --auth -``` - ---- - -## Chunk 1: Protobuf + Config + Rust Runtime Fix - -### Task 1: Add middleware messages to protobuf - -**Files:** -- Modify: `proto/protomcp.proto` - -- [ ] **Step 1: Write the new message types and envelope fields** - -Add after the `TaskCancelRequest` message (line 170) in 
`proto/protomcp.proto`:
-
-```protobuf
-// --- Middleware ---
-
-message RegisterMiddlewareRequest {
-  string name = 1;
-  int32 priority = 2;  // lower runs first
-}
-
-message RegisterMiddlewareResponse {
-  bool success = 1;
-}
-
-message MiddlewareInterceptRequest {
-  string middleware_name = 1;
-  string phase = 2;        // "before" or "after"
-  string tool_name = 3;
-  string arguments_json = 4;
-  string result_json = 5;  // empty for "before" phase
-  bool is_error = 6;       // only set in "after" phase
-}
-
-message MiddlewareInterceptResponse {
-  string arguments_json = 1;  // potentially modified (before phase)
-  string result_json = 2;     // potentially modified (after phase)
-  bool reject = 3;            // if true, abort the call
-  string reject_reason = 4;
-}
-```
-
-Add these fields to the `Envelope.oneof msg` block (after `task_cancel = 23`):
-
-```protobuf
-    RegisterMiddlewareRequest register_middleware = 24;
-    RegisterMiddlewareResponse register_middleware_response = 25;
-    MiddlewareInterceptRequest middleware_intercept = 26;
-    MiddlewareInterceptResponse middleware_intercept_response = 27;
-```
-
-- [ ] **Step 2: Regenerate all protobuf code**
-
-Run: `make proto`
-Expected: `gen/proto/protomcp/protomcp.pb.go`, `sdk/python/gen/protomcp_pb2.py`, and `sdk/typescript/gen/` are all updated with the new middleware message types. The Makefile handles Go, Python, and TypeScript generation in one command.
-
-- [ ] **Step 3: Verify all existing tests still pass**
-
-Run: `go test ./... && cd sdk/python && python -m pytest && cd ../typescript && npx vitest run`
-Expected: All tests pass (no regressions from protobuf changes).
-
-- [ ] **Step 4: Commit**
-
-```bash
-git add proto/protomcp.proto gen/ sdk/python/gen/ sdk/typescript/gen/
-git commit -m "proto: add middleware messages (fields 24-27)"
-```
-
----
-
-### Task 2: Fix Rust runtime detection bug + add validate command to config
-
-**Files:**
-- Modify: `internal/config/config.go`
-- Modify: `internal/config/config_test.go`
-
-- [ ] **Step 1: Write failing test for Rust runtime fix**
-
-Add to `config_test.go`:
-
-```go
-func TestRuntimeCommandRust(t *testing.T) {
-    cmd, args := config.RuntimeCommand("tools.rs")
-    if cmd != "cargo" {
-        t.Errorf("cmd = %q, want %q", cmd, "cargo")
-    }
-    // cargo run does NOT take a file argument; it runs the package
-    expected := []string{"run", "--manifest-path", "Cargo.toml"}
-    if !reflect.DeepEqual(args, expected) {
-        t.Errorf("args = %v, want %v", args, expected)
-    }
-}
-```
-
-- [ ] **Step 2: Run test to verify it fails**
-
-Run: `go test ./internal/config/ -run TestRuntimeCommandRust -v`
-Expected: FAIL — currently returns `["run", "tools.rs"]`.
-
-- [ ] **Step 3: Fix RuntimeCommand for .rs files**
-
-In `config.go`, change the `.rs` case in `RuntimeCommand`:
-
-```go
-    case ".rs":
-        dir := filepath.Dir(file)
-        manifestPath := filepath.Join(dir, "Cargo.toml")
-        return "cargo", []string{"run", "--manifest-path", manifestPath}
-```
-
-- [ ] **Step 4: Run test to verify it passes**
-
-Run: `go test ./internal/config/ -run TestRuntimeCommandRust -v`
-Expected: PASS.
-
-- [ ] **Step 5: Update existing Rust test case in TestRuntimeCommand table**
-
-Change the `server.rs` entry to expect the new args format:
-
-```go
-    {"server.rs", "cargo", []string{"run", "--manifest-path", "Cargo.toml"}},
-```
-
-- [ ] **Step 6: Run all config tests**
-
-Run: `go test ./internal/config/ -v`
-Expected: All pass.
- -- [ ] **Step 7: Write failing test for validate command parsing** - -Add to `config_test.go`: - -```go -func TestParseValidateCommand(t *testing.T) { - cfg, err := config.Parse([]string{"validate", "tools.py"}) - if err != nil { - t.Fatalf("Parse failed: %v", err) - } - if cfg.Command != "validate" { - t.Errorf("Command = %q, want %q", cfg.Command, "validate") - } - if cfg.File != "tools.py" { - t.Errorf("File = %q, want %q", cfg.File, "tools.py") - } -} - -func TestParseValidateWithStrict(t *testing.T) { - cfg, err := config.Parse([]string{"validate", "tools.py", "--strict"}) - if err != nil { - t.Fatalf("Parse failed: %v", err) - } - if !cfg.Strict { - t.Error("Strict should be true") - } -} - -func TestParseValidateWithFormatJSON(t *testing.T) { - cfg, err := config.Parse([]string{"validate", "tools.py", "--format", "json"}) - if err != nil { - t.Fatalf("Parse failed: %v", err) - } - if cfg.Format != "json" { - t.Errorf("Format = %q, want %q", cfg.Format, "json") - } -} - -func TestParseAuthFlag(t *testing.T) { - cfg, err := config.Parse([]string{"dev", "tools.py", "--auth", "token:MY_TOKEN"}) - if err != nil { - t.Fatalf("Parse failed: %v", err) - } - if len(cfg.Auth) != 1 || cfg.Auth[0] != "token:MY_TOKEN" { - t.Errorf("Auth = %v, want [\"token:MY_TOKEN\"]", cfg.Auth) - } -} - -func TestParseMultipleAuthFlags(t *testing.T) { - cfg, err := config.Parse([]string{"dev", "tools.py", "--auth", "token:T1", "--auth", "apikey:K1"}) - if err != nil { - t.Fatalf("Parse failed: %v", err) - } - if len(cfg.Auth) != 2 { - t.Errorf("Auth length = %d, want 2", len(cfg.Auth)) - } -} - -func TestParseAuthMalformed(t *testing.T) { - _, err := config.Parse([]string{"dev", "tools.py", "--auth", "invalid"}) - if err == nil { - t.Error("expected error for malformed --auth value") - } -} - -func TestParseAuthUnknownScheme(t *testing.T) { - _, err := config.Parse([]string{"dev", "tools.py", "--auth", "oauth:FOO"}) - if err == nil { - t.Error("expected error for unknown auth 
scheme") - } -} -``` - -- [ ] **Step 8: Run tests to verify they fail** - -Run: `go test ./internal/config/ -run TestParseValidate -v` -Expected: FAIL — "validate" not recognized as valid command. - -- [ ] **Step 9: Update Config struct and Parse function** - -In `config.go`, add fields to `Config`: - -```go -type Config struct { - Command string - File string - Transport string - HotReloadImmediate bool - CallTimeout time.Duration - LogLevel string - SocketPath string - Runtime string - Host string - Port int - Auth []string - Strict bool - Format string -} -``` - -Update `Parse`: -- Change command validation from `cmd != "dev" && cmd != "run"` to `cmd != "dev" && cmd != "run" && cmd != "validate"` -- Add `--auth` flag handling (repeatable, validates format `scheme:value` where scheme is `token` or `apikey`): - -```go - case "--auth": - i++ - if i >= len(args) { - return nil, fmt.Errorf("--auth requires a value") - } - authVal := args[i] - parts := strings.SplitN(authVal, ":", 2) - if len(parts) != 2 || parts[1] == "" { - return nil, fmt.Errorf("--auth value must be scheme:ENV_VAR (got %q)", authVal) - } - scheme := parts[0] - if scheme != "token" && scheme != "apikey" { - return nil, fmt.Errorf("unknown auth scheme %q: must be 'token' or 'apikey'", scheme) - } - cfg.Auth = append(cfg.Auth, authVal) - case "--strict": - cfg.Strict = true - case "--format": - i++ - if i >= len(args) { - return nil, fmt.Errorf("--format requires a value") - } - cfg.Format = args[i] -``` - -Add `"strings"` to imports. - -- [ ] **Step 10: Run all config tests** - -Run: `go test ./internal/config/ -v` -Expected: All pass. - -- [ ] **Step 11: Verify full build** - -Run: `go build ./...` -Expected: Clean build. 
- -- [ ] **Step 12: Commit** - -```bash -git add internal/config/config.go internal/config/config_test.go -git commit -m "config: add validate command, --auth flag, fix Rust runtime detection" -``` - ---- - -### Task 3: Build-time validation - -**Files:** -- Create: `internal/validate/validate.go` -- Create: `internal/validate/validate_test.go` - -- [ ] **Step 1: Write failing tests for validation logic** - -Create `internal/validate/validate_test.go`: - -```go -package validate_test - -import ( - "testing" - - pb "github.com/msilverblatt/protomcp/gen/proto/protomcp" - "github.com/msilverblatt/protomcp/internal/validate" -) - -func TestValidateValidTools(t *testing.T) { - tools := []*pb.ToolDefinition{ - {Name: "add", Description: "Add two numbers", InputSchemaJson: `{"type":"object","properties":{"a":{"type":"integer"}}}`}, - {Name: "multiply", Description: "Multiply two numbers", InputSchemaJson: `{"type":"object","properties":{"b":{"type":"integer"}}}`}, - } - result := validate.Tools(tools, false) - if !result.Pass { - t.Errorf("expected pass, got errors: %v", result.Errors) - } - if len(result.Tools) != 2 { - t.Errorf("expected 2 tools, got %d", len(result.Tools)) - } -} - -func TestValidateEmptyName(t *testing.T) { - tools := []*pb.ToolDefinition{ - {Name: "", Description: "Something", InputSchemaJson: `{"type":"object"}`}, - } - result := validate.Tools(tools, false) - if result.Pass { - t.Error("expected fail for empty name") - } -} - -func TestValidateInvalidNameChars(t *testing.T) { - tools := []*pb.ToolDefinition{ - {Name: "my-tool", Description: "Has hyphens", InputSchemaJson: `{"type":"object"}`}, - } - result := validate.Tools(tools, false) - if result.Pass { - t.Error("expected fail for invalid name characters") - } -} - -func TestValidateDuplicateNames(t *testing.T) { - tools := []*pb.ToolDefinition{ - {Name: "add", Description: "First", InputSchemaJson: `{"type":"object"}`}, - {Name: "add", Description: "Second", InputSchemaJson: 
`{"type":"object"}`}, - } - result := validate.Tools(tools, false) - if result.Pass { - t.Error("expected fail for duplicate names") - } -} - -func TestValidateEmptyDescription(t *testing.T) { - tools := []*pb.ToolDefinition{ - {Name: "add", Description: "", InputSchemaJson: `{"type":"object"}`}, - } - result := validate.Tools(tools, false) - if result.Pass { - t.Error("expected fail for empty description") - } -} - -func TestValidateInvalidSchema(t *testing.T) { - tools := []*pb.ToolDefinition{ - {Name: "add", Description: "Add", InputSchemaJson: `not json`}, - } - result := validate.Tools(tools, false) - if result.Pass { - t.Error("expected fail for invalid JSON schema") - } -} - -func TestValidateStrictShortDescription(t *testing.T) { - tools := []*pb.ToolDefinition{ - {Name: "add", Description: "Add", InputSchemaJson: `{"type":"object","properties":{"a":{"type":"integer"}}}`}, - } - result := validate.Tools(tools, true) - if result.Pass { - t.Error("expected fail in strict mode for short description") - } -} - -func TestValidateStrictGenericName(t *testing.T) { - tools := []*pb.ToolDefinition{ - {Name: "test", Description: "A test tool for testing", InputSchemaJson: `{"type":"object","properties":{"a":{"type":"integer"}}}`}, - } - result := validate.Tools(tools, true) - if result.Pass { - t.Error("expected fail in strict mode for generic name") - } -} - -func TestResultFormatText(t *testing.T) { - tools := []*pb.ToolDefinition{ - {Name: "add", Description: "Add two numbers", InputSchemaJson: `{"type":"object"}`}, - } - result := validate.Tools(tools, false) - output := result.FormatText() - if output == "" { - t.Error("expected non-empty text output") - } -} - -func TestResultFormatJSON(t *testing.T) { - tools := []*pb.ToolDefinition{ - {Name: "add", Description: "Add two numbers", InputSchemaJson: `{"type":"object"}`}, - } - result := validate.Tools(tools, false) - output := result.FormatJSON() - if output == "" { - t.Error("expected non-empty JSON output") - 
} -} -``` - -- [ ] **Step 2: Run tests to verify they fail** - -Run: `go test ./internal/validate/ -v` -Expected: FAIL — package doesn't exist yet. - -- [ ] **Step 3: Implement validation logic** - -Create `internal/validate/validate.go`: - -```go -package validate - -import ( - "encoding/json" - "fmt" - "regexp" - "strings" - - pb "github.com/msilverblatt/protomcp/gen/proto/protomcp" -) - -var validName = regexp.MustCompile(`^[a-zA-Z_][a-zA-Z0-9_]*$`) - -var genericNames = map[string]bool{ - "test": true, "tool1": true, "foo": true, "bar": true, "baz": true, - "temp": true, "tmp": true, "example": true, -} - -type ToolStatus struct { - Name string `json:"name"` - Status string `json:"status"` -} - -type ValidationError struct { - Tool string `json:"tool"` - Issue string `json:"issue"` -} - -type Result struct { - Tools []ToolStatus `json:"tools"` - Errors []ValidationError `json:"errors"` - Pass bool `json:"pass"` -} - -func Tools(tools []*pb.ToolDefinition, strict bool) Result { - result := Result{Pass: true} - seen := make(map[string]bool) - - for _, t := range tools { - status := ToolStatus{Name: t.Name, Status: "ok"} - - if t.Name == "" { - result.Errors = append(result.Errors, ValidationError{Tool: "", Issue: "empty tool name"}) - result.Pass = false - status.Status = "error" - } else if !validName.MatchString(t.Name) { - result.Errors = append(result.Errors, ValidationError{Tool: t.Name, Issue: fmt.Sprintf("invalid name %q: must match [a-zA-Z_][a-zA-Z0-9_]*", t.Name)}) - result.Pass = false - status.Status = "error" - } else if seen[t.Name] { - result.Errors = append(result.Errors, ValidationError{Tool: t.Name, Issue: "duplicate tool name"}) - result.Pass = false - status.Status = "error" - } - seen[t.Name] = true - - if t.Description == "" { - result.Errors = append(result.Errors, ValidationError{Tool: t.Name, Issue: "no description"}) - result.Pass = false - status.Status = "error" - } - - if t.InputSchemaJson != "" { - var schema map[string]interface{} - 
if err := json.Unmarshal([]byte(t.InputSchemaJson), &schema); err != nil { - result.Errors = append(result.Errors, ValidationError{Tool: t.Name, Issue: fmt.Sprintf("invalid input schema JSON: %v", err)}) - result.Pass = false - status.Status = "error" - } - } - - if strict { - if len(t.Description) < 10 { - result.Errors = append(result.Errors, ValidationError{Tool: t.Name, Issue: fmt.Sprintf("description too short (%d chars, minimum 10)", len(t.Description))}) - result.Pass = false - status.Status = "error" - } - if genericNames[strings.ToLower(t.Name)] { - result.Errors = append(result.Errors, ValidationError{Tool: t.Name, Issue: fmt.Sprintf("generic name %q", t.Name)}) - result.Pass = false - status.Status = "error" - } - } - - result.Tools = append(result.Tools, status) - } - - return result -} - -func (r Result) FormatText() string { - var sb strings.Builder - for _, t := range r.Tools { - if t.Status == "ok" { - sb.WriteString(fmt.Sprintf("✓ %s — OK\n", t.Name)) - } - } - if len(r.Errors) > 0 { - sb.WriteString(fmt.Sprintf("✗ — %d error(s):\n", len(r.Errors))) - for _, e := range r.Errors { - if e.Tool != "" { - sb.WriteString(fmt.Sprintf(" · %q: %s\n", e.Tool, e.Issue)) - } else { - sb.WriteString(fmt.Sprintf(" · %s\n", e.Issue)) - } - } - } - return sb.String() -} - -func (r Result) FormatJSON() string { - b, _ := json.Marshal(r) - return string(b) -} -``` - -- [ ] **Step 4: Run tests to verify they pass** - -Run: `go test ./internal/validate/ -v` -Expected: All pass. - -- [ ] **Step 5: Commit** - -```bash -git add internal/validate/ -git commit -m "feat: add build-time tool validation" -``` - ---- - -### Task 4: Wire validate command and --auth into main.go - -**Files:** -- Modify: `cmd/protomcp/main.go` - -- [ ] **Step 1: Add validate subcommand handling** - -Add an import for the validate package and handle the validate command before the existing dev/run flow. 
In `main()`, after parsing config, add: - -```go - if cfg.Command == "validate" { - runValidate(ctx, cfg) - return - } -``` - -Add the `runValidate` function: - -```go -func runValidate(ctx context.Context, cfg *config.Config) { - var runtimeCmd string - var runtimeArgs []string - if cfg.Runtime != "" { - runtimeCmd = cfg.Runtime - runtimeArgs = []string{cfg.File} - } else { - runtimeCmd, runtimeArgs = config.RuntimeCommand(cfg.File) - } - - pm := process.NewManager(process.ManagerConfig{ - File: cfg.File, - RuntimeCmd: runtimeCmd, - RuntimeArgs: runtimeArgs, - SocketPath: cfg.SocketPath, - MaxRetries: 1, - CallTimeout: 30 * time.Second, - }) - - tools, err := pm.Start(ctx) - if err != nil { - fmt.Fprintf(os.Stderr, "error: failed to start tool process: %v\n", err) - os.Exit(1) - } - defer pm.Stop() - - result := validate.Tools(tools, cfg.Strict) - - if cfg.Format == "json" { - fmt.Println(result.FormatJSON()) - } else { - fmt.Print(result.FormatText()) - } - - if !result.Pass { - os.Exit(1) - } -} -``` - -Add imports: `"github.com/msilverblatt/protomcp/internal/validate"`, `"time"`. - -- [ ] **Step 2: Verify build** (auth wiring is deferred to Task 5 to avoid compilation errors) - -Run: `go build ./cmd/protomcp/` -Expected: Build succeeds. 
- -- [ ] **Step 3: Commit** - -```bash -git add cmd/protomcp/main.go -git commit -m "feat: wire validate command into CLI" -``` - ---- - -### Task 5: Auth middleware - -**Files:** -- Create: `internal/middleware/auth.go` -- Create: `internal/middleware/auth_test.go` - -- [ ] **Step 1: Write failing tests** - -Create `internal/middleware/auth_test.go`: - -```go -package middleware_test - -import ( - "context" - "encoding/json" - "os" - "testing" - - "github.com/msilverblatt/protomcp/internal/mcp" - "github.com/msilverblatt/protomcp/internal/middleware" -) - -func TestAuthTokenValid(t *testing.T) { - os.Setenv("TEST_TOKEN", "secret123") - defer os.Unsetenv("TEST_TOKEN") - - mw, err := middleware.NewAuth([]string{"token:TEST_TOKEN"}) - if err != nil { - t.Fatal(err) - } - - next := func(ctx context.Context, req mcp.JSONRPCRequest) (*mcp.JSONRPCResponse, error) { - return &mcp.JSONRPCResponse{ID: req.ID, Result: []byte(`"ok"`)}, nil - } - - handler := mw(next) - ctx := middleware.WithAuthHeader(context.Background(), "Bearer secret123") - resp, err := handler(ctx, mcp.JSONRPCRequest{ID: json.RawMessage(`1`), Method: "tools/call"}) - if err != nil { - t.Fatal(err) - } - if resp == nil { - t.Fatal("expected response") - } -} - -func TestAuthTokenInvalid(t *testing.T) { - os.Setenv("TEST_TOKEN", "secret123") - defer os.Unsetenv("TEST_TOKEN") - - mw, err := middleware.NewAuth([]string{"token:TEST_TOKEN"}) - if err != nil { - t.Fatal(err) - } - - next := func(ctx context.Context, req mcp.JSONRPCRequest) (*mcp.JSONRPCResponse, error) { - return &mcp.JSONRPCResponse{ID: req.ID, Result: []byte(`"ok"`)}, nil - } - - handler := mw(next) - ctx := middleware.WithAuthHeader(context.Background(), "Bearer wrong") - _, err = handler(ctx, mcp.JSONRPCRequest{ID: json.RawMessage(`1`), Method: "tools/call"}) - if err == nil { - t.Fatal("expected auth error") - } -} - -func TestAuthTokenMissing(t *testing.T) { - os.Setenv("TEST_TOKEN", "secret123") - defer os.Unsetenv("TEST_TOKEN") - - mw, 
err := middleware.NewAuth([]string{"token:TEST_TOKEN"}) - if err != nil { - t.Fatal(err) - } - - next := func(ctx context.Context, req mcp.JSONRPCRequest) (*mcp.JSONRPCResponse, error) { - return &mcp.JSONRPCResponse{}, nil - } - - handler := mw(next) - _, err = handler(context.Background(), mcp.JSONRPCRequest{ID: json.RawMessage(`1`), Method: "tools/call"}) - if err == nil { - t.Fatal("expected auth error for missing header") - } -} - -func TestAuthApikeyValid(t *testing.T) { - os.Setenv("TEST_KEY", "mykey") - defer os.Unsetenv("TEST_KEY") - - mw, err := middleware.NewAuth([]string{"apikey:TEST_KEY"}) - if err != nil { - t.Fatal(err) - } - - next := func(ctx context.Context, req mcp.JSONRPCRequest) (*mcp.JSONRPCResponse, error) { - return &mcp.JSONRPCResponse{ID: req.ID, Result: []byte(`"ok"`)}, nil - } - - handler := mw(next) - ctx := middleware.WithAPIKeyHeader(context.Background(), "mykey") - resp, err := handler(ctx, mcp.JSONRPCRequest{ID: json.RawMessage(`1`), Method: "tools/call"}) - if err != nil { - t.Fatal(err) - } - if resp == nil { - t.Fatal("expected response") - } -} - -func TestNewAuthEnvNotSet(t *testing.T) { - os.Unsetenv("NONEXISTENT_VAR") - _, err := middleware.NewAuth([]string{"token:NONEXISTENT_VAR"}) - if err == nil { - t.Error("expected error for unset env var") - } -} - -func TestNewAuthMultiple(t *testing.T) { - os.Setenv("TEST_TOKEN2", "tok") - os.Setenv("TEST_KEY2", "key") - defer os.Unsetenv("TEST_TOKEN2") - defer os.Unsetenv("TEST_KEY2") - - mw, err := middleware.NewAuth([]string{"token:TEST_TOKEN2", "apikey:TEST_KEY2"}) - if err != nil { - t.Fatal(err) - } - - next := func(ctx context.Context, req mcp.JSONRPCRequest) (*mcp.JSONRPCResponse, error) { - return &mcp.JSONRPCResponse{ID: req.ID, Result: []byte(`"ok"`)}, nil - } - - handler := mw(next) - ctx := middleware.WithAuthHeader(context.Background(), "Bearer tok") - ctx = middleware.WithAPIKeyHeader(ctx, "key") - resp, err := handler(ctx, mcp.JSONRPCRequest{ID: json.RawMessage(`1`), 
Method: "tools/call"}) - if err != nil { - t.Fatal(err) - } - if resp == nil { - t.Fatal("expected response") - } -} -``` - -- [ ] **Step 2: Run tests to verify they fail** - -Run: `go test ./internal/middleware/ -v` -Expected: FAIL — `NewAuth`, `WithAuthHeader`, `WithAPIKeyHeader` don't exist. - -- [ ] **Step 3: Implement auth middleware** - -Create `internal/middleware/auth.go`: - -```go -package middleware - -import ( - "context" - "fmt" - "os" - "strings" -) - -type authContextKey string - -const ( - authHeaderKey authContextKey = "auth-header" - apiKeyHeaderKey authContextKey = "apikey-header" -) - -// WithAuthHeader adds an Authorization header value to the context. -func WithAuthHeader(ctx context.Context, value string) context.Context { - return context.WithValue(ctx, authHeaderKey, value) -} - -// WithAPIKeyHeader adds an X-API-Key header value to the context. -func WithAPIKeyHeader(ctx context.Context, value string) context.Context { - return context.WithValue(ctx, apiKeyHeaderKey, value) -} - -// GetAuthHeader retrieves the Authorization header from context. -func GetAuthHeader(ctx context.Context) string { - v, _ := ctx.Value(authHeaderKey).(string) - return v -} - -// GetAPIKeyHeader retrieves the X-API-Key header from context. -func GetAPIKeyHeader(ctx context.Context) string { - v, _ := ctx.Value(apiKeyHeaderKey).(string) - return v -} - -type authChecker struct { - scheme string - value string -} - -// NewAuth creates an auth middleware from --auth flag values. -// Each value must be "token:ENV_VAR" or "apikey:ENV_VAR". -// Returns error if env var is not set. 
-func NewAuth(authSpecs []string) (Middleware, error) { - var checkers []authChecker - - for _, spec := range authSpecs { - parts := strings.SplitN(spec, ":", 2) - if len(parts) != 2 { - return nil, fmt.Errorf("invalid auth spec %q", spec) - } - scheme, envVar := parts[0], parts[1] - value := os.Getenv(envVar) - if value == "" { - return nil, fmt.Errorf("environment variable %q is not set (required by --auth %s)", envVar, spec) - } - checkers = append(checkers, authChecker{scheme: scheme, value: value}) - } - - return func(next Handler) Handler { - return func(ctx context.Context, req JSONRPCRequest) (*JSONRPCResponse, error) { - for _, c := range checkers { - switch c.scheme { - case "token": - header := GetAuthHeader(ctx) - expected := "Bearer " + c.value - if header != expected { - return nil, fmt.Errorf("unauthorized: invalid or missing Bearer token") - } - case "apikey": - header := GetAPIKeyHeader(ctx) - if header != c.value { - return nil, fmt.Errorf("unauthorized: invalid or missing API key") - } - } - } - return next(ctx, req) - } - }, nil -} -``` - -Note: Import the `mcp` package types via the existing middleware package imports. The `Handler` and `Middleware` types are already defined in `chain.go`. Add the `JSONRPCRequest` and `JSONRPCResponse` type aliases or import from `mcp` package as needed — check what `chain.go` already imports. - -- [ ] **Step 4: Run tests to verify they pass** - -Run: `go test ./internal/middleware/ -v` -Expected: All pass. - -- [ ] **Step 5: Wire auth middleware into main.go** - -In `cmd/protomcp/main.go`, replace the existing middleware chain setup with: - -```go - // 6. 
Apply middleware - middlewares := []middleware.Middleware{ - middleware.Logging(logger), - middleware.ErrorFormatting(), - } - - if len(cfg.Auth) > 0 { - if cfg.Transport == "stdio" { - slog.Warn("--auth ignored for stdio transport") - } else { - authMw, err := middleware.NewAuth(cfg.Auth) - if err != nil { - slog.Error("invalid --auth configuration", "error", err) - os.Exit(1) - } - middlewares = append([]middleware.Middleware{authMw}, middlewares...) - } - } - - chain := middleware.Chain( - func(ctx context.Context, req mcp.JSONRPCRequest) (*mcp.JSONRPCResponse, error) { - return handler.Handle(ctx, req) - }, - middlewares..., - ) -``` - -- [ ] **Step 6: Verify full build** - -Run: `go build ./cmd/protomcp/` -Expected: Clean build. - -- [ ] **Step 7: Commit** - -```bash -git add internal/middleware/auth.go internal/middleware/auth_test.go cmd/protomcp/main.go -git commit -m "feat: add auth middleware (token + apikey) and wire into CLI" -``` - ---- - -### Task 6: Extended handshake for middleware registration - -**Files:** -- Modify: `internal/process/manager.go` -- Modify: `internal/process/manager_test.go` -- Create: `internal/middleware/custom.go` -- Create: `internal/middleware/custom_test.go` - -- [ ] **Step 1: Add middleware tracking to Manager** - -Add to `Manager` struct: - -```go - middlewares []RegisteredMiddleware -``` - -Add type: - -```go -type RegisteredMiddleware struct { - Name string - Priority int32 -} -``` - -- [ ] **Step 2: Extend handshake in Start()** - -After `listTools` returns, add a loop that waits for optional `RegisterMiddlewareRequest` messages or a `ReloadResponse` (handshake-complete signal): - -```go - // After listTools, wait for optional middleware registrations + handshake-complete signal. 
- m.mu.Lock() - m.tools = tools - m.mu.Unlock() - - middlewares, err := m.awaitHandshakeComplete(ctx) - if err != nil { - m.cleanup() - return nil, fmt.Errorf("handshake middleware: %w", err) - } - m.mu.Lock() - m.middlewares = middlewares - m.mu.Unlock() -``` - -Implement `awaitHandshakeComplete`: - -```go -func (m *Manager) awaitHandshakeComplete(ctx context.Context) ([]RegisteredMiddleware, error) { - var middlewares []RegisteredMiddleware - // Short timeout for handshake-complete signal. If v1.0 SDKs don't send it, - // we treat "no message within 500ms" as handshake-complete (backward compat). - timer := time.NewTimer(500 * time.Millisecond) - defer timer.Stop() - - for { - select { - case <-ctx.Done(): - return nil, ctx.Err() - case <-timer.C: - // Backward compat: v1.0 SDKs don't send handshake-complete signal. - // Treat timeout as "no middleware registered, handshake done." - return middlewares, nil - case env := <-m.handshakeCh: - if rr := env.GetReloadResponse(); rr != nil { - // Handshake complete signal - return middlewares, nil - } - if rm := env.GetRegisterMiddleware(); rm != nil { - middlewares = append(middlewares, RegisteredMiddleware{ - Name: rm.Name, - Priority: rm.Priority, - }) - // Send acknowledgment - resp := &pb.Envelope{ - Msg: &pb.Envelope_RegisterMiddlewareResponse{ - RegisterMiddlewareResponse: &pb.RegisterMiddlewareResponse{Success: true}, - }, - } - if err := envelope.Write(m.conn, resp); err != nil { - return nil, fmt.Errorf("write RegisterMiddlewareResponse: %w", err) - } - continue - } - // Unexpected message type — ignore - } - } -} -``` - -- [ ] **Step 3: Add Middlewares() accessor** - -```go -func (m *Manager) Middlewares() []RegisteredMiddleware { - m.mu.Lock() - defer m.mu.Unlock() - return m.middlewares -} -``` - -- [ ] **Step 4: Update readLoop to route RegisterMiddleware and MiddlewareIntercept messages** - -In `readLoop()`, add handling for `MiddlewareInterceptResponse` — route it via `pending` map using `request_id` 
(same as `CallToolResponse`). For `RegisterMiddlewareRequest` with no `request_id`, route to `handshakeCh`. - -Update the unsolicited message handling in `readLoop`: - -```go - if reqID == "" { - // Unsolicited message (ToolListResponse after reload, or middleware registration during handshake). - select { - case m.handshakeCh <- env: - default: - } - continue - } -``` - -This already works because `RegisterMiddlewareRequest` during handshake has no `request_id` and goes to `handshakeCh`. `MiddlewareInterceptResponse` has a `request_id` and routes via `pending`. - -- [ ] **Step 5: Add SendMiddlewareIntercept method to Manager** - -```go -func (m *Manager) SendMiddlewareIntercept(ctx context.Context, mwName, phase, toolName, argsJSON, resultJSON string, isError bool) (*pb.MiddlewareInterceptResponse, error) { - reqID := m.nextRequestID() - - env := &pb.Envelope{ - RequestId: reqID, - Msg: &pb.Envelope_MiddlewareIntercept{ - MiddlewareIntercept: &pb.MiddlewareInterceptRequest{ - MiddlewareName: mwName, - Phase: phase, - ToolName: toolName, - ArgumentsJson: argsJSON, - ResultJson: resultJSON, - IsError: isError, - }, - }, - } - - respCh := make(chan *pb.Envelope, 1) - m.mu.Lock() - m.pending[reqID] = respCh - m.mu.Unlock() - - defer func() { - m.mu.Lock() - delete(m.pending, reqID) - m.mu.Unlock() - }() - - if err := envelope.Write(m.conn, env); err != nil { - return nil, fmt.Errorf("write MiddlewareInterceptRequest: %w", err) - } - - timer := time.NewTimer(m.cfg.CallTimeout) - defer timer.Stop() - - select { - case <-ctx.Done(): - return nil, ctx.Err() - case <-timer.C: - return nil, fmt.Errorf("middleware intercept %q timed out", mwName) - case resp := <-respCh: - mir := resp.GetMiddlewareInterceptResponse() - if mir == nil { - return nil, fmt.Errorf("unexpected response type for MiddlewareIntercept") - } - return mir, nil - } -} -``` - -- [ ] **Step 6: Create custom middleware dispatcher** - -Create `internal/middleware/custom.go`: - -```go -package middleware - 
-import (
-	"context"
-	"encoding/json"
-	"fmt"
-	"sort"
-)
-
-// InterceptResponse is the subset of *pb.MiddlewareInterceptResponse that the
-// dispatcher's caller needs. Manager.SendMiddlewareIntercept returns the
-// concrete proto type, so wire it up in main.go with a small closure that
-// converts the return value to this interface.
-type InterceptResponse interface {
-	GetReject() bool
-	GetRejectReason() string
-	GetArgumentsJson() string
-	GetResultJson() string
-}
-
-// MiddlewareDispatcher sends intercept requests to the tool process.
-type MiddlewareDispatcher interface {
-	SendMiddlewareIntercept(ctx context.Context, mwName, phase, toolName, argsJSON, resultJSON string, isError bool) (InterceptResponse, error)
-}
-
-// RegisteredMW holds a registered custom middleware from the tool process.
-type RegisteredMW struct {
-	Name     string
-	Priority int32
-}
-
-// CustomMiddleware creates a middleware that dispatches to tool-process-registered middleware.
-func CustomMiddleware(dispatcher MiddlewareDispatcher, registered []RegisteredMW) Middleware {
-	if len(registered) == 0 {
-		return func(next Handler) Handler { return next }
-	}
-
-	// Sort by priority (lower first)
-	sorted := make([]RegisteredMW, len(registered))
-	copy(sorted, registered)
-	sort.Slice(sorted, func(i, j int) bool {
-		return sorted[i].Priority < sorted[j].Priority
-	})
-
-	return func(next Handler) Handler {
-		return func(ctx context.Context, req JSONRPCRequest) (*JSONRPCResponse, error) {
-			// For non-tool-call requests, skip custom middleware.
-			if req.Method != "tools/call" {
-				return next(ctx, req)
-			}
-
-			toolName, argsJSON := extractToolCallParams(req)
-
-			// Before phase
-			currentArgs := argsJSON
-			for _, mw := range sorted {
-				resp, err := dispatcher.SendMiddlewareIntercept(ctx, mw.Name, "before", toolName, currentArgs, "", false)
-				if err != nil {
-					return nil, fmt.Errorf("middleware %q before: %w", mw.Name, err)
-				}
-				if resp.GetReject() {
-					return nil, fmt.Errorf("rejected by middleware %q: %s", mw.Name, resp.GetRejectReason())
-				}
-				if modified := resp.GetArgumentsJson(); modified != "" {
-					currentArgs = modified
-				}
-			}
-
-			// Inject modified args back into the
request
-			if currentArgs != argsJSON {
-				modifiedParams, _ := json.Marshal(map[string]json.RawMessage{
-					"name":      json.RawMessage(fmt.Sprintf("%q", toolName)),
-					"arguments": json.RawMessage(currentArgs),
-				})
-				req.Params = modifiedParams
-			}
-
-			result, err := next(ctx, req)
-
-			// After phase (reverse order)
-			resultJSON := ""
-			isError := false
-			if result != nil {
-				resultJSON = string(result.Result)
-				isError = result.Error != nil
-			}
-
-			for i := len(sorted) - 1; i >= 0; i-- {
-				mw := sorted[i]
-				resp, afterErr := dispatcher.SendMiddlewareIntercept(ctx, mw.Name, "after", toolName, currentArgs, resultJSON, isError)
-				if afterErr != nil {
-					return result, err // Return original result on after-phase error
-				}
-				if modified := resp.GetResultJson(); modified != "" {
-					resultJSON = modified
-				}
-			}
-
-			return result, err
-		}
-	}
-}
-
-func extractToolCallParams(req JSONRPCRequest) (string, string) {
-	var params struct {
-		Name      string          `json:"name"`
-		Arguments json.RawMessage `json:"arguments"`
-	}
-	if err := json.Unmarshal(req.Params, &params); err != nil {
-		return "", "{}"
-	}
-	argsJSON := "{}"
-	if len(params.Arguments) > 0 {
-		argsJSON = string(params.Arguments)
-	}
-	return params.Name, argsJSON
-}
-```
-
-- [ ] **Step 7: Run all tests**
-
-Run: `go test ./internal/... -v`
-Expected: All pass.
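The phase ordering contract above is easy to get wrong, so it helps to pin it down: the before phase runs middleware in ascending priority, and the after phase runs the same set in exact reverse. A self-contained sketch that isolates just that ordering (the local `mw` struct and `phaseOrder` helper are illustration-only names, not part of the package):

```go
package main

import (
	"fmt"
	"sort"
)

type mw struct {
	Name     string
	Priority int32
}

// phaseOrder returns the before-phase order (ascending priority) and the
// after-phase order (its exact reverse), matching CustomMiddleware's loops.
func phaseOrder(registered []mw) (before, after []string) {
	sorted := append([]mw{}, registered...)
	sort.Slice(sorted, func(i, j int) bool { return sorted[i].Priority < sorted[j].Priority })
	for _, m := range sorted {
		before = append(before, m.Name)
	}
	for i := len(sorted) - 1; i >= 0; i-- {
		after = append(after, sorted[i].Name)
	}
	return before, after
}

func main() {
	before, after := phaseOrder([]mw{{"audit", 50}, {"auth", 10}, {"trace", 90}})
	fmt.Println(before) // [auth audit trace]
	fmt.Println(after)  // [trace audit auth]
}
```

The copy-then-sort keeps the caller's slice untouched, which matters because the registration order from the handshake is not the execution order.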
- -- [ ] **Step 8: Commit** - -```bash -git add internal/process/manager.go internal/middleware/custom.go internal/middleware/custom_test.go -git commit -m "feat: extended handshake for middleware registration + custom middleware dispatch" -``` - ---- - -### Task 7: Update SDK runners for middleware + handshake-complete signal - -**Files:** -- Modify: `sdk/python/src/protomcp/runner.py` -- Modify: `sdk/python/src/protomcp/__init__.py` -- Modify: `sdk/typescript/src/runner.ts` -- Modify: `sdk/typescript/src/index.ts` - -- [ ] **Step 1: Add middleware registry to Python SDK** - -Create `sdk/python/src/protomcp/middleware.py`: - -```python -from dataclasses import dataclass -from typing import Callable, Any - -_middleware_registry: list["MiddlewareDef"] = [] - -@dataclass -class MiddlewareDef: - name: str - priority: int - handler: Callable # (phase, tool_name, args_json, result_json, is_error) -> dict - -def middleware(name: str, priority: int = 100): - def decorator(func: Callable) -> Callable: - _middleware_registry.append(MiddlewareDef( - name=name, - priority=priority, - handler=func, - )) - return func - return decorator - -def get_registered_middleware() -> list[MiddlewareDef]: - return list(_middleware_registry) - -def clear_middleware_registry(): - _middleware_registry.clear() -``` - -- [ ] **Step 2: Update Python runner to send handshake-complete signal and handle middleware** - -In `runner.py`, after `_handle_list_tools`, send `RegisterMiddlewareRequest` for each registered middleware, then send `ReloadResponse { success: true }` as handshake-complete. Also handle `MiddlewareInterceptRequest`: - -Update the main `run()` loop setup to: -1. After sending `ToolListResponse`, send middleware registrations -2. Send `ReloadResponse(success=True)` with no `request_id` as handshake-complete -3. In the message loop, handle `middleware_intercept` messages - -Update `_handle_reload` to also send middleware registrations + handshake-complete after tool list. 
- -- [ ] **Step 3: Update TypeScript runner similarly** - -Add `sdk/typescript/src/middleware.ts` with equivalent registration. Update `runner.ts` to send middleware registrations + handshake-complete signal. Handle `middlewareIntercept` messages in the loop. - -- [ ] **Step 4: Export middleware from both SDKs** - -Update `sdk/python/src/protomcp/__init__.py` to export `middleware`, `get_registered_middleware`. -Update `sdk/typescript/src/index.ts` to export `middleware` from `middleware.ts`. - -- [ ] **Step 5: Run existing SDK tests to ensure no regressions** - -Run: `cd sdk/python && python -m pytest -v && cd ../typescript && npx vitest run` -Expected: All existing tests pass. - -- [ ] **Step 6: Commit** - -```bash -git add sdk/python/src/protomcp/ sdk/typescript/src/ -git commit -m "feat: add middleware support to Python and TypeScript SDKs" -``` - ---- - -## Chunk 2: Go SDK - -### Task 8: Go SDK scaffolding + transport - -**Files:** -- Create: `sdk/go/go.mod` -- Create: `sdk/go/protomcp/transport.go` -- Create: `sdk/go/protomcp/transport_test.go` - -- [ ] **Step 1: Create go.mod** - -``` -module github.com/msilverblatt/protomcp/sdk/go - -go 1.25.6 - -require github.com/msilverblatt/protomcp v0.0.0 - -replace github.com/msilverblatt/protomcp => ../.. 
-``` - -- [ ] **Step 2: Write failing transport test** - -Create `sdk/go/protomcp/transport_test.go`: - -```go -package protomcp_test - -import ( - "net" - "os" - "path/filepath" - "testing" - - "github.com/msilverblatt/protomcp/sdk/go/protomcp" -) - -func TestTransportConnectAndClose(t *testing.T) { - dir := t.TempDir() - sockPath := filepath.Join(dir, "test.sock") - - listener, err := net.Listen("unix", sockPath) - if err != nil { - t.Fatal(err) - } - defer listener.Close() - - os.Setenv("PROTOMCP_SOCKET", sockPath) - defer os.Unsetenv("PROTOMCP_SOCKET") - - tp := protomcp.NewTransport(sockPath) - - // Accept in background - go func() { listener.Accept() }() - - if err := tp.Connect(); err != nil { - t.Fatal(err) - } - tp.Close() -} -``` - -- [ ] **Step 3: Run test to verify it fails** - -Run: `cd sdk/go && go test ./protomcp/ -run TestTransportConnect -v` -Expected: FAIL — package doesn't exist. - -- [ ] **Step 4: Implement transport** - -Create `sdk/go/protomcp/transport.go`: - -```go -package protomcp - -import ( - "encoding/binary" - "fmt" - "io" - "net" - - pb "github.com/msilverblatt/protomcp/gen/proto/protomcp" - "google.golang.org/protobuf/proto" -) - -type Transport struct { - socketPath string - conn net.Conn -} - -func NewTransport(socketPath string) *Transport { - return &Transport{socketPath: socketPath} -} - -func (t *Transport) Connect() error { - conn, err := net.Dial("unix", t.socketPath) - if err != nil { - return fmt.Errorf("connect to socket: %w", err) - } - t.conn = conn - return nil -} - -func (t *Transport) Send(env *pb.Envelope) error { - data, err := proto.Marshal(env) - if err != nil { - return fmt.Errorf("marshal envelope: %w", err) - } - length := make([]byte, 4) - binary.BigEndian.PutUint32(length, uint32(len(data))) - if _, err := t.conn.Write(length); err != nil { - return err - } - _, err = t.conn.Write(data) - return err -} - -func (t *Transport) Recv() (*pb.Envelope, error) { - lengthBuf := make([]byte, 4) - if _, err := 
io.ReadFull(t.conn, lengthBuf); err != nil {
-		return nil, err
-	}
-	length := binary.BigEndian.Uint32(lengthBuf)
-	data := make([]byte, length)
-	if _, err := io.ReadFull(t.conn, data); err != nil {
-		return nil, err
-	}
-	env := &pb.Envelope{}
-	if err := proto.Unmarshal(data, env); err != nil {
-		return nil, fmt.Errorf("unmarshal envelope: %w", err)
-	}
-	return env, nil
-}
-
-func (t *Transport) Close() {
-	if t.conn != nil {
-		t.conn.Close()
-	}
-}
-```
-
-- [ ] **Step 5: Run test to verify it passes**
-
-Run: `cd sdk/go && go test ./protomcp/ -run TestTransportConnect -v`
-Expected: PASS.
-
-- [ ] **Step 6: Commit**
-
-```bash
-git add sdk/go/
-git commit -m "feat(sdk/go): add transport layer"
-```
-
----
-
-### Task 9: Go SDK result + context
-
-**Files:**
-- Create: `sdk/go/protomcp/result.go`
-- Create: `sdk/go/protomcp/result_test.go`
-- Create: `sdk/go/protomcp/context.go`
-- Create: `sdk/go/protomcp/context_test.go`
-
-- [ ] **Step 1: Write failing result test**
-
-```go
-package protomcp_test
-
-import (
-	"testing"
-
-	"github.com/msilverblatt/protomcp/sdk/go/protomcp"
-)
-
-func TestToolResultBasic(t *testing.T) {
-	r := protomcp.Result("hello")
-	if r.ResultText != "hello" {
-		t.Errorf("ResultText = %q, want %q", r.ResultText, "hello")
-	}
-	if r.IsError {
-		t.Error("should not be error")
-	}
-}
-
-func TestToolResultError(t *testing.T) {
-	r := protomcp.ErrorResult("failed", "INVALID", "try again", true)
-	if !r.IsError {
-		t.Error("should be error")
-	}
-	if r.ErrorCode != "INVALID" {
-		t.Errorf("ErrorCode = %q, want %q", r.ErrorCode, "INVALID")
-	}
-}
-
-func TestToolResultEnableDisable(t *testing.T) {
-	r := protomcp.Result("ok")
-	r.EnableTools = []string{"admin_panel"}
-	r.DisableTools = []string{"login"}
-	if len(r.EnableTools) != 1 {
-		t.Error("expected 1 enable tool")
-	}
-}
-```
-
-- [ ] **Step 2: Implement result.go**
-
-```go
-package protomcp
-
-type ToolResult struct {
-	ResultText  string
-	IsError     bool
-	ErrorCode   string
-	Message     string
-	Suggestion  string
-	Retryable   bool
-	EnableTools
[]string - DisableTools []string -} - -func Result(text string) ToolResult { - return ToolResult{ResultText: text} -} - -func ErrorResult(text, errorCode, suggestion string, retryable bool) ToolResult { - return ToolResult{ - ResultText: text, - IsError: true, - ErrorCode: errorCode, - Message: text, - Suggestion: suggestion, - Retryable: retryable, - } -} -``` - -- [ ] **Step 3: Write context tests and implement** - -Context wraps progress reporting and cancellation. Uses `context.Context` for cancellation: - -```go -package protomcp - -import ( - "context" - - pb "github.com/msilverblatt/protomcp/gen/proto/protomcp" -) - -type ToolContext struct { - Ctx context.Context - ProgressToken string - sendFn func(*pb.Envelope) error -} - -func (tc *ToolContext) ReportProgress(progress, total int64, message string) error { - env := &pb.Envelope{ - Msg: &pb.Envelope_Progress{ - Progress: &pb.ProgressNotification{ - ProgressToken: tc.ProgressToken, - Progress: progress, - Total: total, - Message: message, - }, - }, - } - return tc.sendFn(env) -} - -func (tc *ToolContext) IsCancelled() bool { - return tc.Ctx.Err() != nil -} -``` - -- [ ] **Step 4: Run tests** - -Run: `cd sdk/go && go test ./protomcp/ -v` -Expected: All pass. 
- -- [ ] **Step 5: Commit** - -```bash -git add sdk/go/protomcp/result.go sdk/go/protomcp/result_test.go sdk/go/protomcp/context.go sdk/go/protomcp/context_test.go -git commit -m "feat(sdk/go): add ToolResult and ToolContext" -``` - ---- - -### Task 10: Go SDK tool registration - -**Files:** -- Create: `sdk/go/protomcp/tool.go` -- Create: `sdk/go/protomcp/tool_test.go` - -- [ ] **Step 1: Write failing test** - -```go -package protomcp_test - -import ( - "testing" - - "github.com/msilverblatt/protomcp/sdk/go/protomcp" -) - -func TestToolRegistration(t *testing.T) { - protomcp.ClearRegistry() - protomcp.Tool("add", - protomcp.Description("Add two numbers"), - protomcp.Args(protomcp.IntArg("a"), protomcp.IntArg("b")), - protomcp.Handler(func(ctx protomcp.ToolContext, args map[string]interface{}) protomcp.ToolResult { - return protomcp.Result("3") - }), - ) - - tools := protomcp.GetRegisteredTools() - if len(tools) != 1 { - t.Fatalf("expected 1 tool, got %d", len(tools)) - } - if tools[0].Name != "add" { - t.Errorf("name = %q, want %q", tools[0].Name, "add") - } - if tools[0].Desc != "Add two numbers" { - t.Errorf("description = %q, want %q", tools[0].Desc, "Add two numbers") - } -} - -func TestToolMetadata(t *testing.T) { - protomcp.ClearRegistry() - protomcp.Tool("delete_user", - protomcp.Description("Delete a user account"), - protomcp.DestructiveHint(true), - protomcp.Handler(func(ctx protomcp.ToolContext, args map[string]interface{}) protomcp.ToolResult { - return protomcp.Result("deleted") - }), - ) - - tools := protomcp.GetRegisteredTools() - if !tools[0].Destructive { - t.Error("expected destructive hint") - } -} -``` - -- [ ] **Step 2: Implement tool.go with functional options** - -```go -package protomcp - -import ( - "encoding/json" -) - -type ToolDef struct { - Name string - Desc string - InputSchema map[string]interface{} - OutputSchema map[string]interface{} - HandlerFn func(ToolContext, map[string]interface{}) ToolResult - Title string - Destructive bool 
- Idempotent bool - ReadOnly bool - OpenWorld bool - TaskSupport bool -} - -type ToolOption func(*ToolDef) - -var registry []ToolDef - -func Tool(name string, opts ...ToolOption) { - td := ToolDef{ - Name: name, - InputSchema: map[string]interface{}{"type": "object", "properties": map[string]interface{}{}}, - } - for _, opt := range opts { - opt(&td) - } - registry = append(registry, td) -} - -func Description(desc string) ToolOption { - return func(td *ToolDef) { td.Desc = desc } -} - -type ArgDef struct { - Name string - Type string -} - -func IntArg(name string) ArgDef { return ArgDef{Name: name, Type: "integer"} } -func StrArg(name string) ArgDef { return ArgDef{Name: name, Type: "string"} } -func NumArg(name string) ArgDef { return ArgDef{Name: name, Type: "number"} } -func BoolArg(name string) ArgDef { return ArgDef{Name: name, Type: "boolean"} } - -func Args(args ...ArgDef) ToolOption { - return func(td *ToolDef) { - props := map[string]interface{}{} - required := []string{} - for _, a := range args { - props[a.Name] = map[string]interface{}{"type": a.Type} - required = append(required, a.Name) - } - td.InputSchema = map[string]interface{}{ - "type": "object", - "properties": props, - "required": required, - } - } -} - -func Handler(fn func(ToolContext, map[string]interface{}) ToolResult) ToolOption { - return func(td *ToolDef) { td.HandlerFn = fn } -} - -func DestructiveHint(v bool) ToolOption { return func(td *ToolDef) { td.Destructive = v } } -func IdempotentHint(v bool) ToolOption { return func(td *ToolDef) { td.Idempotent = v } } -func ReadOnlyHint(v bool) ToolOption { return func(td *ToolDef) { td.ReadOnly = v } } -func OpenWorldHint(v bool) ToolOption { return func(td *ToolDef) { td.OpenWorld = v } } -func TaskSupportHint(v bool) ToolOption { return func(td *ToolDef) { td.TaskSupport = v } } - -func (td ToolDef) InputSchemaJSON() string { - b, _ := json.Marshal(td.InputSchema) - return string(b) -} - -func GetRegisteredTools() []ToolDef { return 
append([]ToolDef{}, registry...) } -func ClearRegistry() { registry = nil } -``` - -- [ ] **Step 3: Run tests** - -Run: `cd sdk/go && go test ./protomcp/ -run TestTool -v` -Expected: All pass. - -- [ ] **Step 4: Commit** - -```bash -git add sdk/go/protomcp/tool.go sdk/go/protomcp/tool_test.go -git commit -m "feat(sdk/go): add tool registration with functional options" -``` - ---- - -### Task 11: Go SDK log + manager + runner - -**Files:** -- Create: `sdk/go/protomcp/log.go` -- Create: `sdk/go/protomcp/manager.go` -- Create: `sdk/go/protomcp/runner.go` - -- [ ] **Step 1: Implement log.go** - -Server logging with 8 RFC 5424 levels. Follow the same pattern as Python SDK's `log.py`: - -```go -package protomcp - -import ( - pb "github.com/msilverblatt/protomcp/gen/proto/protomcp" -) - -type ServerLogger struct { - sendFn func(*pb.Envelope) error - logger string -} - -func NewServerLogger(sendFn func(*pb.Envelope) error, logger string) *ServerLogger { - return &ServerLogger{sendFn: sendFn, logger: logger} -} - -func (l *ServerLogger) log(level, dataJSON string) { - if l.sendFn == nil { - return - } - l.sendFn(&pb.Envelope{ - Msg: &pb.Envelope_Log{ - Log: &pb.LogMessage{ - Level: level, - Logger: l.logger, - DataJson: dataJSON, - }, - }, - }) -} - -func (l *ServerLogger) Debug(msg string) { l.log("debug", msg) } -func (l *ServerLogger) Info(msg string) { l.log("info", msg) } -func (l *ServerLogger) Notice(msg string) { l.log("notice", msg) } -func (l *ServerLogger) Warning(msg string) { l.log("warning", msg) } -func (l *ServerLogger) Error(msg string) { l.log("error", msg) } -func (l *ServerLogger) Critical(msg string) { l.log("critical", msg) } -func (l *ServerLogger) Alert(msg string) { l.log("alert", msg) } -func (l *ServerLogger) Emergency(msg string) { l.log("emergency", msg) } -``` - -- [ ] **Step 2: Implement manager.go** - -Dynamic tool list management — `ToolManager` with Enable/Disable/SetAllowed/SetBlocked: - -```go -package protomcp - -import ( - pb 
"github.com/msilverblatt/protomcp/gen/proto/protomcp" -) - -type ToolManager struct { - sendFn func(*pb.Envelope) error -} - -func newToolManager(sendFn func(*pb.Envelope) error) *ToolManager { - return &ToolManager{sendFn: sendFn} -} - -func (m *ToolManager) Enable(names ...string) { - m.sendFn(&pb.Envelope{ - Msg: &pb.Envelope_EnableTools{ - EnableTools: &pb.EnableToolsRequest{ToolNames: names}, - }, - }) -} - -func (m *ToolManager) Disable(names ...string) { - m.sendFn(&pb.Envelope{ - Msg: &pb.Envelope_DisableTools{ - DisableTools: &pb.DisableToolsRequest{ToolNames: names}, - }, - }) -} -``` - -- [ ] **Step 3: Implement runner.go** - -Main loop: connect to socket, send tool list, handle calls, handle reload. Follow the same pattern as Python/TypeScript runners but with handshake-complete signal: - -```go -package protomcp - -import ( - "encoding/json" - "fmt" - "os" - - pb "github.com/msilverblatt/protomcp/gen/proto/protomcp" -) - -var Log *ServerLogger - -func Run() { - socketPath := os.Getenv("PROTOMCP_SOCKET") - if socketPath == "" { - fmt.Fprintln(os.Stderr, "PROTOMCP_SOCKET not set — run via 'pmcp dev'") - os.Exit(1) - } - - tp := NewTransport(socketPath) - if err := tp.Connect(); err != nil { - fmt.Fprintf(os.Stderr, "connect: %v\n", err) - os.Exit(1) - } - defer tp.Close() - - Log = NewServerLogger(func(env *pb.Envelope) error { return tp.Send(env) }, "protomcp-go") - - for { - env, err := tp.Recv() - if err != nil { - break - } - - reqID := env.GetRequestId() - - switch { - case env.GetListTools() != nil: - handleListTools(tp, reqID) - sendHandshakeComplete(tp) - case env.GetCallTool() != nil: - handleCallTool(tp, env.GetCallTool(), reqID) - case env.GetReload() != nil: - handleReload(tp, reqID) - case env.GetMiddlewareIntercept() != nil: - handleMiddlewareIntercept(tp, env.GetMiddlewareIntercept(), reqID) - } - } -} - -func handleListTools(tp *Transport, reqID string) { - tools := GetRegisteredTools() - var defs []*pb.ToolDefinition - for _, t := range 
tools { - defs = append(defs, &pb.ToolDefinition{ - Name: t.Name, - Description: t.Desc, - InputSchemaJson: t.InputSchemaJSON(), - DestructiveHint: t.Destructive, - IdempotentHint: t.Idempotent, - ReadOnlyHint: t.ReadOnly, - OpenWorldHint: t.OpenWorld, - TaskSupport: t.TaskSupport, - }) - } - tp.Send(&pb.Envelope{ - RequestId: reqID, - Msg: &pb.Envelope_ToolList{ - ToolList: &pb.ToolListResponse{Tools: defs}, - }, - }) -} - -func sendHandshakeComplete(tp *Transport) { - // Send middleware registrations if any - // TODO: add middleware registration here when middleware support is added - - // Send handshake-complete signal - tp.Send(&pb.Envelope{ - Msg: &pb.Envelope_ReloadResponse{ - ReloadResponse: &pb.ReloadResponse{Success: true}, - }, - }) -} - -func handleCallTool(tp *Transport, req *pb.CallToolRequest, reqID string) { - tools := GetRegisteredTools() - var handler func(ToolContext, map[string]interface{}) ToolResult - for _, t := range tools { - if t.Name == req.Name { - handler = t.HandlerFn - break - } - } - - if handler == nil { - tp.Send(&pb.Envelope{ - RequestId: reqID, - Msg: &pb.Envelope_CallResult{ - CallResult: &pb.CallToolResponse{ - IsError: true, - ResultJson: fmt.Sprintf(`[{"type":"text","text":"Tool not found: %s"}]`, req.Name), - }, - }, - }) - return - } - - var args map[string]interface{} - if req.ArgumentsJson != "" { - json.Unmarshal([]byte(req.ArgumentsJson), &args) - } - if args == nil { - args = map[string]interface{}{} - } - - ctx := ToolContext{ - ProgressToken: req.ProgressToken, - sendFn: func(env *pb.Envelope) error { return tp.Send(env) }, - } - - result := handler(ctx, args) - - resp := &pb.CallToolResponse{ - IsError: result.IsError, - ResultJson: fmt.Sprintf(`[{"type":"text","text":"%s"}]`, result.ResultText), - EnableTools: result.EnableTools, - DisableTools: result.DisableTools, - } - if result.IsError && result.ErrorCode != "" { - resp.Error = &pb.ToolError{ - ErrorCode: result.ErrorCode, - Message: result.Message, - 
Suggestion: result.Suggestion, - Retryable: result.Retryable, - } - } - - tp.Send(&pb.Envelope{ - RequestId: reqID, - Msg: &pb.Envelope_CallResult{CallResult: resp}, - }) -} - -func handleReload(tp *Transport, reqID string) { - tp.Send(&pb.Envelope{ - RequestId: reqID, - Msg: &pb.Envelope_ReloadResponse{ - ReloadResponse: &pb.ReloadResponse{Success: true}, - }, - }) - handleListTools(tp, "") - sendHandshakeComplete(tp) -} - -func handleMiddlewareIntercept(tp *Transport, req *pb.MiddlewareInterceptRequest, reqID string) { - // TODO: dispatch to registered middleware handlers - tp.Send(&pb.Envelope{ - RequestId: reqID, - Msg: &pb.Envelope_MiddlewareInterceptResponse{ - MiddlewareInterceptResponse: &pb.MiddlewareInterceptResponse{ - ArgumentsJson: req.ArgumentsJson, - ResultJson: req.ResultJson, - }, - }, - }) -} -``` - -- [ ] **Step 4: Run Go SDK tests** - -Run: `cd sdk/go && go test ./protomcp/ -v` -Expected: All pass. - -- [ ] **Step 5: Verify build** - -Run: `cd sdk/go && go build ./protomcp/` -Expected: Clean build. 
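One caveat on the `fmt.Sprintf`-built `result_json` in `handleCallTool` above: it produces invalid JSON whenever `ResultText` contains quotes, backslashes, or newlines. A hedged alternative sketch that keeps the same `[{"type":"text","text":...}]` shape but lets `encoding/json` do the escaping (`textContent` and `resultJSON` are illustration-only names):

```go
package main

import (
	"encoding/json"
	"fmt"
)

// textContent mirrors the single-element content array the runner emits.
type textContent struct {
	Type string `json:"type"`
	Text string `json:"text"`
}

// resultJSON marshals the text instead of splicing it into a format string,
// so quotes and newlines in the tool output are escaped correctly.
func resultJSON(text string) string {
	b, _ := json.Marshal([]textContent{{Type: "text", Text: text}})
	return string(b)
}

func main() {
	fmt.Println(resultJSON(`line "one"` + "\nline two"))
}
```

The marshal error can be safely ignored here because a struct of plain strings cannot fail to encode.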
- -- [ ] **Step 6: Commit** - -```bash -git add sdk/go/protomcp/ -git commit -m "feat(sdk/go): add log, manager, and runner" -``` - ---- - -## Chunk 3: Rust SDK - -### Task 12: Rust SDK scaffolding - -**Files:** -- Create: `sdk/rust/Cargo.toml` -- Create: `sdk/rust/build.rs` -- Create: `sdk/rust/src/lib.rs` - -- [ ] **Step 1: Create Cargo.toml** - -```toml -[package] -name = "protomcp" -version = "0.1.0" -edition = "2021" -description = "Rust SDK for protomcp — write MCP tools in Rust" -license = "MIT" - -[dependencies] -prost = "0.13" -tokio = { version = "1", features = ["full"] } -serde = { version = "1", features = ["derive"] } -serde_json = "1" - -[build-dependencies] -prost-build = "0.13" -``` - -- [ ] **Step 2: Create build.rs** - -```rust -fn main() { - prost_build::compile_protos(&["../../proto/protomcp.proto"], &["../../proto/"]).unwrap(); -} -``` - -- [ ] **Step 3: Create src/lib.rs with module declarations** - -```rust -pub mod proto { - include!(concat!(env!("OUT_DIR"), "/protomcp.rs")); -} - -mod tool; -mod result; -mod context; -mod manager; -mod log; -mod transport; -mod runner; - -pub use tool::{tool, ToolDef, ArgDef, clear_registry, get_registered_tools}; -pub use result::ToolResult; -pub use context::ToolContext; -pub use runner::run; -``` - -- [ ] **Step 4: Verify protobuf generation builds** - -Run: `cd sdk/rust && cargo build` -Expected: May fail on missing modules — that's fine. Proto generation should succeed. 
-
-- [ ] **Step 5: Commit**
-
-```bash
-git add sdk/rust/
-git commit -m "feat(sdk/rust): scaffold crate with prost protobuf generation"
-```
-
----
-
-### Task 13-16: Rust SDK modules
-
-Follow the same pattern as the Go SDK tasks (9-11), implementing:
-- `result.rs` — `ToolResult` struct
-- `context.rs` — `ToolContext` with progress, cancellation token
-- `tool.rs` — builder pattern registration
-- `log.rs` — `ServerLogger`
-- `manager.rs` — `ToolManager` (enable/disable)
-- `transport.rs` — Unix socket + envelope framing
-- `runner.rs` — async main loop with tokio
-
-Each module mirrors the Go SDK's functionality. Implementation follows the API surface from the spec. Tests use `#[cfg(test)]` inline modules.
-
-Key differences from Go SDK:
-- Uses `tokio::net::UnixStream` instead of `net.Conn`
-- Uses `tokio_util::sync::CancellationToken` (from the `tokio-util` crate; add it to the `[dependencies]` in `Cargo.toml`) instead of `context.Context`
-- Builder pattern for tool registration instead of functional options
-- All handlers are `async`
-
-- [ ] **Step 1: Implement all modules**
-- [ ] **Step 2: Run tests**: `cd sdk/rust && cargo test`
-- [ ] **Step 3: Commit**
-
-```bash
-git add sdk/rust/src/
-git commit -m "feat(sdk/rust): implement full SDK (tool, result, context, transport, runner)"
-```
-
----
-
-## Chunk 4: CI/CD + Badges
-
-### Task 17: CI Pipeline
-
-**Files:**
-- Create: `.github/workflows/ci.yml`
-
-- [ ] **Step 1: Create CI workflow**
-
-```yaml
-name: CI
-
-on:
-  push:
-    branches: [master]
-  pull_request:
-    branches: [master]
-
-jobs:
-  go:
-    runs-on: ubuntu-latest
-    steps:
-      - uses: actions/checkout@v4
-      - uses: actions/setup-go@v5
-        with:
-          go-version: '1.25'
-      - run: go vet ./...
-      - run: go test ./...
-      - run: go build ./cmd/protomcp/
-
-  go-sdk:
-    runs-on: ubuntu-latest
-    steps:
-      - uses: actions/checkout@v4
-      - uses: actions/setup-go@v5
-        with:
-          go-version: '1.25'
-      - run: cd sdk/go && go test ./...
- - python-sdk: - runs-on: ubuntu-latest - strategy: - matrix: - python-version: ['3.10', '3.11', '3.12'] - steps: - - uses: actions/checkout@v4 - - uses: actions/setup-python@v5 - with: - python-version: ${{ matrix.python-version }} - - run: cd sdk/python && pip install -e ".[dev]" && python -m pytest - - typescript-sdk: - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v4 - - uses: actions/setup-node@v4 - with: - node-version: '20' - - run: cd sdk/typescript && npm ci && npx vitest run - - rust-sdk: - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v4 - - uses: dtolnay/rust-toolchain@stable - - run: cd sdk/rust && cargo test - - run: cd sdk/rust && cargo clippy -- -D warnings - - e2e: - runs-on: ubuntu-latest - needs: [go] - steps: - - uses: actions/checkout@v4 - - uses: actions/setup-go@v5 - with: - go-version: '1.25' - - uses: actions/setup-python@v5 - with: - python-version: '3.12' - - uses: actions/setup-node@v4 - with: - node-version: '20' - - run: go build -o pmcp ./cmd/protomcp/ - - run: cd sdk/python && pip install -e . 
- - run: cd sdk/typescript && npm ci - - run: go test ./test/e2e/ -v -``` - -- [ ] **Step 2: Commit** - -```bash -git add .github/workflows/ci.yml -git commit -m "ci: add GitHub Actions CI pipeline" -``` - ---- - -### Task 18: Release Pipeline - -**Files:** -- Create: `.github/workflows/release.yml` - -- [ ] **Step 1: Create release workflow** - -```yaml -name: Release - -on: - push: - tags: ['v*'] - -permissions: - contents: write - -jobs: - goreleaser: - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v4 - with: - fetch-depth: 0 - - uses: actions/setup-go@v5 - with: - go-version: '1.25' - - uses: goreleaser/goreleaser-action@v6 - with: - args: release --clean - env: - GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} - - pypi: - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v4 - - uses: actions/setup-python@v5 - with: - python-version: '3.12' - - run: pip install build twine - - run: cd sdk/python && python -m build - - run: cd sdk/python && twine upload dist/* - env: - TWINE_USERNAME: __token__ - TWINE_PASSWORD: ${{ secrets.PYPI_API_TOKEN }} - - npm: - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v4 - - uses: actions/setup-node@v4 - with: - node-version: '20' - registry-url: 'https://registry.npmjs.org' - - run: cd sdk/typescript && npm ci && npm publish - env: - NODE_AUTH_TOKEN: ${{ secrets.NPM_TOKEN }} - - crates: - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v4 - - uses: dtolnay/rust-toolchain@stable - - run: cd sdk/rust && cargo publish - env: - CARGO_REGISTRY_TOKEN: ${{ secrets.CARGO_REGISTRY_TOKEN }} - - homebrew: - runs-on: ubuntu-latest - needs: [goreleaser] - steps: - - uses: actions/checkout@v4 - with: - repository: protomcp/homebrew-tap - token: ${{ secrets.HOMEBREW_TAP_TOKEN }} - - name: Update formula - run: | - VERSION=${GITHUB_REF#refs/tags/v} - # GoReleaser generates checksums — update the formula with new version + SHA256 - sed -i "s/version \".*\"/version \"${VERSION}\"/" Formula/protomcp.rb - git 
add Formula/protomcp.rb - git commit -m "protomcp ${VERSION}" - git push -``` - -- [ ] **Step 2: Commit** - -```bash -git add .github/workflows/release.yml -git commit -m "ci: add release pipeline for Go binary, PyPI, npm, crates.io" -``` - ---- - -### Task 19: Fix README badges - -**Files:** -- Modify: `README.md` - -- [ ] **Step 1: Update badges** - -Replace the current badge block with: - -```markdown -[![CI](https://github.com/msilverblatt/protomcp/actions/workflows/ci.yml/badge.svg)](https://github.com/msilverblatt/protomcp/actions/workflows/ci.yml) -[![License: MIT](https://img.shields.io/badge/License-MIT-blue.svg)](LICENSE) -[![Go](https://img.shields.io/badge/Go-1.25+-00ADD8?logo=go)](https://go.dev) -[![PyPI](https://img.shields.io/pypi/v/protomcp)](https://pypi.org/project/protomcp/) -[![npm](https://img.shields.io/npm/v/protomcp)](https://www.npmjs.com/package/protomcp) -[![crates.io](https://img.shields.io/crates/v/protomcp)](https://crates.io/crates/protomcp) -``` - -Changes: renamed Build→CI to match workflow name, added crates.io badge, reordered. - -- [ ] **Step 2: Commit** - -```bash -git add README.md -git commit -m "docs: fix README badges to match CI workflow" -``` - ---- - -## Chunk 5: Examples + Documentation - -### Task 20: Go examples - -**Files:** -- Create: `examples/go/basic.go` -- Create: `examples/go/real_world.go` -- Create: `examples/go/full_showcase.go` - -- [ ] **Step 1: Create basic example** - -```go -// examples/go/basic.go -// A minimal protomcp tool — adds and multiplies numbers. 
-// Run: pmcp dev examples/go/basic.go -package main - -import ( - "fmt" - - "github.com/msilverblatt/protomcp/sdk/go/protomcp" -) - -func main() { - protomcp.Tool("add", - protomcp.Description("Add two numbers"), - protomcp.Args(protomcp.IntArg("a"), protomcp.IntArg("b")), - protomcp.Handler(func(ctx protomcp.ToolContext, args map[string]interface{}) protomcp.ToolResult { - a := int(args["a"].(float64)) - b := int(args["b"].(float64)) - return protomcp.Result(fmt.Sprintf("%d", a+b)) - }), - ) - - protomcp.Tool("multiply", - protomcp.Description("Multiply two numbers"), - protomcp.Args(protomcp.IntArg("a"), protomcp.IntArg("b")), - protomcp.Handler(func(ctx protomcp.ToolContext, args map[string]interface{}) protomcp.ToolResult { - a := int(args["a"].(float64)) - b := int(args["b"].(float64)) - return protomcp.Result(fmt.Sprintf("%d", a*b)) - }), - ) - - protomcp.Run() -} -``` - -- [ ] **Step 2: Create real_world and full_showcase examples** - -Follow the same patterns as the Python examples but in Go, adding progress reporting, cancellation, logging, dynamic tool lists, structured output, and metadata. - -- [ ] **Step 3: Verify examples parse**: `cd examples/go && go vet ./...` - -- [ ] **Step 4: Commit** - -```bash -git add examples/go/ -git commit -m "examples: add Go examples at 3 tiers" -``` - ---- - -### Task 21: Rust examples - -**Files:** -- Create: `examples/rust/basic/Cargo.toml` + `examples/rust/basic/src/main.rs` -- Create: `examples/rust/real_world/Cargo.toml` + `examples/rust/real_world/src/main.rs` -- Create: `examples/rust/full_showcase/Cargo.toml` + `examples/rust/full_showcase/src/main.rs` - -Each is a standalone Cargo project that depends on the `protomcp` crate via path dependency. 
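A minimal sketch of one such manifest — assuming the SDK crate lives at `sdk/rust` relative to the repo root; the package name and tokio features here are illustrative, not prescribed by the plan:

```toml
# examples/rust/basic/Cargo.toml (hypothetical sketch)
[package]
name = "protomcp-example-basic"
version = "0.1.0"
edition = "2021"

[dependencies]
# Path dependency on the in-repo SDK crate; a published example
# would use a registry version (e.g. protomcp = "0.1") instead.
protomcp = { path = "../../../sdk/rust" }
tokio = { version = "1", features = ["macros", "rt-multi-thread"] }
```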
- -- [ ] **Step 1: Create basic example** -- [ ] **Step 2: Create real_world and full_showcase** -- [ ] **Step 3: Verify**: `cd examples/rust/basic && cargo check` -- [ ] **Step 4: Commit** - -```bash -git add examples/rust/ -git commit -m "examples: add Rust examples at 3 tiers" -``` - ---- - -### Task 22: Documentation — new guide pages - -**Files:** -- Create: `docs/src/content/docs/guides/writing-tools-go.mdx` -- Create: `docs/src/content/docs/guides/writing-tools-rust.mdx` -- Create: `docs/src/content/docs/guides/middleware.mdx` -- Create: `docs/src/content/docs/guides/auth.mdx` -- Create: `docs/src/content/docs/guides/writing-a-language-library.mdx` - -Each guide follows the same structure as the existing Python/TypeScript guides: -1. Installation -2. Basic usage (decorator/builder pattern) -3. Type hints / schema definition -4. Optional parameters -5. Progress reporting -6. Cancellation -7. Logging -8. Error handling -9. Advanced features (middleware, dynamic tools) - -For the middleware and auth guides, focus on configuration and usage patterns with examples in all four languages. - -The "Writing a Language Library" guide covers: -1. The protobuf contract (envelope format, message types) -2. Unix socket connection -3. Length-prefixed framing -4. Handshake protocol (ListToolsRequest → ToolListResponse → optional middleware → ReloadResponse) -5. Tool call dispatch -6. Reload handling -7. 
Testing against the Go binary - -- [ ] **Step 1: Write all five guide pages** -- [ ] **Step 2: Verify docs build**: `cd docs && npm run build` -- [ ] **Step 3: Commit** - -```bash -git add docs/src/content/docs/guides/ -git commit -m "docs: add Go, Rust, middleware, auth, and language library guides" -``` - ---- - -### Task 23: Documentation — update existing pages - -**Files:** -- Modify: `docs/src/content/docs/index.mdx` -- Modify: `docs/src/content/docs/getting-started/quick-start.mdx` -- Modify: `docs/src/content/docs/getting-started/installation.mdx` -- Modify: `docs/src/content/docs/reference/cli.mdx` - -- [ ] **Step 1: Update index.mdx** - -Add Go and Rust cards to the CardGrid. - -- [ ] **Step 2: Update quick-start.mdx** - -Add Go and Rust quick start snippets (install SDK, write tool file, run). - -- [ ] **Step 3: Update installation.mdx** - -Add Go SDK install (`go get github.com/msilverblatt/protomcp/sdk/go`) and Rust SDK install (`cargo add protomcp`). - -- [ ] **Step 4: Update cli.mdx** - -Add `validate` subcommand docs and `--auth` flag docs. 
-
-- [ ] **Step 5: Verify docs build**: `cd docs && npm run build`
-
-- [ ] **Step 6: Commit**
-
-```bash
-git add docs/src/content/docs/
-git commit -m "docs: update index, quick-start, installation, and CLI reference for v1.1"
-```
-
----
-
-### Task 24: Update README
-
-**Files:**
-- Modify: `README.md`
-
-- [ ] **Step 1: Add Go and Rust quick start examples**
-
-After the TypeScript example, add Go and Rust sections:
-
-````markdown
-### Go
-
-```go
-// tools.go
-package main
-
-import (
-	"fmt"
-	"github.com/msilverblatt/protomcp/sdk/go/protomcp"
-)
-
-func main() {
-	protomcp.Tool("add",
-		protomcp.Description("Add two numbers"),
-		protomcp.Args(protomcp.IntArg("a"), protomcp.IntArg("b")),
-		protomcp.Handler(func(ctx protomcp.ToolContext, args map[string]interface{}) protomcp.ToolResult {
-			a := int(args["a"].(float64))
-			b := int(args["b"].(float64))
-			return protomcp.Result(fmt.Sprintf("%d", a+b))
-		}),
-	)
-	protomcp.Run()
-}
-```
-
-```sh
-pmcp dev tools.go
-```
-
-### Rust
-
-```rust
-// src/main.rs
-use protomcp::{tool, ToolResult};
-
-#[tokio::main]
-async fn main() {
-    tool("add")
-        .description("Add two numbers")
-        .arg::<i64>("a")
-        .arg::<i64>("b")
-        .handler(|_ctx, args| {
-            let a = args["a"].as_i64().unwrap_or(0);
-            let b = args["b"].as_i64().unwrap_or(0);
-            ToolResult::new(format!("{}", a + b))
-        })
-        .register();
-
-    protomcp::run().await;
-}
-```
-
-```sh
-pmcp dev src/main.rs
-```
-````
-
-- [ ] **Step 2: Update features list**
-
-Add after "Tool Metadata":
-
-```markdown
-- **Middleware** — intercept tool calls before/after with custom logic
-- **Auth** — built-in token and API key authentication for network transports
-- **Validation** — `pmcp validate` checks tool definitions before deployment
-```
-
-- [ ] **Step 3: Update comparison table**
-
-Add middleware and validation rows. Update language support to mention Go/Rust explicitly.
-
-- [ ] **Step 4: Verify README renders**
-
-Visually inspect or use a markdown previewer.
- -- [ ] **Step 5: Commit** - -```bash -git add README.md -git commit -m "docs: update README with Go/Rust examples, middleware, validation" -``` - ---- - -### Task 25: Update sidebar config - -**Files:** -- Modify: `docs/astro.config.mjs` - -- [ ] **Step 1: Add new guide pages to sidebar** - -Add entries for the new guides (writing-tools-go, writing-tools-rust, middleware, auth, writing-a-language-library) in the sidebar configuration. - -- [ ] **Step 2: Verify docs build**: `cd docs && npm run build` - -- [ ] **Step 3: Commit** - -```bash -git add docs/astro.config.mjs -git commit -m "docs: add v1.1 guide pages to sidebar" -``` - ---- - -### Task 26: Final verification - -- [ ] **Step 1: Run all tests** - -```bash -go test ./... -cd sdk/go && go test ./... -cd ../rust && cargo test -cd ../../sdk/python && python -m pytest -cd ../typescript && npx vitest run -``` - -- [ ] **Step 2: Build binary** - -Run: `go build -o pmcp ./cmd/protomcp/` - -- [ ] **Step 3: Build docs** - -Run: `cd docs && npm run build` - -- [ ] **Step 4: Verify README badges will resolve** - -Check that `.github/workflows/ci.yml` has `name: CI` matching the badge URL. - -- [ ] **Step 5: Final commit if any cleanup needed** - -```bash -git add -A -git commit -m "chore: v1.1 final cleanup" -``` diff --git a/docs/superpowers/plans/2026-03-12-protomcp-v1.md b/docs/superpowers/plans/2026-03-12-protomcp-v1.md deleted file mode 100644 index d6d5604..0000000 --- a/docs/superpowers/plans/2026-03-12-protomcp-v1.md +++ /dev/null @@ -1,4992 +0,0 @@ -# protomcp v1.0 Implementation Plan - -> **For agentic workers:** REQUIRED: Use superpowers:subagent-driven-development (if subagents available) or superpowers:executing-plans to implement this plan. Steps use checkbox (`- [ ]`) syntax for tracking. 
- -**Goal:** Build a language-agnostic MCP runtime — a Go binary that proxies MCP protocol to tool processes in any language via protobuf over unix socket, with hot-reload, dynamic tool list management, progress notifications, async tasks, cancellation, server logging, structured output, and tool metadata. - -**Architecture:** A precompiled Go binary handles all MCP transport/protocol. It communicates with a spawned tool process over a unix socket using length-prefixed protobuf envelopes. First-class Python and TypeScript SDKs provide decorator APIs. The binary proxies progress, cancellation, logging, and async task lifecycle. Starlight documentation site. - -**Tech Stack:** Go 1.22+, Protocol Buffers 3, Python 3.10+ (with protobuf, inspect), TypeScript 5+ (with Zod, protobuf-ts), Astro Starlight, fsnotify (Go file watching) - -**Spec:** `docs/superpowers/specs/2026-03-12-protomcp-design.md` - ---- - -## File Structure - -``` -protomcp/ -├── proto/ -│ └── protomcp.proto # Single source of truth for internal protocol -├── cmd/ -│ └── protomcp/ -│ └── main.go # CLI entry point (dev, run commands) -├── internal/ -│ ├── envelope/ -│ │ ├── envelope.go # Length-prefixed protobuf read/write -│ │ └── envelope_test.go -│ ├── toollist/ -│ │ ├── manager.go # Tool list state machine (open/allow/block) -│ │ └── manager_test.go -│ ├── process/ -│ │ ├── manager.go # Tool process spawn, handshake, crash recovery -│ │ └── manager_test.go -│ ├── reload/ -│ │ ├── watcher.go # File watcher + reload orchestration -│ │ └── watcher_test.go -│ ├── mcp/ -│ │ ├── types.go # MCP JSON-RPC types (requests, responses, notifications) -│ │ ├── handler.go # MCP request handler (tools/list, tools/call dispatch) -│ │ └── handler_test.go -│ ├── transport/ -│ │ ├── transport.go # Transport interface -│ │ ├── stdio.go # stdio transport -│ │ ├── stdio_test.go -│ │ ├── http.go # Streamable HTTP transport -│ │ ├── http_test.go -│ │ ├── sse.go # SSE transport -│ │ ├── sse_test.go -│ │ ├── grpc.go # gRPC 
transport -│ │ ├── grpc_test.go -│ │ ├── ws.go # WebSocket transport -│ │ └── ws_test.go -│ ├── middleware/ -│ │ ├── chain.go # Middleware interceptor chain -│ │ ├── logging.go # Structured logging middleware -│ │ └── errors.go # Error formatting middleware -│ ├── progress/ -│ │ ├── progress.go # Progress notification proxy -│ │ └── progress_test.go -│ ├── tasks/ -│ │ ├── manager.go # Async task lifecycle manager -│ │ └── manager_test.go -│ ├── cancel/ -│ │ ├── tracker.go # Cancellation tracking for in-flight calls -│ │ └── tracker_test.go -│ ├── serverlog/ -│ │ ├── forwarder.go # Server log forwarding to MCP notifications/message -│ │ └── forwarder_test.go -│ └── config/ -│ └── config.go # CLI flag parsing and config struct -├── gen/ -│ └── proto/ -│ └── protomcp/ -│ ├── protomcp.pb.go # Generated Go protobuf types -│ └── protomcp_grpc.pb.go # Generated gRPC service (for external gRPC transport) -├── go.mod -├── go.sum -├── sdk/ -│ ├── python/ -│ │ ├── pyproject.toml -│ │ ├── src/ -│ │ │ └── protomcp/ -│ │ │ ├── __init__.py # Public API exports -│ │ │ ├── tool.py # @tool decorator + schema generation -│ │ │ ├── result.py # ToolResult type -│ │ │ ├── manager.py # tool_manager client -│ │ │ ├── context.py # ToolContext (progress, cancellation) -│ │ │ ├── log.py # Server logging API -│ │ │ ├── transport.py # Unix socket + envelope framing -│ │ │ └── runner.py # Main loop: connect, listen, reload, dispatch -│ │ ├── tests/ -│ │ │ ├── test_tool.py -│ │ │ ├── test_result.py -│ │ │ ├── test_manager.py -│ │ │ ├── test_transport.py -│ │ │ └── test_integration.py # End-to-end with Go binary -│ │ └── gen/ -│ │ └── protomcp_pb2.py # Generated Python protobuf types -│ └── typescript/ -│ ├── package.json -│ ├── tsconfig.json -│ ├── vitest.config.ts -│ ├── src/ -│ │ ├── index.ts # Public API exports -│ │ ├── tool.ts # tool() function + Zod schema generation -│ │ ├── result.ts # ToolResult type -│ │ ├── manager.ts # tool_manager client -│ │ ├── context.ts # ToolContext (progress, 
cancellation) -│ │ ├── log.ts # Server logging API -│ │ ├── transport.ts # Unix socket + envelope framing -│ │ └── runner.ts # Main loop -│ ├── tests/ -│ │ ├── tool.test.ts -│ │ ├── result.test.ts -│ │ ├── manager.test.ts -│ │ ├── transport.test.ts -│ │ └── integration.test.ts # End-to-end with Go binary -│ └── gen/ -│ └── protomcp.ts # Generated TS protobuf types -├── test/ -│ ├── e2e/ -│ │ ├── e2e_test.go # Full pipeline: Go binary + Python tool + MCP client -│ │ ├── fixtures/ -│ │ │ ├── simple_tool.py # Basic Python tool for testing -│ │ │ ├── dynamic_tool.py # Tool with enable/disable mutations -│ │ │ ├── simple_tool.ts # Basic TS tool for testing -│ │ │ ├── crash_tool.py # Tool that crashes (for recovery testing) -│ │ │ ├── progress_tool.py # Tool that reports progress -│ │ │ ├── async_tool.py # Tool with task_support for async testing -│ │ │ ├── logging_tool.py # Tool that emits server logs -│ │ │ └── structured_output_tool.py # Tool with output_type for structured output -│ │ └── helpers.go # Test helpers (start binary, MCP client mock) -│ └── proto/ -│ └── proto_test.go # Validate proto generates correctly for all languages -├── docs/ -│ ├── astro.config.mjs -│ ├── package.json -│ └── src/ -│ └── content/ -│ └── docs/ -│ ├── index.mdx -│ ├── getting-started/ -│ │ ├── installation.mdx -│ │ ├── quick-start.mdx -│ │ └── how-it-works.mdx -│ ├── guides/ -│ │ ├── writing-tools-python.mdx -│ │ ├── writing-tools-typescript.mdx -│ │ ├── dynamic-tool-lists.mdx -│ │ ├── hot-reload.mdx -│ │ ├── progress-notifications.mdx -│ │ ├── async-tasks.mdx -│ │ ├── cancellation.mdx -│ │ ├── server-logging.mdx -│ │ ├── structured-output.mdx -│ │ ├── error-handling.mdx -│ │ └── production-deployment.mdx -│ ├── reference/ -│ │ ├── cli.mdx -│ │ ├── protobuf-spec.mdx -│ │ ├── python-api.mdx -│ │ └── typescript-api.mdx -│ └── concepts/ -│ ├── architecture.mdx -│ ├── tool-list-modes.mdx -│ └── transports.mdx -├── Makefile # proto-gen, build, test, docs commands -└── .goreleaser.yml # 
Cross-platform binary releases -``` - ---- - -## Chunk 1: Foundation — Project Setup, Protobuf, Envelope, Tool List Manager - -### Task 1: Project Initialization - -**Files:** -- Create: `go.mod` -- Create: `Makefile` -- Create: `.gitignore` -- Create: `.goreleaser.yml` - -- [ ] **Step 1: Initialize Go module** - -```bash -cd /Users/msilverblatt/hotmcp -go mod init github.com/msilverblatt/protomcp -``` - -- [ ] **Step 2: Create Makefile** - -Create `Makefile` with targets: -```makefile -.PHONY: proto build test clean - -PROTO_DIR := proto -GEN_DIR := gen/proto/protomcp -PYTHON_GEN_DIR := sdk/python/gen -TS_GEN_DIR := sdk/typescript/gen - -proto: - mkdir -p $(GEN_DIR) $(PYTHON_GEN_DIR) $(TS_GEN_DIR) - protoc --go_out=$(GEN_DIR) --go_opt=paths=source_relative \ - --go-grpc_out=$(GEN_DIR) --go-grpc_opt=paths=source_relative \ - -I$(PROTO_DIR) $(PROTO_DIR)/protomcp.proto - protoc --python_out=$(PYTHON_GEN_DIR) \ - -I$(PROTO_DIR) $(PROTO_DIR)/protomcp.proto - protoc --plugin=protoc-gen-ts=$$(which protoc-gen-ts) \ - --ts_out=$(TS_GEN_DIR) \ - -I$(PROTO_DIR) $(PROTO_DIR)/protomcp.proto - -build: - go build -o bin/protomcp ./cmd/protomcp - -test: - go test ./... 
- -test-python: - cd sdk/python && python -m pytest tests/ -v - -test-ts: - cd sdk/typescript && npx vitest run - -test-all: test test-python test-ts - -clean: - rm -rf bin/ gen/ -``` - -- [ ] **Step 3: Create .gitignore** - -``` -bin/ -gen/ -dist/ -node_modules/ -__pycache__/ -*.egg-info/ -.venv/ -*.pb.go -*_pb2.py -``` - -- [ ] **Step 4: Create .goreleaser.yml** - -```yaml -version: 2 -builds: - - main: ./cmd/protomcp - binary: protomcp - goos: - - linux - - darwin - - windows - goarch: - - amd64 - - arm64 - env: - - CGO_ENABLED=0 - -archives: - - format: tar.gz - name_template: "protomcp_{{ .Os }}_{{ .Arch }}" - -brews: - - repository: - owner: msilverblatt - name: homebrew-tap - homepage: "https://github.com/msilverblatt/protomcp" - description: "Language-agnostic MCP runtime" -``` - -- [ ] **Step 5: Commit** - -```bash -git add go.mod Makefile .gitignore .goreleaser.yml -git commit -m "feat: initialize project with Go module, Makefile, and release config" -``` - ---- - -### Task 2: Protobuf Spec - -**Files:** -- Create: `proto/protomcp.proto` - -- [ ] **Step 1: Write the protobuf spec** - -Create `proto/protomcp.proto` — this is the single source of truth for the internal protocol between the Go binary and tool processes: - -```protobuf -syntax = "proto3"; - -package protomcp; - -option go_package = "github.com/msilverblatt/protomcp/gen/proto/protomcp"; - -// Envelope wraps all messages with length-prefixed framing. -// Wire format: 4-byte big-endian uint32 length prefix, then serialized Envelope. 
-message Envelope { - oneof msg { - // Go -> Tool Process - ReloadRequest reload = 1; - ListToolsRequest list_tools = 2; - CallToolRequest call_tool = 3; - - // Tool Process -> Go - ReloadResponse reload_response = 4; - ToolListResponse tool_list = 5; - CallToolResponse call_result = 6; - EnableToolsRequest enable_tools = 7; - DisableToolsRequest disable_tools = 8; - SetAllowedRequest set_allowed = 9; - SetBlockedRequest set_blocked = 10; - GetActiveToolsRequest get_active_tools = 11; - BatchUpdateRequest batch = 12; - ActiveToolsResponse active_tools = 13; - - // Progress, cancellation, logging, tasks - ProgressNotification progress = 16; - CancelRequest cancel = 17; - LogMessage log = 18; - CreateTaskResponse create_task = 19; - TaskStatusRequest task_status = 20; - TaskStatusResponse task_status_response = 21; - TaskResultRequest task_result = 22; - TaskCancelRequest task_cancel = 23; - } - // Correlation ID for matching requests to responses. - // Required for CallToolRequest/CallToolResponse to support concurrent calls. - // Optional for other message types. - string request_id = 14; - // Namespace for future multi-process support. Ignored in v1. 
- string namespace = 15; -} - -// --- Go -> Tool Process --- - -message ReloadRequest {} - -message ListToolsRequest {} - -message CallToolRequest { - string name = 1; - // JSON-encoded arguments from the MCP client - string arguments_json = 2; - // Progress token from client's _meta.progressToken (empty if none) - string progress_token = 3; -} - -// --- Tool Process -> Go --- - -message ReloadResponse { - bool success = 1; - string error = 2; // Non-empty on failure (e.g., syntax error, import error) -} - -message ToolListResponse { - repeated ToolDefinition tools = 1; -} - -message ToolDefinition { - string name = 1; - string description = 2; - // JSON Schema for the tool's input parameters - string input_schema_json = 3; - // JSON Schema for the tool's output (empty if unstructured) - string output_schema_json = 4; - // Tool metadata/annotations - string title = 5; - bool read_only_hint = 6; - bool destructive_hint = 7; - bool idempotent_hint = 8; - bool open_world_hint = 9; - bool task_support = 10; // Advertises async task capability -} - -message CallToolResponse { - bool is_error = 1; - // JSON-encoded result content (MCP content array) - string result_json = 2; - // Optional tool list mutations — Go binary intercepts these before proxying to host - repeated string enable_tools = 3; - repeated string disable_tools = 4; - // Structured error details (if is_error is true) - ToolError error = 5; - // Structured output (JSON, validated against outputSchema) - string structured_content_json = 6; -} - -message ToolError { - string error_code = 1; - string message = 2; - string suggestion = 3; - bool retryable = 4; -} - -// --- Tool List Control (Tool Process -> Go) --- - -message EnableToolsRequest { - repeated string tool_names = 1; -} - -message DisableToolsRequest { - repeated string tool_names = 1; -} - -message SetAllowedRequest { - repeated string tool_names = 1; -} - -message SetBlockedRequest { - repeated string tool_names = 1; -} - -message 
GetActiveToolsRequest {} - -message BatchUpdateRequest { - repeated string enable = 1; - repeated string disable = 2; - repeated string allow = 3; // Set allowed list (mutually exclusive with block) - repeated string block = 4; // Set blocked list (mutually exclusive with allow) -} - -message ActiveToolsResponse { - repeated string tool_names = 1; -} - -// --- Progress, Cancellation, Logging --- - -message ProgressNotification { - string progress_token = 1; // Token from CallToolRequest - int64 progress = 2; // Current progress value - int64 total = 3; // Total expected (0 = indeterminate) - string message = 4; // Human-readable status -} - -message CancelRequest { - string request_id = 1; // ID of the call to cancel -} - -message LogMessage { - string level = 1; // RFC 5424: emergency, alert, critical, error, warning, notice, info, debug - string logger = 2; // Source component (optional) - string data_json = 3; // JSON-encoded log data -} - -// --- Task (Async) Lifecycle --- - -message CreateTaskResponse { - string task_id = 1; -} - -message TaskStatusRequest { - string task_id = 1; -} - -message TaskStatusResponse { - string task_id = 1; - string state = 2; // running, completed, failed, cancelled - int64 progress = 3; // Optional progress - int64 total = 4; // Optional total - string message = 5; // Optional status message -} - -message TaskResultRequest { - string task_id = 1; -} - -message TaskCancelRequest { - string task_id = 1; -} -``` - -- [ ] **Step 2: Generate Go code from proto** - -```bash -make proto -``` - -Verify: `gen/proto/protomcp/protomcp.pb.go` exists and compiles. 
- -- [ ] **Step 3: Commit** - -```bash -git add proto/protomcp.proto -git commit -m "feat: add protobuf spec defining internal protocol between Go binary and tool processes" -``` - ---- - -### Task 3: Envelope — Length-Prefixed Protobuf Read/Write - -**Files:** -- Create: `internal/envelope/envelope.go` -- Create: `internal/envelope/envelope_test.go` - -- [ ] **Step 1: Write failing tests for envelope** - -Create `internal/envelope/envelope_test.go`: - -```go -package envelope_test - -import ( - "bytes" - "testing" - - "github.com/msilverblatt/protomcp/internal/envelope" - pb "github.com/msilverblatt/protomcp/gen/proto/protomcp" -) - -func TestWriteAndReadEnvelope(t *testing.T) { - // Create a test envelope with a ListToolsRequest - env := &pb.Envelope{ - Msg: &pb.Envelope_ListTools{ - ListTools: &pb.ListToolsRequest{}, - }, - RequestId: "test-123", - } - - var buf bytes.Buffer - err := envelope.Write(&buf, env) - if err != nil { - t.Fatalf("Write failed: %v", err) - } - - got, err := envelope.Read(&buf) - if err != nil { - t.Fatalf("Read failed: %v", err) - } - - if got.RequestId != "test-123" { - t.Errorf("RequestId = %q, want %q", got.RequestId, "test-123") - } - - if got.GetListTools() == nil { - t.Error("expected ListToolsRequest, got nil") - } -} - -func TestWriteAndReadCallTool(t *testing.T) { - env := &pb.Envelope{ - Msg: &pb.Envelope_CallTool{ - CallTool: &pb.CallToolRequest{ - Name: "search", - ArgumentsJson: `{"query": "hello"}`, - }, - }, - RequestId: "call-456", - } - - var buf bytes.Buffer - err := envelope.Write(&buf, env) - if err != nil { - t.Fatalf("Write failed: %v", err) - } - - got, err := envelope.Read(&buf) - if err != nil { - t.Fatalf("Read failed: %v", err) - } - - ct := got.GetCallTool() - if ct == nil { - t.Fatal("expected CallToolRequest, got nil") - } - if ct.Name != "search" { - t.Errorf("Name = %q, want %q", ct.Name, "search") - } - if ct.ArgumentsJson != `{"query": "hello"}` { - t.Errorf("ArgumentsJson = %q, want %q", 
ct.ArgumentsJson, `{"query": "hello"}`) - } -} - -func TestReadEmptyBuffer(t *testing.T) { - var buf bytes.Buffer - _, err := envelope.Read(&buf) - if err == nil { - t.Error("expected error reading empty buffer, got nil") - } -} - -func TestMultipleEnvelopes(t *testing.T) { - var buf bytes.Buffer - - envs := []*pb.Envelope{ - {Msg: &pb.Envelope_ListTools{ListTools: &pb.ListToolsRequest{}}, RequestId: "1"}, - {Msg: &pb.Envelope_Reload{Reload: &pb.ReloadRequest{}}, RequestId: "2"}, - {Msg: &pb.Envelope_ListTools{ListTools: &pb.ListToolsRequest{}}, RequestId: "3"}, - } - - for _, env := range envs { - if err := envelope.Write(&buf, env); err != nil { - t.Fatalf("Write failed: %v", err) - } - } - - for i, want := range envs { - got, err := envelope.Read(&buf) - if err != nil { - t.Fatalf("Read %d failed: %v", i, err) - } - if got.RequestId != want.RequestId { - t.Errorf("envelope %d: RequestId = %q, want %q", i, got.RequestId, want.RequestId) - } - } -} -``` - -- [ ] **Step 2: Run tests to verify they fail** - -```bash -go test ./internal/envelope/... -v -``` - -Expected: compilation error — package `envelope` doesn't exist. - -- [ ] **Step 3: Implement envelope** - -Create `internal/envelope/envelope.go`: - -```go -package envelope - -import ( - "encoding/binary" - "fmt" - "io" - - pb "github.com/msilverblatt/protomcp/gen/proto/protomcp" - "google.golang.org/protobuf/proto" -) - -const maxMessageSize = 10 * 1024 * 1024 // 10MB - -// Write serializes an Envelope and writes it with a 4-byte big-endian length prefix. 
-func Write(w io.Writer, env *pb.Envelope) error { - data, err := proto.Marshal(env) - if err != nil { - return fmt.Errorf("marshal envelope: %w", err) - } - - length := uint32(len(data)) - if err := binary.Write(w, binary.BigEndian, length); err != nil { - return fmt.Errorf("write length prefix: %w", err) - } - - if _, err := w.Write(data); err != nil { - return fmt.Errorf("write envelope data: %w", err) - } - - return nil -} - -// Read reads a length-prefixed Envelope from the reader. -func Read(r io.Reader) (*pb.Envelope, error) { - var length uint32 - if err := binary.Read(r, binary.BigEndian, &length); err != nil { - return nil, fmt.Errorf("read length prefix: %w", err) - } - - if length > maxMessageSize { - return nil, fmt.Errorf("message size %d exceeds max %d", length, maxMessageSize) - } - - data := make([]byte, length) - if _, err := io.ReadFull(r, data); err != nil { - return nil, fmt.Errorf("read envelope data: %w", err) - } - - env := &pb.Envelope{} - if err := proto.Unmarshal(data, env); err != nil { - return nil, fmt.Errorf("unmarshal envelope: %w", err) - } - - return env, nil -} -``` - -- [ ] **Step 4: Run tests to verify they pass** - -```bash -go test ./internal/envelope/... -v -``` - -Expected: all 4 tests PASS. 
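The proto spec's `request_id` field exists so concurrent `CallToolRequest`/`CallToolResponse` pairs can share one socket. The correlation pattern the Go side will need can be sketched separately from the envelope layer — plain structs stand in for the generated protobuf types here, and none of these names are the real internal API:

```go
package main

import (
	"fmt"
	"sync"
)

// response is a stand-in for *pb.Envelope carrying a CallToolResponse.
type response struct {
	RequestID string
	Result    string
}

// dispatcher routes responses read off the socket back to the goroutine
// that issued the matching request, keyed by request_id.
type dispatcher struct {
	mu      sync.Mutex
	pending map[string]chan response
}

func newDispatcher() *dispatcher {
	return &dispatcher{pending: make(map[string]chan response)}
}

// register reserves a buffered channel for a request_id before the
// request is written, so the response can never be missed.
func (d *dispatcher) register(id string) chan response {
	ch := make(chan response, 1)
	d.mu.Lock()
	d.pending[id] = ch
	d.mu.Unlock()
	return ch
}

// deliver hands an incoming response to its waiter; unmatched
// responses are dropped rather than blocking the read loop.
func (d *dispatcher) deliver(r response) {
	d.mu.Lock()
	ch, ok := d.pending[r.RequestID]
	delete(d.pending, r.RequestID)
	d.mu.Unlock()
	if ok {
		ch <- r
	}
}

func main() {
	d := newDispatcher()
	c1 := d.register("call-1")
	c2 := d.register("call-2")
	// Responses may arrive out of order; correlation still works.
	d.deliver(response{RequestID: "call-2", Result: "7"})
	d.deliver(response{RequestID: "call-1", Result: "3"})
	fmt.Println((<-c1).Result, (<-c2).Result) // 3 7
}
```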
- -- [ ] **Step 5: Commit** - -```bash -git add internal/envelope/ -git commit -m "feat: implement length-prefixed protobuf envelope read/write" -``` - ---- - -### Task 4: Tool List Manager — State Machine - -**Files:** -- Create: `internal/toollist/manager.go` -- Create: `internal/toollist/manager_test.go` - -- [ ] **Step 1: Write failing tests for tool list manager** - -Create `internal/toollist/manager_test.go`: - -```go -package toollist_test - -import ( - "testing" - - "github.com/msilverblatt/protomcp/internal/toollist" -) - -func TestOpenMode_AllToolsActive(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c"}) - - got := m.Active() - want := []string{"a", "b", "c"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestOpenMode_DisableTool(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c"}) - - changed := m.Disable([]string{"b"}) - if !changed { - t.Error("Disable should report change") - } - - got := m.Active() - want := []string{"a", "c"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestOpenMode_EnableReAdds(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c"}) - m.Disable([]string{"b"}) - - changed := m.Enable([]string{"b"}) - if !changed { - t.Error("Enable should report change") - } - - got := m.Active() - want := []string{"a", "b", "c"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestAllowlistMode(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c", "d"}) - - changed := m.SetAllowed([]string{"a", "c"}) - if !changed { - t.Error("SetAllowed should report change") - } - - got := m.Active() - want := []string{"a", "c"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestAllowlistMode_EnableAddsToAllowlist(t *testing.T) { - m := toollist.New() - 
m.SetRegistered([]string{"a", "b", "c"}) - m.SetAllowed([]string{"a"}) - - m.Enable([]string{"b"}) - - got := m.Active() - want := []string{"a", "b"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestAllowlistMode_DisableRemovesFromAllowlist(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c"}) - m.SetAllowed([]string{"a", "b"}) - - m.Disable([]string{"a"}) - - got := m.Active() - want := []string{"b"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestBlocklistMode(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c", "d"}) - - changed := m.SetBlocked([]string{"b", "d"}) - if !changed { - t.Error("SetBlocked should report change") - } - - got := m.Active() - want := []string{"a", "c"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestBlocklistMode_DisableAddsToBlocklist(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c"}) - m.SetBlocked([]string{"c"}) - - m.Disable([]string{"a"}) - - got := m.Active() - want := []string{"b"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestBlocklistMode_EnableRemovesFromBlocklist(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c"}) - m.SetBlocked([]string{"b", "c"}) - - m.Enable([]string{"c"}) - - got := m.Active() - want := []string{"a", "c"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestSetAllowedSwitchesFromBlocklist(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c"}) - m.SetBlocked([]string{"c"}) - m.SetAllowed([]string{"a"}) - - got := m.Active() - want := []string{"a"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestEmptyAllowlistResetsToOpen(t *testing.T) { - m := toollist.New() - 
m.SetRegistered([]string{"a", "b", "c"}) - m.SetAllowed([]string{"a"}) - m.SetAllowed([]string{}) - - got := m.Active() - want := []string{"a", "b", "c"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestEmptyBlocklistResetsToOpen(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c"}) - m.SetBlocked([]string{"a"}) - m.SetBlocked([]string{}) - - got := m.Active() - want := []string{"a", "b", "c"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestBatch_EnableAndDisable(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c"}) - m.Disable([]string{"a", "b"}) - - changed, err := m.Batch([]string{"a"}, []string{"c"}, nil, nil) - if err != nil { - t.Fatalf("Batch failed: %v", err) - } - if !changed { - t.Error("Batch should report change") - } - - got := m.Active() - want := []string{"a"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestBatch_AllowAndBlockRejects(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c"}) - - _, err := m.Batch(nil, nil, []string{"a"}, []string{"b"}) - if err == nil { - t.Error("Batch with both allow and block should return error") - } -} - -func TestBatch_AllowThenEnableDelta(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c"}) - - // Set allow to ["a"], then enable "b" — should result in ["a", "b"] - changed, err := m.Batch([]string{"b"}, nil, []string{"a"}, nil) - if err != nil { - t.Fatalf("Batch failed: %v", err) - } - if !changed { - t.Error("Batch should report change") - } - - got := m.Active() - want := []string{"a", "b"} - if !slicesEqual(got, want) { - t.Errorf("Active() = %v, want %v", got, want) - } -} - -func TestNoChangeReturnsFalse(t *testing.T) { - m := toollist.New() - m.SetRegistered([]string{"a", "b", "c"}) - - changed := m.Enable([]string{"a"}) // already active - if changed { - 
t.Error("Enable of already-active tool should return false") - } -} - -func slicesEqual(a, b []string) bool { - if len(a) != len(b) { - return false - } - m := make(map[string]bool, len(a)) - for _, v := range a { - m[v] = true - } - for _, v := range b { - if !m[v] { - return false - } - } - return true -} -``` - -- [ ] **Step 2: Run tests to verify they fail** - -```bash -go test ./internal/toollist/... -v -``` - -Expected: compilation error — package `toollist` doesn't exist. - -- [ ] **Step 3: Implement tool list manager** - -Create `internal/toollist/manager.go`: - -```go -package toollist - -import ( - "fmt" - "sort" - "sync" -) - -type mode int - -const ( - modeOpen mode = iota - modeAllowlist - modeBlocklist -) - -// Manager tracks which tools are active using open/allowlist/blocklist modes. -// All methods are safe for concurrent use. -type Manager struct { - mu sync.RWMutex - registered map[string]bool // all tools the tool process has registered - current mode - set map[string]bool // allowlist entries, blocklist entries, or disabled set (open mode) -} - -func New() *Manager { - return &Manager{ - registered: make(map[string]bool), - current: modeOpen, - set: make(map[string]bool), - } -} - -// SetRegistered updates the full set of registered tools (called after reload). -func (m *Manager) SetRegistered(tools []string) { - m.mu.Lock() - defer m.mu.Unlock() - m.registered = make(map[string]bool, len(tools)) - for _, t := range tools { - m.registered[t] = true - } -} - -// Active returns the currently active tool names. 
-func (m *Manager) Active() []string { - m.mu.RLock() - defer m.mu.RUnlock() - return m.activeLocked() -} - -func (m *Manager) activeLocked() []string { - var result []string - switch m.current { - case modeOpen: - for t := range m.registered { - if !m.set[t] { // set contains disabled tools in open mode - result = append(result, t) - } - } - case modeAllowlist: - for t := range m.set { - if m.registered[t] { - result = append(result, t) - } - } - case modeBlocklist: - for t := range m.registered { - if !m.set[t] { - result = append(result, t) - } - } - } - sort.Strings(result) - return result -} - -// Enable adds tools. Behavior depends on mode: -// Open: re-enables disabled tools. Allowlist: adds to allowlist. Blocklist: removes from blocklist. -func (m *Manager) Enable(tools []string) bool { - m.mu.Lock() - defer m.mu.Unlock() - before := m.activeLocked() - - switch m.current { - case modeOpen: - for _, t := range tools { - delete(m.set, t) - } - case modeAllowlist: - for _, t := range tools { - m.set[t] = true - } - case modeBlocklist: - for _, t := range tools { - delete(m.set, t) - } - } - - after := m.activeLocked() - return !slicesEqual(before, after) -} - -// Disable removes tools. Behavior depends on mode: -// Open: disables tools. Allowlist: removes from allowlist. Blocklist: adds to blocklist. -func (m *Manager) Disable(tools []string) bool { - m.mu.Lock() - defer m.mu.Unlock() - before := m.activeLocked() - - switch m.current { - case modeOpen: - for _, t := range tools { - m.set[t] = true - } - case modeAllowlist: - for _, t := range tools { - delete(m.set, t) - } - case modeBlocklist: - for _, t := range tools { - m.set[t] = true - } - } - - after := m.activeLocked() - return !slicesEqual(before, after) -} - -// SetAllowed switches to allowlist mode. Empty list resets to open mode. 
-func (m *Manager) SetAllowed(tools []string) bool { - m.mu.Lock() - defer m.mu.Unlock() - before := m.activeLocked() - - if len(tools) == 0 { - m.current = modeOpen - m.set = make(map[string]bool) - } else { - m.current = modeAllowlist - m.set = make(map[string]bool, len(tools)) - for _, t := range tools { - m.set[t] = true - } - } - - after := m.activeLocked() - return !slicesEqual(before, after) -} - -// SetBlocked switches to blocklist mode. Empty list resets to open mode. -func (m *Manager) SetBlocked(tools []string) bool { - m.mu.Lock() - defer m.mu.Unlock() - before := m.activeLocked() - - if len(tools) == 0 { - m.current = modeOpen - m.set = make(map[string]bool) - } else { - m.current = modeBlocklist - m.set = make(map[string]bool, len(tools)) - for _, t := range tools { - m.set[t] = true - } - } - - after := m.activeLocked() - return !slicesEqual(before, after) -} - -// Batch applies multiple operations atomically. Allow and block are mutually exclusive. -// Order: mode-setting (allow/block) first, then deltas (enable/disable). 
-func (m *Manager) Batch(enable, disable, allow, block []string) (bool, error) { - if len(allow) > 0 && len(block) > 0 { - return false, fmt.Errorf("batch: allow and block are mutually exclusive") - } - - m.mu.Lock() - defer m.mu.Unlock() - before := m.activeLocked() - - // Mode-setting first - if len(allow) > 0 { - m.current = modeAllowlist - m.set = make(map[string]bool, len(allow)) - for _, t := range allow { - m.set[t] = true - } - } else if len(block) > 0 { - m.current = modeBlocklist - m.set = make(map[string]bool, len(block)) - for _, t := range block { - m.set[t] = true - } - } - - // Then deltas (reuse logic without locks since we hold mu) - if len(enable) > 0 { - switch m.current { - case modeOpen: - for _, t := range enable { - delete(m.set, t) - } - case modeAllowlist: - for _, t := range enable { - m.set[t] = true - } - case modeBlocklist: - for _, t := range enable { - delete(m.set, t) - } - } - } - if len(disable) > 0 { - switch m.current { - case modeOpen: - for _, t := range disable { - m.set[t] = true - } - case modeAllowlist: - for _, t := range disable { - delete(m.set, t) - } - case modeBlocklist: - for _, t := range disable { - m.set[t] = true - } - } - } - - after := m.activeLocked() - return !slicesEqual(before, after), nil -} - -func slicesEqual(a, b []string) bool { - if len(a) != len(b) { - return false - } - m := make(map[string]bool, len(a)) - for _, v := range a { - m[v] = true - } - for _, v := range b { - if !m[v] { - return false - } - } - return true -} -``` - -- [ ] **Step 4: Run tests to verify they pass** - -```bash -go test ./internal/toollist/... -v -``` - -Expected: all 16 tests PASS. 
- -- [ ] **Step 5: Commit** - -```bash -git add internal/toollist/ -git commit -m "feat: implement tool list state machine with open/allowlist/blocklist modes" -``` - ---- - -## Chunk 2: Go Binary Core — Process Manager, MCP Handler, Config - -### Task 5: Config — CLI Flag Parsing - -**Files:** -- Create: `internal/config/config.go` -- Create: `internal/config/config_test.go` - -- [ ] **Step 1: Write failing tests for config parsing** - -Create `internal/config/config_test.go`: - -```go -package config_test - -import ( - "reflect" - "testing" - "time" - - "github.com/msilverblatt/protomcp/internal/config" -) - -func TestParseDefaults(t *testing.T) { - cfg, err := config.Parse([]string{"dev", "server.py"}) - if err != nil { - t.Fatalf("Parse failed: %v", err) - } - if cfg.Command != "dev" { - t.Errorf("Command = %q, want %q", cfg.Command, "dev") - } - if cfg.File != "server.py" { - t.Errorf("File = %q, want %q", cfg.File, "server.py") - } - if cfg.Transport != "stdio" { - t.Errorf("Transport = %q, want %q", cfg.Transport, "stdio") - } - if cfg.CallTimeout != 5*time.Minute { - t.Errorf("CallTimeout = %v, want %v", cfg.CallTimeout, 5*time.Minute) - } - if cfg.HotReloadImmediate { - t.Error("HotReloadImmediate should default to false") - } - if cfg.LogLevel != "info" { - t.Errorf("LogLevel = %q, want %q", cfg.LogLevel, "info") - } -} - -func TestParseWithFlags(t *testing.T) { - cfg, err := config.Parse([]string{ - "run", "tools.ts", - "--transport", "grpc", - "--hot-reload", "immediate", - "--call-timeout", "30s", - "--log-level", "debug", - "--socket", "/tmp/test.sock", - "--runtime", "python3.12", - }) - if err != nil { - t.Fatalf("Parse failed: %v", err) - } - if cfg.Command != "run" { - t.Errorf("Command = %q, want %q", cfg.Command, "run") - } - if cfg.File != "tools.ts" { - t.Errorf("File = %q, want %q", cfg.File, "tools.ts") - } - if cfg.Transport != "grpc" { - t.Errorf("Transport = %q, want %q", cfg.Transport, "grpc") - } - if !cfg.HotReloadImmediate { - 
t.Error("HotReloadImmediate should be true") - } - if cfg.CallTimeout != 30*time.Second { - t.Errorf("CallTimeout = %v, want %v", cfg.CallTimeout, 30*time.Second) - } - if cfg.SocketPath != "/tmp/test.sock" { - t.Errorf("SocketPath = %q, want %q", cfg.SocketPath, "/tmp/test.sock") - } - if cfg.Runtime != "python3.12" { - t.Errorf("Runtime = %q, want %q", cfg.Runtime, "python3.12") - } -} - -func TestParseMissingFile(t *testing.T) { - _, err := config.Parse([]string{"dev"}) - if err == nil { - t.Error("expected error for missing file argument") - } -} - -func TestParseInvalidCommand(t *testing.T) { - _, err := config.Parse([]string{"foo", "server.py"}) - if err == nil { - t.Error("expected error for invalid command") - } -} - -func TestRuntimeCommand(t *testing.T) { - tests := []struct { - file string - wantCmd string - wantArgs []string - }{ - {"server.py", "python3", []string{"server.py"}}, - {"server.ts", "npx", []string{"tsx", "server.ts"}}, - {"server.js", "node", []string{"server.js"}}, - {"server.go", "go", []string{"run", "server.go"}}, - {"server.rs", "cargo", []string{"run", "server.rs"}}, - {"server", "server", nil}, - } - for _, tt := range tests { - cmd, args := config.RuntimeCommand(tt.file) - if cmd != tt.wantCmd { - t.Errorf("RuntimeCommand(%q) cmd = %q, want %q", tt.file, cmd, tt.wantCmd) - } - if !reflect.DeepEqual(args, tt.wantArgs) { - t.Errorf("RuntimeCommand(%q) args = %v, want %v", tt.file, args, tt.wantArgs) - } - } -} -``` - -- [ ] **Step 2: Run tests to verify they fail** - -```bash -go test ./internal/config/... 
-v
-```
-
-- [ ] **Step 3: Implement config**
-
-Create `internal/config/config.go`:
-
-```go
-package config
-
-import (
-	"fmt"
-	"os"
-	"path/filepath"
-	"strconv"
-	"time"
-)
-
-type Config struct {
-	Command            string
-	File               string
-	Transport          string
-	HotReloadImmediate bool
-	CallTimeout        time.Duration
-	LogLevel           string
-	SocketPath         string
-	Runtime            string
-	Host               string // For network transports (default: "localhost")
-	Port               int    // For network transports (default: 8080)
-}
-
-func Parse(args []string) (*Config, error) {
-	if len(args) < 1 {
-		return nil, fmt.Errorf("usage: protomcp <command> <file> [flags]")
-	}
-
-	cmd := args[0]
-	if cmd != "dev" && cmd != "run" {
-		return nil, fmt.Errorf("unknown command %q: must be 'dev' or 'run'", cmd)
-	}
-
-	cfg := &Config{
-		Command:     cmd,
-		Transport:   "stdio",
-		CallTimeout: 5 * time.Minute,
-		LogLevel:    "info",
-		Host:        "localhost",
-		Port:        8080,
-	}
-
-	// Find file argument (first non-flag after command)
-	i := 1
-	if i >= len(args) || args[i] == "--" {
-		return nil, fmt.Errorf("missing file argument")
-	}
-	if args[i] != "" && args[i][0] != '-' {
-		cfg.File = args[i]
-		i++
-	} else {
-		return nil, fmt.Errorf("missing file argument")
-	}
-
-	// Parse flags
-	for i < len(args) {
-		switch args[i] {
-		case "--transport":
-			i++
-			if i >= len(args) {
-				return nil, fmt.Errorf("--transport requires a value")
-			}
-			cfg.Transport = args[i]
-		case "--hot-reload":
-			i++
-			if i >= len(args) {
-				return nil, fmt.Errorf("--hot-reload requires a value")
-			}
-			if args[i] == "immediate" {
-				cfg.HotReloadImmediate = true
-			}
-		case "--call-timeout":
-			i++
-			if i >= len(args) {
-				return nil, fmt.Errorf("--call-timeout requires a value")
-			}
-			d, err := time.ParseDuration(args[i])
-			if err != nil {
-				return nil, fmt.Errorf("invalid --call-timeout: %w", err)
-			}
-			cfg.CallTimeout = d
-		case "--log-level":
-			i++
-			if i >= len(args) {
-				return nil, fmt.Errorf("--log-level requires a value")
-			}
-			cfg.LogLevel = args[i]
-		case "--socket":
-			i++
-			if i >= len(args) {
-				return nil,
fmt.Errorf("--socket requires a value") - } - cfg.SocketPath = args[i] - case "--runtime": - i++ - if i >= len(args) { - return nil, fmt.Errorf("--runtime requires a value") - } - cfg.Runtime = args[i] - case "--host": - i++ - if i >= len(args) { - return nil, fmt.Errorf("--host requires a value") - } - cfg.Host = args[i] - case "--port": - i++ - if i >= len(args) { - return nil, fmt.Errorf("--port requires a value") - } - p, err := strconv.Atoi(args[i]) - if err != nil { - return nil, fmt.Errorf("invalid --port: %w", err) - } - cfg.Port = p - default: - return nil, fmt.Errorf("unknown flag %q", args[i]) - } - i++ - } - - // Default socket path - if cfg.SocketPath == "" { - dir := os.Getenv("XDG_RUNTIME_DIR") - if dir == "" { - dir = os.TempDir() - } - cfg.SocketPath = filepath.Join(dir, "protomcp", fmt.Sprintf("%d.sock", os.Getpid())) - } - - return cfg, nil -} - -// RuntimeCommand returns the command and args to run a tool file. -// Returns (command, args) to be used with exec.Command(command, args...). -func RuntimeCommand(file string) (string, []string) { - ext := filepath.Ext(file) - switch ext { - case ".py": - cmd := "python3" - if env := os.Getenv("PROTOMCP_PYTHON"); env != "" { - cmd = env - } - return cmd, []string{file} - case ".ts": - cmd := "npx" - if env := os.Getenv("PROTOMCP_NODE"); env != "" { - return env, []string{file} - } - return cmd, []string{"tsx", file} - case ".js": - cmd := "node" - if env := os.Getenv("PROTOMCP_NODE"); env != "" { - cmd = env - } - return cmd, []string{file} - case ".go": - return "go", []string{"run", file} - case ".rs": - return "cargo", []string{"run", file} - default: - return file, nil // Treat as executable binary - } -} -``` - -- [ ] **Step 4: Run tests to verify they pass** - -```bash -go test ./internal/config/... 
-v -``` - -- [ ] **Step 5: Commit** - -```bash -git add internal/config/ -git commit -m "feat: implement CLI config parsing with flag defaults and runtime detection" -``` - ---- - -### Task 6: Process Manager — Spawn, Handshake, Crash Recovery - -**Files:** -- Create: `internal/process/manager.go` -- Create: `internal/process/manager_test.go` - -- [ ] **Step 1: Write failing tests for process manager** - -Create `internal/process/manager_test.go`. Tests use a mock tool process (a small Go program compiled as a test helper) that speaks the protobuf protocol over the unix socket: - -```go -package process_test - -import ( - "context" - "os" - "path/filepath" - "testing" - "time" - - "github.com/msilverblatt/protomcp/internal/process" - pb "github.com/msilverblatt/protomcp/gen/proto/protomcp" -) - -// TestStartAndHandshake verifies the process manager can spawn a tool process, -// perform the handshake, and retrieve the tool list. -func TestStartAndHandshake(t *testing.T) { - socketPath := filepath.Join(t.TempDir(), "test.sock") - - pm := process.NewManager(process.ManagerConfig{ - File: "testdata/echo_tool.py", - Runtime: "python3", - SocketPath: socketPath, - MaxRetries: 1, - }) - - ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second) - defer cancel() - - tools, err := pm.Start(ctx) - if err != nil { - t.Fatalf("Start failed: %v", err) - } - defer pm.Stop() - - if len(tools) == 0 { - t.Fatal("expected at least one tool from handshake") - } -} - -// TestCallTool verifies tool call dispatch and response. 
-func TestCallTool(t *testing.T) { - socketPath := filepath.Join(t.TempDir(), "test.sock") - - pm := process.NewManager(process.ManagerConfig{ - File: "testdata/echo_tool.py", - Runtime: "python3", - SocketPath: socketPath, - MaxRetries: 1, - }) - - ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second) - defer cancel() - - _, err := pm.Start(ctx) - if err != nil { - t.Fatalf("Start failed: %v", err) - } - defer pm.Stop() - - resp, err := pm.CallTool(ctx, "echo", `{"message": "hello"}`) - if err != nil { - t.Fatalf("CallTool failed: %v", err) - } - if resp.IsError { - t.Errorf("unexpected error: %s", resp.ResultJson) - } -} - -// TestReload verifies the reload cycle. -func TestReload(t *testing.T) { - socketPath := filepath.Join(t.TempDir(), "test.sock") - - pm := process.NewManager(process.ManagerConfig{ - File: "testdata/echo_tool.py", - Runtime: "python3", - SocketPath: socketPath, - MaxRetries: 1, - }) - - ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second) - defer cancel() - - _, err := pm.Start(ctx) - if err != nil { - t.Fatalf("Start failed: %v", err) - } - defer pm.Stop() - - tools, err := pm.Reload(ctx) - if err != nil { - t.Fatalf("Reload failed: %v", err) - } - if len(tools) == 0 { - t.Fatal("expected tools after reload") - } -} -``` - -Note: `testdata/echo_tool.py` is a minimal Python tool process that speaks the protobuf protocol. It will be created as part of the Python SDK task but a simple test fixture version is needed here. Create `internal/process/testdata/echo_tool.py` — a minimal script that: -1. Reads `PROTOMCP_SOCKET` env var -2. Connects to the unix socket -3. Responds to `ListToolsRequest` with one tool ("echo") -4. Responds to `CallToolRequest` by echoing the args back -5. Responds to `ReloadRequest` with success - -- [ ] **Step 2: Implement process manager** - -Create `internal/process/manager.go`: - -The process manager must: -1. Create the unix socket and listen -2. 
Spawn the tool process with `PROTOMCP_SOCKET` env var
-3. Accept the connection from the tool process
-4. Send `ListToolsRequest`, receive `ToolListResponse` (handshake)
-5. Handle `CallTool` by sending `CallToolRequest` and waiting for `CallToolResponse` (with request_id correlation)
-6. Handle `Reload` by sending `ReloadRequest`, waiting for `ReloadResponse`, then re-fetching tools
-7. Monitor the child process — on unexpected exit, attempt restart with exponential backoff (up to MaxRetries)
-8. Handle concurrent calls using request_id for correlation
-9. Provide a `Stop()` method for clean shutdown
-
-Key interfaces:
-```go
-type ManagerConfig struct {
-	File        string
-	Runtime     string   // e.g., "python3" — if empty, detect from extension
-	RuntimeCmd  string   // precomputed runtime command; overrides Runtime when set
-	RuntimeArgs []string // args for RuntimeCmd (set by cmd/protomcp/main.go)
-	SocketPath  string
-	MaxRetries  int           // default 3
-	CallTimeout time.Duration // default 5m
-}
-
-type Manager struct { /* ... */ }
-
-func NewManager(cfg ManagerConfig) *Manager
-func (m *Manager) Start(ctx context.Context) ([]*pb.ToolDefinition, error)
-func (m *Manager) Stop() error
-func (m *Manager) CallTool(ctx context.Context, name string, argsJSON string) (*pb.CallToolResponse, error)
-func (m *Manager) Reload(ctx context.Context) ([]*pb.ToolDefinition, error)
-func (m *Manager) HandleToolListControl(ctx context.Context, env *pb.Envelope) (*pb.ActiveToolsResponse, error)
-func (m *Manager) OnCrash() <-chan error // channel that receives crash events
-```
-
-- [ ] **Step 3: Create test fixture echo_tool.py**
-
-Create `internal/process/testdata/echo_tool.py` — a minimal Python script that speaks the protobuf envelope protocol. This is a standalone test fixture (not the SDK). It:
-- Reads `PROTOMCP_SOCKET` from env
-- Connects to the unix socket
-- Reads length-prefixed envelopes
-- Responds to `ListToolsRequest` with one tool: `echo(message: str) -> str`
-- Responds to `CallToolRequest` by echoing args
-- Responds to `ReloadRequest` with `success=true`
-
-This requires the generated Python protobuf code.
For the test fixture, use raw protobuf encoding with the `protobuf` pip package and the generated `protomcp_pb2.py`. - -- [ ] **Step 4: Run tests to verify they pass** - -```bash -go test ./internal/process/... -v -timeout 30s -``` - -- [ ] **Step 5: Commit** - -```bash -git add internal/process/ -git commit -m "feat: implement process manager with spawn, handshake, call dispatch, and crash recovery" -``` - ---- - -### Task 7: MCP Protocol Types and Handler - -**Files:** -- Create: `internal/mcp/types.go` -- Create: `internal/mcp/handler.go` -- Create: `internal/mcp/handler_test.go` - -- [ ] **Step 1: Write MCP JSON-RPC types** - -Create `internal/mcp/types.go` with types for: -- `JSONRPCRequest` / `JSONRPCResponse` / `JSONRPCNotification` (generic JSON-RPC 2.0) -- `InitializeRequest` / `InitializeResponse` (MCP initialization with capabilities) -- `ToolsListRequest` / `ToolsListResponse` (tools/list) -- `ToolsCallRequest` / `ToolsCallResponse` (tools/call) -- `ToolsListChangedNotification` (notifications/tools/list_changed) -- MCP capability structs (declaring `tools.listChanged: true`) - -These are standard MCP protocol types serialized as JSON, not protobuf. 
- -- [ ] **Step 2: Write failing tests for MCP handler** - -Create `internal/mcp/handler_test.go`: - -```go -package mcp_test - -import ( - "context" - "encoding/json" - "testing" - - "github.com/msilverblatt/protomcp/internal/mcp" - pb "github.com/msilverblatt/protomcp/gen/proto/protomcp" -) - -// mockToolBackend implements the interface the handler uses to talk to the tool process -type mockToolBackend struct { - tools []*pb.ToolDefinition -} - -func (m *mockToolBackend) ActiveTools() []*pb.ToolDefinition { - return m.tools -} - -func (m *mockToolBackend) CallTool(ctx context.Context, name, argsJSON string) (*pb.CallToolResponse, error) { - return &pb.CallToolResponse{ - ResultJson: `[{"type":"text","text":"result"}]`, - }, nil -} - -func TestHandleInitialize(t *testing.T) { - h := mcp.NewHandler(&mockToolBackend{}) - - req := mcp.JSONRPCRequest{ - JSONRPC: "2.0", - ID: json.RawMessage(`1`), - Method: "initialize", - } - - resp, err := h.Handle(context.Background(), req) - if err != nil { - t.Fatalf("Handle initialize failed: %v", err) - } - - // Should return capabilities with tools.listChanged = true - var result mcp.InitializeResult - if err := json.Unmarshal(resp.Result, &result); err != nil { - t.Fatalf("unmarshal result: %v", err) - } - if !result.Capabilities.Tools.ListChanged { - t.Error("expected tools.listChanged = true") - } -} - -func TestHandleToolsList(t *testing.T) { - backend := &mockToolBackend{ - tools: []*pb.ToolDefinition{ - {Name: "search", Description: "Search docs", InputSchemaJson: `{"type":"object","properties":{"query":{"type":"string"}}}`}, - }, - } - h := mcp.NewHandler(backend) - - req := mcp.JSONRPCRequest{ - JSONRPC: "2.0", - ID: json.RawMessage(`2`), - Method: "tools/list", - } - - resp, err := h.Handle(context.Background(), req) - if err != nil { - t.Fatalf("Handle tools/list failed: %v", err) - } - - var result mcp.ToolsListResult - if err := json.Unmarshal(resp.Result, &result); err != nil { - t.Fatalf("unmarshal result: %v", 
err) - } - if len(result.Tools) != 1 { - t.Fatalf("expected 1 tool, got %d", len(result.Tools)) - } - if result.Tools[0].Name != "search" { - t.Errorf("tool name = %q, want %q", result.Tools[0].Name, "search") - } -} - -func TestHandleToolsCall(t *testing.T) { - backend := &mockToolBackend{ - tools: []*pb.ToolDefinition{ - {Name: "search", Description: "Search docs", InputSchemaJson: `{}`}, - }, - } - h := mcp.NewHandler(backend) - - params, _ := json.Marshal(map[string]interface{}{ - "name": "search", - "arguments": map[string]string{"query": "hello"}, - }) - req := mcp.JSONRPCRequest{ - JSONRPC: "2.0", - ID: json.RawMessage(`3`), - Method: "tools/call", - Params: params, - } - - resp, err := h.Handle(context.Background(), req) - if err != nil { - t.Fatalf("Handle tools/call failed: %v", err) - } - - if resp.Error != nil { - t.Errorf("unexpected error: %v", resp.Error) - } -} -``` - -- [ ] **Step 3: Implement MCP handler** - -Create `internal/mcp/handler.go`: - -The handler: -- Implements `Handle(ctx, JSONRPCRequest) -> JSONRPCResponse` -- Routes by method: `initialize`, `tools/list`, `tools/call`, `notifications/initialized` -- For `initialize`: returns server info and capabilities (`tools.listChanged: true`) -- For `tools/list`: calls `backend.ActiveTools()` and formats as MCP response -- For `tools/call`: extracts tool name and args, calls `backend.CallTool()`, intercepts `enable_tools`/`disable_tools` from the response, and returns the MCP-formatted result -- Provides `ListChangedNotification() -> JSONRPCNotification` for the transport to send -- Unknown methods return JSON-RPC method-not-found error - -- [ ] **Step 4: Run tests to verify they pass** - -```bash -go test ./internal/mcp/... 
-v -``` - -- [ ] **Step 5: Commit** - -```bash -git add internal/mcp/ -git commit -m "feat: implement MCP JSON-RPC handler with initialize, tools/list, and tools/call" -``` - ---- - -### Task 8: Middleware — Logging and Error Handling - -**Files:** -- Create: `internal/middleware/chain.go` -- Create: `internal/middleware/logging.go` -- Create: `internal/middleware/errors.go` - -- [ ] **Step 1: Implement middleware chain** - -Create `internal/middleware/chain.go`: - -```go -package middleware - -import ( - "context" - - "github.com/msilverblatt/protomcp/internal/mcp" -) - -// Handler processes an MCP request and returns a response. -type Handler func(ctx context.Context, req mcp.JSONRPCRequest) (*mcp.JSONRPCResponse, error) - -// Middleware wraps a Handler with additional behavior. -type Middleware func(next Handler) Handler - -// Chain applies middleware in order (first middleware is outermost). -func Chain(handler Handler, middlewares ...Middleware) Handler { - for i := len(middlewares) - 1; i >= 0; i-- { - handler = middlewares[i](handler) - } - return handler -} -``` - -- [ ] **Step 2: Implement logging middleware** - -Create `internal/middleware/logging.go`: - -Logs each request (method, request ID) and response (duration, error status). Uses `log/slog` for structured logging. Log level controlled by config. - -- [ ] **Step 3: Implement error formatting middleware** - -Create `internal/middleware/errors.go`: - -Catches panics and unhandled errors from the handler, formats them as agent-friendly structured errors with `error_code`, `message`, `suggestion`, and `retryable` fields. 
- -- [ ] **Step 4: Commit** - -```bash -git add internal/middleware/ -git commit -m "feat: implement middleware chain with structured logging and error formatting" -``` - ---- - -## Chunk 3: Transports, File Watcher, CLI Entry Point - -### Task 9: Transport Interface and stdio Transport - -**Files:** -- Create: `internal/transport/transport.go` -- Create: `internal/transport/stdio.go` -- Create: `internal/transport/stdio_test.go` - -- [ ] **Step 1: Define transport interface** - -Create `internal/transport/transport.go`: - -```go -package transport - -import ( - "context" - - "github.com/msilverblatt/protomcp/internal/mcp" -) - -// Transport handles bidirectional MCP communication with the host/client. -type Transport interface { - // Start begins listening for MCP requests. Calls handler for each request. - // Blocks until ctx is cancelled or an error occurs. - Start(ctx context.Context, handler mcp.RequestHandler) error - - // SendNotification pushes a server-initiated notification to the client. - SendNotification(notification mcp.JSONRPCNotification) error - - // Close shuts down the transport. - Close() error -} - -// mcp.RequestHandler is: func(ctx context.Context, req JSONRPCRequest) (*JSONRPCResponse, error) -``` - -- [ ] **Step 2: Write failing tests for stdio transport** - -Create `internal/transport/stdio_test.go`: - -Test that the stdio transport reads JSON-RPC requests from stdin, passes them to the handler, and writes responses to stdout. Use `io.Pipe` to simulate stdin/stdout. - -- [ ] **Step 3: Implement stdio transport** - -Create `internal/transport/stdio.go`: - -Reads newline-delimited JSON-RPC messages from stdin, dispatches to handler, writes JSON-RPC responses to stdout. Handles `notifications/initialized` (no response needed). - -- [ ] **Step 4: Run tests** - -```bash -go test ./internal/transport/... 
-run TestStdio -v -``` - -- [ ] **Step 5: Commit** - -```bash -git add internal/transport/transport.go internal/transport/stdio.go internal/transport/stdio_test.go -git commit -m "feat: implement transport interface and stdio transport" -``` - ---- - -### Task 10: Streamable HTTP Transport - -**Files:** -- Create: `internal/transport/http.go` -- Create: `internal/transport/http_test.go` - -- [ ] **Step 1: Write failing tests** - -Test that: -- POST to `/mcp` with a JSON-RPC request returns a JSON-RPC response -- GET to `/mcp` opens an SSE stream for server-initiated notifications -- `SendNotification` pushes events to connected SSE clients - -- [ ] **Step 2: Implement HTTP transport** - -Uses `net/http`. Single endpoint `/mcp`. POST for requests, GET for SSE stream. Maintains a list of SSE clients for notifications. - -- [ ] **Step 3: Run tests and commit** - -```bash -go test ./internal/transport/... -run TestHTTP -v -git add internal/transport/http.go internal/transport/http_test.go -git commit -m "feat: implement streamable HTTP transport with SSE notifications" -``` - ---- - -### Task 11: SSE Transport - -**Files:** -- Create: `internal/transport/sse.go` -- Create: `internal/transport/sse_test.go` - -- [ ] **Step 1: Implement SSE transport** - -Legacy SSE transport per MCP spec: separate SSE endpoint for server-to-client, POST endpoint for client-to-server. Largely reuses HTTP transport internals. - -- [ ] **Step 2: Test and commit** - -```bash -go test ./internal/transport/... -run TestSSE -v -git add internal/transport/sse.go internal/transport/sse_test.go -git commit -m "feat: implement legacy SSE transport" -``` - ---- - -### Task 12: WebSocket Transport - -**Files:** -- Create: `internal/transport/ws.go` -- Create: `internal/transport/ws_test.go` - -- [ ] **Step 1: Implement WebSocket transport** - -Uses `nhooyr.io/websocket` (or `gorilla/websocket`). Single WebSocket connection for bidirectional JSON-RPC. Notifications are pushed as WebSocket messages. 
- -- [ ] **Step 2: Test and commit** - -```bash -go test ./internal/transport/... -run TestWS -v -git add internal/transport/ws.go internal/transport/ws_test.go -git commit -m "feat: implement WebSocket transport" -``` - ---- - -### Task 13: gRPC Transport - -**Files:** -- Create: `internal/transport/grpc.go` -- Create: `internal/transport/grpc_test.go` -- Modify: `proto/protomcp.proto` (add external gRPC service definition) - -- [ ] **Step 1: Add external gRPC service to proto** - -Add a separate service definition in `proto/protomcp.proto` for the external gRPC transport (client-facing, separate from the internal envelope protocol): - -```protobuf -// External gRPC service — client-facing MCP transport -service MCPService { - rpc Request(MCPRequest) returns (MCPResponse); - rpc Subscribe(MCPSubscribeRequest) returns (stream MCPNotification); -} - -message MCPRequest { - string jsonrpc_request = 1; // JSON-encoded MCP JSON-RPC request -} -message MCPResponse { - string jsonrpc_response = 1; // JSON-encoded MCP JSON-RPC response -} -message MCPSubscribeRequest {} -message MCPNotification { - string jsonrpc_notification = 1; // JSON-encoded notification -} -``` - -- [ ] **Step 2: Regenerate proto and implement gRPC transport** - -```bash -make proto -``` - -Implement gRPC server that wraps JSON-RPC messages in protobuf, dispatches to handler, and streams notifications. - -- [ ] **Step 3: Test and commit** - -```bash -go test ./internal/transport/... 
-run TestGRPC -v -git add internal/transport/grpc.go internal/transport/grpc_test.go proto/protomcp.proto -git commit -m "feat: implement gRPC transport with external service definition" -``` - ---- - -### Task 14: File Watcher — Reload Orchestration - -**Files:** -- Create: `internal/reload/watcher.go` -- Create: `internal/reload/watcher_test.go` - -- [ ] **Step 1: Write failing tests** - -Test that: -- Watcher detects file modifications and calls the reload callback -- Watcher debounces rapid changes (only one reload per debounce window) -- Watcher supports both single file and directory watching -- Watcher filters by relevant file extensions - -- [ ] **Step 2: Implement file watcher** - -Create `internal/reload/watcher.go`: - -Uses `github.com/fsnotify/fsnotify`. Key behavior: -- Watches the specified file or directory -- On change, debounces (100ms) then calls the reload callback -- Reload callback signature: `func() error` -- The watcher does NOT do the reload itself — it signals the main server loop -- In `run` mode (production), the watcher is never started - -```go -type Watcher struct { /* ... */ } - -func NewWatcher(path string, extensions []string, onChange func()) (*Watcher, error) -func (w *Watcher) Start(ctx context.Context) error -func (w *Watcher) Stop() error -``` - -- [ ] **Step 3: Test and commit** - -```bash -go test ./internal/reload/... 
-v -git add internal/reload/ -git commit -m "feat: implement file watcher with debouncing and extension filtering" -``` - ---- - -### Task 15: CLI Entry Point — Wiring It All Together - -**Files:** -- Create: `cmd/protomcp/main.go` - -- [ ] **Step 1: Implement main.go** - -Create `cmd/protomcp/main.go` that wires everything together: - -```go -package main - -import ( - "context" - "fmt" - "log/slog" - "os" - "os/signal" - - "github.com/msilverblatt/protomcp/internal/config" - "github.com/msilverblatt/protomcp/internal/mcp" - "github.com/msilverblatt/protomcp/internal/middleware" - "github.com/msilverblatt/protomcp/internal/process" - "github.com/msilverblatt/protomcp/internal/reload" - "github.com/msilverblatt/protomcp/internal/toollist" - "github.com/msilverblatt/protomcp/internal/transport" -) - -func main() { - cfg, err := config.Parse(os.Args[1:]) - if err != nil { - fmt.Fprintf(os.Stderr, "error: %v\n", err) - fmt.Fprintf(os.Stderr, "usage: protomcp [flags]\n") - os.Exit(1) - } - - // Setup structured logging - logLevel := parseLogLevel(cfg.LogLevel) - logger := slog.New(slog.NewTextHandler(os.Stderr, &slog.HandlerOptions{Level: logLevel})) - slog.SetDefault(logger) - - ctx, cancel := signal.NotifyContext(context.Background(), os.Interrupt) - defer cancel() - - // 1. Create tool list manager - tlm := toollist.New() - - // 2. Determine runtime command - var runtimeCmd string - var runtimeArgs []string - if cfg.Runtime != "" { - runtimeCmd = cfg.Runtime - runtimeArgs = []string{cfg.File} - } else { - runtimeCmd, runtimeArgs = config.RuntimeCommand(cfg.File) - } - - // 3. 
Start process manager - pm := process.NewManager(process.ManagerConfig{ - File: cfg.File, - RuntimeCmd: runtimeCmd, - RuntimeArgs: runtimeArgs, - SocketPath: cfg.SocketPath, - MaxRetries: 3, - CallTimeout: cfg.CallTimeout, - }) - - tools, err := pm.Start(ctx) - if err != nil { - slog.Error("failed to start tool process", "error", err) - os.Exit(1) - } - - // Register tools and log them - toolNames := make([]string, len(tools)) - for i, t := range tools { - toolNames[i] = t.Name - slog.Info("tool registered", "name", t.Name, "description", t.Description) - } - tlm.SetRegistered(toolNames) - - // 4. Create MCP handler with tool backend - backend := newToolBackend(pm, tlm, tools) - handler := mcp.NewHandler(backend) - - // 5. Apply middleware - chain := middleware.Chain( - handler.Handle, - middleware.Logging(logger), - middleware.ErrorFormatting(), - ) - - // 6. Create transport - tp, err := createTransport(cfg.Transport) - if err != nil { - slog.Error("failed to create transport", "error", err) - os.Exit(1) - } - - // 7. Handle tool list control messages from tool process - go handleToolListControl(ctx, pm, tlm, tp) - - // 8. Handle crash recovery - go handleCrashRecovery(ctx, pm, tlm, tools, tp) - - // 9. 
Start file watcher (dev mode only) - if cfg.Command == "dev" { - w, err := reload.NewWatcher(cfg.File, nil, func() { - // Wait for in-flight calls unless immediate mode - if !cfg.HotReloadImmediate { - pm.WaitForInFlight() - } - newTools, err := pm.Reload(ctx) - if err != nil { - slog.Error("reload failed", "error", err) - return - } - // Update tool list - newNames := make([]string, len(newTools)) - for i, t := range newTools { - newNames[i] = t.Name - } - oldActive := tlm.Active() - tlm.SetRegistered(newNames) - backend.UpdateTools(newTools) - newActive := tlm.Active() - if !slicesEqual(oldActive, newActive) { - slog.Info("tool list changed", "added", diff(newActive, oldActive), "removed", diff(oldActive, newActive)) - tp.SendNotification(mcp.ListChangedNotification()) - } - }) - if err != nil { - slog.Error("failed to create file watcher", "error", err) - os.Exit(1) - } - go w.Start(ctx) - defer w.Stop() - } - - // 10. Start transport (blocks until ctx cancelled) - slog.Info("protomcp started", "command", cfg.Command, "file", cfg.File, "transport", cfg.Transport) - if err := tp.Start(ctx, chain); err != nil { - slog.Error("transport error", "error", err) - os.Exit(1) - } -} -``` - -Note: `createTransport()`, `newToolBackend()`, `handleToolListControl()`, `handleCrashRecovery()`, `parseLogLevel()`, `slicesEqual()`, `diff()` are helper functions in the same file or a `helpers.go` file. Keep it focused — these are thin wiring functions, not business logic. - -- [ ] **Step 2: Build and verify it compiles** - -```bash -make build -``` - -Expected: `bin/protomcp` binary created. - -- [ ] **Step 3: Smoke test with a Python fixture** - -```bash -echo '{"jsonrpc":"2.0","id":1,"method":"initialize","params":{}}' | bin/protomcp dev internal/process/testdata/echo_tool.py -``` - -Expected: JSON-RPC response with capabilities. 
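For reference, the response should look roughly like this (illustrative values — the exact `protocolVersion` and `serverInfo` fields depend on the SDK version and build; the `tools.listChanged: true` capability is what the e2e tests in Task 25 assert):

```json
{
  "jsonrpc": "2.0",
  "id": 1,
  "result": {
    "protocolVersion": "2025-03-26",
    "capabilities": {
      "tools": { "listChanged": true }
    },
    "serverInfo": { "name": "protomcp", "version": "0.1.0" }
  }
}
```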
-
-- [ ] **Step 4: Commit**
-
-```bash
-git add cmd/protomcp/
-git commit -m "feat: implement CLI entry point wiring all components together"
-```
-
---
-
-## Chunk 4: Python SDK
-
-### Task 16: Python Project Setup
-
-**Files:**
-- Create: `sdk/python/pyproject.toml`
-- Create: `sdk/python/src/protomcp/__init__.py`
-
-- [ ] **Step 1: Create pyproject.toml**
-
-```toml
-[build-system]
-requires = ["hatchling"]
-build-backend = "hatchling.build"
-
-[project]
-name = "protomcp"
-version = "0.1.0"
-description = "Write MCP tools in Python. No MCP knowledge required."
-requires-python = ">=3.10"
-dependencies = [
-    "protobuf>=4.0",
-]
-
-[project.optional-dependencies]
-dev = [
-    "pytest>=7.0",
-    "pytest-asyncio>=0.21",
-]
-
-[tool.hatch.build.targets.wheel]
-packages = ["src/protomcp"]
-```
-
-- [ ] **Step 2: Create __init__.py with public API**
-
-```python
-from protomcp.tool import tool
-from protomcp.result import ToolResult
-from protomcp import manager as tool_manager
-
-__all__ = ["tool", "ToolResult", "tool_manager"]
-```
-
-- [ ] **Step 3: Generate Python protobuf code**
-
-```bash
-make proto
-```
-
-Verify: `sdk/python/src/protomcp/gen/protomcp_pb2.py` exists (generated inside the package so that `from protomcp.gen import protomcp_pb2` works at runtime, as Tasks 19 and 20 assume).
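Before wiring the generated code into a transport (Task 19), it helps to see the wire format those messages travel in: a 4-byte big-endian length prefix, then the serialized protobuf bytes. A self-contained sketch, with raw bytes standing in for a serialized `Envelope`:

```python
import struct

def frame(payload: bytes) -> bytes:
    """Prefix payload with its length as an unsigned 32-bit big-endian integer."""
    return struct.pack(">I", len(payload)) + payload

def unframe(buf: bytes) -> tuple[bytes, bytes]:
    """Split one framed message off the front of buf; returns (payload, rest)."""
    (length,) = struct.unpack(">I", buf[:4])
    return buf[4:4 + length], buf[4 + length:]
```

The `Transport.send`/`recv` methods in Task 19 implement this same framing over a unix socket.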
-
-- [ ] **Step 4: Commit**
-
-```bash
-git add sdk/python/pyproject.toml sdk/python/src/protomcp/__init__.py
-git commit -m "feat: initialize Python SDK project"
-```
-
---
-
-### Task 17: Python — @tool Decorator and Schema Generation
-
-**Files:**
-- Create: `sdk/python/src/protomcp/tool.py`
-- Create: `sdk/python/tests/test_tool.py`
-
-- [ ] **Step 1: Write failing tests**
-
-Create `sdk/python/tests/test_tool.py`:
-
-```python
-import json
-from protomcp.tool import tool, get_registered_tools, clear_registry
-
-
-def test_tool_decorator_registers():
-    """@tool() should register the function as a tool."""
-    clear_registry()
-    @tool(description="Add two numbers")
-    def add(a: int, b: int) -> int:
-        return a + b
-
-    tools = get_registered_tools()
-    assert any(t.name == "add" for t in tools)
-
-
-def test_tool_schema_from_type_hints():
-    """Schema should be generated from Python type annotations."""
-    clear_registry()
-    @tool(description="Search documents")
-    def search(query: str, limit: int = 10) -> list:
-        return []
-
-    tools = get_registered_tools()
-    t = next(t for t in tools if t.name == "search")
-    schema = json.loads(t.input_schema_json)
-
-    assert schema["type"] == "object"
-    assert "query" in schema["properties"]
-    assert schema["properties"]["query"]["type"] == "string"
-    assert "limit" in schema["properties"]
-    assert schema["properties"]["limit"]["type"] == "integer"
-    assert schema["properties"]["limit"]["default"] == 10
-    assert "query" in schema["required"]
-    assert "limit" not in schema["required"]  # has default
-
-
-def test_tool_callable():
-    """Decorated function should still be callable normally."""
-    clear_registry()
-    @tool(description="Double a number")
-    def double(n: int) -> int:
-        return n * 2
-
-    assert double(5) == 10
-
-
-def test_tool_optional_params():
-    """Optional params with defaults should not be in required."""
-    clear_registry()
-    from typing import Optional
-
-    @tool(description="Greet")
-    def greet(name: str, greeting: Optional[str] = None) -> str:
-        return f"{greeting or 'Hello'}, {name}!"
-
-    tools = get_registered_tools()
-    t = next(t for t in tools if t.name == "greet")
-    schema = json.loads(t.input_schema_json)
-
-    assert "name" in schema["required"]
-    assert "greeting" not in schema["required"]
-
-
-def test_tool_optional_without_default():
-    """Optional[X] without a default should NOT be required."""
-    clear_registry()
-    from typing import Optional
-
-    @tool(description="Maybe filter")
-    def search(query: str, tag: Optional[str]) -> list:
-        return []
-
-    tools = get_registered_tools()
-    t = next(t for t in tools if t.name == "search")
-    schema = json.loads(t.input_schema_json)
-    assert "tag" not in schema.get("required", [])
-```
-
-- [ ] **Step 2: Run tests to verify they fail**
-
-```bash
-cd sdk/python && python -m pytest tests/test_tool.py -v
-```
-
-- [ ] **Step 3: Implement @tool decorator**
-
-Create `sdk/python/src/protomcp/tool.py`:
-
-```python
-import inspect
-import json
-from dataclasses import dataclass
-from typing import Any, Callable, Optional, get_type_hints
-
-# Global registry of tools
-_registry: list["ToolDef"] = []
-
-
-@dataclass
-class ToolDef:
-    name: str
-    description: str
-    input_schema_json: str
-    handler: Callable
-
-
-def tool(description: str):
-    """Decorator that registers a function as an MCP tool.
-
-    Schema is generated automatically from Python type annotations.
-    """
-    def decorator(func: Callable) -> Callable:
-        schema = _generate_schema(func)
-        _registry.append(ToolDef(
-            name=func.__name__,
-            description=description,
-            input_schema_json=json.dumps(schema),
-            handler=func,
-        ))
-        return func
-    return decorator
-
-
-def get_registered_tools() -> list[ToolDef]:
-    return list(_registry)
-
-
-def clear_registry():
-    _registry.clear()
-
-
-_PYTHON_TYPE_TO_JSON_SCHEMA = {
-    str: "string",
-    int: "integer",
-    float: "number",
-    bool: "boolean",
-    list: "array",
-    dict: "object",
-}
-
-
-def _generate_schema(func: Callable) -> dict:
-    """Generate JSON Schema from function signature and type hints."""
-    hints = get_type_hints(func)
-    sig = inspect.signature(func)
-
-    properties = {}
-    required = []
-
-    for name, param in sig.parameters.items():
-        if name in ("self", "cls", "ctx"):
-            continue
-
-        hint = hints.get(name, Any)
-        # Skip ToolContext parameters (injected by the runner, not caller-supplied)
-        if getattr(hint, "__name__", "") == "ToolContext":
-            continue
-        json_type = _python_type_to_json(hint)
-        prop: dict[str, Any] = {"type": json_type}
-
-        if param.default is not inspect.Parameter.empty:
-            prop["default"] = param.default
-        elif not _is_optional_type(hint):
-            required.append(name)
-
-        properties[name] = prop
-
-    schema: dict[str, Any] = {
-        "type": "object",
-        "properties": properties,
-    }
-    if required:
-        schema["required"] = required
-
-    return schema
-
-
-def _is_optional_type(hint) -> bool:
-    """Check if a type hint is Optional[X] (Union[X, None])."""
-    import typing
-    origin = getattr(hint, "__origin__", None)
-    if origin is typing.Union:
-        return type(None) in hint.__args__
-    return False
-
-
-def _python_type_to_json(hint) -> str:
-    """Convert a Python type hint to a JSON Schema type string."""
-    # Unwrap Optional[X] (typing.Union including None) to X
-    import typing
-    origin = getattr(hint, "__origin__", None)
-    if origin is typing.Union:
-        args = hint.__args__
-        non_none = [a for a in args if a is not type(None)]
-        if len(non_none) == 1:
-            return _python_type_to_json(non_none[0])
-
-    return _PYTHON_TYPE_TO_JSON_SCHEMA.get(hint, "string")
-```
-
-- [ ] **Step 4: Run tests to verify they pass**
-
-```bash
-cd sdk/python && python -m pytest tests/test_tool.py -v
-```
-
-- [ ] **Step 5: Commit**
-
-```bash
-git add sdk/python/src/protomcp/tool.py sdk/python/tests/test_tool.py
-git commit -m "feat: implement Python @tool decorator with automatic schema generation from type hints"
-```
-
---
-
-### Task 18: Python — ToolResult Type
-
-**Files:**
-- Create: `sdk/python/src/protomcp/result.py`
-- Create: `sdk/python/tests/test_result.py`
-
-- [ ] **Step 1: Write failing tests**
-
-```python
-from protomcp.result import ToolResult
-
-
-def test_tool_result_basic():
-    r = ToolResult(result="success")
-    assert r.result == "success"
-    assert r.enable_tools is None
-    assert r.disable_tools is None
-
-
-def test_tool_result_with_mutations():
-    r = ToolResult(
-        result="connected",
-        enable_tools=["query_db"],
-        disable_tools=["connect_db"],
-    )
-    assert r.enable_tools == ["query_db"]
-    assert r.disable_tools == ["connect_db"]
-
-
-def test_tool_result_with_error():
-    r = ToolResult(
-        is_error=True,
-        error_code="NOT_FOUND",
-        message="User not found",
-        suggestion="Try searching by email",
-        retryable=False,
-    )
-    assert r.is_error is True
-    assert r.error_code == "NOT_FOUND"
-```
-
-- [ ] **Step 2: Implement ToolResult**
-
-```python
-from dataclasses import dataclass
-from typing import Optional
-
-
-@dataclass
-class ToolResult:
-    result: str = ""
-    is_error: bool = False
-    enable_tools: Optional[list[str]] = None
-    disable_tools: Optional[list[str]] = None
-    # Structured error fields
-    error_code: Optional[str] = None
-    message: Optional[str] = None
-    suggestion: Optional[str] = None
-    retryable: bool = False
-```
-
-- [ ] **Step 3: Test and commit**
-
-```bash
-cd sdk/python && python -m pytest tests/test_result.py -v
-git add sdk/python/src/protomcp/result.py sdk/python/tests/test_result.py -git commit -m "feat: implement Python ToolResult type with tool list mutations and structured errors" -``` - ---- - -### Task 19: Python — Transport Layer (Unix Socket + Envelope) - -**Files:** -- Create: `sdk/python/src/protomcp/transport.py` -- Create: `sdk/python/tests/test_transport.py` - -- [ ] **Step 1: Write failing tests** - -Test that `Transport` can: -- Connect to a unix socket -- Write a length-prefixed protobuf envelope -- Read a length-prefixed protobuf envelope -- Handle multiple sequential messages - -- [ ] **Step 2: Implement transport** - -```python -import socket -import struct -from protomcp.gen import protomcp_pb2 as pb - - -class Transport: - """Speaks length-prefixed protobuf envelopes over a unix socket.""" - - def __init__(self, socket_path: str): - self._socket_path = socket_path - self._sock: socket.socket | None = None - - def connect(self): - self._sock = socket.socket(socket.AF_UNIX, socket.SOCK_STREAM) - self._sock.connect(self._socket_path) - - def send(self, envelope: pb.Envelope): - data = envelope.SerializeToString() - length = struct.pack(">I", len(data)) - self._sock.sendall(length + data) - - def recv(self) -> pb.Envelope: - length_bytes = self._recv_exactly(4) - length = struct.unpack(">I", length_bytes)[0] - data = self._recv_exactly(length) - env = pb.Envelope() - env.ParseFromString(data) - return env - - def close(self): - if self._sock: - self._sock.close() - - def _recv_exactly(self, n: int) -> bytes: - buf = bytearray() - while len(buf) < n: - chunk = self._sock.recv(n - len(buf)) - if not chunk: - raise ConnectionError("socket closed") - buf.extend(chunk) - return bytes(buf) -``` - -- [ ] **Step 3: Test and commit** - -```bash -cd sdk/python && python -m pytest tests/test_transport.py -v -git add sdk/python/src/protomcp/transport.py sdk/python/tests/test_transport.py -git commit -m "feat: implement Python transport layer for unix socket + 
envelope protocol" -``` - ---- - -### Task 20: Python — tool_manager Client - -**Files:** -- Create: `sdk/python/src/protomcp/manager.py` -- Create: `sdk/python/tests/test_manager.py` - -- [ ] **Step 1: Write failing tests** - -Test that `tool_manager` methods send the correct protobuf messages over the transport and return the response. - -- [ ] **Step 2: Implement manager** - -```python -from protomcp.transport import Transport -from protomcp.gen import protomcp_pb2 as pb - -_transport: Transport | None = None - - -def _get_transport() -> Transport: - if _transport is None: - raise RuntimeError("protomcp not connected — are you running via 'protomcp dev'?") - return _transport - - -def _init(transport: Transport): - global _transport - _transport = transport - - -def enable(tool_names: list[str]) -> list[str]: - t = _get_transport() - env = pb.Envelope( - enable_tools=pb.EnableToolsRequest(tool_names=tool_names) - ) - t.send(env) - resp = t.recv() - return list(resp.active_tools.tool_names) - - -def disable(tool_names: list[str]) -> list[str]: - t = _get_transport() - env = pb.Envelope( - disable_tools=pb.DisableToolsRequest(tool_names=tool_names) - ) - t.send(env) - resp = t.recv() - return list(resp.active_tools.tool_names) - - -def set_allowed(tool_names: list[str]) -> list[str]: - t = _get_transport() - env = pb.Envelope( - set_allowed=pb.SetAllowedRequest(tool_names=tool_names) - ) - t.send(env) - resp = t.recv() - return list(resp.active_tools.tool_names) - - -def set_blocked(tool_names: list[str]) -> list[str]: - t = _get_transport() - env = pb.Envelope( - set_blocked=pb.SetBlockedRequest(tool_names=tool_names) - ) - t.send(env) - resp = t.recv() - return list(resp.active_tools.tool_names) - - -def get_active_tools() -> list[str]: - t = _get_transport() - env = pb.Envelope( - get_active_tools=pb.GetActiveToolsRequest() - ) - t.send(env) - resp = t.recv() - return list(resp.active_tools.tool_names) - - -def batch( - enable: list[str] | None = None, - 
disable: list[str] | None = None,
-    allow: list[str] | None = None,
-    block: list[str] | None = None,
-) -> list[str]:
-    t = _get_transport()
-    env = pb.Envelope(
-        batch=pb.BatchUpdateRequest(
-            enable=enable or [],
-            disable=disable or [],
-            allow=allow or [],
-            block=block or [],
-        )
-    )
-    t.send(env)
-    resp = t.recv()
-    return list(resp.active_tools.tool_names)
-```
-
-- [ ] **Step 3: Test and commit**
-
-```bash
-cd sdk/python && python -m pytest tests/test_manager.py -v
-git add sdk/python/src/protomcp/manager.py sdk/python/tests/test_manager.py
-git commit -m "feat: implement Python tool_manager client for dynamic tool list control"
-```
-
---
-
-### Task 21: Python — Runner (Main Loop)
-
-**Files:**
-- Create: `sdk/python/src/protomcp/runner.py`
-
-- [ ] **Step 1: Implement runner**
-
-The runner is the main loop that the tool process runs. It:
-1. Reads `PROTOMCP_SOCKET` from env
-2. Connects to the unix socket via `Transport`
-3. Initializes `tool_manager` with the transport
-4. Listens for envelopes from the Go binary
-5. Dispatches `ListToolsRequest` → returns registered tools from `tool.get_registered_tools()`
-6. Dispatches `CallToolRequest` → finds the handler, calls it, returns `CallToolResponse`
-7. Dispatches `ReloadRequest` → calls `importlib.reload()` on the user's module, clears and re-registers tools, returns `ReloadResponse`
-
-A user's tool file could start the runner explicitly:
-
-```python
-# At the bottom of a user's tool file:
-if __name__ == "__main__":
-    from protomcp.runner import run
-    run()
-```
-
-In practice, though, the runner should auto-start so tool files need no boilerplate. When the tool process is spawned, the Python SDK must:
-1. Import the user's module (which registers tools via `@tool()`)
-2. Start the runner loop
-
-The SDK's entry point handles this: the Go binary runs `python -c "import protomcp.runner; protomcp.runner.start('server')"` where `server` is the module path. Keep `protomcp.run()` as a documented fallback for users who invoke their file directly.
-
-- [ ] **Step 2: Commit**
-
-```bash
-git add sdk/python/src/protomcp/runner.py
-git commit -m "feat: implement Python runner main loop with reload and tool dispatch"
-```
-
---
-
-## Chunk 5: TypeScript SDK
-
-### Task 22: TypeScript Project Setup
-
-**Files:**
-- Create: `sdk/typescript/package.json`
-- Create: `sdk/typescript/tsconfig.json`
-- Create: `sdk/typescript/vitest.config.ts`
-- Create: `sdk/typescript/src/index.ts`
-
-- [ ] **Step 1: Create package.json**
-
-```json
-{
-  "name": "protomcp",
-  "version": "0.1.0",
-  "description": "Write MCP tools in TypeScript. No MCP knowledge required.",
-  "type": "module",
-  "main": "dist/index.js",
-  "types": "dist/index.d.ts",
-  "scripts": {
-    "build": "tsc",
-    "test": "vitest run",
-    "test:watch": "vitest"
-  },
-  "dependencies": {
-    "protobufjs": "^7.0.0",
-    "zod": "^3.22.0",
-    "zod-to-json-schema": "^3.22.0"
-  },
-  "devDependencies": {
-    "typescript": "^5.3.0",
-    "vitest": "^1.0.0",
-    "@types/node": "^20.0.0"
-  }
-}
-```
-
-- [ ] **Step 2: Create tsconfig.json, vitest.config.ts, index.ts**
-
-Standard TypeScript config with ESM output. Index exports `tool`, `ToolResult`, `toolManager`.
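One plausible `tsconfig.json` for that setup (the compiler options are assumptions — the plan only specifies ESM output):

```json
{
  "compilerOptions": {
    "target": "ES2022",
    "module": "NodeNext",
    "moduleResolution": "NodeNext",
    "outDir": "dist",
    "declaration": true,
    "strict": true,
    "skipLibCheck": true
  },
  "include": ["src"]
}
```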
-
-- [ ] **Step 3: Install dependencies and commit**
-
-```bash
-cd sdk/typescript && npm install
-git add sdk/typescript/package.json sdk/typescript/tsconfig.json sdk/typescript/vitest.config.ts sdk/typescript/src/index.ts
-git commit -m "feat: initialize TypeScript SDK project"
-```
-
---
-
-### Task 23: TypeScript — tool() Function with Zod Schema
-
-**Files:**
-- Create: `sdk/typescript/src/tool.ts`
-- Create: `sdk/typescript/tests/tool.test.ts`
-
-- [ ] **Step 1: Write failing tests**
-
-```typescript
-import { describe, it, expect, beforeEach } from 'vitest';
-import { z } from 'zod';
-import { tool, getRegisteredTools, clearRegistry } from '../src/tool';
-
-describe('tool()', () => {
-  beforeEach(() => clearRegistry());
-
-  it('registers a tool with Zod schema', () => {
-    const add = tool({
-      name: 'add',
-      description: 'Add two numbers',
-      args: z.object({
-        a: z.number().describe('First number'),
-        b: z.number().describe('Second number'),
-      }),
-      handler: (args) => args.a + args.b,
-    });
-
-    const tools = getRegisteredTools();
-    expect(tools).toHaveLength(1);
-    expect(tools[0].name).toBe('add');
-    expect(tools[0].description).toBe('Add two numbers');
-  });
-
-  it('falls back to a generated name when none is given', () => {
-    const t = tool({
-      description: 'No name',
-      args: z.object({ x: z.number() }),
-      handler: (args) => args.x,
-    });
-    // Inline handlers get the inferred function name "handler", which is
-    // useless, so tool() falls back to tool_N when no explicit name is given.
-    expect(t.name).toMatch(/^tool_\d+$/);
-  });
-
-  it('generates JSON Schema from Zod', () => {
-    tool({
-      name: 'search',
-      description: 'Search',
-      args: z.object({
-        query: z.string().describe('Search query'),
-        limit: z.number().default(10).describe('Max results'),
-      }),
-      handler: (args) => [],
-    });
-
-    const tools = getRegisteredTools();
-    const schema = JSON.parse(tools[0].inputSchemaJson);
-    expect(schema.type).toBe('object');
-    expect(schema.properties.query.type).toBe('string');
-    expect(schema.properties.limit.default).toBe(10);
-    expect(schema.required).toContain('query');
-    expect(schema.required).not.toContain('limit');
-  });
-
-  it('handler is callable', () => {
-    const add = tool({
-      description: 'Add',
-      args: z.object({ a: z.number(), b: z.number() }),
-      handler: (args) => args.a + args.b,
-    });
-
-    expect(add.handler({ a: 2, b: 3 })).toBe(5);
-  });
-});
-```
-
-- [ ] **Step 2: Implement tool()**
-
-```typescript
-import { z } from 'zod';
-import { zodToJsonSchema } from 'zod-to-json-schema';
-
-interface ToolDef {
-  name: string;
-  description: string;
-  inputSchemaJson: string;
-  handler: (args: any) => any;
-}
-
-const registry: ToolDef[] = [];
-
-interface ToolOptions<T extends z.ZodObject<z.ZodRawShape>> {
-  description: string;
-  args: T;
-  handler: (args: z.infer<T>) => any;
-  name?: string; // defaults to tool_<registry index>
-}
-
-export function tool<T extends z.ZodObject<z.ZodRawShape>>(options: ToolOptions<T>): ToolDef {
-  const schema = zodToJsonSchema(options.args, { target: 'openApi3' });
-  const def: ToolDef = {
-    // Inline arrow handlers infer the name "handler", so handler.name is not a
-    // useful fallback; generate tool_N instead.
-    name: options.name ?? `tool_${registry.length}`,
-    description: options.description,
-    inputSchemaJson: JSON.stringify(schema),
-    handler: options.handler,
-  };
-  registry.push(def);
-  return def;
-}
-
-export function getRegisteredTools(): ToolDef[] {
-  return [...registry];
-}
-
-export function clearRegistry(): void {
-  registry.length = 0;
-}
-```
-
-- [ ] **Step 3: Test and commit**
-
-```bash
-cd sdk/typescript && npx vitest run tests/tool.test.ts
-git add sdk/typescript/src/tool.ts sdk/typescript/tests/tool.test.ts
-git commit -m "feat: implement TypeScript tool() function with Zod schema generation"
-```
-
---
-
-### Task 24: TypeScript — ToolResult, Transport, Manager, Runner
-
-**Files:**
-- Create: `sdk/typescript/src/result.ts`
-- Create: `sdk/typescript/src/transport.ts`
-- Create: `sdk/typescript/src/manager.ts`
-- Create: `sdk/typescript/src/runner.ts`
-- Create: `sdk/typescript/tests/result.test.ts`
-- Create: `sdk/typescript/tests/transport.test.ts`
-- Create: `sdk/typescript/tests/manager.test.ts`
-
-These mirror the Python implementations (camelCase naming aside):
-
-- **result.ts**: `ToolResult` interface with `result`, `isError`, `enableTools`, `disableTools`, `errorCode`, `message`, `suggestion`, `retryable`
-- **transport.ts**: Unix socket client with length-prefixed protobuf envelope read/write using `net.Socket` and `protobufjs`
-- **manager.ts**: `toolManager` with `enable()`, `disable()`, `setAllowed()`, `setBlocked()`, `getActiveTools()`, `batch()`
-- **runner.ts**: Main loop that connects to socket, listens for envelopes, dispatches tool calls, handles reload via Node module cache invalidation
-
-Follow the same TDD pattern as the Python tasks: write tests first, verify they fail, implement, verify they pass, commit.
-
-- [ ] **Step 1: Implement and test ToolResult**
-- [ ] **Step 2: Implement and test transport**
-- [ ] **Step 3: Implement and test manager**
-- [ ] **Step 4: Implement runner**
-- [ ] **Step 5: Commit all**
-
-```bash
-git add sdk/typescript/src/ sdk/typescript/tests/
-git commit -m "feat: implement TypeScript SDK — ToolResult, transport, manager, runner"
-```
-
---
-
-## Chunk 6: Integration Tests and Documentation
-
-### Task 25: End-to-End Integration Tests
-
-**Files:**
-- Create: `test/e2e/e2e_test.go`
-- Create: `test/e2e/helpers.go`
-- Create: `test/e2e/fixtures/simple_tool.py`
-- Create: `test/e2e/fixtures/dynamic_tool.py`
-- Create: `test/e2e/fixtures/simple_tool.ts`
-- Create: `test/e2e/fixtures/crash_tool.py`
-
-- [ ] **Step 1: Create test fixtures**
-
-`simple_tool.py`:
-```python
-from protomcp import tool
-
-@tool(description="Echo a message back")
-def echo(message: str) -> str:
-    return message
-
-@tool(description="Add two numbers")
-def add(a: int, b: int) -> int:
-    return a + b
-```
-
-`dynamic_tool.py`:
-```python
-from protomcp import tool, ToolResult, tool_manager
-
-# Start with admin_action hidden — it gets enabled after auth
-tool_manager.set_blocked(["admin_action"])
-
-@tool(description="Authenticate") -def auth(token: str) -> ToolResult: - if token == "valid": - return ToolResult( - result="Authenticated", - enable_tools=["admin_action"], - disable_tools=["auth"], - ) - return ToolResult(is_error=True, message="Invalid token", suggestion="Use 'valid' as token") - -@tool(description="Admin action (hidden until auth)") -def admin_action() -> str: - return "admin stuff done" -``` - -`crash_tool.py`: -```python -from protomcp import tool -import sys - -@tool(description="Crash the process") -def crash() -> str: - sys.exit(1) -``` - -`simple_tool.ts`: -```typescript -import { tool } from 'protomcp'; -import { z } from 'zod'; - -export const echo = tool({ - description: 'Echo a message back', - args: z.object({ message: z.string() }), - handler: (args) => args.message, -}); -``` - -- [ ] **Step 2: Write e2e test helpers** - -Create `test/e2e/helpers.go`: - -```go -package e2e - -import ( - "bufio" - "encoding/json" - "io" - "os/exec" - "testing" - - "github.com/msilverblatt/protomcp/internal/mcp" -) - -// StartProtomcp starts the protomcp binary with the given args. -// Returns stdin writer, stdout reader, and cleanup function. -func StartProtomcp(t *testing.T, args ...string) (io.Writer, *bufio.Scanner, func()) { - t.Helper() - cmd := exec.Command("../../bin/protomcp", args...) - stdin, _ := cmd.StdinPipe() - stdout, _ := cmd.StdoutPipe() - cmd.Stderr = nil // suppress stderr in tests - - if err := cmd.Start(); err != nil { - t.Fatalf("failed to start protomcp: %v", err) - } - - scanner := bufio.NewScanner(stdout) - cleanup := func() { - stdin.Close() - cmd.Process.Kill() - cmd.Wait() - } - - return stdin, scanner, cleanup -} - -// SendRequest sends a JSON-RPC request and reads the response. 
-func SendRequest(t *testing.T, w io.Writer, r *bufio.Scanner, method string, params interface{}) mcp.JSONRPCResponse { - t.Helper() - id := json.RawMessage(`1`) - p, _ := json.Marshal(params) - req := mcp.JSONRPCRequest{ - JSONRPC: "2.0", - ID: id, - Method: method, - Params: p, - } - data, _ := json.Marshal(req) - w.Write(append(data, '\n')) - - if !r.Scan() { - t.Fatal("no response from protomcp") - } - - var resp mcp.JSONRPCResponse - json.Unmarshal(r.Bytes(), &resp) - return resp -} -``` - -- [ ] **Step 3: Write e2e tests** - -Create `test/e2e/e2e_test.go`: - -```go -package e2e - -import ( - "encoding/json" - "testing" - - "github.com/msilverblatt/protomcp/internal/mcp" -) - -func TestE2E_Initialize(t *testing.T) { - w, r, cleanup := StartProtomcp(t, "dev", "fixtures/simple_tool.py") - defer cleanup() - - resp := SendRequest(t, w, r, "initialize", nil) - if resp.Error != nil { - t.Fatalf("initialize error: %v", resp.Error) - } - - var result mcp.InitializeResult - json.Unmarshal(resp.Result, &result) - if !result.Capabilities.Tools.ListChanged { - t.Error("expected tools.listChanged = true") - } -} - -func TestE2E_ToolsList(t *testing.T) { - w, r, cleanup := StartProtomcp(t, "dev", "fixtures/simple_tool.py") - defer cleanup() - - SendRequest(t, w, r, "initialize", nil) - resp := SendRequest(t, w, r, "tools/list", nil) - - var result mcp.ToolsListResult - json.Unmarshal(resp.Result, &result) - if len(result.Tools) != 2 { - t.Fatalf("expected 2 tools, got %d", len(result.Tools)) - } -} - -func TestE2E_ToolsCall(t *testing.T) { - w, r, cleanup := StartProtomcp(t, "dev", "fixtures/simple_tool.py") - defer cleanup() - - SendRequest(t, w, r, "initialize", nil) - resp := SendRequest(t, w, r, "tools/call", map[string]interface{}{ - "name": "echo", - "arguments": map[string]string{"message": "hello"}, - }) - - if resp.Error != nil { - t.Fatalf("tools/call error: %v", resp.Error) - } -} - -func TestE2E_DynamicToolList(t *testing.T) { - w, r, cleanup := StartProtomcp(t, 
"dev", "fixtures/dynamic_tool.py")
	defer cleanup()

	SendRequest(t, w, r, "initialize", nil)

	// Initially, auth should be visible but admin_action should not
	// (admin_action starts disabled — depends on how the fixture sets initial state)
	// Call auth with valid token
	resp := SendRequest(t, w, r, "tools/call", map[string]interface{}{
		"name":      "auth",
		"arguments": map[string]string{"token": "valid"},
	})
	if resp.Error != nil {
		t.Fatalf("auth call error: %v", resp.Error)
	}

	// After auth, admin_action should now be visible in tools/list
	listResp := SendRequest(t, w, r, "tools/list", nil)
	var result mcp.ToolsListResult
	json.Unmarshal(listResp.Result, &result)

	found := false
	for _, tool := range result.Tools {
		if tool.Name == "admin_action" {
			found = true
		}
	}
	if !found {
		t.Error("admin_action should be visible after auth")
	}
}

func TestE2E_TypeScript(t *testing.T) {
	w, r, cleanup := StartProtomcp(t, "dev", "fixtures/simple_tool.ts")
	defer cleanup()

	SendRequest(t, w, r, "initialize", nil)
	resp := SendRequest(t, w, r, "tools/list", nil)

	var result mcp.ToolsListResult
	json.Unmarshal(resp.Result, &result)
	if len(result.Tools) != 1 {
		t.Fatalf("expected 1 tool, got %d", len(result.Tools))
	}
	if result.Tools[0].Name != "echo" {
		t.Errorf("tool name = %q, want %q", result.Tools[0].Name, "echo")
	}
}
```

- [ ] **Step 4: Build binary and run e2e tests**

```bash
make build
go test ./test/e2e/... -v -timeout 60s
```

- [ ] **Step 5: Commit**

```bash
git add test/
git commit -m "feat: add end-to-end integration tests for Python, TypeScript, and dynamic tool lists"
```

---

### Task 26: Documentation Site Setup

**Files:**
- Create: `docs/package.json`
- Create: `docs/astro.config.mjs`
- Create: `docs/src/content/docs/index.mdx`

- [ ] **Step 1: Scaffold Starlight site**

```bash
cd docs && npm create astro@latest -- --template starlight
```

Or manually create `docs/package.json`:

```json
{
  "name": "protomcp-docs",
  "scripts": {
    "dev": "astro dev",
    "build": "astro build"
  },
  "dependencies": {
    "@astrojs/starlight": "latest",
    "astro": "latest"
  }
}
```

- [ ] **Step 2: Configure astro.config.mjs**

```javascript
import { defineConfig } from 'astro/config';
import starlight from '@astrojs/starlight';

export default defineConfig({
  integrations: [
    starlight({
      title: 'protomcp',
      description: 'Language-agnostic MCP runtime',
      social: {
        github: 'https://github.com/msilverblatt/protomcp',
      },
      sidebar: [
        {
          label: 'Getting Started',
          items: [
            { label: 'Installation', slug: 'getting-started/installation' },
            { label: 'Quick Start', slug: 'getting-started/quick-start' },
            { label: 'How It Works', slug: 'getting-started/how-it-works' },
          ],
        },
        {
          label: 'Guides',
          items: [
            { label: 'Writing Tools (Python)', slug: 'guides/writing-tools-python' },
            { label: 'Writing Tools (TypeScript)', slug: 'guides/writing-tools-typescript' },
            { label: 'Dynamic Tool Lists', slug: 'guides/dynamic-tool-lists' },
            { label: 'Hot Reload', slug: 'guides/hot-reload' },
            { label: 'Error Handling', slug: 'guides/error-handling' },
            { label: 'Production Deployment', slug: 'guides/production-deployment' },
          ],
        },
        {
          label: 'Reference',
          items: [
            { label: 'CLI', slug: 'reference/cli' },
            { label: 'Protobuf Spec', slug: 'reference/protobuf-spec' },
            { label: 'Python API', slug: 'reference/python-api' },
            { label: 'TypeScript API', slug: 'reference/typescript-api' },
          ],
        },
        {
          label: 'Concepts',
          items: [
            { label: 'Architecture', slug: 'concepts/architecture' },
            { label: 'Tool List Modes', slug: 'concepts/tool-list-modes' },
            { label: 'Transports', slug: 'concepts/transports' },
          ],
        },
      ],
    }),
  ],
});
```

- [ ] **Step 3: Install dependencies and verify build**

```bash
cd docs && npm install && npm run build
```

- [ ] **Step 4: Commit**

```bash
git add docs/package.json docs/astro.config.mjs docs/src/
git commit -m "feat: scaffold Starlight documentation site with sidebar structure"
```

---

### Task 27: Documentation — Getting Started Pages

**Files:**
- Create: `docs/src/content/docs/getting-started/installation.mdx`
- Create: `docs/src/content/docs/getting-started/quick-start.mdx`
- Create: `docs/src/content/docs/getting-started/how-it-works.mdx`

- [ ] **Step 1: Write Installation page**

Covers: Homebrew, binary download, and building from source. Platform-specific instructions for macOS, Linux, and Windows. Python and TypeScript SDK installation via pip/npm.

- [ ] **Step 2: Write Quick Start page**

A 5-minute tutorial:
1. Install protomcp
2. Write a Python tool file (3 lines)
3. Run `protomcp dev server.py`
4. Configure your MCP client
5. Use the tool — edit, save, see it update live

Include exact terminal output at each step.
- [ ] **Step 3: Write How It Works page**

Architecture explainer with Mermaid diagrams:
- The three layers (host, Go binary, tool process)
- How hot-reload works (sequence diagram)
- How dynamic tool lists work (state diagram)
- Why the Go binary never needs to change

- [ ] **Step 4: Commit**

```bash
git add docs/src/content/docs/getting-started/
git commit -m "docs: add Getting Started pages — installation, quick start, architecture"
```

---

### Task 28: Documentation — Guides

**Files:**
- Create: `docs/src/content/docs/guides/writing-tools-python.mdx`
- Create: `docs/src/content/docs/guides/writing-tools-typescript.mdx`
- Create: `docs/src/content/docs/guides/dynamic-tool-lists.mdx`
- Create: `docs/src/content/docs/guides/hot-reload.mdx`
- Create: `docs/src/content/docs/guides/error-handling.mdx`
- Create: `docs/src/content/docs/guides/production-deployment.mdx`

- [ ] **Step 1: Write Python guide**

Covers: the `@tool()` decorator, type hints for schema generation, `ToolResult`, `tool_manager`, async tools, and testing tools outside protomcp. All examples pulled from test files.

- [ ] **Step 2: Write TypeScript guide**

Covers: the `tool()` function, Zod schemas, `ToolResult`, `toolManager`. Parallel structure to the Python guide.

- [ ] **Step 3: Write Dynamic Tool Lists guide**

Covers: inline mutations (`enable_tools`/`disable_tools` in `ToolResult`), programmatic control (`tool_manager`), modes (open/allowlist/blocklist), batch operations, and event-driven examples (locks, auth).

- [ ] **Step 4: Write Hot Reload guide**

Covers: how it works, what triggers a reload, in-flight call handling (default vs immediate), reload logs, and common gotchas (module-level side effects, import caching).

- [ ] **Step 5: Write Error Handling guide**

Covers: structured errors (`error_code`, `message`, `suggestion`, `retryable`), how errors are formatted by the Go binary, and best practices for agent-friendly errors.
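The four structured-error fields the Error Handling guide covers can be pictured as a plain payload plus a rendering step. This is an illustrative sketch only: the dict shape stands in for the SDK's real error type, and `render_for_agent` is a hypothetical formatter, not the Go binary's actual output format.

```python
# Illustrative only: the structured-error fields named in the guide.
error = {
    "error_code": "RATE_LIMITED",  # stable, machine-readable code
    "message": "Upstream API rate limit exceeded",
    "suggestion": "Wait 30 seconds, then retry with a smaller batch",
    "retryable": True,
}

def render_for_agent(err: dict) -> str:
    # Hypothetical formatter: surfaces every field so an agent can act on it.
    retry = "retryable" if err["retryable"] else "not retryable"
    return f"[{err['error_code']}] {err['message']} ({retry}). Suggestion: {err['suggestion']}"
```

The point for guide authors: an agent can branch on `retryable` and `error_code` mechanically, while `suggestion` gives it a concrete next action.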
- [ ] **Step 6: Write Production Deployment guide**

Covers: `protomcp run` vs `protomcp dev`, transport selection for production, systemd/supervisor config, Docker (optional), and monitoring via logs.

- [ ] **Step 7: Commit**

```bash
git add docs/src/content/docs/guides/
git commit -m "docs: add all v1.0 guides — Python, TypeScript, dynamic tools, hot reload, errors, production"
```

---

### Task 29: Documentation — Reference Pages

**Files:**
- Create: `docs/src/content/docs/reference/cli.mdx`
- Create: `docs/src/content/docs/reference/protobuf-spec.mdx`
- Create: `docs/src/content/docs/reference/python-api.mdx`
- Create: `docs/src/content/docs/reference/typescript-api.mdx`

- [ ] **Step 1: Write CLI Reference**

Exhaustive documentation of `protomcp dev`, `protomcp run`, and all flags, with examples.

- [ ] **Step 2: Write Protobuf Spec Reference**

The full `.proto` file with annotated explanations of every message type, every field, and the wire format.

- [ ] **Step 3: Write Python API Reference**

Complete API docs for `@tool()`, `ToolResult`, and `tool_manager` — all parameters, return types, and examples.

- [ ] **Step 4: Write TypeScript API Reference**

Same as the Python reference, but for TS — `tool()`, `ToolResult`, `toolManager`.

- [ ] **Step 5: Commit**

```bash
git add docs/src/content/docs/reference/
git commit -m "docs: add reference pages — CLI, protobuf spec, Python API, TypeScript API"
```

---

### Task 30: Documentation — Concepts Pages

**Files:**
- Create: `docs/src/content/docs/concepts/architecture.mdx`
- Create: `docs/src/content/docs/concepts/tool-list-modes.mdx`
- Create: `docs/src/content/docs/concepts/transports.mdx`

- [ ] **Step 1: Write Architecture page**

Deep dive into the three-layer architecture with Mermaid diagrams. Explains why the Go binary is language-agnostic, how protobuf enables any-language support, and the unix socket communication pattern.
- [ ] **Step 2: Write Tool List Modes page**

Explains open/allowlist/blocklist modes, mode transitions, interaction semantics, and batch operations. Includes a state diagram.

- [ ] **Step 3: Write Transports page**

Explains all five transports, when to use each, configuration, and a client compatibility matrix.

- [ ] **Step 4: Build docs and verify**

```bash
cd docs && npm run build
```

- [ ] **Step 5: Commit**

```bash
git add docs/src/content/docs/concepts/
git commit -m "docs: add concept pages — architecture, tool list modes, transports"
```

---

## Chunk 7: MCP Advanced Features — Progress, Tasks, Cancellation, Logging, Structured Output, Tool Metadata

### Task 32: Go — Progress Notification Proxy

**Files:**
- Create: `internal/progress/progress.go`
- Create: `internal/progress/progress_test.go`

- [ ] **Step 1: Write failing test for progress proxy**

```go
// internal/progress/progress_test.go
package progress

import (
	"testing"

	pb "github.com/msilverblatt/protomcp/gen/proto/protomcp"
)

func TestProgressProxy_ForwardsToMCP(t *testing.T) {
	var sent []map[string]any
	proxy := NewProxy(func(notification map[string]any) {
		sent = append(sent, notification)
	})
	proxy.HandleProgress(&pb.ProgressNotification{
		ProgressToken: "tok-1",
		Progress:      5,
		Total:         10,
		Message:       "Processing item 5",
	})
	if len(sent) != 1 {
		t.Fatalf("expected 1 notification, got %d", len(sent))
	}
	if sent[0]["method"] != "notifications/progress" {
		t.Fatalf("expected notifications/progress, got %v", sent[0]["method"])
	}
}

func TestProgressProxy_DropsWhenNoToken(t *testing.T) {
	var sent []map[string]any
	proxy := NewProxy(func(notification map[string]any) {
		sent = append(sent, notification)
	})
	proxy.HandleProgress(&pb.ProgressNotification{
		ProgressToken: "",
		Progress:      1,
	})
	if len(sent) != 0 {
		t.Fatalf("expected 0 notifications for empty token, got %d", len(sent))
	}
}
```

- [ ] **Step 2: Run test to verify it fails**

Run: `go test ./internal/progress/ -v`
Expected: FAIL — package doesn't exist yet.

- [ ] **Step 3: Implement progress proxy**

```go
// internal/progress/progress.go
package progress

import pb "github.com/msilverblatt/protomcp/gen/proto/protomcp"

type NotifySender func(notification map[string]any)

type Proxy struct {
	send NotifySender
}

func NewProxy(send NotifySender) *Proxy {
	return &Proxy{send: send}
}

func (p *Proxy) HandleProgress(msg *pb.ProgressNotification) {
	if msg.ProgressToken == "" {
		return // Client didn't request progress — silently drop
	}
	params := map[string]any{
		"progressToken": msg.ProgressToken,
		"progress":      msg.Progress,
	}
	if msg.Total > 0 {
		params["total"] = msg.Total
	}
	if msg.Message != "" {
		params["message"] = msg.Message
	}
	p.send(map[string]any{
		"method": "notifications/progress",
		"params": params,
	})
}
```

- [ ] **Step 4: Run test to verify it passes**

Run: `go test ./internal/progress/ -v`
Expected: PASS

- [ ] **Step 5: Commit**

```bash
git add internal/progress/
git commit -m "feat: add progress notification proxy for MCP notifications/progress"
```

---

### Task 33: Go — Cancellation Tracker

**Files:**
- Create: `internal/cancel/tracker.go`
- Create: `internal/cancel/tracker_test.go`

- [ ] **Step 1: Write failing test for cancellation tracker**

```go
// internal/cancel/tracker_test.go
package cancel

import (
	"testing"
)

func TestTracker_SetAndCheck(t *testing.T) {
	tracker := NewTracker()
	tracker.TrackCall("req-1")
	if tracker.IsCancelled("req-1") {
		t.Fatal("should not be cancelled yet")
	}
	tracker.Cancel("req-1")
	if !tracker.IsCancelled("req-1") {
		t.Fatal("should be cancelled after Cancel()")
	}
}

func TestTracker_CancelUnknownRequestIsNoop(t *testing.T) {
	tracker := NewTracker()
	tracker.Cancel("nonexistent") // Should not panic
}

func TestTracker_CompleteRemovesTracking(t *testing.T) {
	tracker := NewTracker()
	tracker.TrackCall("req-1")
	tracker.Complete("req-1")
	if tracker.IsCancelled("req-1") {
		t.Fatal("completed call should not report cancelled")
	}
}
```

- [ ] **Step 2: Run test to verify it fails**

Run: `go test ./internal/cancel/ -v`
Expected: FAIL

- [ ] **Step 3: Implement cancellation tracker**

```go
// internal/cancel/tracker.go
package cancel

import "sync"

type Tracker struct {
	mu        sync.RWMutex
	cancelled map[string]bool
}

func NewTracker() *Tracker {
	return &Tracker{cancelled: make(map[string]bool)}
}

func (t *Tracker) TrackCall(requestID string) {
	t.mu.Lock()
	defer t.mu.Unlock()
	t.cancelled[requestID] = false
}

func (t *Tracker) Cancel(requestID string) {
	t.mu.Lock()
	defer t.mu.Unlock()
	if _, exists := t.cancelled[requestID]; exists {
		t.cancelled[requestID] = true
	}
}

func (t *Tracker) IsCancelled(requestID string) bool {
	t.mu.RLock()
	defer t.mu.RUnlock()
	return t.cancelled[requestID]
}

func (t *Tracker) Complete(requestID string) {
	t.mu.Lock()
	defer t.mu.Unlock()
	delete(t.cancelled, requestID)
}
```

- [ ] **Step 4: Run test to verify it passes**

Run: `go test ./internal/cancel/ -v`
Expected: PASS

- [ ] **Step 5: Commit**

```bash
git add internal/cancel/
git commit -m "feat: add cancellation tracker for cooperative tool call cancellation"
```

---

### Task 34: Go — Server Log Forwarder

**Files:**
- Create: `internal/serverlog/forwarder.go`
- Create: `internal/serverlog/forwarder_test.go`

- [ ] **Step 1: Write failing test for log forwarder**

```go
// internal/serverlog/forwarder_test.go
package serverlog

import (
	"testing"

	pb "github.com/msilverblatt/protomcp/gen/proto/protomcp"
)

func TestForwarder_ForwardsAboveLevel(t *testing.T) {
	var sent []map[string]any
	fwd := NewForwarder("info", func(n map[string]any) { sent = append(sent, n) })

	fwd.HandleLog(&pb.LogMessage{Level: "warning", DataJson: `{"msg":"rate limit"}`})
	if len(sent) != 1 {
		t.Fatalf("expected 1, got %d", len(sent))
	}
	if sent[0]["method"] != "notifications/message" {
		t.Fatalf("wrong method: %v", sent[0]["method"])
	}
}

func TestForwarder_FiltersBelowLevel(t *testing.T) {
	var sent []map[string]any
	fwd := NewForwarder("warning", func(n map[string]any) { sent = append(sent, n) })

	fwd.HandleLog(&pb.LogMessage{Level: "info", DataJson: `{"msg":"hello"}`})
	if len(sent) != 0 {
		t.Fatalf("expected 0 (filtered), got %d", len(sent))
	}
}
```

- [ ] **Step 2: Run test to verify it fails**

Run: `go test ./internal/serverlog/ -v`
Expected: FAIL

- [ ] **Step 3: Implement log forwarder**

```go
// internal/serverlog/forwarder.go
package serverlog

import (
	"encoding/json"

	pb "github.com/msilverblatt/protomcp/gen/proto/protomcp"
)

var levelPriority = map[string]int{
	"debug":     0,
	"info":      1,
	"notice":    2,
	"warning":   3,
	"error":     4,
	"critical":  5,
	"alert":     6,
	"emergency": 7,
}

type NotifySender func(notification map[string]any)

type Forwarder struct {
	minLevel int
	send     NotifySender
}

func NewForwarder(minLevelStr string, send NotifySender) *Forwarder {
	return &Forwarder{
		minLevel: levelPriority[minLevelStr],
		send:     send,
	}
}

func (f *Forwarder) HandleLog(msg *pb.LogMessage) {
	priority, ok := levelPriority[msg.Level]
	if !ok {
		priority = 1 // default to info for unknown levels
	}
	if priority < f.minLevel {
		return
	}
	params := map[string]any{
		"level": msg.Level,
	}
	if msg.Logger != "" {
		params["logger"] = msg.Logger
	}
	if msg.DataJson != "" {
		var data any
		if err := json.Unmarshal([]byte(msg.DataJson), &data); err == nil {
			params["data"] = data
		} else {
			params["data"] = msg.DataJson
		}
	}
	f.send(map[string]any{
		"method": "notifications/message",
		"params": params,
	})
}
```

- [ ] **Step 4: Run test to verify it passes**

Run: `go test ./internal/serverlog/ -v`
Expected: PASS

- [ ] **Step 5: Commit**

```bash
git add internal/serverlog/
git commit -m "feat: add server log forwarder for MCP notifications/message"
```

---

### Task 35: Go — Async Task Manager

**Files:**
- Create: `internal/tasks/manager.go`
- Create: `internal/tasks/manager_test.go`

- [ ] **Step 1: Write failing test for task manager**

```go
// internal/tasks/manager_test.go
package tasks

import (
	"testing"
)

func TestTaskManager_CreateAndGet(t *testing.T) {
	mgr := NewManager()
	mgr.Register("task-1", "req-1")
	state, err := mgr.GetStatus("task-1")
	if err != nil {
		t.Fatal(err)
	}
	if state.State != "running" {
		t.Fatalf("expected running, got %s", state.State)
	}
}

func TestTaskManager_FailOnCrash(t *testing.T) {
	mgr := NewManager()
	mgr.Register("task-1", "req-1")
	mgr.FailAll("tool process crashed")
	state, err := mgr.GetStatus("task-1")
	if err != nil {
		t.Fatal(err)
	}
	if state.State != "failed" {
		t.Fatalf("expected failed, got %s", state.State)
	}
}

func TestTaskManager_GetUnknownTask(t *testing.T) {
	mgr := NewManager()
	_, err := mgr.GetStatus("nonexistent")
	if err == nil {
		t.Fatal("expected error for unknown task")
	}
}
```

- [ ] **Step 2: Run test to verify it fails**

Run: `go test ./internal/tasks/ -v`
Expected: FAIL

- [ ] **Step 3: Implement task manager**

```go
// internal/tasks/manager.go
package tasks

import (
	"fmt"
	"sync"
)

type TaskState struct {
	State   string // running, completed, failed, cancelled
	Message string
}

type Manager struct {
	mu    sync.RWMutex
	tasks map[string]*TaskState
}

func NewManager() *Manager {
	return &Manager{tasks: make(map[string]*TaskState)}
}

func (m *Manager) Register(taskID, requestID string) {
	m.mu.Lock()
	defer m.mu.Unlock()
	m.tasks[taskID] = &TaskState{State: "running"}
}

func (m *Manager) GetStatus(taskID string) (*TaskState, error) {
	m.mu.RLock()
	defer m.mu.RUnlock()
	state, ok := m.tasks[taskID]
	if !ok {
		return nil, fmt.Errorf("unknown task: %s", taskID)
	}
	return state, nil
}

func (m *Manager) UpdateStatus(taskID, state, message string) error {
	m.mu.Lock()
	defer m.mu.Unlock()
	ts, ok := m.tasks[taskID]
	if !ok {
		return fmt.Errorf("unknown task: %s", taskID)
	}
	ts.State = state
	ts.Message = message
	return nil
}

func (m *Manager) FailAll(reason string) {
	m.mu.Lock()
	defer m.mu.Unlock()
	for _, ts := range m.tasks {
		if ts.State == "running" {
			ts.State = "failed"
			ts.Message = reason
		}
	}
}
```

- [ ] **Step 4: Run test to verify it passes**

Run: `go test ./internal/tasks/ -v`
Expected: PASS

- [ ] **Step 5: Commit**

```bash
git add internal/tasks/
git commit -m "feat: add async task manager for MCP task lifecycle"
```

---

### Task 36: Go — Integrate New Features into MCP Handler

**Files:**
- Modify: `internal/mcp/handler.go`
- Modify: `internal/mcp/handler_test.go`

- [ ] **Step 1: Write failing tests for new MCP handler capabilities**

Add tests to `internal/mcp/handler_test.go`:

```go
func TestHandler_ToolsCallWithProgressToken(t *testing.T) {
	// Test that _meta.progressToken is extracted and forwarded in CallToolRequest
	handler := newTestHandler()
	req := makeToolCallRequest("test_tool", `{"x": 1}`, map[string]any{"progressToken": "pt-1"})
	handler.HandleRequest(req)
	// Verify CallToolRequest sent to tool process includes progress_token = "pt-1"
	sentMsg := handler.lastSentToToolProcess()
	callReq := sentMsg.GetCallTool()
	if callReq.ProgressToken != "pt-1" {
		t.Fatalf("expected progress_token pt-1, got %s", callReq.ProgressToken)
	}
}

func TestHandler_NotificationsCancelled(t *testing.T) {
	// Test that notifications/cancelled is forwarded as CancelRequest
	handler := newTestHandler()
	handler.startToolCall("req-42")
	handler.HandleNotification("notifications/cancelled", map[string]any{"requestId": "req-42"})
	if !handler.cancelTracker.IsCancelled("req-42") {
		t.Fatal("expected req-42 to be cancelled")
	}
}

func TestHandler_ToolsCallReturnsStructuredContent(t *testing.T) {
	// Test that structuredContent is included when outputSchema is defined
	handler := newTestHandler()
	handler.setToolOutputSchema("search", `{"type":"array"}`)
	resp := handler.callTool("search", `{"q":"test"}`)
	if resp["structuredContent"] == nil {
		t.Fatal("expected structuredContent in response")
	}
}

func TestHandler_ToolDefinitionIncludesMetadata(t *testing.T) {
	// Test that tool metadata (title, hints, task_support) is included in tools/list
	handler := newTestHandler()
	tools := handler.handleToolsList()
	for _, tool := range tools {
		toolMap := tool.(map[string]any)
		if toolMap["name"] == "delete_doc" {
			annotations := toolMap["annotations"].(map[string]any)
			if annotations["destructiveHint"] != true {
				t.Fatal("expected destructiveHint on delete_doc")
			}
		}
	}
}
```

- [ ] **Step 2: Run tests to verify they fail**

Run: `go test ./internal/mcp/ -v -run "ProgressToken|Cancelled|StructuredContent|Metadata"`
Expected: FAIL

- [ ] **Step 3: Update MCP handler implementation**

Update `internal/mcp/handler.go` to:
1. Extract `_meta.progressToken` from `tools/call` requests and include it in `CallToolRequest.progress_token`
2. Handle `notifications/cancelled` by forwarding `CancelRequest` to the tool process and marking it in the cancel tracker
3. Include `outputSchema` in tool definitions from `ToolDefinition.output_schema_json`
4. Include `structuredContent` in `tools/call` responses from `CallToolResponse.structured_content_json`
5. Include `annotations` (title, hints) in tool definitions from `ToolDefinition` metadata fields
6. Include `execution.taskSupport` in tool definitions when `ToolDefinition.task_support` is true
7. Handle `tasks/get`, `tasks/result`, and `tasks/cancel` by forwarding to the tool process
8. Advertise the `tasks` capability in the `initialize` response when any tool has `task_support`
9. Handle `notifications/message` from the tool process by forwarding via the server log forwarder

- [ ] **Step 4: Run tests to verify they pass**

Run: `go test ./internal/mcp/ -v`
Expected: PASS

- [ ] **Step 5: Commit**

```bash
git add internal/mcp/
git commit -m "feat: integrate progress, cancellation, tasks, logging, structured output, and tool metadata into MCP handler"
```

---

### Task 37: Python SDK — ToolContext (Progress + Cancellation)

**Files:**
- Create: `sdk/python/src/protomcp/context.py`
- Create: `sdk/python/tests/test_context.py`

- [ ] **Step 1: Write failing test**

```python
# sdk/python/tests/test_context.py
from protomcp.context import ToolContext

def test_report_progress_sends_notification():
    sent = []
    ctx = ToolContext(progress_token="pt-1", send_fn=lambda msg: sent.append(msg))
    ctx.report_progress(progress=5, total=10, message="Working")
    assert len(sent) == 1
    assert sent[0].progress.progress_token == "pt-1"
    assert sent[0].progress.progress == 5
    assert sent[0].progress.total == 10

def test_report_progress_noop_without_token():
    sent = []
    ctx = ToolContext(progress_token="", send_fn=lambda msg: sent.append(msg))
    ctx.report_progress(progress=1)
    assert len(sent) == 0

def test_is_cancelled():
    ctx = ToolContext(progress_token="", send_fn=lambda msg: None)
    assert not ctx.is_cancelled()
    ctx._cancelled = True
    assert ctx.is_cancelled()
```

- [ ] **Step 2: Run test to verify it fails**

Run: `cd sdk/python && python -m pytest tests/test_context.py -v`
Expected: FAIL

- [ ] **Step 3: Implement ToolContext**

```python
# sdk/python/src/protomcp/context.py
import threading

from protomcp.gen import protomcp_pb2 as pb

class ToolContext:
    def __init__(self, progress_token: str, send_fn):
        self._progress_token = progress_token
        self._send_fn = send_fn
        self._cancelled = False
        self._lock = threading.Lock()

    def report_progress(self, progress: int, total: int = 0, message: str = ""):
        if not self._progress_token:
            return
        envelope = pb.Envelope(
            progress=pb.ProgressNotification(
                progress_token=self._progress_token,
                progress=progress,
                total=total,
                message=message,
            )
        )
        self._send_fn(envelope)

    def is_cancelled(self) -> bool:
        with self._lock:
            return self._cancelled

    def _set_cancelled(self):
        with self._lock:
            self._cancelled = True
```

- [ ] **Step 4: Run test to verify it passes**

Run: `cd sdk/python && python -m pytest tests/test_context.py -v`
Expected: PASS

- [ ] **Step 5: Commit**

```bash
git add sdk/python/src/protomcp/context.py sdk/python/tests/test_context.py
git commit -m "feat(python): add ToolContext with progress reporting and cancellation"
```

---

### Task 38: Python SDK — Server Logging API

**Files:**
- Create: `sdk/python/src/protomcp/log.py`
- Create: `sdk/python/tests/test_log.py`

- [ ] **Step 1: Write failing test**

```python
# sdk/python/tests/test_log.py
from protomcp.log import ServerLogger

def test_log_info():
    sent = []
    logger = ServerLogger(send_fn=lambda msg: sent.append(msg))
    logger.info("hello", data={"count": 5})
    assert len(sent) == 1
    assert sent[0].log.level == "info"
    assert '"count": 5' in sent[0].log.data_json or '"count":5' in sent[0].log.data_json

def test_log_with_logger_name():
    sent = []
    logger = ServerLogger(send_fn=lambda msg: sent.append(msg), name="cache")
    logger.debug("hit")
    assert sent[0].log.logger == "cache"

def test_all_levels():
    sent = []
    logger = ServerLogger(send_fn=lambda msg: sent.append(msg))
    for level in ["debug", "info", "notice", "warning", "error", "critical", "alert", "emergency"]:
        getattr(logger, level)("test")
    assert len(sent) == 8
```

- [ ] **Step 2: Run test to verify it fails**

Run: `cd sdk/python && python -m pytest tests/test_log.py -v`
Expected: FAIL

- [ ] **Step 3: Implement ServerLogger**

```python
# sdk/python/src/protomcp/log.py
import json

from protomcp.gen import protomcp_pb2 as pb

class ServerLogger:
    def __init__(self, send_fn, name: str = ""):
        self._send_fn = send_fn
        self._name = name

    def _log(self, level: str, message: str, data: dict | None = None):
        data_json = json.dumps(data) if data else json.dumps({"message": message})
        envelope = pb.Envelope(
            log=pb.LogMessage(
                level=level,
                logger=self._name,
                data_json=data_json,
            )
        )
        self._send_fn(envelope)

    def debug(self, message: str, **kwargs): self._log("debug", message, kwargs.get("data"))
    def info(self, message: str, **kwargs): self._log("info", message, kwargs.get("data"))
    def notice(self, message: str, **kwargs): self._log("notice", message, kwargs.get("data"))
    def warning(self, message: str, **kwargs): self._log("warning", message, kwargs.get("data"))
    def error(self, message: str, **kwargs): self._log("error", message, kwargs.get("data"))
    def critical(self, message: str, **kwargs): self._log("critical", message, kwargs.get("data"))
    def alert(self, message: str, **kwargs): self._log("alert", message, kwargs.get("data"))
    def emergency(self, message: str, **kwargs): self._log("emergency", message, kwargs.get("data"))
```

- [ ] **Step 4: Run test to verify it passes**

Run: `cd sdk/python && python -m pytest tests/test_log.py -v`
Expected: PASS

- [ ] **Step 5: Commit**

```bash
git add sdk/python/src/protomcp/log.py sdk/python/tests/test_log.py
git commit -m "feat(python): add server logging API for MCP notifications/message"
```

---

### Task 39: Python SDK — Structured Output and Tool Metadata

**Files:**
- Modify: `sdk/python/src/protomcp/tool.py`
- Modify: `sdk/python/tests/test_tool.py`

- [ ] **Step 1: Write failing tests for output_type and metadata**

Add to `sdk/python/tests/test_tool.py`:

```python
from dataclasses import dataclass

def test_tool_with_output_type():
    clear_registry()

    @dataclass
    class SearchResult:
        title: str
        score: float

    @tool(description="Search", output_type=SearchResult)
    def search(query: str) -> SearchResult:
        return SearchResult(title="test", score=0.9)

    tools = get_registered_tools()
    assert tools[0].output_schema_json != ""
    schema = json.loads(tools[0].output_schema_json)
    assert "title" in schema["properties"]
    assert "score" in schema["properties"]

def test_tool_with_metadata():
    clear_registry()

    @tool(
        description="Delete doc",
        title="Delete Document",
        destructive=True,
        idempotent=True,
    )
    def delete_doc(doc_id: str) -> str:
        return "deleted"

    tools = get_registered_tools()
    assert tools[0].title == "Delete Document"
    assert tools[0].destructive_hint is True
    assert tools[0].idempotent_hint is True

def test_tool_with_task_support():
    clear_registry()

    @tool(description="Long task", task_support=True)
    async def long_task(data: str) -> str:
        return "done"

    tools = get_registered_tools()
    assert tools[0].task_support is True
```

- [ ] **Step 2: Run tests to verify they fail**

Run: `cd sdk/python && python -m pytest tests/test_tool.py -v -k "output_type or metadata or task_support"`
Expected: FAIL

- [ ] **Step 3: Update @tool decorator**

Update `sdk/python/src/protomcp/tool.py` to accept `output_type`, `title`, `destructive`, `idempotent`, `read_only`, `open_world`, and `task_support` parameters. Generate `output_schema_json` from the output type's fields using the same schema generation logic. Set the corresponding fields on `ToolDefinition`.
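The schema generation referenced in Step 3 could follow the rough shape below. This is a sketch under stated assumptions: output types are dataclasses, and only a minimal Python-to-JSON type mapping is shown (the real SDK's generator may cover more types and nesting).

```python
import json
from dataclasses import dataclass, fields

# Assumed minimal type mapping; the real generator may handle more (assumption).
_PY_TO_JSON = {str: "string", float: "number", int: "integer", bool: "boolean"}

def output_schema_json(output_type) -> str:
    """Build a JSON Schema string from a dataclass's typed fields."""
    props = {f.name: {"type": _PY_TO_JSON.get(f.type, "string")} for f in fields(output_type)}
    return json.dumps({
        "type": "object",
        "properties": props,
        "required": [f.name for f in fields(output_type)],
    })

@dataclass
class SearchResult:
    title: str
    score: float

schema = json.loads(output_schema_json(SearchResult))
# schema["properties"] → {"title": {"type": "string"}, "score": {"type": "number"}}
```

A generator like this is what would make `test_tool_with_output_type` above pass: the decorated tool's `output_schema_json` ends up with `title` and `score` in `properties`.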
- -- [ ] **Step 4: Run tests to verify they pass** - -Run: `cd sdk/python && python -m pytest tests/test_tool.py -v` -Expected: PASS - -- [ ] **Step 5: Commit** - -```bash -git add sdk/python/src/protomcp/tool.py sdk/python/tests/test_tool.py -git commit -m "feat(python): add output_type, tool metadata, and task_support to @tool decorator" -``` - ---- - -### Task 40: Python SDK — Update Runner for New Features - -**Files:** -- Modify: `sdk/python/src/protomcp/runner.py` -- Modify: `sdk/python/src/protomcp/__init__.py` - -- [ ] **Step 1: Update runner to handle new message types** - -Update `sdk/python/src/protomcp/runner.py` to: -1. Create `ToolContext` with `progress_token` from `CallToolRequest` and pass it to tool handlers that accept a `ctx` parameter (detected via `inspect.signature`) -2. Handle incoming `CancelRequest` by calling `ctx._set_cancelled()` on the matching in-flight call -3. Initialize `ServerLogger` and expose as module-level `log` in `__init__.py` -4. For tools with `task_support=True`, run handler in a background thread, immediately return `CreateTaskResponse`, and handle `TaskStatusRequest`/`TaskResultRequest`/`TaskCancelRequest` by querying the running task - -- [ ] **Step 2: Update __init__.py exports** - -```python -# sdk/python/src/protomcp/__init__.py -from protomcp.tool import tool -from protomcp.result import ToolResult -from protomcp.manager import tool_manager -from protomcp.context import ToolContext -from protomcp.log import ServerLogger - -log = ServerLogger(send_fn=None) # Initialized by runner on connect -``` - -- [ ] **Step 3: Run all Python tests** - -Run: `cd sdk/python && python -m pytest tests/ -v` -Expected: PASS - -- [ ] **Step 4: Commit** - -```bash -git add sdk/python/src/protomcp/ -git commit -m "feat(python): integrate progress, cancellation, logging, and async tasks into runner" -``` - ---- - -### Task 41: TypeScript SDK — ToolContext, Logging, Structured Output, Metadata - -**Files:** -- Create: 
`sdk/typescript/src/context.ts` -- Create: `sdk/typescript/src/log.ts` -- Create: `sdk/typescript/tests/context.test.ts` -- Create: `sdk/typescript/tests/log.test.ts` -- Modify: `sdk/typescript/src/tool.ts` -- Modify: `sdk/typescript/tests/tool.test.ts` -- Modify: `sdk/typescript/src/runner.ts` -- Modify: `sdk/typescript/src/index.ts` - -- [ ] **Step 1: Write failing tests for ToolContext** - -```typescript -// sdk/typescript/tests/context.test.ts -import { describe, it, expect } from 'vitest'; -import { ToolContext } from '../src/context'; - -describe('ToolContext', () => { - it('sends progress notification', () => { - const sent: any[] = []; - const ctx = new ToolContext('pt-1', (msg) => sent.push(msg)); - ctx.reportProgress(5, 10, 'Working'); - expect(sent).toHaveLength(1); - expect(sent[0].progress.progressToken).toBe('pt-1'); - }); - - it('is noop without progress token', () => { - const sent: any[] = []; - const ctx = new ToolContext('', (msg) => sent.push(msg)); - ctx.reportProgress(1); - expect(sent).toHaveLength(0); - }); - - it('tracks cancellation', () => { - const ctx = new ToolContext('', () => {}); - expect(ctx.isCancelled()).toBe(false); - ctx.setCancelled(); - expect(ctx.isCancelled()).toBe(true); - }); -}); -``` - -- [ ] **Step 2: Write failing tests for ServerLogger** - -```typescript -// sdk/typescript/tests/log.test.ts -import { describe, it, expect } from 'vitest'; -import { ServerLogger } from '../src/log'; - -describe('ServerLogger', () => { - it('sends log message', () => { - const sent: any[] = []; - const logger = new ServerLogger((msg) => sent.push(msg)); - logger.info('hello', { count: 5 }); - expect(sent).toHaveLength(1); - expect(sent[0].log.level).toBe('info'); - }); - - it('supports all RFC 5424 levels', () => { - const sent: any[] = []; - const logger = new ServerLogger((msg) => sent.push(msg)); - const levels = ['debug', 'info', 'notice', 'warning', 'error', 'critical', 'alert', 'emergency'] as const; - for (const level of levels) 
{
-      logger[level]('test');
-    }
-    expect(sent).toHaveLength(8);
-  });
-});
-```
-
-- [ ] **Step 3: Run tests to verify they fail**
-
-Run: `cd sdk/typescript && npx vitest run --reporter=verbose`
-Expected: FAIL
-
-- [ ] **Step 4: Implement ToolContext**
-
-```typescript
-// sdk/typescript/src/context.ts
-export class ToolContext {
-  private _cancelled = false;
-  constructor(
-    private readonly progressToken: string,
-    private readonly sendFn: (msg: any) => void,
-  ) {}
-
-  reportProgress(progress: number, total?: number, message?: string) {
-    if (!this.progressToken) return;
-    this.sendFn({
-      progress: {
-        progressToken: this.progressToken,
-        progress,
-        ...(total !== undefined && { total }),
-        ...(message !== undefined && { message }),
-      },
-    });
-  }
-
-  isCancelled(): boolean { return this._cancelled; }
-  setCancelled() { this._cancelled = true; }
-}
-```
-
-- [ ] **Step 5: Implement ServerLogger**
-
-```typescript
-// sdk/typescript/src/log.ts
-const LEVELS = ['debug', 'info', 'notice', 'warning', 'error', 'critical', 'alert', 'emergency'] as const;
-type LogLevel = typeof LEVELS[number];
-
-export class ServerLogger {
-  constructor(
-    private sendFn: (msg: any) => void,
-    private name?: string,
-  ) {}
-
-  private _log(level: LogLevel, message: string, data?: Record<string, unknown>) {
-    this.sendFn({
-      log: {
-        level,
-        logger: this.name ?? '',
-        dataJson: JSON.stringify(data ?? { message }),
-      },
-    });
-  }
-
-  debug(msg: string, data?: Record<string, unknown>) { this._log('debug', msg, data); }
-  info(msg: string, data?: Record<string, unknown>) { this._log('info', msg, data); }
-  notice(msg: string, data?: Record<string, unknown>) { this._log('notice', msg, data); }
-  warning(msg: string, data?: Record<string, unknown>) { this._log('warning', msg, data); }
-  error(msg: string, data?: Record<string, unknown>) { this._log('error', msg, data); }
-  critical(msg: string, data?: Record<string, unknown>) { this._log('critical', msg, data); }
-  alert(msg: string, data?: Record<string, unknown>) { this._log('alert', msg, data); }
-  emergency(msg: string, data?: Record<string, unknown>) { this._log('emergency', msg, data); }
-}
-```
-
-- [ ] **Step 6: Update tool() to support output, metadata, and task_support**
-
-Update `sdk/typescript/src/tool.ts` to accept `output` (Zod schema), `title`, `destructiveHint`, `idempotentHint`, `readOnlyHint`, `openWorldHint`, and `taskSupport` options. Generate `output_schema_json` from the Zod output schema. Set corresponding fields on the `ToolDefinition`.
-
-Add tests to `sdk/typescript/tests/tool.test.ts`:
-
-```typescript
-it('generates output schema from Zod', () => {
-  const OutputSchema = z.object({ title: z.string(), score: z.number() });
-  const t = tool({
-    name: 'search',
-    description: 'Search',
-    args: z.object({ q: z.string() }),
-    output: OutputSchema,
-    handler: (args) => ({ title: 'test', score: 0.9 }),
-  });
-  expect(t.definition.outputSchemaJson).toBeTruthy();
-  const schema = JSON.parse(t.definition.outputSchemaJson);
-  expect(schema.properties.title).toBeTruthy();
-});
-
-it('includes tool metadata', () => {
-  const t = tool({
-    name: 'delete_doc',
-    description: 'Delete',
-    args: z.object({ id: z.string() }),
-    title: 'Delete Document',
-    destructiveHint: true,
-    handler: (args) => 'deleted',
-  });
-  expect(t.definition.title).toBe('Delete Document');
-  expect(t.definition.destructiveHint).toBe(true);
-});
-```
-
-- [ ] **Step 7: Update runner and index exports**
-
-Update `sdk/typescript/src/runner.ts` to handle new 
message types (same as Python runner — ToolContext injection, cancel handling, async task lifecycle, log initialization). - -Update `sdk/typescript/src/index.ts`: - -```typescript -export { tool, ToolResult } from './tool'; -export { toolManager } from './manager'; -export { ToolContext } from './context'; -export { ServerLogger } from './log'; -``` - -- [ ] **Step 8: Run all TypeScript tests** - -Run: `cd sdk/typescript && npx vitest run --reporter=verbose` -Expected: PASS - -- [ ] **Step 9: Commit** - -```bash -git add sdk/typescript/ -git commit -m "feat(typescript): add progress, cancellation, logging, structured output, and tool metadata" -``` - ---- - -### Task 42: E2E Tests for New Features - -**Files:** -- Create: `test/e2e/fixtures/progress_tool.py` -- Create: `test/e2e/fixtures/async_tool.py` -- Create: `test/e2e/fixtures/logging_tool.py` -- Create: `test/e2e/fixtures/structured_output_tool.py` -- Modify: `test/e2e/e2e_test.go` - -- [ ] **Step 1: Create test fixtures** - -`progress_tool.py`: -```python -from protomcp import tool, ToolContext - -@tool(description="Count with progress") -def count_with_progress(n: int, ctx: ToolContext) -> str: - for i in range(n): - ctx.report_progress(i + 1, n, f"Step {i + 1}") - return f"Counted to {n}" -``` - -`async_tool.py`: -```python -import asyncio -from protomcp import tool - -@tool(description="Async task", task_support=True) -async def slow_task(duration_ms: int) -> str: - await asyncio.sleep(duration_ms / 1000) - return f"Completed after {duration_ms}ms" -``` - -`logging_tool.py`: -```python -from protomcp import tool, log - -@tool(description="Tool that logs") -def logging_tool(message: str) -> str: - log.info("Tool called", data={"message": message}) - log.debug("Debug detail") - return f"Logged: {message}" -``` - -`structured_output_tool.py`: -```python -from dataclasses import dataclass -from protomcp import tool - -@dataclass -class SearchResult: - title: str - score: float - -@tool(description="Structured 
search", output_type=SearchResult) -def search(query: str) -> SearchResult: - return SearchResult(title=f"Result for {query}", score=0.95) -``` - -- [ ] **Step 2: Write e2e tests** - -Add to `test/e2e/e2e_test.go`: - -```go -func TestE2E_ProgressNotifications(t *testing.T) { - binary, cleanup := buildBinary(t) - defer cleanup() - client := startWithFixture(t, binary, "progress_tool.py") - defer client.Close() - - notifications := client.CollectNotifications() - result := client.CallTool("count_with_progress", map[string]any{ - "n": 3, - }, map[string]any{"progressToken": "pt-test"}) - - assertNoError(t, result) - progressNotifs := filterNotifications(notifications, "notifications/progress") - if len(progressNotifs) != 3 { - t.Fatalf("expected 3 progress notifications, got %d", len(progressNotifs)) - } -} - -func TestE2E_AsyncTask(t *testing.T) { - binary, cleanup := buildBinary(t) - defer cleanup() - client := startWithFixture(t, binary, "async_tool.py") - defer client.Close() - - result := client.CallTool("slow_task", map[string]any{"duration_ms": 100}) - // Should get a CreateTaskResult with taskId - taskID := result["taskId"].(string) - if taskID == "" { - t.Fatal("expected taskId in response") - } - - // Poll until complete - var status map[string]any - for i := 0; i < 20; i++ { - status = client.TaskGet(taskID) - if status["state"] == "completed" { - break - } - time.Sleep(50 * time.Millisecond) - } - if status["state"] != "completed" { - t.Fatalf("expected completed, got %s", status["state"]) - } - - // Get result - taskResult := client.TaskResult(taskID) - assertNoError(t, taskResult) -} - -func TestE2E_ServerLogging(t *testing.T) { - binary, cleanup := buildBinary(t) - defer cleanup() - client := startWithFixture(t, binary, "logging_tool.py") - defer client.Close() - - notifications := client.CollectNotifications() - client.CallTool("logging_tool", map[string]any{"message": "test"}) - - logNotifs := filterNotifications(notifications, 
"notifications/message") - if len(logNotifs) == 0 { - t.Fatal("expected at least one log notification") - } -} - -func TestE2E_StructuredOutput(t *testing.T) { - binary, cleanup := buildBinary(t) - defer cleanup() - client := startWithFixture(t, binary, "structured_output_tool.py") - defer client.Close() - - // Verify tools/list includes outputSchema - tools := client.ListTools() - searchTool := findTool(tools, "search") - if searchTool["outputSchema"] == nil { - t.Fatal("expected outputSchema on search tool") - } - - // Verify call result includes structuredContent - result := client.CallTool("search", map[string]any{"query": "test"}) - if result["structuredContent"] == nil { - t.Fatal("expected structuredContent in result") - } -} -``` - -- [ ] **Step 3: Run e2e tests** - -Run: `go test ./test/e2e/... -v -timeout 60s -run "Progress|Async|Logging|Structured"` -Expected: PASS - -- [ ] **Step 4: Commit** - -```bash -git add test/e2e/ -git commit -m "test: add e2e tests for progress, async tasks, server logging, and structured output" -``` - ---- - -### Task 43: Documentation — New Feature Guides - -**Files:** -- Create: `docs/src/content/docs/guides/progress-notifications.mdx` -- Create: `docs/src/content/docs/guides/async-tasks.mdx` -- Create: `docs/src/content/docs/guides/cancellation.mdx` -- Create: `docs/src/content/docs/guides/server-logging.mdx` -- Create: `docs/src/content/docs/guides/structured-output.mdx` - -- [ ] **Step 1: Write progress notifications guide** - -Cover: how to use `ToolContext.report_progress()`, what happens with/without progressToken, Python and TS examples. - -- [ ] **Step 2: Write async tasks guide** - -Cover: `task_support=True`, how async tools work, task lifecycle (create → poll → result), cancellation of tasks, Python and TS examples. - -- [ ] **Step 3: Write cancellation guide** - -Cover: `ctx.is_cancelled()`, cooperative cancellation pattern, how it interacts with async tasks, Python and TS examples. 
- -- [ ] **Step 4: Write server logging guide** - -Cover: log levels (RFC 5424), `log.info()`/`log.debug()` etc., how `--log-level` filters, named loggers, Python and TS examples. - -- [ ] **Step 5: Write structured output guide** - -Cover: `output_type`/`output` parameter, how `outputSchema` appears in tool definitions, `structuredContent` in results, Python and TS examples. - -- [ ] **Step 6: Update Starlight sidebar config** - -Add new guide pages to the sidebar in `docs/astro.config.mjs`. - -- [ ] **Step 7: Build docs to verify** - -Run: `cd docs && npm run build` -Expected: builds successfully. - -- [ ] **Step 8: Commit** - -```bash -git add docs/ -git commit -m "docs: add guides for progress, async tasks, cancellation, logging, and structured output" -``` - ---- - -### Task 31: Final Verification - -- [ ] **Step 1: Run all Go tests** - -```bash -make test -``` - -Expected: all tests pass. - -- [ ] **Step 2: Run Python SDK tests** - -```bash -make test-python -``` - -Expected: all tests pass. - -- [ ] **Step 3: Run TypeScript SDK tests** - -```bash -make test-ts -``` - -Expected: all tests pass. - -- [ ] **Step 4: Run e2e tests** - -```bash -go test ./test/e2e/... -v -timeout 60s -``` - -Expected: all tests pass. - -- [ ] **Step 5: Build documentation** - -```bash -cd docs && npm run build -``` - -Expected: builds successfully. - -- [ ] **Step 6: Build release binary** - -```bash -goreleaser build --snapshot --clean -``` - -Expected: binaries for linux/darwin/windows amd64/arm64. 
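For reference, a minimal `.goreleaser.yaml` sketch that would yield that build matrix is shown below. This is an assumption for illustration — the repository's actual config (entry-point path, build flags) may differ:

```yaml
# Hypothetical minimal .goreleaser.yaml — the repo's real config may differ.
builds:
  - id: pmcp
    main: ./cmd/pmcp   # assumed entry point
    goos: [linux, darwin, windows]
    goarch: [amd64, arm64]
    env:
      - CGO_ENABLED=0  # static binaries, no runtime dependencies
```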
-
-- [ ] **Step 7: Final commit**
-
-```bash
-git add -A
-git commit -m "chore: final v1.1 verification — all tests pass, docs build, release builds"
-```
diff --git a/docs/superpowers/plans/2026-03-12-readme-demos-interactive.md b/docs/superpowers/plans/2026-03-12-readme-demos-interactive.md
deleted file mode 100644
index 71874a1..0000000
--- a/docs/superpowers/plans/2026-03-12-readme-demos-interactive.md
+++ /dev/null
@@ -1,1695 +0,0 @@
-# README, Working Demos & Interactive Demo Page — Implementation Plan
-
-> **For agentic workers:** REQUIRED: Use superpowers:subagent-driven-development (if subagents available) or superpowers:executing-plans to implement this plan. Steps use checkbox (`- [ ]`) syntax for tracking.
-
-**Goal:** Create a README, runnable examples at three tiers in Python+TypeScript, and an animated interactive demo page in the Starlight docs site.
-
-**Architecture:** Three independent deliverables. Examples use the protomcp Python/TypeScript SDKs directly. The demo page uses Astro components embedded in a Starlight MDX page with CSS animations and minimal JS for tab toggling.
-
-**Tech Stack:** Markdown (README), Python/TypeScript (examples), Astro/Starlight (demo page), CSS @keyframes (animations), bash (demo runner)
-
----
-
-## Chunk 1: Working Code Examples
-
-### Task 1: Basic Python Example
-
-**Files:**
-- Create: `examples/python/basic.py`
-
-- [ ] **Step 1: Create the basic Python example**
-
-```python
-# examples/python/basic.py
-# A minimal protomcp tool — adds two numbers. 
-# Run: pmcp dev examples/python/basic.py - -from protomcp import tool, ToolResult - -@tool("Add two numbers") -def add(a: int, b: int) -> ToolResult: - return ToolResult(result=str(a + b)) - -@tool("Multiply two numbers") -def multiply(a: int, b: int) -> ToolResult: - return ToolResult(result=str(a * b)) -``` - -- [ ] **Step 2: Verify it parses** - -Run: `python -c "import ast; ast.parse(open('examples/python/basic.py').read()); print('OK')"` -Expected: `OK` - -- [ ] **Step 3: Commit** - -```bash -git add examples/python/basic.py -git commit -m "examples: add basic Python example" -``` - ---- - -### Task 2: Basic TypeScript Example - -**Files:** -- Create: `examples/typescript/basic.ts` - -- [ ] **Step 1: Create the basic TypeScript example** - -```typescript -// examples/typescript/basic.ts -// A minimal protomcp tool — adds two numbers. -// Run: pmcp dev examples/typescript/basic.ts - -import { tool, ToolResult } from 'protomcp'; -import { z } from 'zod'; - -tool({ - name: 'add', - description: 'Add two numbers', - args: z.object({ a: z.number(), b: z.number() }), - handler({ a, b }) { - return new ToolResult({ result: String(a + b) }); - }, -}); - -tool({ - name: 'multiply', - description: 'Multiply two numbers', - args: z.object({ a: z.number(), b: z.number() }), - handler({ a, b }) { - return new ToolResult({ result: String(a * b) }); - }, -}); -``` - -- [ ] **Step 2: Commit** - -```bash -git add examples/typescript/basic.ts -git commit -m "examples: add basic TypeScript example" -``` - ---- - -### Task 3: Real-World Python Example - -**Files:** -- Create: `examples/python/real_world.py` - -- [ ] **Step 1: Create the real-world Python example** - -This is a file search tool that demonstrates progress reporting, logging, and cancellation. - -```python -# examples/python/real_world.py -# A file search tool demonstrating progress, logging, and cancellation. 
-# Run: pmcp dev examples/python/real_world.py - -import os -import fnmatch -from protomcp import tool, ToolResult, ToolContext, log - -@tool("Search files in a directory by glob pattern", read_only=True) -def search_files(ctx: ToolContext, directory: str, pattern: str, max_results: int = 50) -> ToolResult: - log.info(f"Searching {directory} for '{pattern}'") - - if not os.path.isdir(directory): - return ToolResult( - result=f"Directory not found: {directory}", - is_error=True, - error_code="INVALID_PATH", - message="The specified directory does not exist", - suggestion="Check the path and try again", - ) - - matches = [] - all_files = [] - for root, dirs, files in os.walk(directory): - for f in files: - all_files.append(os.path.join(root, f)) - - total = len(all_files) - log.debug(f"Found {total} files to scan") - - for i, filepath in enumerate(all_files): - if ctx.is_cancelled(): - log.warning("Search cancelled by client") - return ToolResult( - result=f"Cancelled after scanning {i}/{total} files. Found {len(matches)} matches so far.", - is_error=True, - error_code="CANCELLED", - retryable=True, - ) - - if i % 100 == 0: - ctx.report_progress(i, total, f"Scanning... 
{i}/{total}") - - if fnmatch.fnmatch(os.path.basename(filepath), pattern): - matches.append(filepath) - if len(matches) >= max_results: - log.info(f"Hit max_results={max_results}, stopping early") - break - - ctx.report_progress(total, total, "Complete") - log.info(f"Search complete: {len(matches)} matches") - return ToolResult(result="\n".join(matches) if matches else "No files found") -``` - -- [ ] **Step 2: Verify it parses** - -Run: `python -c "import ast; ast.parse(open('examples/python/real_world.py').read()); print('OK')"` -Expected: `OK` - -- [ ] **Step 3: Commit** - -```bash -git add examples/python/real_world.py -git commit -m "examples: add real-world Python example with progress and cancellation" -``` - ---- - -### Task 4: Real-World TypeScript Example - -**Files:** -- Create: `examples/typescript/real-world.ts` - -- [ ] **Step 1: Create the real-world TypeScript example** - -```typescript -// examples/typescript/real-world.ts -// A file search tool demonstrating progress, logging, and cancellation. -// Run: pmcp dev examples/typescript/real-world.ts - -import { tool, ToolResult, ToolContext, ServerLogger } from 'protomcp'; -import { z } from 'zod'; -import * as fs from 'fs'; -import * as path from 'path'; - -// Note: ServerLogger requires a transport send function. In a real pmcp process, -// this is wired up automatically by the runner. For demonstration purposes, -// we show the API shape — logging calls are forwarded to the MCP host. 
- -tool({ - name: 'search_files', - description: 'Search files in a directory by glob pattern', - readOnlyHint: true, - args: z.object({ - directory: z.string(), - pattern: z.string(), - max_results: z.number().default(50), - }), - handler({ directory, pattern, max_results }, ctx: ToolContext) { - if (!fs.existsSync(directory)) { - return new ToolResult({ - result: `Directory not found: ${directory}`, - isError: true, - errorCode: 'INVALID_PATH', - message: 'The specified directory does not exist', - suggestion: 'Check the path and try again', - }); - } - - const matches: string[] = []; - const allFiles: string[] = []; - - function walk(dir: string) { - for (const entry of fs.readdirSync(dir, { withFileTypes: true })) { - const full = path.join(dir, entry.name); - if (entry.isDirectory()) walk(full); - else allFiles.push(full); - } - } - walk(directory); - - const total = allFiles.length; - - for (let i = 0; i < total; i++) { - if (ctx.isCancelled()) { - return new ToolResult({ - result: `Cancelled after scanning ${i}/${total} files. Found ${matches.length} matches so far.`, - isError: true, - errorCode: 'CANCELLED', - retryable: true, - }); - } - - if (i % 100 === 0) { - ctx.reportProgress(i, total, `Scanning... ${i}/${total}`); - } - - if (matchGlob(path.basename(allFiles[i]), pattern)) { - matches.push(allFiles[i]); - if (matches.length >= max_results) break; - } - } - - ctx.reportProgress(total, total, 'Complete'); - return new ToolResult({ - result: matches.length > 0 ? 
matches.join('\n') : 'No files found', - }); - }, -}); - -function matchGlob(filename: string, pattern: string): boolean { - const regex = new RegExp( - '^' + pattern.replace(/\*/g, '.*').replace(/\?/g, '.') + '$' - ); - return regex.test(filename); -} -``` - -- [ ] **Step 2: Commit** - -```bash -git add examples/typescript/real-world.ts -git commit -m "examples: add real-world TypeScript example with progress and cancellation" -``` - ---- - -### Task 5: Full Showcase Python Example - -**Files:** -- Create: `examples/python/full_showcase.py` - -- [ ] **Step 1: Create the full showcase Python example** - -Multi-tool server demonstrating structured output, dynamic tool lists, metadata, progress, cancellation, and logging. - -```python -# examples/python/full_showcase.py -# Full-featured protomcp demo — multiple tools showcasing the complete API. -# Run: pmcp dev examples/python/full_showcase.py - -import json -import time -from dataclasses import dataclass -from protomcp import tool, ToolResult, ToolContext, log -from protomcp import tool_manager - -# --- Tool 1: Structured output with output schema --- - -@dataclass -class WeatherData: - location: str - temperature_f: float - conditions: str - humidity: int - -@tool( - "Get current weather for a location", - output_type=WeatherData, - read_only=True, - title="Weather Lookup", -) -def get_weather(location: str) -> ToolResult: - log.info(f"Weather lookup for {location}") - # Simulated weather data - data = WeatherData( - location=location, - temperature_f=72.5, - conditions="Partly cloudy", - humidity=45, - ) - return ToolResult(result=json.dumps({ - "location": data.location, - "temperature_f": data.temperature_f, - "conditions": data.conditions, - "humidity": data.humidity, - })) - -# --- Tool 2: Long-running operation with progress --- - -@tool( - "Analyze a dataset (simulated long-running task)", - title="Dataset Analyzer", - idempotent=True, - task_support=True, -) -def analyze_dataset(ctx: ToolContext, 
dataset_name: str, depth: str = "basic") -> ToolResult: - log.info(f"Starting analysis of {dataset_name} at depth={depth}") - steps = 10 - - for i in range(steps): - if ctx.is_cancelled(): - log.warning(f"Analysis cancelled at step {i}/{steps}") - return ToolResult( - result=f"Analysis cancelled at step {i}/{steps}", - is_error=True, - error_code="CANCELLED", - retryable=True, - ) - ctx.report_progress(i, steps, f"Analyzing step {i+1}/{steps}...") - time.sleep(0.1) # Simulate work - - ctx.report_progress(steps, steps, "Analysis complete") - log.info("Analysis finished successfully") - return ToolResult(result=json.dumps({ - "dataset": dataset_name, - "depth": depth, - "rows_analyzed": 15000, - "anomalies_found": 3, - "summary": "Dataset is healthy with 3 minor anomalies detected.", - })) - -# --- Tool 3: Dynamic tool list management --- - -@tool( - "Enable or disable tools at runtime", - title="Tool Manager", - destructive=True, -) -def manage_tools(action: str, tool_names: str) -> ToolResult: - names = [n.strip() for n in tool_names.split(",")] - log.info(f"manage_tools: action={action}, names={names}") - - if action == "enable": - active = tool_manager.enable(names) - elif action == "disable": - active = tool_manager.disable(names) - elif action == "list": - active = tool_manager.get_active_tools() - else: - return ToolResult( - result=f"Unknown action: {action}", - is_error=True, - error_code="INVALID_ACTION", - suggestion="Use 'enable', 'disable', or 'list'", - ) - - return ToolResult(result=json.dumps({"active_tools": active})) - -# --- Tool 4: Demonstrates error handling and logging levels --- - -@tool( - "Validate data against a schema (demonstrates error handling)", - title="Data Validator", - read_only=True, - idempotent=True, -) -def validate_data(data_json: str, strict: bool = False) -> ToolResult: - log.debug("Starting validation") - - try: - data = json.loads(data_json) - except json.JSONDecodeError as e: - log.error(f"Invalid JSON: {e}") - return 
ToolResult( - result=f"Invalid JSON: {e}", - is_error=True, - error_code="PARSE_ERROR", - message="The input is not valid JSON", - suggestion="Check for syntax errors and try again", - retryable=True, - ) - - issues = [] - if not isinstance(data, dict): - issues.append("Root must be an object") - elif "name" not in data: - issues.append("Missing required field: name") - - if strict and isinstance(data, dict): - allowed = {"name", "value", "tags"} - extra = set(data.keys()) - allowed - if extra: - issues.append(f"Unknown fields: {', '.join(extra)}") - - if issues: - log.warning(f"Validation failed: {issues}") - return ToolResult( - result=json.dumps({"valid": False, "issues": issues}), - is_error=True, - error_code="VALIDATION_FAILED", - ) - - log.info("Validation passed") - return ToolResult(result=json.dumps({"valid": True, "issues": []})) -``` - -- [ ] **Step 2: Verify it parses** - -Run: `python -c "import ast; ast.parse(open('examples/python/full_showcase.py').read()); print('OK')"` -Expected: `OK` - -- [ ] **Step 3: Commit** - -```bash -git add examples/python/full_showcase.py -git commit -m "examples: add full showcase Python example with structured output, dynamic tools, and error handling" -``` - ---- - -### Task 6: Full Showcase TypeScript Example - -**Files:** -- Create: `examples/typescript/full-showcase.ts` - -- [ ] **Step 1: Create the full showcase TypeScript example** - -```typescript -// examples/typescript/full-showcase.ts -// Full-featured protomcp demo — multiple tools showcasing the complete API. -// Run: pmcp dev examples/typescript/full-showcase.ts - -import { tool, ToolResult, ToolContext, toolManager, ServerLogger } from 'protomcp'; -import { z } from 'zod'; - -// Note: ServerLogger is wired to the MCP host transport automatically by the runner. -// For demonstration, we show how to create one — in practice, use the runner-provided instance. 
- -// --- Tool 1: Structured output with output schema --- - -const WeatherOutput = z.object({ - location: z.string(), - temperature_f: z.number(), - conditions: z.string(), - humidity: z.number(), -}); - -tool({ - name: 'get_weather', - description: 'Get current weather for a location', - title: 'Weather Lookup', - readOnlyHint: true, - output: WeatherOutput, - args: z.object({ location: z.string() }), - handler({ location }) { - const data = { - location, - temperature_f: 72.5, - conditions: 'Partly cloudy', - humidity: 45, - }; - return new ToolResult({ result: JSON.stringify(data) }); - }, -}); - -// --- Tool 2: Long-running operation with progress + task support --- - -tool({ - name: 'analyze_dataset', - description: 'Analyze a dataset (simulated long-running task)', - title: 'Dataset Analyzer', - idempotentHint: true, - taskSupport: true, - args: z.object({ - dataset_name: z.string(), - depth: z.enum(['basic', 'deep']).default('basic'), - }), - async handler({ dataset_name, depth }, ctx: ToolContext) { - const steps = 10; - for (let i = 0; i < steps; i++) { - if (ctx.isCancelled()) { - return new ToolResult({ - result: `Analysis cancelled at step ${i}/${steps}`, - isError: true, - errorCode: 'CANCELLED', - retryable: true, - }); - } - ctx.reportProgress(i, steps, `Analyzing step ${i + 1}/${steps}...`); - await new Promise(r => setTimeout(r, 100)); // Simulate work - } - ctx.reportProgress(steps, steps, 'Analysis complete'); - return new ToolResult({ - result: JSON.stringify({ - dataset: dataset_name, - depth, - rows_analyzed: 15000, - anomalies_found: 3, - summary: 'Dataset is healthy with 3 minor anomalies detected.', - }), - }); - }, -}); - -// --- Tool 3: Dynamic tool list management --- - -tool({ - name: 'manage_tools', - description: 'Enable or disable tools at runtime', - title: 'Tool Manager', - destructiveHint: true, - args: z.object({ - action: z.enum(['enable', 'disable', 'list']), - tool_names: z.string().describe('Comma-separated tool names'), - 
}), - async handler({ action, tool_names }) { - const names = tool_names.split(',').map(n => n.trim()); - let active: string[]; - switch (action) { - case 'enable': - active = await toolManager.enable(names); - break; - case 'disable': - active = await toolManager.disable(names); - break; - case 'list': - active = await toolManager.getActiveTools(); - break; - } - return new ToolResult({ result: JSON.stringify({ active_tools: active }) }); - }, -}); - -// --- Tool 4: Error handling, validation, and logging --- - -tool({ - name: 'validate_data', - description: 'Validate data against a schema (demonstrates error handling)', - title: 'Data Validator', - readOnlyHint: true, - idempotentHint: true, - args: z.object({ - data_json: z.string(), - strict: z.boolean().default(false), - }), - handler({ data_json, strict }) { - let data: unknown; - try { - data = JSON.parse(data_json); - } catch (e) { - return new ToolResult({ - result: `Invalid JSON: ${e}`, - isError: true, - errorCode: 'PARSE_ERROR', - message: 'The input is not valid JSON', - suggestion: 'Check for syntax errors and try again', - retryable: true, - }); - } - - const issues: string[] = []; - if (typeof data !== 'object' || data === null || Array.isArray(data)) { - issues.push('Root must be an object'); - } else { - if (!('name' in data)) issues.push('Missing required field: name'); - if (strict) { - const allowed = new Set(['name', 'value', 'tags']); - const extra = Object.keys(data).filter(k => !allowed.has(k)); - if (extra.length) issues.push(`Unknown fields: ${extra.join(', ')}`); - } - } - - if (issues.length) { - return new ToolResult({ - result: JSON.stringify({ valid: false, issues }), - isError: true, - errorCode: 'VALIDATION_FAILED', - }); - } - - return new ToolResult({ result: JSON.stringify({ valid: true, issues: [] }) }); - }, -}); -``` - -- [ ] **Step 2: Commit** - -```bash -git add examples/typescript/full-showcase.ts -git commit -m "examples: add full showcase TypeScript example with 
structured output, dynamic tools, and error handling" -``` - ---- - -### Task 7: Example Dependency Files - -**Files:** -- Create: `examples/python/requirements.txt` -- Create: `examples/typescript/package.json` -- Create: `examples/typescript/tsconfig.json` - -- [ ] **Step 1: Create Python requirements.txt** - -``` -protomcp -``` - -- [ ] **Step 2: Create TypeScript package.json** - -```json -{ - "name": "protomcp-examples", - "private": true, - "type": "module", - "dependencies": { - "protomcp": "file:../../sdk/typescript", - "zod": "^3.22.0" - } -} -``` - -Note: Uses `file:` reference to the local SDK so examples work without publishing to npm. - -- [ ] **Step 3: Create TypeScript tsconfig.json** - -```json -{ - "compilerOptions": { - "target": "ES2022", - "module": "ES2022", - "moduleResolution": "node", - "esModuleInterop": true, - "strict": true, - "outDir": "dist" - }, - "include": ["*.ts"] -} -``` - -- [ ] **Step 4: Commit** - -```bash -git add examples/python/requirements.txt examples/typescript/package.json examples/typescript/tsconfig.json -git commit -m "examples: add dependency files for Python and TypeScript examples" -``` - ---- - -### Task 8: Demo Runner Script - -**Files:** -- Create: `examples/run-demo.sh` - -- [ ] **Step 1: Create the demo runner script** - -This script starts `pmcp dev` for each example, sends JSON-RPC messages over stdio, and prints human-readable output. It performs the full MCP handshake: `initialize` → `initialized` notification → `tools/list` → `tools/call`. - -```bash -#!/usr/bin/env bash -set -euo pipefail - -# examples/run-demo.sh -# Runs each example through pmcp, demonstrating the MCP protocol interaction. -# Requires: pmcp installed and on PATH - -RED='\033[0;31m' -GREEN='\033[0;32m' -CYAN='\033[0;36m' -YELLOW='\033[1;33m' -NC='\033[0m' - -SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)" -PASSED=0 -FAILED=0 - -if ! command -v pmcp &> /dev/null; then - echo -e "${RED}Error: pmcp not found. 
Install it first: brew install msilverblatt/tap/protomcp${NC}"
-  exit 1
-fi
-
-# Send a JSON-RPC request to a pmcp process and capture the response.
-# Usage: run_example