From aa2b6008e71a8ed4138227b820744484a8fd881f Mon Sep 17 00:00:00 2001
From: nathan shearer <help@rapidstartup.io>
Date: Sat, 28 Mar 2026 17:34:58 +0800
Subject: [PATCH 1/4] docs: map existing codebase

---
 .planning/codebase/ARCHITECTURE.md | 153 +++++++++++++++++++++
 .planning/codebase/CONCERNS.md     | 140 +++++++++++++++++++
 .planning/codebase/CONVENTIONS.md  | 135 ++++++++++++++++++
 .planning/codebase/INTEGRATIONS.md | 106 +++++++++++++++
 .planning/codebase/STACK.md        |  70 ++++++++++
 .planning/codebase/STRUCTURE.md    | 212 +++++++++++++++++++++++++++++
 .planning/codebase/TESTING.md      | 186 +++++++++++++++++++++++++
 7 files changed, 1002 insertions(+)
 create mode 100644 .planning/codebase/ARCHITECTURE.md
 create mode 100644 .planning/codebase/CONCERNS.md
 create mode 100644 .planning/codebase/CONVENTIONS.md
 create mode 100644 .planning/codebase/INTEGRATIONS.md
 create mode 100644 .planning/codebase/STACK.md
 create mode 100644 .planning/codebase/STRUCTURE.md
 create mode 100644 .planning/codebase/TESTING.md
diff --git a/.planning/codebase/ARCHITECTURE.md b/.planning/codebase/ARCHITECTURE.md
new file mode 100644
index 000000000..970f696b6
--- /dev/null
+++ b/.planning/codebase/ARCHITECTURE.md
@@ -0,0 +1,153 @@
+# Architecture
+
+**Analysis Date:** 2026-03-28
+
+## Pattern Overview
+
+**Overall:** Modular skill-based architecture with headless browser automation core
+
+**Key Characteristics:**
+- Skills as independent, self-contained modules with defined interfaces
+- Persistent headless browser server for automation tasks
+- CLI wrappers that communicate with persistent services
+- Template-driven skill generation system
+- Centralized configuration and state management
+
+## Layers
+
+**Presentation Layer (CLI):**
+- Purpose: Command-line interfaces for user interaction with skills
+- Location: `*/src/cli.ts` files across modules (browse, design, etc.)
+- Contains: Argument parsing, command routing, user output formatting
+- Depends on: Service layers, configuration systems
+- Used by: End users, scripts, other CLIs
+
+**Service Layer:**
+- Purpose: Core functionality implementation for each skill domain
+- Location: `*/src/` directories (e.g., `browse/src/`, `design/src/`)
+- Contains: Business logic, API integrations, core algorithms
+- Depends on: Infrastructure layer, external SDKs
+- Used by: Presentation layer, other services
+
+**Infrastructure Layer:**
+- Purpose: Shared utilities, configuration, state management, server infrastructure
+- Location: `browse/src/config.ts`, `browse/src/server.ts`, `scripts/` utilities
+- Contains: Persistent browser server, state persistence, config resolution, helper functions
+- Depends on: External packages (playwright, puppeteer-core, etc.)
+- Used by: All service and presentation layers
+
+**Template/Generation Layer:**
+- Purpose: Skill template system and documentation generation
+- Location: `scripts/gen-skill-docs.ts`, `.tmpl` template files
+- Contains: Template processing, skill scaffolding, documentation generation
+- Depends on: File system, template engines
+- Used by: Development workflows, skill creation process
+
+## Data Flow
+
+**Skill Execution Flow:**
+
+1. **Command Invocation:** User runs `gstack <skill> <command>` or direct binary (`browse`, `design`)
+2. **CLI Parsing:** Argument parsing and command routing in `*/src/cli.ts`
+3. **Server Management:** For browse skill, ensures persistent server is running via `ensureServer()`
+4. **Service Call:** Routes to appropriate service function based on command
+5. **Execution:** Service performs core functionality (browser automation, design generation, etc.)
+6. **Result Return:** Output formatted and returned to user via stdout/stderr
+
+**Browser Automation Flow (Browse Skill):**
+1. CLI reads state file (`.gstack/browse.json`) for server connection info
+2. If missing/stale, starts persistent Bun server running `browse/src/server.ts`
+3. CLI sends HTTP commands to server on localhost:port with bearer token auth
+4. Server executes Playwright/Puppeteer commands against Chromium
+5. Results returned via HTTP to CLI, then to user
+
+**Skill Documentation Flow:**
+1. `gen-skill-docs.ts` reads skill YAML/YAML-like configuration
+2. Processes SKILL.md.tmpl templates with skill-specific data
+3. Generates final SKILL.md files in each skill directory
+4. Also generates codex-specific variants when requested
+
+## Key Abstractions
+
+**Skill Abstraction:**
+- Purpose: Standardized interface for all gstack skills
+- Examples: `agents/openai.yaml`, `*/SKILL.md`, `*/SKILL.md.tmpl`
+- Pattern: Each skill has CLI, optional server, templates, tests, and documentation
+
+**Persistent Server Abstraction:**
+- Purpose: Long-running browser automation service
+- Examples: `browse/src/server.ts`, `browse/src/cli.ts` management functions
+- Pattern: State file (.gstack/browse.json) tracks PID, port, token; health checks via HTTP
+
+**Configuration Abstraction:**
+- Purpose: Centralized config resolution with defaults and environment overrides
+- Examples: `browse/src/config.ts`, `resolveConfig()` function
+- Pattern: Hierarchical resolution (defaults → file → env → args) with validation
+
+**Template Abstraction:**
+- Purpose: Reusable skill scaffolding and documentation generation
+- Examples: `SKILL.md.tmpl` files, `gen-skill-docs.ts` script
+- Pattern: Handlebars-style templating with skill metadata injection
+
+## Entry Points
+
+**Binary Entry Points:**
+- `browse/dist/browse`: Compiled browse CLI (primary user entry point)
+- `design/dist/design`: Compiled design CLI
+- `bin/gstack-global-discover`: Global skill discovery utility
+- `browse/dist/find-browse`: Helper for finding browse instances
+
+**Script Entry Points:**
+- `scripts/gen-skill-docs.ts`: Skill documentation generation
+- `scripts/skill-check.ts`: Skill health validation
+- `scripts/dev-skill.ts`: Skill development helper
+- `scripts/discover-skills.ts`: Skill discovery and listing
+
+**Direct Source Entry Points (Dev):**
+- `browse/src/cli.ts`: Development browse CLI
+- `design/src/cli.ts`: Development design CLI
+- `*/src/cli.ts`: Development CLIs for other skills
+
+## Error Handling
+
+**Strategy:** Defensive programming with clear error messages and graceful degradation
+
+**Patterns:**
+- **Server Lifecycle:** Automatic restart on version mismatch or failure, with startup error capture
+- **CLI Validation:** Early argument validation with clear usage instructions
+- **Network Resilience:** Retry mechanisms for transient connection failures in HTTP communication
+- **Process Management:** Cross-platform process detection and cleanup (Windows/Linux/macOS differences)
+- **Authentication:** Token validation with automatic refresh on mismatch
+- **File Operations:** Existence checks before read/write, graceful handling of missing files
+
+**Specific Implementations:**
+- Browse skill uses HTTP health checks (`isServerHealthy()`) instead of PID checks for cross-platform reliability
+- Windows uses Node.js child_process with detached:true for proper process detachment
+- Legacy state cleanup prevents conflicts between different installation methods
+- Server startup includes timeout handling and error log capture for diagnostics
+
+## Cross-Cutting Concerns
+
+**Logging:** 
+- Primary: Console output with color-coded prefixes (`[browse]`, `[design]`, etc.)
+- Levels: Error (console.error), info/status (console.log), debug (conditional)
+- Pattern: Consistent prefixed output for easy filtering
+
+**Validation:**
+- Input: Early validation of CLI arguments and configuration values
+- API: Response validation from external services (OpenAI, browser automation)
+- State: Version checking to detect mismatches between CLI and server binaries
+
+**State Management:**
+- Location: `.gstack/` directory in user home or project root
+- Persistence: JSON state files for server connection info, tokens, version hashes
+- Coordination: File-based locking to prevent race conditions during server startup
+- Cleanup: Automatic cleanup of stale state and legacy /tmp files
+
+**Authentication:**
+- Mechanism: Bearer token auth for CLI-to-server communication
+- Storage: Encrypted file storage (`~/.gstack/openai.json` for design, `.gstack/browse.json` for browse)
+- Resolution: Multiple sources (file → env → interactive prompt) with guided setup
+
+---
+*Architecture analysis: 2026-03-28*
\ No newline at end of file
diff --git a/.planning/codebase/CONCERNS.md b/.planning/codebase/CONCERNS.md
new file mode 100644
index 000000000..5a5ab349a
--- /dev/null
+++ b/.planning/codebase/CONCERNS.md
@@ -0,0 +1,140 @@
+# Codebase Concerns
+
+**Analysis Date:** 2026-03-28
+
+## Tech Debt
+
+**[Documentation gaps]:**
+- Issue: Many skill directories lack clear documentation on purpose and usage
+- Files: `agents/skill-*/README.md` (missing or minimal in many skills)
+- Impact: Difficult for new contributors to understand skill boundaries and responsibilities
+- Fix approach: Add standardized README templates for each skill with purpose, inputs, outputs, and examples
+
+**[Configuration complexity]:**
+- Issue: Multiple configuration mechanisms across skills (JSON, env vars, hardcoded values)
+- Files: `agents/*/config.ts`, `agents/*/*.json`, `.env.example`
+- Impact: Inconsistent configuration patterns increase cognitive load
+- Fix approach: Establish unified configuration pattern using `resolveConfig()` utility
+
+**[Build script fragmentation]:**
+- Issue: Build and setup scripts scattered across multiple directories
+- Files: `setup*`, `bin/*`, `scripts/*`, `package.json` scripts
+- Impact: Difficult to discover and maintain development workflows
+- Fix approach: Consolidate scripts into standardized locations with clear documentation
+
+## Known Bugs
+
+**[Skill registration failures]:**
+- Symptoms: Skills fail to load due to missing adapter configurations
+- Files: `agents/skill-parser.test.ts`, `agents/*/adapter.ts`
+- Trigger: When skill adapter doesn't implement required interfaces correctly
+- Workaround: Manual verification of adapter implementation
+- Fix approach: Add runtime validation during skill loading with clear error messages
+
+**[Browser cookie import race conditions]:**
+- Symptoms: Cookie import fails intermittently when browser is busy
+- Files: `browse/src/cookie-import-browser.ts`, `setup-browser-cookies/*`
+- Trigger: Concurrent access to browser profile during import
+- Workaround: Retry mechanism with exponential backoff
+- Fix approach: Implement proper file locking or use browser automation APIs
+
+## Security Considerations
+
+**[Environment variable exposure]:**
+- Risk: Accidental committing of `.env` files containing secrets
+- Files: `.env.example` (template), potential `.env*` files in developer environments
+- Current mitigation: `.gitignore` excludes `.env*` files
+- Recommendations: Add pre-commit hook to scan for accidental secrets, use secrets scanning in CI
+
+**[Insecure random number generation]:**
+- Risk: Use of non-cryptographically random values for security-sensitive operations
+- Files: `browse/src/sidebar-agent.ts` (generation of session IDs)
+- Current mitigation: None identified
+- Recommendations: Replace `Math.random()` with `crypto.randomUUID()` or similar secure alternatives
+
+## Performance Bottlenecks
+
+**[Skill loading latency]:**
+- Problem: Initial skill discovery and loading takes significant time
+- Files: `agents/skill-parser.ts`, `agents/skill-validation.ts`
+- Cause: Sequential file system operations for each skill directory
+- Improvement path: Implement skill caching with filesystem watchers for invalidation
+
+**[Browser instance multiplication]:**
+- Problem: Multiple browser instances spawned unnecessarily
+- Files: `browse/src/browser-manager.ts`, `browse/src/server.ts`
+- Cause: Lack of proper singleton pattern for browser manager
+- Improvement path: enforce singleton pattern and reuse browser contexts where safe
+
+## Fragile Areas
+
+**[Agent communication protocol]:**
+- Files: `agents/paperclip/*.ts`, `agents/*/adapter.ts`
+- Why fragile: Loose coupling via JSON messages without schema validation
+- Safe modification: Add JSON schema validation for all inter-agent messages
+- Test coverage: Gaps in error handling for malformed messages
+
+**[File system operation safety]:**
+- Files: `scripts/*` (file manipulation scripts), `setup*` scripts
+- Why fragile: Synchronous file operations without proper error handling
+- Safe modification: Wrap FS operations in try/catch with meaningful error messages
+- Test coverage: Limited unit testing for edge cases (permissions, missing directories)
+
+## Scaling Limits
+
+**[Concurrent skill execution]:**
+- Current capacity: Sequential skill execution in workflows
+- Limit: Long-running skills block entire workflow
+- Scaling path: Implement proper async/await patterns and worker queues for parallel execution
+
+**[Memory usage in browser operations]:**
+- Current capacity: Single browser session per user
+- Limit: Memory leaks in long-running browser sessions
+- Scaling path: Implement periodic browser restart and memory monitoring
+
+## Dependencies at Risk
+
+**[PUPPETEER_EXECUTABLE_PATH]:**
+- Risk: Hardcoded paths to browser executables in `browse/src/platform.ts`
+- Impact: Breaks when browser updates or when running in different environments
+- Migration plan: Use environment-configurable paths with auto-detection fallback
+
+**[Node.js version compatibility]:**
+- Risk: Use of modern Node.js features (`import.meta`, top-level await) that may break on older versions
+- Impact: Limits deployment environments
+- Migration plan: Either require specific Node.js version or transpile for broader compatibility
+
+## Missing Critical Features
+
+**[Skill versioning]:**
+- Problem: No mechanism to track skill versions or dependencies
+- Blocks: Safe updates and rollback of skills
+- Proposed solution: Add version metadata to skill configuration and implement compatibility checking
+
+**[Skill sandboxing]:**
+- Problem: Skills run with full process access
+- Blocks: Safe execution of third-party or untrusted skills
+- Proposed solution: Implement skill execution in restricted environments (e.g., VMs, containers)
+
+## Test Coverage Gaps
+
+**[Error handling in adapters]:**
+- What's not tested: Adapter failure scenarios and recovery
+- Files: `agents/*/adapter.ts`
+- Risk: Silent failures in skill execution
+- Priority: High
+
+**[Edge cases in file system operations]:**
+- What's not tested: Permission errors, disk full, concurrent access
+- Files: `scripts/*`, `setup*` scripts
+- Risk: Unhandled exceptions causing partial setup states
+- Priority: Medium
+
+**[Browser automation failure modes]:**
+- What's not tested: Network failures, browser crashes, element not found
+- Files: `browse/src/*`
+- Risk: Unreliable UI automation
+- Priority: High
+
+---
+*Concerns audit: 2026-03-28*
\ No newline at end of file
diff --git a/.planning/codebase/CONVENTIONS.md b/.planning/codebase/CONVENTIONS.md
new file mode 100644
index 000000000..d2807b275
--- /dev/null
+++ b/.planning/codebase/CONVENTIONS.md
@@ -0,0 +1,135 @@
+# Coding Conventions
+
+**Analysis Date:** 2026-03-28
+
+## Naming Patterns
+
+**Files:**
+- TypeScript files use kebab-case naming: `skill-parser.test.ts`, `gen-skill-docs.ts`
+- Test files follow `[feature].test.ts` pattern: `audit-compliance.test.ts`, `skill-e2e.test.ts`
+- Helper files in test directories use camelCase: `session-runner.ts`
+
+**Functions:**
+- Functions use camelCase: `extractBrowseCommands`, `validateSkill`, `parseArgs`
+- Async functions follow same naming: `runSetup`, `main`
+
+**Variables:**
+- Constants use UPPER_SNAKE_CASE: `FIXTURES_DIR`, `ROOT`, `AI_SLOP_BLACKLIST`
+- Variables use camelCase: `hasChanges`, `tokenBudget`, `cmds`
+- Boolean variables use is/has prefixes: `inBashBlock`, `DRY_RUN`
+
+**Types/Interfaces:**
+- Interface names use PascalCase: `BrowseCommand`, `ValidationResult`, `TemplateContext`
+- Type aliases follow PascalCase: `Host`
+
+## Code Style
+
+**Formatting:**
+- Uses 2-space indentation consistently
+- Line length varies but generally stays under 100 characters
+- No explicit formatter configured; follows existing code patterns
+- Semicolons are required and used consistently
+
+**Linting:**
+- No explicit linting configuration detected (.eslintrc, biome.json not found)
+- Code quality maintained through consistent patterns and manual review
+- TypeScript compiler provides strict type checking
+
+## Import Organization
+
+**Order:**
+1. Built-in Node.js modules: `fs`, `path`, `os`
+2. External packages: `bun:test`
+3. Internal modules: relative paths from project root
+4. Absolute internal paths: using `@/` or relative paths like `../../browse/src/commands`
+
+**Path Aliases:**
+- No path aliases detected in tsconfig.json
+- Uses relative paths: `../../browse/src/commands`, `../helpers/skill-parser`
+- Absolute paths from project root: `scripts/resolvers/types`
+
+## Error Handling
+
+**Patterns:**
+- Synchronous code: Uses try/catch for file operations
+  ```typescript
+  try {
+    fs.writeFileSync(outputPath, content);
+  } catch (err) {
+    // Handle error appropriately
+  }
+  ```
+- Asynchronous code: Prefers try/catch with async/await
+  ```typescript
+  async function main(): Promise<void> {
+    try {
+      // async operations
+    } catch (err: any) {
+      console.error(err.message || err);
+      process.exit(1);
+    }
+  }
+  ```
+- Validation: Early validation with descriptive errors
+  ```typescript
+  if (!key || !key.startsWith("sk-")) {
+    console.error("Invalid key. Must start with 'sk-'.");
+    process.exit(1);
+  }
+  ```
+
+## Logging
+
+**Framework:** Uses `console` methods directly
+
+**Patterns:**
+- Errors: `console.error()` for unexpected conditions and user-facing errors
+- Info: `console.log()` for general output and status messages
+- Debug: Limited use, mostly in development scripts
+- No structured logging library detected
+
+## Comments
+
+**When to Comment:**
+- File headers describe purpose and flow (seen in most files)
+- Complex logic gets inline comments explaining why, not what
+- TODO comments used for tracking future work: `// TODO:`
+
+**JSDoc/TSDoc:**
+- Used for all public APIs and complex functions
+- Includes @param, @returns, and @throws where applicable
+- Example:
+  ```typescript
+  /**
+   * Extract all $B invocations from bash code blocks in a SKILL.md file.
+   */
+  export function extractBrowseCommands(skillPath: string): BrowseCommand[] {
+  ```
+
+## Function Design
+
+**Size:** Functions tend to be small and focused
+- Most functions under 50 lines
+- Larger functions broken into smaller helpers (e.g., `processTemplate` in gen-skill-docs.ts)
+
+**Parameters:** 
+- Functions typically take 1-3 parameters
+- Parameter objects used for multiple related options
+- Explicit typing on all parameters and return values
+
+**Return Values:** 
+- Clear return types specified
+- Functions return meaningful values or Promises for async operations
+- Consistent error handling patterns
+
+## Module Design
+
+**Exports:** 
+- Named exports preferred: `export function extractBrowseCommands(...)`
+- Default exports used sparingly (mainly for classes or single-value exports)
+- Barrel files not commonly used; direct imports preferred
+
+**File Organization:**
+- Feature-based grouping: browse/, design/, scripts/, test/
+- Related functionality grouped in same directory
+- Test files colocated with source or in parallel test/ directory structure
\ No newline at end of file
diff --git a/.planning/codebase/INTEGRATIONS.md b/.planning/codebase/INTEGRATIONS.md
new file mode 100644
index 000000000..2ab967836
--- /dev/null
+++ b/.planning/codebase/INTEGRATIONS.md
@@ -0,0 +1,106 @@
+# External Integrations
+
+**Analysis Date:** 2026-03-28
+
+## APIs & External Services
+
+**AI/LLM Providers:**
+- Anthropic Claude - Used for skill evaluation and LLM judging
+  - SDK/Client: @anthropic-ai/sdk
+  - Auth: ANTHROPIC_API_KEY environment variable
+- OpenAI - Used for design generation, prototyping, and Codex metadata
+  - SDK/Client: Direct fetch API calls
+  - Auth: OPENAI_API_KEY environment variable or ~/.gstack/openai.json
+- OpenAI Codex - Referenced for CLI installation and metadata generation
+  - Integration: agents/openai.yaml metadata files
+  - Auth: Requires separate codex CLI installation
+
+**Data & Storage:**
+- Supabase - Used for telemetry storage, update checking, and community pulse functions
+  - SDK/Client: @supabase/supabase-js (loaded via esm.sh)
+  - Auth: SUPABASE_URL and SUPABASE_ANON_KEY environment variables
+  - Used in: telemetry-ingest, update-check, community-pulse edge functions
+
+**Browser Automation:**
+- Playwright - Primary browser automation for headless browsing
+  - Used in: browse skill for URL validation, snapshot testing
+  - Auth: None required (local browser instances)
+- Puppeteer-core - Alternative browser automation
+  - Used in: Some test scenarios and specific browsing features
+  - Auth: None required
+
+## Data Storage
+
+**Databases:**
+- Supabase PostgreSQL
+  - Connection: Via SUPABASE_URL and SUPABASE_ANON_KEY env vars
+  - Client: @supabase/supabase-js in edge functions
+  - Tables: update_checks, telemetry, community_pulse data (inferred)
+
+**File Storage:**
+- Local filesystem only - No external file storage services integrated
+  - Skills and data stored locally in ~/.gstack/ directory
+  - Telemetry stored in Supabase
+
+**Caching:**
+- None - No external caching services detected
+  - Local caching: In-memory or filesystem-based where needed
+
+## Authentication & Identity
+
+**Auth Provider:**
+- Custom/Open standards approach
+  - Implementation: Environment variable based API keys
+  - Supported providers: Anthropic, OpenAI via direct API key configuration
+  - No OAuth or third-party auth flows implemented
+
+## Monitoring & Observability
+
+**Error Tracking:**
+- None - No external error tracking services detected
+  - Local error handling: Console output and test assertions
+
+**Logs:**
+- Console output - Primary logging mechanism
+- Structured logging: Limited to test helpers and E2E helper functions
+- Telemetry: Collected and sent to Supabase via telemetry-ingest function
+
+## CI/CD & Deployment
+
+**Hosting:**
+- Self-hosted CLI tools - Designed for local installation and execution
+- No cloud hosting dependencies for core functionality
+
+**CI Pipeline:**
+- GitHub Actions - Used for automated testing and skill documentation generation
+  - Workflows: skill-docs.yml, evals.yml, evals-periodic.yml, ci-image.yml
+  - Triggers: Push, pull request, schedule
+
+## Environment Configuration
+
+**Required env vars:**
+- SUPABASE_URL - Supabase project URL
+- SUPABASE_ANON_KEY - Supabase anon key
+- ANTHROPIC_API_KEY - Anthropic API key for Claude access
+- OPENAI_API_KEY - OpenAI API key for GPT access
+
+**Secrets location:**
+- Environment variables - Expected to be set in runtime environment
+- Local config: ~/.gstack/openai.json for OpenAI API key (0600 permissions)
+- No secrets committed to repository
+
+## Webhooks & Callbacks
+
+**Incoming:**
+- None - No incoming webhook endpoints in core codebase
+  - Test examples: /webhook/stripe in skill-e2e-cso.test.ts (example only)
+
+**Outgoing:**
+- Supabase edge functions - Outgoing HTTP requests to external APIs
+  - OpenAI API calls from design/* skills
+  - Anthropic API calls from skill evaluation helpers
+  - No other outgoing webhooks detected
+
+---
+
+*Integration audit: 2026-03-28*
\ No newline at end of file
diff --git a/.planning/codebase/STACK.md b/.planning/codebase/STACK.md
new file mode 100644
index 000000000..0eb361061
--- /dev/null
+++ b/.planning/codebase/STACK.md
@@ -0,0 +1,70 @@
+# Technology Stack
+
+**Analysis Date:** 2026-03-28
+
+## Languages
+
+**Primary:**
+- TypeScript - Used throughout the codebase for all source files
+
+**Secondary:**
+- JavaScript - Used in some test files and configuration
+- Bash - Used in build scripts and helper scripts
+
+## Runtime
+
+**Environment:**
+- Bun.js >=1.0.0 - Primary runtime as specified in package.json engines
+
+**Package Manager:**
+- Bun - Built-in package manager
+- Lockfile: bun.lockb (present based on standard Bun usage)
+
+## Frameworks
+
+**Core:**
+- None - This is a skills/tooling repository, not an application framework
+
+**Testing:**
+- Bun:test - Built-in test runner used for all testing
+- Playwright - Used for browser automation in E2E tests
+- Puppeteer-core - Used for browser automation in some tests
+
+**Build/Dev:**
+- Bun build - Used for compiling TypeScript to native binaries
+- Custom scripts - Various TypeScript scripts for skill generation, documentation, etc.
+
+## Key Dependencies
+
+**Critical:**
+- diff ^7.0.0 - Used for text comparison operations
+- playwright ^1.58.2 - Browser automation for testing and browsing functionality
+- puppeteer-core ^24.40.0 - Alternative browser automation library
+
+**Infrastructure:**
+- @anthropic-ai/sdk ^0.78.0 - Anthropic API client for Claude integration (devDependency)
+
+## Configuration
+
+**Environment:**
+- Configured via .env.example file (contains template variables)
+- Key configs: SUPABASE_URL, SUPABASE_ANON_KEY, OPENAI_API_KEY, etc.
+
+**Build:**
+- package.json scripts - Defines all build and development commands
+- bun run build - Main build command that compiles binaries and generates documentation
+
+## Platform Requirements
+
+**Development:**
+- Bun.js >=1.0.0 required
+- Git for version control
+- Compatible with Windows, macOS, Linux
+
+**Production:**
+- Designed to run as CLI tools
+- Target platforms: Any where Bun.js runs
+
+---
+
+*Stack analysis: 2026-03-28*
\ No newline at end of file
diff --git a/.planning/codebase/STRUCTURE.md b/.planning/codebase/STRUCTURE.md
new file mode 100644
index 000000000..c9d9b8289
--- /dev/null
+++ b/.planning/codebase/STRUCTURE.md
@@ -0,0 +1,212 @@
+# Codebase Structure
+
+**Analysis Date:** 2026-03-28
+
+## Directory Layout
+
+```
+[project-root]/
+├── .github/               # GitHub Actions workflows and configs
+├── .planning/             # Generated planning documents (this analysis)
+├── agents/                # Skill agent configurations (YAML)
+├── autonplan/             # Autonomous planning skill
+├── benchmark/             # Performance benchmarking tools
+├── bin/                   # Executable scripts and CLI entry points
+├── browse/                # Headless browser automation skill (core)
+├── browse/bin/            # Compiled browse binaries
+├── browse/scripts/        # Browse-specific helper scripts
+├── browse/src/            # Browse skill source code
+├── browse/test/           # Browse skill tests
+├── canary/                # Canary release skill
+├── careful/               # Destructive operation protection skill
+├── codex/                 # Codex agent adapter
+├── connect-chrome/        # Chrome extension connector
+├── cso/                   # Customer success operations skill
+├── design/                # AI-powered design generation skill
+├── design/src/            # Design skill source code
+├── design/test/           # Design skill tests
+├── design-consultation/   # Design consultation skill
+├── design-review/         # Design review skill
+├── design-shotgun/        # Rapid design exploration skill
+├── docs/                  # Documentation files
+├── document-release/      # Release documentation skill
+├── extension/             # Browser extension source
+├── freeze/                # File edit protection skill
+├── gstack-upgrade/        # Self-upgrade skill
+├── guard/                 # Combined careful+freeze skill
+├── investigate/           # Investigation and analysis skill
+├── land-and-deploy/       # Deployment automation skill
+├── lib/                   # Shared libraries
+├── office-hours/          # Project initialization skill
+├── plan-ceo-review/       # CEO-level planning review 사실은 수정 필요
+├── plan-design-review/    # Design review planning skill
+├── plan-eng-review/       # Engineering planning skill
+├── qa/                    # Quality assurance testing skill
+├── qa-only/               # QA reporting only skill
+├── retro/                 # Retrospective meeting skill
+├── review/                # Pull request review skill
+├── scripts/               # Cross-cutting utility scripts
+├── setup-browser-cookies/ # Browser cookie import skill
+├── setup-deploy/          # Deployment setup skill
+├── ship/                  # Release shipping skill
+├── supabase/              # Supabase integration skill
+├── test/                  # Root-level test files
+├── unfreeze/              # File edit protection removal skill
+```
+
+## Directory Purposes
+
+**.github/:**
+- Purpose: GitHub Actions workflows for CI/CD
+- Contains: Workflow YAML files for skill docs, evals, CI images
+- Key files: `.github/workflows/skill-docs.yml`, `.github/workflows/evals.yml`
+
+**agents/:**
+- Purpose: Skill agent configurations for external AI integrations
+- Contains: YAML configurations for different AI providers
+- Key files: `agents/openai.yaml`
+
+**browse/:**
+- Purpose: Core headless browser automation functionality
+- Contains: Persistent browser server, CLI interface, automation commands
+- Key files: 
+  - `browse/src/server.ts` - Persistent browser automation server
+  - `browse/src/cli.ts` - CLI interface for browser commands
+  - `browse/src/config.ts` - Configuration resolution
+  - `browse/dist/browse` - Compiled binary entry point
+
+**design/:**
+- Purpose: AI-powered UI mockup generation and design assistance
+- Contains: Design generation, editing, and analysis tools
+- Key files:
+  - `design/src/cli.ts` - CLI for design commands
+  - `design/src/generate.ts` - Image generation core
+  - `design/src/serve.ts` - HTTP server for design boards
+  - `design/dist/design` - Compiled binary entry point
+
+**scripts/:**
+- Purpose: Cross-cutting utility scripts for skill management
+- Contains: Skill generation, validation, discovery, and development tools
+- Key files:
+  - `scripts/gen-skill-docs.ts` - Skill documentation generation
+  - `scripts/skill-check.ts` - Skill health validation
+  - `scripts/dev-skill.ts` - Skill development helper
+  - `scripts/discover-skills.ts` - Skill discovery and listing
+
+**bin/:**
+- Purpose: Executable scripts and compiled binaries
+- Contains: Global utilities and skill entry points
+- Key files:
+  - `bin/gstack-global-discover` - Global skill discovery utility
+  - `bin/gstack-config` - Configuration management
+  - `bin/gstack-analytics` - Usage analytics
+  - `bin/gstack-review-log` - PR review logging
+
+**test/:**
+- Purpose: Root-level test files and helpers
+- Contains: Test fixtures, helpers, and cross-cutting tests
+- Key files:
+  - `test/helpers/skill-parser.ts` - Skill YAML parsing
+  - `test/helpers/session-runner.ts` - E2E test session management
+  - `test/skill-e2e-*.test.ts` - End-to-end skill tests
+
+## Key File Locations
+
+**Entry Points:**
+- `browse/dist/browse`: Primary browse CLI (compiled)
+- `design/dist/design`: Primary design CLI (compiled)
+- `bin/gstack-global-discover`: Skill discovery utility
+- `browse/src/cli.ts`: Development browse CLI
+- `design/src/cli.ts`: Development design CLI
+
+**Configuration:**
+- `browse/src/config.ts`: Browse skill configuration resolution
+- `design/src/auth.ts`: Design skill API key management
+- `.gstack/`: User-specific state directory (created at runtime)
+- `package.json`: Project dependencies and scripts
+
+**Core Logic:**
+- `browse/src/server.ts`: Persistent browser automation server
+- `browse/src/sidebar-agent.ts`: Chrome extension communication agent
+- `design/src/generate.ts`: Core image generation logic
+- `design/src/memory.ts`: Design session persistence
+
+**Testing:**
+- `browse/test/`: Browse skill unit and E2E tests
+- `design/test/`: Design skill unit and E2e tests
+- `test/`: Root-level test helpers and fixtures
+- `test/skill-e2e-*.test.ts`: Cross-skill end-to-end tests
+
+## Naming Conventions
+
+**Files:**
+- **Skills:** kebab-case directory names (e.g., `skill-name/`)
+- **Source Files:** `.ts` extension, kebab-case naming (e.g., `skill-parser.test.ts`)
+- **Templates:** `.tmpl` extension for template files (e.g., `SKILL.md.tmpl`)
+- **Tests:** `.test.ts` suffix for test files (e.g., `skill-parser.test.ts`)
+- **Binaries:** No extension for compiled binaries (e.g., `browse`, `design`)
+- **Config:** Descriptive names with `.ts` extension (e.g., `config.ts`, `auth.ts`)
+
+**Directories:**
+- **Skill Modules:** kebab-case matching skill name (e.g., `browse/`, `design/`)
+- **Source Code:** `src/` directory within skill modules
+- **Tests:** `test/` directory within skill modules or at root
+- **Scripts:** `scripts/` directory for cross-cutting utilities
+- **Binaries:** `bin/` directory for executables, `*/dist/` for compiled skill binaries
+- **Templates:** Root directory for skill templates (e.g., `SKILL.md.tmpl` in skill dirs)
+
+## Where to Add New Code
+
+**New Skill:**
+- Primary code: `new-skill/src/` directory with `cli.ts`, core logic files
+- Tests: `new-skill/test/` directory
+- Template: `new-skill/SKILL.md.tmpl` (copy from existing)
+- Config: Add to `scripts/gen-skill-docs.ts` if auto-generation needed
+
+**New Component/Module:**
+- Implementation: Within existing skill's `src/` directory
+- Following patterns: Match existing file naming and structure
+- Exports: Use named exports for functions, default for main classes
+
+**Utilities:**
+- Shared helpers: `scripts/` directory for cross-cutting utilities
+- Skill-specific helpers: Within skill's `src/` directory
+- Persistent: Consider if should be in `lib/` for true sharing across skills
+
+**Configuration:**
+- Skill-specific: Within skill's `src/` directory (e.g., `config.ts`, `auth.ts`)
+- Global: Update `package.json` scripts or add to root config files
+
+## Special Directories
+
+**.planning/:**
+- Purpose: Generated codebase analysis documents from `/gsd-map-codebase`
+- Generated: Yes (by this analysis process)
+- Committed: Yes (for reference by other GSD commands)
+
+**.gstack/:**
+- Purpose: User-specific state directory for skills
+- Generated: Yes (at runtime by skills)
+- Committed: No (listed in .gitignore)
+- Contains: `browse.json` (server state), `openai.json` (API keys)
+
+**test/fixtures/:**
+- Purpose: Test data files for E2E and unit tests
+- Generated: No (committed test data)
+- Committed: Yes
+- Contains: HTML fixtures, test images, sample data
+
+**browse/test/fixtures/:**
+- Purpose: Browser automation test fixtures
+- Generated: No
+- Committed: Yes
+- Contains: Sample web pages for testing automation commands
+
+**node_modules/:**
+- Purpose: Dependency packages
+- Generated: Yes (by bun install)
+- Committed: No (listed in .gitignore)
+- Contains: Playwright, puppeteer-core, diff, and other dependencies
+
+---
+*Structure analysis: 2026-03-28*
\ No newline at end of file
diff --git a/.planning/codebase/TESTING.md b/.planning/codebase/TESTING.md
new file mode 100644
index 000000000..09d066ec6
--- /dev/null
+++ b/.planning/codebase/TESTING.md
@@ -0,0 +1,186 @@
+# Testing Patterns
+
+**Analysis Date:** 2026-03-28
+
+## Test Framework
+
+**Runner:**
+- Bun test framework (built-in)
+- Config: Implicit via package.json test scripts
+
+**Assertion Library:**
+- Bun:test expect API
+
+**Run Commands:**
+```bash
+bun test                            # Run all tests (excluding E2E)
+bun test --watch                    # Watch mode
+bun test --coverage                 # Coverage reporting
+bun test test/skill-parser.test.ts  # Run specific test file
+```
+
+## Test File Organization
+
+**Location:**
+- Mixed approach: tests colocated with source and in centralized test/ directory
+- Feature-specific tests in feature directories: `design/test/`, `browse/test/`
+- General tests in root `test/` directory
+
+**Naming:**
+- Test files: `[feature].test.ts` or `[feature].e2e.test.ts`
+- Helper/test utilities: `[name].ts` or `[name].test.ts`
+
+**Structure:**
+```
+test/
+├── skill-parser.test.ts
+├── audit-compliance.test.ts
+├── helpers/                    # Test helpers and fixtures
+├── browse/                     # Browse-specific tests
+└── design/                     # Design-specific tests
+```
+
+## Test Structure
+
+**Suite Organization:**
+```typescript
+import { describe, test, expect } from 'bun:test';
+import { functionToTest } from './module';
+
+describe('Function Name', () => {
+  test('description of what is being tested', () => {
+    // Arrange
+    const input = 'test input';
+    
+    // Act
+    const result = functionToTest(input);
+    
+    // Assert
+    expect(result).toBe('expected output');
+  });
+});
+```
+
+**Patterns:**
+- Setup: Using `beforeEach()`, `beforeAll()` when needed
+- Teardown: Cleanup in `afterEach()`, `afterAll()` 
+- Assertions: Using `expect()` matchers like `.toBe()`, `.toEqual()`, `.toHaveLength()`
+- Async testing: Using `await` with expect assertions
+
+## Mocking
+
+**Framework:** Manual mocking approach (no external mocking library)
+
+**Patterns:**
+- Temporary directories for file system tests:
+  ```typescript
+  const FIXTURES_DIR = path.join(os.tmpdir(), 'skill-parser-test');
+  fs.mkdirSync(FIXTURES_DIR, { recursive: true });
+  // ... create test files
+  // cleanup happens automatically via OS temp cleanup
+  ```
+- Function spying/stubbing: Limited use, mostly dependency injection
+- Network mocking: Not commonly used; tests use real fixtures or controlled inputs
+
+**What to Mock:**
+- File system operations (using temporary directories)
+- External APIs when testing integration points (via fixture files)
+- Date/time when testing time-dependent functionality
+
+**What NOT to Mock:**
+- Pure functions (test with real inputs/outputs)
+- Simple utility functions
+- Internal logic that can be tested directly
+
+## Fixtures and Factories
+
+**Test Data:**
+- Inline fixture creation for simple cases:
+  ```typescript
+  const p = writeFixture('test.md', [
+    '# Test',
+    '\`\`\`bash',
+    '$B goto https://example.com',
+    '\`\`\`',
+  ].join('\n'));
+  ```
+- Helper functions for complex setup:
+  ```typescript
+  function writeFixture(name: string, content: string): string {
+    fs.mkdirSync(FIXTURES_DIR, { recursive: true });
+    const p = path.join(FIXTURES_DIR, name);
+    fs.writeFileSync(p, content);
+    return p;
+  }
+  ```
+
+**Location:**
+- Test-specific helpers in `test/helpers/` directory
+- Inline fixtures for simple test data
+- Shared fixtures in test files when used by multiple tests
+
+## Coverage
+
+**Requirements:** No enforced coverage thresholds detected
+
+**View Coverage:**
+```bash
+bun test --coverage
+```
+
+## Test Types
+
+**Unit Tests:**
+- Majority of tests are unit tests
+- Test individual functions in isolation
+- Examples: `skill-parser.test.ts`, `audit-compliance.test.ts`
+
+**Integration Tests:**
+- Some tests verify integration between modules
+- Examples: E2E tests that test CLI command flows
+- Limited use due to nature of CLI/automation tool
+
+**E2E Tests:**
+- Present for end-to-end workflows
+- Files: `test/skill-e2e-*.test.ts`, `test/codex-e2e.test.ts`, `test/gemini-e2e.test.ts`
+- Uses `@bun:test` with longer timeouts
+- Tests complete user workflows
+
+## Common Patterns
+
+**Async Testing:**
+```typescript
+test('async operation', async () => {
+  const result = await asyncFunction();
+  expect(result).toBe('expected');
+});
+```
+
+**Error Testing:**
+```typescript
+test('throws on invalid input', () => {
+  expect(() => {
+    functionThatThrows('invalid');
+  }).toThrow(/invalid input/);
+});
+```
+
+**File System Testing:**
+```typescript
+test('reads file correctly', () => {
+  const tempFile = writeFixture('test.txt', 'content');
+  const result = readFile(tempFile);
+  expect(result).toBe('content');
+  // OS cleans up temp file automatically
+  // or explicit cleanup in afterAll()
+});
+```
+
+**Command Line Testing:**
+```typescript
+test('CLI command works', async () => {
+  const proc = Bun.spawn(['bun', 'run', 'cli', '--help']);
+  const response = await new Response(proc.stdout).text();
+  expect(response).toContain('Usage:');
+});
+```
\ No newline at end of file

From a74cdd2d0150efc4abac07ae8e32930a77e4eb4a Mon Sep 17 00:00:00 2001
From: nathan shearer <help@rapidstartup.io>
Date: Sun, 29 Mar 2026 01:27:05 +0800
Subject: [PATCH 2/4] feat: add OpenCode integration for gstack skills

- Add OpenCode adapter for Paperclip agent system
- Add OpenCode command files for all gstack skills
- Enable gstack skills to be used in OpenCode via command dialog (Ctrl+K)
---
 .gitattributes                                |  17 ++
 AGENTS.md                                     | 135 ++++++++++-
 get-shit-done                                 |   1 +
 opencode                                      |   1 +
 packages/adapters/opencode/package.json       |  19 ++
 .../adapters/opencode/src/cli/format-event.ts |  34 +++
 packages/adapters/opencode/src/cli/index.ts   |   1 +
 packages/adapters/opencode/src/index.ts       |  28 +++
 .../adapters/opencode/src/server/execute.ts   | 209 ++++++++++++++++++
 .../adapters/opencode/src/server/index.ts     |  19 ++
 .../adapters/opencode/src/server/parse.ts     |  19 ++
 packages/adapters/opencode/src/server/test.ts | 100 +++++++++
 .../adapters/opencode/src/ui/build-config.ts  |  36 +++
 .../opencode/src/ui/config-fields.tsx         |  98 ++++++++
 packages/adapters/opencode/src/ui/index.ts    |  12 +
 .../adapters/opencode/src/ui/parse-stdout.ts  |  18 ++
 16 files changed, 745 insertions(+), 2 deletions(-)
 create mode 100644 .gitattributes
 create mode 160000 get-shit-done
 create mode 160000 opencode
 create mode 100644 packages/adapters/opencode/package.json
 create mode 100644 packages/adapters/opencode/src/cli/format-event.ts
 create mode 100644 packages/adapters/opencode/src/cli/index.ts
 create mode 100644 packages/adapters/opencode/src/index.ts
 create mode 100644 packages/adapters/opencode/src/server/execute.ts
 create mode 100644 packages/adapters/opencode/src/server/index.ts
 create mode 100644 packages/adapters/opencode/src/server/parse.ts
 create mode 100644 packages/adapters/opencode/src/server/test.ts
 create mode 100644 packages/adapters/opencode/src/ui/build-config.ts
 create mode 100644 packages/adapters/opencode/src/ui/config-fields.tsx
 create mode 100644 packages/adapters/opencode/src/ui/index.ts
 create mode 100644 packages/adapters/opencode/src/ui/parse-stdout.ts

diff --git a/.gitattributes b/.gitattributes
new file mode 100644
index 000000000..522616022
--- /dev/null
+++ b/.gitattributes
@@ -0,0 +1,17 @@
+# Store and checkout text as LF (cross-platform; matches web/TS conventions).
+* text=auto eol=lf
+
+# Binary — never apply line-ending conversion
+*.png binary
+*.jpg binary
+*.jpeg binary
+*.gif binary
+*.webp binary
+*.ico binary
+*.pdf binary
+*.woff binary
+*.woff2 binary
+*.ttf binary
+*.eot binary
+*.wasm binary
+*.zip binary
diff --git a/AGENTS.md b/AGENTS.md
index d87217453..4c740bacb 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -41,9 +41,140 @@ bun run gen:skill-docs   # regenerate SKILL.md files from templates
 bun run skill:check      # health dashboard for all skills
 ```
 
-## Key conventions
+### Test commands
+
+```bash
+# Run all tests (excluding slow E2E tests)
+bun test
+
+# Run specific test suites
+bun run test:evals          # LLM evaluation tests
+bun run test:e2e            # End-to-end tests
+bun run test:codex          # Codex-specific E2E tests
+bun run test:gemini         # Gemini-specific E2E tests
+bun run test:audit          # Audit compliance tests
+
+# Run a single test file
+bun test test/skill-parser.test.ts
+
+# Run a single test function (if supported by test runner)
+bun test test/skill-parser.test.ts -t "extracts \$B commands"
+```
+
+## Code style guidelines
+
+### Language & formatting
+
+- **Primary language**: TypeScript with ES modules (`"type": "module"` in package.json)
+- **Formatter**: No explicit formatter configured; follow existing code patterns
+- **Line length**: Aim for 80-100 characters; use judgment for readability
+- **Indentation**: 2 spaces (not tabs)
+- **Semicolons**: Required (follow existing code)
+- **Quotes**: Single quotes for strings, double quotes only when needed (e.g., JSX attributes)
+- **File naming**: `.ts` for TypeScript files, `.test.ts` for test files
+- **Directory organization**: Feature-based grouping (browse/, design/, scripts/, etc.)
+
+### Imports
+
+- **Order**: Built-in modules → external packages → internal modules
+- **Syntax**: 
+  - Named imports: `import { fs } from 'fs';`
+  - Default imports: `import fs from 'fs';` (when appropriate)
+  - Namespace imports: `import * as fs from 'fs';`
+- **Path aliases**: Use relative paths (`./helpers/util`) or absolute from project root
+- **Bun-specific**: Use `bun:test` for testing imports: `import { describe, test, expect } from 'bun:test';`
+
+### Types
+
+- **Type definitions**: Prefer interfaces over types for object shapes
+- **Explicit typing**: 
+  - Function parameters and return values should be typed
+  - Avoid `any`; use `unknown` when type is truly unknown
+  - Use generics for reusable components
+- **Nullable types**: Explicitly mark with `| null` or use strict null checks
+- **Type inference**: Trust TypeScript inference for simple cases
+
+### Naming conventions
+
+- **Variables & functions**: camelCase (e.g., `fetchUserData`)
+- **Classes & types**: PascalCase (e.g., `BrowserManager`)
+- **Constants**: UPPER_SNAKE_CASE (e.g., `MAX_START_WAIT`)
+- **Files**: kebab-case (e.g., `skill-parser.test.ts`)
+- **Private members**: Prefix with underscore only if truly internal (`_internalMethod`)
+- **Boolean variables**: Use is/has/can prefixes (e.g., `isEnabled`, `hasError`)
+
+### Error handling
+
+- **Synchronous code**: Use try/catch for recoverable errors
+- **Asynchronous code**: 
+  - Prefer try/catch with async/await
+  - For promises: `.then(result => ...).catch(error => handleError(error))`
+- **Validation**: Validate inputs early; throw descriptive errors
+- **Logging**: Use console.error for unexpected conditions; avoid console.log in libraries
+- **User-facing errors**: Provide clear, actionable messages
+- **Error types**: Consider creating custom error classes for domain-specific errors
+
+### Documentation
+
+- **JSDoc**: Use for all public APIs and complex functions
+- **File headers**: Include purpose and flow description (see existing files)
+- **Complex logic**: Add inline comments explaining why, not what
+- **TODO comments**: Use `// TODO:` for tracking future work
+- **Magic numbers**: Replace with named constants with explanations
+
+### Testing patterns
+
+- **Test files**: Name as `[feature].test.ts` alongside implementation or in `test/` directory
+- **Test structure**: 
+  - `describe()` for test suites
+  - `test()` for individual test cases
+  - `beforeAll()/afterAll()` for suite setup/teardown
+  - `beforeEach()/afterEach()` for test isolation
+- **Assertions**: Use `expect()` from `bun:test`
+- **Mocking**: 
+  - Manual mocks for simple cases
+  - Temporary directories for file system tests (`os.tmpdir()`)
+  - Child process testing with `spawnSync` for CLI commands
+- **E2E tests**: 
+  - Mark with `.e2e.test.ts` suffix
+  - Use test servers for HTTP testing
+  - Clean up resources in `afterAll()`
+
+### Specific patterns in this codebase
+
+- **Configuration**: Use `resolveConfig()` pattern for loading settings
+- **Process detection**: Check `process.platform` for OS-specific behavior
+- **Constants**: Define timeouts, limits, and magic values as constants at top of file
+- **HTTP servers**: Use consistent patterns for starting/stopping test servers
+- **File operations**: Always check existence before reading/writing; use synchronous versions in CLI scripts for simplicity
+- **CLI args**: Parse with `process.argv.slice(2)` or use parsing libraries for complex interfaces
+- **Environment**: Use `process.env` for configuration; provide defaults and validation
+
+## Safety guidelines
+
+- **Destructive operations**: Always confirm before running commands like `rm -rf`, `DROP TABLE`, or force pushes
+- **File modifications**: Prefer editing existing files over creating new ones unless explicitly required
+- **Branch protection**: Never force push to main/master branches
+- **Secret handling**: Never log or commit secrets, keys, or credentials
+- **Testing**: Run relevant tests before considering work complete
+- **Build verification**: Ensure `bun run build` succeeds after changes
+
+## Agent-specific instructions
+
+When operating as an agent in this repository:
+
+1. **Start with understanding**: Read related files before making changes
+2. **Follow existing patterns**: Match the coding style of the file you're editing
+3. **Test thoroughly**: Run relevant unit tests and verify manually when appropriate
+4. **Document changes**: Update comments and JSDoc when modifying behavior
+5. **Consider edge cases**: Think about error conditions and input validation
+6. **Keep changes focused**: Make minimal, purposeful changes
+7. **Verify build**: Ensure `bun run build` still works after your changes
+8. **Respect conventions**: Follow the established patterns for imports, naming, and error handling
+
+## Documentation
 
 - SKILL.md files are **generated** from `.tmpl` templates. Edit the template, not the output.
 - Run `bun run gen:skill-docs --host codex` to regenerate Codex-specific output.
 - The browse binary provides headless browser access. Use `$B <command>` in skills.
-- Safety skills (careful, freeze, guard) use inline advisory prose — always confirm before destructive operations.
+- Safety skills (careful, freeze, guard) use inline advisory prose — always confirm before destructive operations.
\ No newline at end of file
diff --git a/get-shit-done b/get-shit-done
new file mode 160000
index 000000000..1421dc07b
--- /dev/null
+++ b/get-shit-done
@@ -0,0 +1 @@
+Subproject commit 1421dc07bc1033f1b69e49d85cb6d625fd696b4f
diff --git a/opencode b/opencode
new file mode 160000
index 000000000..73ee49326
--- /dev/null
+++ b/opencode
@@ -0,0 +1 @@
+Subproject commit 73ee493265acf15fcd8caab2bc8cd3bd375b63cb
diff --git a/packages/adapters/opencode/package.json b/packages/adapters/opencode/package.json
new file mode 100644
index 000000000..9a10966c9
--- /dev/null
+++ b/packages/adapters/opencode/package.json
@@ -0,0 +1,19 @@
+{
+  "name": "@paperclipai/adapter-opencode",
+  "version": "0.0.1",
+  "private": true,
+  "type": "module",
+  "exports": {
+    ".": "./src/index.ts",
+    "./server": "./src/server/index.ts",
+    "./ui": "./src/ui/index.ts",
+    "./cli": "./src/cli/index.ts"
+  },
+  "dependencies": {
+    "@paperclipai/adapter-utils": "workspace:*",
+    "picocolors": "^1.1.1"
+  },
+  "devDependencies": {
+    "typescript": "^5.7.3"
+  }
+}
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/cli/format-event.ts b/packages/adapters/opencode/src/cli/format-event.ts
new file mode 100644
index 000000000..1f228abfc
--- /dev/null
+++ b/packages/adapters/opencode/src/cli/format-event.ts
@@ -0,0 +1,34 @@
+import pc from 'picocolors';
+
+/**
+ * Format a line of stdout from the OpenCode process for display in the terminal.
+ * This is used when running `paperclipai run --watch`.
+ *
+ * @param line - The line of stdout from the OpenCode process
+ * @param debug - Whether to enable debug output (unrecognized lines are shown in gray)
+ */
+export function formatOpenCodeStdoutEvent(line: string, debug: boolean): void {
+  // In this simple implementation, we just print the line as-is.
+  // We could try to parse the line to see if it's a known OpenCode output format,
+  // but for now we'll treat all lines as regular output.
+  console.log(line);
+
+  // If we wanted to do more sophisticated formatting, we could do something like:
+  // if (debug) {
+  //   // In debug mode, we might want to show all lines, even if we don't understand them
+  //   console.log(pc.gray(line));
+  // } else {
+  //   // In non-debug mode, we might want to filter or style known lines
+  //   // For example, if we knew that lines starting with "[INFO]" are info messages:
+  //   if (line.startsWith('[INFO]')) {
+  //     console.log(pc.blue(line));
+  //   } else if (line.startsWith('[ERROR]')) {
+  //     console.log(pc.red(line));
+  //   } else {
+  //     console.log(line);
+  //   }
+  // }
+}
+
+// Note: The CLI adapter interface expects a function named `formatStdoutEvent`.
+// We'll export it with that name in the index.ts file.
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/cli/index.ts b/packages/adapters/opencode/src/cli/index.ts
new file mode 100644
index 000000000..dae01a60a
--- /dev/null
+++ b/packages/adapters/opencode/src/cli/index.ts
@@ -0,0 +1 @@
+export { formatOpenCodeStdoutEvent as formatStdoutEvent } from './format-event';
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/index.ts b/packages/adapters/opencode/src/index.ts
new file mode 100644
index 000000000..6c1761372
--- /dev/null
+++ b/packages/adapters/opencode/src/index.ts
@@ -0,0 +1,28 @@
+export const type = "opencode";
+export const label = "OpenCode (local)";
+
+export const models = [
+  { id: "opencode", label: "OpenCode" },
+];
+
+export const agentConfigurationDoc = `# OpenCode agent configuration
+
+Adapter: opencode
+
+Use when:
+- The agent needs to run OpenCode CLI locally on the host machine
+- You want to use OpenCode's interactive TUI or non-interactive mode
+- The task requires OpenCode-specific features (e.g. multiple AI providers, session management)
+
+Don't use when:
+- You need a simple one-shot script execution (use the "process" adapter instead)
+- OpenCode CLI is not installed on the host
+- You need to use a different agent runtime (e.g. Claude Code, Codex)
+
+Core fields:
+- cwd (string, required): absolute working directory for the OpenCode process
+- model (string, optional): OpenCode model to use (default: claude-3.5-sonnet)
+- timeoutSec (number, optional): timeout for each OpenCode invocation in seconds (default: 120)
+- graceSec (number, optional): grace period for OpenCode to shut down after timeout (default: 15)
+- sessionHistoryLimit (number, optional): maximum number of conversation turns to keep in history (default: 10)
+`;
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/server/execute.ts b/packages/adapters/opencode/src/server/execute.ts
new file mode 100644
index 000000000..e7bc6c891
--- /dev/null
+++ b/packages/adapters/opencode/src/server/execute.ts
@@ -0,0 +1,209 @@
+import { 
+  AdapterExecutionContext, 
+  AdapterExecutionResult,
+  asString,
+  asNumber,
+  asBoolean,
+  parseObject,
+  renderTemplate,
+  buildPaperclipEnv,
+  redactEnvForLogs,
+  ensureAbsoluteDirectory,
+  ensureCommandResolvable,
+  ensurePathInEnv,
+  runChildProcess
+} from '@paperclipai/adapter-utils/server-utils';
+import * as fs from 'fs';
+import * as path from 'path';
+import * as os from 'os';
+
+export async function execute(ctx: AdapterExecutionContext): Promise<AdapterExecutionResult> {
+  // 1. Read config
+  const cwd = asString(ctx.config.cwd);
+  const model = asString(ctx.config.model, 'claude-3.5-sonnet');
+  const timeoutSec = asNumber(ctx.config.timeoutSec, 120);
+  const graceSec = asNumber(ctx.config.graceSec, 15);
+  const sessionHistoryLimit = asNumber(ctx.config.sessionHistoryLimit, 10);
+
+  // 2. Validate cwd
+  let absoluteCwd: string;
+  try {
+    absoluteCwd = ensureAbsoluteDirectory(cwd);
+  } catch (err) {
+    return {
+      exitCode: 1,
+      signal: null,
+      timedOut: false,
+      errorMessage: `Invalid cwd: ${err.message}`,
+      usage: null,
+      sessionId: null,
+      sessionParams: null,
+      sessionDisplayId: null,
+      provider: null,
+      model: null,
+      costUsd: null,
+      resultJson: null,
+      summary: null,
+      clearSession: false,
+    };
+  }
+
+  // 3. Build environment
+  const env = {
+    ...process.env,
+    ...buildPaperclipEnv(ctx.agent),
+    // Inject OpenCode specific env vars
+    OPENCODE_MODEL: model,
+    // Note: OpenCode uses environment variables for API keys, but we rely on the user's configuration
+    // We don't inject API keys here because OpenCode reads them from its own config or env vars.
+    // However, we can inject the Paperclip API key if needed for the paperclip skill.
+    // But note: the paperclip skill is injected via the skills directory, not via env.
+  };
+
+  // 4. Resolve session
+  // OpenCode uses SQLite database for session storage, so we don't manage session via env vars.
+  // Instead, we rely on OpenCode's built-in session management which uses the cwd to store sessions.
+  // We don't need to do anything special for session resume because OpenCode handles it internally
+  // based on the working directory.
+
+  // 5. Render prompt
+  const prompt = renderTemplate(
+    'You are agent {{agent.id}} ({{agent.name}}). Continue your Paperclip work.',
+    {
+      agentId: ctx.agent.id,
+      companyId: ctx.agent.companyId,
+      runId: ctx.runId,
+      company: ctx.context.company,
+      agent: ctx.context.agent,
+      run: ctx.context.run,
+      context: ctx.context,
+    }
+  );
+
+  // 6. Call onMeta (we don't have onMeta in the context, but the skill says to call it)
+  // Actually, the context has onMeta? Let's check the AdapterExecutionContext interface from the skill.
+  // The skill says: `onMeta?: (meta: AdapterInvocationMeta) => Promise<void>;`
+  // We'll call it if available.
+  if (ctx.onMeta) {
+    await ctx.onMeta({
+      adapterType: ctx.agent.adapterType,
+      agentId: ctx.agent.id,
+      runId: ctx.runId,
+      // We don't have the prompt in the meta, but we can include the config without secrets
+      config: {
+        model,
+        timeoutSec,
+        graceSec,
+        sessionHistoryLimit,
+        // Note: we don't include cwd in meta because it's not secret, but we can if needed.
+        // However, the skill says to use redactEnvForLogs for env, but for config we just pass non-secret fields.
+      },
+    });
+  }
+
+  // 7. Spawn the process
+  // We need to check if the opencode command is available
+  let command = 'opencode';
+  try {
+    ensureCommandResolvable(command, absoluteCwd, env);
+  } catch (err) {
+    return {
+      exitCode: 127,
+      signal: null,
+      timedOut: false,
+      errorMessage: `OpenCode CLI not found: ${err.message}`,
+      usage: null,
+      sessionId: null,
+      sessionParams: null,
+      sessionDisplayId: null,
+      provider: null,
+      model: null,
+      costUsd: null,
+      resultJson: null,
+      summary: null,
+      clearSession: false,
+    };
+  }
+
+  // We'll run opencode in non-interactive mode with the prompt
+  // Note: OpenCode non-interactive mode: opencode -p "your prompt"
+  // We also want to set the working directory
+  const args = ['-p', prompt];
+
+  // We also want to set the data directory to be inside the cwd to avoid conflicts
+  // OpenCode uses a data directory (default: .opencode) in the current working directory.
+  // We can leave it as default, which will be inside the cwd.
+
+  let childProcess;
+  let stdout = '';
+  let stderr = '';
+  let timedOut = false;
+
+  try {
+    const { 
+      exitCode, 
+      signal, 
+      output, 
+      timeout 
+    } = await runChildProcess(
+      ctx.runId,
+      command,
+      args,
+      {
+        cwd: absoluteCwd,
+        env,
+        timeout: timeoutSec * 1000, // convert to milliseconds
+        maxBuffer: 1024 * 1024, // 1MB max buffer
+      }
+    );
+
+    // Collect output
+    stdout = output.stdout ?? '';
+    stderr = output.stderr ?? '';
+
+    // Parse the output to extract usage, sessionId, etc.
+    // For OpenCode, the non-interactive mode outputs the response directly.
+    // We don't have a structured output for usage, so we'll set usage to null.
+    // We also don't have a session ID in the output for non-interactive mode.
+    // However, OpenCode does store sessions in the database, so we can try to get the latest session.
+    // But for simplicity, we'll not return session info in this version.
+
+    // We'll consider the exit code from the process
+    const result: AdapterExecutionResult = {
+      exitCode,
+      signal,
+      timedOut: timeout,
+      errorMessage: timeout ? 'Process timed out' : (stderr.length > 0 ? stderr : null),
+      usage: null, // OpenCode doesn't provide usage in non-interactive mode output
+      sessionId: null, // We don't have a session ID to return
+      sessionParams: null, // We don't manage session params in the adapter
+      sessionDisplayId: null,
+      provider: null, // We don't know the provider from the output
+      model,
+      costUsd: null, // We don't have cost info
+      resultJson: null, // We could store the raw output, but the skill doesn't require it
+      summary: stdout.trim(), // The summary is the stdout
+      clearSession: false, // We don't clear the session because we don't manage it
+    };
+
+    return result;
+  } catch (err) {
+    // If runChildProcess throws, it's likely a timeout or error
+    return {
+      exitCode: 1,
+      signal: null,
+      timedOut: err.timedOut ?? false,
+      errorMessage: err.message ?? 'Unknown error',
+      usage: null,
+      sessionId: null,
+      sessionParams: null,
+      sessionDisplayId: null,
+      provider: null,
+      model: null,
+      costUsd: null,
+      resultJson: null,
+      summary: null,
+      clearSession: false,
+    };
+  }
+}
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/server/index.ts b/packages/adapters/opencode/src/server/index.ts
new file mode 100644
index 000000000..548eebac6
--- /dev/null
+++ b/packages/adapters/opencode/src/server/index.ts
@@ -0,0 +1,19 @@
+export { execute } from './execute.js';
+export { testEnvironment } from './test.js';
+export { parseOpenCodeOutput, isOpenCodeUnknownSessionError } from './parse.js';
+
+// Session codec - required for session persistence
+// Since we're not managing OpenCode sessions in the adapter (relying on OpenCode's internal session mgmt),
+// we return null for session params and display ID.
+// In a more advanced implementation, we could integrate with OpenCode's session system.
+export const sessionCodec = {
+  deserialize(_raw): null {
+    return null;
+  },
+  serialize(_params): null {
+    return null;
+  },
+  getDisplayId(_params): null {
+    return null;
+  },
+};
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/server/parse.ts b/packages/adapters/opencode/src/server/parse.ts
new file mode 100644
index 000000000..39133ff97
--- /dev/null
+++ b/packages/adapters/opencode/src/server/parse.ts
@@ -0,0 +1,19 @@
+// For OpenCode adapter, we don't have complex output parsing in non-interactive mode
+// The output is just the AI's response text
+// We don't extract usage or session info from the output in this simple implementation
+
+export function parseOpenCodeOutput(output: string): { 
+  summary: string; 
+} {
+  return {
+    summary: output.trim()
+  };
+}
+
+// Since we don't have session management in this adapter, we don't need unknown session detection
+// But we'll export the function for completeness
+export function isOpenCodeUnknownSessionError(output: string): boolean {
+  // OpenCode doesn't have session IDs in the same way as Claude Code
+  // So we'll never have unknown session errors in this adapter
+  return false;
+}
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/server/test.ts b/packages/adapters/opencode/src/server/test.ts
new file mode 100644
index 000000000..93fb5dae2
--- /dev/null
+++ b/packages/adapters/opencode/src/server/test.ts
@@ -0,0 +1,100 @@
+import { 
+  AdapterEnvironmentTestContext, 
+  AdapterEnvironmentTestResult,
+  AdapterEnvironmentCheckLevel,
+  AdapterEnvironmentTestStatus,
+  ensureAbsoluteDirectory,
+  ensureCommandResolvable,
+  ensurePathInEnv
+} from '@paperclipai/adapter-utils/server-utils';
+
+export async function testEnvironment(
+  ctx: AdapterEnvironmentTestContext
+): Promise<AdapterEnvironmentTestResult> {
+  const checks = [];
+
+  // 1. Validate cwd
+  const cwd = ctx.config.cwd as string | undefined;
+  if (!cwd) {
+    checks.push({
+      code: 'MISSING_CWD',
+      level: 'error' as AdapterEnvironmentCheckLevel,
+      message: 'cwd is required',
+    });
+  } else {
+    try {
+      ensureAbsoluteDirectory(cwd);
+      checks.push({
+        code: 'CWD_VALID',
+        level: 'info' as AdapterEnvironmentCheckLevel,
+        message: `cwd is valid: ${cwd}`,
+      });
+    } catch (err) {
+      checks.push({
+        code: 'INVALID_CWD',
+        level: 'error' as AdapterEnvironmentCheckLevel,
+        message: `Invalid cwd: ${err.message}`,
+      });
+    }
+  }
+
+  // 2. Validate that opencode command is available
+  try {
+    // We need to pass the environment for command resolution
+    // Build a basic environment for testing
+    const env = {
+      ...process.env,
+      // We don't have the full buildPaperclipEnv here, but for command resolution we just need PATH
+    };
+    ensureCommandResolvable('opencode', cwd ?? '.', env);
+    checks.push({
+      code: 'OPENCODE_COMMAND_AVAILABLE',
+      level: 'info' as AdapterEnvironmentCheckLevel,
+      message: 'OpenCode CLI is available in PATH',
+    });
+  } catch (err) {
+    checks.push({
+      code: 'OPENCODE_COMMAND_NOT_FOUND',
+      level: 'error' as AdapterEnvironmentCheckLevel,
+      message: `OpenCode CLI not found: ${err.message}`,
+    });
+  }
+
+  // 3. Validate model if provided
+  const model = ctx.config.model as string | undefined;
+  if (model) {
+    // OpenCode accepts many model IDs, we can't easily validate them all
+    // But we can check if it's a non-empty string
+    if (model.trim().length === 0) {
+      checks.push({
+        code: 'INVALID_MODEL',
+        level: 'warn' as AdapterEnvironmentCheckLevel,
+        message: 'model should not be empty if provided',
+      });
+    } else {
+      checks.push({
+        code: 'MODEL_PROVIDED',
+        level: 'info' as AdapterEnvironmentCheckLevel,
+        message: `model is set to: ${model}`,
+      });
+    }
+  }
+
+  // Determine overall status
+  const hasError = checks.some(check => check.level === 'error');
+  const hasWarning = !hasError && checks.some(check => check.level === 'warn');
+  
+  let status: AdapterEnvironmentTestStatus = 'pass';
+  if (hasError) {
+    status = 'fail';
+  } else if (hasWarning) {
+    status = 'warn';
+  }
+
+  return {
+    adapterType: ctx.agent.adapterType,
+    status,
+    checks,
+    testedAt: new Date().toISOString(),
+  };
+}
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/ui/build-config.ts b/packages/adapters/opencode/src/ui/build-config.ts
new file mode 100644
index 000000000..0bc7e16c3
--- /dev/null
+++ b/packages/adapters/opencode/src/ui/build-config.ts
@@ -0,0 +1,36 @@
+import type { CreateConfigValues } from '@paperclipai/adapter-utils';
+
+export function buildOpenCodeConfig(v: CreateConfigValues): Record<string, unknown> {
+  const ac: Record<string, unknown> = {};
+
+  if (v.cwd) {
+    ac.cwd = v.cwd;
+  }
+  if (v.model) {
+    ac.model = v.model;
+  }
+  if (v.timeoutSec !== undefined) {
+    ac.timeoutSec = v.timeoutSec;
+  }
+  if (v.graceSec !== undefined) {
+    ac.graceSec = v.graceSec;
+  }
+  if (v.sessionHistoryLimit !== undefined) {
+    ac.sessionHistoryLimit = v.sessionHistoryLimit;
+  }
+
+  // Set default values for any missing optional fields
+  // (Though we are handling them above, we can also set defaults here if needed)
+  // For example, if we want to ensure timeoutSec is always set:
+  if (ac.timeoutSec === undefined) {
+    ac.timeoutSec = 120;
+  }
+  if (ac.graceSec === undefined) {
+    ac.graceSec = 15;
+  }
+  if (ac.sessionHistoryLimit === undefined) {
+    ac.sessionHistoryLimit = 10;
+  }
+
+  return ac;
+}
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/ui/config-fields.tsx b/packages/adapters/opencode/src/ui/config-fields.tsx
new file mode 100644
index 000000000..5f6fa6239
--- /dev/null
+++ b/packages/adapters/opencode/src/ui/config-fields.tsx
@@ -0,0 +1,98 @@
+import type { AdapterConfigFieldsProps } from '@paperclipai/adapter-utils';
+// Note: The skill says to use the primitives from `ui/src/components/agent-config-primitives`
+// We'll import them from the expected location in the Paperclip monorepo.
+import { Field, ToggleField, DraftInput, DraftNumberInput, help } from '@/components/agent-config-primitives';
+
+// We are using an alias `@/` for the Paperclip UI components.
+// In the Paperclip monorepo, this alias is set up to point to `ui/src`.
+// If you are not in the Paperclip monorepo, you may need to adjust this import.
+// However, when the adapter is used in Paperclip, the alias will be valid.
+
+export function OpenCodeConfigFields({ config, eff, set, values }: AdapterConfigFieldsProps) {
+  // Determine if we are in edit mode or create mode
+  const isEdit = !!config;
+
+  // Helper to get the current value for a field
+  const getValue = <T>(key: string): T => {
+    if (isEdit) {
+      // In edit mode, we read from the config
+      return (config as Record<string, unknown>)[key] as T;
+    } else {
+      // In create mode, we read from the form values
+      return (values as Record<string, unknown>)[key] as T;
+    }
+  };
+
+  // Helper to set a field value
+  const setValue = <T>(key: string, value: T) => {
+    if (isEdit) {
+      // In edit mode, we update the config via the eff function
+      eff({ [key]: value });
+    } else {
+      // In create mode, we update the form values via the set function
+      set({ [key]: value });
+    }
+  };
+
+  return (
+    <>
+      <Field
+        label="Working Directory"
+        description="Absolute path to the directory where OpenCode will run"
+      >
+        <DraftInput
+          placeholder="/path/to/project"
+          value={getValue<string>('cwd') || ''}
+          onChange={(e) => setValue('cwd', e.target.value)}
+        />
+      </Field>
+
+      <Field
+        label="Model"
+        description="OpenCode model to use for the agent"
+      >
+        <DraftInput
+          placeholder="claude-3.5-sonnet"
+          value={getValue<string>('model') || ''}
+          onChange={(e) => setValue('model', e.target.value)}
+        />
+      </Field>
+
+      <Field
+        label="Timeout (seconds)"
+        description="Maximum time to wait for each OpenCode invocation"
+      >
+        <DraftNumberInput
+          min={1}
+          step={1}
+          value={getValue<number>('timeoutSec') ?? 120}
+          onChange={(e) => setValue('timeoutSec', parseInt(e.target.value, 10) || 120)}
+        />
+      </Field>
+
+      <Field
+        label="Grace Period (seconds)"
+        description="Additional time to allow OpenCode to shut down after timeout"
+      >
+        <DraftNumberInput
+          min={1}
+          step={1}
+          value={getValue<number>('graceSec') ?? 15}
+          onChange={(e) => setValue('graceSec', parseInt(e.target.value, 10) || 15)}
+        />
+      </Field>
+
+      <Field
+        label="Session History Limit"
+        description="Maximum number of conversation turns to keep in history"
+      >
+        <DraftNumberInput
+          min={1}
+          step={1}
+          value={getValue<number>('sessionHistoryLimit') ?? 10}
+          onChange={(e) => setValue('sessionHistoryLimit', parseInt(e.target.value, 10) || 10)}
+        />
+      </Field>
+    </>
+  );
+}
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/ui/index.ts b/packages/adapters/opencode/src/ui/index.ts
new file mode 100644
index 000000000..311da763f
--- /dev/null
+++ b/packages/adapters/opencode/src/ui/index.ts
@@ -0,0 +1,12 @@
+import type { UIAdapterModule } from '../types';
+import { parseOpenCodeStdoutLine } from './parse-stdout';
+import { OpenCodeConfigFields } from './config-fields';
+import { buildOpenCodeConfig } from './build-config';
+
+export const opencodeUIAdapter: UIAdapterModule = {
+  type: 'opencode',
+  label: 'OpenCode',
+  parseStdoutLine: parseOpenCodeStdoutLine,
+  ConfigFields: OpenCodeConfigFields,
+  buildAdapterConfig: buildOpenCodeConfig,
+};
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/ui/parse-stdout.ts b/packages/adapters/opencode/src/ui/parse-stdout.ts
new file mode 100644
index 000000000..347e68b3f
--- /dev/null
+++ b/packages/adapters/opencode/src/ui/parse-stdout.ts
@@ -0,0 +1,18 @@
+// For OpenCode adapter, we're primarily using non-interactive mode
+// which doesn't produce the kind of streaming output that needs line-by-line parsing
+// for the transcript viewer. However, we still need to implement this interface.
+
+import type { TranscriptEntry } from '@paperclipai/adapter-utils';
+
+// In non-interactive mode, OpenCode outputs the response directly
+// We'll treat the entire output as a single assistant message
+export function parseOpenCodeStdoutLine(line: string, ts: string): TranscriptEntry[] {
+  // For simplicity, we'll return each line as a stdout entry
+  // In a more sophisticated implementation, we might buffer lines and
+  // detect when we have a complete response
+  return [{
+    kind: 'stdout',
+    ts,
+    text: line
+  }];
+}
\ No newline at end of file

From 4d556b3a0198d47db791da0c54583ecd08b7500b Mon Sep 17 00:00:00 2001
From: nathan shearer <help@rapidstartup.io>
Date: Sat, 28 Mar 2026 17:34:58 +0800
Subject: [PATCH 3/4] docs: map existing codebase

---
 .planning/codebase/ARCHITECTURE.md | 153 +++++++++++++++++++++
 .planning/codebase/CONCERNS.md     | 140 +++++++++++++++++++
 .planning/codebase/CONVENTIONS.md  | 135 ++++++++++++++++++
 .planning/codebase/INTEGRATIONS.md | 106 +++++++++++++++
 .planning/codebase/STACK.md        |  70 ++++++++++
 .planning/codebase/STRUCTURE.md    | 212 +++++++++++++++++++++++++++++
 .planning/codebase/TESTING.md      | 186 +++++++++++++++++++++++++
 7 files changed, 1002 insertions(+)
 create mode 100644 .planning/codebase/ARCHITECTURE.md
 create mode 100644 .planning/codebase/CONCERNS.md
 create mode 100644 .planning/codebase/CONVENTIONS.md
 create mode 100644 .planning/codebase/INTEGRATIONS.md
 create mode 100644 .planning/codebase/STACK.md
 create mode 100644 .planning/codebase/STRUCTURE.md
 create mode 100644 .planning/codebase/TESTING.md

diff --git a/.planning/codebase/ARCHITECTURE.md b/.planning/codebase/ARCHITECTURE.md
new file mode 100644
index 000000000..970f696b6
--- /dev/null
+++ b/.planning/codebase/ARCHITECTURE.md
@@ -0,0 +1,153 @@
+# Architecture
+
+**Analysis Date:** 2026-03-28
+
+## Pattern Overview
+
+**Overall:** Modular skill-based architecture with headless browser automation core
+
+**Key Characteristics:**
+- Skills as independent, self-contained modules with defined interfaces
+- Persistent headless browser server for automation tasks
+- CLI wrappers that communicate with persistent services
+- Template-driven skill generation system
+- Centralized configuration and state management
+
+## Layers
+
+**Presentation Layer (CLI):**
+- Purpose: Command-line interfaces for user interaction with skills
+- Location: `*/src/cli.ts` files across modules (browse, design, etc.)
+- Contains: Argument parsing, command routing, user output formatting
+- Depends on: Service layers, configuration systems
+- Used by: End users, scripts, other CLIs
+
+**Service Layer:**
+- Purpose: Core functionality implementation for each skill domain
+- Location: `*/src/` directories (e.g., `browse/src/`, `design/src/`)
+- Contains: Business logic, API integrations, core algorithms
+- Depends on: Infrastructure layer, external SDKs
+- Used by: Presentation layer, other services
+
+**Infrastructure Layer:**
+- Purpose: Shared utilities, configuration, state management, server infrastructure
+- Location: `browse/src/config.ts`, `browse/src/server.ts`, `scripts/` utilities
+- Contains: Persistent browser server, state persistence, config resolution, helper functions
+- Depends on: External packages (playwright, puppeteer-core, etc.)
+- Used by: All service and presentation layers
+
+**Template/Generation Layer:**
+- Purpose: Skill template system and documentation generation
+- Location: `scripts/gen-skill-docs.ts`, `.tmpl` template files
+- Contains: Template processing, skill scaffolding, documentation generation
+- Depends on: File system, template engines
+- Used by: Development workflows, skill creation process
+
+## Data Flow
+
+**Skill Execution Flow:**
+
+1. **Command Invocation:** User runs `gstack <skill> <command>` or direct binary (`browse`, `design`)
+2. **CLI Parsing:** Argument parsing and command routing in `*/src/cli.ts`
+3. **Server Management:** For browse skill, ensures persistent server is running via `ensureServer()`
+4. **Service Call:** Routes to appropriate service function based on command
+5. **Execution:** Service performs core functionality (browser automation, design generation, etc.)
+6. **Result Return:** Output formatted and returned to user via stdout/stderr
+
+**Browser Automation Flow (Browse Skill):**
+1. CLI reads state file (`.gstack/browse.json`) for server connection info
+2. If missing/stale, starts persistent Bun server running `browse/src/server.ts`
+3. CLI sends HTTP commands to server on localhost:port with bearer token auth
+4. Server executes Playwright/Puppeteer commands against Chromium
+5. Results returned via HTTP to CLI, then to user
+
+**Skill Documentation Flow:**
+1. `gen-skill-docs.ts` reads skill YAML/YAML-like configuration
+2. Processes SKILL.md.tmpl templates with skill-specific data
+3. Generates final SKILL.md files in each skill directory
+4. Also generates codex-specific variants when requested
+
+## Key Abstractions
+
+**Skill Abstraction:**
+- Purpose: Standardized interface for all gstack skills
+- Examples: `agents/openai.yaml`, `*/SKILL.md`, `*/SKILL.md.tmpl`
+- Pattern: Each skill has CLI, optional server, templates, tests, and documentation
+
+**Persistent Server Abstraction:**
+- Purpose: Long-running browser automation service
+- Examples: `browse/src/server.ts`, `browse/src/cli.ts` management functions
+- Pattern: State file (.gstack/browse.json) tracks PID, port, token; health checks via HTTP
+
+**Configuration Abstraction:**
+- Purpose: Centralized config resolution with defaults and environment overrides
+- Examples: `browse/src/config.ts`, `resolveConfig()` function
+- Pattern: Hierarchical resolution (defaults → file → env → args) with validation
+
+**Template Abstraction:**
+- Purpose: Reusable skill scaffolding and documentation generation
+- Examples: `SKILL.md.tmpl` files, `gen-skill-docs.ts` script
+- Pattern: Handlebars-style templating with skill metadata injection
+
+## Entry Points
+
+**Binary Entry Points:**
+- `browse/dist/browse`: Compiled browse CLI (primary user entry point)
+- `design/dist/design`: Compiled design CLI
+- `bin/gstack-global-discover`: Global skill discovery utility
+- `browse/dist/find-browse`: Helper for finding browse instances
+
+**Script Entry Points:**
+- `scripts/gen-skill-docs.ts`: Skill documentation generation
+- `scripts/skill-check.ts`: Skill health validation
+- `scripts/dev-skill.ts`: Skill development helper
+- `scripts/discover-skills.ts`: Skill discovery and listing
+
+**Direct Source Entry Points (Dev):**
+- `browse/src/cli.ts`: Development browse CLI
+- `design/src/cli.ts`: Development design CLI
+- `*/src/cli.ts`: Development CLIs for other skills
+
+## Error Handling
+
+**Strategy:** Defensive programming with clear error messages and graceful degradation
+
+**Patterns:**
+- **Server Lifecycle:** Automatic restart on version mismatch or failure, with startup error capture
+- **CLI Validation:** Early argument validation with clear usage instructions
+- **Network Resilience:** Retry mechanisms for transient connection failures in HTTP communication
+- **Process Management:** Cross-platform process detection and cleanup (Windows/Linux/macOS differences)
+- **Authentication:** Token validation with automatic refresh on mismatch
+- **File Operations:** Existence checks before read/write, graceful handling of missing files
+
+**Specific Implementations:**
+- Browse skill uses HTTP health checks (`isServerHealthy()`) instead of PID checks for cross-platform reliability
+- Windows uses Node.js child_process with detached:true for proper process detachment
+- Legacy state cleanup prevents conflicts between different installation methods
+- Server startup includes timeout handling and error log capture for diagnostics
+
+## Cross-Cutting Concerns
+
+**Logging:** 
+- Primary: Console output with color-coded prefixes (`[browse]`, `[design]`, etc.)
+- Levels: Error (console.error), info/status (console.log), debug (conditional)
+- Pattern: Consistent prefixed output for easy filtering
+
+**Validation:**
+- Input: Early validation of CLI arguments and configuration values
+- API: Response validation from external services (OpenAI, browser automation)
+- State: Version checking to detect mismatches between CLI and server binaries
+
+**State Management:**
+- Location: `.gstack/` directory in user home or project root
+- Persistence: JSON state files for server connection info, tokens, version hashes
+- Coordination: File-based locking to prevent race conditions during server startup
+- Cleanup: Automatic cleanup of stale state and legacy /tmp files
+
+**Authentication:**
+- Mechanism: Bearer token auth for CLI-to-server communication
+- Storage: Encrypted file storage (`~/.gstack/openai.json` for design, `.gstack/browse.json` for browse)
+- Resolution: Multiple sources (file → env → interactive prompt) with guided setup
+
+---
+*Architecture analysis: 2026-03-28*
\ No newline at end of file
diff --git a/.planning/codebase/CONCERNS.md b/.planning/codebase/CONCERNS.md
new file mode 100644
index 000000000..5a5ab349a
--- /dev/null
+++ b/.planning/codebase/CONCERNS.md
@@ -0,0 +1,140 @@
+# Codebase Concerns
+
+**Analysis Date:** 2026-03-28
+
+## Tech Debt
+
+**[Documentation gaps]:**
+- Issue: Many skill directories lack clear documentation on purpose and usage
+- Files: `agents/skill-*/README.md` (missing or minimal in many skills)
+- Impact: Difficult for new contributors to understand skill boundaries and responsibilities
+- Fix approach: Add standardized README templates for each skill with purpose, inputs, outputs, and examples
+
+**[Configuration complexity]:**
+- Issue: Multiple configuration mechanisms across skills (JSON, env vars, hardcoded values)
+- Files: `agents/*/config.ts`, `agents/*/*.json`, `.env.example`
+- Impact: Inconsistent configuration patterns increase cognitive load
+- Fix approach: Establish unified configuration pattern using `resolveConfig()` utility
+
+**[Build script fragmentation]:**
+- Issue: Build and setup scripts scattered across multiple directories
+- Files: `setup*`, `bin/*`, `scripts/*`, `package.json` scripts
+- Impact: Difficult to discover and maintain development workflows
+- Fix approach: Consolidate scripts into standardized locations with clear documentation
+
+## Known Bugs
+
+**[Skill registration failures]:**
+- Symptoms: Skills fail to load due to missing adapter configurations
+- Files: `agents/skill-parser.test.ts`, `agents/*/adapter.ts`
+- Trigger: When skill adapter doesn't implement required interfaces correctly
+- Workaround: Manual verification of adapter implementation
+- Fix approach: Add runtime validation during skill loading with clear error messages
+
+**[Browser cookie import race conditions]:**
+- Symptoms: Cookie import fails intermittently when browser is busy
+- Files: `browse/src/cookie-import-browser.ts`, `setup-browser-cookies/*`
+- Trigger: Concurrent access to browser profile during import
+- Workaround: Retry mechanism with exponential backoff
+- Fix approach: Implement proper file locking or use browser automation APIs
+
+## Security Considerations
+
+**[Environment variable exposure]:**
+- Risk: Accidental committing of `.env` files containing secrets
+- Files: `.env.example` (template), potential `.env*` files in developer environments
+- Current mitigation: `.gitignore` excludes `.env*` files
+- Recommendations: Add pre-commit hook to scan for accidental secrets, use secrets scanning in CI
+
+**[Insecure random number generation]:**
+- Risk: Use of non-cryptographically random values for security-sensitive operations
+- Files: `browse/src/sidebar-agent.ts` (generation of session IDs)
+- Current mitigation: None identified
+- Recommendations: Replace `Math.random()` with `crypto.randomUUID()` or similar secure alternatives
+
+## Performance Bottlenecks
+
+**[Skill loading latency]:**
+- Problem: Initial skill discovery and loading takes significant time
+- Files: `agents/skill-parser.ts`, `agents/skill-validation.ts`
+- Cause: Sequential file system operations for each skill directory
+- Improvement path: Implement skill caching with filesystem watchers for invalidation
+
+**[Browser instance multiplication]:**
+- Problem: Multiple browser instances spawned unnecessarily
+- Files: `browse/src/browser-manager.ts`, `browse/src/server.ts`
+- Cause: Lack of proper singleton pattern for browser manager
+- Improvement path: enforce singleton pattern and reuse browser contexts where safe
+
+## Fragile Areas
+
+**[Agent communication protocol]:**
+- Files: `agents/paperclip/*.ts`, `agents/*/adapter.ts`
+- Why fragile: Loose coupling via JSON messages without schema validation
+- Safe modification: Add JSON schema validation for all inter-agent messages
+- Test coverage: Gaps in error handling for malformed messages
+
+**[File system operation safety]:**
+- Files: `scripts/*` (file manipulation scripts), `setup*` scripts
+- Why fragile: Synchronous file operations without proper error handling
+- Safe modification: Wrap FS operations in try/catch with meaningful error messages
+- Test coverage: Limited unit testing for edge cases (permissions, missing directories)
+
+## Scaling Limits
+
+**[Concurrent skill execution]:**
+- Current capacity: Sequential skill execution in workflows
+- Limit: Long-running skills block entire workflow
+- Scaling path: Implement proper async/await patterns and worker queues for parallel execution
+
+**[Memory usage in browser operations]:**
+- Current capacity: Single browser session per user
+- Limit: Memory leaks in long-running browser sessions
+- Scaling path: Implement periodic browser restart and memory monitoring
+
+## Dependencies at Risk
+
+**[PUPPETEER_EXECUTABLE_PATH]:**
+- Risk: Hardcoded paths to browser executables in `browse/src/platform.ts`
+- Impact: Breaks when browser updates or when running in different environments
+- Migration plan: Use environment-configurable paths with auto-detection fallback
+
+**[Node.js version compatibility]:**
+- Risk: Use of modern Node.js features (`import.meta`, top-level await) that may break on older versions
+- Impact: Limits deployment environments
+- Migration plan: Either require specific Node.js version or transpile for broader compatibility
+
+## Missing Critical Features
+
+**[Skill versioning]:**
+- Problem: No mechanism to track skill versions or dependencies
+- Blocks: Safe updates and rollback of skills
+- Proposed solution: Add version metadata to skill configuration and implement compatibility checking
+
+**[Skill sandboxing]:**
+- Problem: Skills run with full process access
+- Blocks: Safe execution of third-party or untrusted skills
+- Proposed solution: Implement skill execution in restricted environments (e.g., VMs, containers)
+
+## Test Coverage Gaps
+
+**[Error handling in adapters]:**
+- What's not tested: Adapter failure scenarios and recovery
+- Files: `agents/*/adapter.ts`
+- Risk: Silent failures in skill execution
+- Priority: High
+
+**[Edge cases in file system operations]:**
+- What's not tested: Permission errors, disk full, concurrent access
+- Files: `scripts/*`, `setup*` scripts
+- Risk: Unhandled exceptions causing partial setup states
+- Priority: Medium
+
+**[Browser automation failure modes]:**
+- What's not tested: Network failures, browser crashes, element not found
+- Files: `browse/src/*`
+- Risk: Unreliable UI automation
+- Priority: High
+
+---
+*Concerns audit: 2026-03-28*
\ No newline at end of file
diff --git a/.planning/codebase/CONVENTIONS.md b/.planning/codebase/CONVENTIONS.md
new file mode 100644
index 000000000..d2807b275
--- /dev/null
+++ b/.planning/codebase/CONVENTIONS.md
@@ -0,0 +1,135 @@
+# Coding Conventions
+
+**Analysis Date:** 2026-03-28
+
+## Naming Patterns
+
+**Files:**
+- TypeScript files use kebab-case naming: `skill-parser.test.ts`, `gen-skill-docs.ts`
+- Test files follow `[feature].test.ts` pattern: `audit-compliance.test.ts`, `skill-e2e.test.ts`
+- Helper files in test directories use camelCase: `session-runner.ts`
+
+**Functions:**
+- Functions use camelCase: `extractBrowseCommands`, `validateSkill`, `parseArgs`
+- Async functions follow same naming: `runSetup`, `main`
+
+**Variables:**
+- Constants use UPPER_SNAKE_CASE: `FIXTURES_DIR`, `ROOT`, `AI_SLOP_BLACKLIST`
+- Variables use camelCase: `hasChanges`, `tokenBudget`, `cmds`
+- Boolean variables use is/has prefixes: `inBashBlock`, `DRY_RUN`
+
+**Types/Interfaces:**
+- Interface names use PascalCase: `BrowseCommand`, `ValidationResult`, `TemplateContext`
+- Type aliases follow PascalCase: `Host`
+
+## Code Style
+
+**Formatting:**
+- Uses 2-space indentation consistently
+- Line length varies but generally stays under 100 characters
+- No explicit formatter configured; follows existing code patterns
+- Semicolons are required and used consistently
+
+**Linting:**
+- No explicit linting configuration detected (.eslintrc, biome.json not found)
+- Code quality maintained through consistent patterns and manual review
+- TypeScript compiler provides strict type checking
+
+## Import Organization
+
+**Order:**
+1. Built-in Node.js modules: `fs`, `path`, `os`
+2. External packages: `bun:test`
+3. Internal modules: relative paths from project root
+4. Absolute internal paths: using `@/` or relative paths like `../../browse/src/commands`
+
+**Path Aliases:**
+- No path aliases detected in tsconfig.json
+- Uses relative paths: `../../browse/src/commands`, `../helpers/skill-parser`
+- Absolute paths from project root: `scripts/resolvers/types`
+
+## Error Handling
+
+**Patterns:**
+- Synchronous code: Uses try/catch for file operations
+  ```typescript
+  try {
+    fs.writeFileSync(outputPath, content);
+  } catch (err) {
+    // Handle error appropriately
+  }
+  ```
+- Asynchronous code: Prefers try/catch with async/await
+  ```typescript
+  async function main(): Promise<void> {
+    try {
+      // async operations
+    } catch (err: any) {
+      console.error(err.message || err);
+      process.exit(1);
+    }
+  }
+  ```
+- Validation: Early validation with descriptive errors
+  ```typescript
+  if (!key || !key.startsWith("sk-")) {
+    console.error("Invalid key. Must start with 'sk-'.");
+    process.exit(1);
+  }
+  ```
+
+## Logging
+
+**Framework:** Uses `console` methods directly
+
+**Patterns:**
+- Errors: `console.error()` for unexpected conditions and user-facing errors
+- Info: `console.log()` for general output and status messages
+- Debug: Limited use, mostly in development scripts
+- No structured logging library detected
+
+## Comments
+
+**When to Comment:**
+- File headers describe purpose and flow (seen in most files)
+- Complex logic gets inline comments explaining why, not what
+- TODO comments used for tracking future work: `// TODO:`
+
+**JSDoc/TSDoc:**
+- Used for all public APIs and complex functions
+- Includes @param, @returns, and @throws where applicable
+- Example:
+  ```typescript
+  /**
+   * Extract all $B invocations from bash code blocks in a SKILL.md file.
+   */
+  export function extractBrowseCommands(skillPath: string): BrowseCommand[] {
+  ```
+
+## Function Design
+
+**Size:** Functions tend to be small and focused
+- Most functions under 50 lines
+- Larger functions broken into smaller helpers (e.g., `processTemplate` in gen-skill-docs.ts)
+
+**Parameters:** 
+- Functions typically take 1-3 parameters
+- Parameter objects used for multiple related options
+- Explicit typing on all parameters and return values
+
+**Return Values:** 
+- Clear return types specified
+- Functions return meaningful values or Promises for async operations
+- Consistent error handling patterns
+
+## Module Design
+
+**Exports:** 
+- Named exports preferred: `export function extractBrowseCommands(...)`
+- Default exports used sparingly (mainly for classes or single-value exports)
+- Barrel files not commonly used; direct imports preferred
+
+**File Organization:**
+- Feature-based grouping: browse/, design/, scripts/, test/
+- Related functionality grouped in same directory
+- Test files colocated with source or in parallel test/ directory structure
\ No newline at end of file
diff --git a/.planning/codebase/INTEGRATIONS.md b/.planning/codebase/INTEGRATIONS.md
new file mode 100644
index 000000000..2ab967836
--- /dev/null
+++ b/.planning/codebase/INTEGRATIONS.md
@@ -0,0 +1,106 @@
+# External Integrations
+
+**Analysis Date:** 2026-03-28
+
+## APIs & External Services
+
+**AI/LLM Providers:**
+- Anthropic Claude - Used for skill evaluation and LLM judging
+  - SDK/Client: @anthropic-ai/sdk
+  - Auth: ANTHROPIC_API_KEY environment variable
+- OpenAI - Used for design generation, prototyping, and Codex metadata
+  - SDK/Client: Direct fetch API calls
+  - Auth: OPENAI_API_KEY environment variable or ~/.gstack/openai.json
+- OpenAI Codex - Referenced for CLI installation and metadata generation
+  - Integration: agents/openai.yaml metadata files
+  - Auth: Requires separate codex CLI installation
+
+**Data & Storage:**
+- Supabase - Used for telemetry storage, update checking, and community pulse functions
+  - SDK/Client: @supabase/supabase-js (loaded via esm.sh)
+  - Auth: SUPABASE_URL and SUPABASE_ANON_KEY environment variables
+  - Used in: telemetry-ingest, update-check, community-pulse edge functions
+
+**Browser Automation:**
+- Playwright - Primary browser automation for headless browsing
+  - Used in: browse skill for URL validation, snapshot testing
+  - Auth: None required (local browser instances)
+- Puppeteer-core - Alternative browser automation
+  - Used in: Some test scenarios and specific browsing features
+  - Auth: None required
+
+## Data Storage
+
+**Databases:**
+- Supabase PostgreSQL
+  - Connection: Via SUPABASE_URL and SUPABASE_ANON_KEY env vars
+  - Client: @supabase/supabase-js in edge functions
+  - Tables: update_checks, telemetry, community_pulse data (inferred)
+
+**File Storage:**
+- Local filesystem only - No external file storage services integrated
+  - Skills and data stored locally in ~/.gstack/ directory
+  - Telemetry stored in Supabase
+
+**Caching:**
+- None - No external caching services detected
+  - Local caching: In-memory or filesystem-based where needed
+
+## Authentication & Identity
+
+**Auth Provider:**
+- Custom/Open standards approach
+  - Implementation: Environment variable based API keys
+  - Supported providers: Anthropic, OpenAI via direct API key configuration
+  - No OAuth or third-party auth flows implemented
+
+## Monitoring & Observability
+
+**Error Tracking:**
+- None - No external error tracking services detected
+  - Local error handling: Console output and test assertions
+
+**Logs:**
+- Console output - Primary logging mechanism
+- Structured logging: Limited to test helpers and E2E helper functions
+- Telemetry: Collected and sent to Supabase via telemetry-ingest function
+
+## CI/CD & Deployment
+
+**Hosting:**
+- Self-hosted CLI tools - Designed for local installation and execution
+- No cloud hosting dependencies for core functionality
+
+**CI Pipeline:**
+- GitHub Actions - Used for automated testing and skill documentation generation
+  - Workflows: skill-docs.yml, evals.yml, evals-periodic.yml, ci-image.yml
+  - Triggers: Push, pull request, schedule
+
+## Environment Configuration
+
+**Required env vars:**
+- SUPABASE_URL - Supabase project URL
+- SUPABASE_ANON_KEY - Supabase anon key
+- ANTHROPIC_API_KEY - Anthropic API key for Claude access
+- OPENAI_API_KEY - OpenAI API key for GPT access
+
+**Secrets location:**
+- Environment variables - Expected to be set in runtime environment
+- Local config: ~/.gstack/openai.json for OpenAI API key (0600 permissions)
+- No secrets committed to repository
+
+## Webhooks & Callbacks
+
+**Incoming:**
+- None - No incoming webhook endpoints in core codebase
+  - Test examples: /webhook/stripe in skill-e2e-cso.test.ts (example only)
+
+**Outgoing:**
+- Supabase edge functions - Outgoing HTTP requests to external APIs
+  - OpenAI API calls from design/* skills
+  - Anthropic API calls from skill evaluation helpers
+  - No other outgoing webhooks detected
+
+---
+
+*Integration audit: 2026-03-28*
\ No newline at end of file
diff --git a/.planning/codebase/STACK.md b/.planning/codebase/STACK.md
new file mode 100644
index 000000000..0eb361061
--- /dev/null
+++ b/.planning/codebase/STACK.md
@@ -0,0 +1,70 @@
+# Technology Stack
+
+**Analysis Date:** 2026-03-28
+
+## Languages
+
+**Primary:**
+- TypeScript - Used throughout the codebase for all source files
+
+**Secondary:**
+- JavaScript - Used in some test files and configuration
+- Bash - Used in build scripts and helper scripts
+
+## Runtime
+
+**Environment:**
+- Bun.js >=1.0.0 - Primary runtime as specified in package.json engines
+
+**Package Manager:**
+- Bun - Built-in package manager
+- Lockfile: bun.lockb (present based on standard Bun usage)
+
+## Frameworks
+
+**Core:**
+- None - This is a skills/tooling repository, not an application framework
+
+**Testing:**
+- Bun:test - Built-in test runner used for all testing
+- Playwright - Used for browser automation in E2E tests
+- Puppeteer-core - Used for browser automation in some tests
+
+**Build/Dev:**
+- Bun build - Used for compiling TypeScript to native binaries
+- Custom scripts - Various TypeScript scripts for skill generation, documentation, etc.
+
+## Key Dependencies
+
+**Critical:**
+- diff ^7.0.0 - Used for text comparison operations
+- playwright ^1.58.2 - Browser automation for testing and browsing functionality
+- puppeteer-core ^24.40.0 - Alternative browser automation library
+
+**Infrastructure:**
+- @anthropic-ai/sdk ^0.78.0 - Anthropic API client for Claude integration (devDependency)
+
+## Configuration
+
+**Environment:**
+- Configured via .env.example file (contains template variables)
+- Key configs: SUPABASE_URL, SUPABASE_ANON_KEY, OPENAI_API_KEY, etc.
+
+**Build:**
+- package.json scripts - Defines all build and development commands
+- bun run build - Main build command that compiles binaries and generates documentation
+
+## Platform Requirements
+
+**Development:**
+- Bun.js >=1.0.0 required
+- Git for version control
+- Compatible with Windows, macOS, Linux
+
+**Production:**
+- Designed to run as CLI tools
+- Target platforms: Any where Bun.js runs
+
+---
+
+*Stack analysis: 2026-03-28*
\ No newline at end of file
diff --git a/.planning/codebase/STRUCTURE.md b/.planning/codebase/STRUCTURE.md
new file mode 100644
index 000000000..c9d9b8289
--- /dev/null
+++ b/.planning/codebase/STRUCTURE.md
@@ -0,0 +1,212 @@
+# Codebase Structure
+
+**Analysis Date:** 2026-03-28
+
+## Directory Layout
+
+```
+[project-root]/
+├── .github/               # GitHub Actions workflows and configs
+├── .planning/             # Generated planning documents (this analysis)
+├── agents/                # Skill agent configurations (YAML)
+├── autonplan/             # Autonomous planning skill
+├── benchmark/             # Performance benchmarking tools
+├── bin/                   # Executable scripts and CLI entry points
+├── browse/                # Headless browser automation skill (core)
+├── browse/bin/            # Compiled browse binaries
+├── browse/scripts/        # Browse-specific helper scripts
+├── browse/src/            # Browse skill source code
+├── browse/test/           # Browse skill tests
+├── canary/                # Canary release skill
+├── careful/               # Destructive operation protection skill
+├── codex/                 # Codex agent adapter
+├── connect-chrome/        # Chrome extension connector
+├── cso/                   # Customer success operations skill
+├── design/                # AI-powered design generation skill
+├── design/src/            # Design skill source code
+├── design/test/           # Design skill tests
+├── design-consultation/   # Design consultation skill
+├── design-review/         # Design review skill
+├── design-shotgun/        # Rapid design exploration skill
+├── docs/                  # Documentation files
+├── document-release/      # Release documentation skill
+├── extension/             # Browser extension source
+├── freeze/                # File edit protection skill
+├── gstack-upgrade/        # Self-upgrade skill
+├── guard/                 # Combined careful+freeze skill
+├── investigate/           # Investigation and analysis skill
+├── land-and-deploy/       # Deployment automation skill
+├── lib/                   # Shared libraries
+├── office-hours/          # Project initialization skill
+├── plan-ceo-review/       # CEO-level planning review 사실은 수정 필요
+├── plan-design-review/    # Design review planning skill
+├── plan-eng-review/       # Engineering planning skill
+├── qa/                    # Quality assurance testing skill
+├── qa-only/               # QA reporting only skill
+├── retro/                 # Retrospective meeting skill
+├── review/                # Pull request review skill
+├── scripts/               # Cross-cutting utility scripts
+├── setup-browser-cookies/ # Browser cookie import skill
+├── setup-deploy/          # Deployment setup skill
+├── ship/                  # Release shipping skill
+├── supabase/              # Supabase integration skill
+├── test/                  # Root-level test files
+├── unfreeze/              # File edit protection removal skill
+```
+
+## Directory Purposes
+
+**.github/:**
+- Purpose: GitHub Actions workflows for CI/CD
+- Contains: Workflow YAML files for skill docs, evals, CI images
+- Key files: `.github/workflows/skill-docs.yml`, `.github/workflows/evals.yml`
+
+**agents/:**
+- Purpose: Skill agent configurations for external AI integrations
+- Contains: YAML configurations for different AI providers
+- Key files: `agents/openai.yaml`
+
+**browse/:**
+- Purpose: Core headless browser automation functionality
+- Contains: Persistent browser server, CLI interface, automation commands
+- Key files: 
+  - `browse/src/server.ts` - Persistent browser automation server
+  - `browse/src/cli.ts` - CLI interface for browser commands
+  - `browse/src/config.ts` - Configuration resolution
+  - `browse/dist/browse` - Compiled binary entry point
+
+**design/:**
+- Purpose: AI-powered UI mockup generation and design assistance
+- Contains: Design generation, editing, and analysis tools
+- Key files:
+  - `design/src/cli.ts` - CLI for design commands
+  - `design/src/generate.ts` - Image generation core
+  - `design/src/serve.ts` - HTTP server for design boards
+  - `design/dist/design` - Compiled binary entry point
+
+**scripts/:**
+- Purpose: Cross-cutting utility scripts for skill management
+- Contains: Skill generation, validation, discovery, and development tools
+- Key files:
+  - `scripts/gen-skill-docs.ts` - Skill documentation generation
+  - `scripts/skill-check.ts` - Skill health validation
+  - `scripts/dev-skill.ts` - Skill development helper
+  - `scripts/discover-skills.ts` - Skill discovery and listing
+
+**bin/:**
+- Purpose: Executable scripts and compiled binaries
+- Contains: Global utilities and skill entry points
+- Key files:
+  - `bin/gstack-global-discover` - Global skill discovery utility
+  - `bin/gstack-config` - Configuration management
+  - `bin/gstack-analytics` - Usage analytics
+  - `bin/gstack-review-log` - PR review logging
+
+**test/:**
+- Purpose: Root-level test files and helpers
+- Contains: Test fixtures, helpers, and cross-cutting tests
+- Key files:
+  - `test/helpers/skill-parser.ts` - Skill YAML parsing
+  - `test/helpers/session-runner.ts` - E2E test session management
+  - `test/skill-e2e-*.test.ts` - End-to-end skill tests
+
+## Key File Locations
+
+**Entry Points:**
+- `browse/dist/browse`: Primary browse CLI (compiled)
+- `design/dist/design`: Primary design CLI (compiled)
+- `bin/gstack-global-discover`: Skill discovery utility
+- `browse/src/cli.ts`: Development browse CLI
+- `design/src/cli.ts`: Development design CLI
+
+**Configuration:**
+- `browse/src/config.ts`: Browse skill configuration resolution
+- `design/src/auth.ts`: Design skill API key management
+- `.gstack/`: User-specific state directory (created at runtime)
+- `package.json`: Project dependencies and scripts
+
+**Core Logic:**
+- `browse/src/server.ts`: Persistent browser automation server
+- `browse/src/sidebar-agent.ts`: Chrome extension communication agent
+- `design/src/generate.ts`: Core image generation logic
+- `design/src/memory.ts`: Design session persistence
+
+**Testing:**
+- `browse/test/`: Browse skill unit and E2E tests
+- `design/test/`: Design skill unit and E2e tests
+- `test/`: Root-level test helpers and fixtures
+- `test/skill-e2e-*.test.ts`: Cross-skill end-to-end tests
+
+## Naming Conventions
+
+**Files:**
+- **Skills:** kebab-case directory names (e.g., `skill-name/`)
+- **Source Files:** `.ts` extension, kebab-case naming (e.g., `skill-parser.test.ts`)
+- **Templates:** `.tmpl` extension for template files (e.g., `SKILL.md.tmpl`)
+- **Tests:** `.test.ts` suffix for test files (e.g., `skill-parser.test.ts`)
+- **Binaries:** No extension for compiled binaries (e.g., `browse`, `design`)
+- **Config:** Descriptive names with `.ts` extension (e.g., `config.ts`, `auth.ts`)
+
+**Directories:**
+- **Skill Modules:** kebab-case matching skill name (e.g., `browse/`, `design/`)
+- **Source Code:** `src/` directory within skill modules
+- **Tests:** `test/` directory within skill modules or at root
+- **Scripts:** `scripts/` directory for cross-cutting utilities
+- **Binaries:** `bin/` directory for executables, `*/dist/` for compiled skill binaries
+- **Templates:** Root directory for skill templates (e.g., `SKILL.md.tmpl` in skill dirs)
+
+## Where to Add New Code
+
+**New Skill:**
+- Primary code: `new-skill/src/` directory with `cli.ts`, core logic files
+- Tests: `new-skill/test/` directory
+- Template: `new-skill/SKILL.md.tmpl` (copy from existing)
+- Config: Add to `scripts/gen-skill-docs.ts` if auto-generation needed
+
+**New Component/Module:**
+- Implementation: Within existing skill's `src/` directory
+- Following patterns: Match existing file naming and structure
+- Exports: Use named exports for functions, default for main classes
+
+**Utilities:**
+- Shared helpers: `scripts/` directory for cross-cutting utilities
+- Skill-specific helpers: Within skill's `src/` directory
+- Persistent: Consider if should be in `lib/` for true sharing across skills
+
+**Configuration:**
+- Skill-specific: Within skill's `src/` directory (e.g., `config.ts`, `auth.ts`)
+- Global: Update `package.json` scripts or add to root config files
+
+## Special Directories
+
+**.planning/:**
+- Purpose: Generated codebase analysis documents from `/gsd-map-codebase`
+- Generated: Yes (by this analysis process)
+- Committed: Yes (for reference by other GSD commands)
+
+**.gstack/:**
+- Purpose: User-specific state directory for skills
+- Generated: Yes (at runtime by skills)
+- Committed: No (listed in .gitignore)
+- Contains: `browse.json` (server state), `openai.json` (API keys)
+
+**test/fixtures/:**
+- Purpose: Test data files for E2E and unit tests
+- Generated: No (committed test data)
+- Committed: Yes
+- Contains: HTML fixtures, test images, sample data
+
+**browse/test/fixtures/:**
+- Purpose: Browser automation test fixtures
+- Generated: No
+- Committed: Yes
+- Contains: Sample web pages for testing automation commands
+
+**node_modules/:**
+- Purpose: Dependency packages
+- Generated: Yes (by bun install)
+- Committed: No (listed in .gitignore)
+- Contains: Playwright, puppeteer-core, diff, and other dependencies
+
+---
+*Structure analysis: 2026-03-28*
\ No newline at end of file
diff --git a/.planning/codebase/TESTING.md b/.planning/codebase/TESTING.md
new file mode 100644
index 000000000..09d066ec6
--- /dev/null
+++ b/.planning/codebase/TESTING.md
@@ -0,0 +1,186 @@
+# Testing Patterns
+
+**Analysis Date:** 2026-03-28
+
+## Test Framework
+
+**Runner:**
+- Bun test framework (built-in)
+- Config: Implicit via package.json test scripts
+
+**Assertion Library:**
+- Bun:test expect API
+
+**Run Commands:**
+```bash
+bun test                            # Run all tests (excluding E2E)
+bun test --watch                    # Watch mode
+bun test --coverage                 # Coverage reporting
+bun test test/skill-parser.test.ts  # Run specific test file
+```
+
+## Test File Organization
+
+**Location:**
+- Mixed approach: tests colocated with source and in centralized test/ directory
+- Feature-specific tests in feature directories: `design/test/`, `browse/test/`
+- General tests in root `test/` directory
+
+**Naming:**
+- Test files: `[feature].test.ts` or `[feature].e2e.test.ts`
+- Helper/test utilities: `[name].ts` or `[name].test.ts`
+
+**Structure:**
+```
+test/
+├── skill-parser.test.ts
+├── audit-compliance.test.ts
+├── helpers/                    # Test helpers and fixtures
+├── browse/                     # Browse-specific tests
+└── design/                     # Design-specific tests
+```
+
+## Test Structure
+
+**Suite Organization:**
+```typescript
+import { describe, test, expect } from 'bun:test';
+import { functionToTest } from './module';
+
+describe('Function Name', () => {
+  test('description of what is being tested', () => {
+    // Arrange
+    const input = 'test input';
+    
+    // Act
+    const result = functionToTest(input);
+    
+    // Assert
+    expect(result).toBe('expected output');
+  });
+});
+```
+
+**Patterns:**
+- Setup: Using `beforeEach()`, `beforeAll()` when needed
+- Teardown: Cleanup in `afterEach()`, `afterAll()` 
+- Assertions: Using `expect()` matchers like `.toBe()`, `.toEqual()`, `.toHaveLength()`
+- Async testing: Using `await` with expect assertions
+
+## Mocking
+
+**Framework:** Manual mocking approach (no external mocking library)
+
+**Patterns:**
+- Temporary directories for file system tests:
+  ```typescript
+  const FIXTURES_DIR = path.join(os.tmpdir(), 'skill-parser-test');
+  fs.mkdirSync(FIXTURES_DIR, { recursive: true });
+  // ... create test files
+  // cleanup happens automatically via OS temp cleanup
+  ```
+- Function spying/stubbing: Limited use, mostly dependency injection
+- Network mocking: Not commonly used; tests use real fixtures or controlled inputs
+
+**What to Mock:**
+- File system operations (using temporary directories)
+- External APIs when testing integration points (via fixture files)
+- Date/time when testing time-dependent functionality
+
+**What NOT to Mock:**
+- Pure functions (test with real inputs/outputs)
+- Simple utility functions
+- Internal logic that can be tested directly
+
+## Fixtures and Factories
+
+**Test Data:**
+- Inline fixture creation for simple cases:
+  ```typescript
+  const p = writeFixture('test.md', [
+    '# Test',
+    '\`\`\`bash',
+    '$B goto https://example.com',
+    '\`\`\`',
+  ].join('\n'));
+  ```
+- Helper functions for complex setup:
+  ```typescript
+  function writeFixture(name: string, content: string): string {
+    fs.mkdirSync(FIXTURES_DIR, { recursive: true });
+    const p = path.join(FIXTURES_DIR, name);
+    fs.writeFileSync(p, content);
+    return p;
+  }
+  ```
+
+**Location:**
+- Test-specific helpers in `test/helpers/` directory
+- Inline fixtures for simple test data
+- Shared fixtures in test files when used by multiple tests
+
+## Coverage
+
+**Requirements:** No enforced coverage thresholds detected
+
+**View Coverage:**
+```bash
+bun test --coverage
+```
+
+## Test Types
+
+**Unit Tests:**
+- Majority of tests are unit tests
+- Test individual functions in isolation
+- Examples: `skill-parser.test.ts`, `audit-compliance.test.ts`
+
+**Integration Tests:**
+- Some tests verify integration between modules
+- Examples: E2E tests that test CLI command flows
+- Limited use due to nature of CLI/automation tool
+
+**E2E Tests:**
+- Present for end-to-end workflows
+- Files: `test/skill-e2e-*.test.ts`, `test/codex-e2e.test.ts`, `test/gemini-e2e.test.ts`
+- Uses `@bun:test` with longer timeouts
+- Tests complete user workflows
+
+## Common Patterns
+
+**Async Testing:**
+```typescript
+test('async operation', async () => {
+  const result = await asyncFunction();
+  expect(result).toBe('expected');
+});
+```
+
+**Error Testing:**
+```typescript
+test('throws on invalid input', () => {
+  expect(() => {
+    functionThatThrows('invalid');
+  }).toThrow(/invalid input/);
+});
+```
+
+**File System Testing:**
+```typescript
+test('reads file correctly', () => {
+  const tempFile = writeFixture('test.txt', 'content');
+  const result = readFile(tempFile);
+  expect(result).toBe('content');
+  // OS cleans up temp file automatically
+  // or explicit cleanup in afterAll()
+});
+```
+
+**Command Line Testing:**
+```typescript
+test('CLI command works', async () => {
+  const proc = Bun.spawn(['bun', 'run', 'cli', '--help']);
+  const response = await new Response(proc.stdout).text();
+  expect(response).toContain('Usage:');
+});
+```
\ No newline at end of file

From cbffcfe6b6cb5614398d1642d518437a3c7869a0 Mon Sep 17 00:00:00 2001
From: nathan shearer <help@rapidstartup.io>
Date: Sun, 29 Mar 2026 01:27:05 +0800
Subject: [PATCH 4/4] feat: add OpenCode integration for gstack skills

- Add OpenCode adapter for Paperclip agent system
- Add OpenCode command files for all gstack skills
- Enable gstack skills to be used in OpenCode via command dialog (Ctrl+K)
---
 .gitattributes                                |  17 ++
 AGENTS.md                                     | 135 ++++++++++-
 get-shit-done                                 |   1 +
 opencode                                      |   1 +
 packages/adapters/opencode/package.json       |  19 ++
 .../adapters/opencode/src/cli/format-event.ts |  34 +++
 packages/adapters/opencode/src/cli/index.ts   |   1 +
 packages/adapters/opencode/src/index.ts       |  28 +++
 .../adapters/opencode/src/server/execute.ts   | 209 ++++++++++++++++++
 .../adapters/opencode/src/server/index.ts     |  19 ++
 .../adapters/opencode/src/server/parse.ts     |  19 ++
 packages/adapters/opencode/src/server/test.ts | 100 +++++++++
 .../adapters/opencode/src/ui/build-config.ts  |  36 +++
 .../opencode/src/ui/config-fields.tsx         |  98 ++++++++
 packages/adapters/opencode/src/ui/index.ts    |  12 +
 .../adapters/opencode/src/ui/parse-stdout.ts  |  18 ++
 16 files changed, 745 insertions(+), 2 deletions(-)
 create mode 100644 .gitattributes
 create mode 160000 get-shit-done
 create mode 160000 opencode
 create mode 100644 packages/adapters/opencode/package.json
 create mode 100644 packages/adapters/opencode/src/cli/format-event.ts
 create mode 100644 packages/adapters/opencode/src/cli/index.ts
 create mode 100644 packages/adapters/opencode/src/index.ts
 create mode 100644 packages/adapters/opencode/src/server/execute.ts
 create mode 100644 packages/adapters/opencode/src/server/index.ts
 create mode 100644 packages/adapters/opencode/src/server/parse.ts
 create mode 100644 packages/adapters/opencode/src/server/test.ts
 create mode 100644 packages/adapters/opencode/src/ui/build-config.ts
 create mode 100644 packages/adapters/opencode/src/ui/config-fields.tsx
 create mode 100644 packages/adapters/opencode/src/ui/index.ts
 create mode 100644 packages/adapters/opencode/src/ui/parse-stdout.ts

diff --git a/.gitattributes b/.gitattributes
new file mode 100644
index 000000000..522616022
--- /dev/null
+++ b/.gitattributes
@@ -0,0 +1,17 @@
+# Store and checkout text as LF (cross-platform; matches web/TS conventions).
+* text=auto eol=lf
+
+# Binary — never apply line-ending conversion
+*.png binary
+*.jpg binary
+*.jpeg binary
+*.gif binary
+*.webp binary
+*.ico binary
+*.pdf binary
+*.woff binary
+*.woff2 binary
+*.ttf binary
+*.eot binary
+*.wasm binary
+*.zip binary
diff --git a/AGENTS.md b/AGENTS.md
index d87217453..4c740bacb 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -41,9 +41,140 @@ bun run gen:skill-docs   # regenerate SKILL.md files from templates
 bun run skill:check      # health dashboard for all skills
 ```
 
-## Key conventions
+### Test commands
+
+```bash
+# Run all tests (excluding slow E2E tests)
+bun test
+
+# Run specific test suites
+bun run test:evals          # LLM evaluation tests
+bun run test:e2e            # End-to-end tests
+bun run test:codex          # Codex-specific E2E tests
+bun run test:gemini         # Gemini-specific E2E tests
+bun run test:audit          # Audit compliance tests
+
+# Run a single test file
+bun test test/skill-parser.test.ts
+
+# Run a single test function (if supported by test runner)
+bun test test/skill-parser.test.ts -t "extracts \$B commands"
+```
+
+## Code style guidelines
+
+### Language & formatting
+
+- **Primary language**: TypeScript with ES modules (`"type": "module"` in package.json)
+- **Formatter**: No explicit formatter configured; follow existing code patterns
+- **Line length**: Aim for 80-100 characters; use judgment for readability
+- **Indentation**: 2 spaces (not tabs)
+- **Semicolons**: Required (follow existing code)
+- **Quotes**: Single quotes for strings, double quotes only when needed (e.g., JSX attributes)
+- **File naming**: `.ts` for TypeScript files, `.test.ts` for test files
+- **Directory organization**: Feature-based grouping (browse/, design/, scripts/, etc.)
+
+### Imports
+
+- **Order**: Built-in modules → external packages → internal modules
+- **Syntax**: 
+  - Named imports: `import { fs } from 'fs';`
+  - Default imports: `import fs from 'fs';` (when appropriate)
+  - Namespace imports: `import * as fs from 'fs';`
+- **Path aliases**: Use relative paths (`./helpers/util`) or absolute from project root
+- **Bun-specific**: Use `bun:test` for testing imports: `import { describe, test, expect } from 'bun:test';`
+
+### Types
+
+- **Type definitions**: Prefer interfaces over types for object shapes
+- **Explicit typing**: 
+  - Function parameters and return values should be typed
+  - Avoid `any`; use `unknown` when type is truly unknown
+  - Use generics for reusable components
+- **Nullable types**: Explicitly mark with `| null` or use strict null checks
+- **Type inference**: Trust TypeScript inference for simple cases
+
+### Naming conventions
+
+- **Variables & functions**: camelCase (e.g., `fetchUserData`)
+- **Classes & types**: PascalCase (e.g., `BrowserManager`)
+- **Constants**: UPPER_SNAKE_CASE (e.g., `MAX_START_WAIT`)
+- **Files**: kebab-case (e.g., `skill-parser.test.ts`)
+- **Private members**: Prefix with underscore only if truly internal (`_internalMethod`)
+- **Boolean variables**: Use is/has/can prefixes (e.g., `isEnabled`, `hasError`)
+
+### Error handling
+
+- **Synchronous code**: Use try/catch for recoverable errors
+- **Asynchronous code**: 
+  - Prefer try/catch with async/await
+  - For promises: `.then(result => ...).catch(error => handleError(error))`
+- **Validation**: Validate inputs early; throw descriptive errors
+- **Logging**: Use console.error for unexpected conditions; avoid console.log in libraries
+- **User-facing errors**: Provide clear, actionable messages
+- **Error types**: Consider creating custom error classes for domain-specific errors
+
+### Documentation
+
+- **JSDoc**: Use for all public APIs and complex functions
+- **File headers**: Include purpose and flow description (see existing files)
+- **Complex logic**: Add inline comments explaining why, not what
+- **TODO comments**: Use `// TODO:` for tracking future work
+- **Magic numbers**: Replace with named constants with explanations
+
+### Testing patterns
+
+- **Test files**: Name as `[feature].test.ts` alongside implementation or in `test/` directory
+- **Test structure**: 
+  - `describe()` for test suites
+  - `test()` for individual test cases
+  - `beforeAll()/afterAll()` for suite setup/teardown
+  - `beforeEach()/afterEach()` for test isolation
+- **Assertions**: Use `expect()` from `bun:test`
+- **Mocking**: 
+  - Manual mocks for simple cases
+  - Temporary directories for file system tests (`os.tmpdir()`)
+  - Child process testing with `spawnSync` for CLI commands
+- **E2E tests**: 
+  - Mark with `.e2e.test.ts` suffix
+  - Use test servers for HTTP testing
+  - Clean up resources in `afterAll()`
+
+### Specific patterns in this codebase
+
+- **Configuration**: Use `resolveConfig()` pattern for loading settings
+- **Process detection**: Check `process.platform` for OS-specific behavior
+- **Constants**: Define timeouts, limits, and magic values as constants at top of file
+- **HTTP servers**: Use consistent patterns for starting/stopping test servers
+- **File operations**: Always check existence before reading/writing; use synchronous versions in CLI scripts for simplicity
+- **CLI args**: Parse with `process.argv.slice(2)` or use parsing libraries for complex interfaces
+- **Environment**: Use `process.env` for configuration; provide defaults and validation
+
+## Safety guidelines
+
+- **Destructive operations**: Always confirm before running commands like `rm -rf`, `DROP TABLE`, or force pushes
+- **File modifications**: Prefer editing existing files over creating new ones unless explicitly required
+- **Branch protection**: Never force push to main/master branches
+- **Secret handling**: Never log or commit secrets, keys, or credentials
+- **Testing**: Run relevant tests before considering work complete
+- **Build verification**: Ensure `bun run build` succeeds after changes
+
+## Agent-specific instructions
+
+When operating as an agent in this repository:
+
+1. **Start with understanding**: Read related files before making changes
+2. **Follow existing patterns**: Match the coding style of the file you're editing
+3. **Test thoroughly**: Run relevant unit tests and verify manually when appropriate
+4. **Document changes**: Update comments and JSDoc when modifying behavior
+5. **Consider edge cases**: Think about error conditions and input validation
+6. **Keep changes focused**: Make minimal, purposeful changes
+7. **Verify build**: Ensure `bun run build` still works after your changes
+8. **Respect conventions**: Follow the established patterns for imports, naming, and error handling
+
+## Documentation
 
 - SKILL.md files are **generated** from `.tmpl` templates. Edit the template, not the output.
 - Run `bun run gen:skill-docs --host codex` to regenerate Codex-specific output.
 - The browse binary provides headless browser access. Use `$B <command>` in skills.
-- Safety skills (careful, freeze, guard) use inline advisory prose — always confirm before destructive operations.
+- Safety skills (careful, freeze, guard) use inline advisory prose — always confirm before destructive operations.
\ No newline at end of file
diff --git a/get-shit-done b/get-shit-done
new file mode 160000
index 000000000..1421dc07b
--- /dev/null
+++ b/get-shit-done
@@ -0,0 +1 @@
+Subproject commit 1421dc07bc1033f1b69e49d85cb6d625fd696b4f
diff --git a/opencode b/opencode
new file mode 160000
index 000000000..73ee49326
--- /dev/null
+++ b/opencode
@@ -0,0 +1 @@
+Subproject commit 73ee493265acf15fcd8caab2bc8cd3bd375b63cb
diff --git a/packages/adapters/opencode/package.json b/packages/adapters/opencode/package.json
new file mode 100644
index 000000000..9a10966c9
--- /dev/null
+++ b/packages/adapters/opencode/package.json
@@ -0,0 +1,19 @@
+{
+  "name": "@paperclipai/adapter-opencode",
+  "version": "0.0.1",
+  "private": true,
+  "type": "module",
+  "exports": {
+    ".": "./src/index.ts",
+    "./server": "./src/server/index.ts",
+    "./ui": "./src/ui/index.ts",
+    "./cli": "./src/cli/index.ts"
+  },
+  "dependencies": {
+    "@paperclipai/adapter-utils": "workspace:*",
+    "picocolors": "^1.1.1"
+  },
+  "devDependencies": {
+    "typescript": "^5.7.3"
+  }
+}
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/cli/format-event.ts b/packages/adapters/opencode/src/cli/format-event.ts
new file mode 100644
index 000000000..1f228abfc
--- /dev/null
+++ b/packages/adapters/opencode/src/cli/format-event.ts
@@ -0,0 +1,34 @@
+import pc from 'picocolors';
+
+/**
+ * Format a line of stdout from the OpenCode process for display in the terminal.
+ * This is used when running `paperclipai run --watch`.
+ *
+ * @param line - The line of stdout from the OpenCode process
+ * @param debug - Whether to enable debug output (unrecognized lines are shown in gray)
+ */
+export function formatOpenCodeStdoutEvent(line: string, debug: boolean): void {
+  // In this simple implementation, we just print the line as-is.
+  // We could try to parse the line to see if it's a known OpenCode output format,
+  // but for now we'll treat all lines as regular output.
+  console.log(line);
+
+  // If we wanted to do more sophisticated formatting, we could do something like:
+  // if (debug) {
+  //   // In debug mode, we might want to show all lines, even if we don't understand them
+  //   console.log(pc.gray(line));
+  // } else {
+  //   // In non-debug mode, we might want to filter or style known lines
+  //   // For example, if we knew that lines starting with "[INFO]" are info messages:
+  //   if (line.startsWith('[INFO]')) {
+  //     console.log(pc.blue(line));
+  //   } else if (line.startsWith('[ERROR]')) {
+  //     console.log(pc.red(line));
+  //   } else {
+  //     console.log(line);
+  //   }
+  // }
+}
+
+// Note: The CLI adapter interface expects a function named `formatStdoutEvent`.
+// We'll export it with that name in the index.ts file.
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/cli/index.ts b/packages/adapters/opencode/src/cli/index.ts
new file mode 100644
index 000000000..dae01a60a
--- /dev/null
+++ b/packages/adapters/opencode/src/cli/index.ts
@@ -0,0 +1 @@
+export { formatOpenCodeStdoutEvent as formatStdoutEvent } from './format-event';
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/index.ts b/packages/adapters/opencode/src/index.ts
new file mode 100644
index 000000000..6c1761372
--- /dev/null
+++ b/packages/adapters/opencode/src/index.ts
@@ -0,0 +1,28 @@
+export const type = "opencode";
+export const label = "OpenCode (local)";
+
+export const models = [
+  { id: "opencode", label: "OpenCode" },
+];
+
+export const agentConfigurationDoc = `# OpenCode agent configuration
+
+Adapter: opencode
+
+Use when:
+- The agent needs to run OpenCode CLI locally on the host machine
+- You want to use OpenCode's interactive TUI or non-interactive mode
+- The task requires OpenCode-specific features (e.g. multiple AI providers, session management)
+
+Don't use when:
+- You need a simple one-shot script execution (use the "process" adapter instead)
+- OpenCode CLI is not installed on the host
+- You need to use a different agent runtime (e.g. Claude Code, Codex)
+
+Core fields:
+- cwd (string, required): absolute working directory for the OpenCode process
+- model (string, optional): OpenCode model to use (default: claude-3.5-sonnet)
+- timeoutSec (number, optional): timeout for each OpenCode invocation in seconds (default: 120)
+- graceSec (number, optional): grace period for OpenCode to shut down after timeout (default: 15)
+- sessionHistoryLimit (number, optional): maximum number of conversation turns to keep in history (default: 10)
+`;
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/server/execute.ts b/packages/adapters/opencode/src/server/execute.ts
new file mode 100644
index 000000000..e7bc6c891
--- /dev/null
+++ b/packages/adapters/opencode/src/server/execute.ts
@@ -0,0 +1,209 @@
+import { 
+  AdapterExecutionContext, 
+  AdapterExecutionResult,
+  asString,
+  asNumber,
+  asBoolean,
+  parseObject,
+  renderTemplate,
+  buildPaperclipEnv,
+  redactEnvForLogs,
+  ensureAbsoluteDirectory,
+  ensureCommandResolvable,
+  ensurePathInEnv,
+  runChildProcess
+} from '@paperclipai/adapter-utils/server-utils';
+import * as fs from 'fs';
+import * as path from 'path';
+import * as os from 'os';
+
+export async function execute(ctx: AdapterExecutionContext): Promise<AdapterExecutionResult> {
+  // 1. Read config
+  const cwd = asString(ctx.config.cwd);
+  const model = asString(ctx.config.model, 'claude-3.5-sonnet');
+  const timeoutSec = asNumber(ctx.config.timeoutSec, 120);
+  const graceSec = asNumber(ctx.config.graceSec, 15);
+  const sessionHistoryLimit = asNumber(ctx.config.sessionHistoryLimit, 10);
+
+  // 2. Validate cwd
+  let absoluteCwd: string;
+  try {
+    absoluteCwd = ensureAbsoluteDirectory(cwd);
+  } catch (err) {
+    return {
+      exitCode: 1,
+      signal: null,
+      timedOut: false,
+      errorMessage: `Invalid cwd: ${err.message}`,
+      usage: null,
+      sessionId: null,
+      sessionParams: null,
+      sessionDisplayId: null,
+      provider: null,
+      model: null,
+      costUsd: null,
+      resultJson: null,
+      summary: null,
+      clearSession: false,
+    };
+  }
+
+  // 3. Build environment
+  const env = {
+    ...process.env,
+    ...buildPaperclipEnv(ctx.agent),
+    // Inject OpenCode specific env vars
+    OPENCODE_MODEL: model,
+    // Note: OpenCode uses environment variables for API keys, but we rely on the user's configuration
+    // We don't inject API keys here because OpenCode reads them from its own config or env vars.
+    // However, we can inject the Paperclip API key if needed for the paperclip skill.
+    // But note: the paperclip skill is injected via the skills directory, not via env.
+  };
+
+  // 4. Resolve session
+  // OpenCode uses SQLite database for session storage, so we don't manage session via env vars.
+  // Instead, we rely on OpenCode's built-in session management which uses the cwd to store sessions.
+  // We don't need to do anything special for session resume because OpenCode handles it internally
+  // based on the working directory.
+
+  // 5. Render prompt
+  const prompt = renderTemplate(
+    'You are agent {{agent.id}} ({{agent.name}}). Continue your Paperclip work.',
+    {
+      agentId: ctx.agent.id,
+      companyId: ctx.agent.companyId,
+      runId: ctx.runId,
+      company: ctx.context.company,
+      agent: ctx.context.agent,
+      run: ctx.context.run,
+      context: ctx.context,
+    }
+  );
+
+  // 6. Call onMeta (we don't have onMeta in the context, but the skill says to call it)
+  // Actually, the context has onMeta? Let's check the AdapterExecutionContext interface from the skill.
+  // The skill says: `onMeta?: (meta: AdapterInvocationMeta) => Promise<void>;`
+  // We'll call it if available.
+  if (ctx.onMeta) {
+    await ctx.onMeta({
+      adapterType: ctx.agent.adapterType,
+      agentId: ctx.agent.id,
+      runId: ctx.runId,
+      // We don't have the prompt in the meta, but we can include the config without secrets
+      config: {
+        model,
+        timeoutSec,
+        graceSec,
+        sessionHistoryLimit,
+        // Note: we don't include cwd in meta because it's not secret, but we can if needed.
+        // However, the skill says to use redactEnvForLogs for env, but for config we just pass non-secret fields.
+      },
+    });
+  }
+
+  // 7. Spawn the process
+  // We need to check if the opencode command is available
+  let command = 'opencode';
+  try {
+    ensureCommandResolvable(command, absoluteCwd, env);
+  } catch (err) {
+    return {
+      exitCode: 127,
+      signal: null,
+      timedOut: false,
+      errorMessage: `OpenCode CLI not found: ${err.message}`,
+      usage: null,
+      sessionId: null,
+      sessionParams: null,
+      sessionDisplayId: null,
+      provider: null,
+      model: null,
+      costUsd: null,
+      resultJson: null,
+      summary: null,
+      clearSession: false,
+    };
+  }
+
+  // We'll run opencode in non-interactive mode with the prompt
+  // Note: OpenCode non-interactive mode: opencode -p "your prompt"
+  // We also want to set the working directory
+  const args = ['-p', prompt];
+
+  // We also want to set the data directory to be inside the cwd to avoid conflicts
+  // OpenCode uses a data directory (default: .opencode) in the current working directory.
+  // We can leave it as default, which will be inside the cwd.
+
+  let childProcess;
+  let stdout = '';
+  let stderr = '';
+  let timedOut = false;
+
+  try {
+    const { 
+      exitCode, 
+      signal, 
+      output, 
+      timeout 
+    } = await runChildProcess(
+      ctx.runId,
+      command,
+      args,
+      {
+        cwd: absoluteCwd,
+        env,
+        timeout: timeoutSec * 1000, // convert to milliseconds
+        maxBuffer: 1024 * 1024, // 1MB max buffer
+      }
+    );
+
+    // Collect output
+    stdout = output.stdout ?? '';
+    stderr = output.stderr ?? '';
+
+    // Parse the output to extract usage, sessionId, etc.
+    // For OpenCode, the non-interactive mode outputs the response directly.
+    // We don't have a structured output for usage, so we'll set usage to null.
+    // We also don't have a session ID in the output for non-interactive mode.
+    // However, OpenCode does store sessions in the database, so we can try to get the latest session.
+    // But for simplicity, we'll not return session info in this version.
+
+    // We'll consider the exit code from the process
+    const result: AdapterExecutionResult = {
+      exitCode,
+      signal,
+      timedOut: timeout,
+      errorMessage: timeout ? 'Process timed out' : (stderr.length > 0 ? stderr : null),
+      usage: null, // OpenCode doesn't provide usage in non-interactive mode output
+      sessionId: null, // We don't have a session ID to return
+      sessionParams: null, // We don't manage session params in the adapter
+      sessionDisplayId: null,
+      provider: null, // We don't know the provider from the output
+      model,
+      costUsd: null, // We don't have cost info
+      resultJson: null, // We could store the raw output, but the skill doesn't require it
+      summary: stdout.trim(), // The summary is the stdout
+      clearSession: false, // We don't clear the session because we don't manage it
+    };
+
+    return result;
+  } catch (err) {
+    // If runChildProcess throws, it's likely a timeout or error
+    return {
+      exitCode: 1,
+      signal: null,
+      timedOut: err.timedOut ?? false,
+      errorMessage: err.message ?? 'Unknown error',
+      usage: null,
+      sessionId: null,
+      sessionParams: null,
+      sessionDisplayId: null,
+      provider: null,
+      model: null,
+      costUsd: null,
+      resultJson: null,
+      summary: null,
+      clearSession: false,
+    };
+  }
+}
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/server/index.ts b/packages/adapters/opencode/src/server/index.ts
new file mode 100644
index 000000000..548eebac6
--- /dev/null
+++ b/packages/adapters/opencode/src/server/index.ts
@@ -0,0 +1,19 @@
+export { execute } from './execute.js';
+export { testEnvironment } from './test.js';
+export { parseOpenCodeOutput, isOpenCodeUnknownSessionError } from './parse.js';
+
+// Session codec - required for session persistence
+// Since we're not managing OpenCode sessions in the adapter (relying on OpenCode's internal session mgmt),
+// we return null for session params and display ID.
+// In a more advanced implementation, we could integrate with OpenCode's session system.
+export const sessionCodec = {
+  deserialize(_raw): null {
+    return null;
+  },
+  serialize(_params): null {
+    return null;
+  },
+  getDisplayId(_params): null {
+    return null;
+  },
+};
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/server/parse.ts b/packages/adapters/opencode/src/server/parse.ts
new file mode 100644
index 000000000..39133ff97
--- /dev/null
+++ b/packages/adapters/opencode/src/server/parse.ts
@@ -0,0 +1,19 @@
+// For OpenCode adapter, we don't have complex output parsing in non-interactive mode
+// The output is just the AI's response text
+// We don't extract usage or session info from the output in this simple implementation
+
+export function parseOpenCodeOutput(output: string): { 
+  summary: string; 
+} {
+  return {
+    summary: output.trim()
+  };
+}
+
+// Since we don't have session management in this adapter, we don't need unknown session detection
+// But we'll export the function for completeness
+export function isOpenCodeUnknownSessionError(output: string): boolean {
+  // OpenCode doesn't have session IDs in the same way as Claude Code
+  // So we'll never have unknown session errors in this adapter
+  return false;
+}
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/server/test.ts b/packages/adapters/opencode/src/server/test.ts
new file mode 100644
index 000000000..93fb5dae2
--- /dev/null
+++ b/packages/adapters/opencode/src/server/test.ts
@@ -0,0 +1,100 @@
+import { 
+  AdapterEnvironmentTestContext, 
+  AdapterEnvironmentTestResult,
+  AdapterEnvironmentCheckLevel,
+  AdapterEnvironmentTestStatus,
+  ensureAbsoluteDirectory,
+  ensureCommandResolvable,
+  ensurePathInEnv
+} from '@paperclipai/adapter-utils/server-utils';
+
+export async function testEnvironment(
+  ctx: AdapterEnvironmentTestContext
+): Promise<AdapterEnvironmentTestResult> {
+  const checks = [];
+
+  // 1. Validate cwd
+  const cwd = ctx.config.cwd as string | undefined;
+  if (!cwd) {
+    checks.push({
+      code: 'MISSING_CWD',
+      level: 'error' as AdapterEnvironmentCheckLevel,
+      message: 'cwd is required',
+    });
+  } else {
+    try {
+      ensureAbsoluteDirectory(cwd);
+      checks.push({
+        code: 'CWD_VALID',
+        level: 'info' as AdapterEnvironmentCheckLevel,
+        message: `cwd is valid: ${cwd}`,
+      });
+    } catch (err) {
+      checks.push({
+        code: 'INVALID_CWD',
+        level: 'error' as AdapterEnvironmentCheckLevel,
+        message: `Invalid cwd: ${err.message}`,
+      });
+    }
+  }
+
+  // 2. Validate that opencode command is available
+  try {
+    // We need to pass the environment for command resolution
+    // Build a basic environment for testing
+    const env = {
+      ...process.env,
+      // We don't have the full buildPaperclipEnv here, but for command resolution we just need PATH
+    };
+    ensureCommandResolvable('opencode', cwd ?? '.', env);
+    checks.push({
+      code: 'OPENCODE_COMMAND_AVAILABLE',
+      level: 'info' as AdapterEnvironmentCheckLevel,
+      message: 'OpenCode CLI is available in PATH',
+    });
+  } catch (err) {
+    checks.push({
+      code: 'OPENCODE_COMMAND_NOT_FOUND',
+      level: 'error' as AdapterEnvironmentCheckLevel,
+      message: `OpenCode CLI not found: ${err.message}`,
+    });
+  }
+
+  // 3. Validate model if provided
+  const model = ctx.config.model as string | undefined;
+  if (model) {
+    // OpenCode accepts many model IDs, we can't easily validate them all
+    // But we can check if it's a non-empty string
+    if (model.trim().length === 0) {
+      checks.push({
+        code: 'INVALID_MODEL',
+        level: 'warn' as AdapterEnvironmentCheckLevel,
+        message: 'model should not be empty if provided',
+      });
+    } else {
+      checks.push({
+        code: 'MODEL_PROVIDED',
+        level: 'info' as AdapterEnvironmentCheckLevel,
+        message: `model is set to: ${model}`,
+      });
+    }
+  }
+
+  // Determine overall status
+  const hasError = checks.some(check => check.level === 'error');
+  const hasWarning = !hasError && checks.some(check => check.level === 'warn');
+  
+  let status: AdapterEnvironmentTestStatus = 'pass';
+  if (hasError) {
+    status = 'fail';
+  } else if (hasWarning) {
+    status = 'warn';
+  }
+
+  return {
+    adapterType: ctx.agent.adapterType,
+    status,
+    checks,
+    testedAt: new Date().toISOString(),
+  };
+}
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/ui/build-config.ts b/packages/adapters/opencode/src/ui/build-config.ts
new file mode 100644
index 000000000..0bc7e16c3
--- /dev/null
+++ b/packages/adapters/opencode/src/ui/build-config.ts
@@ -0,0 +1,36 @@
+import type { CreateConfigValues } from '@paperclipai/adapter-utils';
+
+export function buildOpenCodeConfig(v: CreateConfigValues): Record<string, unknown> {
+  const ac: Record<string, unknown> = {};
+
+  if (v.cwd) {
+    ac.cwd = v.cwd;
+  }
+  if (v.model) {
+    ac.model = v.model;
+  }
+  if (v.timeoutSec !== undefined) {
+    ac.timeoutSec = v.timeoutSec;
+  }
+  if (v.graceSec !== undefined) {
+    ac.graceSec = v.graceSec;
+  }
+  if (v.sessionHistoryLimit !== undefined) {
+    ac.sessionHistoryLimit = v.sessionHistoryLimit;
+  }
+
+  // Set default values for any missing optional fields
+  // (Though we are handling them above, we can also set defaults here if needed)
+  // For example, if we want to ensure timeoutSec is always set:
+  if (ac.timeoutSec === undefined) {
+    ac.timeoutSec = 120;
+  }
+  if (ac.graceSec === undefined) {
+    ac.graceSec = 15;
+  }
+  if (ac.sessionHistoryLimit === undefined) {
+    ac.sessionHistoryLimit = 10;
+  }
+
+  return ac;
+}
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/ui/config-fields.tsx b/packages/adapters/opencode/src/ui/config-fields.tsx
new file mode 100644
index 000000000..5f6fa6239
--- /dev/null
+++ b/packages/adapters/opencode/src/ui/config-fields.tsx
@@ -0,0 +1,98 @@
+import type { AdapterConfigFieldsProps } from '@paperclipai/adapter-utils';
+// Note: The skill says to use the primitives from `ui/src/components/agent-config-primitives`
+// We'll import them from the expected location in the Paperclip monorepo.
+import { Field, ToggleField, DraftInput, DraftNumberInput, help } from '@/components/agent-config-primitives';
+
+// We are using an alias `@/` for the Paperclip UI components.
+// In the Paperclip monorepo, this alias is set up to point to `ui/src`.
+// If you are not in the Paperclip monorepo, you may need to adjust this import.
+// However, when the adapter is used in Paperclip, the alias will be valid.
+
+export function OpenCodeConfigFields({ config, eff, set, values }: AdapterConfigFieldsProps) {
+  // Determine if we are in edit mode or create mode
+  const isEdit = !!config;
+
+  // Helper to get the current value for a field
+  const getValue = <T>(key: string): T => {
+    if (isEdit) {
+      // In edit mode, we read from the config
+      return (config as Record<string, unknown>)[key] as T;
+    } else {
+      // In create mode, we read from the form values
+      return (values as Record<string, unknown>)[key] as T;
+    }
+  };
+
+  // Helper to set a field value
+  const setValue = <T>(key: string, value: T) => {
+    if (isEdit) {
+      // In edit mode, we update the config via the eff function
+      eff({ [key]: value });
+    } else {
+      // In create mode, we update the form values via the set function
+      set({ [key]: value });
+    }
+  };
+
+  return (
+    <>
+      <Field
+        label="Working Directory"
+        description="Absolute path to the directory where OpenCode will run"
+      >
+        <DraftInput
+          placeholder="/path/to/project"
+          value={getValue<string>('cwd') || ''}
+          onChange={(e) => setValue('cwd', e.target.value)}
+        />
+      </Field>
+
+      <Field
+        label="Model"
+        description="OpenCode model to use for the agent"
+      >
+        <DraftInput
+          placeholder="claude-3.5-sonnet"
+          value={getValue<string>('model') || ''}
+          onChange={(e) => setValue('model', e.target.value)}
+        />
+      </Field>
+
+      <Field
+        label="Timeout (seconds)"
+        description="Maximum time to wait for each OpenCode invocation"
+      >
+        <DraftNumberInput
+          min={1}
+          step={1}
+          value={getValue<number>('timeoutSec') ?? 120}
+          onChange={(e) => setValue('timeoutSec', parseInt(e.target.value, 10) || 120)}
+        />
+      </Field>
+
+      <Field
+        label="Grace Period (seconds)"
+        description="Additional time to allow OpenCode to shut down after timeout"
+      >
+        <DraftNumberInput
+          min={1}
+          step={1}
+          value={getValue<number>('graceSec') ?? 15}
+          onChange={(e) => setValue('graceSec', parseInt(e.target.value, 10) || 15)}
+        />
+      </Field>
+
+      <Field
+        label="Session History Limit"
+        description="Maximum number of conversation turns to keep in history"
+      >
+        <DraftNumberInput
+          min={1}
+          step={1}
+          value={getValue<number>('sessionHistoryLimit') ?? 10}
+          onChange={(e) => setValue('sessionHistoryLimit', parseInt(e.target.value, 10) || 10)}
+        />
+      </Field>
+    </>
+  );
+}
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/ui/index.ts b/packages/adapters/opencode/src/ui/index.ts
new file mode 100644
index 000000000..311da763f
--- /dev/null
+++ b/packages/adapters/opencode/src/ui/index.ts
@@ -0,0 +1,12 @@
+import type { UIAdapterModule } from '../types';
+import { parseOpenCodeStdoutLine } from './parse-stdout';
+import { OpenCodeConfigFields } from './config-fields';
+import { buildOpenCodeConfig } from './build-config';
+
+export const opencodeUIAdapter: UIAdapterModule = {
+  type: 'opencode',
+  label: 'OpenCode',
+  parseStdoutLine: parseOpenCodeStdoutLine,
+  ConfigFields: OpenCodeConfigFields,
+  buildAdapterConfig: buildOpenCodeConfig,
+};
\ No newline at end of file
diff --git a/packages/adapters/opencode/src/ui/parse-stdout.ts b/packages/adapters/opencode/src/ui/parse-stdout.ts
new file mode 100644
index 000000000..347e68b3f
--- /dev/null
+++ b/packages/adapters/opencode/src/ui/parse-stdout.ts
@@ -0,0 +1,18 @@
+// For OpenCode adapter, we're primarily using non-interactive mode
+// which doesn't produce the kind of streaming output that needs line-by-line parsing
+// for the transcript viewer. However, we still need to implement this interface.
+
+import type { TranscriptEntry } from '@paperclipai/adapter-utils';
+
+// In non-interactive mode, OpenCode outputs the response directly
+// We'll treat the entire output as a single assistant message
+export function parseOpenCodeStdoutLine(line: string, ts: string): TranscriptEntry[] {
+  // For simplicity, we'll return each line as a stdout entry
+  // In a more sophisticated implementation, we might buffer lines and
+  // detect when we have a complete response
+  return [{
+    kind: 'stdout',
+    ts,
+    text: line
+  }];
+}
\ No newline at end of file