diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml
new file mode 100644
index 0000000..5a42571
--- /dev/null
+++ b/.github/workflows/release.yml
@@ -0,0 +1,66 @@
+name: release
+
+# Triggered by the tags that scripts/release.sh pushes (vX.Y.Z). Builds
+# installers on each OS and publishes them to a GitHub Release, then
+# flips that release from draft to public once every OS has finished.
+on:
+  push:
+    tags:
+      - 'v*' # glob: fires for every tag that starts with "v", not only vX.Y.Z
+
+permissions:
+  contents: write # create the release and upload assets
+
+concurrency:
+  group: release-${{ github.ref }} # one group per pushed tag ref
+  cancel-in-progress: false # a second run for the same tag waits; it never aborts a running one
+
+jobs:
+  build:
+    name: build (${{ matrix.os }})
+    runs-on: ${{ matrix.os }}
+    strategy:
+      fail-fast: false # one OS failing must not cancel the other OS builds
+      matrix:
+        os: [macos-latest, windows-latest, ubuntu-latest]
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+
+      - name: Setup Node 22
+        uses: actions/setup-node@v4
+        with:
+          node-version: '22'
+          cache: npm
+
+      - name: Install dependencies
+        run: npm ci
+
+      - name: Build and publish to the draft release
+        run: npm run release:ci
+        env:
+          # Lets electron-builder create/upload to the GitHub Release.
+          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+          # Optional macOS signing + notarization. Without these secrets the
+          # macOS build is unsigned and macOS auto-update stays disabled;
+          # Windows/Linux are unaffected. CSC_* goes to the macOS runner only:
+          # electron-builder would also sign Windows builds with CSC_LINK.
+          CSC_LINK: ${{ matrix.os == 'macos-latest' && secrets.CSC_LINK || '' }}
+          CSC_KEY_PASSWORD: ${{ matrix.os == 'macos-latest' && secrets.CSC_KEY_PASSWORD || '' }}
+          APPLE_ID: ${{ secrets.APPLE_ID }}
+          APPLE_APP_SPECIFIC_PASSWORD: ${{ secrets.APPLE_APP_SPECIFIC_PASSWORD }}
+          APPLE_TEAM_ID: ${{ secrets.APPLE_TEAM_ID }}
+
+  publish:
+    name: publish release
+    needs: build # skipped unless every build matrix job succeeded
+    runs-on: ubuntu-latest
+    permissions:
+      contents: write # required to edit the release
+    steps:
+      # Every OS build uploaded its assets to the draft release: make it
+      # public and mark it latest. No checkout here, hence explicit --repo.
+      - name: Promote draft to published
+        env:
+          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} # token the gh CLI authenticates with
+        run: gh release edit "${GITHUB_REF_NAME}" --repo "${GITHUB_REPOSITORY}" --draft=false --latest
diff --git a/CHANGELOG.md b/CHANGELOG.md
index aaff195..7c13df0 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -7,6 +7,36 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 
 ## [Unreleased]
 
+### AI (new)
+- **Ask AI on a snip** — capture a region and get it *solved/answered*
+  (math, code, questions, errors), not just described. A dockable chat
+  panel streams the response.
+- **Local-first routing** — on-device models via [Ollama](https://ollama.com)
+  with a first-run setup wizard; optional cloud providers as fallback.
+- **Providers**: Ollama (local), Anthropic Claude, OpenAI, Google Gemini,
+  DeepSeek (text), and Sarvam AI (Indic-strong Vision OCR → LLM solve).
+- **Autocorrect** for typed text and recognized handwriting (per-kind
+  toggles), **handwriting recognition** (drawn ink → text via a vision
+  model), and **trader chart analysis** from drawn levels.
+- **On-device learning (RAG)** — accepted corrections are remembered
+  locally to personalize suggestions; nothing leaves the machine.
+- **Per-profile** system prompts and model overrides in Settings → AI.
+- Follow-up questions retain full conversation context (image/OCR carried
+  across turns) until a new snip starts a fresh conversation.
+
+### Auto-update (new)
+- Background auto-update from GitHub Releases via `electron-updater`:
+  downloads in the background and applies on quit. Settings → Updates adds
+  an automatic-updates toggle, a manual check, and restart-to-update.
+  (macOS auto-update activates once the build is signed + notarized.)
+
+### Build & release (new)
+- Tag-driven release automation: `npm run release[:minor|:major]` bumps
+  the version, rolls the changelog, commits, tags, and pushes.
+- GitHub Actions builds macOS / Windows / Linux on a `v*` tag and
+  publishes installers + update manifests to GitHub Releases.
+- macOS builds now also emit a `.zip` (for Squirrel.Mac auto-update).
+
 ## [1.0.0] — 2026-05-20
 
 Initial open-source release of Lekhini, by
diff --git a/README.md b/README.md
index 329aa7c..460e6a9 100644
--- a/README.md
+++ b/README.md
@@ -35,6 +35,11 @@ content without switching apps.
   by default with a hotkey to toggle drawing.
 - **Undo/redo, clear, screenshot**, all from the toolbar or global
   hotkeys.
+- **AI, local-first.** Snip anything and **Ask AI** to solve/explain it,
+  autocorrect handwriting and typed text, and analyze trader charts —
+  running on-device via Ollama by default, with optional cloud providers.
+  Everything is opt-in and configured in **Settings → AI**. See
+  [docs/AI.md](./docs/AI.md).
 
 ## Tech stack
 
@@ -48,8 +53,12 @@ content without switching apps.
 - **Zustand** vanilla store with snapshot-based undo/redo history
 - **`electron-store`** for persisted orientation / theme / per-tool
   widths / active tool / color, with schema-tolerant hydration
-- **`electron-builder`** for notarized `.dmg` (and `nsis` /
-  `AppImage` for Windows / Linux)
+- **Local-first AI** — [Ollama](https://ollama.com) for on-device models,
+  with optional cloud providers (Anthropic, OpenAI, Gemini, DeepSeek,
+  Sarvam AI). See [docs/AI.md](./docs/AI.md).
+- **`electron-builder`** for `.dmg` + `.zip` (macOS), `nsis` (Windows),
+  `AppImage` (Linux), and **`electron-updater`** for background
+  auto-updates from GitHub Releases
 
 ## Architecture
 
@@ -154,29 +163,95 @@ After granting, quit and relaunch the app.
 
 Switch profile from **Settings → Profile**. The choice is remembered.
 
+## AI
+
+Lekhini's AI is **local-first and entirely opt-in**. Requests served by
+**Local AI** never leave your machine; cloud providers are an optional
+fallback, used only if you configure one with your own API key. Nothing
+AI-related is enabled until you set one of them up.
+
+**What you can do**
+
+- **Ask AI about a snip** — drag a region, click **Ask AI**, and a chat
+  panel opens. It *solves/answers* what's in the image (math, code,
+  questions, errors), not just describes it. Follow-up questions keep the
+  full conversation context until you start a new snip.
+- **Autocorrect** — typed text and recognized handwriting can be cleaned
+  up automatically (toggle per kind in Settings).
+- **Handwriting recognition** — drawn ink is transcribed to text on
+  device via a vision model.
+- **Trader analysis** — the Trader profile can hand your drawn levels to
+  the AI for a written read.
+- **On-device learning (RAG)** — accepted corrections are remembered
+  locally to personalize future suggestions. Stored only on your machine.
+
+**Providers**
+
+| Provider | Kind | Vision | Notes |
+| --- | --- | --- | --- |
+| **Ollama (Local)** | on-device | yes | Default. Private, free, no key. |
+| **Anthropic Claude** | cloud | yes | API key required |
+| **OpenAI** | cloud | yes | API key required |
+| **Google Gemini** | cloud | yes | API key required |
+| **DeepSeek** | cloud | no (text) | Strong reasoning; image snips are answered from text only |
+| **Sarvam AI** | cloud | yes (OCR→LLM) | Indic-strong document OCR, then solves |
+
+**Configure** in **Settings → AI**: enable Local AI (a first-run wizard
+installs Ollama + recommended models), or pick a cloud provider and paste
+its key. Routing is local-first — if Local AI is on and a suitable model
+is installed it's used; otherwise the configured cloud provider is.
+
+Full details — architecture, the resolver, per-profile prompts/models,
+privacy, and how each provider is wired — are in
+**[docs/AI.md](./docs/AI.md)**.
+
+## Updates
+
+Installed builds **auto-update from GitHub Releases** via
+`electron-updater`. By default new versions download in the background
+and apply on the next quit/relaunch. Manage this in **Settings →
+Updates**: toggle **Automatic updates**, **Check for updates** on demand,
+or **Restart to update** once a version is downloaded.
+
+> macOS auto-update requires a signed + notarized build. Until signing
+> is configured, macOS users update manually (Settings → Updates links to
+> the latest GitHub Release); Windows and Linux auto-update out of the box.
+
 ## Building installers
 
+Build for the **current OS** (most reliable locally):
+
 ```bash
-# macOS — set these in your shell for signed/notarized builds
-export APPLE_ID="you@example.com"
-export APPLE_APP_SPECIFIC_PASSWORD="xxxx-xxxx-xxxx-xxxx"
-export APPLE_TEAM_ID="ABCDE12345"
-export CSC_LINK="path/to/DeveloperIDApplication.p12"
-export CSC_KEY_PASSWORD="..."
+npm run build            # installers for this OS → release/
+npm run build:unpacked   # unpacked app dir, no installer (fastest)
+```
 
-npm run build:mac       # produces release/Lekhini-1.0.0-arm64.dmg (+ x64)
-npm run build:win       # produces release/Lekhini Setup 1.0.0.exe
-npm run build:linux     # produces release/Lekhini-1.0.0.AppImage
+Per-OS targets (cross-OS locally needs the right toolchains — CI is the
+supported path for all three at once):
+
+```bash
+npm run build:mac        # release/Lekhini-<ver>-arm64.dmg (+ x64) + .zip
+npm run build:win        # release/Lekhini Setup <ver>.exe
+npm run build:linux      # release/Lekhini-<ver>.AppImage
+npm run build:all        # attempt mac + win + linux (-mwl)
 ```
 
-Unsigned local builds (no notarization):
+Optional **macOS signing + notarization** — set these in your shell (or
+as CI secrets) and the build signs automatically; omit them for an
+unsigned build:
 
 ```bash
-npm run build:unpacked
+export APPLE_ID="you@example.com"
+export APPLE_APP_SPECIFIC_PASSWORD="xxxx-xxxx-xxxx-xxxx"
+export APPLE_TEAM_ID="ABCDE12345"
+export CSC_LINK="path/to/DeveloperIDApplication.p12"
+export CSC_KEY_PASSWORD="..."
 ```
 
-GitHub Actions on `macos-14` is the recommended CI target — same
-`npm run build` command, with the secrets above set as repo secrets.
+**Automated multi-OS builds + releases** run in CI — pushing a `vX.Y.Z`
+tag builds macOS / Windows / Linux in parallel and publishes them to
+GitHub Releases. See [RELEASING.md](./RELEASING.md); the one-liner is
+`npm run release` (patch) / `release:minor` / `release:major`.
 
 ## Hard constraint: macOS fullscreen Spaces
 
diff --git a/RELEASING.md b/RELEASING.md
index 2778a0e..68030af 100644
--- a/RELEASING.md
+++ b/RELEASING.md
@@ -45,42 +45,61 @@ Bug fixes and small polish that don't change behavior intentionally:
 - Dependency bumps that don't change behavior.
 - Documentation-only changes.
 
-## Cutting a release
-
-1. Make sure `main` is green: `npm run typecheck` and `npm run build`
-   succeed locally. CI on the release commit must also be green.
-2. Decide the version bump (major / minor / patch) per the policy above.
-3. Update `CHANGELOG.md`:
-   - Move items from `[Unreleased]` into a new versioned section.
-   - Add a dated heading: `## [X.Y.Z] — YYYY-MM-DD`.
-   - Update the link references at the bottom of the file.
-4. Bump `package.json`'s `version` field to the new version. Do NOT
-   use `npm version` if your workflow doesn't also tag — keep these
-   steps explicit.
-5. Commit:
+## Cutting a release (automated)
+
+Releases are **tag-driven**. One command bumps the version, rolls the
+changelog, commits, tags, and pushes — then CI builds every OS and
+publishes the GitHub Release. You do not build or upload anything by hand.
+
+1. Make sure the branch is clean and green (`npm run typecheck`, and CI
+   on the latest commit is passing). Land all release-worthy changes
+   first, with notes under `## [Unreleased]` in `CHANGELOG.md`.
+2. Run the release script with the bump type:
+   ```bash
+   npm run release          # patch (X.Y.Z+1) — the default
+   npm run release:minor    # X.Y+1.0
+   npm run release:major    # X+1.0.0
+   # or an exact version:
+   bash scripts/release.sh 1.4.0
    ```
-   git add CHANGELOG.md package.json package-lock.json
-   git commit -m "chore: release vX.Y.Z"
-   ```
-6. Tag the commit:
-   ```
-   git tag -a vX.Y.Z -m "Lekhini vX.Y.Z"
-   ```
-7. Push commit and tag:
-   ```
-   git push origin main
-   git push origin vX.Y.Z
-   ```
-8. Build the installers (signed where applicable):
-   ```
-   npm run build:mac      # produces release/Lekhini-X.Y.Z-arm64.dmg
-   npm run build:win      # produces release/Lekhini Setup X.Y.Z.exe
-   npm run build:linux    # produces release/Lekhini-X.Y.Z.AppImage
-   ```
-9. Create a GitHub Release from the `vX.Y.Z` tag:
-   - Title: `vX.Y.Z`
-   - Body: copy the relevant CHANGELOG section.
-   - Attach the installers from step 8.
+   This (see `scripts/release.sh`):
+   - refuses to run on a dirty tree,
+   - validates with `npm run prebuild` (typecheck + build),
+   - bumps `package.json` + `package-lock.json` (no tag yet),
+   - rolls `CHANGELOG.md`: `[Unreleased]` → a dated `[X.Y.Z]` section and
+     updates the link refs (`scripts/update-changelog.mjs`),
+   - commits `chore(release): vX.Y.Z`, tags `vX.Y.Z`, and pushes both.
+3. The pushed tag triggers **`.github/workflows/release.yml`**, which:
+   - builds installers on macOS, Windows, and Linux in parallel
+     (`npm run release:ci` → `electron-builder --publish always`),
+   - uploads them plus the `latest*.yml` update manifests to a **draft**
+     GitHub Release for the tag,
+   - flips the release **public** once all three OSes succeed.
+4. Watch it at <https://github.com/opensourcebharat/lekhini/actions>.
+   When green, the release is live and installed apps will auto-update.
+
+### macOS signing (optional)
+
+The workflow signs + notarizes macOS builds **only when** these repo
+secrets exist; otherwise the macOS build is unsigned (and macOS
+auto-update stays disabled until they're added — Windows/Linux are
+unaffected): `CSC_LINK`, `CSC_KEY_PASSWORD`, `APPLE_ID`,
+`APPLE_APP_SPECIFIC_PASSWORD`, `APPLE_TEAM_ID`.
+
+### Local build (optional)
+
+To produce installers without releasing, use `npm run build` (current
+OS) or `npm run build:mac|win|linux`. These write to `release/` and do
+**not** publish.
+
+## Auto-update
+
+Installed apps check GitHub Releases via `electron-updater`
+(`src/main/updater.ts`), download in the background, and apply on quit.
+Users control this in **Settings → Updates** (toggle, manual check,
+restart-to-update). Because the feed is GitHub Releases, **every public
+release is automatically an update** for existing installs — so prefer
+small, frequent patch releases in the early stage.
 
 ## Tag naming
 
diff --git a/docs/AI.md b/docs/AI.md
new file mode 100644
index 0000000..b511f06
--- /dev/null
+++ b/docs/AI.md
@@ -0,0 +1,136 @@
+# AI in Lekhini
+
+Lekhini's AI is **local-first, private, and entirely opt-in**. Nothing
+AI-related runs until you turn it on, and requests served by Local AI
+never leave your machine. Cloud providers are an optional fallback, used
+only when you configure one with your own API key.
+
+This document explains what the AI features do, how routing works, how to
+configure each provider, where keys live, and how it's wired in code.
+
+---
+
+## What you can do
+
+| Feature | Where | What it does |
+| --- | --- | --- |
+| **Ask AI** | Snip → **Ask AI** | Opens a chat about the captured region and **solves/answers** it (math, code, a question, an error) rather than just describing it. |
+| **Follow-up chat** | Chat composer | Keeps the full conversation — the image (or its OCR text) is carried across turns — until a new snip starts a fresh conversation. |
+| **Autocorrect (typed)** | Settings → AI | Cleans grammar/spelling of typed text. |
+| **Autocorrect (drawn)** | Settings → AI | Cleans recognized handwriting. |
+| **Handwriting recognition** | Draw, then pause | Transcribes drawn ink to a text shape via a vision model. |
+| **Trader analysis** | Trader profile → Analyze | Sends your drawn levels (as numbers) for a written read. |
+| **On-device learning** | automatic | Remembers accepted corrections locally (RAG) to personalize future suggestions. |
+
+---
+
+## How routing works (local-first)
+
+A single resolver — `resolveProvider()` in
+[`src/main/ai/ipc.ts`](../src/main/ai/ipc.ts) — decides who serves each
+request:
+
+1. **Local first.** If **Local AI** is on, the Ollama service is running,
+   and a suitable model is installed, the request goes to Ollama. For an
+   image request it picks a **vision** model; for text, a **text** model.
+   Selection order: per-profile override → global default → the
+   profile's catalogue default → any installed model of the right kind.
+2. **Cloud fallback.** Otherwise, if a cloud provider is configured (has a
+   saved API key and is the active provider), the request goes there.
+3. **Nothing configured → no AI.** If neither is available, AI entry
+   points stay hidden/disabled and the chat shows a "set something up"
+   message. You must configure a provider before any AI feature works.
+
+The renderer stays provider-agnostic: it sends a request and subscribes
+to streamed chunks; the resolver picks local-vs-cloud and the concrete
+model server-side.
+
+---
+
+## Providers
+
+| Provider | Kind | Vision | Notes |
+| --- | --- | --- | --- |
+| **Ollama (Local)** | on-device | ✅ | Default. Private, free, no key. Models run via the local [Ollama](https://ollama.com) service. |
+| **Anthropic Claude** | cloud | ✅ | Native vision. |
+| **OpenAI** | cloud | ✅ | Native vision (`image_url`). |
+| **Google Gemini** | cloud | ✅ | Native vision (`inlineData`). |
+| **DeepSeek** | cloud | ❌ text-only | Strong reasoning; image snips are answered from text alone. Use a vision provider for image Q&A. |
+| **Sarvam AI** | cloud | ✅ (OCR→LLM) | Runs **Sarvam Vision** document OCR on the image, then solves with Sarvam's own chat model. Excellent for Indic + dense text. |
+
+**Sarvam's two-step pipeline** ([`src/main/ai/sarvam.ts`](../src/main/ai/sarvam.ts)):
+the snip PNG is wrapped in a zip and sent to Sarvam's job-based Document
+Intelligence (Vision) OCR; the extracted text is then embedded into the
+chat and solved by `sarvam-m` / `sarvam-30b` / `sarvam-105b`. OCR runs
+**once per conversation** (cached by session), so follow-ups are fast.
+
+---
+
+## Configuring it (Settings → AI)
+
+### Local AI (recommended)
+
+1. Toggle **Local AI (Ollama)** on. A first-run wizard checks for Ollama,
+   links you to install it if missing, starts the service, and downloads
+   a recommended model set (a small text model + a vision model + the
+   embedding model for learning).
+2. Optionally pin a **text** and **vision** model per profile, or install
+   extra models from the catalogue.
+
+Everything here stays on your device.
+
+### Cloud provider (optional fallback)
+
+1. Pick a provider under **Cloud fallback** and paste its API key, then
+   **Save**. **Test** confirms the round-trip.
+2. The provider/model you save becomes the active fallback used when
+   Local AI is off or has no suitable model installed.
+
+Get a key: each provider's row links to its console (Anthropic, OpenAI,
+Gemini, DeepSeek, Sarvam).
+
+### Other settings
+
+- **Autocorrect typed / drawn** — independent toggles (default off).
+- **Profile prompts** — override the built-in system prompt per profile.
+- **Default text font** — for newly created text shapes.
+- **Learning** — view/reset the on-device example store per profile.
+
+---
+
+## Privacy & where keys live
+
+- **Local AI**: text and images stay on your machine — nothing is sent to
+  a server.
+- **Cloud providers**: content goes directly to the provider you chose,
+  under its own data policy. Lekhini does not proxy or log it.
+- **API keys** are never stored in the plaintext settings file. They're
+  encrypted with the OS keychain (macOS Keychain / Windows DPAPI /
+  libsecret) via [`src/main/ai/credentials.ts`](../src/main/ai/credentials.ts),
+  in a sidecar `ai-credentials.json` decryptable only by your OS user.
+- **Learning (RAG)** examples are stored only on this device.
+
+---
+
+## Code map
+
+| Concern | File |
+| --- | --- |
+| Provider interface | [`src/main/ai/types.ts`](../src/main/ai/types.ts) |
+| Per-provider adapters | `src/main/ai/{anthropic,openai,gemini,deepseek,sarvam,ollama}.ts` |
+| Adapter registry (models, labels, key URLs) | [`src/main/ai/registry.ts`](../src/main/ai/registry.ts) |
+| Resolver + IPC + session image cache | [`src/main/ai/ipc.ts`](../src/main/ai/ipc.ts) |
+| Shared message assembly (history + first-turn image) | [`src/main/ai/messages.ts`](../src/main/ai/messages.ts) |
+| Local Ollama service + model catalogue | `src/main/ai/ollama*.ts` |
+| On-device learning (RAG) | `src/main/ai/rag.ts`, `ragIpc.ts` |
+| Encrypted API key store | [`src/main/ai/credentials.ts`](../src/main/ai/credentials.ts) |
+| Chat UI | [`src/renderer/toolbar/ChatPanel.tsx`](../src/renderer/toolbar/ChatPanel.tsx) |
+| Settings → AI UI | [`src/renderer/toolbar/App.tsx`](../src/renderer/toolbar/App.tsx) |
+
+**Adding a provider**: implement `ProviderAdapter.ask()` in a new
+`src/main/ai/<id>.ts`, add the id to `ProviderId` in
+[`src/shared/types.ts`](../src/shared/types.ts), register it in
+`registry.ts` (adapter + models + label + key URL), and add it to the
+cloud-provider checks in `ipc.ts`, the persistence validation in
+`hub.ts`, and the Settings maps in the toolbar `App.tsx`. The renderer,
+preload, and message assembly need no changes.
diff --git a/electron-builder.yml b/electron-builder.yml
index edb8b6a..1ea4c66 100644
--- a/electron-builder.yml
+++ b/electron-builder.yml
@@ -3,6 +3,18 @@ productName: Lekhini
 copyright: Copyright © 2026 Open Source Bharat — https://opensourcebharat.org
 asar: true
 
+# Auto-update feed + release target. electron-builder bakes this into
+# app-update.yml inside the build and, when run with --publish, uploads
+# the installers plus the latest*.yml manifests to GitHub Releases.
+# electron-updater reads the same feed at runtime to discover updates.
+publish:
+  provider: github
+  owner: opensourcebharat
+  repo: lekhini
+  # Upload to a DRAFT release; the release workflow flips it public only
+  # after every OS finishes, so users never see a half-uploaded release.
+  releaseType: draft
+
 # Single source-of-truth for the app icon. electron-builder auto-
 # generates the platform-specific .icns (macOS) and .ico (Windows)
 # from this PNG. Recommended: 1024×1024, transparent background.
@@ -17,6 +29,12 @@ files:
   - dist-electron
   - package.json
 
+# Bundled per-profile RAG seed examples ("intent files"), read at
+# runtime from process.resourcesPath/intent.
+extraResources:
+  - from: resources/intent
+    to: intent
+
 mac:
   category: public.app-category.productivity
   target:
@@ -24,6 +42,14 @@ mac:
       arch:
         - arm64
         - x64
+    # zip is what Squirrel.Mac consumes for auto-update; ship it
+    # alongside the dmg so updates work once the build is signed +
+    # notarized. (Unsigned builds still produce it; macOS just won't
+    # auto-apply until signing is configured.)
+    - target: zip
+      arch:
+        - arm64
+        - x64
   hardenedRuntime: true
   gatekeeperAssess: false
   entitlements: build/entitlements.mac.plist
diff --git a/package-lock.json b/package-lock.json
index 09e8166..99fb3fa 100644
--- a/package-lock.json
+++ b/package-lock.json
@@ -9,9 +9,16 @@
       "version": "1.0.0",
       "license": "MIT",
       "dependencies": {
+        "@anthropic-ai/sdk": "^0.97.1",
+        "@google/generative-ai": "^0.24.1",
         "active-win": "^8.2.1",
         "electron-store": "^10.0.0",
+        "electron-updater": "^6.8.3",
+        "jszip": "^3.10.1",
+        "marked": "^18.0.4",
+        "openai": "^6.38.0",
         "perfect-freehand": "^1.2.2",
+        "sarvamai": "^1.1.7",
         "solid-js": "^1.8.22",
         "zustand": "^4.5.5"
       },
@@ -27,6 +34,27 @@
         "vite-plugin-solid": "^2.10.2"
       }
     },
+    "node_modules/@anthropic-ai/sdk": {
+      "version": "0.97.1",
+      "resolved": "https://registry.npmjs.org/@anthropic-ai/sdk/-/sdk-0.97.1.tgz",
+      "integrity": "sha512-wOf7AUeJPitcVpvKO4UMu63mWH5SaVipkGd7OOQJt/G6VYGlV8D2Gp9dLxOrttDJh/9gqPqdaBwDGcBevumeAg==",
+      "license": "MIT",
+      "dependencies": {
+        "json-schema-to-ts": "^3.1.1",
+        "standardwebhooks": "^1.0.0"
+      },
+      "bin": {
+        "anthropic-ai-sdk": "bin/cli"
+      },
+      "peerDependencies": {
+        "zod": "^3.25.0 || ^4.0.0"
+      },
+      "peerDependenciesMeta": {
+        "zod": {
+          "optional": true
+        }
+      }
+    },
     "node_modules/@babel/code-frame": {
       "version": "7.29.0",
       "resolved": "https://registry.npmjs.org/@babel/code-frame/-/code-frame-7.29.0.tgz",
@@ -282,6 +310,15 @@
         "@babel/core": "^7.0.0-0"
       }
     },
+    "node_modules/@babel/runtime": {
+      "version": "7.29.2",
+      "resolved": "https://registry.npmjs.org/@babel/runtime/-/runtime-7.29.2.tgz",
+      "integrity": "sha512-JiDShH45zKHWyGe4ZNVRrCjBz8Nh9TMmZG1kh4QTK8hCBTWBi8Da+i7s1fJw7/lYpM4ccepSNfqzZ/QvABBi5g==",
+      "license": "MIT",
+      "engines": {
+        "node": ">=6.9.0"
+      }
+    },
     "node_modules/@babel/template": {
       "version": "7.28.6",
       "resolved": "https://registry.npmjs.org/@babel/template/-/template-7.28.6.tgz",
@@ -1111,6 +1148,15 @@
       "devOptional": true,
       "license": "MIT"
     },
+    "node_modules/@google/generative-ai": {
+      "version": "0.24.1",
+      "resolved": "https://registry.npmjs.org/@google/generative-ai/-/generative-ai-0.24.1.tgz",
+      "integrity": "sha512-MqO+MLfM6kjxcKoy0p1wRzG3b4ZZXtPI+z2IE26UogS2Cm/XHO+7gGRBh6gcJsOiIVoH93UwKvW4HdgiOZCy9Q==",
+      "license": "Apache-2.0",
+      "engines": {
+        "node": ">=18.0.0"
+      }
+    },
     "node_modules/@isaacs/cliui": {
       "version": "8.0.2",
       "resolved": "https://registry.npmjs.org/@isaacs/cliui/-/cliui-8.0.2.tgz",
@@ -1805,6 +1851,12 @@
         "url": "https://github.com/sindresorhus/is?sponsor=1"
       }
     },
+    "node_modules/@stablelib/base64": {
+      "version": "1.0.1",
+      "resolved": "https://registry.npmjs.org/@stablelib/base64/-/base64-1.0.1.tgz",
+      "integrity": "sha512-1bnPQqSxSuc3Ii6MhBysoWCg58j97aUjuCSZrGSmDxNqtytIi0k8utUenAwTZN4V5mXXYGsVUI9zeBqy+jBOSQ==",
+      "license": "MIT"
+    },
     "node_modules/@szmarczak/http-timer": {
       "version": "4.0.6",
       "resolved": "https://registry.npmjs.org/@szmarczak/http-timer/-/http-timer-4.0.6.tgz",
@@ -2365,7 +2417,6 @@
       "version": "2.0.1",
       "resolved": "https://registry.npmjs.org/argparse/-/argparse-2.0.1.tgz",
       "integrity": "sha512-8+9WqebbFzpX9OR+Wa6O29asIogeRMzcGtAINdpMHHyAg10f05aSFVBbcEqGf/PXw1EjAZ+q2/bEBg3DvurK3Q==",
-      "dev": true,
       "license": "Python-2.0"
     },
     "node_modules/assert-plus": {
@@ -3280,7 +3331,6 @@
       "version": "1.0.2",
       "resolved": "https://registry.npmjs.org/core-util-is/-/core-util-is-1.0.2.tgz",
       "integrity": "sha512-3lqz5YjWTYnW6dlDa5TLaTCcShfar1e40rmcJVwCBJC6mWlFuj0eCHIElmG1g5kyuJ/GD+8Wn4FFCcz4gJPfaQ==",
-      "dev": true,
       "license": "MIT"
     },
     "node_modules/crc": {
@@ -3363,7 +3413,6 @@
       "version": "4.4.3",
       "resolved": "https://registry.npmjs.org/debug/-/debug-4.4.3.tgz",
       "integrity": "sha512-RGwwWnwQvkVfavKVt22FGLw+xYSdzARwm0ru6DhTVA3umU5hZc28V3kO4stgYryrTlLpuvgI9GiijltAjNbcqA==",
-      "devOptional": true,
       "license": "MIT",
       "dependencies": {
         "ms": "^2.1.3"
@@ -3924,6 +3973,82 @@
       "dev": true,
       "license": "ISC"
     },
+    "node_modules/electron-updater": {
+      "version": "6.8.3",
+      "resolved": "https://registry.npmjs.org/electron-updater/-/electron-updater-6.8.3.tgz",
+      "integrity": "sha512-Z6sgw3jgbikWKXei1ENdqFOxBP0WlXg3TtKfz0rgw2vIZFJUyI4pD7ZN7jrkm7EoMK+tcm/qTnPUdqfZukBlBQ==",
+      "license": "MIT",
+      "dependencies": {
+        "builder-util-runtime": "9.5.1",
+        "fs-extra": "^10.1.0",
+        "js-yaml": "^4.1.0",
+        "lazy-val": "^1.0.5",
+        "lodash.escaperegexp": "^4.1.2",
+        "lodash.isequal": "^4.5.0",
+        "semver": "~7.7.3",
+        "tiny-typed-emitter": "^2.1.0"
+      }
+    },
+    "node_modules/electron-updater/node_modules/builder-util-runtime": {
+      "version": "9.5.1",
+      "resolved": "https://registry.npmjs.org/builder-util-runtime/-/builder-util-runtime-9.5.1.tgz",
+      "integrity": "sha512-qt41tMfgHTllhResqM5DcnHyDIWNgzHvuY2jDcYP9iaGpkWxTUzV6GQjDeLnlR1/DtdlcsWQbA7sByMpmJFTLQ==",
+      "license": "MIT",
+      "dependencies": {
+        "debug": "^4.3.4",
+        "sax": "^1.2.4"
+      },
+      "engines": {
+        "node": ">=12.0.0"
+      }
+    },
+    "node_modules/electron-updater/node_modules/fs-extra": {
+      "version": "10.1.0",
+      "resolved": "https://registry.npmjs.org/fs-extra/-/fs-extra-10.1.0.tgz",
+      "integrity": "sha512-oRXApq54ETRj4eMiFzGnHWGy+zo5raudjuxN0b8H7s/RU2oW0Wvsx9O0ACRN/kRq9E8Vu/ReskGB5o3ji+FzHQ==",
+      "license": "MIT",
+      "dependencies": {
+        "graceful-fs": "^4.2.0",
+        "jsonfile": "^6.0.1",
+        "universalify": "^2.0.0"
+      },
+      "engines": {
+        "node": ">=12"
+      }
+    },
+    "node_modules/electron-updater/node_modules/jsonfile": {
+      "version": "6.2.1",
+      "resolved": "https://registry.npmjs.org/jsonfile/-/jsonfile-6.2.1.tgz",
+      "integrity": "sha512-zwOTdL3rFQ/lRdBnntKVOX6k5cKJwEc1HdilT71BWEu7J41gXIB2MRp+vxduPSwZJPWBxEzv4yH1wYLJGUHX4Q==",
+      "license": "MIT",
+      "dependencies": {
+        "universalify": "^2.0.0"
+      },
+      "optionalDependencies": {
+        "graceful-fs": "^4.1.6"
+      }
+    },
+    "node_modules/electron-updater/node_modules/semver": {
+      "version": "7.7.4",
+      "resolved": "https://registry.npmjs.org/semver/-/semver-7.7.4.tgz",
+      "integrity": "sha512-vFKC2IEtQnVhpT78h1Yp8wzwrf8CM+MzKMHGJZfBtzhZNycRFnXsHk6E5TxIkkMsgNS7mdX3AGB7x2QM2di4lA==",
+      "license": "ISC",
+      "bin": {
+        "semver": "bin/semver.js"
+      },
+      "engines": {
+        "node": ">=10"
+      }
+    },
+    "node_modules/electron-updater/node_modules/universalify": {
+      "version": "2.0.1",
+      "resolved": "https://registry.npmjs.org/universalify/-/universalify-2.0.1.tgz",
+      "integrity": "sha512-gptHNQghINnc/vTGIk0SOFGFNXw7JVrlRUtConJRlvaw6DuX0wO5Jeko9sWrMBhh+PsYAZ7oXAiOnf/UKogyiw==",
+      "license": "MIT",
+      "engines": {
+        "node": ">= 10.0.0"
+      }
+    },
     "node_modules/electron/node_modules/@types/node": {
       "version": "20.19.41",
       "resolved": "https://registry.npmjs.org/@types/node/-/node-20.19.41.tgz",
@@ -4163,6 +4288,12 @@
       "dev": true,
       "license": "MIT"
     },
+    "node_modules/fast-sha256": {
+      "version": "1.3.0",
+      "resolved": "https://registry.npmjs.org/fast-sha256/-/fast-sha256-1.3.0.tgz",
+      "integrity": "sha512-n11RGP/lrWEFI/bWdygLxhI+pVeo1ZYIVwvvPkW7azl/rOy+F3HYRZ2K5zeE9mmkhQppyv9sQFx0JM9UabnpPQ==",
+      "license": "Unlicense"
+    },
     "node_modules/fast-uri": {
       "version": "3.1.2",
       "resolved": "https://registry.npmjs.org/fast-uri/-/fast-uri-3.1.2.tgz",
@@ -4574,7 +4705,6 @@
       "version": "4.2.11",
       "resolved": "https://registry.npmjs.org/graceful-fs/-/graceful-fs-4.2.11.tgz",
       "integrity": "sha512-RbJ5/jmFcNNCcDV5o9eTnBLJ/HszWV0P73bc+Ff4nS/rJj+YaS6IGyiOL0VoBYX+l1Wrl3k63h/KrH+nhJ0XvQ==",
-      "devOptional": true,
       "license": "ISC"
     },
     "node_modules/has-flag": {
@@ -4802,6 +4932,12 @@
       ],
       "license": "BSD-3-Clause"
     },
+    "node_modules/immediate": {
+      "version": "3.0.6",
+      "resolved": "https://registry.npmjs.org/immediate/-/immediate-3.0.6.tgz",
+      "integrity": "sha512-XXOFtyqDjNDAQxVfYxuF7g9Il/IbWmmlQg2MYKOH8ExIT1qg6xc4zyS3HaEEATgs1btfzxq15ciUiY7gjSXRGQ==",
+      "license": "MIT"
+    },
     "node_modules/imurmurhash": {
       "version": "0.1.4",
       "resolved": "https://registry.npmjs.org/imurmurhash/-/imurmurhash-0.1.4.tgz",
@@ -4845,7 +4981,6 @@
       "version": "2.0.4",
       "resolved": "https://registry.npmjs.org/inherits/-/inherits-2.0.4.tgz",
       "integrity": "sha512-k/vGaX4/Yla3WzyMCvTQOXYeIHvqOKtnqBduzTHpzpQZzAskKMhZ2K+EnBiSM9zGSoIFeMpXKxa4dYeZIQqewQ==",
-      "devOptional": true,
       "license": "ISC"
     },
     "node_modules/ip-address": {
@@ -4928,9 +5063,7 @@
       "version": "1.0.0",
       "resolved": "https://registry.npmjs.org/isarray/-/isarray-1.0.0.tgz",
       "integrity": "sha512-VLghIWNM6ELQzo7zwmcg0NmTVyWKYjvIeM83yjp0wRDTmUnrM678fQbcKBo6n2CJEF0szoG//ytg+TKla89ALQ==",
-      "dev": true,
-      "license": "MIT",
-      "peer": true
+      "license": "MIT"
     },
     "node_modules/isbinaryfile": {
       "version": "5.0.7",
@@ -4997,7 +5130,6 @@
       "version": "4.1.1",
       "resolved": "https://registry.npmjs.org/js-yaml/-/js-yaml-4.1.1.tgz",
       "integrity": "sha512-qQKT4zQxXl8lLwBtHMWwaTcGfFOZviOJet3Oy/xmGk2gZH677CJM9EvtfdSkgWcATZhj/55JZ0rmy3myCT5lsA==",
-      "dev": true,
       "license": "MIT",
       "dependencies": {
         "argparse": "^2.0.1"
@@ -5026,6 +5158,19 @@
       "dev": true,
       "license": "MIT"
     },
+    "node_modules/json-schema-to-ts": {
+      "version": "3.1.1",
+      "resolved": "https://registry.npmjs.org/json-schema-to-ts/-/json-schema-to-ts-3.1.1.tgz",
+      "integrity": "sha512-+DWg8jCJG2TEnpy7kOm/7/AxaYoaRbjVB4LFZLySZlWn8exGs3A4OLJR966cVvU26N7X9TWxl+Jsw7dzAqKT6g==",
+      "license": "MIT",
+      "dependencies": {
+        "@babel/runtime": "^7.18.3",
+        "ts-algebra": "^2.0.0"
+      },
+      "engines": {
+        "node": ">=16"
+      }
+    },
     "node_modules/json-schema-traverse": {
       "version": "0.4.1",
       "resolved": "https://registry.npmjs.org/json-schema-traverse/-/json-schema-traverse-0.4.1.tgz",
@@ -5070,6 +5215,48 @@
         "graceful-fs": "^4.1.6"
       }
     },
+    "node_modules/jszip": {
+      "version": "3.10.1",
+      "resolved": "https://registry.npmjs.org/jszip/-/jszip-3.10.1.tgz",
+      "integrity": "sha512-xXDvecyTpGLrqFrvkrUSoxxfJI5AH7U8zxxtVclpsUtMCq4JQ290LY8AW5c7Ggnr/Y/oK+bQMbqK2qmtk3pN4g==",
+      "license": "(MIT OR GPL-3.0-or-later)",
+      "dependencies": {
+        "lie": "~3.3.0",
+        "pako": "~1.0.2",
+        "readable-stream": "~2.3.6",
+        "setimmediate": "^1.0.5"
+      }
+    },
+    "node_modules/jszip/node_modules/readable-stream": {
+      "version": "2.3.8",
+      "resolved": "https://registry.npmjs.org/readable-stream/-/readable-stream-2.3.8.tgz",
+      "integrity": "sha512-8p0AUk4XODgIewSi0l8Epjs+EVnWiK7NoDIEGU0HhE7+ZyY8D1IMY7odu5lRrFXGg71L15KG8QrPmum45RTtdA==",
+      "license": "MIT",
+      "dependencies": {
+        "core-util-is": "~1.0.0",
+        "inherits": "~2.0.3",
+        "isarray": "~1.0.0",
+        "process-nextick-args": "~2.0.0",
+        "safe-buffer": "~5.1.1",
+        "string_decoder": "~1.1.1",
+        "util-deprecate": "~1.0.1"
+      }
+    },
+    "node_modules/jszip/node_modules/safe-buffer": {
+      "version": "5.1.2",
+      "resolved": "https://registry.npmjs.org/safe-buffer/-/safe-buffer-5.1.2.tgz",
+      "integrity": "sha512-Gd2UZBJDkXlY7GbJxfsE8/nvKkUEU1G38c1siN6QP6a9PT9MmHB8GnpscSmMJSoF8LOIrt8ud/wPtojys4G6+g==",
+      "license": "MIT"
+    },
+    "node_modules/jszip/node_modules/string_decoder": {
+      "version": "1.1.1",
+      "resolved": "https://registry.npmjs.org/string_decoder/-/string_decoder-1.1.1.tgz",
+      "integrity": "sha512-n/ShnvDi6FHbbVfviro+WojiFzv+s8MPMHBczVePfUpDJLwoLT0ht1l4YwBCbi8pJAveEEdnkHyPyTP/mzRfwg==",
+      "license": "MIT",
+      "dependencies": {
+        "safe-buffer": "~5.1.0"
+      }
+    },
     "node_modules/keyv": {
       "version": "4.5.4",
       "resolved": "https://registry.npmjs.org/keyv/-/keyv-4.5.4.tgz",
@@ -5084,7 +5271,6 @@
       "version": "1.0.5",
       "resolved": "https://registry.npmjs.org/lazy-val/-/lazy-val-1.0.5.tgz",
       "integrity": "sha512-0/BnGCCfyUMkBpeDgWihanIAF9JmZhHBgUhEqzvf+adhNGLoP6TaiI5oF8oyb3I45P+PcnrqihSf01M0l0G5+Q==",
-      "dev": true,
       "license": "MIT"
     },
     "node_modules/lazystream": {
@@ -5137,6 +5323,15 @@
         "safe-buffer": "~5.1.0"
       }
     },
+    "node_modules/lie": {
+      "version": "3.3.0",
+      "resolved": "https://registry.npmjs.org/lie/-/lie-3.3.0.tgz",
+      "integrity": "sha512-UaiMJzeWRlEujzAuw5LokY1L5ecNQYZKfmyZ9L7wDHb/p5etKaxXhohBcrw0EYby+G/NA52vRSN4N39dxHAIwQ==",
+      "license": "MIT",
+      "dependencies": {
+        "immediate": "~3.0.5"
+      }
+    },
     "node_modules/lodash": {
       "version": "4.18.1",
       "resolved": "https://registry.npmjs.org/lodash/-/lodash-4.18.1.tgz",
@@ -5160,6 +5355,12 @@
       "license": "MIT",
       "peer": true
     },
+    "node_modules/lodash.escaperegexp": {
+      "version": "4.1.2",
+      "resolved": "https://registry.npmjs.org/lodash.escaperegexp/-/lodash.escaperegexp-4.1.2.tgz",
+      "integrity": "sha512-TM9YBvyC84ZxE3rgfefxUWiQKLilstD6k7PTGt6wfbtXF8ixIJLOL3VYyV/z+ZiPLsVxAsKAFVwWlWeb2Y8Yyw==",
+      "license": "MIT"
+    },
     "node_modules/lodash.flatten": {
       "version": "4.4.0",
       "resolved": "https://registry.npmjs.org/lodash.flatten/-/lodash.flatten-4.4.0.tgz",
@@ -5168,6 +5369,13 @@
       "license": "MIT",
       "peer": true
     },
+    "node_modules/lodash.isequal": {
+      "version": "4.5.0",
+      "resolved": "https://registry.npmjs.org/lodash.isequal/-/lodash.isequal-4.5.0.tgz",
+      "integrity": "sha512-pDo3lu8Jhfjqls6GkMgpahsF9kCyayhgykjyLMNFTKWrpVdAQtYyB4muAMWozBB4ig/dtWAmsMxLEI8wuz+DYQ==",
+      "deprecated": "This package is deprecated. Use require('node:util').isDeepStrictEqual instead.",
+      "license": "MIT"
+    },
     "node_modules/lodash.isplainobject": {
       "version": "4.0.6",
       "resolved": "https://registry.npmjs.org/lodash.isplainobject/-/lodash.isplainobject-4.0.6.tgz",
@@ -5316,6 +5524,18 @@
         "node": ">=12"
       }
     },
+    "node_modules/marked": {
+      "version": "18.0.4",
+      "resolved": "https://registry.npmjs.org/marked/-/marked-18.0.4.tgz",
+      "integrity": "sha512-c/BTaKzg0G6ezQx97DAkYU7k0HM6ys0FqYeKBL6hlBByZwy+ycA1+f0vDdjMHKKeEjdgkx0GOv9Il6D+85cOqA==",
+      "license": "MIT",
+      "bin": {
+        "marked": "bin/marked.js"
+      },
+      "engines": {
+        "node": ">= 20"
+      }
+    },
     "node_modules/matcher": {
       "version": "3.0.0",
       "resolved": "https://registry.npmjs.org/matcher/-/matcher-3.0.0.tgz",
@@ -5564,7 +5784,6 @@
       "version": "2.1.3",
       "resolved": "https://registry.npmjs.org/ms/-/ms-2.1.3.tgz",
       "integrity": "sha512-6FlzubTLZG3J2a/NVCAleEhjzq5oxgHyaCU9yYXvcLsvoVaHJq/s5xXI6/XXP6tz7R9xAOtHnSO/tXtF3WRTlA==",
-      "devOptional": true,
       "license": "MIT"
     },
     "node_modules/nanoid": {
@@ -5850,6 +6069,27 @@
         "url": "https://github.com/sponsors/sindresorhus"
       }
     },
+    "node_modules/openai": {
+      "version": "6.38.0",
+      "resolved": "https://registry.npmjs.org/openai/-/openai-6.38.0.tgz",
+      "integrity": "sha512-AoMplt2UalrpgUDMh3L09QWjNRlgJPipclQvA6sYAaeF6nHNBMgmikAZGmcYLn8on4d9sQY9Q8bOLfrBS7Lc8g==",
+      "license": "Apache-2.0",
+      "bin": {
+        "openai": "bin/cli"
+      },
+      "peerDependencies": {
+        "ws": "^8.18.0",
+        "zod": "^3.25 || ^4.0"
+      },
+      "peerDependenciesMeta": {
+        "ws": {
+          "optional": true
+        },
+        "zod": {
+          "optional": true
+        }
+      }
+    },
     "node_modules/ora": {
       "version": "5.4.1",
       "resolved": "https://registry.npmjs.org/ora/-/ora-5.4.1.tgz",
@@ -5923,6 +6163,12 @@
       "dev": true,
       "license": "BlueOak-1.0.0"
     },
+    "node_modules/pako": {
+      "version": "1.0.11",
+      "resolved": "https://registry.npmjs.org/pako/-/pako-1.0.11.tgz",
+      "integrity": "sha512-4hLB8Py4zZce5s4yd9XzopqwVv/yGNhV1Bl8NTmCq1763HeK2+EwVTv+leGeL13Dnh2wfbqowVPXCIO0z4taYw==",
+      "license": "(MIT AND Zlib)"
+    },
     "node_modules/parse5": {
       "version": "7.3.0",
       "resolved": "https://registry.npmjs.org/parse5/-/parse5-7.3.0.tgz",
@@ -6089,9 +6335,7 @@
       "version": "2.0.1",
       "resolved": "https://registry.npmjs.org/process-nextick-args/-/process-nextick-args-2.0.1.tgz",
       "integrity": "sha512-3ouUOpQhtgrbOa17J7+uxOTpITYWaGP7/AhoR3+A+/1e9skrzelGi/dXzEYyvbxubEF6Wn2ypscTKiKJFFn1ag==",
-      "dev": true,
-      "license": "MIT",
-      "peer": true
+      "license": "MIT"
     },
     "node_modules/progress": {
       "version": "2.0.3",
@@ -6440,11 +6684,21 @@
         "truncate-utf8-bytes": "^1.0.0"
       }
     },
+    "node_modules/sarvamai": {
+      "version": "1.1.7",
+      "resolved": "https://registry.npmjs.org/sarvamai/-/sarvamai-1.1.7.tgz",
+      "integrity": "sha512-xROqWjLB2jajV+CFzMUAS913poGgpVP0t/ELwn4cAVNXX4dju/LcP8VrOWzIeU0LTK9n2M00UQEriJTYNrIrJw==",
+      "dependencies": {
+        "ws": "^8.16.0"
+      },
+      "engines": {
+        "node": ">=18.0.0"
+      }
+    },
     "node_modules/sax": {
       "version": "1.6.0",
       "resolved": "https://registry.npmjs.org/sax/-/sax-1.6.0.tgz",
       "integrity": "sha512-6R3J5M4AcbtLUdZmRv2SygeVaM7IhrLXu9BmnOGmmACak8fiUtOsYNWUS4uK7upbmHIBbLBeFeI//477BKLBzA==",
-      "dev": true,
       "license": "BlueOak-1.0.0",
       "engines": {
         "node": ">=11.0.0"
@@ -6529,6 +6783,12 @@
       "devOptional": true,
       "license": "ISC"
     },
+    "node_modules/setimmediate": {
+      "version": "1.0.5",
+      "resolved": "https://registry.npmjs.org/setimmediate/-/setimmediate-1.0.5.tgz",
+      "integrity": "sha512-MATJdZp8sLqDl/68LfQmbP8zKPLQNV6BIZoIgrscFDQ+RsvK/BxeDQOgyxKKoh0y/8h3BqVFnCqQ/gd+reiIXA==",
+      "license": "MIT"
+    },
     "node_modules/shebang-command": {
       "version": "2.0.0",
       "resolved": "https://registry.npmjs.org/shebang-command/-/shebang-command-2.0.0.tgz",
@@ -6720,6 +6980,16 @@
         "node": "^12.13.0 || ^14.15.0 || >=16.0.0"
       }
     },
+    "node_modules/standardwebhooks": {
+      "version": "1.0.0",
+      "resolved": "https://registry.npmjs.org/standardwebhooks/-/standardwebhooks-1.0.0.tgz",
+      "integrity": "sha512-BbHGOQK9olHPMvQNHWul6MYlrRTAOKn03rOe4A8O3CLWhNf4YHBqq2HJKKC+sfqpxiBY52pNeesD6jIiLDz8jg==",
+      "license": "MIT",
+      "dependencies": {
+        "@stablelib/base64": "^1.0.0",
+        "fast-sha256": "^1.3.0"
+      }
+    },
     "node_modules/stat-mode": {
       "version": "1.0.0",
       "resolved": "https://registry.npmjs.org/stat-mode/-/stat-mode-1.0.0.tgz",
@@ -6935,6 +7205,12 @@
         "node": ">= 10.0.0"
       }
     },
+    "node_modules/tiny-typed-emitter": {
+      "version": "2.1.0",
+      "resolved": "https://registry.npmjs.org/tiny-typed-emitter/-/tiny-typed-emitter-2.1.0.tgz",
+      "integrity": "sha512-qVtvMxeXbVej0cQWKqVSSAHmKZEHAvxdF8HEUBFWts8h+xEo5m/lEiPakuyZ3BnCBjOD8i24kzNOiOLLgsSxhA==",
+      "license": "MIT"
+    },
     "node_modules/tmp": {
       "version": "0.2.5",
       "resolved": "https://registry.npmjs.org/tmp/-/tmp-0.2.5.tgz",
@@ -6972,6 +7248,12 @@
         "utf8-byte-length": "^1.0.1"
       }
     },
+    "node_modules/ts-algebra": {
+      "version": "2.0.0",
+      "resolved": "https://registry.npmjs.org/ts-algebra/-/ts-algebra-2.0.0.tgz",
+      "integrity": "sha512-FPAhNPFMrkwz76P7cdjdmiShwMynZYN6SgOujD1urY4oNm80Ou9oMdmbR45LotcKOXoy7wSmHkRFE6Mxbrhefw==",
+      "license": "MIT"
+    },
     "node_modules/type-fest": {
       "version": "4.41.0",
       "resolved": "https://registry.npmjs.org/type-fest/-/type-fest-4.41.0.tgz",
@@ -7114,7 +7396,6 @@
       "version": "1.0.2",
       "resolved": "https://registry.npmjs.org/util-deprecate/-/util-deprecate-1.0.2.tgz",
       "integrity": "sha512-EPD5q1uXyFxJpCrLnCc1nHnq3gOa6DZBocAIiI2TaSCA7VCJ1UJDMagCzIkXNsUYfD1daK//LTEQ8xiIbrHtcw==",
-      "devOptional": true,
       "license": "MIT"
     },
     "node_modules/verror": {
@@ -7364,6 +7645,27 @@
       "devOptional": true,
       "license": "ISC"
     },
+    "node_modules/ws": {
+      "version": "8.21.0",
+      "resolved": "https://registry.npmjs.org/ws/-/ws-8.21.0.tgz",
+      "integrity": "sha512-Vsp28b7DRcimFQvrqu2Wek3z1iYxDCWqHYB8Qsnk/S4RfaCQzPGPyBNuVjJV3cd6UiKtUtp6sNM77gWvzcCH+g==",
+      "license": "MIT",
+      "engines": {
+        "node": ">=10.0.0"
+      },
+      "peerDependencies": {
+        "bufferutil": "^4.0.1",
+        "utf-8-validate": ">=5.0.2"
+      },
+      "peerDependenciesMeta": {
+        "bufferutil": {
+          "optional": true
+        },
+        "utf-8-validate": {
+          "optional": true
+        }
+      }
+    },
     "node_modules/xmlbuilder": {
       "version": "15.1.1",
       "resolved": "https://registry.npmjs.org/xmlbuilder/-/xmlbuilder-15.1.1.tgz",
diff --git a/package.json b/package.json
index 1de772f..aadac90 100644
--- a/package.json
+++ b/package.json
@@ -22,18 +22,29 @@
     "prebuild": "tsc --noEmit && vite build",
     "build": "npm run prebuild && electron-builder",
     "build:unpacked": "npm run prebuild && electron-builder --dir",
-    "build:mac":   "npm run prebuild && electron-builder --mac",
-    "build:win":   "npm run prebuild && electron-builder --win",
+    "build:mac": "npm run prebuild && electron-builder --mac",
+    "build:win": "npm run prebuild && electron-builder --win",
     "build:linux": "npm run prebuild && electron-builder --linux",
-    "build:all":   "npm run prebuild && electron-builder -mwl",
+    "build:all": "npm run prebuild && electron-builder -mwl",
+    "release:ci": "npm run prebuild && electron-builder --publish always",
+    "release": "bash scripts/release.sh",
+    "release:minor": "bash scripts/release.sh minor",
+    "release:major": "bash scripts/release.sh major",
     "typecheck": "tsc --noEmit",
     "format": "prettier --write .",
     "fix:electron": "bash scripts/fix-electron.sh"
   },
   "dependencies": {
+    "@anthropic-ai/sdk": "^0.97.1",
+    "@google/generative-ai": "^0.24.1",
     "active-win": "^8.2.1",
     "electron-store": "^10.0.0",
+    "electron-updater": "^6.8.3",
+    "jszip": "^3.10.1",
+    "marked": "^18.0.4",
+    "openai": "^6.38.0",
     "perfect-freehand": "^1.2.2",
+    "sarvamai": "^1.1.7",
     "solid-js": "^1.8.22",
     "zustand": "^4.5.5"
   },
diff --git a/resources/intent/general.jsonl b/resources/intent/general.jsonl
new file mode 100644
index 0000000..62e75ed
--- /dev/null
+++ b/resources/intent/general.jsonl
@@ -0,0 +1,6 @@
+{"original": "i dont no where its at", "corrected": "I don't know where it is."}
+{"original": "she dont have no time for this", "corrected": "She doesn't have any time for this."}
+{"original": "their going to they're house later", "corrected": "They're going to their house later."}
+{"original": "recieve the package tommorow", "corrected": "Receive the package tomorrow."}
+{"original": "me and him went to the store", "corrected": "He and I went to the store."}
+{"original": "its definately gonna happen", "corrected": "It's definitely going to happen."}
diff --git a/resources/intent/teacher.jsonl b/resources/intent/teacher.jsonl
new file mode 100644
index 0000000..9752c62
--- /dev/null
+++ b/resources/intent/teacher.jsonl
@@ -0,0 +1,5 @@
+{"original": "the mitochondria is the power house of cell", "corrected": "The mitochondria are the powerhouse of the cell."}
+{"original": "photosynthesis make food in plants", "corrected": "Photosynthesis makes food in plants."}
+{"original": "gravity pull things down to the ground", "corrected": "Gravity pulls things down toward the ground."}
+{"original": "their are three states of matter", "corrected": "There are three states of matter."}
+{"original": "the equation balance on both side", "corrected": "The equation balances on both sides."}
diff --git a/resources/intent/trader.jsonl b/resources/intent/trader.jsonl
new file mode 100644
index 0000000..d4c8bd5
--- /dev/null
+++ b/resources/intent/trader.jsonl
@@ -0,0 +1,5 @@
+{"original": "price broke the resistence and going up", "corrected": "Price broke the resistance and is moving up."}
+{"original": "its a bullish trend with higher high", "corrected": "It's a bullish trend with higher highs."}
+{"original": "support hold at the fib level", "corrected": "Support held at the Fibonacci level."}
+{"original": "the candle close above the moving avg", "corrected": "The candle closed above the moving average."}
+{"original": "volume is increasing on the breakout", "corrected": "Volume is increasing on the breakout."}
diff --git a/scripts/release.sh b/scripts/release.sh
new file mode 100755
index 0000000..e7834f3
--- /dev/null
+++ b/scripts/release.sh
@@ -0,0 +1,58 @@
+#!/usr/bin/env bash
+set -euo pipefail
+
+# Cut a release: validate, bump the version, roll the CHANGELOG, commit,
+# tag, and push. The pushed tag triggers .github/workflows/release.yml,
+# which builds macOS / Windows / Linux installers and publishes them to
+# GitHub Releases. This script does NOT build installers itself.
+#
+# If anything fails after the version bump but before the release commit
+# exists, package.json, package-lock.json and CHANGELOG.md are restored
+# from HEAD so the tree is clean again and the script can be re-run.
+#
+# Usage:
+#   scripts/release.sh [patch|minor|major|<x.y.z>]   (default: patch)
+# Or via npm:
+#   npm run release          # patch
+#   npm run release:minor
+#   npm run release:major
+
+ROOT="$(cd "$(dirname "$0")/.." && pwd)"
+cd "$ROOT"
+
+BUMP="${1:-patch}"
+
+# Files this script rewrites before committing.
+RELEASE_FILES=(package.json package-lock.json CHANGELOG.md)
+# Flips to 1 once the release commit exists; until then any exit rolls
+# the release files back.
+COMMITTED=0
+
+# EXIT trap: undo the uncommitted bump / changelog edits on early exit.
+# Restoring from HEAD (index + worktree) is safe because step 1 verified
+# the tree was clean before this script touched anything.
+restore_on_failure() {
+  if [ "$COMMITTED" -eq 0 ]; then
+    for f in "${RELEASE_FILES[@]}"; do
+      git checkout HEAD -- "$f" 2>/dev/null || true
+    done
+  fi
+}
+
+# 1. Preconditions — clean tree so the release commit is exactly the
+#    version + changelog change and nothing else, and a real branch to
+#    push (a detached HEAD reports itself as the literal "HEAD").
+if [ -n "$(git status --porcelain)" ]; then
+  echo "✗ Working tree not clean. Commit or stash changes first." >&2
+  exit 1
+fi
+BRANCH="$(git rev-parse --abbrev-ref HEAD)"
+if [ "$BRANCH" = "HEAD" ]; then
+  echo "✗ Detached HEAD. Check out a branch before releasing." >&2
+  exit 1
+fi
+echo "→ Releasing from '$BRANCH' (bump: $BUMP)"
+
+# 2. Validate before tagging anything (typecheck + full vite build).
+echo "→ Validating build (npm run prebuild)…"
+npm run prebuild
+
+# 3. Bump package.json + lockfile WITHOUT committing or tagging — we do
+#    those explicitly so the CHANGELOG lands in the same commit. The
+#    rollback trap is armed first so a failed bump leaves nothing behind.
+trap restore_on_failure EXIT
+npm version "$BUMP" --no-git-tag-version >/dev/null
+VERSION="$(node -p "require('./package.json').version")"
+TAG="v$VERSION"
+echo "→ New version: $VERSION"
+
+# Look in refs/tags explicitly so a branch or other ref that happens to
+# be named like the tag cannot trigger a false "already exists".
+if git rev-parse -q --verify "refs/tags/$TAG" >/dev/null; then
+  echo "✗ Tag $TAG already exists. Never re-use a tag — bump again." >&2
+  exit 1
+fi
+
+# 4. Roll CHANGELOG: [Unreleased] → dated [VERSION] section + links.
+node scripts/update-changelog.mjs "$VERSION"
+
+# 5. Commit, tag, push. CI takes it from here.
+git add "${RELEASE_FILES[@]}"
+git commit -m "chore(release): $TAG"
+COMMITTED=1
+git tag -a "$TAG" -m "Lekhini $TAG"
+echo "→ Pushing '$BRANCH' and tag '$TAG'…"
+git push origin "$BRANCH"
+git push origin "$TAG"
+
+echo "✓ $TAG pushed. GitHub Actions will build + publish the release."
+echo "  Watch: https://github.com/opensourcebharat/lekhini/actions"
diff --git a/scripts/update-changelog.mjs b/scripts/update-changelog.mjs
new file mode 100644
index 0000000..5be598f
--- /dev/null
+++ b/scripts/update-changelog.mjs
@@ -0,0 +1,47 @@
+// Roll CHANGELOG.md for a release: move the "[Unreleased]" heading down
+// into a new dated "[VERSION]" section (leaving Unreleased empty for the
+// next cycle) and update the link references at the bottom of the file.
+// Invoked by scripts/release.sh with the freshly-bumped version.
+//
+// Usage: node scripts/update-changelog.mjs <version>
+
+import { readFileSync, writeFileSync } from 'node:fs';
+
+const version = process.argv[2];
+if (!version) {
+  console.error('usage: node scripts/update-changelog.mjs <version>');
+  process.exit(1);
+}
+
+const REPO = 'https://github.com/opensourcebharat/lekhini';
+const path = new URL('../CHANGELOG.md', import.meta.url);
+let md = readFileSync(path, 'utf8');
+
+const today = new Date().toISOString().slice(0, 10); // YYYY-MM-DD (UTC)
+
+const UNRELEASED = '## [Unreleased]';
+if (!md.includes(UNRELEASED)) {
+  console.error('CHANGELOG.md has no "## [Unreleased]" section.');
+  process.exit(1);
+}
+
+// 1. Insert the dated version heading just below [Unreleased], keeping
+//    an empty Unreleased section at the top.
+md = md.replace(UNRELEASED, `${UNRELEASED}\n\n## [${version}] — ${today}`);
+
+// 2. Find the previous version from the existing Unreleased compare link
+//    so we can build a proper compare range for the new one.
+const prevMatch = md.match(
+  /\[Unreleased\]:\s*\S+\/compare\/v(\d+\.\d+\.\d+(?:-[\w.]+)?)\.\.\.HEAD/,
+);
+const prev = prevMatch ? prevMatch[1] : null;
+
+// 3. Repoint [Unreleased] at the new version and add the version link.
+md = md.replace(/\[Unreleased\]:.*$/m, `[Unreleased]: ${REPO}/compare/v${version}...HEAD`);
+const versionLink = prev
+  ? `[${version}]: ${REPO}/compare/v${prev}...v${version}`
+  : `[${version}]: ${REPO}/releases/tag/v${version}`;
+md = md.replace(/(\[Unreleased\]:.*$)/m, `$1\n${versionLink}`);
+
+writeFileSync(path, md);
+console.log(`CHANGELOG.md rolled for v${version} (${today}).`);
diff --git a/src/main/ai/anthropic.ts b/src/main/ai/anthropic.ts
new file mode 100644
index 0000000..dc0c36d
--- /dev/null
+++ b/src/main/ai/anthropic.ts
@@ -0,0 +1,70 @@
+import Anthropic from '@anthropic-ai/sdk';
+import type { AskInput } from '../../shared/types';
+import type { ProviderAdapter } from './types';
+import { assembleTurns } from './messages';
+
+// The Anthropic SDK's MessageParam type is stricter than what's
+// useful at our boundary (media_type is a literal union; content is
+// a discriminated union per role). buildMessages() therefore returns
+// Anthropic.MessageParam[] directly and narrows the MIME type via
+// normaliseMime(), so no cast is needed at the call site. Stream shape
+// documented at https://docs.anthropic.com/en/api/messages-streaming.
+
+const MAX_TOKENS = 2048;
+
+// Anthropic only accepts these four image MIME types, so anything else
+// is coerced to 'image/png' to keep the SDK from rejecting the request
+// (the user can only produce PNGs from snip today). MIME types are
+// case-insensitive and 'image/jpg' is a common alias for 'image/jpeg',
+// so both are normalised first rather than being mislabelled as PNG.
+function normaliseMime(mime: string): 'image/png' | 'image/jpeg' | 'image/gif' | 'image/webp' {
+  const lowered = mime.trim().toLowerCase();
+  const canonical = lowered === 'image/jpg' ? 'image/jpeg' : lowered;
+  if (canonical === 'image/jpeg' || canonical === 'image/gif' || canonical === 'image/webp') {
+    return canonical;
+  }
+  return 'image/png';
+}
+
+function buildMessages(input: AskInput): Anthropic.MessageParam[] {
+  // Only the FIRST user turn carries the snip (as a base64 image block
+  // ahead of its text) so it stays in context across follow-ups; every
+  // other turn is replayed as plain text.
+  const assembled = assembleTurns(input);
+  const image = input.image;
+  const messages: Anthropic.MessageParam[] = [];
+  assembled.turns.forEach((turn, idx) => {
+    if (!image || idx !== assembled.firstUserIdx) {
+      messages.push({ role: turn.role, content: turn.content });
+      return;
+    }
+    messages.push({
+      role: 'user',
+      content: [
+        {
+          type: 'image',
+          source: {
+            type: 'base64',
+            media_type: normaliseMime(image.mime),
+            data: image.base64,
+          },
+        },
+        { type: 'text', text: turn.content },
+      ],
+    });
+  });
+  return messages;
+}
+
+export const anthropic: ProviderAdapter = {
+  id: 'anthropic',
+  // Streams one reply from the Anthropic Messages API, yielding each text
+  // delta as it arrives. `signal` is handed to the SDK as a request option.
+  async *ask(input, apiKey, signal) {
+    const sdk = new Anthropic({ apiKey });
+    const request = {
+      model: input.model,
+      max_tokens: MAX_TOKENS,
+      system: input.systemPrompt,
+      messages: buildMessages(input),
+    };
+    const events = sdk.messages.stream(request, { signal });
+    // Only `text_delta` payloads inside `content_block_delta` events are
+    // surfaced; every other stream event is skipped.
+    for await (const evt of events) {
+      if (evt.type !== 'content_block_delta') continue;
+      if (evt.delta.type !== 'text_delta') continue;
+      yield evt.delta.text;
+    }
+  },
+};
diff --git a/src/main/ai/credentials.ts b/src/main/ai/credentials.ts
new file mode 100644
index 0000000..74f26af
--- /dev/null
+++ b/src/main/ai/credentials.ts
@@ -0,0 +1,106 @@
+import { app, safeStorage } from 'electron';
+import fs from 'node:fs';
+import path from 'node:path';
+import type { ProviderId } from '../../shared/types';
+
+// API keys live OUTSIDE PersistedState (which is plaintext electron-store
+// JSON). Each key is encrypted with Electron's safeStorage and stashed
+// in a tiny sidecar file in userData/. safeStorage uses the platform
+// keychain underneath: macOS Keychain, Windows DPAPI, libsecret on
+// Linux. Decryption only succeeds for the same OS user account — so a
+// stolen ai-credentials.json (or config.json) doesn't yield the keys.
+//
+// File format on disk:
+//   <userData>/ai-credentials.json
+//   {
+//     "anthropic": "<base64 ciphertext>",
+//     "openai":    "<base64 ciphertext>",
+//     "gemini":    "<base64 ciphertext>"
+//   }
+//
+// In-memory fallback: if safeStorage.isEncryptionAvailable() returns
+// false (rare — would happen on a freshly-installed Linux without
+// libsecret), keys live in process memory only and are LOST when the
+// app quits. We log a clear warning and the renderer surfaces that
+// state in the AI settings UI.
+
+const FILE_NAME = 'ai-credentials.json';
+
+let memoryFallback: Partial<Record<ProviderId, string>> | null = null;
+
+// Absolute path of the credentials sidecar: <userData>/ai-credentials.json.
+function filePath(): string {
+  const userDataDir = app.getPath('userData');
+  return path.join(userDataDir, FILE_NAME);
+}
+
+// Load the provider → base64-ciphertext map from disk. Best-effort: a
+// missing, unreadable, or malformed file reads as an empty store.
+function readStore(): Record<string, string> {
+  try {
+    const parsed = JSON.parse(fs.readFileSync(filePath(), 'utf-8'));
+    // Arrays are rejected as well as primitives/null: a key assigned onto
+    // an array is dropped again by JSON.stringify, so it would never
+    // persist.
+    const isPlainMap = !!parsed && typeof parsed === 'object' && !Array.isArray(parsed);
+    return isPlainMap ? parsed : {};
+  } catch {
+    return {};
+  }
+}
+
+// Persist the provider → ciphertext map. Best-effort: a failure is
+// logged, never thrown to callers.
+//
+// The data is written to a sibling temp file and renamed over the real
+// one, so a crash mid-write cannot leave a truncated file (which
+// readStore would treat as "no keys"). The explicit chmod is needed
+// because writeFileSync's `mode` only applies when it creates the file.
+function writeStore(store: Record<string, string>): void {
+  let tmp: string | null = null;
+  try {
+    const target = filePath();
+    tmp = `${target}.tmp`;
+    fs.writeFileSync(tmp, JSON.stringify(store), { mode: 0o600 });
+    fs.chmodSync(tmp, 0o600);
+    fs.renameSync(tmp, target);
+  } catch (err) {
+    console.warn('[pen] failed to persist AI credentials store', err);
+    if (tmp) {
+      try {
+        fs.unlinkSync(tmp);
+      } catch {
+        // Temp file was never created or is already gone — nothing to do.
+      }
+    }
+  }
+}
+
+// Reports whether Electron's safeStorage can encrypt right now; every
+// key operation in this module branches on this.
+export function encryptionAvailable(): boolean {
+  const available = safeStorage.isEncryptionAvailable();
+  return available;
+}
+
+// Store `key` (whitespace-trimmed) for `provider`: encrypted on disk when
+// safeStorage is available, otherwise in process memory only.
+//
+// A blank key is treated as a removal. Persisting it would leave an
+// encrypted empty string on disk, which hasKey() reports as present even
+// though getKey() can only ever return '' for it.
+export function setKey(provider: ProviderId, key: string): void {
+  const trimmed = key.trim();
+  if (trimmed.length === 0) {
+    deleteKey(provider);
+    return;
+  }
+  if (!encryptionAvailable()) {
+    if (!memoryFallback) memoryFallback = {};
+    memoryFallback[provider] = trimmed;
+    console.warn(
+      '[pen] safeStorage unavailable; AI key for',
+      provider,
+      'held in process memory only (will be lost on quit)',
+    );
+    return;
+  }
+  // Ciphertext is binary; base64 keeps the sidecar file valid JSON.
+  const cipher = safeStorage.encryptString(trimmed).toString('base64');
+  const store = readStore();
+  store[provider] = cipher;
+  writeStore(store);
+}
+
+// Return the plaintext key for `provider`, or null when none is stored
+// or the stored ciphertext cannot be decrypted.
+export function getKey(provider: ProviderId): string | null {
+  if (encryptionAvailable()) {
+    const encoded = readStore()[provider];
+    if (!encoded) return null;
+    try {
+      const cipher = Buffer.from(encoded, 'base64');
+      return safeStorage.decryptString(cipher);
+    } catch (err) {
+      console.warn('[pen] failed to decrypt AI key for', provider, err);
+      return null;
+    }
+  }
+  // No encryption: keys only ever lived in the in-memory fallback.
+  return memoryFallback?.[provider] ?? null;
+}
+
+// Cheap presence check: looks for a non-empty entry without decrypting.
+export function hasKey(provider: ProviderId): boolean {
+  if (encryptionAvailable()) {
+    const entry: unknown = readStore()[provider];
+    return typeof entry === 'string' && entry.length > 0;
+  }
+  return Boolean(memoryFallback?.[provider]);
+}
+
+// Forget the key for `provider`, from disk or from the memory fallback
+// depending on whether encryption is available.
+export function deleteKey(provider: ProviderId): void {
+  if (encryptionAvailable()) {
+    const remaining = readStore();
+    delete remaining[provider];
+    writeStore(remaining);
+    return;
+  }
+  if (memoryFallback) delete memoryFallback[provider];
+}
diff --git a/src/main/ai/deepseek.ts b/src/main/ai/deepseek.ts
new file mode 100644
index 0000000..422e44f
--- /dev/null
+++ b/src/main/ai/deepseek.ts
@@ -0,0 +1,53 @@
+import OpenAI from 'openai';
+import type { AskInput } from '../../shared/types';
+import type { ProviderAdapter } from './types';
+import { assembleTurns } from './messages';
+
+// DeepSeek exposes an OpenAI-compatible API at api.deepseek.com, so we
+// reuse the OpenAI SDK with a different baseURL. Its chat models
+// (deepseek-chat = V3, deepseek-reasoner = R1) are TEXT-ONLY — they
+// reject image inputs — so we never attach the snip here. An image
+// session that resolves to DeepSeek is answered from the text alone;
+// for image Q&A the resolver prefers a local vision model or a
+// vision-capable cloud provider (Claude / GPT-4o / Gemini).
+
+const MAX_TOKENS = 2048;
+const BASE_URL = 'https://api.deepseek.com';
+
+type Message =
+  | { role: 'system'; content: string }
+  | { role: 'user'; content: string }
+  | { role: 'assistant'; content: string };
+
+function buildMessages(input: AskInput): Message[] {
+  // System prompt first, then the whole conversation replayed as text so
+  // follow-ups keep their context. There is no image part — DeepSeek
+  // can't see it. Empty opening turns fall back to the solve-oriented
+  // default inside assembleTurns.
+  const system: Message = { role: 'system', content: input.systemPrompt };
+  const replayed = assembleTurns(input).turns.map(
+    (turn): Message => ({ role: turn.role, content: turn.content }),
+  );
+  return [system, ...replayed];
+}
+
+export const deepseek: ProviderAdapter = {
+  id: 'deepseek',
+  // Streams a chat completion from DeepSeek through the OpenAI SDK
+  // (pointed at BASE_URL), yielding each non-empty content delta.
+  async *ask(input, apiKey, signal) {
+    const sdk = new OpenAI({ apiKey, baseURL: BASE_URL });
+    const chunks = await sdk.chat.completions.create(
+      {
+        model: input.model,
+        max_tokens: MAX_TOKENS,
+        // eslint-disable-next-line @typescript-eslint/no-explicit-any
+        messages: buildMessages(input) as any,
+        stream: true,
+      },
+      { signal },
+    );
+    for await (const chunk of chunks) {
+      const piece = chunk.choices?.[0]?.delta?.content;
+      // Skip chunks whose first choice carries no text.
+      if (typeof piece !== 'string' || piece.length === 0) continue;
+      yield piece;
+    }
+  },
+};
diff --git a/src/main/ai/gemini.ts b/src/main/ai/gemini.ts
new file mode 100644
index 0000000..4b0287c
--- /dev/null
+++ b/src/main/ai/gemini.ts
@@ -0,0 +1,50 @@
+import { GoogleGenerativeAI } from '@google/generative-ai';
+import type { AskInput } from '../../shared/types';
+import type { ProviderAdapter } from './types';
+import { assembleTurns } from './messages';
+
+// Gemini's generateContentStream API takes content parts as either
+// text or inlineData (base64 with mimeType). The streaming response
+// gives chunks where each .text() returns the new delta. The system
+// prompt is passed via `systemInstruction` on the model — separate
+// from the messages.
+
+type GeminiPart = { text: string } | { inlineData: { data: string; mimeType: string } };
+
+type GeminiContent = { role: 'user' | 'model'; parts: GeminiPart[] };
+
+// Map our turn roles onto Gemini's: 'assistant' becomes 'model', 'user'
+// stays 'user'.
+function roleFor(role: 'user' | 'assistant'): 'user' | 'model' {
+  if (role === 'assistant') return 'model';
+  return 'user';
+}
+
+function buildContents(input: AskInput): GeminiContent[] {
+  // The snip rides the FIRST user turn (as inlineData ahead of the text)
+  // so follow-ups keep it in view; all other turns are text only.
+  const { turns, firstUserIdx } = assembleTurns(input);
+  const { image } = input;
+  return turns.map((turn, idx): GeminiContent => {
+    const text: GeminiPart = { text: turn.content };
+    const parts: GeminiPart[] =
+      image && idx === firstUserIdx
+        ? [{ inlineData: { data: image.base64, mimeType: image.mime } }, text]
+        : [text];
+    return { role: roleFor(turn.role), parts };
+  });
+}
+
+export const gemini: ProviderAdapter = {
+  id: 'gemini',
+  // Streams a Gemini reply, yielding each non-empty text chunk. The
+  // system prompt goes on the model as `systemInstruction`, not in the
+  // conversation contents.
+  async *ask(input, apiKey, signal) {
+    const sdk = new GoogleGenerativeAI(apiKey);
+    const model = sdk.getGenerativeModel({
+      model: input.model,
+      systemInstruction: input.systemPrompt,
+    });
+    const request = { contents: buildContents(input) };
+    const { stream } = await model.generateContentStream(request, { signal });
+    for await (const chunk of stream) {
+      const piece = chunk.text();
+      if (piece.length === 0) continue;
+      yield piece;
+    }
+  },
+};
diff --git a/src/main/ai/ipc.ts b/src/main/ai/ipc.ts
new file mode 100644
index 0000000..cab8023
--- /dev/null
+++ b/src/main/ai/ipc.ts
@@ -0,0 +1,450 @@
+import { BrowserWindow, ipcMain, shell } from 'electron';
+import type {
+  AiStatus,
+  AskInput,
+  ChatSessionPayload,
+  ConnectionTestResult,
+  OllamaPullProgress,
+  ProfileId,
+  ProviderId,
+  StreamChunk,
+} from '../../shared/types';
+import { deleteKey, getKey, hasKey, setKey } from './credentials';
+import { defaultModelFor, getAdapter } from './registry';
+import { patch as patchHub, getState as getHubState } from '../hub';
+import {
+  OLLAMA_INSTALL_URL,
+  cancelPull,
+  deleteModel,
+  freeDiskBytes,
+  getStatus as getOllamaStatus,
+  listCatalog,
+  listInstalled,
+  pull as ollamaPull,
+  start as startOllama,
+} from './ollamaService';
+import { MODEL_CATALOG, PROFILE_MODELS } from './ollamaModels';
+import { capture as ragCapture, maybeSeed, retrieve as ragRetrieve } from './rag';
+
+// System prompts for the one-shot correction calls.
+const RECOGNIZE_PROMPT =
+  'You are a strict OCR engine for handwriting. Output ONLY the exact words ' +
+  'written in the image, transcribed verbatim and then lightly corrected for ' +
+  'spelling and grammar. Hard rules: do NOT describe the image; never say it is ' +
+  'a signature, handwriting, a drawing, or refer to "the image" or "the user"; ' +
+  'no quotes, labels, commentary, apologies, or markdown — just the words. If ' +
+  'you cannot read any actual words, output nothing at all (an empty response).';
+const AUTOCORRECT_PROMPT =
+  'You are an automated text-correction engine. Fix all grammar, spelling, ' +
+  "typos, and awkward phrasing in the user's input. Return ONLY the corrected " +
+  'text — no quotes, commentary, or explanation. Preserve the original meaning.';
+
+// Type guard: true only for the cloud provider ids ('ollama' is not one).
+const isCloudProvider = (v: unknown): v is ProviderId => {
+  switch (v) {
+    case 'anthropic':
+    case 'openai':
+    case 'gemini':
+    case 'deepseek':
+    case 'sarvam':
+      return true;
+    default:
+      return false;
+  }
+};
+
+// True when `tag` is non-empty and appears in `installed`, either
+// verbatim or, for a tag with no ':', with ':latest' appended.
+const tagInstalled = (tag: string | null | undefined, installed: string[]): boolean => {
+  if (!tag) return false;
+  if (installed.includes(tag)) return true;
+  const qualified = tag.includes(':') ? tag : `${tag}:latest`;
+  return installed.includes(qualified);
+};
+
+// Single chokepoint deciding which provider/model actually serves a
+// request. Local-first: if Local AI is enabled, the service is up, and
+// a suitable model is installed, route to Ollama; otherwise fall back
+// to a configured cloud provider; otherwise return a friendly error.
+type Resolved = { provider: ProviderId; model: string; key: string } | { error: string };
+
+// Pick the provider, model and key that will serve `input`, in order:
+//   1. Ollama, when Local AI is enabled, the service reports running and
+//      an installed model of the needed kind can be found (vision when
+//      the input has an image, text otherwise);
+//   2. the hub's active cloud provider, if a key is stored for it;
+//   3. the cloud provider named on the input, if a key is stored for it.
+// When none applies, an `{ error }` with a user-facing message is returned.
+async function resolveProvider(input: AskInput): Promise<Resolved> {
+  const hub = getHubState();
+  const kind: 'text' | 'vision' = input.image ? 'vision' : 'text';
+
+  if (hub.aiLocalEnabled) {
+    const { running } = await getOllamaStatus();
+    if (running) {
+      const installed = await listInstalled();
+      const profile = input.profile ?? hub.profile;
+      // Tried in order: per-profile override, global default, catalogue
+      // default for the profile. Only an installed tag is accepted.
+      const preferred = [
+        hub.aiProfileModels[profile]?.[kind],
+        kind === 'vision' ? hub.aiLocalVisionModel : hub.aiLocalModel,
+        PROFILE_MODELS[profile]?.[kind],
+      ];
+      // Last resort: the first catalogue entry of the right kind that is
+      // installed.
+      const chosen =
+        preferred.find((tag) => tagInstalled(tag, installed)) ??
+        MODEL_CATALOG.find((entry) => entry.kind === kind && tagInstalled(entry.tag, installed))
+          ?.tag;
+      if (chosen) return { provider: 'ollama', model: chosen, key: '' };
+      // Local is on but nothing usable is installed: try the cloud.
+    }
+  }
+
+  const active = hub.aiActiveProvider;
+  if (isCloudProvider(active) && hasKey(active)) {
+    return {
+      provider: active,
+      model: hub.aiActiveModel ?? defaultModelFor(active),
+      key: getKey(active)!,
+    };
+  }
+
+  const requested = input.provider;
+  if (isCloudProvider(requested) && hasKey(requested)) {
+    return {
+      provider: requested,
+      model: input.model || defaultModelFor(requested),
+      key: getKey(requested)!,
+    };
+  }
+
+  return {
+    error: 'No AI available. Enable Local AI and install a model, or add a cloud provider key.',
+  };
+}
+
+// Active in-flight requests, keyed by the requestId we hand back to
+// the renderer. Lets the chat panel cancel a stream cleanly via
+// ai:cancel. Removed on completion / error / cancellation.
+const inFlight = new Map<string, AbortController>();
+
+// Per-session snip cache. The renderer attaches the image only on the
+// first turn; we stash it by sessionId and re-attach it on follow-up
+// turns of the same conversation so context isn't lost. Holds at most
+// one image: caching a new snip clears whatever was stored before.
+const sessionImages = new Map<string, { mime: string; base64: string }>();
+
+// Counter appended to every request id; incremented on each call.
+let requestSeq = 0;
+// Build the next request id in the form `ai-<epoch ms>-<sequence>`.
+function nextRequestId(): string {
+  requestSeq += 1;
+  return ['ai', Date.now(), requestSeq].join('-');
+}
+
+// Send `chunk` on the 'ai:chunk' channel to every window that has not
+// been destroyed.
+function broadcastChunk(chunk: StreamChunk): void {
+  BrowserWindow.getAllWindows().forEach((win) => {
+    if (win.isDestroyed()) return;
+    win.webContents.send('ai:chunk', chunk);
+  });
+}
+
+// Type guard for any provider id: the local 'ollama' provider or one of
+// the cloud providers accepted by isCloudProvider.
+function isProviderId(value: unknown): value is ProviderId {
+  if (value === 'ollama') return true;
+  return isCloudProvider(value);
+}
+
+export function registerAiIpc(): void {
+  // Store or clear a provider's API key. Unknown providers are ignored.
+  // A non-string or whitespace-only key deletes the stored one. The key
+  // is trimmed before it is saved, so stray whitespace or a trailing
+  // newline from a paste is not stored as part of the key.
+  ipcMain.handle('ai:set-key', (_evt, payload: { provider: ProviderId; key: string }) => {
+    if (!isProviderId(payload.provider)) return;
+    const key = typeof payload.key === 'string' ? payload.key.trim() : '';
+    if (key.length === 0) {
+      deleteKey(payload.provider);
+      return;
+    }
+    setKey(payload.provider, key);
+  });
+
+  // Remove the stored key for a provider; unknown providers are ignored.
+  ipcMain.handle('ai:delete-key', (_evt, payload: { provider: ProviderId }) => {
+    const { provider } = payload;
+    if (isProviderId(provider)) deleteKey(provider);
+  });
+
+  // Report whether each provider is usable. A cloud provider counts as
+  // configured when a key is stored for it; the local provider when the
+  // Ollama service is running AND at least one model is installed.
+  ipcMain.handle('ai:get-status', async (): Promise<AiStatus[]> => {
+    const cloudIds: ProviderId[] = ['anthropic', 'openai', 'gemini', 'deepseek', 'sarvam'];
+    const cloud = cloudIds.map((provider) => ({ provider, configured: hasKey(provider) }));
+    const svc = await getOllamaStatus();
+    // Only ask for the model list when the service answered.
+    const installed = svc.running ? await listInstalled() : [];
+    const localReady = svc.running && installed.length > 0;
+    return [...cloud, { provider: 'ollama', configured: localReady }];
+  });
+
+  // Tiny request that confirms the key reaches the provider and the
+  // model answers. It runs against the model the caller passes in and
+  // asks for a single-character reply, the cheapest possible probe.
+  //
+  // Returns { ok: true, latencyMs } once the first non-empty chunk has
+  // arrived (or the stream ends without an error), and
+  // { ok: false, message } otherwise.
+  ipcMain.handle(
+    'ai:test-connection',
+    async (_evt, payload: { provider: ProviderId; model: string }): Promise<ConnectionTestResult> => {
+      const provider = payload.provider;
+      const model = payload.model;
+      if (!isProviderId(provider)) return { ok: false, message: 'Unknown provider' };
+      // Local (ollama) needs no key; cloud providers do.
+      const key = provider === 'ollama' ? '' : getKey(provider);
+      if (provider !== 'ollama' && !key) return { ok: false, message: 'No API key configured' };
+      const adapter = getAdapter(provider);
+      const ctrl = new AbortController();
+      const started = Date.now();
+      // Set once a non-empty chunk has been seen, i.e. the round-trip
+      // demonstrably worked before we aborted the stream ourselves.
+      let received = false;
+      try {
+        const stream = adapter.ask(
+          {
+            provider,
+            model,
+            systemPrompt: 'You are a connection test. Reply with a single dot.',
+            history: [],
+            userMessage: 'ping',
+          },
+          key ?? '',
+          ctrl.signal,
+        );
+        for await (const chunk of stream) {
+          if (chunk.length === 0) continue;
+          // First chunk is enough to confirm the round-trip.
+          received = true;
+          ctrl.abort();
+          break;
+        }
+        return { ok: true, latencyMs: Date.now() - started };
+      } catch (err) {
+        // An error raised while tearing down the stream after our own
+        // abort is expected. An "abort"-flavoured error that arrives
+        // BEFORE any data (dropped connection, provider-side abort) is a
+        // real failure and must not be reported as success.
+        if (received && ctrl.signal.aborted) {
+          return { ok: true, latencyMs: Date.now() - started };
+        }
+        const msg = (err as Error)?.message ?? String(err);
+        return { ok: false, message: msg };
+      }
+    },
+  );
+
+  // Start a streamed completion. Resolves with a requestId as soon as
+  // the provider has been chosen; the reply itself is delivered through
+  // 'ai:chunk' broadcasts carrying that id: zero or more { delta }
+  // chunks, then one final chunk with done: true (plus `error` on
+  // failure).
+  ipcMain.handle(
+    'ai:ask',
+    async (_evt, input: AskInput): Promise<{ requestId: string }> => {
+      const requestId = nextRequestId();
+      // Carry the snip across follow-ups: cache it on first sight,
+      // re-attach it on later turns of the same conversation. Done
+      // BEFORE resolveProvider so wantsVision stays true and a vision
+      // conversation keeps routing to its vision model.
+      const sid = input.sessionId;
+      if (sid) {
+        if (input.image) {
+          sessionImages.clear();
+          sessionImages.set(sid, input.image);
+        } else {
+          const cached = sessionImages.get(sid);
+          if (cached) input.image = cached;
+        }
+      }
+      // The resolver decides local-vs-cloud and the concrete model,
+      // so the renderer can stay provider-agnostic.
+      const resolved = await resolveProvider(input);
+      if ('error' in resolved) {
+        const message = resolved.error;
+        // The renderer matches chunks by requestId, which it only learns
+        // from this handler's return value. Defer the error chunk to a
+        // later tick so it is sent after the reply rather than before it.
+        setImmediate(() => broadcastChunk({ requestId, error: message, done: true }));
+        return { requestId };
+      }
+      const adapter = getAdapter(resolved.provider);
+      const finalInput: AskInput = {
+        ...input,
+        provider: resolved.provider,
+        model: resolved.model,
+      };
+      const ctrl = new AbortController();
+      inFlight.set(requestId, ctrl);
+      // Stream in the background so the IPC invoke can return the
+      // requestId immediately. The renderer subscribes to 'ai:chunk'
+      // events and matches by requestId.
+      void (async () => {
+        try {
+          for await (const delta of adapter.ask(finalInput, resolved.key, ctrl.signal)) {
+            if (ctrl.signal.aborted) break;
+            broadcastChunk({ requestId, delta });
+          }
+          broadcastChunk({ requestId, done: true });
+        } catch (err) {
+          const msg = (err as Error)?.message ?? String(err);
+          // User-initiated abort isn't an error; just close cleanly.
+          if (ctrl.signal.aborted || msg.toLowerCase().includes('abort')) {
+            broadcastChunk({ requestId, done: true });
+          } else {
+            broadcastChunk({ requestId, error: msg, done: true });
+          }
+        } finally {
+          // Whatever the outcome, the request is no longer cancellable.
+          inFlight.delete(requestId);
+        }
+      })();
+      return { requestId };
+    },
+  );
+
+  // Abort the in-flight request with this id, if there is one, and
+  // drop it from the registry.
+  ipcMain.handle('ai:cancel', (_evt, payload: { requestId: string }) => {
+    const { requestId } = payload;
+    inFlight.get(requestId)?.abort();
+    inFlight.delete(requestId);
+  });
+
+  // Non-streaming helper: resolve a provider for `input`, collect the
+  // adapter's whole output and return it trimmed. The request is
+  // aborted after 30 seconds. Failures come back as `{ text: '', error }`
+  // rather than being thrown; an abort is reported as 'Timed out'.
+  async function runOneShot(input: AskInput): Promise<{ text: string; error?: string }> {
+    const resolved = await resolveProvider(input);
+    if ('error' in resolved) return { text: '', error: resolved.error };
+    const { provider, model, key } = resolved;
+    const adapter = getAdapter(provider);
+    const ctrl = new AbortController();
+    const deadline = setTimeout(() => ctrl.abort(), 30_000);
+    try {
+      const pieces: string[] = [];
+      for await (const piece of adapter.ask({ ...input, provider, model }, key, ctrl.signal)) {
+        pieces.push(piece);
+      }
+      return { text: pieces.join('').trim() };
+    } catch (err) {
+      const msg = (err as Error)?.message ?? String(err);
+      const timedOut = ctrl.signal.aborted || msg.toLowerCase().includes('abort');
+      return { text: '', error: timedOut ? 'Timed out' : msg };
+    } finally {
+      clearTimeout(deadline);
+    }
+  }
+
+  // Handwriting recognition: the image bytes are base64-encoded and sent
+  // through runOneShot with RECOGNIZE_PROMPT. Because an image is
+  // attached, the resolver looks for a vision model. The MIME type
+  // defaults to 'image/png'.
+  ipcMain.handle(
+    'ai:recognize',
+    (
+      _evt,
+      payload: { png: Uint8Array; mime?: string; profile?: ProfileId },
+    ): Promise<{ text: string; error?: string }> => {
+      const image = {
+        mime: payload.mime ?? 'image/png',
+        base64: Buffer.from(payload.png).toString('base64'),
+      };
+      return runOneShot({
+        provider: 'ollama',
+        model: '',
+        systemPrompt: RECOGNIZE_PROMPT,
+        image,
+        history: [],
+        userMessage: 'Transcribe and correct the handwriting in this image.',
+        profile: payload.profile,
+      });
+    },
+  );
+
+  // Typed-text autocorrect. Blank input is returned untouched. Otherwise
+  // up to three retrieved examples for this profile are appended to the
+  // system prompt as few-shot pairs, the text is corrected via
+  // runOneShot, and a result that differs from the input is recorded
+  // through ragCapture without being awaited.
+  ipcMain.handle(
+    'ai:autocorrect',
+    async (
+      _evt,
+      payload: { text: string; profile?: ProfileId },
+    ): Promise<{ text: string; error?: string }> => {
+      const original = (payload.text ?? '').toString();
+      if (original.trim().length === 0) return { text: original };
+      const profile = payload.profile ?? getHubState().profile;
+
+      const examples = await ragRetrieve(profile, original, 3);
+      let systemPrompt = AUTOCORRECT_PROMPT;
+      if (examples.length > 0) {
+        const shots = examples.map((e) => `"${e.original}" → "${e.corrected}"`).join('\n');
+        systemPrompt =
+          AUTOCORRECT_PROMPT + '\n\nExamples of corrections this user prefers:\n' + shots;
+      }
+
+      const result = await runOneShot({
+        provider: 'ollama',
+        model: '',
+        systemPrompt,
+        history: [],
+        userMessage: original,
+        profile,
+      });
+
+      // Learn from the applied correction (best-effort, non-blocking).
+      const changed = !!result.text && result.text.trim() !== original.trim();
+      if (changed) {
+        void ragCapture({ profile, kind: 'typed', original, corrected: result.text });
+      }
+      // Fire-and-forget seeding attempt on every call.
+      void maybeSeed();
+      return result;
+    },
+  );
+
+  // ── Local Ollama service management ──
+  // Relay one pull-progress event to every live window.
+  const broadcastPull = (p: OllamaPullProgress): void => {
+    BrowserWindow.getAllWindows().forEach((win) => {
+      if (win.isDestroyed()) return;
+      win.webContents.send('ollama:pull-progress', p);
+    });
+  };
+  // Re-read the installed model list and publish it on the hub.
+  const refreshInstalled = async (): Promise<void> => {
+    const aiInstalledModels = await listInstalled();
+    patchHub({ aiInstalledModels });
+  };
+
+  // Channels that forward straight to a zero-argument service call.
+  const passthrough: Array<[string, () => unknown]> = [
+    ['ollama:status', getOllamaStatus],
+    ['ollama:start', startOllama],
+    ['ollama:list-models', listCatalog],
+    ['ollama:disk-space', freeDiskBytes],
+  ];
+  for (const [channel, call] of passthrough) {
+    ipcMain.handle(channel, () => call());
+  }
+
+  // Pull a model, then refresh the hub's installed list. Progress and
+  // the outcome reach the renderer via 'ollama:pull-progress'.
+  ipcMain.handle('ollama:pull', async (_evt, payload: { model: string }) => {
+    const { model } = payload;
+    await ollamaPull(model, broadcastPull);
+    await refreshInstalled();
+    return { ok: true };
+  });
+  ipcMain.handle('ollama:cancel-pull', (_evt, payload: { model: string }) => {
+    const { model } = payload;
+    cancelPull(model);
+  });
+  ipcMain.handle('ollama:delete-model', async (_evt, payload: { model: string }) => {
+    const { model } = payload;
+    await deleteModel(model);
+    await refreshInstalled();
+  });
+  // Open the Ollama download page in the user's browser.
+  ipcMain.handle('ollama:install-help', () => {
+    void shell.openExternal(OLLAMA_INSTALL_URL);
+  });
+
+  // Renderer-facing entry point for an image chat: wraps the received
+  // bytes in a Buffer, hands them to startChatSession and returns the
+  // new session id.
+  ipcMain.handle(
+    'chat:start',
+    (_evt, payload: { png: Uint8Array; mime: string; profile: ProfileId }) => {
+      const { png, mime, profile } = payload;
+      return { sessionId: startChatSession(Buffer.from(png), mime, profile) };
+    },
+  );
+
+  // Text-only chat session (no image). Used by the trader numeric
+  // analysis flow: the overlay hands over its computed text, which the
+  // panel auto-fires as the first user message.
+  ipcMain.handle(
+    'chat:start-text',
+    (_evt, payload: { text: string; profile: ProfileId }) => {
+      const { text, profile } = payload;
+      return { sessionId: startTextChatSession(text, profile) };
+    },
+  );
+}
+
+// Announce a new image chat session: mint a session id, send the
+// session on 'chat:session' to every live window, and set chatOpen on
+// the hub. Used by the chat:start IPC and, per the original note, by
+// capture.ts when Ask AI is triggered from the snip menu.
+let chatSeq = 0;
+export function startChatSession(
+  png: Buffer,
+  mime: string,
+  profile: ProfileId,
+): string {
+  chatSeq += 1;
+  const sessionId = `chat-${Date.now()}-${chatSeq}`;
+  const session: ChatSessionPayload = { sessionId, png, mime, profile };
+  BrowserWindow.getAllWindows().forEach((win) => {
+    if (win.isDestroyed()) return;
+    win.webContents.send('chat:session', session);
+  });
+  patchHub({ chatOpen: true });
+  return sessionId;
+}
+
+// Text-only variant of startChatSession: the broadcast session carries
+// `initialText` instead of an image. Shares the chatSeq counter, so ids
+// stay unique across both kinds of session.
+export function startTextChatSession(initialText: string, profile: ProfileId): string {
+  chatSeq += 1;
+  const sessionId = `chat-${Date.now()}-${chatSeq}`;
+  const session: ChatSessionPayload = { sessionId, initialText, profile };
+  BrowserWindow.getAllWindows().forEach((win) => {
+    if (win.isDestroyed()) return;
+    win.webContents.send('chat:session', session);
+  });
+  patchHub({ chatOpen: true });
+  return sessionId;
+}
diff --git a/src/main/ai/messages.ts b/src/main/ai/messages.ts
new file mode 100644
index 0000000..3028936
--- /dev/null
+++ b/src/main/ai/messages.ts
@@ -0,0 +1,34 @@
+import type { AskInput } from '../../shared/types';
+import { SOLVE_FIRST_TURN } from '../../shared/constants';
+
+// One conversation turn as produced by assembleTurns.
+export interface AssembledTurn {
+  // Who spoke this turn.
+  role: 'user' | 'assistant';
+  // The turn's text.
+  content: string;
+}
+
+// Build the ordered turn list for one request (the prior history
+// followed by the current user message) and report the index of the
+// FIRST user turn. Adapters attach the image at that index, so
+// follow-ups keep the original visual context.
+//
+// Any user turn with empty text, including the current message, is
+// replaced by SOLVE_FIRST_TURN. The auto-fired opening turn carries no
+// text of its own, and this keeps every user turn non-empty (Anthropic
+// requires the first message to be a user turn).
+export function assembleTurns(input: AskInput): {
+  turns: AssembledTurn[];
+  firstUserIdx: number;
+} {
+  const orFallback = (text: string): string => (text.length > 0 ? text : SOLVE_FIRST_TURN);
+  const turns: AssembledTurn[] = [];
+  for (const past of input.history) {
+    // Assistant turns are copied verbatim, even when empty.
+    const content = past.role === 'user' ? orFallback(past.content) : past.content;
+    turns.push({ role: past.role, content });
+  }
+  turns.push({ role: 'user', content: orFallback(input.userMessage) });
+  return { turns, firstUserIdx: turns.findIndex((t) => t.role === 'user') };
+}
diff --git a/src/main/ai/ollama.ts b/src/main/ai/ollama.ts
new file mode 100644
index 0000000..8dcc86c
--- /dev/null
+++ b/src/main/ai/ollama.ts
@@ -0,0 +1,78 @@
+import type { AskInput } from '../../shared/types';
+import type { ProviderAdapter } from './types';
+import { OLLAMA_HOST } from './ollamaService';
+import { assembleTurns } from './messages';
+
+// Ollama's /api/chat message shape. Vision models accept raw base64
+// strings in `images` (NO `data:` prefix, unlike OpenAI's data URL).
+interface OllamaMessage {
+  // Speaker of the message; 'system' is used for the system prompt.
+  role: 'system' | 'user' | 'assistant';
+  // Message text.
+  content: string;
+  // Optional base64-encoded images attached to this message.
+  images?: string[];
+}
+
+// Build the /api/chat message list: the system prompt first, then every
+// assembled turn. If the request has an image, its base64 payload is
+// attached to the first user turn so follow-ups keep it in view.
+function buildMessages(input: AskInput): OllamaMessage[] {
+  const { turns, firstUserIdx } = assembleTurns(input);
+  const conversation = turns.map((turn, idx): OllamaMessage => {
+    const message: OllamaMessage = { role: turn.role, content: turn.content };
+    if (input.image && idx === firstUserIdx) {
+      message.images = [input.image.base64];
+    }
+    return message;
+  });
+  return [{ role: 'system', content: input.systemPrompt }, ...conversation];
+}
+
+// Read at most the first 200 characters of a response body; yields ''
+// when the body cannot be read.
+async function safeText(res: Response): Promise<string> {
+  let body: string;
+  try {
+    body = await res.text();
+  } catch {
+    return '';
+  }
+  return body.slice(0, 200);
+}
+
+// Parse one NDJSON line from /api/chat. Returns null for blank lines,
+// lines that are not valid JSON, and JSON values that are not objects
+// (a bare `null` would otherwise blow up on property access). Throws
+// when the object carries an `error` field.
+function parseChatLine(raw: string): { delta: string; done: boolean } | null {
+  const line = raw.trim();
+  if (!line) return null;
+  let obj: { message?: { content?: unknown }; error?: unknown; done?: boolean } | null;
+  try {
+    obj = JSON.parse(line);
+  } catch {
+    return null;
+  }
+  if (obj === null || typeof obj !== 'object') return null;
+  if (obj.error) throw new Error(String(obj.error));
+  const content = obj.message?.content;
+  return { delta: typeof content === 'string' ? content : '', done: !!obj.done };
+}
+
+// Local provider. `apiKey` is ignored: requests go to the Ollama
+// service at OLLAMA_HOST. Streams NDJSON from /api/chat and yields each
+// non-empty content delta, so callers consume it like any other adapter.
+// Throws on a non-OK HTTP response or when a streamed line reports an
+// error.
+export const ollama: ProviderAdapter = {
+  id: 'ollama',
+  async *ask(input, _apiKey, signal) {
+    const res = await fetch(`${OLLAMA_HOST}/api/chat`, {
+      method: 'POST',
+      headers: { 'Content-Type': 'application/json' },
+      body: JSON.stringify({
+        model: input.model,
+        messages: buildMessages(input),
+        stream: true,
+      }),
+      signal,
+    });
+    if (!res.ok || !res.body) {
+      throw new Error(`Ollama ${res.status}: ${(await safeText(res)) || res.statusText}`);
+    }
+    const reader = res.body.getReader();
+    const decoder = new TextDecoder();
+    let buf = '';
+    try {
+      for (;;) {
+        const { value, done } = await reader.read();
+        if (done) break;
+        buf += decoder.decode(value, { stream: true });
+        let nl: number;
+        while ((nl = buf.indexOf('\n')) >= 0) {
+          const parsed = parseChatLine(buf.slice(0, nl));
+          buf = buf.slice(nl + 1);
+          if (!parsed) continue;
+          if (parsed.delta.length > 0) yield parsed.delta;
+          if (parsed.done) return;
+        }
+      }
+      // The stream may end without a trailing newline; flush the decoder
+      // and handle whatever is left so the last line is not dropped.
+      const tail = parseChatLine(buf + decoder.decode());
+      if (tail && tail.delta.length > 0) yield tail.delta;
+    } finally {
+      // Runs on normal completion, on errors, and when the consumer
+      // stops iterating early: release the response body either way.
+      await reader.cancel().catch(() => undefined);
+    }
+  },
+};
diff --git a/src/main/ai/ollamaModels.ts b/src/main/ai/ollamaModels.ts
new file mode 100644
index 0000000..15043e4
--- /dev/null
+++ b/src/main/ai/ollamaModels.ts
@@ -0,0 +1,63 @@
+import type { ProfileId } from '../../shared/types';
+
+// The local model catalogue surfaced in the installer. Sizes are the
+// approximate on-disk footprint of the Q4_K_M quant Ollama pulls for
+// each tag — used only for the disk-space pre-check and the UI, so a
+// rough estimate is fine. All tags below are official Ollama library
+// tags (no Modelfile needed) at time of writing; `qwen2.5vl` should be
+// re-verified against the user's Ollama version (fallback: moondream).
+const GB = 1024 * 1024 * 1024;
+
+// One row of the local model catalogue.
+export interface CatalogEntry {
+  // Ollama model tag; also the lookup key used by catalogEntry().
+  tag: string;
+  // Human-readable model name.
+  label: string;
+  // What the model is for: text generation, vision, or embeddings.
+  kind: 'text' | 'vision' | 'embed';
+  // Approximate size in bytes (entries are written as multiples of GB).
+  approxBytes: number;
+  // A short "why pick this" note for the installer row.
+  note?: string;
+}
+
+export const MODEL_CATALOG: CatalogEntry[] = [
+  // ── Text ──
+  { tag: 'llama3.2:1b', label: 'Llama 3.2 1B', kind: 'text', approxBytes: 1.3 * GB, note: 'Tiny, fast — grammar / formatting' },
+  { tag: 'qwen2.5:1.5b', label: 'Qwen 2.5 1.5B', kind: 'text', approxBytes: 1.0 * GB, note: 'Great text cleanup' },
+  { tag: 'qwen2.5:3b', label: 'Qwen 2.5 3B', kind: 'text', approxBytes: 2.0 * GB, note: 'Stronger reasoning / analysis' },
+  { tag: 'smollm2:1.7b', label: 'SmolLM2 1.7B', kind: 'text', approxBytes: 1.0 * GB, note: 'Lite on-device utility' },
+  // ── Vision ──
+  { tag: 'moondream', label: 'Moondream 2 (2B)', kind: 'vision', approxBytes: 1.7 * GB, note: 'Fast OCR / screenshot Q&A' },
+  { tag: 'qwen2.5vl:3b', label: 'Qwen 2.5-VL 3B', kind: 'vision', approxBytes: 3.2 * GB, note: 'Best small vision (verify tag)' },
+  // ── Embeddings (RAG, Phase 4) ──
+  { tag: 'nomic-embed-text', label: 'Nomic Embed Text', kind: 'embed', approxBytes: 0.27 * GB, note: 'Embeddings for learning' },
+];
+
+// Look up a catalogue row by its exact tag; undefined when absent.
+export function catalogEntry(tag: string): CatalogEntry | undefined {
+  for (const entry of MODEL_CATALOG) {
+    if (entry.tag === tag) return entry;
+  }
+  return undefined;
+}
+
+// Per-profile, per-task default model tags. The resolver uses these
+// when the user hasn't set an explicit override and falls back to the
+// first installed model of the right kind if the default isn't pulled.
+export interface ProfileModels {
+  // Default model tag for text tasks.
+  text: string;
+  // Default model tag for vision tasks.
+  vision: string;
+}
+
+export const PROFILE_MODELS: Record<ProfileId, ProfileModels> = {
+  // Qwen2.5-VL is the vision default everywhere — it's far better at
+  // reading handwriting / dense text than moondream, which matters most
+  // for the drawn-ink recognition path. moondream stays in the catalogue
+  // as a lighter option for low-RAM machines.
+  general: { text: 'llama3.2:1b', vision: 'qwen2.5vl:3b' },
+  teacher: { text: 'qwen2.5:3b', vision: 'qwen2.5vl:3b' },
+  trader: { text: 'qwen2.5:3b', vision: 'qwen2.5vl:3b' },
+};
+
+// Default set pulled on first run: a fast tiny text model for autocorrect,
+// a capable vision model for screenshot Q&A + handwriting OCR, and the
+// embedding model for the learning loop. Heavier per-profile text models
+// (e.g. qwen2.5:3b) are opt-in. Low-RAM users can swap the vision model
+// to the lighter `moondream` from the catalogue.
+export const DEFAULT_PULL_SET: string[] = ['llama3.2:1b', 'qwen2.5vl:3b', 'nomic-embed-text'];
+
+// Embedding model tag used by the RAG layer (Phase 4).
+export const EMBED_MODEL = 'nomic-embed-text';
diff --git a/src/main/ai/ollamaService.ts b/src/main/ai/ollamaService.ts
new file mode 100644
index 0000000..c02199c
--- /dev/null
+++ b/src/main/ai/ollamaService.ts
@@ -0,0 +1,246 @@
+import { spawn, execFile, type ChildProcess } from 'node:child_process';
+import { existsSync } from 'node:fs';
+import { statfs } from 'node:fs/promises';
+import { promisify } from 'node:util';
+import os from 'node:os';
+import type {
+  LocalModelInfo,
+  OllamaPullProgress,
+  OllamaServiceStatus,
+} from '../../shared/types';
+import { DEFAULT_PULL_SET, MODEL_CATALOG } from './ollamaModels';
+
+const execFileP = promisify(execFile);
+
+// Turn an OLLAMA_HOST value into a base URL without a trailing slash.
+// Ollama documents the variable in scheme-less form (its default is
+// `127.0.0.1:11434`), so a value without `http(s)://` is accepted too:
+// it gets `http://` and, when no port is given, port 11434. The
+// unspecified addresses `0.0.0.0` / `[::]` are bind addresses rather
+// than something to connect to, so they are mapped to loopback. Empty,
+// foreign-scheme, or unparseable values fall back to the default.
+function resolveOllamaHost(raw: string | undefined): string {
+  const fallback = 'http://127.0.0.1:11434';
+  const value = (raw ?? '').trim();
+  if (!value) return fallback;
+  const hasScheme = /^https?:\/\//i.test(value);
+  // Something like `ftp://…`: not an endpoint we can talk to.
+  if (!hasScheme && value.includes('://')) return fallback;
+  try {
+    const url = new URL(hasScheme ? value : `http://${value}`);
+    if (!hasScheme && url.port === '') url.port = '11434';
+    if (url.hostname === '0.0.0.0' || url.hostname === '[::]') url.hostname = '127.0.0.1';
+    // Drop trailing slashes so `${OLLAMA_HOST}/api/...` never doubles them.
+    return `${url.origin}${url.pathname.replace(/\/+$/, '')}`;
+  } catch {
+    return fallback;
+  }
+}
+
+// Ollama's local HTTP endpoint. Honour OLLAMA_HOST if the user has
+// pointed their daemon elsewhere, else the documented default.
+export const OLLAMA_HOST = resolveOllamaHost(process.env.OLLAMA_HOST);
+
+export const OLLAMA_INSTALL_URL = 'https://ollama.com/download';
+
+// The daemon we spawned (if any). We only kill what we started — a
+// pre-existing user daemon is left running on quit.
+let spawned: ChildProcess | null = null;
+
+// In-flight pulls keyed by model tag, so a pull can be cancelled.
+const pulls = new Map<string, AbortController>();
+
+// Resolve after `ms` milliseconds.
+function sleep(ms: number): Promise<void> {
+  return new Promise((resolve) => {
+    setTimeout(resolve, ms);
+  });
+}
+
+// Ask the daemon for its version, with a 1.5 s timeout. Returns the
+// version string, 'unknown' when the reply has no string `version`, and
+// null when the request fails or the response is not OK.
+async function probeVersion(): Promise<string | null> {
+  try {
+    const timeout = AbortSignal.timeout(1500);
+    const res = await fetch(`${OLLAMA_HOST}/api/version`, { signal: timeout });
+    if (res.ok) {
+      const payload = (await res.json()) as { version?: unknown };
+      const version = payload.version;
+      return typeof version === 'string' ? version : 'unknown';
+    }
+  } catch {
+    /* unreachable, timed out, or not JSON */
+  }
+  return null;
+}
+
+// Install locations to check for the `ollama` binary on the current
+// platform, in order of preference.
+function candidatePaths(): string[] {
+  switch (process.platform) {
+    case 'darwin':
+      return [
+        '/usr/local/bin/ollama',
+        '/opt/homebrew/bin/ollama',
+        '/Applications/Ollama.app/Contents/Resources/ollama',
+      ];
+    case 'win32': {
+      const localAppData = process.env.LOCALAPPDATA ?? '';
+      return [`${localAppData}\\Programs\\Ollama\\ollama.exe`];
+    }
+    default:
+      return ['/usr/local/bin/ollama', '/usr/bin/ollama', '/bin/ollama'];
+  }
+}
+
+// Locate the `ollama` executable: first among the known install paths,
+// then through `which` / `where`. Returns null when neither finds an
+// existing file.
+async function findBinary(): Promise<string | null> {
+  const known = candidatePaths().find((p) => existsSync(p));
+  if (known) return known;
+
+  const locator = process.platform === 'win32' ? 'where' : 'which';
+  try {
+    const { stdout } = await execFileP(locator, ['ollama']);
+    // Use the first non-blank line of output.
+    const first = stdout
+      .split(/\r?\n/)
+      .map((l) => l.trim())
+      .find((l) => l.length > 0);
+    if (first && existsSync(first)) return first;
+  } catch {
+    /* not on PATH */
+  }
+  return null;
+}
+
+// Report the service state. If the daemon answers the version probe it
+// is installed and running; otherwise it is not running, and
+// `installed` reflects whether a binary can be found.
+export async function getStatus(): Promise<OllamaServiceStatus> {
+  const version = await probeVersion();
+  if (!version) {
+    const bin = await findBinary();
+    return { installed: bin != null, running: false };
+  }
+  return { installed: true, running: true, version };
+}
+
+// Poll the version probe until it answers or `timeoutMs` has elapsed.
+// The pause between attempts starts at 200 ms and grows by 1.5x, capped
+// at 1500 ms. Resolves true as soon as a probe succeeds, false when the
+// time runs out.
+async function waitForReady(timeoutMs: number): Promise<boolean> {
+  const deadline = Date.now() + timeoutMs;
+  for (
+    let pause = 200;
+    Date.now() < deadline;
+    pause = Math.min(Math.round(pause * 1.5), 1500)
+  ) {
+    if (await probeVersion()) return true;
+    await sleep(pause);
+  }
+  return false;
+}
+
+// Make sure an Ollama daemon is serving and report the resulting state.
+//
+// If a daemon already answers (possibly one the user started), nothing
+// is spawned. Otherwise the binary is located and launched with
+// `serve`, and readiness is polled for up to 15 s. Never throws:
+// failures are returned in the status object's `error` field.
+export async function start(): Promise<OllamaServiceStatus> {
+  // Already serving (possibly a daemon the user started themselves):
+  // attach, never double-spawn.
+  if (await probeVersion()) return getStatus();
+  const bin = await findBinary();
+  if (!bin) return { installed: false, running: false, error: 'Ollama is not installed' };
+  // Filled in by the 'error' listener if the process cannot be launched.
+  const failure: { message?: string } = {};
+  try {
+    const child = spawn(bin, ['serve'], { stdio: 'ignore' });
+    spawned = child;
+    // Launch failures (ENOENT, EACCES, …) are delivered asynchronously
+    // through 'error', not thrown by spawn(). Without a listener Node
+    // would raise them as an uncaught exception in the main process.
+    child.on('error', (err) => {
+      failure.message = err.message;
+      if (spawned === child) spawned = null;
+    });
+    // Only clear the module-level handle if it still points at THIS
+    // child, so a stale exit cannot wipe out a newer daemon.
+    child.on('exit', () => {
+      if (spawned === child) spawned = null;
+    });
+  } catch (err) {
+    // Synchronous failures, e.g. invalid arguments.
+    return { installed: true, running: false, error: (err as Error).message };
+  }
+  const ready = await waitForReady(15000);
+  if (ready) return getStatus();
+  return {
+    installed: true,
+    running: false,
+    error: failure.message ?? 'Ollama did not become ready',
+  };
+}
+
+// Names of the models the daemon reports on /api/tags. Any failure
+// (network error, non-OK status, unexpected payload) yields [].
+export async function listInstalled(): Promise<string[]> {
+  try {
+    const res = await fetch(`${OLLAMA_HOST}/api/tags`);
+    if (!res.ok) return [];
+    const payload = (await res.json()) as { models?: Array<{ name?: unknown }> };
+    if (!Array.isArray(payload.models)) return [];
+    const names: string[] = [];
+    for (const m of payload.models) {
+      const name = m.name;
+      if (typeof name === 'string') names.push(name);
+    }
+    return names;
+  } catch {
+    return [];
+  }
+}
+
+// The model catalogue annotated for the installer: each entry gains
+// `installed` (is the tag among the installed models?) and
+// `defaultPull` (is it part of DEFAULT_PULL_SET?).
+export async function listCatalog(): Promise<LocalModelInfo[]> {
+  const installed = new Set(await listInstalled());
+  const rows: LocalModelInfo[] = [];
+  for (const { tag, label, kind, approxBytes } of MODEL_CATALOG) {
+    // Ollama records bare tags as ':latest'; match both forms.
+    const qualified = tag.includes(':') ? tag : `${tag}:latest`;
+    rows.push({
+      tag,
+      label,
+      kind,
+      approxBytes,
+      installed: installed.has(tag) || installed.has(qualified),
+      defaultPull: DEFAULT_PULL_SET.includes(tag),
+    });
+  }
+  return rows;
+}
+
+// Pull `model` through the streaming /api/pull endpoint, relaying each
+// progress line to `onProgress`. A pull that starts ends with a
+// terminal event (done: true) whose status is 'success', 'error' or
+// 'cancelled'. A call for a tag that is already being pulled returns
+// immediately without emitting anything. Never throws: failures are
+// reported through `onProgress`.
+export async function pull(
+  model: string,
+  onProgress: (p: OllamaPullProgress) => void,
+): Promise<void> {
+  if (pulls.has(model)) return; // already pulling
+  const ctrl = new AbortController();
+  pulls.set(model, ctrl);
+  try {
+    const res = await fetch(`${OLLAMA_HOST}/api/pull`, {
+      method: 'POST',
+      headers: { 'Content-Type': 'application/json' },
+      body: JSON.stringify({ name: model, stream: true }),
+      signal: ctrl.signal,
+    });
+    if (!res.ok || !res.body) {
+      onProgress({ model, status: 'error', error: `HTTP ${res.status}`, done: true });
+      return;
+    }
+    const reader = res.body.getReader();
+    const decoder = new TextDecoder();
+    // Relay one NDJSON line. Returns true when the line reported a
+    // terminal error, meaning the pull is over.
+    const relay = (raw: string): boolean => {
+      const line = raw.trim();
+      if (!line) return false;
+      try {
+        const o = JSON.parse(line) as {
+          status?: unknown;
+          completed?: number;
+          total?: number;
+          error?: unknown;
+        };
+        if (o.error) {
+          onProgress({ model, status: 'error', error: String(o.error), done: true });
+          return true;
+        }
+        onProgress({
+          model,
+          status: String(o.status ?? ''),
+          completed: o.completed,
+          total: o.total,
+        });
+      } catch {
+        /* ignore non-JSON keepalive lines */
+      }
+      return false;
+    };
+    let buf = '';
+    try {
+      for (;;) {
+        const { value, done } = await reader.read();
+        if (done) break;
+        buf += decoder.decode(value, { stream: true });
+        let nl: number;
+        while ((nl = buf.indexOf('\n')) >= 0) {
+          const line = buf.slice(0, nl);
+          buf = buf.slice(nl + 1);
+          if (relay(line)) return;
+        }
+      }
+      // The stream may end without a trailing newline; handle what is
+      // left so a final status or error line is not dropped.
+      if (relay(buf + decoder.decode())) return;
+    } finally {
+      // Release the response body on every exit path, including the
+      // early return after an error line.
+      void reader.cancel().catch(() => undefined);
+    }
+    onProgress({ model, status: 'success', done: true });
+  } catch (err) {
+    const aborted = ctrl.signal.aborted;
+    onProgress({
+      model,
+      status: aborted ? 'cancelled' : 'error',
+      error: aborted ? undefined : (err as Error).message,
+      done: true,
+    });
+  } finally {
+    // cancelPull() unregisters the tag at once, so a fresh pull of the
+    // same model may already be registered when this one unwinds. Only
+    // remove the entry if it is still ours.
+    if (pulls.get(model) === ctrl) pulls.delete(model);
+  }
+}
+
+// Abort the in-flight pull for `model`, if any, and unregister it.
+export function cancelPull(model: string): void {
+  const ctrl = pulls.get(model);
+  if (ctrl) ctrl.abort();
+  pulls.delete(model);
+}
+
+// Ask the daemon to delete `model` via DELETE /api/delete. The response
+// status is not inspected; only a failed request rejects.
+export async function deleteModel(model: string): Promise<void> {
+  const request = {
+    method: 'DELETE',
+    headers: { 'Content-Type': 'application/json' },
+    body: JSON.stringify({ name: model }),
+  };
+  await fetch(`${OLLAMA_HOST}/api/delete`, request);
+}
+
+// Bytes available on the volume holding the user's home directory,
+// used as a stand-in for where models are stored. Returns -1 when the
+// figure can't be obtained, so callers can skip the pre-check instead
+// of trusting a bad reading.
+export async function freeDiskBytes(): Promise<number> {
+  try {
+    const { bavail, bsize } = await statfs(os.homedir());
+    return bavail * bsize;
+  } catch {
+    return -1;
+  }
+}
+
+// Quit-time cleanup: abort every in-flight pull, then kill the daemon,
+// but only one this module spawned. Per the original note this is wired
+// to the app's 'before-quit'.
+export function shutdown(): void {
+  pulls.forEach((ctrl) => ctrl.abort());
+  pulls.clear();
+  if (!spawned || spawned.killed) return;
+  try {
+    spawned.kill();
+  } catch {
+    /* already gone */
+  }
+  spawned = null;
+}
diff --git a/src/main/ai/openai.ts b/src/main/ai/openai.ts
new file mode 100644
index 0000000..7a500ef
--- /dev/null
+++ b/src/main/ai/openai.ts
@@ -0,0 +1,66 @@
+import OpenAI from 'openai';
+import type { AskInput } from '../../shared/types';
+import type { ProviderAdapter } from './types';
+import { assembleTurns } from './messages';
+
+// OpenAI's chat.completions API takes vision via `image_url` content
+// parts on user messages. The URL can be a data: URL so we don't need
+// to host the image anywhere. Stream chunks arrive with deltas under
+// choices[0].delta.content as strings (null when the message starts).
+
+const MAX_TOKENS = 2048;
+
+// One piece of a multi-part user message: either plain text or an
+// image referenced by URL (a data: URL in this adapter).
+type ContentPart =
+  | { type: 'text'; text: string }
+  | { type: 'image_url'; image_url: { url: string } };
+
+// Local shape of the messages sent to chat.completions. Only user
+// messages may carry multi-part content; system and assistant
+// messages are always plain strings.
+type OpenAIMessage =
+  | { role: 'system'; content: string }
+  | { role: 'user'; content: string | ContentPart[] }
+  | { role: 'assistant'; content: string };
+
+// Turn an AskInput into the chat.completions message list: the system
+// prompt first, then every assembled turn in order. When an image is
+// present it rides on the FIRST user turn (as a data: URL placed ahead
+// of that turn's text) so follow-ups keep it in view.
+function buildMessages(input: AskInput): OpenAIMessage[] {
+  const messages: OpenAIMessage[] = [{ role: 'system', content: input.systemPrompt }];
+  const { turns, firstUserIdx } = assembleTurns(input);
+
+  for (let idx = 0; idx < turns.length; idx += 1) {
+    const turn = turns[idx];
+    const carriesImage = Boolean(input.image) && idx === firstUserIdx;
+
+    if (!carriesImage || !input.image) {
+      messages.push({ role: turn.role, content: turn.content });
+      continue;
+    }
+
+    const dataUrl = `data:${input.image.mime};base64,${input.image.base64}`;
+    messages.push({
+      role: 'user',
+      content: [
+        { type: 'image_url', image_url: { url: dataUrl } },
+        { type: 'text', text: turn.content },
+      ],
+    });
+  }
+
+  return messages;
+}
+
+// OpenAI provider adapter: opens a streaming chat completion and
+// yields each non-empty text delta as it arrives. The caller's
+// AbortSignal is forwarded to the SDK request.
+export const openai: ProviderAdapter = {
+  id: 'openai',
+  async *ask(input, apiKey, signal) {
+    const sdk = new OpenAI({ apiKey });
+    const completion = await sdk.chat.completions.create(
+      {
+        model: input.model,
+        max_tokens: MAX_TOKENS,
+        // eslint-disable-next-line @typescript-eslint/no-explicit-any
+        messages: buildMessages(input) as any,
+        stream: true,
+      },
+      { signal },
+    );
+    for await (const part of completion) {
+      const text = part.choices?.[0]?.delta?.content;
+      // Skip null/absent deltas and empty strings.
+      if (typeof text !== 'string' || text.length === 0) continue;
+      yield text;
+    }
+  },
+};
diff --git a/src/main/ai/rag.ts b/src/main/ai/rag.ts
new file mode 100644
index 0000000..cb5235c
--- /dev/null
+++ b/src/main/ai/rag.ts
@@ -0,0 +1,245 @@
+import { app } from 'electron';
+import { promises as fs } from 'node:fs';
+import path from 'node:path';
+import type { ProfileId } from '../../shared/types';
+import { OLLAMA_HOST } from './ollamaService';
+import { EMBED_MODEL } from './ollamaModels';
+
+// Local, privacy-preserving "self-learning" via RAG. Accepted
+// corrections + bundled per-profile intent examples are embedded with
+// a local model and stored on disk; the closest ones are retrieved as
+// few-shot context for future corrections. No data leaves the device.
+//
+// The store is a single JSON file with brute-force cosine search. At
+// the realistic scale (hundreds–few thousand examples) this is fast
+// and dependency-free; swapping in sqlite-vec later is a drop-in for
+// the same retrieve()/capture() surface.
+
+export type RagKind = 'typed' | 'drawn' | 'analysis' | 'chat';
+
+// One stored example: a correction pair plus the vector used to find
+// it again. This is the shape serialized to the JSON store file.
+interface RagEntry {
+  // Unique within the store; handed out from the nextId counter.
+  id: number;
+  profile: ProfileId;
+  kind: RagKind;
+  // Trimmed input text; this is the text that gets embedded.
+  original: string;
+  // Trimmed corrected text returned alongside `original` on retrieval.
+  corrected: string;
+  // Only accepted entries are returned by retrieve().
+  accepted: boolean;
+  // 'seed' entries are exempt from per-profile eviction.
+  source: 'user' | 'seed';
+  // Date.now() at capture time; decides eviction order (oldest first).
+  createdAt: number;
+  embedding: number[];
+}
+
+// Argument to capture(). `original` and `corrected` are trimmed before
+// use; a pair that is empty or identical after trimming is ignored.
+export interface CaptureInput {
+  profile: ProfileId;
+  kind: RagKind;
+  original: string;
+  corrected: string;
+  // Defaults to true when omitted.
+  accepted?: boolean;
+  // Defaults to 'user' when omitted.
+  source?: 'user' | 'seed';
+}
+
+const PROFILES: ProfileId[] = ['general', 'teacher', 'trader'];
+// Keep brute-force search snappy: cap stored user examples per profile
+// (seeds are exempt). Oldest user entries are evicted first.
+const MAX_USER_PER_PROFILE = 500;
+const SIM_FLOOR = 0.55; // ignore weak matches
+
+let entries: RagEntry[] = [];
+let nextId = 1;
+let loaded = false;
+let dbPath = '';
+let saveTimer: ReturnType<typeof setTimeout> | null = null;
+
+// Absolute path of the JSON store inside Electron's userData
+// directory. Resolved on first use and cached in dbPath afterwards.
+function file(): string {
+  if (dbPath.length === 0) {
+    const userData = app.getPath('userData');
+    dbPath = path.join(userData, 'lekhini-rag.json');
+  }
+  return dbPath;
+}
+
+// The single read of the store file, shared by every caller so that
+// nobody proceeds before that read has finished.
+let loadPromise: Promise<void> | null = null;
+
+// Read the persisted store into memory, once per process.
+//
+// Every concurrent caller awaits the same promise. Previously `loaded`
+// flipped to true before the file had been read, so a second caller
+// (e.g. a capture racing the background seeder) could run against an
+// empty store and have its additions overwritten when the read landed.
+//
+// A missing or unparseable file yields an empty store. Entries without
+// a finite numeric id or an embedding array are dropped on load, since
+// they would otherwise corrupt nextId or crash similarity search.
+async function load(): Promise<void> {
+  if (loaded) return;
+  if (!loadPromise) {
+    loadPromise = (async () => {
+      try {
+        const raw = await fs.readFile(file(), 'utf8');
+        const data = JSON.parse(raw) as { entries?: RagEntry[] } | null;
+        const stored = Array.isArray(data?.entries) ? data.entries : [];
+        entries = stored.filter(
+          (e) =>
+            !!e &&
+            typeof e === 'object' &&
+            Number.isFinite(e.id) &&
+            Array.isArray(e.embedding),
+        );
+        nextId = entries.reduce((m, e) => Math.max(m, e.id), 0) + 1;
+      } catch {
+        entries = [];
+      } finally {
+        // Only now may callers skip the await above.
+        loaded = true;
+      }
+    })();
+  }
+  await loadPromise;
+}
+
+// Request a write of the store 500 ms from now. Calls made while a
+// write is already pending are absorbed by that pending write.
+function scheduleSave(): void {
+  if (saveTimer) return;
+  const flush = (): void => {
+    saveTimer = null;
+    void persist();
+  };
+  saveTimer = setTimeout(flush, 500);
+}
+
+// Serialize the whole in-memory store to disk. Best-effort: any
+// failure is swallowed and the in-memory state is left untouched.
+async function persist(): Promise<void> {
+  try {
+    const target = file();
+    const snapshot = JSON.stringify({ entries });
+    await fs.writeFile(target, snapshot, 'utf8');
+  } catch {
+    /* best-effort */
+  }
+}
+
+// Embed text with the local embedding model. Returns null whenever the
+// model/service isn't available — callers treat that as "RAG off".
+async function embed(text: string): Promise<number[] | null> {
+  try {
+    const response = await fetch(`${OLLAMA_HOST}/api/embeddings`, {
+      method: 'POST',
+      headers: { 'Content-Type': 'application/json' },
+      body: JSON.stringify({ model: EMBED_MODEL, prompt: text }),
+      // Give up after 8 s rather than stall the caller.
+      signal: AbortSignal.timeout(8000),
+    });
+    if (response.ok) {
+      const parsed = (await response.json()) as { embedding?: number[] };
+      const vector = parsed.embedding;
+      if (Array.isArray(vector) && vector.length > 0) return vector;
+    }
+  } catch {
+    /* network error, timeout or bad JSON — fall through to null */
+  }
+  return null;
+}
+
+// Cosine similarity of two vectors, compared over their common prefix
+// when the lengths differ. Returns 0 if either prefix has zero norm
+// (including the empty case).
+function cosine(a: number[], b: number[]): number {
+  const len = Math.min(a.length, b.length);
+  let dot = 0;
+  let sumSqA = 0;
+  let sumSqB = 0;
+  for (let i = 0; i < len; i += 1) {
+    const x = a[i];
+    const y = b[i];
+    dot += x * y;
+    sumSqA += x * x;
+    sumSqB += y * y;
+  }
+  return sumSqA === 0 || sumSqB === 0 ? 0 : dot / (Math.sqrt(sumSqA) * Math.sqrt(sumSqB));
+}
+
+// Enforce MAX_USER_PER_PROFILE for one profile by dropping its oldest
+// user-sourced entries. Entries from other profiles and seed entries
+// are never selected for eviction.
+function evictIfNeeded(profile: ProfileId): void {
+  const owned = entries.filter((e) => e.profile === profile && e.source === 'user');
+  const overflow = owned.length - MAX_USER_PER_PROFILE;
+  if (overflow <= 0) return;
+
+  owned.sort((x, y) => x.createdAt - y.createdAt);
+  const doomed = new Set<number>();
+  for (const entry of owned.slice(0, overflow)) doomed.add(entry.id);
+
+  entries = entries.filter((e) => !doomed.has(e.id));
+}
+
+// Store one correction pair for `input.profile`.
+//
+// Silently does nothing when: either text is empty after trimming, the
+// two texts are identical, the same original is already stored for the
+// profile, or the embedding service is unavailable. On success the
+// entry is appended, the per-profile cap is enforced and a debounced
+// save is scheduled.
+export async function capture(input: CaptureInput): Promise<void> {
+  await load();
+  const original = input.original.trim();
+  const corrected = input.corrected.trim();
+  if (!original || !corrected || original === corrected) return;
+  // De-dupe identical originals within a profile.
+  const isDuplicate = (): boolean =>
+    entries.some((e) => e.profile === input.profile && e.original === original);
+  if (isDuplicate()) return;
+  const embedding = await embed(original);
+  if (!embedding) return; // embeddings unavailable → silently skip
+  // Re-check after the await: another capture of the same text may
+  // have been stored while this one was waiting on the embedding.
+  if (isDuplicate()) return;
+  entries.push({
+    id: nextId++,
+    profile: input.profile,
+    kind: input.kind,
+    original,
+    corrected,
+    accepted: input.accepted ?? true,
+    source: input.source ?? 'user',
+    createdAt: Date.now(),
+    embedding,
+  });
+  evictIfNeeded(input.profile);
+  scheduleSave();
+}
+
+// Return up to `k` accepted examples for `profile` whose stored
+// embedding is most similar to `query`, best match first. Matches
+// scoring below SIM_FLOOR are ignored. Yields an empty list when the
+// query is blank, the store is empty or embeddings are unavailable.
+export async function retrieve(
+  profile: ProfileId,
+  query: string,
+  k = 3,
+): Promise<{ original: string; corrected: string }[]> {
+  await load();
+  const needle = query.trim();
+  if (!needle || entries.length === 0) return [];
+  const queryVec = await embed(needle);
+  if (!queryVec) return [];
+
+  const scored: { entry: RagEntry; score: number }[] = [];
+  for (const entry of entries) {
+    if (entry.profile !== profile || !entry.accepted) continue;
+    const score = cosine(queryVec, entry.embedding);
+    if (score >= SIM_FLOOR) scored.push({ entry, score });
+  }
+  scored.sort((lhs, rhs) => rhs.score - lhs.score);
+
+  return scored
+    .slice(0, k)
+    .map(({ entry }) => ({ original: entry.original, corrected: entry.corrected }));
+}
+
+// Count stored entries per profile. Every entry counts, whatever its
+// source or accepted flag.
+export async function stats(): Promise<Record<ProfileId, number>> {
+  await load();
+  const counts: Record<ProfileId, number> = { general: 0, teacher: 0, trader: 0 };
+  entries.forEach((entry) => {
+    counts[entry.profile] = (counts[entry.profile] ?? 0) + 1;
+  });
+  return counts;
+}
+
+// Drop every entry belonging to `profile` (seed and user alike) and
+// write the result to disk immediately rather than via the debounce.
+export async function resetProfile(profile: ProfileId): Promise<void> {
+  await load();
+  const survivors = entries.filter((entry) => entry.profile !== profile);
+  entries = survivors;
+  await persist();
+}
+
+// ── Intent-file seeding ─────────────────────────────────────────────
+
+// Candidate directories for the bundled intent files, in lookup order:
+// process.resourcesPath (when set) first, then two locations relative
+// to the app path.
+function intentDirs(): string[] {
+  const appPath = app.getAppPath();
+  const relativeToApp = [
+    path.join(appPath, 'resources', 'intent'),
+    path.join(appPath, '..', 'resources', 'intent'),
+  ];
+  return process.resourcesPath
+    ? [path.join(process.resourcesPath, 'intent'), ...relativeToApp]
+    : relativeToApp;
+}
+
+// Read `<profile>.jsonl` from the first candidate directory where it
+// can be read and return its usable example pairs.
+//
+// Each non-blank line is parsed independently. A line is skipped when
+// it is not valid JSON, is not a JSON object, or lacks a non-empty
+// string `original` / `corrected`. Previously a line such as `null`
+// threw inside the filter and discarded the whole file, and non-string
+// values slipped through the type guard only to crash later on trim().
+// Returns [] when no candidate directory has a readable file.
+async function loadIntentFile(profile: ProfileId): Promise<{ original: string; corrected: string }[]> {
+  for (const base of intentDirs()) {
+    try {
+      const raw = await fs.readFile(path.join(base, `${profile}.jsonl`), 'utf8');
+      return raw
+        .split(/\r?\n/)
+        .filter((l) => l.trim().length > 0)
+        .map((l): { original?: unknown; corrected?: unknown } => {
+          try {
+            const parsed: unknown = JSON.parse(l);
+            // Scalars and null are valid JSON but carry no fields.
+            return parsed && typeof parsed === 'object'
+              ? (parsed as { original?: unknown; corrected?: unknown })
+              : {};
+          } catch {
+            return {};
+          }
+        })
+        .filter(
+          (o): o is { original: string; corrected: string } =>
+            typeof o.original === 'string' &&
+            o.original.length > 0 &&
+            typeof o.corrected === 'string' &&
+            o.corrected.length > 0,
+        );
+    } catch {
+      /* try next dir */
+    }
+  }
+  return [];
+}
+
+let seeding = false;
+// Ingest the bundled per-profile examples once embeddings are available.
+// Fire-and-forget; overlapping calls are ignored while one is running.
+//
+// Self-healing at pair granularity: each call stores only the pairs
+// that are still missing, so a profile that was seeded part-way (the
+// embed service dropped out mid-run) is completed by a later call
+// instead of being treated as done. The run stops at the first pair
+// that fails to land, which means embeddings are unavailable, rather
+// than waiting on a failing request for every remaining pair.
+export async function maybeSeed(): Promise<void> {
+  if (seeding) return;
+  seeding = true;
+  try {
+    await load();
+    for (const profile of PROFILES) {
+      const isStored = (original: string): boolean =>
+        entries.some((e) => e.profile === profile && e.original === original);
+      const pairs = await loadIntentFile(profile);
+      for (const p of pairs) {
+        const original = p.original.trim();
+        const corrected = p.corrected.trim();
+        // capture() rejects these, so they can never appear in the
+        // store; skipping them keeps the failure check below honest.
+        if (!original || !corrected || original === corrected) continue;
+        if (isStored(original)) continue;
+        await capture({
+          profile,
+          kind: 'typed',
+          original: p.original,
+          corrected: p.corrected,
+          source: 'seed',
+        });
+        // Not stored → embeddings are unavailable; retry on a later call.
+        if (!isStored(original)) return;
+      }
+    }
+  } finally {
+    seeding = false;
+  }
+}
diff --git a/src/main/ai/ragIpc.ts b/src/main/ai/ragIpc.ts
new file mode 100644
index 0000000..a32dec8
--- /dev/null
+++ b/src/main/ai/ragIpc.ts
@@ -0,0 +1,39 @@
+import { ipcMain } from 'electron';
+import type { ProfileId } from '../../shared/types';
+import { capture, maybeSeed, resetProfile, stats, type RagKind } from './rag';
+
+// Runtime guard for values arriving over IPC: true only for the three
+// known profile ids.
+const isProfile = (v: unknown): v is ProfileId => {
+  switch (v) {
+    case 'general':
+    case 'teacher':
+    case 'trader':
+      return true;
+    default:
+      return false;
+  }
+};
+
+// Register the renderer-facing RAG channels and kick off background
+// seeding. Payloads come from the renderer, so every field is checked
+// at runtime; an invalid payload makes the handler resolve with
+// undefined and do nothing.
+export function registerRagIpc(): void {
+  // Runtime mirror of the RagKind union, used to validate payloads.
+  const ragKinds: readonly RagKind[] = ['typed', 'drawn', 'analysis', 'chat'];
+
+  // Examples-learned counts per profile (drives the Learning settings).
+  ipcMain.handle('rag:stats', () => stats());
+
+  // Forget everything learned for one profile (seed examples included).
+  ipcMain.handle('rag:reset-profile', (_evt, payload: { profile: ProfileId }) => {
+    if (!isProfile(payload?.profile)) return;
+    return resetProfile(payload.profile);
+  });
+
+  // Record a correction the user accepted/edited, so it becomes
+  // few-shot context for future corrections.
+  ipcMain.handle(
+    'rag:capture',
+    (
+      _evt,
+      payload: { profile: ProfileId; kind: RagKind; original: string; corrected: string },
+    ) => {
+      if (!isProfile(payload?.profile)) return;
+      // capture() trims both texts, so a non-string would throw there;
+      // an unknown kind would be written to the store as-is.
+      if (!ragKinds.includes(payload.kind)) return;
+      if (typeof payload.original !== 'string' || typeof payload.corrected !== 'string') return;
+      return capture({
+        profile: payload.profile,
+        kind: payload.kind,
+        original: payload.original,
+        corrected: payload.corrected,
+      });
+    },
+  );
+
+  // Background-seed the bundled intent examples once embeddings are
+  // available (self-heals on later launches if Ollama is down now).
+  void maybeSeed();
+}
diff --git a/src/main/ai/registry.ts b/src/main/ai/registry.ts
new file mode 100644
index 0000000..daf161a
--- /dev/null
+++ b/src/main/ai/registry.ts
@@ -0,0 +1,93 @@
+import type { ProviderId } from '../../shared/types';
+import type { ModelOption, ProviderAdapter } from './types';
+import { anthropic } from './anthropic';
+import { openai } from './openai';
+import { gemini } from './gemini';
+import { deepseek } from './deepseek';
+import { sarvam } from './sarvam';
+import { ollama } from './ollama';
+import { MODEL_CATALOG } from './ollamaModels';
+import { OLLAMA_INSTALL_URL } from './ollamaService';
+
+// Lookup table from provider id to its adapter implementation. The
+// Record type forces an entry for every ProviderId.
+const ADAPTERS: Record<ProviderId, ProviderAdapter> = {
+  anthropic,
+  openai,
+  gemini,
+  deepseek,
+  sarvam,
+  ollama,
+};
+
+// Resolve a provider id to its adapter. Throws when the id has no
+// registered adapter (possible at runtime if the value bypassed the
+// type system).
+export function getAdapter(id: ProviderId): ProviderAdapter {
+  const found = ADAPTERS[id];
+  if (found) return found;
+  throw new Error(`Unknown AI provider: ${id}`);
+}
+
+// Models exposed in the Settings dropdown, per provider. Most are
+// vision-capable; DeepSeek is the text-only exception noted below. The
+// first `recommended: true` entry is the default when the user picks a
+// new provider. Keep this list small — every model adds a row to the
+// dropdown and a maintenance line as providers rotate IDs.
+export const MODELS_BY_PROVIDER: Record<ProviderId, ModelOption[]> = {
+  anthropic: [
+    { id: 'claude-sonnet-4-5', label: 'Claude Sonnet 4.5', recommended: true },
+    { id: 'claude-opus-4-5', label: 'Claude Opus 4.5' },
+    { id: 'claude-haiku-4-5', label: 'Claude Haiku 4.5 (fast / cheap)' },
+  ],
+  openai: [
+    { id: 'gpt-4o', label: 'GPT-4o', recommended: true },
+    { id: 'gpt-4o-mini', label: 'GPT-4o mini (fast / cheap)' },
+  ],
+  gemini: [
+    { id: 'gemini-2.0-flash', label: 'Gemini 2.0 Flash', recommended: true },
+    { id: 'gemini-1.5-pro', label: 'Gemini 1.5 Pro' },
+  ],
+  // DeepSeek is text-only (no vision); great for reasoning / math on
+  // typed questions and text follow-ups. deepseek-reasoner (R1) shows
+  // its chain-of-thought; deepseek-chat (V3) is the faster general model.
+  deepseek: [
+    { id: 'deepseek-chat', label: 'DeepSeek V3 (chat)', recommended: true },
+    { id: 'deepseek-reasoner', label: 'DeepSeek R1 (reasoner)' },
+  ],
+  // Sarvam solves from its own Vision OCR. sarvam-m is the confirmed
+  // stable default; the larger models reason better on complex problems.
+  sarvam: [
+    { id: 'sarvam-m', label: 'Sarvam-M (24B)', recommended: true },
+    { id: 'sarvam-30b', label: 'Sarvam-30B' },
+    { id: 'sarvam-105b', label: 'Sarvam-105B (strongest)' },
+  ],
+  // For local, the real source of truth is which tags are installed
+  // (the Local AI settings query Ollama directly). This static list
+  // just gives defaultModelFor() a sane fallback. Embedding models are
+  // filtered out of it.
+  ollama: MODEL_CATALOG.filter((m) => m.kind !== 'embed').map((m) => ({
+    id: m.tag,
+    label: m.label,
+    recommended: m.tag === 'llama3.2:1b',
+  })),
+};
+
+// Model id to preselect for `provider`: the first entry flagged
+// `recommended`, otherwise the first entry in its list.
+//
+// Throws a descriptive error when the provider has no models at all
+// (e.g. a derived list that filtered down to nothing) instead of
+// failing with a TypeError on `undefined.id`.
+export function defaultModelFor(provider: ProviderId): string {
+  const list = MODELS_BY_PROVIDER[provider] ?? [];
+  const choice = list.find((m) => m.recommended) ?? list[0];
+  if (!choice) throw new Error(`No models configured for AI provider: ${provider}`);
+  return choice.id;
+}
+
+// Human-readable display name for each provider id.
+export const PROVIDER_LABELS: Record<ProviderId, string> = {
+  anthropic: 'Anthropic Claude',
+  openai: 'OpenAI ChatGPT',
+  gemini: 'Google Gemini',
+  deepseek: 'DeepSeek',
+  sarvam: 'Sarvam AI',
+  ollama: 'Local (Ollama)',
+};
+
+// The Settings UI uses this to render Set up → links to provider
+// console pages for users to grab an API key. Local has no key — its
+// link points at the Ollama install/download page instead.
+export const PROVIDER_KEY_URLS: Record<ProviderId, string> = {
+  anthropic: 'https://console.anthropic.com/settings/keys',
+  openai: 'https://platform.openai.com/api-keys',
+  gemini: 'https://aistudio.google.com/app/apikey',
+  deepseek: 'https://platform.deepseek.com/api_keys',
+  sarvam: 'https://dashboard.sarvam.ai',
+  ollama: OLLAMA_INSTALL_URL,
+};
diff --git a/src/main/ai/sarvam.ts b/src/main/ai/sarvam.ts
new file mode 100644
index 0000000..cb375ca
--- /dev/null
+++ b/src/main/ai/sarvam.ts
@@ -0,0 +1,220 @@
+import OpenAI from 'openai';
+import JSZip from 'jszip';
+import { SarvamAIClient } from 'sarvamai';
+import type { AskInput } from '../../shared/types';
+import type { ProviderAdapter } from './types';
+import { assembleTurns } from './messages';
+
+// Sarvam AI is integrated as a self-contained vision provider: when a
+// snip image rides the request we first run it through Sarvam's
+// Document Intelligence (Vision) OCR to extract the text, then hand
+// that text to Sarvam's chat model to actually SOLVE the problem. With
+// no image it's a plain chat call.
+//
+// Two transports:
+//   • OCR   — the official `sarvamai` SDK orchestrates the async,
+//             job-based Document Intelligence flow (createJob → upload
+//             → start → poll → download). Upload accepts only PDF/ZIP,
+//             so the PNG snip is wrapped in a single-entry ZIP; output
+//             comes back as a ZIP we unpack in memory with JSZip.
+//   • solve — Sarvam's chat endpoint is OpenAI-compatible, so we reuse
+//             the `openai` SDK with a baseURL override (same trick as
+//             deepseek.ts) to stream the answer.
+
+const MAX_TOKENS = 2048;
+const CHAT_BASE_URL = 'https://api.sarvam.ai/v1';
+
+// Keep the interactive snip flow snappy: poll a bit faster than the
+// SDK default (2s) and cap total wait so a stuck job surfaces an error
+// instead of hanging the chat. ~1.5s × 30 ≈ 45s ceiling.
+const OCR_POLL_INTERVAL_MS = 1500;
+const OCR_MAX_POLLS = 30;
+
+// Chat message shape sent to Sarvam's chat endpoint. Content is always
+// plain text: image content reaches the model as OCR text embedded in
+// a user message, never as an image part.
+type Message =
+  | { role: 'system'; content: string }
+  | { role: 'user'; content: string }
+  | { role: 'assistant'; content: string };
+
+// Per-session OCR cache. The snip is transcribed exactly once per
+// conversation; follow-up turns reuse the text instead of re-running
+// the (slow, job-based) Vision job. Bounded to the active session —
+// any new sessionId evicts the rest.
+const ocrCache = new Map<string, string>();
+
+// Build the chat message list. The OCR'd image text is embedded into
+// the FIRST user turn (not the latest follow-up) so every replayed turn
+// carries the original problem; the model solves from the transcription.
+function buildMessages(input: AskInput, ocrText: string | null): Message[] {
+  const { turns, firstUserIdx } = assembleTurns(input);
+  // Blank or missing OCR output means there is nothing to embed.
+  const transcript = ocrText ? ocrText.trim() : '';
+
+  const conversation = turns.map((turn, idx): Message => {
+    if (transcript.length > 0 && idx === firstUserIdx) {
+      return {
+        role: 'user',
+        content: `Text extracted from the image:\n\n${transcript}\n\n${turn.content}`,
+      };
+    }
+    return { role: turn.role, content: turn.content };
+  });
+
+  return [{ role: 'system', content: input.systemPrompt }, ...conversation];
+}
+
+// PK\x03\x04 — local file header magic that starts every ZIP archive.
+function isZip(bytes: Uint8Array): boolean {
+  // 'P' 'K' 0x03 0x04; inputs shorter than four bytes never match.
+  const magic = [0x50, 0x4b, 0x03, 0x04];
+  return magic.every((expected, offset) => bytes[offset] === expected);
+}
+
+// Very small HTML→text fallback for when the only output is .html.
+function stripHtml(html: string): string {
+  // Applied in order: drop <style>/<script> blocks, turn remaining
+  // tags into spaces, decode &nbsp;, then tidy whitespace.
+  const passes: [RegExp, string][] = [
+    [/<style[\s\S]*?<\/style>/gi, ''],
+    [/<script[\s\S]*?<\/script>/gi, ''],
+    [/<[^>]+>/g, ' '],
+    [/&nbsp;/g, ' '],
+    [/\s+\n/g, '\n'],
+    [/[ \t]{2,}/g, ' '],
+  ];
+  let text = html;
+  for (const [pattern, replacement] of passes) {
+    text = text.replace(pattern, replacement);
+  }
+  return text.trim();
+}
+
+// Pull human-readable text out of one downloaded output payload. The
+// Document Intelligence output is delivered as a ZIP of per-page files;
+// we prefer Markdown, then plain text, then HTML, then JSON.
+// Extract text from one downloaded payload.
+//
+// A payload that is not a ZIP is decoded as text directly. For a ZIP,
+// exactly one format tier is used, in this order of preference:
+// Markdown, plain text, HTML (tags stripped), JSON (string leaves
+// flattened). Within the chosen tier, files are joined in name order.
+// Markdown and plain text used to share a tier, which duplicated the
+// content whenever an archive carried both renderings of a page.
+// Returns '' when the archive holds none of these formats.
+async function textFromPayload(bytes: Uint8Array): Promise<string> {
+  if (!isZip(bytes)) {
+    return new TextDecoder().decode(bytes);
+  }
+  const zip = await JSZip.loadAsync(bytes);
+  const files = Object.values(zip.files).filter((f) => !f.dir);
+  const pick = (exts: string[]): typeof files =>
+    files
+      .filter((f) => exts.some((e) => f.name.toLowerCase().endsWith(e)))
+      .sort((a, b) => a.name.localeCompare(b.name));
+
+  // Text tiers that need no conversion, most preferred first.
+  for (const exts of [['.md', '.markdown'], ['.txt']]) {
+    const plain = pick(exts);
+    if (plain.length) {
+      return (await Promise.all(plain.map((f) => f.async('string')))).join('\n\n');
+    }
+  }
+
+  const html = pick(['.html', '.htm']);
+  if (html.length) {
+    return (await Promise.all(html.map((f) => f.async('string').then(stripHtml)))).join('\n\n');
+  }
+
+  const json = pick(['.json']);
+  if (json.length) {
+    // Structured page data — flatten any string leaves into text.
+    const texts: string[] = [];
+    for (const f of json) {
+      try {
+        collectStrings(JSON.parse(await f.async('string')), texts);
+      } catch {
+        /* skip unparseable */
+      }
+    }
+    return texts.join('\n');
+  }
+  return '';
+}
+
+// Recursively gather string values from the structured JSON output.
+function collectStrings(node: unknown, out: string[]): void {
+  if (typeof node === 'string') {
+    // Keep the string untrimmed; only all-whitespace ones are dropped.
+    if (node.trim().length > 0) out.push(node);
+    return;
+  }
+  if (!node || typeof node !== 'object') return;
+
+  const children: unknown[] = Array.isArray(node) ? node : Object.values(node);
+  for (const child of children) collectStrings(child, out);
+}
+
+// Run the snip PNG through Sarvam Document Intelligence and return the
+// extracted text. Throws with a clear message on failure so the chat
+// panel surfaces it.
+// Run one image through Sarvam Document Intelligence and return the
+// extracted text, with the text of each output file joined by blank
+// lines.
+//
+// Throws when: the signal is aborted at one of the checkpoints, the
+// job ends in any state other than Completed / PartiallyCompleted, the
+// job lists no output files, or NONE of the listed files could be
+// downloaded. The last case used to return '' silently, which the
+// caller then cached as the transcription for the whole session. An
+// image that genuinely contains no text still returns ''.
+async function runOcr(
+  image: { mime: string; base64: string },
+  apiKey: string,
+  signal: AbortSignal,
+): Promise<string> {
+  const client = new SarvamAIClient({ apiSubscriptionKey: apiKey });
+
+  // Upload requires PDF or ZIP. Wrap the PNG in a flat single-entry ZIP
+  // and hand it over as a File so the SDK keeps the .zip name (a bare
+  // Blob would be uploaded as "document.pdf" and rejected).
+  const zip = new JSZip();
+  zip.file('snip.png', Buffer.from(image.base64, 'base64'));
+  const zipBuf = await zip.generateAsync({ type: 'arraybuffer' });
+  const zipFile = new File([zipBuf], 'snip.zip', { type: 'application/zip' });
+
+  const job = await client.documentIntelligence.createJob({
+    language: 'en-IN',
+    outputFormat: 'md',
+    pollingIntervalMs: OCR_POLL_INTERVAL_MS,
+    maxPollingAttempts: OCR_MAX_POLLS,
+  });
+  if (signal.aborted) throw new Error('aborted');
+
+  await job.uploadFile(zipFile);
+  await job.start();
+  const status = await job.waitUntilComplete();
+  if (signal.aborted) throw new Error('aborted');
+  // 'Completed' and 'PartiallyCompleted' both yield usable output; only
+  // a hard failure (or a still-running job that hit the poll ceiling)
+  // is an error.
+  if (status.job_state !== 'Completed' && status.job_state !== 'PartiallyCompleted') {
+    throw new Error(`Sarvam OCR ${status.job_state}: ${status.error_message ?? 'failed'}`);
+  }
+
+  const links = await job.getDownloadLinks();
+  const urls = Object.values(links.download_urls ?? {})
+    .map((d) => d.file_url)
+    .filter((u): u is string => typeof u === 'string' && u.length > 0);
+  if (urls.length === 0) throw new Error('Sarvam OCR returned no output files');
+
+  const parts: string[] = [];
+  let downloaded = 0;
+  let lastFailure = 0;
+  for (const url of urls) {
+    const res = await fetch(url, { signal });
+    if (!res.ok) {
+      // Tolerate individual failures; remember the status for the
+      // error raised below if every download fails.
+      lastFailure = res.status;
+      continue;
+    }
+    downloaded += 1;
+    const text = await textFromPayload(new Uint8Array(await res.arrayBuffer()));
+    if (text.trim().length > 0) parts.push(text);
+  }
+  if (downloaded === 0) {
+    throw new Error(`Sarvam OCR output could not be downloaded (HTTP ${lastFailure})`);
+  }
+  return parts.join('\n\n');
+}
+
+// Sarvam provider adapter. With an image: obtain its OCR text (from
+// the per-session cache when possible), then stream a chat completion
+// that solves from that text. Without an image: a plain streamed chat.
+export const sarvam: ProviderAdapter = {
+  id: 'sarvam',
+  async *ask(input, apiKey, signal) {
+    // The same snip accompanies every turn of an image conversation,
+    // so the slow OCR job runs once per session and later turns reuse
+    // its result.
+    let transcript: string | null = null;
+    const snip = input.image;
+    if (snip) {
+      const sessionKey = input.sessionId;
+      const cached = Boolean(sessionKey) && ocrCache.has(sessionKey as string);
+      if (sessionKey && cached) {
+        transcript = ocrCache.get(sessionKey) ?? null;
+      } else {
+        transcript = await runOcr(snip, apiKey, signal);
+        if (sessionKey) {
+          // Keep only the active conversation's transcription.
+          ocrCache.clear();
+          ocrCache.set(sessionKey, transcript);
+        }
+      }
+    }
+
+    const chat = new OpenAI({ apiKey, baseURL: CHAT_BASE_URL });
+    const completion = await chat.chat.completions.create(
+      {
+        model: input.model,
+        max_tokens: MAX_TOKENS,
+        // eslint-disable-next-line @typescript-eslint/no-explicit-any
+        messages: buildMessages(input, transcript) as any,
+        stream: true,
+      },
+      { signal },
+    );
+    for await (const part of completion) {
+      const text = part.choices?.[0]?.delta?.content;
+      // Skip null/absent deltas and empty strings.
+      if (typeof text !== 'string' || text.length === 0) continue;
+      yield text;
+    }
+  },
+};
diff --git a/src/main/ai/types.ts b/src/main/ai/types.ts
new file mode 100644
index 0000000..63e7fac
--- /dev/null
+++ b/src/main/ai/types.ts
@@ -0,0 +1,23 @@
+import type { AskInput, ProviderId } from '../../shared/types';
+
+export type { ProviderId, AskInput } from '../../shared/types';
+
+// Each provider implements this interface in a separate file. The
+// async iterable yields plain text deltas; the IPC layer pipes them
+// to the renderer as 'ai:chunk' events. The AbortSignal lets the
+// renderer cancel an in-flight stream from the chat panel; adapters
+// are expected to forward it to their SDK / fetch calls.
+export interface ProviderAdapter {
+  // Must match the key this adapter is registered under.
+  id: ProviderId;
+  // input:  the request (model, system prompt, turns, optional image).
+  // apiKey: credential for the provider.
+  // signal: aborts the request/stream when triggered.
+  ask(
+    input: AskInput,
+    apiKey: string,
+    signal: AbortSignal,
+  ): AsyncIterable<string>;
+}
+
+// One selectable model in a provider's model list.
+export interface ModelOption {
+  // Model identifier as the provider knows it.
+  id: string;
+  // Human-readable name shown to the user.
+  label: string;
+  // Marks the preferred default; the first flagged entry wins.
+  recommended?: boolean;
+}
diff --git a/src/main/capture.ts b/src/main/capture.ts
index 0ef37f8..b58b06f 100644
--- a/src/main/capture.ts
+++ b/src/main/capture.ts
@@ -15,6 +15,8 @@ import { getOverlays } from './windows/overlay';
 import { notifyStatus, onFocusRecheck, screenStatus } from './permissions';
 import { persisted } from './persistence';
 import { patch as patchHub } from './hub';
+import { startChatSession } from './ai/ipc';
+import type { ProfileId } from '../shared/types';
 
 interface Rect {
   x: number;
@@ -121,6 +123,33 @@ export async function copyFocusedSnipToClipboard(): Promise<void> {
   clipboard.writeImage(img);
 }
 
+// Start an AI chat about the user's current snip selection. Same
+// capture + composite path Save / Copy use; the bytes are handed to
+// startChatSession which broadcasts chat:session and opens the dock
+// chat panel.
+//
+// Returns without doing anything when the screen-capture gate refuses,
+// when the focused display has no selection, or when that display or
+// its overlay window cannot be found. A failed capture is routed to
+// handleCaptureFailure(). Note that the selection is cleared before
+// the capture and is not restored if the capture then fails.
+export async function askAiAboutFocusedSnip(profile: ProfileId): Promise<void> {
+  // NOTE(review): passes the 'clipboard' gate reason rather than one of
+  // its own — confirm that is the intended permission prompt.
+  if (!gateScreenForCapture('clipboard')) return;
+  const displayId = getFocusedDisplayId();
+  const rect = snipSelections.get(displayId);
+  if (!rect) return;
+  const display = screen.getAllDisplays().find((d) => d.id === displayId);
+  if (!display) return;
+  const overlay = getOverlays().get(displayId);
+  if (!overlay || overlay.isDestroyed()) return;
+
+  // Hide the dashed selection so it isn't baked into the PNG sent
+  // to the AI (the existing crop rect is already in hand).
+  setSnipSelection(displayId, null);
+  // Short pause before capturing — presumably to let the overlay
+  // repaint without the selection outline.
+  await waitMs(60);
+
+  const png = await captureCroppedComposite(overlay, display, rect);
+  if (!png) {
+    handleCaptureFailure();
+    return;
+  }
+  startChatSession(png, 'image/png', profile);
+}
+
 export async function captureFocusedDisplay(): Promise<void> {
   if (!gateScreenForCapture('capture')) return;
 
@@ -317,6 +346,9 @@ export function registerCaptureIpc() {
   ipcMain.handle('snip:clear', (_evt, payload: { displayId: number }) => {
     setSnipSelection(payload.displayId, null);
   });
+  ipcMain.handle('snip:ask-ai', async (_evt, payload: { profile: ProfileId }) => {
+    await askAiAboutFocusedSnip(payload.profile);
+  });
   // Renderer-triggered folder picker, used by the "Change…" button in
   // Settings → File save. Returns the chosen path so the renderer can
   // patch the hub with it (which is what persists + broadcasts to
diff --git a/src/main/hotkeys.ts b/src/main/hotkeys.ts
index 8f11eb4..c740460 100644
--- a/src/main/hotkeys.ts
+++ b/src/main/hotkeys.ts
@@ -23,6 +23,7 @@ export function registerHotkeys() {
   ipcMain.handle('relay:undo', () => sendToFocusedOverlay('overlay:undo'));
   ipcMain.handle('relay:redo', () => sendToFocusedOverlay('overlay:redo'));
   ipcMain.handle('relay:clear', () => sendToAllOverlays('overlay:clear'));
+  ipcMain.handle('relay:analyze', () => sendToFocusedOverlay('overlay:analyze'));
   ipcMain.handle('capture:trigger', () => captureFocusedDisplay());
   ipcMain.handle('snip:copy', () => copyFocusedSnipToClipboard());
 }
diff --git a/src/main/hub.ts b/src/main/hub.ts
index db099dc..1814025 100644
--- a/src/main/hub.ts
+++ b/src/main/hub.ts
@@ -3,11 +3,13 @@ import { DEFAULT_SETTINGS, GRAPHITE_COLOR } from '../shared/constants';
 import { DEFAULT_PROFILE } from '../shared/profiles';
 import { persisted, PERSISTED_DEFAULTS, save } from './persistence';
 import type {
+  AiProfileModels,
   Calibration,
   HubStateUpdate,
   Orientation,
   PerToolWidth,
   ProfileId,
+  ProviderId,
   Theme,
   ToolId,
   ToolSettings,
@@ -34,6 +36,26 @@ export interface HubState {
   // in hub so main can grow the toolbar window to fit, the same way
   // it does for settingsOpen.
   statusPanelOpen: boolean;
+  // AI chat panel visibility — transient like statusPanelOpen.
+  // Mutually exclusive with settingsOpen + statusPanelOpen at the
+  // dock slot level.
+  chatOpen: boolean;
+  // Persisted AI configuration mirrored into the hub so renderers
+  // can subscribe via the existing hub.onBroadcast pipe.
+  aiActiveProvider: ProviderId | null;
+  aiActiveModel: string | null;
+  aiProfilePrompts: Partial<Record<ProfileId, string>>;
+  // Local-first (Ollama) AI configuration, mirrored from persistence.
+  aiLocalEnabled: boolean;
+  aiInstalledModels: string[];
+  aiLocalModel: string | null;
+  aiLocalVisionModel: string | null;
+  aiProfileModels: AiProfileModels;
+  autocorrectTyped: boolean;
+  autocorrectDrawn: boolean;
+  defaultTextFont: string;
+  aiOnboarded: boolean;
+  autoUpdate: boolean;
 }
 
 const state: HubState = {
@@ -52,6 +74,20 @@ const state: HubState = {
   saveDir: null,
   alwaysAskSavePath: false,
   statusPanelOpen: false,
+  chatOpen: false,
+  aiActiveProvider: null,
+  aiActiveModel: null,
+  aiProfilePrompts: {},
+  aiLocalEnabled: false,
+  aiInstalledModels: [],
+  aiLocalModel: null,
+  aiLocalVisionModel: null,
+  aiProfileModels: {},
+  autocorrectTyped: false,
+  autocorrectDrawn: false,
+  defaultTextFont: 'system-ui, -apple-system, sans-serif',
+  aiOnboarded: false,
+  autoUpdate: true,
 };
 
 const subscribers = new Set<BrowserWindow>();
@@ -114,6 +150,39 @@ export function hydrateFromPersistence(): void {
   // older installs without this key fall through to the default.
   state.saveDir = typeof p.saveDir === 'string' ? p.saveDir : null;
   state.alwaysAskSavePath = typeof p.alwaysAskSavePath === 'boolean' ? p.alwaysAskSavePath : false;
+  // AI config — schema-tolerant: missing fields fall back to null /
+  // empty so old installs upgrade cleanly when they first launch the
+  // build with AI integration.
+  state.aiActiveProvider =
+    p.aiActiveProvider === 'anthropic' ||
+    p.aiActiveProvider === 'openai' ||
+    p.aiActiveProvider === 'gemini' ||
+    p.aiActiveProvider === 'deepseek' ||
+    p.aiActiveProvider === 'sarvam' ||
+    p.aiActiveProvider === 'ollama'
+      ? p.aiActiveProvider
+      : null;
+  state.aiActiveModel = typeof p.aiActiveModel === 'string' ? p.aiActiveModel : null;
+  state.aiProfilePrompts =
+    p.aiProfilePrompts && typeof p.aiProfilePrompts === 'object' ? p.aiProfilePrompts : {};
+  // Local AI — schema-tolerant for installs that predate it.
+  state.aiLocalEnabled = typeof p.aiLocalEnabled === 'boolean' ? p.aiLocalEnabled : false;
+  state.aiInstalledModels = Array.isArray(p.aiInstalledModels)
+    ? p.aiInstalledModels.filter((m): m is string => typeof m === 'string')
+    : [];
+  state.aiLocalModel = typeof p.aiLocalModel === 'string' ? p.aiLocalModel : null;
+  state.aiLocalVisionModel = typeof p.aiLocalVisionModel === 'string' ? p.aiLocalVisionModel : null;
+  state.aiProfileModels =
+    p.aiProfileModels && typeof p.aiProfileModels === 'object' ? p.aiProfileModels : {};
+  state.autocorrectTyped = typeof p.autocorrectTyped === 'boolean' ? p.autocorrectTyped : false;
+  state.autocorrectDrawn = typeof p.autocorrectDrawn === 'boolean' ? p.autocorrectDrawn : false;
+  state.defaultTextFont =
+    typeof p.defaultTextFont === 'string' && p.defaultTextFont.length > 0
+      ? p.defaultTextFont
+      : PERSISTED_DEFAULTS.defaultTextFont;
+  state.aiOnboarded = typeof p.aiOnboarded === 'boolean' ? p.aiOnboarded : false;
+  // Default ON when absent (older installs predate auto-update).
+  state.autoUpdate = typeof p.autoUpdate === 'boolean' ? p.autoUpdate : true;
   // If the active tool is pencil, the canonical color is graphite —
   // don't restore a stray non-graphite value from a previous session.
   const colorForTool =
@@ -244,10 +313,21 @@ export function patch(update: HubStateUpdate) {
   if (update.settingsOpen !== undefined && update.settingsOpen !== state.settingsOpen) {
     state.settingsOpen = update.settingsOpen;
     changed.add('settingsOpen');
-    // Settings and flyout share the side panel slot; only one open at once.
-    if (state.settingsOpen && state.thicknessFlyoutOpen) {
-      state.thicknessFlyoutOpen = false;
-      changed.add('thicknessFlyoutOpen');
+    // The dock slot holds AT MOST ONE of: settings, status panel,
+    // chat panel, thickness flyout. Opening settings closes the rest.
+    if (state.settingsOpen) {
+      if (state.thicknessFlyoutOpen) {
+        state.thicknessFlyoutOpen = false;
+        changed.add('thicknessFlyoutOpen');
+      }
+      if (state.statusPanelOpen) {
+        state.statusPanelOpen = false;
+        changed.add('statusPanelOpen');
+      }
+      if (state.chatOpen) {
+        state.chatOpen = false;
+        changed.add('chatOpen');
+      }
     }
   }
   if (
@@ -280,13 +360,128 @@ export function patch(update: HubStateUpdate) {
   ) {
     state.statusPanelOpen = update.statusPanelOpen;
     changed.add('statusPanelOpen');
-    // Status panel and settings are mutually exclusive panels in the
-    // same dock slot — opening one closes the other so the renderer
-    // and main agree on what's showing.
-    if (state.statusPanelOpen && state.settingsOpen) {
-      state.settingsOpen = false;
-      changed.add('settingsOpen');
+    // Mutex with the other dock-slot panels.
+    if (state.statusPanelOpen) {
+      if (state.settingsOpen) {
+        state.settingsOpen = false;
+        changed.add('settingsOpen');
+      }
+      if (state.chatOpen) {
+        state.chatOpen = false;
+        changed.add('chatOpen');
+      }
+    }
+  }
+  if (update.chatOpen !== undefined && update.chatOpen !== state.chatOpen) {
+    state.chatOpen = update.chatOpen;
+    changed.add('chatOpen');
+    // Mutex with the other dock-slot panels.
+    if (state.chatOpen) {
+      if (state.settingsOpen) {
+        state.settingsOpen = false;
+        changed.add('settingsOpen');
+      }
+      if (state.statusPanelOpen) {
+        state.statusPanelOpen = false;
+        changed.add('statusPanelOpen');
+      }
+    }
+  }
+  if (
+    update.aiActiveProvider !== undefined &&
+    update.aiActiveProvider !== state.aiActiveProvider
+  ) {
+    state.aiActiveProvider = update.aiActiveProvider;
+    changed.add('aiActiveProvider');
+    save('aiActiveProvider', state.aiActiveProvider);
+  }
+  if (update.aiActiveModel !== undefined && update.aiActiveModel !== state.aiActiveModel) {
+    state.aiActiveModel = update.aiActiveModel;
+    changed.add('aiActiveModel');
+    save('aiActiveModel', state.aiActiveModel);
+  }
+  if (update.aiProfilePrompts !== undefined) {
+    // Merge — caller can patch a single profile's override without
+    // wiping the others. Empty-string entry removes the override.
+    const merged = { ...state.aiProfilePrompts, ...update.aiProfilePrompts };
+    for (const key of Object.keys(merged) as ProfileId[]) {
+      const v = merged[key];
+      if (typeof v !== 'string' || v.length === 0) delete merged[key];
     }
+    state.aiProfilePrompts = merged;
+    changed.add('aiProfilePrompts');
+    save('aiProfilePrompts', state.aiProfilePrompts);
+  }
+  if (update.aiLocalEnabled !== undefined && update.aiLocalEnabled !== state.aiLocalEnabled) {
+    state.aiLocalEnabled = update.aiLocalEnabled;
+    changed.add('aiLocalEnabled');
+    save('aiLocalEnabled', state.aiLocalEnabled);
+  }
+  if (update.aiInstalledModels !== undefined) {
+    state.aiInstalledModels = update.aiInstalledModels.filter(
+      (m): m is string => typeof m === 'string',
+    );
+    changed.add('aiInstalledModels');
+    save('aiInstalledModels', state.aiInstalledModels);
+  }
+  if (update.aiLocalModel !== undefined && update.aiLocalModel !== state.aiLocalModel) {
+    state.aiLocalModel = update.aiLocalModel;
+    changed.add('aiLocalModel');
+    save('aiLocalModel', state.aiLocalModel);
+  }
+  if (
+    update.aiLocalVisionModel !== undefined &&
+    update.aiLocalVisionModel !== state.aiLocalVisionModel
+  ) {
+    state.aiLocalVisionModel = update.aiLocalVisionModel;
+    changed.add('aiLocalVisionModel');
+    save('aiLocalVisionModel', state.aiLocalVisionModel);
+  }
+  if (update.aiProfileModels !== undefined) {
+    // Deep-merge per profile so a single profile's text/vision pick can
+    // be patched without wiping the rest. An empty string clears that
+    // slot back to the catalogue default.
+    const merged: AiProfileModels = { ...state.aiProfileModels };
+    for (const key of Object.keys(update.aiProfileModels) as ProfileId[]) {
+      const incoming = update.aiProfileModels[key] ?? {};
+      const slot = { ...merged[key], ...incoming };
+      if (slot.text === '') delete slot.text;
+      if (slot.vision === '') delete slot.vision;
+      if (slot.text === undefined && slot.vision === undefined) delete merged[key];
+      else merged[key] = slot;
+    }
+    state.aiProfileModels = merged;
+    changed.add('aiProfileModels');
+    save('aiProfileModels', state.aiProfileModels);
+  }
+  if (update.autocorrectTyped !== undefined && update.autocorrectTyped !== state.autocorrectTyped) {
+    state.autocorrectTyped = update.autocorrectTyped;
+    changed.add('autocorrectTyped');
+    save('autocorrectTyped', state.autocorrectTyped);
+  }
+  if (update.autocorrectDrawn !== undefined && update.autocorrectDrawn !== state.autocorrectDrawn) {
+    state.autocorrectDrawn = update.autocorrectDrawn;
+    changed.add('autocorrectDrawn');
+    save('autocorrectDrawn', state.autocorrectDrawn);
+  }
+  if (
+    update.defaultTextFont !== undefined &&
+    update.defaultTextFont !== state.defaultTextFont &&
+    update.defaultTextFont.length > 0
+  ) {
+    state.defaultTextFont = update.defaultTextFont;
+    changed.add('defaultTextFont');
+    save('defaultTextFont', state.defaultTextFont);
+  }
+  if (update.aiOnboarded !== undefined && update.aiOnboarded !== state.aiOnboarded) {
+    state.aiOnboarded = update.aiOnboarded;
+    changed.add('aiOnboarded');
+    save('aiOnboarded', state.aiOnboarded);
+  }
+  if (update.autoUpdate !== undefined && update.autoUpdate !== state.autoUpdate) {
+    state.autoUpdate = update.autoUpdate;
+    changed.add('autoUpdate');
+    save('autoUpdate', state.autoUpdate);
   }
   broadcast(changed);
 }
diff --git a/src/main/main.ts b/src/main/main.ts
index 58515a7..04f1608 100644
--- a/src/main/main.ts
+++ b/src/main/main.ts
@@ -10,6 +10,10 @@ import {
 import { createToolbar, getToolbar, registerToolbarIpc, resizeToolbar } from './windows/toolbar';
 import { registerPermissionsIpc } from './permissions';
 import { registerCaptureIpc } from './capture';
+import { registerAiIpc } from './ai/ipc';
+import { registerRagIpc } from './ai/ragIpc';
+import { shutdown as shutdownOllama } from './ai/ollamaService';
+import { initAutoUpdates, registerUpdaterIpc } from './updater';
 import {
   registerDrawingHotkeys,
   registerEscapeWhileDrawing,
@@ -36,6 +40,9 @@ app.whenReady().then(async () => {
   registerPermissionsIpc();
   registerCaptureIpc();
   registerToolbarIpc();
+  registerAiIpc();
+  registerRagIpc();
+  registerUpdaterIpc();
 
   for (const display of screen.getAllDisplays()) {
     console.log('[pen] creating overlay for display', display.id, display.bounds);
@@ -50,6 +57,10 @@ app.whenReady().then(async () => {
 
   registerHotkeys();
 
+  // Kick off background update checks once windows exist to receive the
+  // 'updater:status' broadcasts. No-op (→ 'unsupported') in dev / unsigned.
+  initAutoUpdates();
+
   onChange((state, changed) => {
     if (changed.has('drawMode')) {
       console.log('[pen] drawMode ->', state.drawMode);
@@ -59,16 +70,18 @@ app.whenReady().then(async () => {
       registerEscapeWhileDrawing(state.drawMode);
       registerDrawingHotkeys(state.drawMode);
     }
-    // The status panel (permission / save error) occupies the same
-    // dock slot as Settings in the toolbar, so we treat either being
-    // open as "the side panel is showing" for window-resize purposes.
-    const sidePanelOpen = state.settingsOpen || state.statusPanelOpen;
+    // Three panels share the dock slot: settings, status (permission
+    // / save error), and AI chat. Any of them being open means the
+    // toolbar window should grow to fit a side panel.
+    const sidePanelOpen =
+      state.settingsOpen || state.statusPanelOpen || state.chatOpen;
     if (changed.has('orientation')) {
       resizeToolbar(state.orientation, state.minimized, sidePanelOpen, 'default');
     } else if (
       changed.has('minimized') ||
       changed.has('settingsOpen') ||
-      changed.has('statusPanelOpen')
+      changed.has('statusPanelOpen') ||
+      changed.has('chatOpen')
     ) {
       resizeToolbar(state.orientation, state.minimized, sidePanelOpen, 'keep');
     }
@@ -79,6 +92,8 @@ app.whenReady().then(async () => {
 
 app.on('will-quit', () => {
   unregisterHotkeys();
+  // Stop only an Ollama daemon we spawned; abort any in-flight pulls.
+  shutdownOllama();
 });
 
 app.on('window-all-closed', () => {
diff --git a/src/main/persistence.ts b/src/main/persistence.ts
index 677e740..3ed27b0 100644
--- a/src/main/persistence.ts
+++ b/src/main/persistence.ts
@@ -1,5 +1,12 @@
 import { GRAPHITE_COLOR } from '../shared/constants';
-import type { Orientation, ProfileId, Theme, ToolId } from '../shared/types';
+import type {
+  AiProfileModels,
+  Orientation,
+  ProfileId,
+  ProviderId,
+  Theme,
+  ToolId,
+} from '../shared/types';
 
 export interface PersistedState {
   orientation: Orientation;
@@ -17,6 +24,35 @@ export interface PersistedState {
   // Off by default — the "remember + auto-save" UX is the recommended
   // path. Lives in Settings → File save.
   alwaysAskSavePath: boolean;
+  // AI integration. The provider/model pair the "Ask AI" button will
+  // use; `null` until the user has configured at least one provider.
+  // API keys themselves are NEVER in PersistedState — they live behind
+  // OS keychain via src/main/ai/credentials.ts.
+  aiActiveProvider: ProviderId | null;
+  aiActiveModel: string | null;
+  // Per-profile user overrides for the default AI system prompt.
+  // Falls back to the profile's built-in prompt (see profiles.ts)
+  // when a profile isn't present here.
+  aiProfilePrompts: Partial<Record<ProfileId, string>>;
+  // Local-first (Ollama) AI. When aiLocalEnabled and a model is
+  // installed, the resolver prefers local over any configured cloud
+  // provider. Keys are never needed for local.
+  aiLocalEnabled: boolean;
+  aiInstalledModels: string[];
+  aiLocalModel: string | null;
+  aiLocalVisionModel: string | null;
+  // Per-profile local model overrides (Phase 2 routing).
+  aiProfileModels: AiProfileModels;
+  // Autocorrect toggles (default OFF — raw stays raw).
+  autocorrectTyped: boolean;
+  autocorrectDrawn: boolean;
+  // CSS font-family for newly created text shapes.
+  defaultTextFont: string;
+  // First-run setup wizard completed (or skipped).
+  aiOnboarded: boolean;
+  // Background auto-update preference. Default ON — new versions
+  // download silently and apply on quit. Toggle in Settings → Updates.
+  autoUpdate: boolean;
 }
 
 export const PERSISTED_DEFAULTS: PersistedState = {
@@ -30,6 +66,19 @@ export const PERSISTED_DEFAULTS: PersistedState = {
   activeTool: 'pencil',
   saveDir: null,
   alwaysAskSavePath: false,
+  aiActiveProvider: null,
+  aiActiveModel: null,
+  aiProfilePrompts: {},
+  aiLocalEnabled: false,
+  aiInstalledModels: [],
+  aiLocalModel: null,
+  aiLocalVisionModel: null,
+  aiProfileModels: {},
+  autocorrectTyped: false,
+  autocorrectDrawn: false,
+  defaultTextFont: 'system-ui, -apple-system, sans-serif',
+  aiOnboarded: false,
+  autoUpdate: true,
 };
 
 interface MinimalStore {
diff --git a/src/main/preload.ts b/src/main/preload.ts
index a1f1ef4..120dbfa 100644
--- a/src/main/preload.ts
+++ b/src/main/preload.ts
@@ -1,5 +1,19 @@
 import { contextBridge, ipcRenderer } from 'electron';
-import type { HubStateUpdate, IpcChannel } from '../shared/types';
+import type {
+  AiStatus,
+  AskInput,
+  ChatSessionPayload,
+  ConnectionTestResult,
+  HubStateUpdate,
+  IpcChannel,
+  LocalModelInfo,
+  OllamaPullProgress,
+  OllamaServiceStatus,
+  ProfileId,
+  ProviderId,
+  StreamChunk,
+  UpdateStatus,
+} from '../shared/types';
 
 const api = {
   hub: {
@@ -16,6 +30,7 @@ const api = {
     onUndo: (cb: () => void) => bind('overlay:undo', cb),
     onRedo: (cb: () => void) => bind('overlay:redo', cb),
     onClear: (cb: () => void) => bind('overlay:clear', cb),
+    onAnalyze: (cb: () => void) => bind('overlay:analyze', cb),
     onScreenshot: (cb: (payload: { png: Uint8Array }) => void) =>
       bind('overlay:screenshot', cb as (v: unknown) => void),
     onSnip: (
@@ -43,11 +58,14 @@ const api = {
     clear: (payload: { displayId: number }) =>
       ipcRenderer.invoke('snip:clear' satisfies IpcChannel, payload),
     copy: () => ipcRenderer.invoke('snip:copy' satisfies IpcChannel),
+    askAi: (profile: ProfileId) =>
+      ipcRenderer.invoke('snip:ask-ai' satisfies IpcChannel, { profile }),
   },
   relay: {
     undo: () => ipcRenderer.invoke('relay:undo' satisfies IpcChannel),
     redo: () => ipcRenderer.invoke('relay:redo' satisfies IpcChannel),
     clear: () => ipcRenderer.invoke('relay:clear' satisfies IpcChannel),
+    analyze: () => ipcRenderer.invoke('relay:analyze' satisfies IpcChannel),
     screenshot: () => ipcRenderer.invoke('capture:trigger' satisfies IpcChannel),
   },
   win: {
@@ -91,6 +109,86 @@ const api = {
     openPath: (p: string) =>
       ipcRenderer.invoke('shell:open-path' satisfies IpcChannel, p),
   },
+  ai: {
+    setKey: (provider: ProviderId, key: string) =>
+      ipcRenderer.invoke('ai:set-key' satisfies IpcChannel, { provider, key }),
+    deleteKey: (provider: ProviderId) =>
+      ipcRenderer.invoke('ai:delete-key' satisfies IpcChannel, { provider }),
+    getStatus: () =>
+      ipcRenderer.invoke('ai:get-status' satisfies IpcChannel) as Promise<AiStatus[]>,
+    testConnection: (provider: ProviderId, model: string) =>
+      ipcRenderer.invoke('ai:test-connection' satisfies IpcChannel, {
+        provider,
+        model,
+      }) as Promise<ConnectionTestResult>,
+    ask: (input: AskInput) =>
+      ipcRenderer.invoke('ai:ask' satisfies IpcChannel, input) as Promise<{
+        requestId: string;
+      }>,
+    cancel: (requestId: string) =>
+      ipcRenderer.invoke('ai:cancel' satisfies IpcChannel, { requestId }),
+    onChunk: (cb: (c: StreamChunk) => void) =>
+      bind('ai:chunk', cb as (v: unknown) => void),
+    // One-shot correction calls (non-streaming).
+    recognize: (payload: { png: Uint8Array; mime?: string; profile?: ProfileId }) =>
+      ipcRenderer.invoke('ai:recognize' satisfies IpcChannel, payload) as Promise<{
+        text: string;
+        error?: string;
+      }>,
+    autocorrect: (payload: { text: string; profile?: ProfileId }) =>
+      ipcRenderer.invoke('ai:autocorrect' satisfies IpcChannel, payload) as Promise<{
+        text: string;
+        error?: string;
+      }>,
+  },
+  ollama: {
+    status: () =>
+      ipcRenderer.invoke('ollama:status' satisfies IpcChannel) as Promise<OllamaServiceStatus>,
+    start: () =>
+      ipcRenderer.invoke('ollama:start' satisfies IpcChannel) as Promise<OllamaServiceStatus>,
+    listModels: () =>
+      ipcRenderer.invoke('ollama:list-models' satisfies IpcChannel) as Promise<LocalModelInfo[]>,
+    diskSpace: () =>
+      ipcRenderer.invoke('ollama:disk-space' satisfies IpcChannel) as Promise<number>,
+    pull: (model: string) =>
+      ipcRenderer.invoke('ollama:pull' satisfies IpcChannel, { model }) as Promise<{ ok: boolean }>,
+    cancelPull: (model: string) =>
+      ipcRenderer.invoke('ollama:cancel-pull' satisfies IpcChannel, { model }) as Promise<void>,
+    deleteModel: (model: string) =>
+      ipcRenderer.invoke('ollama:delete-model' satisfies IpcChannel, { model }) as Promise<void>,
+    installHelp: () =>
+      ipcRenderer.invoke('ollama:install-help' satisfies IpcChannel) as Promise<void>,
+    onPullProgress: (cb: (p: OllamaPullProgress) => void) =>
+      bind('ollama:pull-progress', cb as (v: unknown) => void),
+  },
+  rag: {
+    stats: () =>
+      ipcRenderer.invoke('rag:stats' satisfies IpcChannel) as Promise<
+        Record<ProfileId, number>
+      >,
+    resetProfile: (profile: ProfileId) =>
+      ipcRenderer.invoke('rag:reset-profile' satisfies IpcChannel, { profile }) as Promise<void>,
+    capture: (payload: {
+      profile: ProfileId;
+      kind: 'typed' | 'drawn' | 'analysis' | 'chat';
+      original: string;
+      corrected: string;
+    }) => ipcRenderer.invoke('rag:capture' satisfies IpcChannel, payload) as Promise<void>,
+  },
+  chat: {
+    // Called by SnipActions in the overlay to hand a snip off to the
+    // toolbar's ChatPanel. Main relays via chat:session.
+    start: (payload: { png: Uint8Array; mime: string; profile: ProfileId }) =>
+      ipcRenderer.invoke('chat:start' satisfies IpcChannel, payload) as Promise<{
+        sessionId: string;
+      }>,
+    startText: (payload: { text: string; profile: ProfileId }) =>
+      ipcRenderer.invoke('chat:start-text' satisfies IpcChannel, payload) as Promise<{
+        sessionId: string;
+      }>,
+    onSession: (cb: (s: ChatSessionPayload) => void) =>
+      bind('chat:session', cb as (v: unknown) => void),
+  },
   app: {
     info: () =>
       ipcRenderer.invoke('app:info' satisfies IpcChannel) as Promise<{
@@ -99,6 +197,15 @@ const api = {
       }>,
     relaunch: () => ipcRenderer.invoke('app:relaunch' satisfies IpcChannel),
   },
+  updater: {
+    get: () => ipcRenderer.invoke('updater:get' satisfies IpcChannel) as Promise<UpdateStatus>,
+    check: () => ipcRenderer.invoke('updater:check' satisfies IpcChannel) as Promise<UpdateStatus>,
+    install: () => ipcRenderer.invoke('updater:install' satisfies IpcChannel) as Promise<void>,
+    openReleases: () =>
+      ipcRenderer.invoke('updater:open-releases' satisfies IpcChannel) as Promise<void>,
+    onStatus: (cb: (s: UpdateStatus) => void) =>
+      bind('updater:status', cb as (v: unknown) => void),
+  },
   env: {
     displayId: () => ipcRenderer.sendSync('overlay:display-id'),
   },
diff --git a/src/main/updater.ts b/src/main/updater.ts
new file mode 100644
index 0000000..65d023d
--- /dev/null
+++ b/src/main/updater.ts
@@ -0,0 +1,134 @@
+import { app, BrowserWindow, ipcMain, shell } from 'electron';
+// electron-updater is CommonJS; import the default and destructure so the
+// ESM↔CJS interop is stable across bundlers.
+import electronUpdater from 'electron-updater';
+import type { UpdateStatus } from '../shared/types';
+import { getState, onChange } from './hub';
+
+const { autoUpdater } = electronUpdater;
+
+// Where users go to grab a build by hand — the manual fallback when
+// auto-update can't run (dev, or unsigned macOS where Squirrel refuses
+// to apply an update). Derived from package.json's repository field.
+const RELEASES_URL = 'https://github.com/opensourcebharat/lekhini/releases/latest';
+
+// Re-check this often while the app stays open, so a long-running
+// session still notices a release without a restart.
+const CHECK_INTERVAL_MS = 6 * 60 * 60 * 1000; // 6 hours
+
+let status: UpdateStatus = { state: 'idle', currentVersion: '' };
+
+// Push the current update status to every window that is still alive.
+function broadcast(): void {
+  const live = BrowserWindow.getAllWindows().filter((w) => !w.isDestroyed());
+  live.forEach((w) => w.webContents.send('updater:status', status));
+}
+
+function setStatus(next: Partial<UpdateStatus>): void {
+  status = Object.assign({}, status, next); // shallow merge; `next` wins
+  broadcast(); // notify every live window of the new status
+}
+
+// Auto-update only works in a packaged build (a dev run has no
+// app-update.yml feed) — and on macOS only when the app is signed +
+// notarized. We can't cheaply detect signing, so we attempt the check
+// and map a signature error to 'unsupported' (the UI then offers a
+// manual download link instead of looking broken).
+function canUpdate(): boolean {
+  const { isPackaged } = app; // the only precondition we can test up front
+  return isPackaged;
+}
+
+function isSignatureError(message: string): boolean {
+  // Case-insensitive scan for the phrases that signal a code-signing failure.
+  return message.search(/code sign|signature|not signed|not been signed/i) !== -1;
+}
+
+async function check(): Promise<void> {
+  if (!canUpdate()) return; // nothing to query unless canUpdate() allows it
+  try {
+    await autoUpdater.checkForUpdates();
+  } catch (failure) {
+    const message = (failure as Error)?.message ?? String(failure);
+    setStatus({ message, state: isSignatureError(message) ? 'unsupported' : 'error' });
+  }
+}
+
+function wireEvents(): void {
+  autoUpdater.on('checking-for-update', () => {
+    setStatus({ state: 'checking', message: undefined });
+  });
+  autoUpdater.on('update-available', ({ version }) => {
+    // autoDownload on → the fetch already started; off → wait for the user.
+    const state = autoUpdater.autoDownload ? 'downloading' : 'available';
+    setStatus({ state, version, percent: 0 });
+  });
+  autoUpdater.on('update-not-available', () => {
+    setStatus({ state: 'none', version: undefined });
+  });
+  autoUpdater.on('download-progress', ({ percent }) => {
+    setStatus({ state: 'downloading', percent: Math.round(percent) });
+  });
+  autoUpdater.on('update-downloaded', ({ version }) => {
+    setStatus({ state: 'downloaded', version, percent: 100 });
+  });
+  autoUpdater.on('error', (failure) => {
+    const text = (failure as Error)?.message ?? String(failure);
+    setStatus({ state: isSignatureError(text) ? 'unsupported' : 'error', message: text });
+  });
+}
+
+export function initAutoUpdates(): void {
+  status = { state: 'idle', currentVersion: app.getVersion() };
+
+  autoUpdater.allowPrerelease = false;
+  autoUpdater.autoInstallOnAppQuit = true;
+  autoUpdater.autoDownload = getState().autoUpdate;
+
+  wireEvents();
+
+  // Mirror the Settings toggle onto autoDownload as it changes. Turning
+  // it on while a release is already known re-checks so the fetch begins.
+  onChange((hub, changed) => {
+    if (changed.has('autoUpdate')) {
+      autoUpdater.autoDownload = hub.autoUpdate;
+      if (hub.autoUpdate && status.state === 'available') void check();
+    }
+  });
+
+  if (canUpdate()) {
+    void check();
+    setInterval(() => void check(), CHECK_INTERVAL_MS);
+    return;
+  }
+  setStatus({
+    state: 'unsupported',
+    message: 'Updates apply to installed builds only (you are running from source).',
+  });
+}
+
+export function registerUpdaterIpc(): void {
+  ipcMain.handle('updater:get', () => status);
+  ipcMain.handle('updater:check', () =>
+    // Resolve with whatever status the check left behind.
+    check().then(() => status),
+  );
+  // Apply an update: a downloaded one is installed via quit + install;
+  // otherwise the download is started, and 'update-downloaded' later
+  // moves the UI to "Restart to update".
+  ipcMain.handle('updater:install', async () => {
+    if (!canUpdate()) return;
+    if (status.state !== 'downloaded') {
+      try {
+        await autoUpdater.downloadUpdate();
+      } catch (failure) {
+        const text = (failure as Error)?.message ?? String(failure);
+        setStatus({ state: isSignatureError(text) ? 'unsupported' : 'error', message: text });
+      }
+      return;
+    }
+    // Deferred so the IPC reply is flushed before the app tears down.
+    setImmediate(() => autoUpdater.quitAndInstall());
+  });
+  ipcMain.handle('updater:open-releases', () => {
+    void shell.openExternal(RELEASES_URL);
+  });
+}
diff --git a/src/renderer/overlay/App.tsx b/src/renderer/overlay/App.tsx
index 9804517..a7e9390 100644
--- a/src/renderer/overlay/App.tsx
+++ b/src/renderer/overlay/App.tsx
@@ -5,7 +5,27 @@ import { attachPointerPipeline } from './canvas/pointerPipeline';
 import { cursorFor } from './cursors';
 import { store, type SnipRect } from './store';
 import { buildRegistry } from './tools/registry';
-import type { Item, Theme, ToolSettings, Whiteboard } from '../../shared/types';
+import { nextId } from './tools/types';
+import {
+  dominantColor,
+  groupBounds,
+  HANDWRITING_FONT,
+  isDescriptiveJunk,
+  isLikelyQuestion,
+  isRecognizableStroke,
+  rasterizeGroup,
+} from './canvas/recognize';
+import { buildTradeAnalysisText } from './canvas/ta';
+import type {
+  Calibration,
+  Item,
+  ProfileId,
+  StrokeItem,
+  TextShape,
+  Theme,
+  ToolSettings,
+  Whiteboard,
+} from '../../shared/types';
 import type { Tool, ToolContext } from './tools/types';
 
 export function OverlayApp() {
@@ -19,7 +39,21 @@ export function OverlayApp() {
   // can re-render on Solid's signal cycle. Synced inside the store
   // subscriber below.
   const [snipRectSig, setSnipRectSig] = createSignal<SnipRect | null>(null);
+  // AI-configuration mirror + current profile, used by the SnipActions
+  // Ask AI button. Updated from hub.onBroadcast below.
+  const [aiConfigured, setAiConfigured] = createSignal(false);
+  const [activeProfile, setActiveProfile] = createSignal<ProfileId>('general');
+  // Autocorrect + default-font settings, mirrored from the hub.
+  const [autocorrectTyped, setAutocorrectTyped] = createSignal(false);
+  const [autocorrectDrawn, setAutocorrectDrawn] = createSignal(false);
+  const [defaultFont, setDefaultFont] = createSignal('system-ui, -apple-system, sans-serif');
+  // Local AI usable = enabled with at least one model installed.
+  const [aiLocalReady, setAiLocalReady] = createSignal(false);
+  // Any AI path available (local or a configured cloud provider).
+  const aiAvailable = () => aiLocalReady() || aiConfigured();
   let currentTheme: Theme = 'dark';
+  // Latest pixel↔price calibration from the hub (null until set).
+  let currentCalibration: Calibration | null = null;
 
   const applyCursor = () => {
     if (!surface) return;
@@ -47,10 +81,134 @@ export function OverlayApp() {
       store.getState().snipRect,
     );
 
+    // ── Handwriting recognition controller ─────────────────────────
+    // After the user FINISHES drawing pen/pencil ink (long idle, and
+    // never while a stroke is in progress), the recent strokes are
+    // rasterized and sent to the AI for transcription + correction, then
+    // swapped for a single TextShape in one undo step. Gated by the
+    // autocorrectDrawn setting and AI availability.
+    //
+    // The idle must be generous: people pause between letters/words, so
+    // a short timer fires mid-word and overwrites half-written ink. We
+    // wait ~2.2s of no drawing AND cancel any pending pass the moment a
+    // new stroke starts (cancelRecognition on pointer-down).
+    const RECOGNIZE_IDLE_MS = 2200;
+    const recog = {
+      pending: new Set<string>(),
+      recognized: new Set<string>(),
+      timer: null as ReturnType<typeof setTimeout> | null,
+      inFlight: false,
+    };
+
+    const cancelRecognition = () => {
+      // Nothing scheduled → nothing to clear.
+      if (recog.timer === null) return;
+      clearTimeout(recog.timer);
+      recog.timer = null;
+    };
+
+    const scheduleRecognition = () => {
+      cancelRecognition(); // restart the idle countdown from zero
+      recog.timer = setTimeout(function onIdle() {
+        recog.timer = null;
+        void runRecognition();
+      }, RECOGNIZE_IDLE_MS);
+    };
+
+    const onStrokeCommitted = (item: Item) => {
+      // Queue only recognizable ink, and only while the feature can run.
+      if (!(autocorrectDrawn() && aiAvailable() && isRecognizableStroke(item))) return;
+      recog.pending.add(item.id);
+      scheduleRecognition();
+    };
+
+    // One recognition pass: batch the pending strokes, ask the AI for a
+    // transcript, and swap the surviving ink for a single TextShape.
+    const runRecognition = async () => {
+      if (recog.inFlight) {
+        scheduleRecognition();
+        return;
+      }
+      if (!autocorrectDrawn()) {
+        recog.pending.clear();
+        return;
+      }
+      const byId = new Map(store.getState().items.map((i) => [i.id, i] as const));
+      const group: StrokeItem[] = [];
+      for (const id of recog.pending) {
+        const it = byId.get(id);
+        if (it && isRecognizableStroke(it) && !recog.recognized.has(id)) group.push(it);
+      }
+      recog.pending.clear();
+      if (group.length === 0) return;
+      const bounds = groupBounds(group);
+      // Require a real bit of writing — a single tiny mark is almost
+      // always an accidental tap, not a word worth transcribing.
+      if (bounds.w < 24 || bounds.h < 10) return;
+      // Claim these ids before the await so strokes drawn during the
+      // request form a fresh batch and these are never re-sent.
+      const ids = group.map((g) => g.id);
+      ids.forEach((id) => recog.recognized.add(id));
+
+      // In flight from before the first await; a failed render keeps the ink.
+      recog.inFlight = true;
+      let text = '';
+      try {
+        const dpr = Math.max(window.devicePixelRatio || 1, 2);
+        const png = await canvasToPng(rasterizeGroup(group, bounds, dpr));
+        const res = await window.pen.ai.recognize({
+          png,
+          mime: 'image/png',
+          profile: activeProfile(),
+        });
+        text = (res.text ?? '').trim();
+      } catch {
+        // Render or request failed: `text` stays empty, so the ink is kept.
+      } finally {
+        recog.inFlight = false;
+      }
+      // Strip wrapping quotes the model sometimes adds.
+      text = text.replace(/^["'“”‘’`]+|["'“”‘’`]+$/g, '').trim();
+      // Reject non-transcriptions: small vision models often DESCRIBE the
+      // image ("a signature", "the user wrote…") instead of transcribing.
+      // Swapping the ink for that is worse than doing nothing — keep the ink.
+      if (!text || isDescriptiveJunk(text)) return;
+
+      // The user may have undone or erased the ink during the request —
+      // only replace strokes that still exist.
+      const live = new Set(store.getState().items.map((i) => i.id));
+      const survivors = ids.filter((id) => live.has(id));
+      if (survivors.length === 0) return;
+
+      const textItem: TextShape = {
+        kind: 'text',
+        id: nextId('text'),
+        at: { x: bounds.x, y: bounds.y },
+        text,
+        color: dominantColor(group),
+        // Match the size the user actually drew (ink height), so the
+        // replacement neither balloons nor shrinks. Rendered in a
+        // handwriting font to stay realistic at that spot.
+        fontSize: Math.min(200, Math.max(12, Math.round(bounds.h * 0.8))),
+        fontFamily: HANDWRITING_FONT,
+      };
+      store.getState().replaceMany(survivors, [textItem]);
+
+      // A hand-written question/request is also answered in the dock chat,
+      // profile-aware (teacher explains, trader analyzes) via the profile
+      // system prompt. The tidy text stays on the canvas.
+      if (isLikelyQuestion(text)) {
+        void window.pen.chat.startText({ text, profile: activeProfile() });
+      }
+    };
+
     const ctx: ToolContext = {
       get settings() {
         return currentSettings;
       },
+      profile: () => activeProfile(),
+      defaultFont: () => defaultFont(),
+      autocorrectTyped: () => autocorrectTyped(),
       items: () => store.getState().items,
       selectedId: () => store.getState().selectedId,
       setDraft(item: Item | null) {
@@ -58,6 +216,7 @@ export function OverlayApp() {
       },
       commit(item: Item) {
         store.getState().commit(item);
+        onStrokeCommitted(item);
       },
       commitShapeAndSelect(item: Item) {
         store.getState().commit(item);
@@ -91,6 +250,10 @@ export function OverlayApp() {
       onDown(s, e) {
         if (!drawMode()) return;
         e.preventDefault();
+        // Starting a new stroke means the user isn't done writing —
+        // cancel any pending recognition so it never fires mid-word and
+        // overwrites half-finished ink.
+        cancelRecognition();
         // The user is starting an actual stroke — close any thickness
         // popup that was left open on the toolbar so it doesn't hover
         // over the drawing surface. Cheap; only fires when the popup
@@ -155,6 +318,13 @@ export function OverlayApp() {
     const unUndo = window.pen.overlay.onUndo(() => store.getState().undo());
     const unRedo = window.pen.overlay.onRedo(() => store.getState().redo());
     const unClear = window.pen.overlay.onClear(() => store.getState().clear());
+    // Trader hybrid: compute the drawn fib / trendline levels as text
+    // and open a text-only analysis chat (no chart image is sent).
+    const unAnalyze = window.pen.overlay.onAnalyze(() => {
+      const text = buildTradeAnalysisText(store.getState().items, currentCalibration);
+      if (!text) return; // nothing drawn to analyze
+      void window.pen.chat.startText({ text, profile: activeProfile() });
+    });
     const unShot = window.pen.overlay.onScreenshot(async ({ png }) => {
       const out = await composite(png, committed.getCanvas());
       await window.pen.overlay.sendScreenshotResult(out);
@@ -167,6 +337,27 @@ export function OverlayApp() {
       store.getState().setSnipRect(rect);
     });
 
+    // Mirror the AI / autocorrect / font fields from a hub snapshot.
+    type AiHubFields = {
+      aiActiveProvider?: string | null;
+      aiLocalEnabled?: boolean;
+      aiInstalledModels?: string[];
+      autocorrectTyped?: boolean;
+      autocorrectDrawn?: boolean;
+      defaultTextFont?: string;
+    };
+    const applyAiFields = (s: AiHubFields) => {
+      if ('aiActiveProvider' in s) setAiConfigured(s.aiActiveProvider != null);
+      if (typeof s.aiLocalEnabled === 'boolean' || Array.isArray(s.aiInstalledModels)) {
+        setAiLocalReady(!!s.aiLocalEnabled && (s.aiInstalledModels?.length ?? 0) > 0);
+      }
+      if (typeof s.autocorrectTyped === 'boolean') setAutocorrectTyped(s.autocorrectTyped);
+      if (typeof s.autocorrectDrawn === 'boolean') setAutocorrectDrawn(s.autocorrectDrawn);
+      if (typeof s.defaultTextFont === 'string' && s.defaultTextFont.length > 0) {
+        setDefaultFont(s.defaultTextFont);
+      }
+    };
+
     const unBroadcast = window.pen.hub.onBroadcast((state: unknown) => {
       const s = state as {
         activeTool?: string;
@@ -175,7 +366,10 @@ export function OverlayApp() {
         whiteboard?: Whiteboard;
         theme?: Theme;
         thicknessFlyoutOpen?: boolean;
-      };
+        profile?: ProfileId;
+        calibration?: Calibration | null;
+      } & AiHubFields;
+      if ('calibration' in s) currentCalibration = s.calibration ?? null;
       if (s.activeTool) store.getState().setActiveTool(s.activeTool as never);
       if (typeof s.drawMode === 'boolean') store.getState().setDrawMode(s.drawMode);
       if (s.settings) store.getState().setSettings(s.settings);
@@ -187,6 +381,8 @@ export function OverlayApp() {
       if (typeof s.thicknessFlyoutOpen === 'boolean') {
         toolbarFlyoutOpen = s.thicknessFlyoutOpen;
       }
+      applyAiFields(s);
+      if (s.profile) setActiveProfile(s.profile);
     });
 
     void window.pen.hub.get().then((state) => {
@@ -197,7 +393,10 @@ export function OverlayApp() {
         whiteboard: Whiteboard;
         theme?: Theme;
         thicknessFlyoutOpen?: boolean;
-      };
+        profile?: ProfileId;
+        calibration?: Calibration | null;
+      } & AiHubFields;
+      if ('calibration' in s) currentCalibration = s.calibration ?? null;
       store.getState().setActiveTool(s.activeTool as never);
       store.getState().setDrawMode(s.drawMode);
       store.getState().setSettings(s.settings);
@@ -206,6 +405,8 @@ export function OverlayApp() {
       if (typeof s.thicknessFlyoutOpen === 'boolean') {
         toolbarFlyoutOpen = s.thicknessFlyoutOpen;
       }
+      applyAiFields(s);
+      if (s.profile) setActiveProfile(s.profile);
       applyCursor();
     });
 
@@ -216,6 +417,7 @@ export function OverlayApp() {
       unUndo();
       unRedo();
       unClear();
+      unAnalyze();
       unShot();
       unSnip();
       unSnipSel();
@@ -263,7 +465,13 @@ export function OverlayApp() {
           (Order matters: snipRectSig() goes last so the && chain
           resolves to the SnipRect itself for Show's accessor.) */}
       <Show when={drawMode() && activeTool() === 'snip' && snipRectSig()}>
-        {(rect) => <SnipActions rect={rect()} />}
+        {(rect) => (
+          <SnipActions
+            rect={rect()}
+            aiConfigured={aiAvailable()}
+            profile={activeProfile()}
+          />
+        )}
       </Show>
     </div>
   );
@@ -273,15 +481,19 @@ export function OverlayApp() {
 // Anchored at the bottom-right corner of the rect with a small offset.
 // Falls back to inside-rect-bottom-right if the rect is too close to
 // the screen edge to fit the menu below it.
-function SnipActions(props: { rect: SnipRect }) {
-  const MENU_W = 168;
+function SnipActions(props: {
+  rect: SnipRect;
+  aiConfigured: boolean;
+  profile: ProfileId;
+}) {
+  // Wider menu when the Ask AI button is showing so the four buttons
+  // fit in one row without wrapping.
+  const MENU_W = () => (props.aiConfigured ? 232 : 168);
   const MENU_H = 32;
   const GAP = 8;
-  // Tracks an in-flight Copy so the button can show 'Copying…' and
-  // block double-clicks. Save is fire-and-forget (capture goes
-  // through the toolbar's save flow), so it doesn't get a busy state
-  // — the menu just dismisses immediately.
-  const [busy, setBusy] = createSignal<'copy' | null>(null);
+  // Tracks an in-flight Copy / AskAi so the button can show its
+  // busy label and block double-clicks. Save is fire-and-forget.
+  const [busy, setBusy] = createSignal<'copy' | 'ask' | null>(null);
 
   const clearSnip = (): void => {
     const displayId = window.pen.env.displayId();
@@ -316,21 +528,38 @@ function SnipActions(props: { rect: SnipRect }) {
     void window.pen.relay.screenshot();
     exitToIdle();
   };
+  const onAskAi = async (): Promise<void> => {
+    if (busy()) return;
+    setBusy('ask');
+    try {
+      // Main captures + composites + broadcasts chat:session →
+      // toolbar's ChatPanel picks it up and fires the first AI turn.
+      // Selection is cleared by capture.ts during the capture (same
+      // path Save / Copy use).
+      await window.pen.snip.askAi(props.profile);
+    } finally {
+      setBusy(null);
+      // Don't exitToIdle here — the user might want to keep snipping
+      // while chatting. The chat panel is in the toolbar window; the
+      // overlay stays interactive.
+    }
+  };
   const onCancel = (): void => clearSnip();
 
   const positioned = (): { left: string; top: string } => {
     const r = props.rect;
     const winW = window.innerWidth;
     const winH = window.innerHeight;
+    const menuW = MENU_W();
     // Default: below the rect, right-aligned to its right edge.
-    let left = r.x + r.w - MENU_W;
+    let left = r.x + r.w - menuW;
     let top = r.y + r.h + GAP;
     // If it would overflow the bottom of the screen, place ABOVE the rect.
     if (top + MENU_H > winH - 4) top = r.y - MENU_H - GAP;
     // If still off-screen (very tall rect near top), tuck inside the rect.
     if (top < 4) top = Math.min(r.y + r.h - MENU_H - GAP, winH - MENU_H - 4);
     // Horizontal clamping: never let the menu fall off either edge.
-    left = Math.max(4, Math.min(left, winW - MENU_W - 4));
+    left = Math.max(4, Math.min(left, winW - menuW - 4));
     return { left: `${left}px`, top: `${top}px` };
   };
 
@@ -356,6 +585,16 @@ function SnipActions(props: { rect: SnipRect }) {
       >
         Save
       </button>
+      <Show when={props.aiConfigured}>
+        <button
+          class="snip-action snip-action-ai"
+          onClick={() => void onAskAi()}
+          disabled={busy() !== null}
+          title="Send this snip to the AI for analysis"
+        >
+          {busy() === 'ask' ? 'Asking…' : 'Ask AI'}
+        </button>
+      </Show>
       <button
         class="snip-action snip-action-quiet"
         onClick={onCancel}
diff --git a/src/renderer/overlay/canvas/CommittedLayer.ts b/src/renderer/overlay/canvas/CommittedLayer.ts
index e1d0a56..7499fce 100644
--- a/src/renderer/overlay/canvas/CommittedLayer.ts
+++ b/src/renderer/overlay/canvas/CommittedLayer.ts
@@ -10,7 +10,7 @@ export class CommittedLayer {
 
   constructor(canvas: HTMLCanvasElement) {
     this.canvas = canvas;
-    const ctx = canvas.getContext('2d', { alpha: true });
+    const ctx = canvas.getContext('2d', { alpha: true, desynchronized: true });
     if (!ctx) throw new Error('CommittedLayer: 2D context unavailable');
     this.ctx = ctx;
     this.dpr = Math.max(window.devicePixelRatio || 1, 2);
diff --git a/src/renderer/overlay/canvas/LiveLayer.ts b/src/renderer/overlay/canvas/LiveLayer.ts
index a692ae1..afe09b9 100644
--- a/src/renderer/overlay/canvas/LiveLayer.ts
+++ b/src/renderer/overlay/canvas/LiveLayer.ts
@@ -6,11 +6,15 @@ export class LiveLayer {
   private ctx: CanvasRenderingContext2D;
   private dpr: number;
   private pending: Item | null = null;
-  private rafId: number | null = null;
 
   constructor(canvas: HTMLCanvasElement) {
     this.canvas = canvas;
-    const ctx = canvas.getContext('2d', { alpha: true });
+    // `desynchronized: true` opts into the low-latency canvas path: the
+    // browser is allowed to skip the normal compositor round-trip and
+    // push our pixels to the screen with minimal buffering. This is the
+    // single biggest lever for ink-to-screen latency on the live layer,
+    // where the in-progress stroke is redrawn every pointer frame.
+    const ctx = canvas.getContext('2d', { alpha: true, desynchronized: true });
     if (!ctx) throw new Error('LiveLayer: 2D context unavailable');
     this.ctx = ctx;
     // Floor at 2× so strokes stay crisp on standard-DPI external monitors
@@ -35,16 +39,13 @@ export class LiveLayer {
     this.ctx.setTransform(this.dpr, 0, 0, this.dpr, 0, 0);
   }
 
+  // Renders synchronously. The pointer pipeline already coalesces all
+  // moves within a frame into a single onMove → setDraft call (batched
+  // on its own requestAnimationFrame), so a second rAF here only added
+  // a wasted frame of latency. Drawing immediately on the current frame
+  // is one fewer hop between the hand and the screen.
   draft(item: Item | null): void {
     this.pending = item;
-    if (this.rafId !== null) return;
-    this.rafId = requestAnimationFrame(() => {
-      this.rafId = null;
-      this.flush();
-    });
-  }
-
-  private flush(): void {
     const { ctx } = this;
     ctx.save();
     ctx.setTransform(this.dpr, 0, 0, this.dpr, 0, 0);
@@ -54,7 +55,6 @@ export class LiveLayer {
   }
 
   clear(): void {
-    this.pending = null;
     this.draft(null);
   }
 }
diff --git a/src/renderer/overlay/canvas/drawItem.ts b/src/renderer/overlay/canvas/drawItem.ts
index a589ed4..d54eba2 100644
--- a/src/renderer/overlay/canvas/drawItem.ts
+++ b/src/renderer/overlay/canvas/drawItem.ts
@@ -1,5 +1,5 @@
 import { getStroke } from 'perfect-freehand';
-import { FIB_LEVELS } from '../../../shared/constants';
+import { FIB_LEVELS, fibColor } from '../../../shared/constants';
 import type { Item } from '../../../shared/types';
 
 // Two cached noise tiles for pencil rendering:
@@ -86,18 +86,19 @@ export function drawItem(ctx: CanvasRenderingContext2D, item: Item, live = false
 function drawStroke(
   ctx: CanvasRenderingContext2D,
   item: Extract<Item, { kind: 'stroke' }>,
-  _live: boolean,
+  live: boolean,
 ): void {
   if (item.points.length === 0) return;
   const tool = item.tool;
   const isHi = tool === 'highlighter';
   const isPencil = tool === 'pencil';
 
-  // Pencil renders at 0.85× the requested width — a hard pencil tip
+  // Pencil renders at 0.75× the requested width — a hard pencil tip
   // lays down a finer line than an inked brush of the same nominal
-  // size, and this scale is what makes the two tools read as
-  // mechanically different at the same slider value.
-  const widthScale = isPencil ? 0.85 : 1;
+  // size. This scale both makes the two tools read as mechanically
+  // different at the same slider value and keeps pencil handwriting
+  // compact, so small letters don't eat horizontal space.
+  const widthScale = isPencil ? 0.75 : 1;
   const baseWidth = isHi ? Math.max(item.width, 14) : item.width * widthScale;
   const effectiveWidth = baseWidth;
 
@@ -108,6 +109,42 @@ function drawStroke(
   const baseAlpha = isHi ? Math.min(item.opacity, 0.35) : item.opacity;
   const effectiveAlpha = isPencil ? baseAlpha * 0.88 : baseAlpha;
 
+  // Fast path for the in-progress (live) stroke: draw the points as a
+  // round-capped, round-joined polyline instead of running getStroke
+  // over the whole array every frame. getStroke is O(n) per call, and
+  // calling it each frame on a growing stroke is O(n²) — the dominant
+  // source of latency on long handwriting strokes. A polyline at the
+  // effective width is visually near-identical to the committed pen
+  // outline (which is now uniform / untapered) and to a pencil/marker
+  // core; the full getStroke render — plus pencil grain — runs once on
+  // commit. This keeps the live cursor glued to the hand regardless of
+  // stroke length.
+  if (live) {
+    ctx.save();
+    if (isHi) ctx.globalCompositeOperation = 'multiply';
+    ctx.globalAlpha = effectiveAlpha;
+    ctx.strokeStyle = item.color;
+    ctx.fillStyle = item.color;
+    ctx.lineWidth = effectiveWidth;
+    ctx.lineCap = 'round';
+    ctx.lineJoin = 'round';
+    const pts = item.points;
+    if (pts.length === 1) {
+      // A single down-sample has no segment to stroke — lay a dot so
+      // the very first contact is visible immediately.
+      ctx.beginPath();
+      ctx.arc(pts[0].x, pts[0].y, effectiveWidth / 2, 0, Math.PI * 2);
+      ctx.fill();
+    } else {
+      ctx.beginPath();
+      ctx.moveTo(pts[0].x, pts[0].y);
+      for (let i = 1; i < pts.length; i++) ctx.lineTo(pts[i].x, pts[i].y);
+      ctx.stroke();
+    }
+    ctx.restore();
+    return;
+  }
+
   // Tool-specific stroke profiles. The key distinctions:
   //
   //   pencil  — no simulated pressure (uniform mark), low thinning,
@@ -130,31 +167,40 @@ function drawStroke(
       end: { taper: 0, cap: true },
     };
   } else if (isPencil) {
-    // Tuned for fine-handwriting at sub-pixel widths: lower thinning so
-    // a 0.5–1px pencil doesn't get pinched into invisibility by
-    // perfect-freehand's outline algorithm, and lower streamline so the
-    // line actually follows the writer's wrist instead of being eaten
-    // by post-hoc smoothing. Tapers shrink proportionally so very fine
-    // strokes still end cleanly.
+    // Precise thin handwriting, same principle as the pen: a fully
+    // UNIFORM mark. thinning is now 0 (was 0.04) and the start/end
+    // tapers are dropped (were up to 4px / 7px) — together those were
+    // still widening mid-stroke and pinching the ends, the milder
+    // version of the pen's old ballooning. A hard graphite tip lays a
+    // constant-width line anyway; its "pencil" identity comes from the
+    // grain pass below, not from width variation. Low streamline keeps
+    // the line tracking the wrist for small letters.
     opts = {
-      thinning: 0.04,
+      thinning: 0,
       smoothing: 0.28,
       streamline: 0.18,
       easing: (t: number) => t,
       simulatePressure: false,
-      start: { taper: Math.min(effectiveWidth * 0.5, 4), cap: true },
-      end: { taper: Math.min(effectiveWidth * 0.7, 7), cap: true },
+      start: { taper: 0, cap: true },
+      end: { taper: 0, cap: true },
     };
   } else {
-    // pen
+    // pen — tuned for precise thin handwriting on a mouse/trackpad.
+    // simulatePressure is OFF: a mouse reports no real pressure, so
+    // perfect-freehand's velocity-derived fake pressure inflated slow
+    // strokes — and handwriting IS slow, so letters ballooned and
+    // smeared together ("large space with minimum movement"). With
+    // thinning 0 the pen lays a uniform-width line that tracks the hand
+    // 1:1, and the tapers are dropped so short strokes don't get pinched
+    // or stretched. Light streamline keeps curves smooth without lag.
     opts = {
-      thinning: 0.45,
-      smoothing: 0.55,
-      streamline: 0.5,
+      thinning: 0,
+      smoothing: 0.4,
+      streamline: 0.34,
       easing: (t: number) => t,
-      simulatePressure: true,
-      start: { taper: Math.min(effectiveWidth * 1, 12), cap: true },
-      end: { taper: Math.min(effectiveWidth * 1.8, 28), cap: true },
+      simulatePressure: false,
+      start: { taper: 0, cap: true },
+      end: { taper: 0, cap: true },
     };
   }
 
@@ -163,7 +209,7 @@ function drawStroke(
     {
       size: effectiveWidth,
       ...opts,
-      last: !_live,
+      last: !live,
     },
   );
   if (strokePoints.length < 2) return;
@@ -228,28 +274,98 @@ function drawLine(
   ctx.restore();
 }
 
+// Ratio label with no trailing zeros: 0, 0.236, 0.5, 1 …
+function formatFibLevel(L: number): string {
+  return `${L}`;
+}
+
+// Percentage text for a level, at most one decimal: 0%, 23.6%, 50%, 61.8%, 100% …
+function formatFibPct(L: number): string {
+  const pct = L * 100;
+  return (Number.isInteger(pct) ? pct : Number(pct.toFixed(1))) + '%';
+}
+
 function drawFib(ctx: CanvasRenderingContext2D, item: Extract<Item, { kind: 'fib' }>): void {
+  const levels = (item.levels.length ? item.levels : FIB_LEVELS).slice().sort((a, b) => a - b);
+  if (levels.length === 0) return;
+
+  // Horizontal span IS the box width the user dragged out — the hand
+  // tool's corner handles edit p1.x / p2.x to widen or narrow it, so we
+  // no longer force a fixed rightward extension. Only when the box is
+  // essentially zero-width (the fib was dragged straight down) do we
+  // fall back to a default projection so the levels stay visible.
+  const left = Math.min(item.p1.x, item.p2.x);
+  const right = Math.max(item.p1.x, item.p2.x);
+  const MIN_FIB_W = 16;
+  const DEFAULT_FIB_W = 220;
+  const xLeft = left;
+  const xRight = right - left >= MIN_FIB_W ? right : left + DEFAULT_FIB_W;
+  // A retracement is measured back from the END of the move toward its
+  // START, the same as TradingView / MT: 0% sits at the second point
+  // (p2, where the drag ended — the impulse's extreme) and 100% at the
+  // first point (p1, the move's origin). Level L is the fraction of the
+  // move retraced, so it interpolates from p2 (L=0) to p1 (L=1).
+  // Anchoring at p1 for L=0 — as the old code did — mirrored every
+  // level (e.g. the 0.618 line landed at the 0.382 position).
+  const yAt = (L: number): number => item.p2.y + (item.p1.y - item.p2.y) * L;
+
   ctx.save();
-  ctx.globalAlpha = item.opacity;
-  ctx.strokeStyle = item.color;
-  ctx.fillStyle = item.color;
-  ctx.lineWidth = 1;
+
+  // Translucent colored zones between consecutive levels — the banded
+  // look of a trading-chart fib. Each band is tinted with the color of
+  // the level it retraces INTO (its upper boundary), kept faint so the
+  // underlying chart stays readable through it.
+  for (let i = 0; i < levels.length - 1; i++) {
+    const yA = yAt(levels[i]);
+    const yB = yAt(levels[i + 1]);
+    ctx.globalAlpha = item.opacity * 0.1;
+    ctx.fillStyle = fibColor(levels[i + 1]);
+    ctx.fillRect(xLeft, Math.min(yA, yB), xRight - xLeft, Math.abs(yB - yA));
+  }
+
   ctx.font = '11px -apple-system, system-ui, sans-serif';
-  const dx = Math.abs(item.p2.x - item.p1.x);
-  const xLeft = Math.min(item.p1.x, item.p2.x) - 4;
-  const xRight = Math.max(item.p1.x, item.p2.x) + Math.max(dx, 120);
-  const levels = item.levels.length ? item.levels : FIB_LEVELS;
+  ctx.textBaseline = 'middle';
 
   for (const L of levels) {
-    const y = item.p1.y + (item.p2.y - item.p1.y) * L;
+    const y = yAt(L);
+    const col = fibColor(L);
+    // Emphasize the two levels traders watch most — the 50% midpoint
+    // and the 0.618 golden ratio — with a slightly heavier line.
+    const key = L === 0.5 || L === 0.618;
+
+    ctx.globalAlpha = item.opacity;
+    ctx.strokeStyle = col;
+    ctx.lineWidth = key ? 1.6 : 1;
+    // +0.5 keeps the 1px lines crisp on the device pixel grid.
     ctx.beginPath();
-    ctx.moveTo(xLeft, y);
-    ctx.lineTo(xRight, y);
+    ctx.moveTo(xLeft, y + 0.5);
+    ctx.lineTo(xRight, y + 0.5);
     ctx.stroke();
-    if (item.showLabels) {
-      ctx.fillText(`${L.toFixed(3)}`, xLeft - 32, y + 4);
+
+    if (!item.showLabels) continue;
+
+    const label = `${formatFibLevel(L)}  ${formatFibPct(L)}`;
+    const padX = 5;
+    const chipH = 16;
+    const chipW = ctx.measureText(label).width + padX * 2;
+    // Sit the chip just left of the lines; if that would run off the
+    // left edge, tuck it inside the level instead so it stays visible.
+    let chipX = xLeft - chipW - 6;
+    let textX = chipX + padX;
+    if (chipX < 2) {
+      chipX = xLeft + 6;
+      textX = chipX + padX;
     }
+
+    ctx.globalAlpha = item.opacity;
+    ctx.fillStyle = col;
+    ctx.beginPath();
+    ctx.roundRect(chipX, y - chipH / 2, chipW, chipH, 3);
+    ctx.fill();
+    ctx.fillStyle = '#ffffff';
+    ctx.fillText(label, textX, y);
   }
+
   ctx.restore();
 }
 
@@ -377,7 +493,10 @@ function drawArrow(ctx: CanvasRenderingContext2D, item: Extract<Item, { kind: 'a
 function drawText(ctx: CanvasRenderingContext2D, item: Extract<Item, { kind: 'text' }>): void {
   ctx.save();
   ctx.fillStyle = item.color;
-  ctx.font = `${item.fontSize}px -apple-system, system-ui, sans-serif`;
+  // Honor the per-item font family stamped from the user's default-font
+  // setting; fall back to the system stack for items saved before it.
+  const family = item.fontFamily ?? 'system-ui, -apple-system, sans-serif';
+  ctx.font = `${item.fontSize}px ${family}`;
   ctx.textBaseline = 'top';
   const lines = item.text.split('\n');
   for (let i = 0; i < lines.length; i++) {
diff --git a/src/renderer/overlay/canvas/handles.ts b/src/renderer/overlay/canvas/handles.ts
index 9bcca6d..e44237c 100644
--- a/src/renderer/overlay/canvas/handles.ts
+++ b/src/renderer/overlay/canvas/handles.ts
@@ -31,9 +31,14 @@ export function getHandles(item: Item): Handle[] {
       ];
     }
     case 'fib':
+      // Two diagonal (alternate) corners. Each corner carries both an
+      // x and a y, so dragging it resizes the fib's width AND height at
+      // once — and which corner is the swing low vs high follows the
+      // drag direction (top→bottom or bottom→top). This replaces the
+      // old centered handles that could only stretch height.
       return [
-        { id: 'p1', x: (item.p1.x + item.p2.x) / 2, y: item.p1.y },
-        { id: 'p2', x: (item.p1.x + item.p2.x) / 2, y: item.p2.y },
+        { id: 'p1', x: item.p1.x, y: item.p1.y },
+        { id: 'p2', x: item.p2.x, y: item.p2.y },
       ];
     case 'stroke':
     case 'text':
@@ -64,8 +69,9 @@ export function applyHandle(original: Item, hid: HandleId, x: number, y: number)
       return { ...original, p1: { x: nl, y: nt }, p2: { x: nr, y: nb } };
     }
     case 'fib':
-      if (hid === 'p1') return { ...original, p1: { x: original.p1.x, y: y } };
-      if (hid === 'p2') return { ...original, p2: { x: original.p2.x, y: y } };
+      // Corner drag edits both axes: x changes the width, y the height.
+      if (hid === 'p1') return { ...original, p1: { x, y } };
+      if (hid === 'p2') return { ...original, p2: { x, y } };
       return original;
     case 'stroke':
     case 'text':
diff --git a/src/renderer/overlay/canvas/recognize.ts b/src/renderer/overlay/canvas/recognize.ts
new file mode 100644
index 0000000..9e94384
--- /dev/null
+++ b/src/renderer/overlay/canvas/recognize.ts
@@ -0,0 +1,122 @@
+import type { Item, StrokeItem } from '../../../shared/types';
+import { drawItem } from './drawItem';
+
+// A cross-platform handwriting/script font stack. Recognized ink is
+// rendered in this so the converted text still reads as something the
+// user "wrote" rather than a typeset paragraph — keeping the markup
+// feeling realistic at the same place and size.
+export const HANDWRITING_FONT =
+  "'Segoe Print', 'Bradley Hand', 'Comic Sans MS', 'Snell Roundhand', cursive";
+
+// Decides whether recognized ink reads as a question or request (to be
+// answered in chat) rather than a note to tidy up in place. True when
+// the text ends in '?' or opens with a common interrogative / imperative
+// word ("what…", "explain…", "analyze…", "solve…"); case-insensitive.
+export function isLikelyQuestion(text: string): boolean {
+  const normalized = text.trim().toLowerCase();
+  if (normalized.length === 0) return false;
+  // The opener has to be a whole word at the very start (^ … \b).
+  const opener =
+    /^(who|what|when|where|why|which|whom|whose|how|is|are|am|can|could|should|would|will|do|does|did|explain|define|describe|summarize|summarise|solve|calculate|analyse|analyze|compare|list|give|tell|find)\b/;
+  return normalized.endsWith('?') || opener.test(normalized);
+}
+
+// Flags vision-model output that must never replace the user's ink: a
+// DESCRIPTION of the image instead of a transcription ("a signature",
+// "the user wrote…", "this appears to be handwriting"), a refusal, or
+// an over-long ramble. Empty / whitespace-only text is flagged too.
+// Matching is case-insensitive.
+export function isDescriptiveJunk(text: string): boolean {
+  const trimmed = text.trim();
+  // A drawn word or phrase is short: nothing at all, or > 240 chars, is junk.
+  if (trimmed.length === 0 || trimmed.length > 240) return true;
+  const telltale =
+    /\b(signature|the image|this image|an image|the drawing|a drawing|appears? to|looks? like|seems? to|handwrit|the user (wrote|typed|drew)|i (can )?see|i'?m sorry|sorry,|cannot (read|make out|determine)|can'?t (read|tell)|unable to|no (legible|readable|visible|discernible)|illegible|it'?s (a|an)\b)/i;
+  return telltale.test(trimmed);
+}
+
+// Type guard: only freehand ink (pencil / pen strokes) counts as handwriting.
+// Highlighter strokes and all non-stroke Items are excluded from recognition.
+export function isRecognizableStroke(item: Item): item is StrokeItem {
+  if (item.kind !== 'stroke') return false;
+  return item.tool === 'pencil' || item.tool === 'pen';
+}
+
+export interface Bounds {
+  x: number;
+  y: number;
+  w: number;
+  h: number;
+}
+
+function strokeMinMax(s: StrokeItem): { minX: number; minY: number; maxX: number; maxY: number } {
+  // Extent of the sampled points, grown from an empty (inverted) box so
+  // the first point always replaces the initial infinities.
+  const box = { minX: Infinity, minY: Infinity, maxX: -Infinity, maxY: -Infinity };
+  for (const { x, y } of s.points) {
+    if (x < box.minX) box.minX = x;
+    if (y < box.minY) box.minY = y;
+    if (x > box.maxX) box.maxX = x;
+    if (y > box.maxY) box.maxY = y;
+  }
+  // Widen by half the stroke width (+1) so the rendered outline, not
+  // just the centerline samples, fits inside without clipping.
+  const pad = s.width / 2 + 1;
+  return { minX: box.minX - pad, minY: box.minY - pad, maxX: box.maxX + pad, maxY: box.maxY + pad };
+}
+
+export function groupBounds(strokes: StrokeItem[]): Bounds {
+  // Union of every stroke's padded extent, reported as an x / y / w / h
+  // rect. With no strokes the box stays inverted (x / y are Infinity and
+  // w / h are -Infinity), so callers should pass at least one stroke.
+  const u = { minX: Infinity, minY: Infinity, maxX: -Infinity, maxY: -Infinity };
+  for (const stroke of strokes) {
+    const box = strokeMinMax(stroke);
+    if (box.minX < u.minX) u.minX = box.minX;
+    if (box.minY < u.minY) u.minY = box.minY;
+    if (box.maxX > u.maxX) u.maxX = box.maxX;
+    if (box.maxY > u.maxY) u.maxY = box.maxY;
+  }
+  return { x: u.minX, y: u.minY, w: u.maxX - u.minX, h: u.maxY - u.minY };
+}
+
+// The color carrying the most ink in the group — scored by total sampled
+// points per color, first-seen color winning ties — for the replacement text.
+export function dominantColor(strokes: StrokeItem[]): string {
+  // Sum sampled points per color; a Map iterates in first-seen order.
+  const pointsByColor = new Map<string, number>();
+  for (const { color, points } of strokes) {
+    pointsByColor.set(color, (pointsByColor.get(color) ?? 0) + points.length);
+  }
+  let winner = strokes[0]?.color ?? '#3a3a3c';
+  let winnerPoints = -1;
+  pointsByColor.forEach((total, color) => {
+    if (total <= winnerPoints) return;
+    winnerPoints = total;
+    winner = color;
+  });
+  return winner;
+}
+
+const RASTER_PAD = 12;
+
+// Renders the stroke group to a fresh offscreen canvas over an opaque
+// WHITE backdrop (vision models read dark-on-light far better than
+// transparent ink). Size is bounds + RASTER_PAD per side, scaled by `dpr`;
+// the group's top-left lands at the pad origin. No 2D context → blank canvas.
+export function rasterizeGroup(strokes: StrokeItem[], bounds: Bounds, dpr: number): HTMLCanvasElement {
+  const paddedW = bounds.w + RASTER_PAD * 2;
+  const paddedH = bounds.h + RASTER_PAD * 2;
+  const canvas = document.createElement('canvas');
+  canvas.width = Math.max(1, Math.ceil(paddedW * dpr));
+  canvas.height = Math.max(1, Math.ceil(paddedH * dpr));
+  const g = canvas.getContext('2d');
+  if (g) {
+    g.setTransform(dpr, 0, 0, dpr, 0, 0);
+    g.fillStyle = '#ffffff';
+    g.fillRect(0, 0, paddedW, paddedH);
+    g.translate(RASTER_PAD - bounds.x, RASTER_PAD - bounds.y);
+    strokes.forEach((stroke) => drawItem(g, stroke));
+  }
+  return canvas;
+}
diff --git a/src/renderer/overlay/canvas/ta.ts b/src/renderer/overlay/canvas/ta.ts
new file mode 100644
index 0000000..194a081
--- /dev/null
+++ b/src/renderer/overlay/canvas/ta.ts
@@ -0,0 +1,92 @@
+import type { Calibration, FibShape, Item, LineShape } from '../../../shared/types';
+import { FIB_LEVELS } from '../../../shared/constants';
+
+// Convert a screen Y to a price by linear interpolation between the two
+// calibration anchors; null when uncalibrated or both anchors share a pixel row.
+function priceAtPixelY(pixelY: number, calib: Calibration | null): number | null {
+  if (!calib) return null;
+  const { p1: a, p2: b } = calib;
+  const spanPx = b.pixel.y - a.pixel.y;
+  if (spanPx === 0) return null;
+  return a.price + ((pixelY - a.pixel.y) / spanPx) * (b.price - a.price);
+}
+
+function fmtPrice(p: number): string {
+  // Fewer decimals as magnitude grows: 0 at ≥ 1000, 2 at ≥ 1, otherwise 5.
+  const magnitude = Math.abs(p);
+  if (magnitude >= 1000) return p.toFixed(0);
+  return p.toFixed(magnitude >= 1 ? 2 : 5);
+}
+
+// Screen Y of a level, matching drawItem: 0 sits on p2 (move end), 1 on p1 (origin).
+function fibYAt(fib: FibShape, level: number): number {
+  const { p1: origin, p2: end } = fib;
+  return end.y + (origin.y - end.y) * level;
+}
+
+function describeFib(fib: FibShape, index: number, calib: Calibration | null): string {
+  // Ascending copy of the fib's own levels, or of the shared defaults if it has none.
+  const levels = [...(fib.levels.length ? fib.levels : FIB_LEVELS)].sort((a, b) => a - b);
+  // Screen Y grows downward: an end point above the origin (smaller y)
+  // means the move was drawn upward, into the swing high.
+  const dir =
+    fib.p2.y < fib.p1.y ? 'up (swing low → swing high)' : 'down (swing high → swing low)';
+  const rows = levels.map((L) => {
+    const pct = `${Number((L * 100).toFixed(1))}%`;
+    const price = priceAtPixelY(fibYAt(fib, L), calib);
+    const priceStr = price != null ? ` ≈ ${fmtPrice(price)}` : '';
+    const tag = L === 0 ? ' (0% — end of move)' : L === 1 ? ' (100% — origin)' : '';
+    return `  • ${pct}${priceStr}${tag}`;
+  });
+  return [`Fibonacci retracement #${index + 1} — move drawn ${dir}:`, ...rows].join('\n');
+}
+
+function describeLine(line: LineShape, index: number, calib: Calibration | null): string {
+  // One-line summary of a drawn line: kind, slope (trendlines only) and price range.
+  const kind = line.kind === 'trendline' ? 'Trendline' : 'Line';
+  // Read left → right (smaller screen y = higher) so slope/range don't flip with drag direction.
+  const { a, b } = line.p1.x <= line.p2.x ? { a: line.p1, b: line.p2 } : { a: line.p2, b: line.p1 };
+  const trend = b.y < a.y ? ' (rising)' : b.y > a.y ? ' (falling)' : ' (flat)';
+  const slope = line.kind === 'trendline' ? trend : '';
+  const [pa, pb] = [priceAtPixelY(a.y, calib), priceAtPixelY(b.y, calib)];
+  const range = pa != null && pb != null ? ` from ≈ ${fmtPrice(pa)} to ≈ ${fmtPrice(pb)}` : '';
+  return `${kind} #${index + 1}${slope}${range}`;
+}
+
+// Turns the user's drawn technical markup (fibs, lines, trendlines)
+// into a self-contained analysis prompt: framing text plus the computed
+// numbers, so the trader text model never has to read a chart image.
+// Returns null when the canvas holds nothing analyzable.
+export function buildTradeAnalysisText(items: Item[], calib: Calibration | null): string | null {
+  const isFib = (i: Item): i is FibShape => i.kind === 'fib';
+  const isLine = (i: Item): i is LineShape => i.kind === 'line' || i.kind === 'trendline';
+  const fibs = items.filter(isFib);
+  const lines = items.filter(isLine);
+  if (fibs.length + lines.length === 0) return null;
+
+  // One section per fib (numbered in item order), then a single
+  // bulleted section covering every line / trendline.
+  const sections: string[] = fibs.map((f, i) => describeFib(f, i, calib));
+  if (lines.length > 0) {
+    const bullets = lines.map((l, i) => `  • ${describeLine(l, i, calib)}`);
+    sections.push('Lines / trendlines:\n' + bullets.join('\n'));
+  }
+  if (!calib) {
+    sections.push(
+      'Note: no price calibration is set, so levels are given as ' +
+        'retracement ratios rather than absolute prices.',
+    );
+  }
+
+  // Framing before the numbers, then the actual request to the model.
+  const intro =
+    'These are the technical levels I have marked on my chart, computed ' +
+    'numerically from my drawings (not read from an image — treat the ' +
+    'numbers as exact):\n\n';
+  const ask =
+    '\n\nUsing only these levels, give a concise read: the prevailing ' +
+    'trend, the key levels to watch, and one or two probabilistic ' +
+    'scenarios with an invalidation level for each. Observation only — ' +
+    'not financial advice.';
+  return intro + sections.join('\n\n') + ask;
+}
diff --git a/src/renderer/overlay/index.html b/src/renderer/overlay/index.html
index bc56f06..c8eba0f 100644
--- a/src/renderer/overlay/index.html
+++ b/src/renderer/overlay/index.html
@@ -105,6 +105,19 @@
         font-weight: 600;
       }
       .snip-action-primary:hover { filter: brightness(1.05); }
+      /* Ask AI gets a distinct accent so it reads as a different
+         class of action than Copy/Save (which manipulate the
+         clipboard / file system). Muted purple-ish blue. */
+      .snip-action-ai {
+        background: rgba(132, 109, 224, 0.18);
+        color: #b6a7ff;
+        border-color: rgba(132, 109, 224, 0.35);
+        font-weight: 600;
+      }
+      .snip-action-ai:hover {
+        background: rgba(132, 109, 224, 0.30);
+        color: #ffffff;
+      }
       .snip-action-quiet {
         color: rgba(228, 228, 230, 0.65);
         padding: 6px 8px;
diff --git a/src/renderer/overlay/store.ts b/src/renderer/overlay/store.ts
index 0ac8be9..2ecb154 100644
--- a/src/renderer/overlay/store.ts
+++ b/src/renderer/overlay/store.ts
@@ -23,6 +23,9 @@ export interface OverlayState {
 interface OverlayActions {
   commit(item: Item): void;
   replace(itemId: string, next: Item): void;
+  // Remove several items and add new ones in ONE history entry, so the
+  // whole swap (e.g. recognized ink → corrected text) is a single undo.
+  replaceMany(removeIds: string[], add: Item[]): void;
   remove(itemId: string): void;
   setItem(itemId: string, next: Item): void;
   snapshot(): void;
@@ -64,6 +67,16 @@ export const store = createStore<Store>((set, get) => ({
     set({ items: nextItems, past: nextPast, future: [] });
   },
 
+  replaceMany(removeIds, add) {
+    const state = get();
+    const doomed = new Set(removeIds);
+    const survivors = state.items.filter((item) => !doomed.has(item.id));
+    // Nothing removed and nothing to add: bail out so no history entry is pushed.
+    if (survivors.length === state.items.length && add.length === 0) return;
+    const history = [...state.past, state.items].slice(-HISTORY_LIMIT);
+    set({ items: survivors.concat(add), past: history, future: [] });
+  },
+
   remove(itemId) {
     const { items, past } = get();
     const nextItems = items.filter((i) => i.id !== itemId);
diff --git a/src/renderer/overlay/tools/pen.ts b/src/renderer/overlay/tools/pen.ts
index e24de3f..3319c78 100644
--- a/src/renderer/overlay/tools/pen.ts
+++ b/src/renderer/overlay/tools/pen.ts
@@ -66,12 +66,15 @@ class InputSmoother {
 export function makePen(tool: StrokeTool): Tool {
   let working: StrokeItem | null = null;
   const smoother = new InputSmoother();
-  // Pencil should TRACK the hand — a hard graphite tip doesn't flow,
-  // so we keep the input filter light (high alpha floor = minimal
-  // smoothing) and let the rendering grain do the work of feeling
-  // "real". Pen flows like ink, so it gets heavier input smoothing
-  // for soft cursive curves. Highlighter passes raw.
-  const smoothingFloor = tool === 'pencil' ? 0.6 : tool === 'pen' ? 0.35 : 1;
+  // Higher alpha floor = the rendered point sits closer to the true
+  // cursor, so the ink tracks the hand instead of trailing it. On a
+  // mouse/trackpad (no real pressure, coarser sampling) precise
+  // handwriting needs the line to land where the pointer actually is —
+  // lag reads as imprecision. Pencil already tracked tightly (0.6);
+  // pen is raised from 0.35 → 0.55 so it stops floating behind the
+  // cursor. Remaining jitter is cleaned up by perfect-freehand's
+  // streamline at commit time. Highlighter passes raw.
+  const smoothingFloor = tool === 'pencil' ? 0.6 : tool === 'pen' ? 0.55 : 1;
   const useSmoother = tool !== 'highlighter';
 
   const filter = (p: Point): Point =>
@@ -89,7 +92,12 @@ export function makePen(tool: StrokeTool): Tool {
       if (!working) return;
       const next = samples.map(sampleToPoint).map(filter);
       working.points.push(...next);
-      ctx.setDraft({ ...working, points: [...working.points] });
+      // Pass the working item by reference — the LiveLayer reads and
+      // draws it synchronously inside this call, so there's no need to
+      // clone. The previous `{ ...working, points: [...] }` copied the
+      // entire growing point array on every frame: O(n²) over a stroke,
+      // which is what made long handwriting strokes lag progressively.
+      ctx.setDraft(working);
     },
     onUp(sample, ctx) {
       if (!working) return;
diff --git a/src/renderer/overlay/tools/text.ts b/src/renderer/overlay/tools/text.ts
index 3a5beed..a7b7108 100644
--- a/src/renderer/overlay/tools/text.ts
+++ b/src/renderer/overlay/tools/text.ts
@@ -1,5 +1,5 @@
 import type { TextShape } from '../../../shared/types';
-import type { Tool } from './types';
+import type { Tool, ToolContext } from './types';
 import { nextId } from './types';
 
 export const text: Tool = {
@@ -8,16 +8,25 @@ export const text: Tool = {
     void ctx.requestFocus().then(() => {
       ctx.promptText({ x: sample.x, y: sample.y }, (value: string) => {
         void ctx.releaseFocus();
-        if (!value.trim()) return;
-        const item: TextShape = {
+        const raw = value.trim();
+        if (!raw) return;
+        const make = (content: string): TextShape => ({
           kind: 'text',
           id: nextId('text'),
           at: { x: sample.x, y: sample.y },
-          text: value,
+          text: content,
           color: ctx.settings.color,
           fontSize: Math.max(14, Math.round(ctx.settings.width * 4)),
-        };
-        ctx.commit(item);
+          fontFamily: ctx.defaultFont(),
+        });
+        // Raw stays raw unless the user enabled typed autocorrect. When
+        // on, run the text through the (local-first) corrector and
+        // commit the result; on any failure fall back to the raw text.
+        if (ctx.autocorrectTyped()) {
+          void correctThenCommit(ctx, raw, make);
+        } else {
+          ctx.commit(make(raw));
+        }
       });
     });
   },
@@ -28,3 +37,17 @@ export const text: Tool = {
     /* no-op */
   },
 };
+
+async function correctThenCommit(
+  ctx: ToolContext,
+  raw: string,
+  make: (text: string) => TextShape,
+): Promise<void> {
+  try {
+    const { text } = await window.pen.ai.autocorrect({ text: raw, profile: ctx.profile() });
+    const cleaned = text ? text.trim() : ''; // a blank result counts as "no correction"
+    ctx.commit(make(cleaned.length > 0 ? cleaned : raw));
+  } catch {
+    ctx.commit(make(raw)); // any failure above falls back to the untouched input
+  }
+}
diff --git a/src/renderer/overlay/tools/types.ts b/src/renderer/overlay/tools/types.ts
index c7f8275..a8111e1 100644
--- a/src/renderer/overlay/tools/types.ts
+++ b/src/renderer/overlay/tools/types.ts
@@ -1,4 +1,4 @@
-import type { Item, ToolSettings } from '../../../shared/types';
+import type { Item, ProfileId, ToolSettings } from '../../../shared/types';
 import type { PointerSample } from '../canvas/pointerPipeline';
 
 export interface ToolContext {
@@ -16,6 +16,10 @@ export interface ToolContext {
   releaseFocus(): Promise<void>;
   promptText(at: { x: number; y: number }, onCommit: (text: string) => void): void;
   drawMode(): boolean;
+  // Active profile + text-styling/AI settings, read live by tools.
+  profile(): ProfileId;
+  defaultFont(): string;
+  autocorrectTyped(): boolean;
 }
 
 export interface Tool {
diff --git a/src/renderer/penApi.d.ts b/src/renderer/penApi.d.ts
index 5665557..8266a31 100644
--- a/src/renderer/penApi.d.ts
+++ b/src/renderer/penApi.d.ts
@@ -1,4 +1,18 @@
-import type { HubStateUpdate, ScreenPermissionStatus } from '../shared/types';
+import type {
+  AiStatus,
+  AskInput,
+  ChatSessionPayload,
+  ConnectionTestResult,
+  HubStateUpdate,
+  LocalModelInfo,
+  OllamaPullProgress,
+  OllamaServiceStatus,
+  ProfileId,
+  ProviderId,
+  ScreenPermissionStatus,
+  StreamChunk,
+  UpdateStatus,
+} from '../shared/types';
 
 declare global {
   interface Window {
@@ -12,6 +26,7 @@ declare global {
         onUndo(cb: () => void): () => void;
         onRedo(cb: () => void): () => void;
         onClear(cb: () => void): () => void;
+        onAnalyze(cb: () => void): () => void;
         onScreenshot(cb: (payload: { png: Uint8Array }) => void): () => void;
         onSnip(
           cb: (payload: {
@@ -35,11 +50,13 @@ declare global {
         }): Promise<void>;
         clear(payload: { displayId: number }): Promise<void>;
         copy(): Promise<void>;
+        askAi(profile: ProfileId): Promise<void>;
       };
       relay: {
         undo(): Promise<void>;
         redo(): Promise<void>;
         clear(): Promise<void>;
+        analyze(): Promise<void>;
         screenshot(): Promise<void>;
       };
       win: {
@@ -70,10 +87,68 @@ declare global {
       shell: {
         openPath(p: string): Promise<void>;
       };
+      ai: {
+        setKey(provider: ProviderId, key: string): Promise<void>;
+        deleteKey(provider: ProviderId): Promise<void>;
+        getStatus(): Promise<AiStatus[]>;
+        testConnection(
+          provider: ProviderId,
+          model: string,
+        ): Promise<ConnectionTestResult>;
+        ask(input: AskInput): Promise<{ requestId: string }>;
+        cancel(requestId: string): Promise<void>;
+        onChunk(cb: (c: StreamChunk) => void): () => void;
+        recognize(payload: {
+          png: Uint8Array;
+          mime?: string;
+          profile?: ProfileId;
+        }): Promise<{ text: string; error?: string }>;
+        autocorrect(payload: {
+          text: string;
+          profile?: ProfileId;
+        }): Promise<{ text: string; error?: string }>;
+      };
+      ollama: {
+        status(): Promise<OllamaServiceStatus>;
+        start(): Promise<OllamaServiceStatus>;
+        listModels(): Promise<LocalModelInfo[]>;
+        diskSpace(): Promise<number>;
+        pull(model: string): Promise<{ ok: boolean }>;
+        cancelPull(model: string): Promise<void>;
+        deleteModel(model: string): Promise<void>;
+        installHelp(): Promise<void>;
+        onPullProgress(cb: (p: OllamaPullProgress) => void): () => void;
+      };
+      rag: {
+        stats(): Promise<Record<ProfileId, number>>;
+        resetProfile(profile: ProfileId): Promise<void>;
+        capture(payload: {
+          profile: ProfileId;
+          kind: 'typed' | 'drawn' | 'analysis' | 'chat';
+          original: string;
+          corrected: string;
+        }): Promise<void>;
+      };
+      chat: {
+        start(payload: {
+          png: Uint8Array;
+          mime: string;
+          profile: ProfileId;
+        }): Promise<{ sessionId: string }>;
+        startText(payload: { text: string; profile: ProfileId }): Promise<{ sessionId: string }>;
+        onSession(cb: (s: ChatSessionPayload) => void): () => void;
+      };
       app: {
         info(): Promise<{ name: string; version: string; packaged: boolean }>;
         relaunch(): Promise<void>;
       };
+      updater: {
+        get(): Promise<UpdateStatus>;
+        check(): Promise<UpdateStatus>;
+        install(): Promise<void>;
+        openReleases(): Promise<void>;
+        onStatus(cb: (s: UpdateStatus) => void): () => void;
+      };
       env: {
         displayId(): number;
       };
diff --git a/src/renderer/toolbar/App.tsx b/src/renderer/toolbar/App.tsx
index 403c099..a4f02b8 100644
--- a/src/renderer/toolbar/App.tsx
+++ b/src/renderer/toolbar/App.tsx
@@ -1,15 +1,96 @@
-import { createEffect, createMemo, createSignal, For, onMount, onCleanup, Show } from 'solid-js';
+import {
+  createEffect,
+  createMemo,
+  createSignal,
+  For,
+  Match,
+  onMount,
+  onCleanup,
+  Show,
+  Switch,
+} from 'solid-js';
 import { COLOR_PRESETS, THICKNESS_PRESETS } from '../../shared/constants';
-import { PROFILES, PROFILE_ORDER } from '../../shared/profiles';
+import { PROFILES, PROFILE_ORDER, resolveAiPrompt } from '../../shared/profiles';
 import type {
+  AiStatus,
+  ChatSessionPayload,
+  ConnectionTestResult,
+  LocalModelInfo,
+  OllamaPullProgress,
+  OllamaServiceStatus,
   Orientation,
   ProfileId,
+  ProviderId,
   Theme,
   ToolId,
   ToolSettings,
+  UpdateStatus,
   Whiteboard,
 } from '../../shared/types';
 import { Icons, Logo } from './icons';
+import { ChatPanel } from './ChatPanel';
+
+// The cloud providers (kept as an opt-in fallback). Local (Ollama)
+// has its own settings section, so these mirror maps are cloud-only.
+type CloudProviderId = 'anthropic' | 'openai' | 'gemini' | 'deepseek' | 'sarvam';
+
+const PROVIDER_LABELS: Record<CloudProviderId, string> = {
+  anthropic: 'Anthropic Claude',
+  openai: 'OpenAI ChatGPT',
+  gemini: 'Google Gemini',
+  deepseek: 'DeepSeek',
+  sarvam: 'Sarvam AI',
+};
+
+const PROVIDER_KEY_URLS: Record<CloudProviderId, string> = {
+  anthropic: 'https://console.anthropic.com/settings/keys',
+  openai: 'https://platform.openai.com/api-keys',
+  gemini: 'https://aistudio.google.com/app/apikey',
+  deepseek: 'https://platform.deepseek.com/api_keys',
+  sarvam: 'https://dashboard.sarvam.ai',
+};
+
+interface ModelOption {
+  id: string;
+  label: string;
+}
+
+// Kept in sync with src/main/ai/registry.ts. A static mirror is fine
+// — the list rotates with SDK releases, not user input.
+const MODELS_BY_PROVIDER: Record<CloudProviderId, ModelOption[]> = {
+  anthropic: [
+    { id: 'claude-sonnet-4-5', label: 'Claude Sonnet 4.5 (recommended)' },
+    { id: 'claude-opus-4-5', label: 'Claude Opus 4.5' },
+    { id: 'claude-haiku-4-5', label: 'Claude Haiku 4.5 (fast / cheap)' },
+  ],
+  openai: [
+    { id: 'gpt-4o', label: 'GPT-4o (recommended)' },
+    { id: 'gpt-4o-mini', label: 'GPT-4o mini (fast / cheap)' },
+  ],
+  gemini: [
+    { id: 'gemini-2.0-flash', label: 'Gemini 2.0 Flash (recommended)' },
+    { id: 'gemini-1.5-pro', label: 'Gemini 1.5 Pro' },
+  ],
+  // Text-only — see registry.ts. No vision; routes image snips to text.
+  deepseek: [
+    { id: 'deepseek-chat', label: 'DeepSeek V3 (recommended)' },
+    { id: 'deepseek-reasoner', label: 'DeepSeek R1 (reasoner)' },
+  ],
+  // Vision-capable via Sarvam's own OCR (image → text → solve).
+  sarvam: [
+    { id: 'sarvam-m', label: 'Sarvam-M 24B (recommended)' },
+    { id: 'sarvam-30b', label: 'Sarvam-30B' },
+    { id: 'sarvam-105b', label: 'Sarvam-105B (strongest)' },
+  ],
+};
+
+const DEFAULT_MODEL: Record<CloudProviderId, string> = {
+  anthropic: 'claude-sonnet-4-5',
+  openai: 'gpt-4o',
+  gemini: 'gemini-2.0-flash',
+  deepseek: 'deepseek-chat',
+  sarvam: 'sarvam-m',
+};
 
 // Status-panel discriminator. Both kinds reuse the existing
 // .settings-panel layout slot so they feel native to the toolbar
@@ -31,8 +112,32 @@ interface HubSnapshot {
   saveDir: string | null;
   alwaysAskSavePath: boolean;
   statusPanelOpen: boolean;
+  chatOpen: boolean;
+  aiActiveProvider: ProviderId | null;
+  aiActiveModel: string | null;
+  aiProfilePrompts: Partial<Record<ProfileId, string>>;
+  aiLocalEnabled: boolean;
+  aiInstalledModels: string[];
+  aiLocalModel: string | null;
+  aiLocalVisionModel: string | null;
+  aiProfileModels: Partial<Record<ProfileId, { text?: string; vision?: string }>>;
+  autocorrectTyped: boolean;
+  autocorrectDrawn: boolean;
+  defaultTextFont: string;
+  aiOnboarded: boolean;
+  autoUpdate: boolean;
 }
 
+// Curated, cross-platform-safe font choices for the default-text-font
+// picker. Values are CSS font-family stacks stamped onto TextShapes.
+const TEXT_FONTS: { label: string; value: string }[] = [
+  { label: 'System', value: 'system-ui, -apple-system, sans-serif' },
+  { label: 'Sans', value: 'Helvetica, Arial, sans-serif' },
+  { label: 'Serif', value: "Georgia, 'Times New Roman', serif" },
+  { label: 'Mono', value: "Menlo, Consolas, 'Courier New', monospace" },
+  { label: 'Rounded', value: "'SF Pro Rounded', 'Segoe UI', system-ui, sans-serif" },
+];
+
 type FlyoutTool = 'pencil' | 'pen' | 'eraser' | 'highlighter';
 const FLYOUT_TOOLS = new Set<ToolId>(['pencil', 'pen', 'eraser', 'highlighter']);
 const isFlyoutTool = (id: ToolId): id is FlyoutTool => FLYOUT_TOOLS.has(id);
@@ -114,6 +219,20 @@ export function ToolbarApp() {
     saveDir: null,
     alwaysAskSavePath: false,
     statusPanelOpen: false,
+    chatOpen: false,
+    aiActiveProvider: null,
+    aiActiveModel: null,
+    aiProfilePrompts: {},
+    aiLocalEnabled: false,
+    aiInstalledModels: [],
+    aiLocalModel: null,
+    aiLocalVisionModel: null,
+    aiProfileModels: {},
+    autocorrectTyped: false,
+    autocorrectDrawn: false,
+    defaultTextFont: 'system-ui, -apple-system, sans-serif',
+    aiOnboarded: false,
+    autoUpdate: true,
   });
   // Status-panel state. Mutually exclusive with the settings panel —
   // when one opens, the layout slot belongs to it. `panelError` holds
@@ -144,17 +263,194 @@ export function ToolbarApp() {
     version: '1.0.0',
     packaged: true,
   });
+  // Auto-update lifecycle, pushed from main via 'updater:status'.
+  const [updateStatus, setUpdateStatus] = createSignal<UpdateStatus | null>(null);
   let scrollRef: HTMLDivElement | undefined;
   let barMainRef: HTMLDivElement | undefined;
 
+  // ── AI Settings section state ───────────────────────────────────
+  // aiStatus tells us which providers have a key (renderer never sees
+  // the key itself). Selected dropdown values + keyInput are local
+  // working state until the user clicks Save.
+  const [aiStatus, setAiStatus] = createSignal<AiStatus[]>([]);
+  const [aiSelectedProvider, setAiSelectedProvider] = createSignal<CloudProviderId>('anthropic');
+  const [aiSelectedModel, setAiSelectedModel] = createSignal<string>(
+    DEFAULT_MODEL.anthropic,
+  );
+  const [aiKeyInput, setAiKeyInput] = createSignal('');
+  const [aiTestResult, setAiTestResult] = createSignal<ConnectionTestResult | null>(null);
+  const [aiBusy, setAiBusy] = createSignal<'saving' | 'testing' | null>(null);
+  // The current chat session, captured here (in the always-mounted
+  // toolbar) rather than inside ChatPanel — ChatPanel only mounts when
+  // chatOpen flips true, and main broadcasts chat:session at that same
+  // instant, so a listener inside the panel misses the first session.
+  // We subscribe in onMount below and hand it down as a prop.
+  const [chatSession, setChatSession] = createSignal<ChatSessionPayload | null>(null);
+
+  const refreshAiStatus = async (): Promise<void> => {
+    const status = await window.pen.ai.getStatus();
+    setAiStatus(status);
+  };
+
+  const isProviderConfigured = (id: ProviderId): boolean =>
+    aiStatus().find((s) => s.provider === id)?.configured ?? false;
+
+  // ── Local (Ollama) AI state ─────────────────────────────────────
+  const [ollamaStatus, setOllamaStatus] = createSignal<OllamaServiceStatus | null>(null);
+  const [localModels, setLocalModels] = createSignal<LocalModelInfo[]>([]);
+  // Per-tag pull progress, keyed by model tag. Present = pull in flight.
+  const [pulls, setPulls] = createSignal<Record<string, OllamaPullProgress>>({});
+
+  const refreshLocal = async (): Promise<void> => {
+    const st = await window.pen.ollama.status();
+    setOllamaStatus(st);
+    setLocalModels(st.running ? await window.pen.ollama.listModels() : []);
+  };
+
+  // ── Learning (RAG) state ────────────────────────────────────────
+  const [ragStats, setRagStats] = createSignal<Record<ProfileId, number>>({
+    general: 0,
+    teacher: 0,
+    trader: 0,
+  });
+  const refreshRag = async (): Promise<void> => {
+    setRagStats(await window.pen.rag.stats());
+  };
+  const resetLearning = async (profile: ProfileId): Promise<void> => {
+    await window.pen.rag.resetProfile(profile);
+    await refreshRag();
+  };
+
+  // ── First-run setup wizard ──────────────────────────────────────
+  const defaultModels = (): LocalModelInfo[] => localModels().filter((m) => m.defaultPull);
+  const defaultModelsTotalGB = (): string =>
+    (defaultModels().reduce((sum, m) => sum + m.approxBytes, 0) / 1e9).toFixed(1);
+  const defaultModelsReady = (): boolean => {
+    const d = defaultModels();
+    return d.length > 0 && d.every((m) => m.installed);
+  };
+  type WizardStep = 'checking' | 'install' | 'start' | 'download' | 'ready';
+  // Earliest unmet prerequisite wins: status probe, install, service, models.
+  const wizardStep = (): WizardStep => {
+    const status = ollamaStatus();
+    if (!status) return 'checking';
+    const blocked = !status.installed ? 'install' : !status.running ? 'start' : null;
+    return blocked ?? (defaultModelsReady() ? 'ready' : 'download');
+  };
+  const downloadRecommended = async (): Promise<void> => {
+    for (const m of defaultModels()) {
+      if (!m.installed && !pulls()[m.tag]) await pullModel(m.tag);
+    }
+  };
+  const finishOnboarding = (): void =>
+    void window.pen.hub.update({
+      aiLocalEnabled: true,
+      aiOnboarded: true,
+      settingsOpen: false,
+    });
+  const skipOnboarding = (): void => void window.pen.hub.update({ aiOnboarded: true });
+
+  const startOllama = async (): Promise<void> => {
+    setOllamaStatus(await window.pen.ollama.start());
+    await refreshLocal();
+  };
+
+  const pullModel = async (tag: string): Promise<void> => {
+    setPulls((p) => ({ ...p, [tag]: { model: tag, status: 'starting' } }));
+    try {
+      await window.pen.ollama.pull(tag);
+    } finally {
+      // Runs on rejection too, so a failed pull never stays marked "in flight".
+      setPulls(({ [tag]: _finished, ...rest }) => rest);
+    }
+    await refreshLocal();
+  };
+
+  const cancelPull = (tag: string): void => {
+    void window.pen.ollama.cancelPull(tag);
+  };
+
+  const deleteModel = async (tag: string): Promise<void> => {
+    await window.pen.ollama.deleteModel(tag);
+    await refreshLocal();
+  };
+
+  const pullPct = (p: OllamaPullProgress): number | null => {
+    if (!p.total || !p.completed) return null;
+    return Math.min(100, Math.round((p.completed / p.total) * 100));
+  };
+
+  const toggleLocalEnabled = (): void => {
+    if (!hub().aiLocalEnabled && !ollamaStatus()?.running) void startOllama(); // enabling only
+    void window.pen.hub.update({ aiLocalEnabled: !hub().aiLocalEnabled });
+  };
+
+  const toggleAutocorrectTyped = (): void =>
+    void window.pen.hub.update({ autocorrectTyped: !hub().autocorrectTyped });
+  const toggleAutocorrectDrawn = (): void =>
+    void window.pen.hub.update({ autocorrectDrawn: !hub().autocorrectDrawn });
+  const setDefaultFont = (value: string): void =>
+    void window.pen.hub.update({ defaultTextFont: value });
+
+  // Per-profile model pickers (only installed models of each kind).
+  const installedOfKind = (kind: 'text' | 'vision'): LocalModelInfo[] =>
+    localModels().filter((m) => m.kind === kind && m.installed);
+  const setProfileModel = (profile: ProfileId, kind: 'text' | 'vision', tag: string): void =>
+    void window.pen.hub.update({ aiProfileModels: { [profile]: { [kind]: tag } } });
+
+  // Whenever the selected provider changes, snap the model dropdown
+  // to that provider's default (unless it's already a valid model
+  // for the provider — e.g. when the hub broadcasts an existing pair).
+  createEffect(() => {
+    const p = aiSelectedProvider();
+    const valid = MODELS_BY_PROVIDER[p].some((m) => m.id === aiSelectedModel());
+    if (!valid) setAiSelectedModel(DEFAULT_MODEL[p]);
+  });
+
+  // Sync the selected dropdowns to the persisted active provider
+  // once the hub state arrives.
+  createEffect(() => {
+    const ap = hub().aiActiveProvider;
+    const am = hub().aiActiveModel;
+    // The cloud dropdown only tracks cloud providers; local has its
+    // own section, so ignore an 'ollama' active provider here.
+    if (ap && ap !== 'ollama') setAiSelectedProvider(ap);
+    if (am) setAiSelectedModel(am);
+  });
+
   onMount(() => {
     void window.pen.hub.get().then((state) => {
       const s = state as HubSnapshot;
       setHub(s);
       if (s.settingsOpen) refreshSide();
+      // First launch → open Settings so the setup wizard is visible.
+      if (!s.aiOnboarded) void window.pen.hub.update({ settingsOpen: true });
     });
     void window.pen.win.platform().then(setPlatform);
     void window.pen.app.info().then(setAppInfo);
+    void window.pen.updater.get().then(setUpdateStatus);
+    const offUpdater = window.pen.updater.onStatus(setUpdateStatus);
+    onCleanup(offUpdater);
+    void refreshAiStatus();
+    void refreshLocal();
+    void refreshRag();
+    // Live pull progress for the local model installer.
+    const offPull = window.pen.ollama.onPullProgress((p) => {
+      setPulls((prev) => {
+        if (p.done) {
+          const next = { ...prev };
+          delete next[p.model];
+          return next;
+        }
+        return { ...prev, [p.model]: p };
+      });
+    });
+    onCleanup(offPull);
+    // Capture chat sessions for the ChatPanel. Subscribing here (always
+    // mounted) instead of inside the panel is what fixes the "first Ask
+    // AI does nothing" bug — see chatSession's declaration.
+    const offChat = window.pen.chat.onSession(setChatSession);
+    onCleanup(offChat);
     const off = window.pen.hub.onBroadcast((state) => {
       const s = state as HubSnapshot;
       setHub(s);
@@ -329,6 +625,7 @@ export function ToolbarApp() {
     void s.minimized;
     void s.settingsOpen;
     void s.statusPanelOpen;
+    void s.chatOpen;
     void s.thicknessFlyoutOpen;
     void s.profile;
     void s.activeTool;
@@ -455,6 +752,36 @@ export function ToolbarApp() {
   };
   const openScreenPrefs = () => void window.pen.permissions.open('screen');
   const relaunchApp = () => void window.pen.app.relaunch();
+
+  // ── Auto-update actions ─────────────────────────────────────────
+  const checkForUpdates = (): void => void window.pen.updater.check();
+  const installUpdate = (): void => void window.pen.updater.install();
+  const openReleases = (): void => void window.pen.updater.openReleases();
+  const toggleAutoUpdate = (): void =>
+    void window.pen.hub.update({ autoUpdate: !hub().autoUpdate });
+  // One-line, human-readable summary of the current update state.
+  const updateLine = (): string => {
+    const u = updateStatus();
+    if (!u) return '';
+    switch (u.state) {
+      case 'checking':
+        return 'Checking for updates…';
+      case 'available':
+        return `Update available: v${u.version}`;
+      case 'downloading':
+        return `Downloading v${u.version ?? ''}… ${u.percent ?? 0}%`;
+      case 'downloaded':
+        return `v${u.version} ready — restart to update`;
+      case 'none':
+        return "You're on the latest version";
+      case 'unsupported':
+        return 'Automatic updates unavailable on this build';
+      case 'error':
+        return `Update check failed${u.message ? `: ${u.message}` : ''}`;
+      default:
+        return '';
+    }
+  };
   const pickFolderFromError = async () => {
     const dir = (await window.pen.settings.pickSaveDir()) as string | null;
     if (dir) {
@@ -470,11 +797,93 @@ export function ToolbarApp() {
     if (panelKind() === 'permission') void recheckPermission();
   };
 
+  // ── AI action handlers ─────────────────────────────────────────
+  const saveAiKey = async (): Promise<void> => {
+    const key = aiKeyInput().trim();
+    if (key.length === 0) return;
+    // Snapshot the selection up front: the dropdowns can change while the
+    // awaits below are pending, and the hub must get the pair this key is for.
+    const provider = aiSelectedProvider();
+    const model = aiSelectedModel();
+    setAiBusy('saving');
+    try {
+      await window.pen.ai.setKey(provider, key);
+      await refreshAiStatus();
+      setAiKeyInput('');
+      // Make the just-configured pair active so the Ask AI button knows what to use.
+      void window.pen.hub.update({ aiActiveProvider: provider, aiActiveModel: model });
+      setAiTestResult({ ok: true, message: 'Key saved' });
+    } finally {
+      setAiBusy(null);
+    }
+  };
+  const deleteAiKey = async (): Promise<void> => {
+    // Snapshot first: the provider dropdown can change during the awaits,
+    // and the hub check below must refer to the key actually deleted.
+    const provider = aiSelectedProvider();
+    await window.pen.ai.deleteKey(provider);
+    await refreshAiStatus();
+    setAiTestResult(null);
+    // The active provider just lost its key: clear it from the hub so the
+    // Ask AI button hides.
+    if (hub().aiActiveProvider === provider) {
+      void window.pen.hub.update({ aiActiveProvider: null, aiActiveModel: null });
+    }
+  };
+  const testAiConnection = async (): Promise<void> => {
+    setAiBusy('testing');
+    setAiTestResult(null);
+    try {
+      const result = await window.pen.ai.testConnection(
+        aiSelectedProvider(),
+        aiSelectedModel(),
+      );
+      setAiTestResult(result);
+    } finally {
+      setAiBusy(null);
+    }
+  };
+  const setProfilePrompt = (profile: ProfileId, text: string): void => {
+    void window.pen.hub.update({
+      aiProfilePrompts: { [profile]: text },
+    });
+  };
+  const resetProfilePrompt = (profile: ProfileId): void => {
+    // Empty-string override is treated as "no override" by hub.patch,
+    // so the default from PROFILES kicks back in.
+    void window.pen.hub.update({
+      aiProfilePrompts: { [profile]: '' },
+    });
+  };
+  // Active model picker: whenever the user changes the model dropdown
+  // for the ALREADY-CONFIGURED active provider, persist that choice.
+  const onModelChange = (model: string): void => {
+    setAiSelectedModel(model);
+    if (
+      hub().aiActiveProvider === aiSelectedProvider() &&
+      model !== hub().aiActiveModel
+    ) {
+      void window.pen.hub.update({ aiActiveModel: model });
+    }
+  };
+  const closeChat = (): void => {
+    void window.pen.hub.update({ chatOpen: false });
+  };
+
   // Mirror the side-panel state into a CSS-friendly attribute so the
   // existing layout rules (flex-direction switch in v-mode, etc.)
   // apply uniformly whether settings or a status panel is open.
   const sidePanelOpen = createMemo(() =>
-    hub().settingsOpen || panelKind() !== null,
+    hub().settingsOpen || panelKind() !== null || hub().chatOpen,
+  );
+
+  // Any AI path usable: a cloud provider configured, OR Local AI on with
+  // at least one model installed. Gates every AI entry point so nothing
+  // AI-driven is offered until the user has configured something.
+  const aiReady = createMemo(
+    () =>
+      hub().aiActiveProvider != null ||
+      (hub().aiLocalEnabled && hub().aiInstalledModels.length > 0),
   );
 
   const showHint = (text: string) => setHint(text);
@@ -665,6 +1074,16 @@ export function ToolbarApp() {
                 onMouseEnter={() => showHint('Screenshot · ⌘⇧S')}
                 onMouseLeave={clearHint}
               >{Icons.camera()}</button>
+              <Show when={hub().profile === 'trader' && aiReady()}>
+                <button
+                  class="action-btn"
+                  onClick={() => window.pen.relay.analyze()}
+                  onMouseEnter={() => showHint('Analyze drawn levels with AI')}
+                  onMouseLeave={clearHint}
+                  title="Analyze chart (AI)"
+                  aria-label="Analyze chart"
+                >{Icons.fib()}</button>
+              </Show>
               <button
                 class={`action-btn ${hub().whiteboard !== 'off' ? 'tinted' : ''}`}
                 onClick={cycleBoard}
@@ -859,6 +1278,94 @@ export function ToolbarApp() {
               >{Icons.close()}</button>
             </div>
 
+            {/* ── First-run setup wizard ── */}
+            <Show when={!hub().aiOnboarded}>
+              <div class="settings-section ai-section">
+                <div class="settings-section-label">Set up local AI</div>
+                <Switch>
+                  <Match when={wizardStep() === 'checking'}>
+                    <div class="ai-disclosure">Checking for Ollama…</div>
+                  </Match>
+                  <Match when={wizardStep() === 'install'}>
+                    <div class="ai-disclosure">
+                      Lekhini runs AI privately on your device using Ollama. Install
+                      it once, then come back and re-check.
+                    </div>
+                    <div class="settings-row">
+                      <button
+                        class="settings-toggle"
+                        onClick={() => void window.pen.ollama.installHelp()}
+                      >
+                        Install Ollama
+                      </button>
+                      <button class="settings-toggle" onClick={() => void refreshLocal()}>
+                        Re-check
+                      </button>
+                    </div>
+                  </Match>
+                  <Match when={wizardStep() === 'start'}>
+                    <div class="ai-disclosure">Ollama is installed but not running.</div>
+                    <button class="settings-toggle" onClick={() => void startOllama()}>
+                      Start service
+                    </button>
+                  </Match>
+                  <Match when={wizardStep() === 'download'}>
+                    <div class="ai-disclosure">
+                      Download the recommended models (~{defaultModelsTotalGB()} GB
+                      total). One-time — it runs in the background.
+                    </div>
+                    <For each={defaultModels()}>
+                      {(m) => (
+                        <div class="settings-row">
+                          <span class="settings-row-label">
+                            {m.label} · {(m.approxBytes / 1e9).toFixed(1)} GB
+                          </span>
+                          <Show
+                            when={pulls()[m.tag]}
+                            fallback={
+                              <span class="ai-badge-configured">
+                                {m.installed ? '● Installed' : '—'}
+                              </span>
+                            }
+                          >
+                            {(p) => (
+                              <span class="ai-prompt-row-label">
+                                {pullPct(p()) != null
+                                  ? `${pullPct(p())}%`
+                                  : p().status || 'pulling…'}
+                              </span>
+                            )}
+                          </Show>
+                        </div>
+                      )}
+                    </For>
+                    <button
+                      class="settings-toggle status-btn-primary"
+                      onClick={() => void downloadRecommended()}
+                    >
+                      Download recommended
+                    </button>
+                  </Match>
+                  <Match when={wizardStep() === 'ready'}>
+                    <div class="ai-disclosure">✓ You're ready — local AI is set up.</div>
+                    <button class="settings-toggle status-btn-primary" onClick={finishOnboarding}>
+                      Finish
+                    </button>
+                  </Match>
+                </Switch>
+                <a
+                  class="ai-key-link"
+                  href="#"
+                  onClick={(e) => {
+                    e.preventDefault();
+                    skipOnboarding();
+                  }}
+                >
+                  Skip for now
+                </a>
+              </div>
+            </Show>
+
             <div class="settings-section">
               <div class="settings-section-label">Profile</div>
               <div class="profile-list">
@@ -904,6 +1411,365 @@ export function ToolbarApp() {
               </div>
             </div>
 
+            <div class="settings-section ai-section">
+              <div class="settings-section-label">AI</div>
+
+              {/* ── Local-first AI (Ollama) ── */}
+              <div class="settings-row">
+                <span class="settings-row-label">Local AI (Ollama)</span>
+                <button
+                  class={`settings-toggle ${hub().aiLocalEnabled ? 'on' : ''}`}
+                  onClick={toggleLocalEnabled}
+                >
+                  <span>{hub().aiLocalEnabled ? 'On' : 'Off'}</span>
+                </button>
+              </div>
+              <Show when={hub().aiLocalEnabled}>
+                <div class="settings-row settings-row-stack">
+                  <span class="settings-row-label">
+                    Service
+                    <Show when={ollamaStatus()?.running}>
+                      <span class="ai-badge-configured">
+                        ● Running{ollamaStatus()?.version ? ` ${ollamaStatus()!.version}` : ''}
+                      </span>
+                    </Show>
+                  </span>
+                  <Show when={ollamaStatus() && !ollamaStatus()!.installed}>
+                    <div class="ai-test-result fail">
+                      Ollama isn't installed.
+                      <a
+                        class="ai-key-link"
+                        href="#"
+                        onClick={(e) => {
+                          e.preventDefault();
+                          void window.pen.ollama.installHelp();
+                        }}
+                      >
+                        {' '}
+                        Install Ollama →
+                      </a>
+                    </div>
+                  </Show>
+                  <Show when={ollamaStatus()?.installed && !ollamaStatus()?.running}>
+                    <button class="settings-toggle" onClick={() => void startOllama()}>
+                      Start service
+                    </button>
+                  </Show>
+                </div>
+
+                <Show when={ollamaStatus()?.running}>
+                  <div class="settings-row settings-row-stack">
+                    <span class="settings-row-label">Models per profile</span>
+                    <For each={PROFILE_ORDER}>
+                      {(pid) => (
+                        <div class="ai-prompt-row">
+                          <div class="ai-prompt-row-head">
+                            <span class="ai-prompt-row-label">{PROFILES[pid].label}</span>
+                          </div>
+                          <select
+                            class="settings-toggle settings-toggle-wide ai-select"
+                            value={hub().aiProfileModels[pid]?.text ?? ''}
+                            onChange={(e) =>
+                              setProfileModel(
+                                pid,
+                                'text',
+                                (e.currentTarget as HTMLSelectElement).value,
+                              )
+                            }
+                          >
+                            <option value="">Text: Auto (recommended)</option>
+                            <For each={installedOfKind('text')}>
+                              {(m) => <option value={m.tag}>Text: {m.label}</option>}
+                            </For>
+                          </select>
+                          <select
+                            class="settings-toggle settings-toggle-wide ai-select"
+                            value={hub().aiProfileModels[pid]?.vision ?? ''}
+                            onChange={(e) =>
+                              setProfileModel(
+                                pid,
+                                'vision',
+                                (e.currentTarget as HTMLSelectElement).value,
+                              )
+                            }
+                          >
+                            <option value="">Vision: Auto (recommended)</option>
+                            <For each={installedOfKind('vision')}>
+                              {(m) => <option value={m.tag}>Vision: {m.label}</option>}
+                            </For>
+                          </select>
+                        </div>
+                      )}
+                    </For>
+                  </div>
+                  <div class="settings-row settings-row-stack">
+                    <span class="settings-row-label">Models</span>
+                    <For each={localModels()}>
+                      {(m) => (
+                        <div class="ai-prompt-row">
+                          <div class="ai-prompt-row-head">
+                            <span class="ai-prompt-row-label">
+                              {m.label} · {(m.approxBytes / 1e9).toFixed(1)} GB
+                            </span>
+                            <Show
+                              when={pulls()[m.tag]}
+                              fallback={
+                                <Show
+                                  when={m.installed}
+                                  fallback={
+                                    <button
+                                      class="ai-prompt-reset"
+                                      onClick={() => void pullModel(m.tag)}
+                                    >
+                                      Install
+                                    </button>
+                                  }
+                                >
+                                  <button
+                                    class="ai-prompt-reset"
+                                    onClick={() => void deleteModel(m.tag)}
+                                    title="Remove this model"
+                                  >
+                                    Remove
+                                  </button>
+                                </Show>
+                              }
+                            >
+                              {(p) => (
+                                <span class="ai-prompt-row-label">
+                                  {pullPct(p()) != null
+                                    ? `${pullPct(p())}%`
+                                    : p().status || 'pulling…'}
+                                  <button
+                                    class="ai-prompt-reset"
+                                    onClick={() => cancelPull(m.tag)}
+                                  >
+                                    Cancel
+                                  </button>
+                                </span>
+                              )}
+                            </Show>
+                          </div>
+                        </div>
+                      )}
+                    </For>
+                  </div>
+                </Show>
+              </Show>
+
+              {/* ── Autocorrect + default font ── */}
+              <div class="settings-row">
+                <span class="settings-row-label">Autocorrect typed text</span>
+                <button
+                  class={`settings-toggle ${hub().autocorrectTyped ? 'on' : ''}`}
+                  onClick={toggleAutocorrectTyped}
+                >
+                  <span>{hub().autocorrectTyped ? 'On' : 'Off'}</span>
+                </button>
+              </div>
+              <div class="settings-row">
+                <span class="settings-row-label">Autocorrect drawn text</span>
+                <button
+                  class={`settings-toggle ${hub().autocorrectDrawn ? 'on' : ''}`}
+                  onClick={toggleAutocorrectDrawn}
+                >
+                  <span>{hub().autocorrectDrawn ? 'On' : 'Off'}</span>
+                </button>
+              </div>
+              <div class="settings-row settings-row-stack">
+                <span class="settings-row-label">Default text font</span>
+                <select
+                  class="settings-toggle settings-toggle-wide ai-select"
+                  value={hub().defaultTextFont}
+                  onChange={(e) =>
+                    setDefaultFont((e.currentTarget as HTMLSelectElement).value)
+                  }
+                >
+                  <For each={TEXT_FONTS}>
+                    {(f) => <option value={f.value}>{f.label}</option>}
+                  </For>
+                </select>
+              </div>
+
+              {/* ── Cloud provider (optional fallback) ── */}
+              <div class="settings-section-label">Cloud fallback</div>
+              <div class="settings-row settings-row-stack">
+                <span class="settings-row-label">Provider</span>
+                <select
+                  class="settings-toggle settings-toggle-wide ai-select"
+                  value={aiSelectedProvider()}
+                  onChange={(e) =>
+                    setAiSelectedProvider(
+                      (e.currentTarget as HTMLSelectElement).value as CloudProviderId,
+                    )
+                  }
+                >
+                  <For each={Object.keys(PROVIDER_LABELS) as CloudProviderId[]}>
+                    {(p) => (
+                      <option value={p}>
+                        {PROVIDER_LABELS[p]}
+                        {isProviderConfigured(p) ? ' · configured' : ''}
+                      </option>
+                    )}
+                  </For>
+                </select>
+              </div>
+              <div class="settings-row settings-row-stack">
+                <span class="settings-row-label">Model</span>
+                <select
+                  class="settings-toggle settings-toggle-wide ai-select"
+                  value={aiSelectedModel()}
+                  onChange={(e) =>
+                    onModelChange((e.currentTarget as HTMLSelectElement).value)
+                  }
+                >
+                  <For each={MODELS_BY_PROVIDER[aiSelectedProvider()]}>
+                    {(m) => <option value={m.id}>{m.label}</option>}
+                  </For>
+                </select>
+              </div>
+              <div class="settings-row settings-row-stack">
+                <span class="settings-row-label">
+                  API key
+                  <Show when={isProviderConfigured(aiSelectedProvider())}>
+                    <span class="ai-badge-configured">● Configured</span>
+                  </Show>
+                </span>
+                <input
+                  class="ai-key-input"
+                  type="password"
+                  autocomplete="off"
+                  spellcheck={false}
+                  placeholder={
+                    isProviderConfigured(aiSelectedProvider())
+                      ? 'Replace key…'
+                      : 'Paste API key'
+                  }
+                  value={aiKeyInput()}
+                  onInput={(e) =>
+                    setAiKeyInput((e.currentTarget as HTMLInputElement).value)
+                  }
+                />
+                <div class="ai-key-actions">
+                  <button
+                    class="settings-toggle"
+                    onClick={() => void saveAiKey()}
+                    disabled={aiKeyInput().trim().length === 0 || aiBusy() !== null}
+                  >
+                    {aiBusy() === 'saving' ? 'Saving…' : 'Save'}
+                  </button>
+                  <button
+                    class="settings-toggle"
+                    onClick={() => void testAiConnection()}
+                    disabled={
+                      !isProviderConfigured(aiSelectedProvider()) || aiBusy() !== null
+                    }
+                  >
+                    {aiBusy() === 'testing' ? 'Testing…' : 'Test'}
+                  </button>
+                  <Show when={isProviderConfigured(aiSelectedProvider())}>
+                    <button
+                      class="settings-toggle ai-key-delete"
+                      onClick={() => void deleteAiKey()}
+                      title="Remove the saved key for this provider"
+                    >
+                      Delete
+                    </button>
+                  </Show>
+                </div>
+                <Show when={aiTestResult()}>
+                  {(r) => (
+                    <div
+                      class={`ai-test-result ${r().ok ? 'ok' : 'fail'}`}
+                    >
+                      {r().ok
+                        ? `✓ ${r().message ?? 'OK'}${
+                            r().latencyMs ? ` · ${r().latencyMs}ms` : ''
+                          }`
+                        : `✗ ${r().message ?? 'Failed'}`}
+                    </div>
+                  )}
+                </Show>
+                <a
+                  class="ai-key-link"
+                  href={PROVIDER_KEY_URLS[aiSelectedProvider()]}
+                  onClick={(e) => {
+                    e.preventDefault();
+                    void window.pen.shell.openPath(PROVIDER_KEY_URLS[aiSelectedProvider()]);
+                  }}
+                >
+                  Get a key →
+                </a>
+              </div>
+              <div class="settings-row settings-row-stack">
+                <span class="settings-row-label">Profile prompts</span>
+                <For each={PROFILE_ORDER}>
+                  {(pid) => (
+                    <div class="ai-prompt-row">
+                      <div class="ai-prompt-row-head">
+                        <span class="ai-prompt-row-label">{PROFILES[pid].label}</span>
+                        <Show when={hub().aiProfilePrompts[pid]}>
+                          <button
+                            class="ai-prompt-reset"
+                            onClick={() => resetProfilePrompt(pid)}
+                            title="Restore the built-in prompt"
+                          >
+                            Reset
+                          </button>
+                        </Show>
+                      </div>
+                      <textarea
+                        class="ai-prompt-textarea"
+                        rows={3}
+                        value={resolveAiPrompt(pid, hub().aiProfilePrompts)}
+                        onChange={(e) =>
+                          setProfilePrompt(
+                            pid,
+                            (e.currentTarget as HTMLTextAreaElement).value,
+                          )
+                        }
+                      />
+                    </div>
+                  )}
+                </For>
+              </div>
+              <div class="ai-disclosure">
+                With Local AI on, text and images stay on your device — nothing
+                is sent to a server. The cloud fallback (above) is only used when
+                Local AI is off or no local model is installed; in that case your
+                content goes directly to the selected provider under its own
+                data-handling policy. Lekhini does not log or proxy it.
+              </div>
+
+              {/* ── Learning (on-device RAG) ── */}
+              <div class="settings-section-label">Learning</div>
+              <For each={PROFILE_ORDER}>
+                {(pid) => (
+                  <div class="settings-row">
+                    <span class="settings-row-label">
+                      {PROFILES[pid].label}
+                      <span class="ai-badge-configured">
+                        {ragStats()[pid] ?? 0} examples
+                      </span>
+                    </span>
+                    <button
+                      class="settings-toggle"
+                      onClick={() => void resetLearning(pid)}
+                      disabled={(ragStats()[pid] ?? 0) === 0}
+                      title="Forget everything learned for this profile"
+                    >
+                      Reset
+                    </button>
+                  </div>
+                )}
+              </For>
+              <div class="ai-disclosure">
+                Autocorrect learns from the corrections you accept and from
+                bundled starter examples, stored only on this device. Requires
+                the local embedding model (nomic-embed-text).
+              </div>
+            </div>
+
             <div class="settings-section">
               <div class="settings-section-label">File save</div>
               <div class="settings-row">
@@ -929,6 +1795,72 @@ export function ToolbarApp() {
               </div>
             </div>
 
+            <div class="settings-section">
+              <div class="settings-section-label">Updates</div>
+              <div class="settings-row">
+                <span class="settings-row-label">Automatic updates</span>
+                <button
+                  class={`settings-toggle ${hub().autoUpdate ? 'on' : ''}`}
+                  onClick={toggleAutoUpdate}
+                >
+                  <span>{hub().autoUpdate ? 'On' : 'Off'}</span>
+                </button>
+              </div>
+              <div class="settings-row settings-row-stack">
+                <span class="settings-row-label">
+                  Version
+                  <span class="ai-badge-configured">v{appInfo().version}</span>
+                </span>
+                <Show when={updateLine()}>
+                  <div
+                    class={`ai-test-result ${
+                      updateStatus()?.state === 'error' ? 'fail' : 'ok'
+                    }`}
+                  >
+                    {updateLine()}
+                  </div>
+                </Show>
+                <div class="ai-key-actions">
+                  <button
+                    class="settings-toggle"
+                    onClick={checkForUpdates}
+                    disabled={
+                      updateStatus()?.state === 'checking' ||
+                      updateStatus()?.state === 'downloading'
+                    }
+                  >
+                    {updateStatus()?.state === 'checking' ? 'Checking…' : 'Check for updates'}
+                  </button>
+                  <Show
+                    when={
+                      updateStatus()?.state === 'downloaded' ||
+                      updateStatus()?.state === 'available'
+                    }
+                  >
+                    <button class="settings-toggle status-btn-primary" onClick={installUpdate}>
+                      {updateStatus()?.state === 'downloaded'
+                        ? 'Restart to update'
+                        : 'Download & install'}
+                    </button>
+                  </Show>
+                </div>
+                {/* Manual fallback when auto-update can't apply (dev run,
+                    or unsigned macOS where Squirrel refuses updates). */}
+                <Show when={updateStatus()?.state === 'unsupported'}>
+                  <a
+                    class="ai-key-link"
+                    href="#"
+                    onClick={(e) => {
+                      e.preventDefault();
+                      openReleases();
+                    }}
+                  >
+                    Download the latest from GitHub →
+                  </a>
+                </Show>
+              </div>
+            </div>
+
             <div class="settings-section">
               <div class="settings-section-label">About</div>
               <div class="about-card">
@@ -949,6 +1881,23 @@ export function ToolbarApp() {
           </div>
         </Show>
 
+        {/* ─── CHAT PANEL (AI integration) ──────────────────────────
+             Shares the dock slot with Settings + Status. Mutual
+             exclusion is enforced in hub.patch — opening this closes
+             the others. Settings still has render priority though,
+             so a user mid-chat who opens Settings sees Settings and
+             the chat is hidden until they close it. */}
+        <Show when={hub().chatOpen && !hub().settingsOpen && panelKind() === null}>
+          <ChatPanel
+            provider={hub().aiActiveProvider}
+            model={hub().aiActiveModel}
+            aiReady={aiReady()}
+            session={chatSession()}
+            promptOverrides={hub().aiProfilePrompts}
+            onClose={closeChat}
+          />
+        </Show>
+
         {/* ─── STATUS PANEL (permission / save error) ──────────────
              Reuses the .settings-panel layout slot so it docks like
              the Settings panel and grows the toolbar window the same
diff --git a/src/renderer/toolbar/ChatPanel.tsx b/src/renderer/toolbar/ChatPanel.tsx
new file mode 100644
index 0000000..3305f70
--- /dev/null
+++ b/src/renderer/toolbar/ChatPanel.tsx
@@ -0,0 +1,447 @@
+import {
+  createEffect,
+  createMemo,
+  createSignal,
+  For,
+  onCleanup,
+  onMount,
+  Show,
+  untrack,
+} from 'solid-js';
+import { marked } from 'marked';
+import { PROFILES, resolveAiPrompt } from '../../shared/profiles';
+import type {
+  ChatSessionPayload,
+  ChatTurn,
+  ProfileId,
+  ProviderId,
+} from '../../shared/types';
+import { Icons } from './icons';
+
+interface Props {
+  // Comes from hub.aiActiveProvider / aiActiveModel — the cloud
+  // fallback pair, null when no cloud provider is configured. Main's
+  // resolver may override this with a local model, so these are just a
+  // hint; routing is authoritative server-side.
+  provider: ProviderId | null;
+  model: string | null;
+  // True when ANY AI path is usable (local model installed OR a cloud
+  // provider configured). Drives the empty-state instead of provider.
+  aiReady: boolean;
+  // The active chat session, lifted to ToolbarApp (which is always
+  // mounted) so the very first snip isn't dropped. See the createEffect
+  // below for why this can't live as a subscription inside this panel.
+  session: ChatSessionPayload | null;
+  promptOverrides: Partial<Record<ProfileId, string>>;
+  onClose: () => void;
+}
+
+interface DisplayTurn extends ChatTurn {
+  // Streaming responses arrive in chunks; we mark the open assistant
+  // turn so we know which one to append to. Cleared when the stream
+  // ends: 'done' or an error for the matching requestId, or a cancel.
+  pending?: boolean;
+  // Error string when the request failed mid-stream.
+  error?: string;
+}
+
+// The slice of a marked token that neutraliseToken reads or rewrites.
+interface MarkdownToken {
+  type: string;
+  text?: string;
+  href?: string;
+}
+
+// Configure marked once. marked does NOT sanitise its output: raw HTML
+// in the source is passed through verbatim and link targets are not
+// vetted. Model output is untrusted and ends up in innerHTML, so
+// renderMarkdown() defuses both on the token stream before rendering.
+marked.setOptions({ breaks: true, gfm: true });
+
+// URL schemes allowed to survive in rendered links and images.
+const SAFE_URL = /^(?:https?:|mailto:)/i;
+
+export function ChatPanel(props: Props) {
+  const [session, setSession] = createSignal<ChatSessionPayload | null>(null);
+  const [turns, setTurns] = createSignal<DisplayTurn[]>([]);
+  const [composer, setComposer] = createSignal('');
+  // requestId of the stream feeding the open assistant turn. Null until
+  // ai.ask() has returned an id, and again once the stream has ended.
+  const [activeRequest, setActiveRequest] = createSignal<string | null>(null);
+  // True from the moment a turn is dispatched until it finishes, fails
+  // or is cancelled. Unlike activeRequest this also covers the gap
+  // before ai.ask() resolves, so a second Send can't interleave a turn.
+  const [busy, setBusy] = createSignal(false);
+  // Bumped whenever the in-flight turn is abandoned (cancel, new
+  // session, unmount). runTurn captures it before awaiting ai.ask() and
+  // re-checks afterwards to detect that it has been superseded.
+  let turnToken = 0;
+  let scrollEl: HTMLDivElement | undefined;
+  let composerEl: HTMLTextAreaElement | undefined;
+
+  const focusComposer = (): void => composerEl?.focus();
+
+  // Applies `patch` to the trailing assistant turn. No-op when the list
+  // is empty or the last turn belongs to the user.
+  const patchLastAssistant = (patch: (turn: DisplayTurn) => DisplayTurn): void => {
+    setTurns((prev) => {
+      const last = prev[prev.length - 1];
+      if (!last || last.role !== 'assistant') return prev;
+      return [...prev.slice(0, -1), patch(last)];
+    });
+  };
+
+  // Abandons the in-flight turn, if any: orphans an ai.ask() that is
+  // still awaiting its requestId and asks main to stop an active stream.
+  const abortTurn = (): void => {
+    turnToken += 1;
+    const id = activeRequest();
+    if (id) void window.pen.ai.cancel(id);
+    setActiveRequest(null);
+    setBusy(false);
+  };
+
+  // Runs one turn: records the user message, opens a pending assistant
+  // turn and asks main to start streaming into it. On the FIRST user
+  // turn (no prior user history) we attach the image. Subsequent turns
+  // are text-only — each provider adapter follows the same convention.
+  const runTurn = async (
+    userMessage: string,
+    forSession?: ChatSessionPayload,
+  ): Promise<void> => {
+    const s = forSession ?? session();
+    if (!s) return;
+    if (!props.aiReady) {
+      setTurns((prev) => [
+        ...prev,
+        {
+          role: 'assistant',
+          content: '',
+          error:
+            'No AI available. Enable Local AI and install a model, or add a cloud provider key in Settings → AI.',
+        },
+      ]);
+      return;
+    }
+    // Snapshot the conversation BEFORE adding this turn — that's the
+    // history we replay. Building it after the pushes would duplicate
+    // the current message (also sent separately as userMessage).
+    // Failed turns are skipped, and so are assistant turns cancelled
+    // before any text arrived: an empty assistant message carries no
+    // context to replay.
+    const history: ChatTurn[] = turns()
+      .filter((t) => !t.pending && !t.error)
+      .filter((t) => t.role === 'user' || t.content.length > 0)
+      .map((t) => ({ role: t.role, content: t.content }));
+    // First turn = no prior user turn. The image attaches here; main
+    // caches it and re-injects it on follow-ups so context is retained.
+    const isFirstTurn = !history.some((h) => h.role === 'user');
+
+    turnToken += 1;
+    const token = turnToken;
+    setBusy(true);
+    // Record the user turn — INCLUDING the auto-fired opening turn whose
+    // text is empty (the image carries the request). Storing it keeps the
+    // original ask in the replayed history so follow-ups don't go amnesiac.
+    // The open assistant turn after it is what the streamed chunks fill.
+    setTurns((prev) => [
+      ...prev,
+      { role: 'user', content: userMessage },
+      { role: 'assistant', content: '', pending: true },
+    ]);
+
+    const systemPrompt = resolveAiPrompt(s.profile, props.promptOverrides);
+    const image =
+      isFirstTurn && s.png
+        ? { mime: s.mime ?? 'image/png', base64: uint8ToBase64(s.png) }
+        : undefined;
+
+    try {
+      const { requestId } = await window.pen.ai.ask({
+        // Hints only — main's resolver picks local-vs-cloud and the
+        // concrete model. Default to local when no cloud pair is set.
+        provider: props.provider ?? 'ollama',
+        model: props.model ?? '',
+        systemPrompt,
+        image,
+        history,
+        userMessage,
+        profile: s.profile,
+        // Scopes the conversation so main caches the snip (and Sarvam its
+        // OCR) per chat, until a new snip starts a fresh session.
+        sessionId: s.sessionId,
+      });
+      if (token !== turnToken) {
+        // Cancelled or superseded while ai.ask() was in flight. Nobody
+        // is listening for this stream any more, so stop it in main.
+        void window.pen.ai.cancel(requestId);
+        return;
+      }
+      setActiveRequest(requestId);
+    } catch (err) {
+      if (token !== turnToken) return;
+      const msg = (err as Error)?.message ?? String(err);
+      patchLastAssistant((turn) => ({ ...turn, error: msg, pending: false }));
+      setBusy(false);
+    }
+  };
+
+  // React to the session prop. The subscription that produces it lives
+  // in ToolbarApp (always mounted) rather than here, because this panel
+  // only mounts once hub.chatOpen flips true — and main broadcasts
+  // chat:session at the same moment it sets chatOpen. A listener inside
+  // this panel's onMount would miss the FIRST session every time (the
+  // event fired before the panel existed), which is exactly the "first
+  // Ask AI opens an empty chat, second one works" bug. Reacting to the
+  // prop runs the opening turn whether the session lands before or after
+  // mount. Each new sessionId resets the panel — old conversation is
+  // dropped (ephemeral by design in v1; persistence comes later).
+  // NOTE(review): lastSessionId is per-mount, so if the parent unmounts
+  // and remounts this panel with the same session still in props, the
+  // conversation is wiped and the opening turn is sent again.
+  let lastSessionId: string | null = null;
+  createEffect(() => {
+    const s = props.session;
+    if (!s || s.sessionId === lastSessionId) return;
+    lastSessionId = s.sessionId;
+    // Only props.session may re-run this effect. abortTurn and the
+    // synchronous head of runTurn read other signals (activeRequest,
+    // turns, props.*), so keep them out of the dependency set.
+    untrack(() => {
+      // Stop a stream that still belongs to the previous session so it
+      // neither keeps running in main nor lands in the new conversation.
+      abortTurn();
+      setSession(s);
+      setTurns([]);
+      // Kick off the first AI turn automatically. Image sessions fire
+      // with "" (the image + system prompt carry the request); text
+      // sessions fire with their precomputed initialText.
+      void runTurn(s.initialText ?? '', s);
+    });
+  });
+
+  onMount(() => {
+    const offChunk = window.pen.ai.onChunk((c) => {
+      if (c.requestId !== activeRequest()) return;
+      patchLastAssistant((turn) => {
+        let next = turn;
+        if (c.error) next = { ...next, error: c.error, pending: false };
+        else if (c.delta) next = { ...next, content: next.content + c.delta };
+        if (c.done) next = { ...next, pending: false };
+        return next;
+      });
+      // An error ends the turn even if main never follows it with
+      // `done`; otherwise the composer would stay stuck behind Cancel.
+      if (c.done || c.error) {
+        setActiveRequest(null);
+        setBusy(false);
+        queueMicrotask(focusComposer);
+      }
+    });
+    onCleanup(offChunk);
+  });
+
+  // The conversation is local to this component, so once it unmounts a
+  // running stream has nowhere to land — stop it instead of letting it
+  // run to completion in main.
+  onCleanup(() => {
+    turnToken += 1;
+    const id = activeRequest();
+    if (id) void window.pen.ai.cancel(id);
+  });
+
+  // Auto-scroll to the bottom as the assistant streams.
+  createEffect(() => {
+    void turns();
+    if (!scrollEl) return;
+    queueMicrotask(() => {
+      if (scrollEl) scrollEl.scrollTop = scrollEl.scrollHeight;
+    });
+  });
+
+  const onSend = (): void => {
+    const text = composer().trim();
+    if (text.length === 0 || busy()) return;
+    setComposer('');
+    void runTurn(text);
+  };
+
+  const onCancel = (): void => {
+    abortTurn();
+    patchLastAssistant((turn) => (turn.pending ? { ...turn, pending: false } : turn));
+  };
+
+  const onComposerKey = (e: KeyboardEvent): void => {
+    if (e.key === 'Enter' && (e.metaKey || e.ctrlKey)) {
+      e.preventDefault();
+      onSend();
+    } else if (e.key === 'Escape') {
+      e.preventDefault();
+      props.onClose();
+    }
+  };
+
+  // The snip image is large (200KB-2MB Uint8Array); render it via an
+  // object URL so we don't have to base64-encode for an <img>. Memoised
+  // so each session allocates exactly one URL, which is revoked when
+  // the session changes or the panel unmounts — an unrevoked object URL
+  // keeps its Blob alive for the lifetime of the document.
+  const thumbUrl = createMemo<string | null>(() => {
+    const s = session();
+    if (!s || !s.png) return null;
+    const url = URL.createObjectURL(
+      new Blob([s.png as BlobPart], { type: s.mime ?? 'image/png' }),
+    );
+    onCleanup(() => URL.revokeObjectURL(url));
+    return url;
+  });
+
+  const profileLabel = (): string => {
+    const s = session();
+    return s ? PROFILES[s.profile].label : '';
+  };
+
+  return (
+    <div class="settings-panel chat-panel">
+      <div class="settings-header">
+        <div class="chat-header-meta">
+          <span class="settings-title">Ask AI</span>
+          <Show when={props.provider && props.model} fallback={
+            <Show when={props.aiReady}>
+              <span class="chat-provider-badge">Local</span>
+            </Show>
+          }>
+            <span class="chat-provider-badge">
+              {props.provider} · {props.model}
+            </span>
+          </Show>
+        </div>
+        <button
+          class="winctl"
+          onClick={props.onClose}
+          title="Close chat"
+        >{Icons.close()}</button>
+      </div>
+
+      <Show when={thumbUrl()}>
+        <div class="chat-thumb-wrap">
+          <img class="chat-thumb" src={thumbUrl() ?? ''} alt="Snip" />
+          <span class="chat-thumb-meta">{profileLabel()}</span>
+          <span class="chat-thumb-sessionid" title={session()?.sessionId} />
+        </div>
+      </Show>
+
+      <Show when={!session()}>
+        <div class="chat-empty">
+          Start a chat by taking a snip and clicking <strong>Ask AI</strong>.
+        </div>
+      </Show>
+
+      <div class="chat-messages scroll-area" ref={scrollEl}>
+        {/* Hide the auto-fired opening user turn (empty text — the snip
+            thumbnail above already represents it); it exists only to
+            anchor the replayed history. */}
+        <For each={turns().filter((t) => t.role !== 'user' || t.content.length > 0)}>
+          {(turn) => (
+            <div class={`chat-bubble chat-bubble-${turn.role}`}>
+              <Show when={turn.role === 'assistant' && turn.pending && turn.content.length === 0}>
+                <span class="chat-typing">Thinking…</span>
+              </Show>
+              <Show when={turn.error}>
+                <span class="chat-error">⚠ {turn.error}</span>
+              </Show>
+              <Show when={turn.content.length > 0}>
+                <div
+                  class="chat-markdown"
+                  innerHTML={renderMarkdown(turn.content)}
+                />
+              </Show>
+            </div>
+          )}
+        </For>
+      </div>
+
+      <div class="chat-composer">
+        <textarea
+          ref={composerEl}
+          class="chat-input"
+          placeholder={
+            session() ? 'Ask a follow-up… (⌘↩ to send, Esc to close)' : 'Take a snip first'
+          }
+          value={composer()}
+          onInput={(e) => setComposer((e.currentTarget as HTMLTextAreaElement).value)}
+          onKeyDown={onComposerKey}
+          disabled={!session()}
+          rows={2}
+        />
+        <Show
+          when={!busy()}
+          fallback={
+            <button class="chat-send chat-cancel" onClick={onCancel}>
+              Cancel
+            </button>
+          }
+        >
+          <button
+            class="chat-send"
+            onClick={onSend}
+            disabled={!session() || composer().trim().length === 0}
+            title="Send (⌘↩)"
+          >
+            Send
+          </button>
+        </Show>
+      </div>
+    </div>
+  );
+}
+
+// Uint8Array → base64. atob/btoa don't accept binary directly, so we
+// build the string in chunks to avoid the call-stack limit on large
+// images.
+function uint8ToBase64(bytes: Uint8Array): string {
+  const CHUNK = 0x8000;
+  let s = '';
+  for (let i = 0; i < bytes.length; i += CHUNK) {
+    s += String.fromCharCode.apply(
+      null,
+      bytes.subarray(i, i + CHUNK) as unknown as number[],
+    );
+  }
+  return btoa(s);
+}
+
+// Escapes the characters that are significant in HTML text and
+// attribute values so the input renders as literal text.
+function escapeHtml(text: string): string {
+  return text
+    .replace(/&/g, '&amp;')
+    .replace(/</g, '&lt;')
+    .replace(/>/g, '&gt;')
+    .replace(/"/g, '&quot;')
+    .replace(/'/g, '&#39;');
+}
+
+// walkTokens hook for marked, run on every token before rendering.
+// Raw-HTML tokens are escaped so they show up as literal text instead
+// of being injected as markup, and link / image targets outside
+// SAFE_URL (javascript:, data:, file:, relative paths …) are replaced
+// with an inert '#'.
+function neutraliseToken(token: MarkdownToken): void {
+  if (token.type === 'html') {
+    if (typeof token.text === 'string') token.text = escapeHtml(token.text);
+  } else if (token.type === 'link' || token.type === 'image') {
+    if (!SAFE_URL.test((token.href ?? '').trim())) token.href = '#';
+  }
+}
+
+// Markdown → HTML for the innerHTML of a chat bubble. The content is
+// untrusted (model output, which can echo text found in the snip), so
+// neutraliseToken runs over the token stream first.
+// NOTE(review): allowed links still render as plain <a href>; confirm
+// main keeps the toolbar window from navigating when one is clicked.
+function renderMarkdown(src: string): string {
+  // marked.parse returns string | Promise<string>; we use the sync
+  // path by passing no async options. Cast is safe.
+  return marked.parse(src, { walkTokens: neutraliseToken }) as string;
+}
diff --git a/src/renderer/toolbar/styles.css b/src/renderer/toolbar/styles.css
index 0d1fb36..d833c37 100644
--- a/src/renderer/toolbar/styles.css
+++ b/src/renderer/toolbar/styles.css
@@ -1146,3 +1146,357 @@ html, body {
 .bar[data-orient='v'] .bar-footer-controls {
   justify-content: center;
 }
+
+/* ─────────────────── AI SETTINGS SECTION ─────────────────── */
+/* Reuses .settings-row-stack for label-on-top layout. The provider
+   and model selects use a native <select> styled to match the
+   existing .settings-toggle palette. */
+
+.ai-section .ai-select {
+  appearance: auto;
+  background: var(--input-bg);
+  color: var(--text);
+  border: 1px solid var(--border);
+  border-radius: 6px;
+  padding: 5px 10px;
+  font-size: 11.5px;
+  cursor: pointer;
+}
+
+.ai-key-input {
+  appearance: none;
+  width: 100%;
+  background: var(--input-bg);
+  color: var(--text);
+  border: 1px solid var(--border);
+  border-radius: 6px;
+  padding: 6px 10px;
+  font-size: 12px;
+  font-family: "SF Mono", "JetBrains Mono", Menlo, monospace;
+  outline: none;
+  letter-spacing: 0.02em;
+}
+.ai-key-input:focus {
+  border-color: var(--gold);
+  box-shadow: 0 0 0 2px rgba(216, 181, 114, 0.18);
+}
+
+.ai-key-actions {
+  display: flex;
+  gap: 6px;
+  align-items: center;
+  flex-wrap: wrap;
+}
+.ai-key-actions .settings-toggle { padding: 5px 12px; }
+
+.ai-key-delete {
+  color: #e74c3c !important;
+  border-color: rgba(231, 76, 60, 0.30) !important;
+}
+.ai-key-delete:hover { background: rgba(231, 76, 60, 0.10) !important; }
+
+.ai-badge-configured {
+  display: inline-block;
+  margin-left: 8px;
+  font-size: 9.5px;
+  font-weight: 600;
+  letter-spacing: 0.04em;
+  text-transform: uppercase;
+  color: #34c759;
+}
+
+.ai-test-result {
+  font-size: 10.5px;
+  padding: 5px 8px;
+  border-radius: 5px;
+  font-weight: 500;
+}
+.ai-test-result.ok {
+  color: #34c759;
+  background: rgba(52, 199, 89, 0.10);
+  border: 1px solid rgba(52, 199, 89, 0.25);
+}
+.ai-test-result.fail {
+  color: #e74c3c;
+  background: rgba(231, 76, 60, 0.10);
+  border: 1px solid rgba(231, 76, 60, 0.25);
+}
+
+.ai-key-link {
+  font-size: 10.5px;
+  color: var(--hint-accent);
+  text-decoration: none;
+  align-self: flex-end;
+  cursor: pointer;
+}
+.ai-key-link:hover { text-decoration: underline; }
+
+.ai-prompt-row {
+  display: flex;
+  flex-direction: column;
+  gap: 4px;
+  margin-bottom: 6px;
+}
+.ai-prompt-row-head {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+}
+.ai-prompt-row-label {
+  font-size: 11px;
+  font-weight: 600;
+  color: var(--text);
+}
+.ai-prompt-reset {
+  appearance: none;
+  background: transparent;
+  border: none;
+  color: var(--hint-accent);
+  font-size: 10px;
+  cursor: pointer;
+  padding: 0;
+}
+.ai-prompt-reset:hover { text-decoration: underline; }
+
+.ai-prompt-textarea {
+  appearance: none;
+  width: 100%;
+  background: var(--input-bg);
+  color: var(--text);
+  border: 1px solid var(--border);
+  border-radius: 6px;
+  padding: 6px 8px;
+  font-size: 11px;
+  font-family: inherit;
+  line-height: 1.4;
+  resize: vertical;
+  outline: none;
+}
+.ai-prompt-textarea:focus {
+  border-color: var(--gold);
+  box-shadow: 0 0 0 2px rgba(216, 181, 114, 0.18);
+}
+
+.ai-disclosure {
+  font-size: 10px;
+  line-height: 1.4;
+  color: var(--hint);
+  font-style: italic;
+  padding: 6px 8px;
+  border-left: 2px solid var(--separator);
+  margin-top: 4px;
+}
+
+/* ─────────────────── CHAT PANEL ─────────────────── */
+
+.chat-panel {
+  /* Reuses .settings-panel chrome via shared class — these tweak
+     internal layout to host: header, thumbnail, message list, composer. */
+  padding: 10px 12px;
+  gap: 8px;
+}
+
+.chat-header-meta {
+  display: flex;
+  align-items: center;
+  gap: 8px;
+  flex-wrap: wrap;
+  min-width: 0;
+  flex: 1 1 auto;
+}
+
+.chat-provider-badge {
+  font-size: 10px;
+  letter-spacing: 0.02em;
+  color: var(--hint);
+  background: var(--group-bg);
+  border: 1px solid var(--group-border);
+  padding: 2px 6px;
+  border-radius: 4px;
+  font-family: "SF Mono", "JetBrains Mono", Menlo, monospace;
+  white-space: nowrap;
+  overflow: hidden;
+  text-overflow: ellipsis;
+  max-width: 220px;
+}
+
+.chat-thumb-wrap {
+  position: relative;
+  display: flex;
+  align-items: center;
+  gap: 8px;
+  padding: 6px;
+  background: var(--group-bg);
+  border: 1px solid var(--group-border);
+  border-radius: 6px;
+}
+.chat-thumb {
+  display: block;
+  max-width: 80px;
+  max-height: 60px;
+  border-radius: 4px;
+  object-fit: contain;
+  background: #000;
+}
+.chat-thumb-meta {
+  font-size: 10.5px;
+  color: var(--hint);
+  font-weight: 600;
+}
+
+.chat-empty {
+  font-size: 11px;
+  color: var(--hint);
+  padding: 16px 8px;
+  text-align: center;
+  font-style: italic;
+}
+
+.chat-messages {
+  flex: 1 1 auto;
+  min-height: 0;
+  overflow-y: auto;
+  display: flex;
+  flex-direction: column;
+  gap: 6px;
+  padding: 4px 2px;
+}
+
+.chat-bubble {
+  padding: 8px 10px;
+  border-radius: 8px;
+  font-size: 11.5px;
+  line-height: 1.45;
+  max-width: 100%;
+  word-wrap: break-word;
+  word-break: break-word;
+}
+.chat-bubble-user {
+  background: rgba(216, 181, 114, 0.14);
+  border: 1px solid rgba(216, 181, 114, 0.28);
+  color: var(--text);
+  align-self: flex-end;
+  max-width: 90%;
+}
+.chat-bubble-assistant {
+  background: var(--group-bg);
+  border: 1px solid var(--group-border);
+  color: var(--text);
+  align-self: flex-start;
+  max-width: 100%;
+}
+
+.chat-typing {
+  display: inline-block;
+  color: var(--hint);
+  font-style: italic;
+  animation: chatTypingPulse 1.4s ease-in-out infinite;
+}
+@keyframes chatTypingPulse {
+  0%, 100% { opacity: 0.45; }
+  50% { opacity: 0.85; }
+}
+
+.chat-error {
+  color: #e74c3c;
+  font-size: 11px;
+}
+
+/* Markdown rendering inside assistant bubbles — keep it tight; the
+   panel is narrow. */
+.chat-markdown { display: block; }
+.chat-markdown p { margin: 0 0 6px 0; }
+.chat-markdown p:last-child { margin-bottom: 0; }
+.chat-markdown ul, .chat-markdown ol { margin: 4px 0 6px 16px; padding: 0; }
+.chat-markdown li { margin-bottom: 2px; }
+.chat-markdown code {
+  background: var(--input-bg);
+  border: 1px solid var(--border);
+  border-radius: 3px;
+  padding: 0 4px;
+  font-family: "SF Mono", "JetBrains Mono", Menlo, monospace;
+  font-size: 10.5px;
+}
+.chat-markdown pre {
+  background: var(--input-bg);
+  border: 1px solid var(--border);
+  border-radius: 5px;
+  padding: 8px 10px;
+  overflow-x: auto;
+  margin: 4px 0 6px 0;
+}
+.chat-markdown pre code {
+  background: transparent;
+  border: none;
+  padding: 0;
+}
+.chat-markdown strong { font-weight: 600; }
+.chat-markdown em { font-style: italic; }
+.chat-markdown h1, .chat-markdown h2, .chat-markdown h3 {
+  font-size: 12px;
+  font-weight: 700;
+  margin: 6px 0 4px 0;
+}
+.chat-markdown a {
+  color: var(--gold);
+  text-decoration: underline;
+  text-decoration-thickness: 1px;
+}
+
+.chat-composer {
+  display: flex;
+  flex-direction: column;
+  gap: 4px;
+  flex-shrink: 0;
+  border-top: 1px solid var(--separator);
+  padding-top: 8px;
+}
+.chat-input {
+  appearance: none;
+  width: 100%;
+  background: var(--input-bg);
+  color: var(--text);
+  border: 1px solid var(--border);
+  border-radius: 6px;
+  padding: 6px 8px;
+  font-size: 12px;
+  font-family: inherit;
+  line-height: 1.4;
+  resize: vertical;
+  outline: none;
+}
+.chat-input:focus {
+  border-color: var(--gold);
+  box-shadow: 0 0 0 2px rgba(216, 181, 114, 0.18);
+}
+.chat-input[disabled] { opacity: 0.55; cursor: not-allowed; }
+
+.chat-send {
+  appearance: none;
+  align-self: flex-end;
+  background: linear-gradient(180deg, var(--gold) 0%, var(--gold-strong) 100%);
+  color: var(--gold-text);
+  border: 1px solid rgba(0, 0, 0, 0.25);
+  border-radius: 6px;
+  padding: 5px 14px;
+  font-size: 11.5px;
+  font-weight: 600;
+  cursor: pointer;
+  transition: filter 0.12s, transform 0.10s;
+}
+.chat-send:hover { filter: brightness(1.05); }
+.chat-send:active { transform: scale(0.97); }
+.chat-send[disabled] {
+  filter: grayscale(0.5);
+  opacity: 0.55;
+  cursor: not-allowed;
+}
+.chat-cancel {
+  background: transparent;
+  border-color: rgba(231, 76, 60, 0.4);
+  color: #e74c3c;
+}
+.chat-cancel:hover {
+  background: rgba(231, 76, 60, 0.10);
+  filter: none;
+}
diff --git a/src/shared/constants.ts b/src/shared/constants.ts
index 7cd28d2..037eb7b 100644
--- a/src/shared/constants.ts
+++ b/src/shared/constants.ts
@@ -19,8 +19,40 @@ export const HIGHLIGHTER_DEFAULT: ToolSettings = {
 
 export const FIB_LEVELS = [0, 0.236, 0.382, 0.5, 0.618, 0.786, 1.0];
 
+// Per-level colors for the Fibonacci retracement, matching the
+// convention traders are used to on TradingView / MT charts: each
+// ratio reads as a distinct hue so levels are identifiable at a glance
+// without checking the label. 0 and 1 (the swing endpoints) are
+// neutral grey; the inner ratios run warm→cool, with the 0.618 golden
+// ratio in its signature teal. Keyed by the ratio's string form.
+export const FIB_COLORS: Record<string, string> = {
+  '0': '#9598a1', // swing low/high — neutral grey
+  '0.236': '#f23645', // red
+  '0.382': '#ff9800', // orange
+  '0.5': '#4caf50', // green
+  '0.618': '#089981', // golden ratio — teal (the key level)
+  '0.786': '#2962ff', // blue
+  '1': '#9598a1', // full retrace — neutral grey
+};
+
+// Color for one Fibonacci ratio; off-palette (custom) ratios get neutral grey.
+export function fibColor(level: number): string {
+  const swatch = FIB_COLORS[`${level}`];
+  return swatch ?? '#9598a1';
+}
+
 export const SNAP_ANGLES_DEG = [0, 15, 30, 45, 60, 75, 90, 105, 120, 135, 150, 165, 180];
 
+// Default first user message for the auto-fired opening turn of an
+// "Ask AI" snip session. The user hasn't typed anything yet — the image
+// carries the request — so this is phrased to make the model SOLVE or
+// answer whatever is in the image rather than merely describe it. Used
+// by every provider adapter when input.userMessage is empty.
+export const SOLVE_FIRST_TURN =
+  'Solve or answer whatever is shown in this image. If it contains a ' +
+  'problem, question, equation, or task, work it out and give the final ' +
+  'answer with the key steps — do not just describe what you see.';
+
 // Initial sizes for the toolbar window. The renderer reports its
 // actual content size after mount and the window resizes to fit — so
 // these values just need to be a generous first-paint estimate close
diff --git a/src/shared/profiles.ts b/src/shared/profiles.ts
index 3c86d53..17ab3ea 100644
--- a/src/shared/profiles.ts
+++ b/src/shared/profiles.ts
@@ -5,6 +5,11 @@ export interface Profile {
   label: string;
   description: string;
   tools: ToolId[];
+  // Default system prompt used when the user clicks "Ask AI" on a
+  // snip while this profile is active. Overridable per profile in
+  // Settings → AI. The user override lives in
+  // PersistedState.aiProfilePrompts; this is the fallback.
+  aiPrompt: string;
 }
 
 export const PROFILES: Record<ProfileId, Profile> = {
@@ -13,6 +18,14 @@ export const PROFILES: Record<ProfileId, Profile> = {
     label: 'General',
     description: 'Everyday annotations — simple & common',
     tools: ['pencil', 'pen', 'eraser', 'hand', 'line', 'arrow', 'text', 'region', 'ellipse', 'snip'],
+    aiPrompt:
+      'You are a helpful assistant looking at a screenshot the user has ' +
+      'captured. Your job is to SOLVE or answer what is in the image, not ' +
+      'merely describe it. If it contains a problem, question, equation, ' +
+      'code, a multiple-choice item, an error message, or any task — work it ' +
+      'out and give the final answer, showing the key steps concisely. If the ' +
+      'user asks a specific question, answer it directly. Only fall back to a ' +
+      'short description when there is genuinely nothing to solve or answer.',
   },
   teacher: {
     id: 'teacher',
@@ -31,6 +44,14 @@ export const PROFILES: Record<ProfileId, Profile> = {
       'ellipse',
       'snip',
     ],
+    aiPrompt:
+      'You are tutoring a student from this captured image. If it shows a ' +
+      'problem or exercise (math, science, language, a question), SOLVE it ' +
+      'step by step so the student can follow the reasoning, then state the ' +
+      'final answer clearly. If it shows a concept or diagram instead, explain ' +
+      'what it is, why it matters, and the single key idea to take away. Plain ' +
+      'language; define any jargon. Be thorough on the solution, concise on ' +
+      'commentary.',
   },
   trader: {
     id: 'trader',
@@ -49,9 +70,30 @@ export const PROFILES: Record<ProfileId, Profile> = {
       'text',
       'snip',
     ],
+    aiPrompt:
+      'You are an experienced market analyst. Your input is either a price ' +
+      'chart image or a set of technical levels the user has marked, given ' +
+      'to you as computed numbers (treat any provided numbers as exact — do ' +
+      'not re-estimate them). In order: (1) name the instrument and timeframe ' +
+      'if known, (2) identify the prevailing trend, (3) call out the key ' +
+      'support / resistance and Fibonacci levels and notable patterns, (4) ' +
+      'offer one or two probabilistic scenarios with the invalidation level ' +
+      'for each. Be concise; do not give financial advice — frame everything ' +
+      'as observation.',
   },
 };
 
 export const DEFAULT_PROFILE: ProfileId = 'general';
 
 export const PROFILE_ORDER: ProfileId[] = ['general', 'teacher', 'trader'];
+
+// Effective system prompt for a profile. A user override wins as long
+// as it holds any non-whitespace text (it is returned untrimmed);
+// otherwise the profile's built-in default prompt is used.
+export function resolveAiPrompt(
+  profile: ProfileId,
+  overrides: Partial<Record<ProfileId, string>>,
+): string {
+  const custom = overrides[profile] || '';
+  return custom.trim().length > 0 ? custom : PROFILES[profile].aiPrompt;
+}
diff --git a/src/shared/types.ts b/src/shared/types.ts
index e076d85..4cd0611 100644
--- a/src/shared/types.ts
+++ b/src/shared/types.ts
@@ -97,6 +97,10 @@ export interface TextShape {
   text: string;
   color: string;
   fontSize: number;
+  // CSS font-family stamped at creation from the user's default-font
+  // setting. Optional for back-compat with items saved before the
+  // setting existed; drawText falls back to the system stack.
+  fontFamily?: string;
 }
 
 export type Item =
@@ -148,8 +152,168 @@ export type HubStateUpdate = {
   // main can resize the toolbar window to fit it, the same way it
   // does for settingsOpen.
   statusPanelOpen?: boolean;
+  // AI integration. chatOpen is transient (panel visibility);
+  // the others persist in PersistedState too.
+  chatOpen?: boolean;
+  aiActiveProvider?: ProviderId | null;
+  aiActiveModel?: string | null;
+  aiProfilePrompts?: Partial<Record<ProfileId, string>>;
+  // Local (Ollama) AI. aiLocalEnabled flips local-first on; when on and
+  // a model is installed the resolver prefers local over cloud.
+  aiLocalEnabled?: boolean;
+  aiInstalledModels?: string[];
+  aiLocalModel?: string | null; // global default text model tag (fallback)
+  aiLocalVisionModel?: string | null; // global default vision model tag (fallback)
+  aiProfileModels?: AiProfileModels; // per-profile model overrides
+
+  // Autocorrect toggles — independent for typed text and drawn ink.
+  autocorrectTyped?: boolean;
+  autocorrectDrawn?: boolean;
+  // CSS font-family for newly created text (typed + recognized).
+  defaultTextFont?: string;
+  // First-run setup wizard completed (or skipped).
+  aiOnboarded?: boolean;
+  // Auto-update preference. When true (default) new versions download
+  // in the background and install on quit; when false the app only
+  // notifies and waits for an explicit "Restart to update".
+  autoUpdate?: boolean;
 };
 
+// Auto-update lifecycle, surfaced to the renderer via the 'updater:status'
+// event and the 'updater:get' snapshot. `unsupported` covers the macOS
+// unsigned case (Squirrel.Mac refuses unsigned updates) and dev runs —
+// there the UI offers a manual "Download from GitHub" link instead.
+export interface UpdateStatus {
+  state:
+    | 'idle'
+    | 'checking'
+    | 'available'
+    | 'downloading'
+    | 'downloaded'
+    | 'none'
+    | 'error'
+    | 'unsupported';
+  // Running app version (always populated).
+  currentVersion: string;
+  // The newer version, when one is available/downloaded.
+  version?: string;
+  // Download progress, 0–100, while state === 'downloading'.
+  percent?: number;
+  // Human-readable detail for 'error'/'unsupported'.
+  message?: string;
+}
+
+// ── AI integration types ───────────────────────────────────────────
+
+// 'ollama' is the local-first provider (no API key — models run on the
+// user's machine via the Ollama service). The cloud providers stay
+// available as an opt-in fallback. Note: DeepSeek is text-only (its API
+// rejects image input), so image snips routed to it answer from text
+// alone — for image Q&A prefer local vision or Claude / GPT-4o / Gemini.
+// 'sarvam' IS vision-capable: its adapter OCRs the image via Sarvam
+// Document Intelligence, then solves with Sarvam's own chat model.
+export type ProviderId = 'anthropic' | 'openai' | 'gemini' | 'deepseek' | 'sarvam' | 'ollama';
+
+export interface AiStatus {
+  provider: ProviderId;
+  configured: boolean;
+}
+
+// Per-profile local model overrides. Each profile can pin a text model
+// (grammar / chat / analysis) and a vision model (screenshot Q&A / OCR);
+// anything unset falls back to the catalogue default for that profile.
+export type AiProfileModels = Partial<Record<ProfileId, { text?: string; vision?: string }>>;
+
+// ── Local (Ollama) types ───────────────────────────────────────────
+
+// One entry in the local model catalogue surfaced in the installer.
+export interface LocalModelInfo {
+  // Ollama tag, e.g. 'llama3.2:1b'.
+  tag: string;
+  label: string;
+  kind: 'text' | 'vision' | 'embed';
+  approxBytes: number;
+  // True once the tag is present in the local Ollama library.
+  installed: boolean;
+  // True for the first-run default set the setup wizard pulls.
+  defaultPull?: boolean;
+}
+
+export interface OllamaServiceStatus {
+  installed: boolean; // ollama binary / daemon reachable
+  running: boolean; // /api/version answered
+  version?: string;
+  error?: string;
+}
+
+export interface OllamaPullProgress {
+  model: string;
+  status: string;
+  completed?: number;
+  total?: number;
+  done?: boolean;
+  error?: string;
+}
+
+export interface ChatTurn {
+  role: 'user' | 'assistant';
+  content: string;
+}
+
+export interface AskInput {
+  provider: ProviderId;
+  model: string;
+  systemPrompt: string;
+  // PNG attached to the FIRST user turn only. Renderer encodes the
+  // snip and sends bytes through IPC; main decodes and forwards to
+  // the provider in whatever shape it wants.
+  image?: { mime: string; base64: string };
+  history: ChatTurn[];
+  userMessage: string;
+  // The active profile, when known. Lets the resolver pick the
+  // per-profile model and (later) inject profile-specific RAG context.
+  profile?: ProfileId;
+  // The chat session this turn belongs to. Main caches the snip image
+  // (and, for Sarvam, the one-shot OCR text) per session so follow-up
+  // turns retain the original image/problem context without the
+  // renderer re-uploading it or re-running OCR each time.
+  sessionId?: string;
+}
+
+export interface StreamChunk {
+  requestId: string;
+  delta?: string;
+  done?: boolean;
+  error?: string;
+}
+
+export interface ConnectionTestResult {
+  ok: boolean;
+  message?: string;
+  // Round-trip duration in milliseconds, populated on ok=true.
+  latencyMs?: number;
+}
+
+// Payload of the chat:session broadcast — sent from main to every
+// renderer when SnipActions kicks off a new AI chat. The toolbar's
+// ChatPanel picks this up to render the image thumbnail + auto-fire
+// the first turn against the configured provider.
+export interface ChatSessionPayload {
+  sessionId: string;
+  // Image sessions (snip "Ask AI") carry a PNG; text-only sessions
+  // (e.g. the trader numeric-analysis flow) omit it.
+  png?: Uint8Array;
+  mime?: string;
+  // For a text-only session: the first user message to auto-send
+  // (e.g. the computed technical levels). Image sessions leave this
+  // empty and auto-fire with "".
+  initialText?: string;
+  // The profile the user was in when they clicked Ask AI. Stays
+  // bound to the chat — profile switches mid-conversation don't
+  // retroactively re-prime the system prompt.
+  profile: ProfileId;
+}
+
 export type IpcChannel =
   | 'hub:state:get'
   | 'hub:state:update'
@@ -179,6 +343,16 @@ export type IpcChannel =
   | 'toolbar:on-right-side'
   | 'toolbar:set-content-size'
   | 'app:info'
+  // Auto-update (electron-updater → GitHub Releases). `get` returns the
+  // current snapshot; `check` forces a check; `install` quits and
+  // applies a downloaded update; `open-releases` opens the GitHub
+  // Releases page (manual fallback, e.g. unsigned macOS); `status` is
+  // the push event the renderer subscribes to.
+  | 'updater:get'
+  | 'updater:check'
+  | 'updater:install'
+  | 'updater:open-releases'
+  | 'updater:status'
   | 'permissions:check'
   | 'permissions:open'
   | 'permissions:needed'
@@ -186,7 +360,49 @@ export type IpcChannel =
   | 'permissions:deep-recheck'
   | 'app:relaunch'
   | 'settings:save-dir:pick'
-  | 'shell:open-path';
+  | 'shell:open-path'
+  // AI integration
+  | 'ai:set-key'
+  | 'ai:delete-key'
+  | 'ai:get-status'
+  | 'ai:test-connection'
+  | 'ai:ask'
+  | 'ai:cancel'
+  | 'ai:chunk'
+  // Non-streaming one-shot calls: recognize handwriting (image→text)
+  // and autocorrect typed text (text→text). Both resolve provider/
+  // model the same way ai:ask does.
+  | 'ai:recognize'
+  | 'ai:autocorrect'
+  // Local Ollama service management.
+  | 'ollama:status'
+  | 'ollama:start'
+  | 'ollama:pull'
+  | 'ollama:pull-progress'
+  | 'ollama:cancel-pull'
+  | 'ollama:delete-model'
+  | 'ollama:list-models'
+  | 'ollama:disk-space'
+  | 'ollama:install-help'
+  // Local RAG "self-learning" store.
+  | 'rag:stats'
+  | 'rag:reset-profile'
+  | 'rag:capture'
+  // Cross-window chat-session handoff: overlay's SnipActions starts
+  // a chat with a snip image; main broadcasts a session event so the
+  // toolbar's ChatPanel receives the image and opens.
+  | 'chat:start'
+  | 'chat:start-text'
+  | 'chat:session'
+  // Trader hybrid: toolbar asks the focused overlay to compute its
+  // drawn technical levels and open a text-only analysis chat.
+  | 'relay:analyze'
+  | 'overlay:analyze'
+  // Renderer-friendly shortcut: ask AI about the current snip
+  // selection. Main captures + composites the focused display's
+  // snip (same path as Save), then internally calls chat:start with
+  // the bytes — no need for the renderer to handle PNG capture.
+  | 'snip:ask-ai';
 
 export interface CaptureSaved {
   path: string;
diff --git a/vite.config.ts b/vite.config.ts
index e0153b1..d277a32 100644
--- a/vite.config.ts
+++ b/vite.config.ts
@@ -21,7 +21,22 @@ export default defineConfig({
           build: {
             outDir: 'dist-electron/main',
             rollupOptions: {
-              external: ['electron', 'electron-store', 'active-win'],
+              // bufferutil / utf-8-validate are OPTIONAL native addons of
+              // `ws` (pulled in transitively by the sarvamai SDK). They
+              // aren't installed; `ws` already wraps their require() in a
+              // try/catch and falls back to pure JS. Marking them external
+              // keeps them as runtime requires instead of letting Rollup
+              // emit a hard-failing resolve stub.
+              external: [
+                'electron',
+                'electron-store',
+                'active-win',
+                // Loaded from node_modules at runtime (shipped in app
+                // dependencies); bundling it pulls in dynamic requires.
+                'electron-updater',
+                'bufferutil',
+                'utf-8-validate',
+              ],
             },
           },
         },