diff --git a/README.md b/README.md
index 0ef8221..b80f940 100644
--- a/README.md
+++ b/README.md
@@ -13,10 +13,11 @@ Character-focused local chatbot with RAG support (ChromaDB + LangChain), CLI and
 ## What It Includes
 
 - Local chat runtime backed by `llama-cpp-python`
-- Character-card-driven prompting (`cards/*.json`)
+- Character-card-driven prompting (`cards/*.json`) with avatar display
 - RAG retrieval from ChromaDB collections
 - Dynamic context budgeting and history management
 - GPU offload auto-layer calculation and KV cache quant support
+- Web UI (FastAPI + Jinja2 + HTMX): chat, session management, RAG management, diagnostics
 - Scripted workflows for analyzing, pushing, and managing RAG data
 
 ## Current Runtime Entry Points
@@ -75,9 +76,20 @@ Notes for web chat behavior:
 
 - Shows status updates (`Ready`, `Sending`, `Thinking`, `Streaming`, `Timed out`).
 - Applies a stream timeout and surfaces a `Retry` button on stream failure.
-- Supports named session save + explicit session picker load in the sidebar.
-- Shows both latest retrieval debug stats and per-turn retrieval trace history.
-- Provides quick actions for copy/export and command-equivalent controls (`clear`, `reload`, `help`).
+- Sidebar has three tabs: **Character** (avatar + card info), **Sessions** (save/load/search), **Debug** (per-turn retrieval trace + diagnostics).
+- Named session save/load and full-text session search with character and date filters.
+- Token budget bar in the Debug tab's Diagnostics panel shows real-time context-window allocation (system / history / RAG / examples / input / reserved / free).
+- Per-turn stats: estimated prompt and completion tokens, context window fill %, RAG chunks used.
+- Quick actions for copy/export (TXT, JSON, ZIP bundle) and command-equivalent controls (`clear`, `reload`, `help`).
+- Saveable preset profiles for retrieval settings (MMR, rerank, multi-query, k values).
+
+RAG management UI at **`/rag`** (link in the chat sidebar):
+
+- Upload new source files (`.txt`) and create ChromaDB collections directly from the browser.
+- View, lint, and run coverage analysis on `rag_data/` files.
+- List, query, rebuild, and delete collections.
+- Run fixture evaluations and view retrieval trend history.
+- View embedding benchmark results.
 
 ## Setup
 
diff --git a/cards/Shodan-specV2.jpg b/cards/Shodan-specV2.jpg
new file mode 100644
index 0000000..eb3c3b5
Binary files /dev/null and b/cards/Shodan-specV2.jpg differ
diff --git a/core/conversation_manager.py b/core/conversation_manager.py
index 6673e48..9dcc009 100644
--- a/core/conversation_manager.py
+++ b/core/conversation_manager.py
@@ -143,6 +143,17 @@ def __init__(self) -> None:
             "mes": {"mode": "unknown", "returned": 0, "candidates": 0, "queries": 0, "rerank_applied": False},
             "cleanup": {"main": 0, "mes": 0, "cross_removed": 0},
         }
+        self.last_token_budget: dict[str, int] = {
+            "system_prompt_tokens": 0,
+            "history_tokens": 0,
+            "rag_tokens": 0,
+            "examples_tokens": 0,
+            "input_tokens": 0,
+            "total_estimated": 0,
+            "context_window": 0,
+            "available_for_context": 0,
+            "reserved_for_response": 0,
+        }
         self._vector_client: object | None = None
         self._vector_embedder: object | None = None
         self._cross_encoder: object | None = None
diff --git a/core/conversation_prompt_history_mixin.py b/core/conversation_prompt_history_mixin.py
index 8720927..6bbde69 100644
--- a/core/conversation_prompt_history_mixin.py
+++ b/core/conversation_prompt_history_mixin.py
@@ -186,6 +186,18 @@ def _prepare_dynamic_vector_context(self, message: str, mes_example: str) -> tup
         vector_context = str(allocation["allocated_context"])
         allocated_history = str(allocation["allocated_history"])
 
+        self.last_token_budget = {
+            "system_prompt_tokens": budget.system_prompt_tokens,
+            "history_tokens": int(allocation["history_tokens"]),
+            "rag_tokens": int(allocation["context_tokens"]),
+            "examples_tokens": int(allocation["examples_tokens"]),
+            "input_tokens": int(allocation["input_tokens"]),
+            "total_estimated": int(allocation["total_allocated"]) + budget.system_prompt_tokens,
+            "context_window": budget.total_context,
+            "available_for_context": budget.available_for_context,
+            "reserved_for_response": budget.reserved_for_response,
+        }
+
         if self.runtime_config.debug_context:
             logger.debug(self.context_manager.get_context_info(budget, allocation))
 
diff --git a/core/rag_manager.py b/core/rag_manager.py
index dc0be54..f208a76 100644
--- a/core/rag_manager.py
+++ b/core/rag_manager.py
@@ -204,6 +204,36 @@ def file_content(config: RagScriptConfig, filename: str) -> str | None:
     return candidate.read_text(encoding="utf-8")
 
 
+def save_rag_file(config: RagScriptConfig, stem: str, content: bytes) -> dict[str, Any]:
+    """Save *content* as ``{stem}.txt`` in the rag_data directory, replacing any existing file.
+
+    Creates the directory if it is missing. Raises ``ValueError`` if *stem* is invalid.
+    Returns a file-info dict matching the shape produced by :func:`list_rag_files`.
+    """
+    if not is_valid_stem(stem):
+        msg = f"Invalid stem {stem!r}: only letters, digits, underscores, and hyphens are allowed."
+        raise ValueError(msg)
+    rag_dir = Path(config.documents_directory)
+    rag_dir.mkdir(parents=True, exist_ok=True)
+    dest = rag_dir / f"{stem}.txt"
+    dest.write_bytes(content)
+    return {
+        "name": dest.name,
+        "stem": stem,
+        "type": "message_examples" if stem.endswith("_message_examples") else "lore",
+        "size": len(content),
+        "has_metadata": (rag_dir / f"{stem}.json").exists(),
+    }
+
+
+def list_rag_stems(config: RagScriptConfig) -> list[str]:
+    """Return sorted stems of the .txt files in rag_data/, or [] if that directory does not exist."""
+    rag_dir = Path(config.documents_directory)
+    if not rag_dir.exists():
+        return []
+    return sorted(p.stem for p in rag_dir.glob("*.txt"))
+
+
 # ---------------------------------------------------------------------------
 # Linting
 # ---------------------------------------------------------------------------
diff --git a/docs/future_work/COPILOT_COMPACT_REFERENCE.md b/docs/future_work/COPILOT_COMPACT_REFERENCE.md
index 8a8fbe7..83211f5 100644
--- a/docs/future_work/COPILOT_COMPACT_REFERENCE.md
+++ b/docs/future_work/COPILOT_COMPACT_REFERENCE.md
@@ -1,6 +1,6 @@
 # Copilot Compact Reference — Implemented State
 
-Last verified: 2026-03-29
+Last verified: 2026-04-03
 
 Use this as the single compact reference for implemented work across conversation quality, RAG quality, and web app behavior.
 
@@ -143,18 +143,46 @@ Primary files:
 - **Per-turn diagnostics panel**: collapsible sidebar panel showing Turn, Latency (s), Chars, Main chunks, MES chunks, Cross-removed, and Drift score (colour-coded at warning/fail thresholds) for the last 40 turns. Auto-refreshes after each stream. Route: `GET /chat/diagnostics`.
 - **Saveable preset profiles**: collapsible sidebar panel for saving/applying/deleting named snapshots of 7 retrieval settings (`use_mmr`, `rag_rerank_enabled`, `rag_sentence_compression_enabled`, `rag_multi_query_enabled`, `rag_k`, `rag_k_mes`, `debug_context`). Profiles persisted in `configs/profiles.json`; applied in-place to the live `ConversationRuntimeConfig` without restart. Routes: `GET/POST /settings/profiles/*`.
 - **One-click export bundle**: `GET /chat/export/bundle` downloads a ZIP containing `manifest.json`, `conversation.json` (full session), `retrieval_traces.json` (per-turn history), and `drift_history.json`. Button in composer quick-actions.
+- **RAG Management UI** (`/rag`): Standalone dark-theme page with left nav. Sections: Collections (list, detail, delete, ad-hoc query, rebuild/push with async job, fingerprint backfill), Files (list, view, lint run/fix, coverage analysis), Evaluate (fixture pack selector, run evaluate-fixtures, results table, retrieval trend history), Benchmark (last-run model comparison table). Long-running ops (push, evaluate) use in-memory `JobStore` + HTMX polling (`every 2s`). Link from chat sidebar.
+- **Session history search**: Collapsible "Search sessions" panel inside the Sessions sidebar panel. Searches all saved `logs/web_sessions/session_*.json` files by free text (matches session name and message content), character name filter, and optional date range. Returns matching sessions with inline message excerpts and a Load button. Route: `GET /sessions/search?q=&character=&from_date=&to_date=`.
+- **Token budget visualization + per-turn stats** (`/chat/diagnostics`): A stacked colour-coded bar at the top of the Diagnostics panel shows the current context-window allocation split across System prompt, History, RAG context, Examples, User input, Reserved, and Free headroom (green/yellow/red by fill %). The per-turn table now shows estimated Prompt tokens, estimated Completion tokens (chars/4), Context window % fill (colour-coded), and RAG chunks retrieved. A session-totals row below the table shows cumulative prompt/completion tokens and average context %. Backend: `ConversationManager.last_token_budget` dict populated from `ContextBudget` + `allocate_content()` return values in `_prepare_dynamic_vector_context()`; stored per trace in `_record_retrieval_trace`.
+- **Character avatar display + tabbed sidebar**: The chat sidebar is restructured into three tabs
+  — 🎭 Character, 💾 Sessions, 🔍 Debug — with a compact always-visible header showing a small
+  avatar and character name. The Character tab displays the full avatar image (if present) alongside
+  card metadata. Route: `GET /characters/avatar` returns the avatar as a `FileResponse`;
+  `_character_avatar_path()` searches `character_storage/<stem>/avatar.{ext}` then `cards/<stem>.{ext}`.
+  `has_avatar` bool is passed to the index template context.
+- **RAG file upload + create-collection from UI**: The RAG Files page now includes an "Upload
+  Source File" panel — file picker (`.txt`), auto-filled stem, optional collection name for
+  immediate ingest. Uploading without a collection name saves the file and refreshes the file list.
+  With a collection name it triggers a push job. Each lore file row has an "Ingest →" toggle that
+  reveals an inline form to build a collection from that file. The Collections page has a "Create
+  New Collection" section with a dropdown of existing file stems. New routes:
+  `POST /rag/files/upload` (multipart), `POST /rag/collections`.
+  New backend: `rag_manager.save_rag_file()`, `rag_manager.list_rag_stems()`.
+- **Bug fix — creating new ChromaDB collections**: `push_to_collection()` in
+  `scripts/rag/push_rag_data.py` previously only caught `ValueError` when deleting a non-existent
+  collection before recreating it. ChromaDB raises `chromadb.errors.NotFoundError` for missing
+  collections; that exception was uncaught and crashed the entire push. Fixed by widening the
+  `except` clause to use the already-defined `MISSING_COLLECTION_ERRORS` tuple
+  (`ValueError`, `NotFoundError`). This was a latent bug exposed by the first UI-driven
+  collection creation.
 
 Primary files:
 
 - `web_app.py`
 - `main.py`
 - `core/preset_profiles.py`
+- `core/rag_manager.py` (+ `save_rag_file`, `list_rag_stems`, `_character_avatar_path` helpers)
+- `core/job_queue.py`
+- `scripts/rag/push_rag_data.py` (bug fix: `MISSING_COLLECTION_ERRORS` in `push_to_collection`)
 - `templates/index.html`
 - `templates/chat_message_pair.html`
 - `templates/chat_messages.html`
 - `templates/chat_single_message.html`
 - `templates/diagnostics_panel.html`
 - `templates/presets_panel.html`
+- `templates/rag/layout.html` (+ 13 RAG partial templates incl. `upload_result.html`)
 
 ## Current Defaults Snapshot
 
diff --git a/docs/future_work/REFINEMENTS.md b/docs/future_work/REFINEMENTS.md
index b0c6ff0..c2b06a6 100644
--- a/docs/future_work/REFINEMENTS.md
+++ b/docs/future_work/REFINEMENTS.md
@@ -17,10 +17,25 @@ Implemented state lives in `docs/future_work/COPILOT_COMPACT_REFERENCE.md`.
 - ✅ Integrate conversation quality command into a single quality-gate workflow with retrieval and RAG-data checks. (2026-03-26)
 - ✅ Add CI regression policy for conversation quality baselines (warn vs hard fail by severity). (2026-03-26)
 - Add docs for fixture authoring rules and baseline refresh workflow.
+- **Character name mismatch on first turn (investigate).** On the first message of a session the
+  persona drift scorer may not match the character name correctly, producing an artificially high
+  drift score or misfire. Two candidate causes: (1) lazy initialisation — `character_name` may be
+  empty when the first `PersonaAnchor` is built, as card loading (`parse_prompt`) runs during
+  `__init__` before all attributes are set; (2) mes_example normalisation — the card linter
+  normalises `<USER>` / `<BOT>` markers to plain `user:` / `assistant:` format, stripping the
+  original character name from example turns, which may confuse the heuristic name-match on turn 1.
+  Investigation steps: add a log line in `_record_retrieval_trace` printing `character_name` and
+  `drift_score` at turn 1; check whether `PersonaAnchor.character_name` is populated before the
+  first call; and compare drift scores with and without mes_example injection on turn 1.
 
 ### RAG Data Quality
 
-*(All scoped items completed; implemented state is tracked in `docs/future_work/COPILOT_COMPACT_REFERENCE.md`.)*
+- **Shodan lore coverage is low.** The `rag_data/` source files for Shodan are sparse relative to the
+  character's depth. Coverage analysis shows many lore topics unmapped. Work needed: expand lore files
+  with canonical game text (System Shock 1 & 2 dialogue, environment descriptions, terminal messages),
+  re-run lint and coverage checks, then rebuild the collection.
+
+*(Previously scoped items completed; implemented state is tracked in `docs/future_work/COPILOT_COMPACT_REFERENCE.md`.)*
 
 ### Retrieval Quality
 
@@ -145,6 +160,134 @@ Each character maintains its own RAG collection and persona drift tracker. A tur
 **Large effort, Medium value.** Treat as a long-horizon milestone — do not start until §6–8 are
 stable. The only "Large" effort item in this backlog.
 
+### 11. Character Card Import & Avatar Support
+
+Improve the character loading pipeline to support richer card formats and give each character a
+visible identity in the UI.
+
+#### 11.1 Character Avatar / Icon Upload
+
+Each character should have an optional avatar image displayed in the chat UI next to assistant
+messages and in the character selector. Implementation:
+
+- Store avatars in `character_storage/<character_name>/avatar.png` (or `.jpg`, `.webp`).
+- Serve via `GET /characters/{name}/avatar` — returns the image, falls back to a generated
+  initial/monogram placeholder if no avatar is found.
+- Web UI: display avatar thumbnail in the chat header and optionally next to each assistant message
+  bubble. Upload button on the character settings page (see `UI_REFINEMENTS.md §C`).
+- Keep the image small (≤ 512 px, ≤ 200 KB) — resize on upload with Pillow.
+
+#### 11.2 Character Card V2 / V3 Import
+
+The project currently loads character data from plain JSON files in `cards/`. Extend this to
+support importing from standard character card formats used by the wider AI chat ecosystem.
+
+**Character Card V2 (PNG `chara` tEXt chunk):**
+- PNG files with a `chara` tEXt chunk containing base64-encoded JSON (TavernCardV2 format).
+- Fields map directly to existing config: `name`, `description`, `scenario`, `mes_example`,
+  `first_mes`, `personality`, `system_prompt`, `post_history_instructions`, `character_book`.
+- Already partially supported via `cards/leonardo_da_vinci.png` — formalise the import path.
+
+**Character Card V3 (CCv3 — the current community standard):**
+- Spec: <https://github.com/kwaroran/character-card-spec-v3/blob/main/SPEC_V3.md>
+- PNG/APNG: JSON embedded in `ccv3` tEXt chunk as UTF-8 → base64. If both `chara` and `ccv3`
+  chunks are present, prefer `ccv3`.
+- CHARX: zip file with `card.json` at root. Assets (icons, backgrounds, emotion sprites) live in
+  `assets/{type}/` subdirectories and can be accessed via `embeded://path` URIs.
+- JSON: plain `.json` file containing the CharacterCardV3 object directly.
+- V3 adds: `assets[]` (icon, background, emotion images), `nickname`, `group_only_greetings`,
+  `creation_date`, `modification_date`, `source[]`, multilingual creator notes.
+- **Implementation priority:** PNG V2 import is simplest and highest value (most cards in the wild
+  are V2 PNG). V3 PNG import is a small additional step. CHARX support can come later.
+- Use the `pypng` or `Pillow` library to read tEXt chunks; no heavyweight dependency needed.
+- On import: write a normalised JSON card to `cards/` and optionally extract the embedded avatar
+  to `character_storage/<name>/avatar.png`.
+
+**Suggested implementation order:**
+1. Formalise V2 PNG import (read `chara` chunk → normalise → save JSON + avatar).
+2. V3 PNG import (read `ccv3` chunk → normalise; fall back to `chara` if absent).
+3. Avatar display in web UI (§11.1 + `UI_REFINEMENTS.md §C`).
+4. CHARX import (zip extraction + asset handling).
+5. In-app card editor (§11.3 below).
+
+#### 11.3 In-App Character Card Editor
+
+A web-based form editor for creating and editing character cards without leaving the application.
+Several community implementations can be used as reference for field layout and PNG embedding:
+
+- [ZoltanAI/character-editor](https://github.com/ZoltanAI/character-editor) — lightweight
+  browser-side editor for V1/V2 cards; entirely static HTML/JS, good reference for field layout.
+- SillyTavern's built-in editor supports V2 fields and lorebook editing.
+- The [CCv3 spec](https://github.com/kwaroran/character-card-spec-v3/blob/main/SPEC_V3.md)
+  provides the canonical field reference for a V3-compatible editor.
+
+**Backend requirements:**
+
+- `GET /characters/{name}/edit` — load existing card fields into the edit form.
+- `POST /characters/{name}/edit` — validate and save edited fields to `cards/<name>.json`.
+- `GET /characters/new` / `POST /characters/new` — create a new card from scratch.
+- `POST /characters/{name}/export/png` — embed card JSON into a PNG tEXt chunk (`ccv3`) and
+  return the PNG for download. Uses the stored avatar as the base image.
+- `POST /characters/{name}/avatar` — upload a new avatar image (resize to ≤ 512 px with Pillow,
+  save to `character_storage/<stem>/avatar.png`). Replaces `UI_REFINEMENTS.md §C.2`.
+
+**Field coverage (minimum viable):**
+`name`, `description`, `scenario`, `personality`, `first_mes`, `mes_example`,
+`voice_instructions` (project-specific), `tags`, `creator`, `system_prompt`.
+Lorebook / `character_book` editing is out of scope for the initial version.
+
+**PNG embedding:**
+Read tEXt chunks with `struct` (stdlib) or `Pillow`; write `ccv3` chunk (base64-encoded UTF-8
+JSON). Also write a `chara` chunk for backward compatibility with V2 readers. No new heavy
+dependencies needed — `Pillow` is already a likely dependency for image resizing.
+
+**Effort:** Medium. The form and routing are straightforward; the PNG round-trip (read → edit →
+re-embed) is the only non-trivial part. Build after §11.1–11.2 so the parsing layer is shared.
+
+## §12 User-Facing Documentation Site
+
+A non-technical, friendly guide for people who want to use light-chat without programming knowledge,
+hosted alongside the repository as a static site.
+
+### Motivation
+
+The web UI has grown substantially (chat, RAG management, diagnostics, session search, character
+management). Many features have in-UI help text, but there is no cohesive end-user reference.
+A dedicated documentation site lowers the barrier to entry and helps non-technical users
+understand what the tool does and how to use it.
+
+### Hosting options (all compatible with GitHub Pages)
+
+| Option | Notes |
+|--------|-------|
+| **MkDocs Material** (recommended) | Python-based, clean modern theme, markdown source. Fits the project's Python tooling; `mkdocs gh-deploy` publishes to GitHub Pages. Add as a `uv` dev dependency. |
+| **Docsify** | Single HTML file + plain markdown; zero build step, works directly from a `docs/` folder on GitHub Pages. Good for rapid publishing. |
+| **Docusaurus** | Node.js/React, strong search and versioning. More setup overhead; worthwhile if the docs grow large. |
+
+**Recommended starting point:** MkDocs Material. One `mkdocs.yml` config, `uv add --dev mkdocs-material`,
+and `uv run mkdocs gh-deploy` is all that's needed. The source already lives in `docs/`.
+
+### Content scope (minimum viable)
+
+| Page | Audience-level description |
+|------|---------------------------|
+| **Welcome / What is this?** | Plain-language intro: local AI chatbot, character cards, no data sent to cloud |
+| **Getting started** | How to install, configure a model, and start the server |
+| **Using the chat** | Sending messages, sessions (save/load/search), keyboard shortcuts, export |
+| **Character cards** | What they are, where to put card files, adding an avatar image |
+| **Knowledge base (RAG)** | Plain-language: what a "collection" is, how to add a new character's info, what "coverage" means |
+| **Settings and profiles** | What each retrieval setting does in plain English; saving and applying profiles |
+| **Diagnostics panel** | What the token bar and per-turn table show; how to read drift scores |
+| **Troubleshooting** | Common errors, model not loading, no collections found, stream timeout |
+
+### Implementation notes
+
+- Place MkDocs source in `docs/` (already exists) with `mkdocs.yml` at the repository root.
+- Separate developer/contributor documentation (current `docs/`) from user-guide pages
+  (`docs/user_guide/`) using MkDocs navigation sections.
+- The in-UI help guides (chat sidebar and RAG page) can be reused or adapted as source material.
+- A GitHub Actions workflow can automate `mkdocs gh-deploy` on every push to `main`.
+
 *(Web UX and observability improvements are tracked in `docs/future_work/UI_REFINEMENTS.md`.)*
 
 ## Suggested Execution Order
@@ -159,10 +302,13 @@ stable. The only "Large" effort item in this backlog.
 8. ✅ Add retrieval trend rendering and debug export artifacts. (2026-03-26)
 9. Iterate on higher-level UX and explainability improvements — see `docs/future_work/UI_REFINEMENTS.md`.
 10. Add pressure-aware context compaction and per-turn token usage stats (§8).
-11. Implement Tier 1 markdown persona memory (§6) — requires user identity scoping first.
-12. Add conversation branching, character hot-reload, stop hooks, and skills macros (§7).
-13. CLI quality-of-life pass: themes and keybindings (§9).
-14. Multi-character conversation mode (§10) — long-horizon, after §6–8 are stable.
+11. Implement V2/V3 card import and avatar upload pipeline (§11.1–11.2).
+12. Build in-app character card editor with PNG export (§11.3 + `UI_REFINEMENTS.md §C.5`).
+13. Implement Tier 1 markdown persona memory (§6) — requires user identity scoping first.
+14. Add conversation branching, character hot-reload, stop hooks, and skills macros (§7).
+15. CLI quality-of-life pass: themes and keybindings (§9).
+16. Multi-character conversation mode (§10) — long-horizon, after §6–8 are stable.
+17. Publish user-facing documentation site (§12) — MkDocs Material on GitHub Pages.
 
 ## Next Steps
 
diff --git a/docs/future_work/UI_REFINEMENTS.md b/docs/future_work/UI_REFINEMENTS.md
index f68193b..e05119c 100644
--- a/docs/future_work/UI_REFINEMENTS.md
+++ b/docs/future_work/UI_REFINEMENTS.md
@@ -90,15 +90,14 @@ the `scripts/rag/` CLI toolset, accessible from the browser without a terminal.
 
 | Area | Features |
 |------|---------|
-| **RAG data files** | List, view, run linting, run coverage analysis |
-| **Collections** | List, inspect, delete, rebuild, query test |
+| **RAG data files** | List, view, upload new files, run linting, run coverage analysis |
+| **Collections** | List, inspect, delete, rebuild, create from uploaded file, query test |
 | **Fixture evaluation** | Run evaluate-fixtures, view results, view trend history |
 | **Embedding benchmarking** | Trigger benchmark run, view results |
 | **Collection migration** | Re-embed to new model, backfill fingerprints |
 
 Out of scope for this plan (requires broader changes):
 - In-browser text editing of `rag_data/` source files
-- File upload / new character creation
 - Real-time log streaming during long-running jobs (deferred to async job tracker)
 
 ### B.2 Routes
@@ -109,12 +108,14 @@ imports (no subprocess); UI responses use HTMX partial renders consistent with e
 | Method | Path | Purpose |
 |--------|------|---------|
 | GET | `/rag` | RAG management root panel |
-| GET | `/rag/files` | List `rag_data/` files with status badges |
+| GET | `/rag/files` | List `rag_data/` files with status badges; upload panel |
 | GET | `/rag/files/{filename}` | View file content (read-only) |
+| POST | `/rag/files/upload` | Upload a new `.txt` source file; optional immediate ingest |
 | POST | `/rag/lint` | Run message-example linting; return results table |
 | POST | `/rag/lint/fix` | Run linting with auto-fix; return diff summary |
 | POST | `/rag/coverage` | Run coverage analysis on a lore file; return score + report |
 | GET | `/rag/collections` | List ChromaDB collections with counts and fingerprints |
+| POST | `/rag/collections` | Create a new collection from an existing source file |
 | GET | `/rag/collections/{name}` | Collection detail: model, dimensions, sample docs |
 | DELETE | `/rag/collections/{name}` | Delete collection (with confirmation step) |
 | POST | `/rag/collections/{name}/query` | Ad-hoc test query; return top-k chunks with scores |
@@ -205,18 +206,97 @@ Or, given the project's existing pattern, call the CLI module functions directly
 ### B.8 Non-Goals (Deferred)
 
 - In-browser text editor for `rag_data/` source files (use VS Code or a dedicated CMS).
-- File upload for new character data (filesystem write from web raises deployment concerns).
 - Real-time log streaming for long-running jobs (stdout pipe to WebSocket — separate effort).
 - Multi-user / authentication (single-user local tool assumption).
 
 ---
 
+## C. Character Management UI
+
+UI surfaces for character card import, avatar upload, and character switching. Depends on
+`REFINEMENTS.md §11` backend work for card parsing and avatar storage.
+
+### C.1 Character Avatar Display
+
+Show a character avatar image in the chat interface.
+
+- Display the avatar in the chat header next to the character name.
+- Optionally show a small avatar thumbnail next to each assistant message bubble.
+- Fall back to a coloured monogram/initial placeholder if no avatar is set.
+- Source: `GET /characters/avatar` — served by the web app, returns the stored image or a
+  generated fallback.
+
+### C.2 Avatar Upload
+
+Allow uploading a custom avatar image for the active character.
+
+- Upload button in the character settings area (or a dedicated character management page).
+- Accepts PNG, JPEG, or WebP; server resizes to ≤ 512 px and saves to
+  `character_storage/<name>/avatar.png`.
+- Instant preview update after upload via HTMX partial replace.
+
+### C.3 Character Card Import
+
+A drag-and-drop or file-picker import flow for standard character card files.
+
+- Accepts: PNG (V2 `chara` chunk or V3 `ccv3` chunk), plain JSON (CCv2 or CCv3), and CHARX zip.
+- On import: extracts card fields, normalises to the project's JSON format, saves to `cards/`,
+  and optionally extracts the embedded avatar.
+- Shows a preview of extracted fields (name, description snippet, scenario snippet) before
+  confirming the import.
+- After import, allows immediately switching to the new character without restarting.
+- Route: `POST /characters/import` (multipart form upload).
+
+### C.4 Character Selector / Switcher
+
+A UI for browsing and switching the active character without restarting the server.
+
+- Lists all cards in `cards/` with avatar thumbnails, name, and a brief description snippet.
+- "Switch" button triggers a hot-reload (see `REFINEMENTS.md §7` character hot-reload).
+- Shows which character is currently active.
+- Route: `GET /characters` (list), `POST /characters/{name}/activate`.
+
+### C.5 In-App Character Card Editor
+
+A form-based editor for creating and editing character cards within the web UI. Several
+open-source implementations already exist and could be referenced or adapted:
+
+- [ZoltanAI/character-editor](https://github.com/ZoltanAI/character-editor) — standalone
+  browser-based editor for V1/V2 cards; good reference for field layout and PNG embedding.
+- SillyTavern has a built-in card editor that supports V2 and lorebook editing.
+- [character-card-spec-v3](https://github.com/kwaroran/character-card-spec-v3) provides the
+  canonical field reference for a V3-compatible editor.
+
+Scope for this project:
+
+- Edit core fields: name, description, scenario, personality, first message, mes_example,
+  voice instructions, tags.
+- Avatar upload inline (replaces §C.2 standalone upload).
+- Save as JSON to `cards/` and optionally export as CCv2/CCv3 PNG (embed in tEXt chunk).
+- Route: `GET /characters/{name}/edit`, `POST /characters/{name}/edit`.
+- Depends on `REFINEMENTS.md §11` card format backend and §C.3 import pipeline (shared parsing).
+
+**Note on avatar management without a full editor:** Until §C.5 is built, the simplest path
+is to drop an image file (`avatar.png`, `.jpg`, or `.webp`) into
+`character_storage/<character_stem>/` — the web app serves it automatically via
+`GET /characters/avatar`. The stem is the character name lowercased with spaces → underscores
+(e.g., "SHODAN" → `character_storage/shodan/avatar.jpg`).
+
+---
+
 ## Suggested Execution Order (UI)
 
-1. RAG Management UI (§B) as a self-contained milestone — implement §B.6 steps in order.
-2. Token budget visualization (§A.1) and per-turn token stats panel (§A.2) — low-risk extensions
+1. ✅ RAG Management UI (§B) as a self-contained milestone — implement §B.6 steps in order.
+2. ✅ Token budget visualization (§A.1) and per-turn token stats panel (§A.2) — low-risk extensions
    to the existing diagnostics panel; depends on `REFINEMENTS.md §8` backend work.
-3. Session history search (§A.4) — stateless read-only feature, no new backend state model needed.
-4. Conversation branching controls (§A.3) — depends on `REFINEMENTS.md §7` session state changes.
-5. Memory panel (§A.5) — depends on `REFINEMENTS.md §6` Tier 1 memory being implemented first.
-6. Skills dropdown (§A.6) — depends on `REFINEMENTS.md §7` skills config backend.
+3. ✅ Session history search (§A.4) — stateless read-only feature, no new backend state model needed.
+4. ✅ Character avatar display + tabbed sidebar (§C.1) — avatar served from `character_storage/<stem>/`.
+5. ✅ RAG file upload + create collection from UI (§B.1/B.2 extension) — `POST /rag/files/upload`,
+   `POST /rag/collections`; "Ingest →" per-file action; upload-and-ingest combined flow.
+6. Conversation branching controls (§A.3) — depends on `REFINEMENTS.md §7` session state changes.
+7. Memory panel (§A.5) — depends on `REFINEMENTS.md §6` Tier 1 memory being implemented first.
+8. Skills dropdown (§A.6) — depends on `REFINEMENTS.md §7` skills config backend.
+9. Avatar upload UI (§C.2) — small addition; no major backend dependency.
+10. Character card import UI (§C.3) — depends on `REFINEMENTS.md §11.2` import backend.
+11. Character switcher (§C.4) — depends on `REFINEMENTS.md §7` character hot-reload.
+12. In-app character card editor (§C.5) — largest UI item; depends on §C.3 + §C.4.
diff --git a/scripts/rag/push_rag_data.py b/scripts/rag/push_rag_data.py
index 2cc77bc..4265a89 100644
--- a/scripts/rag/push_rag_data.py
+++ b/scripts/rag/push_rag_data.py
@@ -236,7 +236,7 @@ def push_to_collection(
         try:
             context.client.delete_collection(collection_name)
             logger.info(f"Deleted existing collection: {collection_name}")
-        except ValueError:
+        except MISSING_COLLECTION_ERRORS:
             logger.debug(f"Collection {collection_name} doesn't exist, creating new")
     else:
         assert_collection_fingerprint_compatible(context.client, collection_name, expected_fingerprint)
diff --git a/templates/diagnostics_panel.html b/templates/diagnostics_panel.html
index d4d6b50..2183eeb 100644
--- a/templates/diagnostics_panel.html
+++ b/templates/diagnostics_panel.html
@@ -1,29 +1,69 @@
 <div id="diag-content">
+{% if last_budget and last_budget.context_window and last_budget.context_window > 0 %}{# budget bar needs a positive window size; a missing/None value must not reach the comparison or the divisions below #}
+{% set cw = last_budget.context_window %}
+{% set sys_pct  = (last_budget.system_prompt_tokens  / cw * 100) | round(1) %}
+{% set hist_pct = (last_budget.history_tokens         / cw * 100) | round(1) %}
+{% set rag_pct  = (last_budget.rag_tokens             / cw * 100) | round(1) %}
+{% set ex_pct   = (last_budget.examples_tokens        / cw * 100) | round(1) %}
+{% set inp_pct  = (last_budget.input_tokens           / cw * 100) | round(1) %}
+{% set res_pct  = (last_budget.reserved_for_response  / cw * 100) | round(1) %}
+{% set used_pct = (last_budget.total_estimated        / cw * 100) | round(1) %}
+<div class="budget-section">
+  <div class="budget-label">
+    Context window: <strong>{{ last_budget.total_estimated }}</strong> / {{ cw }} tokens
+    <span class="budget-pct {% if used_pct > 90 %}bpct-red{% elif used_pct > 70 %}bpct-yellow{% else %}bpct-green{% endif %}">{{ used_pct }}%</span>
+  </div>
+  <div class="budget-bar" title="System: {{ sys_pct }}% | History: {{ hist_pct }}% | RAG: {{ rag_pct }}% | Examples: {{ ex_pct }}% | Input: {{ inp_pct }}% | Reserved: {{ res_pct }}%">
+    <div class="budget-seg seg-system"   style="width:{{ sys_pct }}%"  title="System prompt: {{ last_budget.system_prompt_tokens }} tok ({{ sys_pct }}%)"></div>
+    <div class="budget-seg seg-history"  style="width:{{ hist_pct }}%" title="History: {{ last_budget.history_tokens }} tok ({{ hist_pct }}%)"></div>
+    <div class="budget-seg seg-rag"      style="width:{{ rag_pct }}%"  title="RAG context: {{ last_budget.rag_tokens }} tok ({{ rag_pct }}%)"></div>
+    <div class="budget-seg seg-examples" style="width:{{ ex_pct }}%"   title="Examples: {{ last_budget.examples_tokens }} tok ({{ ex_pct }}%)"></div>
+    <div class="budget-seg seg-input"    style="width:{{ inp_pct }}%"  title="User input: {{ last_budget.input_tokens }} tok ({{ inp_pct }}%)"></div>
+    <div class="budget-seg seg-reserved" style="width:{{ res_pct }}%"  title="Reserved for response: {{ last_budget.reserved_for_response }} tok ({{ res_pct }}%)"></div>
+    <div class="budget-seg seg-headroom" style="flex:1"                title="Headroom (free)"></div>
+  </div>
+  <div class="budget-legend">
+    <span class="leg seg-system">System</span>
+    <span class="leg seg-history">History</span>
+    <span class="leg seg-rag">RAG</span>
+    <span class="leg seg-examples">Examples</span>
+    <span class="leg seg-input">Input</span>
+    <span class="leg seg-reserved">Reserved</span>
+    <span class="leg seg-headroom">Free</span>
+  </div>
+</div>
+{% endif %}
 {% if history %}
 <table class="diag-table">
     <thead>
         <tr>
-            <th>T</th>
-            <th>Latency</th>
-            <th>Chars</th>
-            <th>Main</th>
-            <th>MES</th>
-            <th>Cross−</th>
-            <th>Drift</th>
+            <th title="Turn number">T</th>
+            <th title="Response latency">Latency</th>
+            <th title="Estimated prompt tokens">Prompt~</th>
+            <th title="Estimated completion tokens">Compl~</th>
+            <th title="Context window fill %">Ctx%</th>
+            <th title="RAG chunks retrieved (main)">RAG</th>
+            <th title="Persona drift score">Drift</th>
         </tr>
     </thead>
     <tbody>
     {% for entry in history %}
         {% set r = entry.retrieval if entry.retrieval else {} %}
-        {% set cl = r.cleanup if r.cleanup else {} %}
         {% set drift = entry.persona.drift_score if entry.persona else none %}
+        {% set tb = entry.token_budget if entry.token_budget else {} %}
+        {% set cw = tb.context_window if tb.context_window else 0 %}
+        {% set used = tb.total_estimated if tb.total_estimated else 0 %}
+        {% set ctx_pct = (used / cw * 100) | round(0) | int if cw > 0 else none %}
+        {% set main_chunks = r.main.returned if r.main is defined else 0 %}
         <tr>
             <td>{{ entry.turn }}</td>
             <td>{{ "%.2fs" | format(entry.latency_s) if entry.latency_s is not none else "—" }}</td>
-            <td>{{ entry.chars_emitted if entry.chars_emitted is not none else "—" }}</td>
-            <td>{{ cl.main if cl.main is defined else 0 }}</td>
-            <td>{{ cl.mes if cl.mes is defined else 0 }}</td>
-            <td>{{ cl.cross_removed if cl.cross_removed is defined else 0 }}</td>
+            <td>{{ used if used > 0 else "—" }}</td>
+            <td>{{ entry.estimated_completion_tokens if entry.estimated_completion_tokens is not none else "—" }}</td>
+            <td{% if ctx_pct is not none %} style="color: {% if ctx_pct > 90 %}#f8b4b4{% elif ctx_pct > 70 %}#ffd166{% else %}#a8d8a8{% endif %}"{% endif %}>
+                {{ ctx_pct ~ "%" if ctx_pct is not none else "—" }}
+            </td>
+            <td>{{ main_chunks }}</td>
             <td{% if drift is not none %} style="color: {% if drift >= fail_threshold %}#f8b4b4{% elif drift >= warn_threshold %}#ffd166{% else %}#a8d8a8{% endif %}"{% endif %}>
                 {{ "%.3f" | format(drift) if drift is not none else "—" }}
             </td>
@@ -31,6 +71,23 @@
     {% endfor %}
     </tbody>
 </table>
+{# Session totals: only turns that recorded a positive token estimate are counted. #}{% set ns = namespace(total_prompt=0, total_compl=0, count=0) %}
+{% for entry in history %}
+    {% set tb = entry.token_budget if entry.token_budget else {} %}
+    {% if tb.total_estimated and tb.total_estimated > 0 %}
+        {% set ns.total_prompt = ns.total_prompt + tb.total_estimated %}
+        {% set ns.total_compl  = ns.total_compl  + (entry.estimated_completion_tokens or 0) %}
+        {% set ns.count = ns.count + 1 %}
+    {% endif %}
+{% endfor %}
+{% if ns.count > 0 %}
+<div class="diag-totals">
+  Session totals — Prompt: <strong>{{ ns.total_prompt }}</strong> tok &nbsp;·&nbsp;
+  Completion: <strong>{{ ns.total_compl }}</strong> tok &nbsp;·&nbsp;
+  Avg ctx: <strong>{% if last_budget and last_budget.context_window %}{{ (ns.total_prompt / ns.count / last_budget.context_window * 100) | round(1) }}%{% else %}—{% endif %}</strong>
+  ({{ ns.count }} turn{{ "s" if ns.count != 1 else "" }})
+</div>
+{% endif %}
 {% else %}
 <span class="diag-empty">No turns recorded yet.</span>
 {% endif %}
diff --git a/templates/index.html b/templates/index.html
index 4aa450b..235643c 100644
--- a/templates/index.html
+++ b/templates/index.html
@@ -31,16 +31,121 @@
         }
 
         .sidebar h1 {
-            margin: 0 0 0.5rem;
+            margin: 0;
+            font-size: 1rem;
+            white-space: nowrap;
+            overflow: hidden;
+            text-overflow: ellipsis;
+        }
+
+        .sidebar-header {
+            display: flex;
+            align-items: center;
+            gap: 0.55rem;
+            margin-bottom: 0.75rem;
+        }
+
+        .sidebar-avatar-sm {
+            width: 38px;
+            height: 38px;
+            border-radius: 50%;
+            object-fit: cover;
+            flex-shrink: 0;
+            border: 2px solid #2d3743;
+        }
+
+        .sidebar-avatar-sm-placeholder {
+            width: 38px;
+            height: 38px;
+            border-radius: 50%;
+            background: #1f2d3d;
+            border: 2px solid #2d3743;
+            display: flex;
+            align-items: center;
+            justify-content: center;
             font-size: 1.1rem;
+            font-weight: 700;
+            color: #7cb3e8;
+            flex-shrink: 0;
         }
 
-        .meta {
-            font-size: 0.9rem;
+        /* Sidebar tabs */
+        .sidebar-tabs {
+            display: flex;
+            gap: 2px;
+            margin-bottom: 0;
+        }
+
+        .sidebar-tab {
+            flex: 1;
+            padding: 0.35rem 0.2rem;
+            font-size: 0.73rem;
+            font-weight: 600;
+            background: #0f1317;
+            border: 1px solid #2d3743;
+            border-bottom: none;
+            border-radius: 5px 5px 0 0;
+            color: #8b949e;
+            cursor: pointer;
+            text-align: center;
+            transition: color 0.15s, background 0.15s;
+        }
+
+        .sidebar-tab:hover { color: #c9d1d9; }
+
+        .sidebar-tab.active {
+            background: #161b22;
+            color: #e6edf3;
+            border-color: #3d4751;
+        }
+
+        .sidebar-pane {
+            display: none;
+            border: 1px solid #3d4751;
+            border-radius: 0 0 8px 8px;
+            padding: 0.75rem;
+            background: #0f1317;
+        }
+
+        .sidebar-pane.active { display: block; }
+
+        /* Character tab */
+        .char-avatar-wrap {
+            display: flex;
+            justify-content: center;
+            margin-bottom: 0.75rem;
+        }
+
+        .char-avatar {
+            width: 180px;
+            height: 180px;
+            border-radius: 12px;
+            object-fit: cover;
+            border: 2px solid #2d3743;
+        }
+
+        .char-avatar-placeholder {
+            width: 180px;
+            height: 180px;
+            border-radius: 12px;
+            background: #1f2d3d;
+            border: 2px solid #2d3743;
+            display: flex;
+            align-items: center;
+            justify-content: center;
+            font-size: 4rem;
+            font-weight: 700;
+            color: #7cb3e8;
+        }
+
+        .char-meta {
+            font-size: 0.82rem;
             color: #98a6b6;
-            line-height: 1.5;
+            line-height: 1.7;
         }
 
+        .char-meta strong { color: #c9d1d9; }
+
         .sidebar-actions {
             display: grid;
             grid-template-columns: 1fr 1fr;
@@ -317,6 +422,65 @@
             color: #98a6b6;
         }
 
+        /* Token budget bar */
+        .budget-section {
+            margin: 0.5rem 0 0.75rem;
+        }
+        .budget-label {
+            font-size: 0.75rem;
+            color: #c5cdd6;
+            margin-bottom: 4px;
+            display: flex;
+            align-items: center;
+            gap: 0.4rem;
+        }
+        .budget-pct {
+            font-size: 0.7rem;
+            padding: 1px 5px;
+            border-radius: 3px;
+            font-weight: 600;
+        }
+        .bpct-green  { background: #1e3a2a; color: #a8d8a8; }
+        .bpct-yellow { background: #3a2e10; color: #ffd166; }
+        .bpct-red    { background: #3a1a1a; color: #f8b4b4; }
+        .budget-bar {
+            display: flex;
+            height: 12px;
+            border-radius: 4px;
+            overflow: hidden;
+            background: #1a1e2e;
+            cursor: help;
+        }
+        .budget-seg { min-width: 0; transition: width 0.4s; }
+        .seg-system   { background: #7c6fdc; }
+        .seg-history  { background: #3a9bd5; }
+        .seg-rag      { background: #48c774; }
+        .seg-examples { background: #f9a825; }
+        .seg-input    { background: #ff7043; }
+        .seg-reserved { background: #667788; }
+        .seg-headroom { background: #252840; flex: 1; }
+        .budget-legend {
+            display: flex;
+            flex-wrap: wrap;
+            gap: 4px 8px;
+            margin-top: 4px;
+        }
+        .budget-legend .leg {
+            font-size: 0.65rem;
+            padding: 1px 5px;
+            border-radius: 2px;
+            color: #0a0a14;
+            font-weight: 600;
+            opacity: 0.9;
+        }
+        .diag-totals {
+            font-size: 0.72rem;
+            color: #98a6b6;
+            margin-top: 0.5rem;
+            padding-top: 0.4rem;
+            border-top: 1px solid #2a2e3e;
+        }
+
         .profile-current-table {
             margin-top: 0.5rem;
         }
@@ -433,11 +597,139 @@
             color: #c9d1d9;
         }
 
-        .guide-item p {
-            margin: 0;
-            font-size: 0.77rem;
+        .search-result-item {
+            padding: 0.4rem 0.5rem;
+            border: 1px solid #2d3743;
+            border-radius: 6px;
+            background: #111418;
+            margin-top: 0.3rem;
+        }
+
+        .search-result-header {
+            display: flex;
+            align-items: baseline;
+            gap: 0.3rem;
+            margin-bottom: 0.2rem;
+            flex-wrap: wrap;
+        }
+
+        .search-result-name {
+            font-size: 0.78rem;
+            font-weight: 600;
+            color: #c9d1d9;
+            flex: 1;
+            min-width: 0;
+            overflow: hidden;
+            text-overflow: ellipsis;
+            white-space: nowrap;
+        }
+
+        .badge-char {
+            font-size: 0.68rem;
+            background: #1a2b3b;
+            color: #79c0ff;
+            padding: 0.1rem 0.35rem;
+            border-radius: 8px;
+            white-space: nowrap;
+        }
+
+        .search-result-date {
+            font-size: 0.7rem;
             color: #98a6b6;
-            line-height: 1.45;
+            white-space: nowrap;
+        }
+
+        .search-snippet {
+            font-size: 0.73rem;
+            color: #98a6b6;
+            line-height: 1.35;
+            margin-bottom: 0.15rem;
+            word-break: break-word;
+        }
+
+        .snip-role {
+            font-size: 0.65rem;
+            font-weight: 700;
+            text-transform: uppercase;
+            color: #4e8bc4;
+            margin-right: 0.25rem;
+        }
+
+        .search-load-btn {
+            margin-top: 0.3rem;
+            padding: 0.22rem 0.45rem;
+            font-size: 0.74rem;
+            background: #1e242b;
+            border: 1px solid #2d3743;
+            border-radius: 5px;
+            color: #79c0ff;
+            cursor: pointer;
+        }
+
+        .search-load-btn:hover {
+            background: #262d36;
+        }
+
+        #session-search summary {
+            font-size: 0.8rem;
+            color: #98a6b6;
+            cursor: pointer;
+            list-style: none;
+            padding: 0.25rem 0;
+            margin-top: 0.35rem;
+        }
+
+        #session-search summary::after {
+            content: " ▸";
+            font-size: 0.7rem;
+        }
+
+        #session-search[open] summary::after {
+            content: " ▾";
+        }
+
+        .search-form {
+            display: flex;
+            flex-direction: column;
+            gap: 0.3rem;
+            margin-top: 0.4rem;
+        }
+
+        .search-form input[type="text"],
+        .search-form input[type="date"] {
+            border: 1px solid #2d3743;
+            background: #111418;
+            color: #e6edf3;
+            border-radius: 5px;
+            padding: 0.3rem 0.45rem;
+            font-size: 0.78rem;
+            width: 100%;
+            box-sizing: border-box;
+        }
+
+        .search-form input[type="date"]::-webkit-calendar-picker-indicator {
+            filter: invert(0.65);
+        }
+
+        .search-date-row {
+            display: grid;
+            grid-template-columns: 1fr 1fr;
+            gap: 0.3rem;
+        }
+
+        .search-submit-btn {
+            padding: 0.3rem 0.5rem;
+            font-size: 0.78rem;
+            background: #1f6feb;
+            border: 1px solid #1f6feb;
+            border-radius: 5px;
+            color: white;
+            cursor: pointer;
+        }
+
+        #session-search-results {
+            max-height: 360px;
+            overflow-y: auto;
         }
     </style>
 </head>
@@ -445,12 +737,17 @@
 <body>
     <div class="layout">
         <aside class="sidebar">
-            <h1>{{ character_name }}</h1>
-            <div class="meta">
-                <div><strong>Model:</strong> {{ model_name or "N/A" }}</div>
-                <div><strong>Type:</strong> {{ model_type or "N/A" }}</div>
-                <div><strong>RAG:</strong> {{ rag_collection or "N/A" }}</div>
+            <!-- Always-visible compact header -->
+            <div class="sidebar-header">
+                {% if has_avatar %}
+                <img class="sidebar-avatar-sm" src="/characters/avatar" alt="{{ character_name }}" />
+                {% else %}
+                <div class="sidebar-avatar-sm-placeholder">{{ character_name[0] | upper if character_name else "?" }}</div>
+                {% endif %}
+                <h1>{{ character_name }}</h1>
             </div>
+
+            <!-- Action buttons always visible -->
             <div class="sidebar-actions">
                 <button type="button" id="help-btn" hx-post="/chat/action/help" hx-target="#chat-log"
                     hx-swap="beforeend">Help</button>
@@ -461,8 +758,32 @@ <h1>{{ character_name }}</h1>
                 <button type="button" id="load-latest-btn" hx-post="/chat/session/load-latest" hx-target="#chat-log"
                     hx-swap="innerHTML">Load Latest</button>
             </div>
-            <div class="session-panel">
-                <h2>Sessions</h2>
+
+            <!-- Tab bar -->
+            <div class="sidebar-tabs">
+                <button type="button" class="sidebar-tab active" data-tab="character">🎭 Character</button>
+                <button type="button" class="sidebar-tab" data-tab="sessions">💾 Sessions</button>
+                <button type="button" class="sidebar-tab" data-tab="debug">🔍 Debug</button>
+            </div>
+
+            <!-- Character tab -->
+            <div class="sidebar-pane active" id="tab-character">
+                <div class="char-avatar-wrap">
+                    {% if has_avatar %}
+                    <img class="char-avatar" src="/characters/avatar" alt="{{ character_name }}" />
+                    {% else %}
+                    <div class="char-avatar-placeholder">{{ character_name[0] | upper if character_name else "?" }}</div>
+                    {% endif %}
+                </div>
+                <div class="char-meta">
+                    <div><strong>Model:</strong> {{ model_name or "N/A" }}</div>
+                    <div><strong>Type:</strong> {{ model_type or "N/A" }}</div>
+                    <div><strong>RAG:</strong> {{ rag_collection or "N/A" }}</div>
+                </div>
+            </div>
+
+            <!-- Sessions tab -->
+            <div class="sidebar-pane" id="tab-sessions">
                 <div class="session-row">
                     <input id="session-name" type="text" placeholder="Session name (optional)" maxlength="80" />
                     <button type="button" id="save-named-btn">Save</button>
@@ -472,64 +793,85 @@ <h2>Sessions</h2>
                     <button type="button" id="load-selected-btn">Load</button>
                 </div>
                 <button type="button" id="refresh-sessions-btn">Refresh List</button>
+                <details id="session-search">
+                    <summary>🔍 Search sessions</summary>
+                    <form class="search-form"
+                        hx-get="/sessions/search"
+                        hx-target="#session-search-results"
+                        hx-swap="innerHTML"
+                        hx-trigger="submit">
+                        <input type="text" name="q" placeholder="Search text in messages…" maxlength="200" />
+                        <input type="text" name="character" placeholder="Character name filter…" maxlength="80" />
+                        <div class="search-date-row">
+                            <input type="date" name="from_date" title="From date" />
+                            <input type="date" name="to_date" title="To date" />
+                        </div>
+                        <button type="submit" class="search-submit-btn">Search</button>
+                    </form>
+                    <div id="session-search-results"></div>
+                </details>
             </div>
-            <div class="debug-panel">
-                <h2>Retrieval Debug</h2>
-                <div id="debug-content">No retrievals yet.</div>
-                <div id="debug-history-content">No retrieval history yet.</div>
-                <button type="button" id="refresh-debug-btn">Refresh Debug</button>
-            </div>
-            <details class="diag-panel">
-                <summary>Diagnostics</summary>
-                <div id="diag-content"><span class="diag-empty">No turns recorded yet.</span></div>
-                <button type="button" id="refresh-diag-btn">Refresh</button>
-            </details>
-            <details class="presets-panel"
-                     hx-get="/settings/profiles"
-                     hx-trigger="toggle once"
-                     hx-target="#presets-content"
-                     hx-swap="outerHTML">
-                <summary>Presets</summary>
-                <div id="presets-content">
-                    <span class="profile-empty">Loading…</span>
-                </div>
-            </details>
-            <a class="rag-link-btn" href="/rag">⚙ RAG Manager →</a>
-            <details class="guide-panel">
-                <summary>💡 How to use this chat</summary>
-                <div class="guide-item">
-                    <h3>Sending messages</h3>
-                    <p>Type in the box at the bottom and press <strong>Send</strong> (or hit Enter). The character will reply in real time. If the reply gets cut off, press <strong>Continue</strong> to pick up where it left off.</p>
-                </div>
-                <div class="guide-item">
-                    <h3>Clear &amp; Reload</h3>
-                    <p><strong>Clear</strong> removes messages from the screen but keeps the character loaded. <strong>Reload</strong> fully restarts the character — useful if responses drift off-topic or feel broken.</p>
-                </div>
-                <div class="guide-item">
-                    <h3>Sessions — saving &amp; loading</h3>
-                    <p>Type an optional name and press <strong>Save</strong> to store the current conversation. Use the dropdown to pick a past conversation and press <strong>Load</strong> to restore it. <strong>Load Latest</strong> skips the menu and restores your most recent save.</p>
-                </div>
-                <div class="guide-item">
-                    <h3>Copy Last &amp; Export</h3>
-                    <p><strong>Copy Last</strong> puts the character's most recent reply on your clipboard. The Export buttons let you download the full conversation as a plain text file, a structured JSON file, or a ZIP bundle that includes metadata.</p>
-                </div>
-                <div class="guide-item">
-                    <h3>RAG — the knowledge base</h3>
-                    <p>The <strong>RAG</strong> value at the top shows which knowledge collection the character is using. This is a database of text the AI can search through when answering your messages — think of it as the character's long-term memory or reference library. You can manage these collections in the <strong>RAG Manager</strong>.</p>
-                </div>
-                <div class="guide-item">
-                    <h3>Retrieval Debug</h3>
-                    <p>Shows what information was fetched from the knowledge base to help answer your last message — how many chunks were found, how they were ranked, and which collection was searched. Useful for understanding why the character knows (or doesn't know) something.</p>
-                </div>
-                <div class="guide-item">
-                    <h3>Diagnostics</h3>
-                    <p>Advanced statistics about response quality, token counts, and persona consistency scores. Mainly useful for developers fine-tuning the character.</p>
-                </div>
-                <div class="guide-item">
-                    <h3>Presets</h3>
-                    <p>Save and restore AI model settings (temperature, context size, repetition penalties, etc.). If you've found a configuration that works well, save it as a preset so you can switch back to it quickly.</p>
+
+            <!-- Debug tab -->
+            <div class="sidebar-pane" id="tab-debug">
+                <div class="debug-panel">
+                    <h2>Retrieval Debug</h2>
+                    <div id="debug-content">No retrievals yet.</div>
+                    <div id="debug-history-content">No retrieval history yet.</div>
+                    <button type="button" id="refresh-debug-btn">Refresh Debug</button>
                 </div>
-            </details>
+                <details class="diag-panel">
+                    <summary>Diagnostics</summary>
+                    <div id="diag-content"><span class="diag-empty">No turns recorded yet.</span></div>
+                    <button type="button" id="refresh-diag-btn">Refresh</button>
+                </details>
+                <details class="presets-panel"
+                         hx-get="/settings/profiles"
+                         hx-trigger="toggle once"
+                         hx-target="#presets-content"
+                         hx-swap="outerHTML">
+                    <summary>Presets</summary>
+                    <div id="presets-content">
+                        <span class="profile-empty">Loading…</span>
+                    </div>
+                </details>
+                <a class="rag-link-btn" href="/rag">⚙ RAG Manager →</a>
+                <details class="guide-panel">
+                    <summary>💡 How to use this chat</summary>
+                    <div class="guide-item">
+                        <h3>Sending messages</h3>
+                        <p>Type in the box at the bottom and press <strong>Send</strong> (or hit Enter). The character will reply in real time. If the reply gets cut off, press <strong>Continue</strong> to pick up where it left off.</p>
+                    </div>
+                    <div class="guide-item">
+                        <h3>Clear &amp; Reload</h3>
+                        <p><strong>Clear</strong> removes messages from the screen but keeps the character loaded. <strong>Reload</strong> fully restarts the character — useful if responses drift off-topic or feel broken.</p>
+                    </div>
+                    <div class="guide-item">
+                        <h3>Sessions — saving &amp; loading</h3>
+                        <p>Type an optional name and press <strong>Save</strong> to store the current conversation. Use the dropdown to pick a past conversation and press <strong>Load</strong> to restore it. <strong>Load Latest</strong> skips the menu and restores your most recent save. Use <strong>Search sessions</strong> to find older conversations by keyword, character name, or date.</p>
+                    </div>
+                    <div class="guide-item">
+                        <h3>Copy Last &amp; Export</h3>
+                        <p><strong>Copy Last</strong> puts the character's most recent reply on your clipboard. The Export buttons let you download the full conversation as a plain text file, a structured JSON file, or a ZIP bundle that includes metadata.</p>
+                    </div>
+                    <div class="guide-item">
+                        <h3>RAG — the knowledge base</h3>
+                        <p>The <strong>RAG</strong> value in the <strong>Character</strong> tab shows which knowledge collection the character is using. This is a database of text the AI can search through when answering your messages — think of it as the character's long-term memory or reference library. You can manage these collections in the <strong>RAG Manager</strong>.</p>
+                    </div>
+                    <div class="guide-item">
+                        <h3>Retrieval Debug</h3>
+                        <p>Shows what information was fetched from the knowledge base to help answer your last message — how many chunks were found, how they were ranked, and which collection was searched. Useful for understanding why the character knows (or doesn't know) something.</p>
+                    </div>
+                    <div class="guide-item">
+                        <h3>Diagnostics</h3>
+                        <p>Advanced statistics shown after each reply: a colour-coded bar shows how the AI's memory window is split between the character description, conversation history, retrieved knowledge, and your message. The table shows estimated token counts per turn and how full the context window is. Green = plenty of room; yellow = getting full; red = nearly at the limit.</p>
+                    </div>
+                    <div class="guide-item">
+                        <h3>Presets</h3>
+                        <p>Save and restore AI model settings (temperature, context size, repetition penalties, etc.). If you've found a configuration that works well, save it as a preset so you can switch back to it quickly.</p>
+                    </div>
+                </details>
+            </div>
         </aside>
 
         <main class="main">
@@ -559,6 +901,17 @@ <h3>Presets</h3>
     </div>
 
     <script>
+        // Sidebar tab switching
+        document.querySelectorAll(".sidebar-tab").forEach((btn) => {
+            btn.addEventListener("click", () => {
+                document.querySelectorAll(".sidebar-tab").forEach((b) => b.classList.remove("active"));
+                document.querySelectorAll(".sidebar-pane").forEach((p) => p.classList.remove("active"));
+                btn.classList.add("active");
+                const pane = document.getElementById("tab-" + btn.dataset.tab);
+                if (pane) pane.classList.add("active");
+            });
+        });
+
         const chatForm = document.getElementById("chat-form");
         const chatLog = document.getElementById("chat-log");
         const userInput = document.getElementById("user-input");
diff --git a/templates/rag/collections_list.html b/templates/rag/collections_list.html
index 23df393..e1a070a 100644
--- a/templates/rag/collections_list.html
+++ b/templates/rag/collections_list.html
@@ -41,3 +41,44 @@
 {% else %}
 <p class="rag-empty">No collections found in <code>character_storage/</code>.</p>
 {% endif %}
+
+<div class="rag-subsection">
+    <div class="rag-subsection-header">➕ Create New Collection</div>
+    <p style="font-size:0.78rem;color:#98a6b6;margin:0 0 0.65rem">
+        Build a searchable knowledge base from a source file already in <code>rag_data/</code>.
+        The embedding model and chunk settings from your current config will be used.
+        This may take a minute or two depending on file size.
+    </p>
+    <form hx-post="/rag/collections"
+          hx-target="#create-collection-result"
+          hx-swap="innerHTML"
+          hx-indicator="#create-spinner"
+          style="display:flex;flex-direction:column;gap:0.5rem">
+        <div class="rag-form-row">
+            <label class="rag-label">Collection name:</label>
+            <input type="text" name="collection_name" class="rag-input" style="width:180px"
+                   placeholder="e.g. shodan" required
+                   pattern="[a-zA-Z0-9_\-]+" title="Letters, digits, underscores and hyphens only" />
+        </div>
+        <div class="rag-form-row">
+            <label class="rag-label">Source file:</label>
+            {% if existing_stems %}
+            <select name="stem" class="rag-select">
+                {% for s in existing_stems %}
+                <option value="{{ s }}">{{ s }}.txt</option>
+                {% endfor %}
+            </select>
+            {% else %}
+            <input type="text" name="stem" class="rag-input" style="width:180px"
+                   placeholder="e.g. shodan"
+                   pattern="[a-zA-Z0-9_\-]+" required />
+            <span class="rag-label">(no files found in <code>rag_data/</code> — upload one first)</span>
+            {% endif %}
+        </div>
+        <div class="rag-btn-group" style="margin-bottom:0">
+            <button type="submit" class="rag-btn rag-btn-primary">Create Collection</button>
+            <span id="create-spinner" class="htmx-indicator">Building…</span>
+        </div>
+    </form>
+    <div id="create-collection-result" style="margin-top:0.65rem;"></div>
+</div>
diff --git a/templates/rag/files_list.html b/templates/rag/files_list.html
index 518f222..ae2a5ba 100644
--- a/templates/rag/files_list.html
+++ b/templates/rag/files_list.html
@@ -1,5 +1,52 @@
 <div class="rag-section-header">RAG Files</div>
 
+{% if uploaded %}
+<div class="rag-msg rag-msg-ok">✓ Uploaded <strong>{{ uploaded }}</strong> to <code>rag_data/</code>.</div>
+{% endif %}
+
+<div style="border:1px solid #2d3743;border-radius:8px;padding:0.85rem;margin-bottom:1rem;background:#0f1317;">
+    <div class="rag-subsection-header" style="margin-bottom:0.55rem;">📤 Upload Source File</div>
+    <p style="font-size:0.78rem;color:#98a6b6;margin:0 0 0.65rem">
+        Upload a <code>.txt</code> file to <code>rag_data/</code>.
+        Optionally enter a collection name to build the knowledge base immediately after uploading.
+    </p>
+    <form hx-post="/rag/files/upload"
+          hx-target="#rag-main"
+          hx-swap="innerHTML"
+          hx-encoding="multipart/form-data"
+          hx-indicator="#upload-spinner"
+          style="display:flex;flex-direction:column;gap:0.5rem">
+        <div class="rag-form-row">
+            <label class="rag-label">File (.txt):</label>
+            <input type="file" name="file" accept=".txt" required
+                   class="rag-input"
+                   onchange="
+                     var n = this.files[0] ? this.files[0].name.replace(/\.txt$/i,'') : '';
+                     var s = n.toLowerCase().replace(/[^a-z0-9_-]/g,'_').replace(/^_+|_+$/g,'');
+                     document.getElementById('upload-stem').value = s;
+                     document.getElementById('upload-collection').value = s;
+                   " />
+        </div>
+        <div class="rag-form-row">
+            <label class="rag-label">Stem:</label>
+            <input type="text" name="stem" id="upload-stem" required
+                   class="rag-input rag-input-wide"
+                   placeholder="Auto-filled from filename"
+                   pattern="[a-zA-Z0-9_\-]+" title="Letters, digits, underscores and hyphens only" />
+        </div>
+        <div class="rag-form-row">
+            <label class="rag-label">Collection name <span style="color:#636e7b">(optional)</span>:</label>
+            {# Optional field: the pattern is only enforced when a value is entered, mirroring the server-side name check. #}
+            <input type="text" name="collection_name" id="upload-collection"
+                   class="rag-input rag-input-wide"
+                   placeholder="Leave blank to upload only"
+                   pattern="[a-zA-Z0-9_\-]+" title="Letters, digits, underscores and hyphens only" />
+        </div>
+        <div class="rag-btn-group" style="margin-bottom:0">
+            <button type="submit" class="rag-btn rag-btn-primary">Upload</button>
+            <span id="upload-spinner" class="htmx-indicator">Uploading…</span>
+        </div>
+    </form>
+</div>
+
 <div class="rag-btn-group">
     <button class="rag-btn"
         hx-post="/rag/lint" hx-target="#lint-results" hx-swap="innerHTML"
@@ -48,6 +95,29 @@
                     hx-target="#coverage-results" hx-swap="innerHTML"
                     hx-indicator="#coverage-spinner">Coverage</button>
                 {% endif %}
+                {% if f.type == "lore" %}
+                <button class="rag-btn"
+                    onclick="
+                      var d=document.getElementById('ingest-{{ f.stem }}');
+                      d.style.display = d.style.display==='none' ? 'block' : 'none';
+                    ">Ingest →</button>
+                <div id="ingest-{{ f.stem }}" style="display:none;margin-top:0.45rem">
+                    <form hx-post="/rag/collections"
+                          hx-target="#ingest-result-{{ f.stem }}"
+                          hx-swap="innerHTML"
+                          hx-indicator="#ingest-spin-{{ f.stem }}"
+                          style="display:flex;gap:0.4rem;align-items:center;flex-wrap:wrap">
+                        <input type="hidden" name="stem" value="{{ f.stem }}" />
+                        {# Same name constraint as the other collection-name inputs in the RAG UI. #}
+                        <input type="text" name="collection_name"
+                               class="rag-input" style="width:150px"
+                               placeholder="Collection name"
+                               pattern="[a-zA-Z0-9_\-]+" title="Letters, digits, underscores and hyphens only"
+                               value="{{ f.stem }}" required />
+                        <button type="submit" class="rag-btn rag-btn-primary">Build</button>
+                        <span id="ingest-spin-{{ f.stem }}" class="htmx-indicator">Building…</span>
+                    </form>
+                    <div id="ingest-result-{{ f.stem }}" style="margin-top:0.4rem"></div>
+                </div>
+                {% endif %}
             </td>
         </tr>
     {% endfor %}
diff --git a/templates/rag/layout.html b/templates/rag/layout.html
index 3e5c3ab..ea0463b 100644
--- a/templates/rag/layout.html
+++ b/templates/rag/layout.html
@@ -411,7 +411,7 @@
                 <div style="font-size:0.74rem;color:#98a6b6;line-height:1.5;margin-top:0.5rem;display:flex;flex-direction:column;gap:0.6rem;">
                     <div>
                         <strong style="color:#c9d1d9">Collections</strong><br>
-                        A collection is a searchable knowledge base — a database of text chunks the AI searches through during chat. Each character typically has one named after them.
+                        A collection is a searchable knowledge base — a database of text chunks the AI searches through during chat. Each character typically has one named after them. Use <em>Create New Collection</em> to build one from a source file.
                     </div>
                     <div>
                         <strong style="color:#c9d1d9">Detail &amp; Query</strong><br>
@@ -419,7 +419,7 @@
                     </div>
                     <div>
                         <strong style="color:#c9d1d9">Files</strong><br>
-                        The raw text documents (lore files, dialogue examples) that the knowledge base is built from. You can view them, check formatting, and see coverage.
+                        The raw text documents (lore files, dialogue examples) that the knowledge base is built from. You can upload new files, view them, check formatting, and see coverage.
                     </div>
                     <div>
                         <strong style="color:#c9d1d9">Lint</strong><br>
diff --git a/templates/rag/upload_result.html b/templates/rag/upload_result.html
new file mode 100644
index 0000000..1c7718f
--- /dev/null
+++ b/templates/rag/upload_result.html
@@ -0,0 +1,16 @@
+<div class="rag-msg rag-msg-ok">✓ Uploaded <strong>{{ filename }}</strong> to <code>rag_data/</code>.</div>
+
+<p style="font-size:0.82rem;color:#98a6b6;margin:0.25rem 0 0.75rem">
+    Building collection <strong>{{ collection_name }}</strong>…
+</p>
+
+{% include "rag/push_status.html" %}
+
+<p style="margin-top:0.85rem;font-size:0.78rem;color:#636e7b">
+    <button class="rag-btn"
+        hx-get="/rag/files"
+        hx-target="#rag-main" hx-swap="innerHTML">← Back to Files</button>
+    <button class="rag-btn" style="margin-left:0.4rem"
+        hx-get="/rag/collections"
+        hx-target="#rag-main" hx-swap="innerHTML">View Collections</button>
+</p>
diff --git a/templates/sessions_search_results.html b/templates/sessions_search_results.html
new file mode 100644
index 0000000..e051155
--- /dev/null
+++ b/templates/sessions_search_results.html
@@ -0,0 +1,28 @@
+{% if results %}
+<p style="font-size:0.74rem;color:#98a6b6;margin:0.4rem 0 0.4rem">
+    {{ results | length }} session(s) found
+</p>
+{% for s in results %}
+<div class="search-result-item">
+    <div class="search-result-header">
+        <span class="search-result-name" title="{{ s.session_name }}">{{ s.session_name }}</span>
+        {% if s.character_name %}
+        <span class="badge-char">{{ s.character_name }}</span>
+        {% endif %}
+        <span class="search-result-date">{{ s.saved_at }}</span>
+    </div>
+    {% for snip in s.snippets %}
+    <div class="search-snippet">
+        <span class="snip-role">{{ snip.role }}</span>{{ snip.excerpt }}
+    </div>
+    {% endfor %}
+    {# tojson serialises the id as real JSON (quotes/backslashes escaped); keep the attribute single-quoted. #}
+    <button type="button" class="search-load-btn"
+        hx-post="/chat/session/load"
+        hx-vals='{{ {"session_id": s.session_id} | tojson }}'
+        hx-target="#chat-log"
+        hx-swap="innerHTML">Load</button>
+</div>
+{% endfor %}
+{% else %}
+<p style="font-size:0.78rem;color:#98a6b6;margin:0.4rem 0 0">No matching sessions found.</p>
+{% endif %}
diff --git a/web_app.py b/web_app.py
index ea5e240..979f255 100644
--- a/web_app.py
+++ b/web_app.py
@@ -14,8 +14,8 @@
 from datetime import UTC, datetime
 from pathlib import Path
 
-from fastapi import FastAPI, Form, Query, Request
-from fastapi.responses import HTMLResponse, JSONResponse, Response, StreamingResponse
+from fastapi import FastAPI, File, Form, Query, Request, UploadFile
+from fastapi.responses import FileResponse, HTMLResponse, JSONResponse, Response, StreamingResponse
 from fastapi.templating import Jinja2Templates
 from loguru import logger
 from pydantic import BaseModel
@@ -34,6 +34,19 @@ class StreamRequest(BaseModel):
     continue_mode: bool = False
 
 
+# HTML error fragment sent back with HTTP 400 when a submitted file stem
+# fails rag_manager.is_valid_stem().
+_INVALID_STEM_HTML = (
+    "<p class='text-error'>"
+    "Invalid stem: only letters, digits, underscores, and hyphens are allowed."
+    "</p>"
+)
+# HTML error fragment sent back with HTTP 400 when a submitted collection
+# name fails the same validation.
+_INVALID_COLL_HTML = (
+    "<p class='text-error'>"
+    "Invalid collection name: only letters, digits, underscores, and hyphens are allowed."
+    "</p>"
+)
+# Largest upload accepted by _validate_upload_content().
+_MAX_UPLOAD_BYTES: int = 10 * 1024 * 1024  # 10 MB
+
+
 class ChatRuntime:
     """Holds shared chat runtime state for web requests."""
 
@@ -178,6 +191,125 @@ def _session_listing(runtime: ChatRuntime) -> list[dict[str, str]]:
     return sessions
 
 
+class _SessionSearchParams:
+    """Normalized search parameters for ``_search_sessions``.
+
+    Text filters are stripped and lower-cased. Date bounds are parsed from
+    ``YYYY-MM-DD`` strings into UTC-aware datetimes; empty or unparseable
+    values become ``None``, meaning "no bound on this side".
+    """
+
+    # Length of the ``YYYY-MM-DD`` prefix of an ISO-8601 timestamp string.
+    ISO_DATE_LEN: int = 10
+
+    def __init__(  # noqa: PLR0913
+        self,
+        q: str = "",
+        character: str = "",
+        from_date: str = "",
+        to_date: str = "",
+        max_results: int = 30,
+        max_snippets: int = 3,
+    ) -> None:
+        """Normalize the raw query values.
+
+        Args:
+            q: Free-text query; stored stripped and lower-cased as ``q_lower``.
+            character: Character-name filter; stored as ``char_lower``.
+            from_date: Inclusive lower date bound (``YYYY-MM-DD``) or empty.
+            to_date: Inclusive upper date bound (``YYYY-MM-DD``) or empty.
+            max_results: Maximum number of sessions to return.
+            max_snippets: Maximum number of excerpts per session.
+        """
+        self.q_lower = q.strip().lower()
+        self.char_lower = character.strip().lower()
+        self.max_results = max_results
+        self.max_snippets = max_snippets
+        self.from_dt = self._parse_date(from_date)
+        self.to_dt = self._parse_date(to_date, end_of_day=True)
+
+    @staticmethod
+    def _parse_date(date_str: str, *, end_of_day: bool = False) -> datetime | None:
+        """Parse ``YYYY-MM-DD`` into a UTC-aware datetime.
+
+        Args:
+            date_str: Date text to parse; may be empty.
+            end_of_day: When true, return the last representable instant of
+                that day instead of midnight.
+
+        Returns:
+            The parsed datetime, or ``None`` if ``date_str`` is empty or does
+            not match the expected format.
+        """
+        if not date_str:
+            return None
+        try:
+            parsed = datetime.strptime(date_str, "%Y-%m-%d").replace(tzinfo=UTC)
+        except ValueError:
+            return None
+        if end_of_day:
+            # Include the microseconds too: timestamps such as 23:59:59.5 must
+            # still fall inside an inclusive upper bound for that day.
+            return parsed.replace(hour=23, minute=59, second=59, microsecond=999999)
+        return parsed
+
+
+def _session_in_date_range(saved_at_str: str, from_dt: datetime | None, to_dt: datetime | None) -> bool:
+    """Report whether a session timestamp lies inside an optional date window.
+
+    Args:
+        saved_at_str: ISO-8601 timestamp string for the session.
+        from_dt: Inclusive lower bound, or None for no lower bound.
+        to_dt: Inclusive upper bound, or None for no upper bound.
+
+    Returns:
+        True when neither bound is given, when the timestamp cannot be parsed
+        (such sessions are not filtered out), or when it lies within the bounds.
+    """
+    if not (from_dt or to_dt):
+        return True
+    try:
+        stamp = datetime.fromisoformat(saved_at_str)
+    except ValueError:
+        # An unparseable timestamp never excludes a session.
+        return True
+    if stamp.tzinfo is None:
+        # Naive timestamps are read as UTC before being compared with the bounds.
+        stamp = stamp.replace(tzinfo=UTC)
+    if from_dt and stamp < from_dt:
+        return False
+    if to_dt and stamp > to_dt:
+        return False
+    return True
+
+
+def _build_snippets(ui_messages: list[dict[str, str]], q_lower: str, max_snippets: int) -> list[dict[str, str]]:
+    """Collect short excerpts around the first occurrence of q_lower in each message.
+
+    Args:
+        ui_messages: Messages with "role" and "content" entries.
+        q_lower: Lower-cased search text.
+        max_snippets: Collection stops once this many excerpts were gathered.
+
+    Returns:
+        One ``{"role", "excerpt"}`` dict per matching message, in message order.
+        Each excerpt spans up to 45 characters before and 100 after the match,
+        with "…" marking a truncated side.
+    """
+    found: list[dict[str, str]] = []
+    needle_len = len(q_lower)
+    for message in ui_messages:
+        text = message.get("content", "")
+        hit = text.lower().find(q_lower)
+        if hit < 0:
+            continue
+        lo = max(0, hit - 45)
+        hi = min(len(text), hit + needle_len + 100)
+        lead = "…" if lo > 0 else ""
+        trail = "…" if hi < len(text) else ""
+        found.append({"role": message["role"], "excerpt": f"{lead}{text[lo:hi]}{trail}"})
+        if len(found) >= max_snippets:
+            break
+    return found
+
+
+def _search_sessions(  # noqa: PLR0913
+    runtime: ChatRuntime,
+    q: str = "",
+    character: str = "",
+    from_date: str = "",
+    to_date: str = "",
+    max_results: int = 30,
+    max_snippets: int = 3,
+) -> list[dict[str, object]]:
+    """Search saved session JSON files by text, character name and date range.
+
+    Args:
+        runtime: Runtime whose session files are scanned.
+        q: Free-text query matched against the session name and message content.
+        character: Substring filter on the stored character name.
+        from_date: Inclusive lower date bound (``YYYY-MM-DD``) or empty.
+        to_date: Inclusive upper date bound (``YYYY-MM-DD``) or empty.
+        max_results: Scanning stops once this many sessions matched.
+        max_snippets: Maximum excerpts collected per session.
+
+    Returns:
+        One dict per matching session with ``session_id``, ``session_name``,
+        ``character_name``, ``saved_at`` (date prefix only) and ``snippets``.
+        Files that cannot be read or parsed, or whose payload is not a dict,
+        are skipped.
+    """
+    params = _SessionSearchParams(q, character, from_date, to_date, max_results, max_snippets)
+    matches: list[dict[str, object]] = []
+
+    for session_file in _list_session_files(runtime):
+        try:
+            data = json.loads(session_file.read_text(encoding="utf-8"))
+        except Exception:
+            logger.warning("Could not parse session file {}", session_file.name)
+            continue
+        if not isinstance(data, dict):
+            continue
+
+        # The id is the file stem without its "session_" prefix; it doubles as
+        # the display name when the payload carries none.
+        session_id = session_file.stem.removeprefix("session_")
+        display_name = str(data.get("session_name") or session_id)
+        char_name = str(data.get("character_name") or "")
+        saved_at = str(data.get("saved_at") or "")
+        messages = _coerce_ui_messages(data.get("ui_messages"))
+
+        if params.char_lower and params.char_lower not in char_name.lower():
+            continue
+        if not _session_in_date_range(saved_at, params.from_dt, params.to_dt):
+            continue
+
+        excerpts: list[dict[str, str]] = []
+        if params.q_lower:
+            excerpts = _build_snippets(messages, params.q_lower, params.max_snippets)
+            # With a text query, keep the session only if its name or content matches.
+            if not excerpts and params.q_lower not in display_name.lower():
+                continue
+
+        matches.append(
+            {
+                "session_id": session_id,
+                "session_name": display_name,
+                "character_name": char_name,
+                "saved_at": saved_at[: _SessionSearchParams.ISO_DATE_LEN],
+                "snippets": excerpts,
+            }
+        )
+        if len(matches) >= params.max_results:
+            break
+
+    return matches
+
+
 def _record_retrieval_trace(
     runtime: ChatRuntime,
     message: str,
@@ -192,8 +324,10 @@ def _record_retrieval_trace(
         "query": message[:200],
         "latency_s": round(latency_s, 2) if latency_s is not None else None,
         "chars_emitted": chars_emitted,
+        "estimated_completion_tokens": round(chars_emitted / 4) if chars_emitted is not None else None,
         "retrieval": manager.last_retrieval_debug,
         "persona": manager.last_persona_drift,
+        "token_budget": dict(manager.last_token_budget),
     }
     runtime.retrieval_history.append(trace)
     history_cap = runtime.MAX_RETRIEVAL_HISTORY_ENTRIES
@@ -218,6 +352,22 @@ def _coerce_ui_messages(raw_messages: object) -> list[dict[str, str]]:
     return parsed
 
 
+def _character_avatar_path(character_name: str) -> Path | None:
+    """Return the path to the character's avatar image, or None if not found.
+
+    The name is reduced to a lower-case stem in which every non-alphanumeric
+    character becomes "_" (leading/trailing underscores removed). Candidates
+    are tried in this order, each with png/jpg/jpeg/webp:
+
+    1. ``character_storage/<stem>/avatar.<ext>``
+    2. ``cards/<stem>.<ext>``
+
+    Args:
+        character_name: Display name of the character.
+
+    Returns:
+        The first candidate that is an existing regular file, else None.
+    """
+    stem = "".join(ch.lower() if ch.isalnum() else "_" for ch in character_name).strip("_")
+    if not stem:
+        # A blank or all-punctuation name would otherwise probe
+        # character_storage/avatar.* and cards/.png, which belong to no character.
+        return None
+    extensions = ("png", "jpg", "jpeg", "webp")
+    # Dedicated asset folder first, then an image sitting next to the card.
+    candidates = [Path("character_storage") / stem / f"avatar.{ext}" for ext in extensions]
+    candidates += [Path("cards") / f"{stem}.{ext}" for ext in extensions]
+    # is_file() rather than exists(): a directory with a matching name is not an avatar.
+    return next((candidate for candidate in candidates if candidate.is_file()), None)
+
+
 @app.get("/", response_class=HTMLResponse)
 async def index(request: Request) -> HTMLResponse:
     """Render chat page."""
@@ -229,10 +379,23 @@ async def index(request: Request) -> HTMLResponse:
         "model_name": str(runtime.manager.configs.get("MODEL", "")),
         "model_type": str(runtime.manager.configs.get("MODEL_TYPE", "")),
         "rag_collection": str(runtime.manager.rag_collection),
+        "has_avatar": _character_avatar_path(runtime.manager.character_name) is not None,
     }
     return templates.TemplateResponse(request=request, name="index.html", context=context)
 
 
+@app.get("/characters/avatar")
+async def character_avatar(request: Request) -> FileResponse:
+    """Return the active character's avatar file, or respond 404 when none exists."""
+    from fastapi import HTTPException  # noqa: PLC0415
+
+    avatar = _character_avatar_path(_get_runtime(request).manager.character_name)
+    if avatar is not None:
+        return FileResponse(avatar)
+    raise HTTPException(status_code=404, detail="No avatar found")
+
+
 @app.get("/health")
 async def health(request: Request) -> dict[str, object]:
     """Lightweight health endpoint for runtime diagnostics."""
@@ -319,6 +482,7 @@ async def chat_diagnostics(request: Request) -> HTMLResponse:
     history = list(reversed(runtime.retrieval_history))
     html = templates.get_template("diagnostics_panel.html").render(
         history=history,
+        last_budget=dict(manager.last_token_budget),
         warn_threshold=manager.runtime_config.persona_drift_warning_threshold,
         fail_threshold=manager.runtime_config.persona_drift_fail_threshold,
     )
@@ -589,14 +753,33 @@ async def chat_session_load(request: Request, session_id: str = Form(...)) -> HT
         return HTMLResponse(content=_render_chat_log(runtime.ui_messages))
 
 
+@app.get("/sessions/search", response_class=HTMLResponse)
+async def sessions_search(
+    request: Request,
+    q: str = Query(default=""),
+    character: str = Query(default=""),
+    from_date: str = Query(default=""),
+    to_date: str = Query(default=""),
+) -> HTMLResponse:
+    """Search saved sessions and render the matches as an HTMX partial.
+
+    An empty body is returned when no filter at all was supplied; otherwise
+    the search runs in a worker thread and the results template is rendered.
+    """
+    has_filter = any((q.strip(), character.strip(), from_date, to_date))
+    if not has_filter:
+        return HTMLResponse(content="")
+    matches = await asyncio.to_thread(_search_sessions, _get_runtime(request), q, character, from_date, to_date)
+    context = {"request": request, "results": matches, "q": q}
+    return templates.TemplateResponse("sessions_search_results.html", context)
+
+
 def _render_profiles_panel(request: Request) -> HTMLResponse:
     runtime = _get_runtime(request)
     store = _get_profile_store(request)
-    html = templates.get_template("presets_panel.html").render(
+    rendered_html = templates.get_template("presets_panel.html").render(
         profiles=store.list_profiles(),
         current=store.current_values(runtime.manager.runtime_config),
     )
-    return HTMLResponse(content=html)
+    return HTMLResponse(content=rendered_html)
 
 
 @app.get("/settings/profiles", response_class=HTMLResponse)
@@ -656,9 +839,10 @@ async def rag_page(request: Request) -> HTMLResponse:
 async def rag_collections(request: Request) -> HTMLResponse:
     config = _get_rag_config(request)
     collections = await asyncio.to_thread(rag_manager.list_collections, config)
+    stems = await asyncio.to_thread(rag_manager.list_rag_stems, config)
     return templates.TemplateResponse(
         "rag/collections_list.html",
-        {"request": request, "collections": collections},
+        {"request": request, "collections": collections, "existing_stems": stems},
     )
 
 
@@ -667,9 +851,7 @@ async def rag_collection_detail(request: Request, name: str) -> HTMLResponse:
     config = _get_rag_config(request)
     info = await asyncio.to_thread(rag_manager.collection_info, config, name)
     if info is None:
-        return HTMLResponse(
-            content=f"<p>Collection <b>{html.escape(name)}</b> not found.</p>", status_code=404
-        )
+        return HTMLResponse(content=f"<p>Collection <b>{html.escape(name)}</b> not found.</p>", status_code=404)
     return templates.TemplateResponse(
         "rag/collection_detail.html",
         {"request": request, "info": info},
@@ -779,6 +961,109 @@ async def rag_file_view(request: Request, filename: str) -> HTMLResponse:
     )
 
 
+def _validate_upload_content(content: bytes) -> HTMLResponse | None:
+    """Check an uploaded payload for size and encoding.
+
+    Args:
+        content: Raw bytes of the uploaded file.
+
+    Returns:
+        A 400 HTMLResponse describing the problem when the payload exceeds
+        _MAX_UPLOAD_BYTES or is not valid UTF-8; None when it is acceptable.
+    """
+    problem: str | None = None
+    if len(content) > _MAX_UPLOAD_BYTES:
+        problem = (
+            f"<p class='text-error'>File too large:"
+            f" maximum allowed size is {_MAX_UPLOAD_BYTES // (1024 * 1024)} MB.</p>"
+        )
+    else:
+        try:
+            content.decode("utf-8")
+        except UnicodeDecodeError:
+            problem = "<p class='text-error'>Invalid file: only UTF-8 encoded text files are accepted.</p>"
+    if problem is None:
+        return None
+    return HTMLResponse(content=problem, status_code=400)
+
+
+@app.post("/rag/files/upload", response_class=HTMLResponse)
+async def rag_file_upload(
+    request: Request,
+    stem: str = Form(...),
+    file: UploadFile = File(...),  # noqa: B008
+    collection_name: str = Form(""),
+) -> HTMLResponse:
+    """Upload a .txt source file to rag_data/. Optionally create a collection immediately.
+
+    Args:
+        request: Incoming request; supplies the RAG config and job store.
+        stem: Name to store the file under; must pass ``rag_manager.is_valid_stem``.
+        file: The uploaded file; must be UTF-8 text no larger than ``_MAX_UPLOAD_BYTES``.
+        collection_name: Optional collection to build from the file right after saving.
+
+    Returns:
+        * 400 with an error fragment for an invalid stem, invalid collection
+          name, oversized file or non-UTF-8 content. Nothing is written in
+          any of these cases.
+        * 500 with an error fragment when saving the file fails.
+        * ``rag/upload_result.html`` with a pending push job when a collection
+          name was given.
+        * ``rag/files_list.html`` with the refreshed file list otherwise.
+    """
+    clean_stem = stem.strip()
+    if not rag_manager.is_valid_stem(clean_stem):
+        return HTMLResponse(content=_INVALID_STEM_HTML, status_code=400)
+    # Validate the optional collection name up front so that a rejected request
+    # does not leave a freshly written file behind.
+    clean_coll = collection_name.strip()
+    if clean_coll and not rag_manager.is_valid_stem(clean_coll):
+        return HTMLResponse(content=_INVALID_COLL_HTML, status_code=400)
+    # One byte past the limit is enough to detect an oversized upload without
+    # buffering the whole body in memory.
+    content = await file.read(_MAX_UPLOAD_BYTES + 1)
+    if (err := _validate_upload_content(content)) is not None:
+        return err
+    config = _get_rag_config(request)
+    try:
+        file_info = await asyncio.to_thread(rag_manager.save_rag_file, config, clean_stem, content)
+    except Exception as exc:
+        logger.warning("Failed to save uploaded file {!r}: {}", clean_stem, exc)
+        return HTMLResponse(
+            content=f"<p class='text-error'>Upload failed: {html.escape(str(exc))}</p>",
+            status_code=500,
+        )
+    if clean_coll:
+        job_store = _get_job_store(request)
+        job_id = job_store.submit(rag_manager.push_collection, config, clean_stem, clean_coll)
+        return templates.TemplateResponse(
+            "rag/upload_result.html",
+            {
+                "request": request,
+                "filename": file_info["name"],
+                "collection_name": clean_coll,
+                "job_id": job_id,
+                "status": "pending",
+                "elapsed_s": 0,
+                "result": None,
+                "error": None,
+                "kind": "push",
+            },
+        )
+    files = await asyncio.to_thread(rag_manager.list_rag_files, config)
+    return templates.TemplateResponse(
+        "rag/files_list.html",
+        {"request": request, "files": files, "uploaded": file_info["name"]},
+    )
+
+
+@app.post("/rag/collections", response_class=HTMLResponse)
+async def rag_collection_create(
+    request: Request,
+    collection_name: str = Form(...),
+    stem: str = Form(...),
+) -> HTMLResponse:
+    """Create a new collection by ingesting an existing rag_data source file.
+
+    Args:
+        request: Incoming request; supplies the RAG config and job store.
+        collection_name: Name of the collection to build; required and must
+            pass ``rag_manager.is_valid_stem``.
+        stem: Stem of the source file to ingest; must pass ``rag_manager.is_valid_stem``.
+
+    Returns:
+        400 with an error fragment when either value is invalid or the name is
+        blank; otherwise ``rag/push_status.html`` for the submitted push job in
+        its initial "pending" state.
+    """
+    clean_stem = stem.strip()
+    clean_name = collection_name.strip()
+    if not rag_manager.is_valid_stem(clean_stem):
+        return HTMLResponse(content=_INVALID_STEM_HTML, status_code=400)
+    if not clean_name:
+        return HTMLResponse(
+            content="<p class='text-error'>Collection name is required.</p>",
+            status_code=400,
+        )
+    # Apply the same name rule as the upload endpoint; client-side patterns
+    # alone cannot be trusted and not every form sets one.
+    if not rag_manager.is_valid_stem(clean_name):
+        return HTMLResponse(content=_INVALID_COLL_HTML, status_code=400)
+    config = _get_rag_config(request)
+    job_store = _get_job_store(request)
+    job_id = job_store.submit(rag_manager.push_collection, config, clean_stem, clean_name)
+    return templates.TemplateResponse(
+        "rag/push_status.html",
+        {
+            "request": request,
+            "job_id": job_id,
+            "status": "pending",
+            "elapsed_s": 0,
+            "result": None,
+            "error": None,
+            "kind": "push",
+        },
+    )
+
+
 @app.post("/rag/lint", response_class=HTMLResponse)
 async def rag_lint(request: Request) -> HTMLResponse:
     config = _get_rag_config(request)