From 75605c7f71d1fb0dfd29aaf0e7003df73514acc0 Mon Sep 17 00:00:00 2001
From: ryderwishart <ryderwishart@gmail.com>
Date: Tue, 12 May 2026 16:46:29 -0600
Subject: [PATCH] Add character audio export functionality and update audio
 export options

- Introduced a new `characterAudioExporter` module for consolidating audio exports by character.
- Updated `exportHandler` to support new options for consolidating audio and specifying audio formats.
- Enhanced the project export view to include a preview feature for character audio.
- Added new entries to `.gitignore` for Glance memory shards.
- Made several functions in `audioExporter` module publicly accessible for use in the new character audio export logic.
---
 .gitignore                                  |   3 +
 src/exportHandler/audioExporter.ts          |  16 +-
 src/exportHandler/characterAudioExporter.ts | 552 ++++++++++++++++++++
 src/exportHandler/exportHandler.ts          |  32 +-
 src/projectManager/projectExportView.ts     | 305 ++++++++++-
 5 files changed, 892 insertions(+), 16 deletions(-)
 create mode 100644 src/exportHandler/characterAudioExporter.ts
diff --git a/.gitignore b/.gitignore
index f77a45c33..1dc717627 100644
--- a/.gitignore
+++ b/.gitignore
@@ -18,3 +18,6 @@ webviews/codex-webviews/vite.config.ts.timestamp-*.mjs
 
 # AI coding agents
 .claude/
+
+# Glance memory shards
+.glance/
diff --git a/src/exportHandler/audioExporter.ts b/src/exportHandler/audioExporter.ts
index 878496d38..e688678be 100644
--- a/src/exportHandler/audioExporter.ts
+++ b/src/exportHandler/audioExporter.ts
@@ -15,6 +15,10 @@ export const initializeAudioExporter = (context: vscode.ExtensionContext): void
     extensionContext = context;
 };
 
+export function getAudioExporterContext(): vscode.ExtensionContext | undefined { // accessor so sibling exporters can reuse the stored context
+    return extensionContext; // assigned by initializeAudioExporter(); presumably undefined before that call — confirm
+}
+
 // Debug logging for audio export diagnostics
 const DEBUG = false;
 function debug(...args: any[]) {
@@ -28,7 +32,7 @@ type ExportAudioOptions = {
 };
 
 
-function sanitizeFileComponent(input: string): string {
+export function sanitizeFileComponent(input: string): string {
     return input
         .replace(/\s+/g, "_")
         .replace(/[^a-zA-Z0-9._-]/g, "-")
@@ -108,7 +112,7 @@ function formatTimeRangeSuffix(start?: number, end?: number): string {
     return `_${s || ""}-${e || ""}`;
 }
 
-function getTargetLanguageCode(): string {
+export function getTargetLanguageCode(): string {
     const projectConfig = vscode.workspace.getConfiguration("codex-project-manager");
     const lang = projectConfig.get<any>("targetLanguage") || {};
     const code: string = lang.tag || lang.refName || "lang";
@@ -430,19 +434,19 @@ async function prepareAudioForExport(
     return { bytes: original, ext };
 }
 
-async function readNotebook(uri: vscode.Uri): Promise<CodexNotebookAsJSONData> {
+export async function readNotebook(uri: vscode.Uri): Promise<CodexNotebookAsJSONData> {
     const bytes = await vscode.workspace.fs.readFile(uri);
     return JSON.parse(Buffer.from(bytes).toString());
 }
 
-function isActiveCell(cell: any): boolean {
+export function isActiveCell(cell: any): boolean {
     const data = cell?.metadata?.data;
     const isMerged = !!(data && data.merged);
     const isDeleted = !!(data && data.deleted);
     return !isMerged && !isDeleted;
 }
 
-function pickAudioAttachmentForCell(cell: any): { id: string; url: string; start?: number; end?: number; } | null {
+export function pickAudioAttachmentForCell(cell: any): { id: string; url: string; start?: number; end?: number; } | null {
     const attachments = cell?.metadata?.attachments || {};
     if (!attachments || typeof attachments !== "object") return null;
     const selectedId: string | undefined = cell?.metadata?.selectedAudioId;
@@ -467,7 +471,7 @@ function pickAudioAttachmentForCell(cell: any): { id: string; url: string; start
     return candidates[0];
 }
 
-async function pathExists(uri: vscode.Uri): Promise<boolean> {
+export async function pathExists(uri: vscode.Uri): Promise<boolean> {
     try { await vscode.workspace.fs.stat(uri); return true; } catch { return false; }
 }
 
diff --git a/src/exportHandler/characterAudioExporter.ts b/src/exportHandler/characterAudioExporter.ts
new file mode 100644
index 000000000..aae807e9a
--- /dev/null
+++ b/src/exportHandler/characterAudioExporter.ts
@@ -0,0 +1,552 @@
+import * as vscode from "vscode";
+import { basename } from "path";
+import { CodexNotebookAsJSONData } from "@types";
+import { execFile } from "child_process";
+import { promisify } from "util";
+import * as os from "os";
+import * as fs from "fs";
+import * as path from "path";
+import { getFFmpegPath } from "../utils/ffmpegManager";
+import { EditMapUtils } from "../utils/editMapUtils";
+import {
+    sanitizeFileComponent,
+    getTargetLanguageCode,
+    pickAudioAttachmentForCell,
+    isActiveCell,
+    readNotebook,
+    pathExists,
+    getAudioExporterContext,
+} from "./audioExporter";
+
+const execFileAsync = promisify(execFile);
+
+const DEBUG = false; // flip to true to turn on the debug() output below
+function debug(...args: any[]) { // console.log wrapper that tags output with this module's name
+    if (DEBUG) {
+        console.log("[CharacterAudioExporter]", ...args);
+    }
+}
+
+export type CharacterAudioFormat = "wav" | "flac" | "opus";
+
+interface CharacterClip { // one audio attachment placed on a character's timeline
+    absolutePath: string; // filesystem path of the attachment picked for the cell
+    startMs: number; // cell startTime in ms, floored and clamped to >= 0
+    endMs?: number; // cell endTime in ms, floored; left unset unless endTime > startTime
+    cellId: string; // metadata.id of the source cell
+}
+
+interface CharacterInterval { // one timed cell as shown in the preview
+    startSec: number; // cell startTime
+    endSec: number; // cell endTime, or startSec + 0.5 when endTime is missing or not after startTime
+    hasAudio: boolean; // true when an audio attachment could be picked for the cell
+}
+
+export interface CharacterPreviewCharacter { // preview summary for one character within one file
+    label: string; // label of the first cell that produced this key
+    key: string; // lower-cased, sanitized label; "unlabeled" when there is none
+    intervals: CharacterInterval[]; // timed cells, sorted by startSec
+    audioCellCount: number; // timed cells that have audio
+    noAudioCellCount: number; // timed cells that have no audio
+    untimedCellCount: number; // cells without a usable startTime (not included in intervals)
+    speakingSecAudio: number; // summed interval length over intervals with audio
+    speakingSecNoAudio: number; // summed interval length over intervals without audio
+    lastEndSec: number; // latest endSec among intervals with audio; 0 when there are none
+    willExport: boolean; // audioCellCount > 0
+}
+
+export interface CharacterPreviewFile { // preview for one selected notebook
+    fileBase: string; // file name up to its first "."
+    episodeDurationSec: number; // latest cell time found in the notebook; 0 when missingTiming is true
+    characters: CharacterPreviewCharacter[]; // characters with audio first, then by first start time
+    skippedCells: number; // total untimedCellCount across all characters
+    missingTiming: boolean; // true when no cell produced a positive time
+}
+
+export interface CharacterPreviewResult { // payload returned by getCharacterAudioPreview
+    files: CharacterPreviewFile[]; // one entry per selected file that could be read
+}
+
+// Map an export format to its dotted file extension; anything unrecognised
+// falls back to ".wav".
+function formatExtension(fmt: CharacterAudioFormat): string {
+    if (fmt === "flac") return ".flac";
+    if (fmt === "opus") return ".opus";
+    // "wav" and any value that slipped past the type both land here.
+    return ".wav";
+}
+
+// ffmpeg output arguments for a mono track; Opus is pinned to 48 kHz and WAV is the fallback.
+function codecArgs(fmt: CharacterAudioFormat, sampleRate: number): string[] {
+    const rate = String(sampleRate);
+    if (fmt === "flac") {
+        return ["-c:a", "flac", "-ar", rate, "-ac", "1", "-compression_level", "8"];
+    }
+    if (fmt === "opus") {
+        return ["-c:a", "libopus", "-b:a", "64k", "-vbr", "on", "-ar", "48000", "-ac", "1"];
+    }
+    return ["-ar", rate, "-ac", "1", "-sample_fmt", "s16"];
+}
+
+function coerceFiniteNumber(value: unknown): number | undefined { // finite number, numeric string, or undefined
+    // Number("") and Number([]) are 0 and Number(true) is 1, so only numbers and non-blank strings are candidates.
+    if (typeof value !== "number" && (typeof value !== "string" || value.trim() === "")) return undefined;
+    return Number.isFinite(Number(value)) ? Number(value) : undefined;
+}
+
+// Resolve the current cell label: use the materialized metadata.cellLabel when it is
+// a non-blank string, otherwise the most recent ["metadata", "cellLabel"] CRDT edit
+// (the cell may not have been re-saved since the label changed). Undefined if neither.
+function resolveCellLabel(cell: any): string | undefined {
+    const direct = cell?.metadata?.cellLabel;
+    if (typeof direct === "string" && direct.trim() !== "") return direct; // returned as stored, not trimmed
+
+    const edits = cell?.metadata?.edits;
+    if (!Array.isArray(edits) || edits.length === 0) return undefined;
+
+    const labelEditMap = EditMapUtils.cellLabel();
+    let latest: { value: unknown; timestamp: number; } | null = null;
+    for (const edit of edits) {
+        if (!edit || !Array.isArray(edit.editMap)) continue; // ignore malformed entries
+        if (!EditMapUtils.equals(edit.editMap, labelEditMap)) continue; // only label edits are of interest
+        const ts = typeof edit.timestamp === "number" ? edit.timestamp : 0; // non-numeric timestamps rank as oldest
+        if (!latest || ts > latest.timestamp) { // strict ">" keeps the first edit seen when timestamps tie
+            latest = { value: edit.value, timestamp: ts };
+        }
+    }
+    if (latest && typeof latest.value === "string" && latest.value.trim() !== "") {
+        return latest.value;
+    }
+    return undefined; // newest label edit was missing, non-string, or blank
+}
+
+// Episode length in seconds: the greatest endTime (startTime when endTime is not a
+// finite number) over active cells of kind 1 or 2. Returns 0 when no positive time is found.
+function computeEpisodeDurationSeconds(cells: CodexNotebookAsJSONData["cells"]): number {
+    return cells.reduce((latest, cell) => {
+        const eligible = (cell.kind === 1 || cell.kind === 2) && isActiveCell(cell);
+        if (!eligible) return latest;
+        const timing = (cell?.metadata?.data || {}) as { startTime?: unknown; endTime?: unknown; };
+        const cellEnd = coerceFiniteNumber(timing.endTime) ?? coerceFiniteNumber(timing.startTime);
+        return cellEnd !== undefined && cellEnd > latest ? cellEnd : latest;
+    }, 0);
+}
+
+interface CharacterGroup { // all clips that share one character key within a notebook
+    label: string; // label of the first cell that produced the key
+    clips: CharacterClip[]; // in notebook cell order
+}
+
+// Bucket every active, timed cell with a pickable audio attachment under its character key.
+// `skipped` counts cells that have audio but no usable startTime (they cannot be placed).
+function groupClipsByCharacter(
+    cells: CodexNotebookAsJSONData["cells"],
+    workspaceFolder: vscode.WorkspaceFolder
+): { groups: Map<string, CharacterGroup>; skipped: number; } {
+    const groups = new Map<string, CharacterGroup>();
+    let skipped = 0;
+
+    for (const cell of cells) {
+        if (cell.kind !== 2 && cell.kind !== 1) continue;
+        if (!isActiveCell(cell)) continue;
+        const cellId: string | undefined = cell?.metadata?.id;
+        if (!cellId) continue;
+
+        const pick = pickAudioAttachmentForCell(cell);
+        if (!pick) continue;
+
+        const data = (cell?.metadata?.data || {}) as { startTime?: unknown; endTime?: unknown; };
+        const startSec = coerceFiniteNumber(data.startTime);
+        if (startSec === undefined) {
+            // No timeline position — cannot place in consolidated track
+            skipped++;
+            continue;
+        }
+        const endSec = coerceFiniteNumber(data.endTime);
+
+        const srcPath = pick.url;
+        const absoluteSrc = srcPath.startsWith("/") || /^[A-Za-z]:[\\/]/.test(srcPath) // drive paths may use "\" or "/"
+            ? vscode.Uri.file(srcPath)
+            : vscode.Uri.joinPath(workspaceFolder.uri, srcPath);
+
+        const resolvedLabel = resolveCellLabel(cell);
+        const labelStr = resolvedLabel && resolvedLabel.trim() !== "" ? resolvedLabel : "unlabeled";
+        const key = sanitizeFileComponent(labelStr.toLowerCase()) || "unlabeled"; // labels differing only in case share a key
+
+        if (!groups.has(key)) groups.set(key, { label: labelStr, clips: [] });
+        groups.get(key)!.clips.push({
+            absolutePath: absoluteSrc.fsPath,
+            startMs: Math.max(0, Math.floor(startSec * 1000)),
+            endMs: endSec !== undefined && endSec > startSec
+                ? Math.floor(endSec * 1000)
+                : undefined,
+            cellId,
+        });
+    }
+
+    return { groups, skipped };
+}
+
+async function renderCharacterTrack( // mix one character's clips onto a silent mono base and write it to outputPath
+    ffmpegBinaryPath: string,
+    clips: CharacterClip[],
+    trimDurationSec: number,
+    outputPath: string,
+    format: CharacterAudioFormat
+): Promise<void> {
+    if (trimDurationSec <= 0) {
+        throw new Error("Trim duration must be greater than 0");
+    }
+
+    const sampleRate = 48000; // rate of the silent base and of every resampled clip
+    const baseDurationStr = trimDurationSec.toFixed(3); // millisecond precision for ffmpeg's -t
+    const outArgs = codecArgs(format, sampleRate);
+
+    // No clips for this character — just emit silence of trim length.
+    if (clips.length === 0) {
+        await execFileAsync(ffmpegBinaryPath, [
+            "-y",
+            "-f", "lavfi",
+            "-t", baseDurationStr,
+            "-i", `anullsrc=r=${sampleRate}:cl=mono`,
+            ...outArgs,
+            outputPath,
+        ], { maxBuffer: 1024 * 1024 * 50 }); // cap on captured ffmpeg output (50 MiB)
+        return;
+    }
+
+    // Build filter_complex: each clip gets resampled to mono 48k, delayed to its
+    // cell's startTime, then mixed onto a silent base trimmed to this character's
+    // last endTime. `amix duration=first` clamps the result to the base length.
+    const filterLines: string[] = [];
+    for (let i = 0; i < clips.length; i++) {
+        const inputIdx = i + 1; // input 0 is the silent base
+        const delayMs = clips[i].startMs;
+        filterLines.push(
+            `[${inputIdx}:a]aresample=${sampleRate},aformat=channel_layouts=mono:sample_fmts=s16,adelay=${delayMs}:all=1[a${inputIdx}]`
+        );
+    }
+    const mixInputs = ["[0:a]", ...clips.map((_, i) => `[a${i + 1}]`)].join("");
+    filterLines.push(
+        `${mixInputs}amix=inputs=${clips.length + 1}:duration=first:normalize=0[out]`
+    );
+    const filterScript = filterLines.join(";\n");
+
+    const tempDir = os.tmpdir();
+    const uniq = `${Date.now()}-${Math.random().toString(36).slice(2)}`; // timestamp + random suffix for a per-call script name
+    const scriptPath = path.join(tempDir, `codex-char-filter-${uniq}.txt`);
+    fs.writeFileSync(scriptPath, filterScript); // the graph goes through a file instead of the command line
+
+    const args: string[] = [
+        "-y",
+        "-f", "lavfi",
+        "-t", baseDurationStr,
+        "-i", `anullsrc=r=${sampleRate}:cl=mono`,
+    ];
+    for (const clip of clips) {
+        args.push("-i", clip.absolutePath); // input order must match the [n:a] indices in the filter script
+    }
+    args.push(
+        "-filter_complex_script", scriptPath,
+        "-map", "[out]",
+        ...outArgs,
+        outputPath,
+    );
+
+    try {
+        await execFileAsync(ffmpegBinaryPath, args, { maxBuffer: 1024 * 1024 * 200 });
+    } finally {
+        try { fs.unlinkSync(scriptPath); } catch { /* ignore */ } // best-effort cleanup, success or failure
+    }
+}
+
+// Track length in seconds: latest clip end (or start, for clips with no end) plus a 250ms pad.
+function computeTrimDurationSec(clips: CharacterClip[], fallbackSec: number): number {
+    const lastMs = clips.reduce((latest, clip) => {
+        const edge = clip.endMs !== undefined && clip.endMs > latest ? clip.endMs : clip.startMs;
+        return edge > latest ? edge : latest;
+    }, 0);
+    // Nothing positive on the timeline: defer to the caller-supplied fallback.
+    // Otherwise pad so lossy codecs don't truncate the very last sample.
+    return lastMs <= 0 ? fallbackSec : Math.max(0.25, lastMs / 1000 + 0.25);
+}
+
+export interface CharacterExportOptions { // optional settings for exportAudioByCharacter
+    format?: CharacterAudioFormat; // output container/codec; exportAudioByCharacter uses "flac" when omitted
+}
+
+/**
+ * Render one consolidated audio track per character for each selected notebook.
+ * Output is `<exportDir>/<file>/<file>_<lang>_<characterKey><ext>`; every track starts
+ * at 0:00 and is trimmed to that character's last clip. Notebook read errors and
+ * ffmpeg failures are logged and counted in the closing summary, not thrown.
+ * `options.format` defaults to "flac".
+ */
+export async function exportAudioByCharacter(
+    userSelectedPath: string,
+    filesToExport: string[],
+    options?: CharacterExportOptions
+): Promise<void> {
+    const format: CharacterAudioFormat = options?.format ?? "flac";
+    const ext = formatExtension(format);
+    const workspaceFolders = vscode.workspace.workspaceFolders;
+    if (!workspaceFolders || workspaceFolders.length === 0) {
+        vscode.window.showErrorMessage("No project folder found. Please open a project first.");
+        return;
+    }
+    const workspaceFolder = workspaceFolders[0];
+
+    const ffmpegBinaryPath = await getFFmpegPath(getAudioExporterContext());
+    if (!ffmpegBinaryPath) {
+        vscode.window.showErrorMessage("FFmpeg is not available; cannot consolidate audio by character.");
+        return;
+    }
+
+    const exportDir = vscode.Uri.file(userSelectedPath);
+    await vscode.workspace.fs.createDirectory(exportDir);
+
+    const selectedFiles = filesToExport.map((p) => vscode.Uri.file(p));
+    if (selectedFiles.length === 0) {
+        vscode.window.showInformationMessage("No files selected for export.");
+        return;
+    }
+
+    return vscode.window.withProgress(
+        {
+            location: vscode.ProgressLocation.Notification,
+            title: "Exporting Audio by Character",
+            cancellable: false,
+        },
+        async (progress) => {
+            const increment = 100 / selectedFiles.length;
+            let writtenCount = 0;
+            let failedCount = 0;
+            let skippedCellsTotal = 0;
+            const filesWithoutTiming: string[] = [];
+
+            for (const [index, file] of selectedFiles.entries()) {
+                const fileBase = basename(file.fsPath).split(".")[0] || "FILE";
+                progress.report({
+                    message: `Processing ${basename(file.fsPath)} (${index + 1}/${selectedFiles.length})`,
+                    increment,
+                });
+
+                let notebook: CodexNotebookAsJSONData;
+                try {
+                    notebook = await readNotebook(file);
+                } catch (e) {
+                    console.error(`Failed to read notebook ${file.fsPath}:`, e);
+                    failedCount++;
+                    continue;
+                }
+
+                const episodeDurationSec = computeEpisodeDurationSeconds(notebook.cells);
+                if (episodeDurationSec <= 0) {
+                    filesWithoutTiming.push(fileBase);
+                    debug(`Skipping ${fileBase}: no timing data found`);
+                    continue;
+                }
+
+                const { groups, skipped } = groupClipsByCharacter(notebook.cells, workspaceFolder);
+                skippedCellsTotal += skipped;
+
+                if (groups.size === 0) {
+                    debug(`No character audio found for ${fileBase}`);
+                    continue;
+                }
+
+                const bookFolder = vscode.Uri.joinPath(exportDir, sanitizeFileComponent(fileBase));
+                await vscode.workspace.fs.createDirectory(bookFolder);
+
+                const langCode = getTargetLanguageCode();
+                const safeFileBase = sanitizeFileComponent(fileBase);
+
+                // Verify clip files exist; drop missing ones so ffmpeg doesn't fail.
+                for (const [charKey, group] of groups.entries()) {
+                    const verified: CharacterClip[] = [];
+                    for (const clip of group.clips) {
+                        if (await pathExists(vscode.Uri.file(clip.absolutePath))) {
+                            verified.push(clip);
+                        } else {
+                            debug(`Missing audio file for ${clip.cellId}: ${clip.absolutePath}`);
+                            skippedCellsTotal++;
+                        }
+                    }
+                    if (verified.length === 0) continue;
+                    // Sort by start time so the filter is deterministic and easier to debug.
+                    verified.sort((a, b) => a.startMs - b.startMs);
+
+                    // Trim to this character's last endTime (with a small pad) so silent tails
+                    // don't bloat the file. Files still start at 0 so they DAW-align.
+                    const trimSec = computeTrimDurationSec(verified, episodeDurationSec);
+
+                    const destName = `${safeFileBase}_${langCode}_${charKey}${ext}`;
+                    const destUri = vscode.Uri.joinPath(bookFolder, destName);
+
+                    try {
+                        await renderCharacterTrack(ffmpegBinaryPath, verified, trimSec, destUri.fsPath, format);
+                        writtenCount++;
+                    } catch (e) {
+                        console.error(`Failed to render character track ${destName}:`, e);
+                        failedCount++;
+                    }
+                }
+            }
+
+            const parts: string[] = [`${writtenCount} file${writtenCount === 1 ? "" : "s"} written`];
+            if (skippedCellsTotal > 0) parts.push(`${skippedCellsTotal} cell${skippedCellsTotal === 1 ? "" : "s"} skipped (missing timing or file)`);
+            if (filesWithoutTiming.length > 0) parts.push(`${filesWithoutTiming.length} file${filesWithoutTiming.length === 1 ? "" : "s"} had no timing data`);
+            if (failedCount > 0) parts.push(`${failedCount} failure${failedCount === 1 ? "" : "s"} (unreadable notebook or ffmpeg error; see console)`);
+
+            vscode.window.showInformationMessage(
+                `Audio export by character completed: ${parts.join(", ")}. Output: ${exportDir.fsPath}`
+            );
+            debug(`Summary: written=${writtenCount} failed=${failedCount} skipped=${skippedCellsTotal} no-timing=${filesWithoutTiming.length}`);
+        }
+    );
+}
+
+interface PreviewBuckets { // per-character accumulator filled by scanCharactersForPreview
+    label: string; // label of the first cell that produced the key
+    intervals: CharacterInterval[]; // one entry per timed cell, in notebook order
+    audioCellCount: number; // timed cells with audio
+    noAudioCellCount: number; // timed cells without audio
+    untimedCellCount: number; // cells with no usable startTime, with or without audio
+}
+
+// Scan every active cell of kind 1 or 2 — with or without audio — so the preview can
+// surface characters that exist in the script but haven't been recorded yet.
+function scanCharactersForPreview(
+    cells: CodexNotebookAsJSONData["cells"]
+): Map<string, PreviewBuckets> {
+    const buckets = new Map<string, PreviewBuckets>();
+    for (const cell of cells) {
+        if (cell.kind !== 2 && cell.kind !== 1) continue;
+        if (!isActiveCell(cell)) continue;
+        const cellId: string | undefined = cell?.metadata?.id;
+        if (!cellId) continue; // cells without an id are ignored entirely
+
+        const resolvedLabel = resolveCellLabel(cell);
+        const labelStr = resolvedLabel && resolvedLabel.trim() !== ""
+            ? resolvedLabel
+            : "unlabeled";
+        const key = sanitizeFileComponent(labelStr.toLowerCase()) || "unlabeled"; // same key derivation as groupClipsByCharacter
+
+        if (!buckets.has(key)) {
+            buckets.set(key, {
+                label: labelStr,
+                intervals: [],
+                audioCellCount: 0,
+                noAudioCellCount: 0,
+                untimedCellCount: 0,
+            });
+        }
+        const bucket = buckets.get(key)!;
+
+        const data = (cell?.metadata?.data || {}) as { startTime?: unknown; endTime?: unknown; };
+        const startSec = coerceFiniteNumber(data.startTime);
+        const endSec = coerceFiniteNumber(data.endTime);
+        const hasAudio = !!pickAudioAttachmentForCell(cell); // attachment metadata only; the file itself is not checked here
+
+        if (startSec === undefined) {
+            bucket.untimedCellCount++; // counted, but contributes no interval
+            continue;
+        }
+        bucket.intervals.push({
+            startSec,
+            endSec: endSec !== undefined && endSec > startSec ? endSec : startSec + 0.5, // 0.5s placeholder when no usable end
+            hasAudio,
+        });
+        if (hasAudio) bucket.audioCellCount++;
+        else bucket.noAudioCellCount++;
+    }
+    return buckets;
+}
+
+/**
+ * Build a per-file, per-character speaking-time preview for the selected notebooks.
+ * Pure data for the webview to render; reads notebooks only (no ffmpeg, no writes).
+ * Unreadable files are omitted; files with no timing are returned with missingTiming set.
+ */
+export async function getCharacterAudioPreview(
+    filesToExport: string[]
+): Promise<CharacterPreviewResult> {
+    const workspaceFolders = vscode.workspace.workspaceFolders;
+    if (!workspaceFolders || workspaceFolders.length === 0) {
+        return { files: [] }; // no project open: empty preview rather than an error
+    }
+
+    const result: CharacterPreviewFile[] = [];
+
+    for (const filePath of filesToExport) {
+        const file = vscode.Uri.file(filePath);
+        const fileBase = basename(file.fsPath).split(".")[0] || "FILE";
+
+        let notebook: CodexNotebookAsJSONData;
+        try {
+            notebook = await readNotebook(file);
+        } catch {
+            continue; // unreadable or unparsable notebook: left out of the preview
+        }
+
+        const episodeDurationSec = computeEpisodeDurationSeconds(notebook.cells);
+        if (episodeDurationSec <= 0) {
+            result.push({
+                fileBase,
+                episodeDurationSec: 0,
+                characters: [],
+                skippedCells: 0,
+                missingTiming: true,
+            });
+            continue;
+        }
+
+        const buckets = scanCharactersForPreview(notebook.cells);
+
+        const characters: CharacterPreviewCharacter[] = [];
+        let skippedCells = 0;
+        for (const [key, bucket] of buckets.entries()) {
+            bucket.intervals.sort((a, b) => a.startSec - b.startSec); // in-place; the sorted array is what gets returned
+            const speakingSecAudio = bucket.intervals
+                .filter((i) => i.hasAudio)
+                .reduce((acc, i) => acc + Math.max(0, i.endSec - i.startSec), 0);
+            const speakingSecNoAudio = bucket.intervals
+                .filter((i) => !i.hasAudio)
+                .reduce((acc, i) => acc + Math.max(0, i.endSec - i.startSec), 0);
+            const lastEndSec = bucket.intervals.length
+                ? Math.max(...bucket.intervals.filter((i) => i.hasAudio).map((i) => i.endSec), 0) // trailing 0 covers "no audio intervals"
+                : 0;
+            const willExport = bucket.audioCellCount > 0; // based on attachment metadata, not on file existence
+            skippedCells += bucket.untimedCellCount;
+            characters.push({
+                label: bucket.label,
+                key,
+                intervals: bucket.intervals,
+                audioCellCount: bucket.audioCellCount,
+                noAudioCellCount: bucket.noAudioCellCount,
+                untimedCellCount: bucket.untimedCellCount,
+                speakingSecAudio,
+                speakingSecNoAudio,
+                lastEndSec,
+                willExport,
+            });
+        }
+        // Sort: characters with audio first, then by first appearance time.
+        characters.sort((a, b) => {
+            if (a.willExport !== b.willExport) return a.willExport ? -1 : 1;
+            const aStart = a.intervals[0]?.startSec ?? Infinity; // characters with no timed cells sort last
+            const bStart = b.intervals[0]?.startSec ?? Infinity;
+            return aStart - bStart;
+        });
+
+        result.push({
+            fileBase,
+            episodeDurationSec,
+            characters,
+            skippedCells,
+            missingTiming: false,
+        });
+    }
+
+    return { files: result };
+}
diff --git a/src/exportHandler/exportHandler.ts b/src/exportHandler/exportHandler.ts
index 913d7d74e..d97d5f13c 100644
--- a/src/exportHandler/exportHandler.ts
+++ b/src/exportHandler/exportHandler.ts
@@ -217,6 +217,8 @@ export interface ExportOptions {
     removeIds?: boolean;
     includeAudio?: boolean;
     includeTimestamps?: boolean;
+    consolidateByCharacter?: boolean;
+    consolidatedAudioFormat?: "wav" | "flac" | "opus";
 }
 
 // IDML Round-trip export: Uses idmlExporter or biblicaExporter based on filename
@@ -1774,8 +1776,15 @@ export async function exportCodexContent(
             exportPromises.push(exportCodexContentAsHtml(formatPath, filesToExport, options));
             break;
         case CodexExportFormat.AUDIO: {
-            const { exportAudioAttachments } = await import("./audioExporter");
-            exportPromises.push(exportAudioAttachments(wrapperPath, filesToExport, { includeTimestamps: options?.includeTimestamps }));
+            if (options?.consolidateByCharacter) {
+                const { exportAudioByCharacter } = await import("./characterAudioExporter");
+                exportPromises.push(exportAudioByCharacter(wrapperPath, filesToExport, {
+                    format: options?.consolidatedAudioFormat,
+                }));
+            } else {
+                const { exportAudioAttachments } = await import("./audioExporter");
+                exportPromises.push(exportAudioAttachments(wrapperPath, filesToExport, { includeTimestamps: options?.includeTimestamps }));
+            }
             break;
         }
         case CodexExportFormat.SUBTITLES_VTT_WITH_STYLES:
@@ -1805,12 +1814,19 @@ export async function exportCodexContent(
     }
 
     if (includeAudio) {
-        const { exportAudioAttachments } = await import("./audioExporter");
-        exportPromises.push(
-            exportAudioAttachments(audioPath, filesToExport, {
-                includeTimestamps: options?.includeTimestamps
-            })
-        );
+        if (options?.consolidateByCharacter) {
+            const { exportAudioByCharacter } = await import("./characterAudioExporter");
+            exportPromises.push(exportAudioByCharacter(audioPath, filesToExport, {
+                format: options?.consolidatedAudioFormat,
+            }));
+        } else {
+            const { exportAudioAttachments } = await import("./audioExporter");
+            exportPromises.push(
+                exportAudioAttachments(audioPath, filesToExport, {
+                    includeTimestamps: options?.includeTimestamps
+                })
+            );
+        }
     }
 
     await Promise.all(exportPromises);
diff --git a/src/projectManager/projectExportView.ts b/src/projectManager/projectExportView.ts
index aed40b1bb..4e33b7aac 100644
--- a/src/projectManager/projectExportView.ts
+++ b/src/projectManager/projectExportView.ts
@@ -211,6 +211,32 @@ export async function openProjectExportView(context: vscode.ExtensionContext) {
                 );
                 break;
             }
+            case "previewCharacterAudio": {
+                try {
+                    const { getCharacterAudioPreview } = await import(
+                        "../exportHandler/characterAudioExporter"
+                    );
+                    const preview = await getCharacterAudioPreview(
+                        (message.filesToExport as string[]) || []
+                    );
+                    safePostMessageToPanel(
+                        panel,
+                        { command: "characterAudioPreviewResult", preview },
+                        "ProjectExport"
+                    );
+                } catch (err) {
+                    safePostMessageToPanel(
+                        panel,
+                        {
+                            command: "characterAudioPreviewResult",
+                            preview: { files: [] },
+                            error: err instanceof Error ? err.message : String(err),
+                        },
+                        "ProjectExport"
+                    );
+                }
+                break;
+            }
             case "cancel":
                 panel.dispose();
                 break;
@@ -574,8 +600,93 @@ function getWebviewContent(
                     padding: 20px 24px;
                     max-width: 480px;
                     width: 90%;
+                    max-height: 90vh;
+                    display: flex;
+                    flex-direction: column;
                     box-shadow: 0 8px 32px rgba(0, 0, 0, 0.35);
                 }
+                .popup-card .popup-header { flex: 0 0 auto; }
+                .popup-card .popup-body {
+                    flex: 1 1 auto;
+                    min-height: 0;
+                    overflow-y: auto;
+                }
+                .popup-card.wide { max-width: 900px; }
+                .char-preview-file { margin-bottom: 18px; }
+                .char-preview-file h5 {
+                    margin: 0 0 6px 0;
+                    color: var(--vscode-foreground);
+                    font-size: 0.95em;
+                }
+                .char-preview-meta {
+                    color: var(--vscode-descriptionForeground);
+                    font-size: 0.8em;
+                    margin-bottom: 8px;
+                }
+                .char-row {
+                    display: grid;
+                    grid-template-columns: 160px 1fr 80px;
+                    gap: 10px;
+                    align-items: center;
+                    padding: 3px 0;
+                    font-size: 0.85em;
+                }
+                .char-row .char-label {
+                    color: var(--vscode-foreground);
+                    overflow: hidden;
+                    text-overflow: ellipsis;
+                    white-space: nowrap;
+                }
+                .char-row .char-timeline {
+                    position: relative;
+                    height: 14px;
+                    background: var(--vscode-input-background);
+                    border: 1px solid var(--vscode-input-border);
+                    border-radius: 2px;
+                    overflow: hidden;
+                }
+                .char-row .speech-segment {
+                    position: absolute;
+                    top: 0;
+                    bottom: 0;
+                    min-width: 1px;
+                    opacity: 0.85;
+                }
+                .char-row .speech-segment.has-audio {
+                    background: var(--vscode-charts-blue, #3b82f6);
+                }
+                .char-row .speech-segment.no-audio {
+                    background: var(--vscode-descriptionForeground, #6b7280);
+                    opacity: 0.45;
+                }
+                .char-row.no-audio .char-label {
+                    color: var(--vscode-descriptionForeground);
+                    font-style: italic;
+                }
+                .char-row .char-stats {
+                    color: var(--vscode-descriptionForeground);
+                    font-size: 0.8em;
+                    text-align: right;
+                    font-variant-numeric: tabular-nums;
+                }
+                .char-legend {
+                    display: flex;
+                    gap: 14px;
+                    margin: 4px 0 12px 0;
+                    font-size: 0.78em;
+                    color: var(--vscode-descriptionForeground);
+                    align-items: center;
+                }
+                .char-legend .swatch {
+                    display: inline-block;
+                    width: 12px;
+                    height: 10px;
+                    border-radius: 2px;
+                    margin-right: 4px;
+                    vertical-align: middle;
+                }
+                .char-legend .swatch.has-audio { background: var(--vscode-charts-blue, #3b82f6); }
+                .char-legend .swatch.no-audio { background: var(--vscode-descriptionForeground, #6b7280); opacity: 0.45; }
                 .popup-header {
                     display: flex;
                     align-items: center;
@@ -782,6 +893,26 @@ function getWebviewContent(
                                             <p>Export per-cell audio attachments alongside the selected export format, and embed timestamps in audio metadata (WAV, WebM, M4A)</p>
                                         </div>
                                     </div>
+                                    <div class="format-option audio-option" data-audio-mode="audio-by-character"> <!-- audio mode option: one consolidated file per character -->
+                                        <div class="format-option-content">
+                                            <strong>Consolidate by Character</strong>
+                                            <p>One file per character label. All files start at 0:00 so they drop into a DAW aligned; each is trimmed to that character's last spoken line. Named &lt;file&gt;_&lt;lang&gt;_&lt;character&gt;.&lt;ext&gt;.</p>
+                                            <div id="characterAudioControls" style="display:none; margin-top:8px; flex-direction:column; gap:6px;"> <!-- hidden by default; updateCharacterAudioControls() switches it to flex for this mode -->
+                                                <label style="display:flex; align-items:center; gap:8px; font-size:0.9em;">
+                                                    <span>Format:</span>
+                                                    <select id="characterAudioFormat" onclick="event.stopPropagation()" onchange="event.stopPropagation()" style="background:var(--vscode-input-background); color:var(--vscode-input-foreground); border:1px solid var(--vscode-input-border); border-radius:3px; padding:2px 6px;">
+                                                        <option value="flac" selected>FLAC (lossless, small)</option>
+                                                        <option value="wav">WAV (PCM, largest)</option>
+                                                        <option value="opus">Opus (lossy, smallest)</option>
+                                                    </select> <!-- events are stopped here, presumably so using the dropdown does not toggle the enclosing option (confirm against the option click handler) -->
+                                                </label>
+                                                <button type="button" class="secondary" onclick="event.stopPropagation(); openCharacterPreview();" style="align-self:flex-start;">
+                                                    <i class="codicon codicon-preview"></i>
+                                                    Preview characters
+                                                </button>
+                                            </div>
+                                        </div>
+                                    </div>
                                 </div>
                             </div>
                         </div>
@@ -857,6 +988,28 @@ function getWebviewContent(
                 </div>
             </div>
 
+            <div class="popup-overlay" id="characterPreviewPopup" onclick="if(event.target===this)closeCharacterPreviewPopup()"> <!-- a click on the overlay itself (not on the card) closes the popup -->
+                <div class="popup-card wide">
+                    <div class="popup-header" style="color: var(--vscode-foreground);">
+                        <i class="codicon codicon-preview"></i>
+                        <h4>Character Audio Preview</h4>
+                        <button class="popup-close" onclick="closeCharacterPreviewPopup()" title="Close">
+                            <i class="codicon codicon-close"></i>
+                        </button>
+                    </div>
+                    <div class="popup-body">
+                        <p style="color: var(--vscode-descriptionForeground); font-size: 0.85em; margin-top: 0;">
+                            One row per character per file. Blue bars are speaking turns with audio attached. Grey bars are lines that have timing but no audio yet — these characters won't be exported until recordings are added. Files start at 0:00 and are trimmed to that character's last <em>recorded</em> line.
+                        </p>
+                        <div class="char-legend"> <!-- colour key for the timeline bars -->
+                            <span><span class="swatch has-audio"></span>has audio (exports)</span>
+                            <span><span class="swatch no-audio"></span>timed line, no audio (skipped)</span>
+                        </div>
+                        <div id="characterPreviewBody"></div> <!-- filled by openCharacterPreview() (loading text) and renderCharacterPreview() -->
+                    </div>
+                </div>
+            </div>
+
             <div class="popup-overlay" id="htmlMismatchPopup" onclick="if(event.target===this)closeHtmlMismatchPopup()">
                 <div class="popup-card">
                     <div class="popup-header">
@@ -883,7 +1036,7 @@ function getWebviewContent(
                 const isStreamOnly = ${JSON.stringify(isStreamOnly)};
                 let currentStep = 1;
                 let selectedFormat = null;
-                let selectedAudioMode = null; // null | 'audio' | 'audio-timestamps'
+                let selectedAudioMode = null; // null | 'audio' | 'audio-timestamps' | 'audio-by-character'
                 let exportPath = ${initialExportFolderJson};
                 let selectedFiles = new Set();
                 let selectedGroupKey = null;
@@ -1202,6 +1355,7 @@ function getWebviewContent(
                             opt.style.borderColor = '';
                         });
                     }
+                    try { updateCharacterAudioControls(); } catch (e) {}
                     updateStep2Button();
                 }
 
@@ -1299,8 +1453,150 @@ function getWebviewContent(
                             showHtmlMismatchPopup(message.mismatches);
                         }
                     }
+                    if (message.command === 'characterAudioPreviewResult') {
+                        renderCharacterPreview(message.preview, message.error);
+                    }
                 });
 
+                function updateCharacterAudioControls() {
+                    const controls = document.getElementById('characterAudioControls');
+                    if (!controls) return;
+                    controls.style.display = selectedAudioMode === 'audio-by-character' ? 'flex' : 'none';
+                }
+
+                function openCharacterPreview() {
+                    if (selectedFiles.size === 0) return;
+                    const body = document.getElementById('characterPreviewBody');
+                    if (body) {
+                        body.replaceChildren();
+                        const loading = document.createElement('p');
+                        loading.style.color = 'var(--vscode-descriptionForeground)';
+                        loading.textContent = 'Loading preview...';
+                        body.appendChild(loading);
+                    }
+                    const popup = document.getElementById('characterPreviewPopup');
+                    if (popup) popup.classList.add('visible');
+                    vscode.postMessage({
+                        command: 'previewCharacterAudio',
+                        filesToExport: Array.from(selectedFiles)
+                    });
+                }
+
+                function closeCharacterPreviewPopup() {
+                    const popup = document.getElementById('characterPreviewPopup');
+                    if (popup) popup.classList.remove('visible');
+                }
+
+                function formatMmSs(totalSeconds) {
+                    if (!Number.isFinite(totalSeconds) || totalSeconds <= 0) return '0:00';
+                    const total = Math.floor(totalSeconds);
+                    const m = Math.floor(total / 60);
+                    const s = total % 60;
+                    return m + ':' + String(s).padStart(2, '0');
+                }
+
+                function makeFileBlock(f) {
+                    const wrapper = document.createElement('div');
+                    wrapper.className = 'char-preview-file';
+                    const title = document.createElement('h5');
+                    title.textContent = f.fileBase;
+                    wrapper.appendChild(title);
+                    const meta = document.createElement('div');
+                    meta.className = 'char-preview-meta';
+                    if (f.missingTiming) {
+                        meta.textContent = 'No timing data — this file will be skipped.';
+                        wrapper.appendChild(meta);
+                        return wrapper;
+                    }
+                    if (!f.characters || f.characters.length === 0) {
+                        meta.textContent = 'Episode length: ' + formatMmSs(f.episodeDurationSec) + ' — no character audio found.';
+                        wrapper.appendChild(meta);
+                        return wrapper;
+                    }
+                    const exportingCount = (f.characters || []).filter(function(c) { return c.willExport; }).length;
+                    const totalCount = f.characters.length;
+                    const skippedNote = f.skippedCells > 0
+                        ? ' • ' + f.skippedCells + ' cell' + (f.skippedCells === 1 ? '' : 's') + ' missing timing'
+                        : '';
+                    meta.textContent = 'Episode length: ' + formatMmSs(f.episodeDurationSec) +
+                        ' • ' + totalCount + ' character' + (totalCount === 1 ? '' : 's') +
+                        ' (' + exportingCount + ' will export)' + skippedNote;
+                    wrapper.appendChild(meta);
+
+                    const dur = f.episodeDurationSec;
+                    for (const c of f.characters) {
+                        const row = document.createElement('div');
+                        row.className = 'char-row' + (c.willExport ? '' : ' no-audio');
+
+                        const label = document.createElement('div');
+                        label.className = 'char-label';
+                        const audioCount = c.audioCellCount || 0;
+                        const noAudioCount = c.noAudioCellCount || 0;
+                        const untimed = c.untimedCellCount || 0;
+                        const tooltipParts = [c.label];
+                        if (audioCount) tooltipParts.push(audioCount + ' with audio');
+                        if (noAudioCount) tooltipParts.push(noAudioCount + ' timed, no audio');
+                        if (untimed) tooltipParts.push(untimed + ' untimed');
+                        label.title = tooltipParts.join(' • ');
+                        label.textContent = c.label;
+                        row.appendChild(label);
+
+                        const timeline = document.createElement('div');
+                        timeline.className = 'char-timeline';
+                        for (const iv of (c.intervals || [])) {
+                            const seg = document.createElement('div');
+                            seg.className = 'speech-segment ' + (iv.hasAudio ? 'has-audio' : 'no-audio');
+                            const left = dur > 0 ? Math.max(0, Math.min(100, (iv.startSec / dur) * 100)) : 0;
+                            const widthRaw = dur > 0 ? ((iv.endSec - iv.startSec) / dur) * 100 : 0;
+                            const width = Math.max(0.2, Math.min(100 - left, widthRaw));
+                            seg.style.left = left.toFixed(3) + '%';
+                            seg.style.width = width.toFixed(3) + '%';
+                            timeline.appendChild(seg);
+                        }
+                        row.appendChild(timeline);
+
+                        const stats = document.createElement('div');
+                        stats.className = 'char-stats';
+                        if (c.willExport) {
+                            const trim = formatMmSs(c.lastEndSec);
+                            const audioSpeaking = formatMmSs(c.speakingSecAudio || 0);
+                            const noAudioSpeaking = (c.speakingSecNoAudio || 0) > 0 ? ' • ' + formatMmSs(c.speakingSecNoAudio) + ' no audio' : '';
+                            stats.title = 'Trim: ' + trim + ' • Speaking (audio): ' + audioSpeaking + noAudioSpeaking;
+                            stats.textContent = trim;
+                        } else {
+                            stats.title = 'No audio recorded yet — not exported';
+                            stats.textContent = 'no audio';
+                        }
+                        row.appendChild(stats);
+
+                        wrapper.appendChild(row);
+                    }
+                    return wrapper;
+                }
+
+                function renderCharacterPreview(preview, error) {
+                    const body = document.getElementById('characterPreviewBody');
+                    if (!body) return;
+                    body.replaceChildren();
+                    if (error) {
+                        const p = document.createElement('p');
+                        p.style.color = 'var(--vscode-errorForeground)';
+                        p.textContent = error;
+                        body.appendChild(p);
+                        return;
+                    }
+                    if (!preview || !preview.files || preview.files.length === 0) {
+                        const p = document.createElement('p');
+                        p.style.color = 'var(--vscode-descriptionForeground)';
+                        p.textContent = 'No files to preview.';
+                        body.appendChild(p);
+                        return;
+                    }
+                    for (const f of preview.files) {
+                        body.appendChild(makeFileBlock(f));
+                    }
+                }
+
                 document.addEventListener('DOMContentLoaded', () => {
                     renderFileGroups();
                     updateStep1Button();
@@ -1328,7 +1624,7 @@ function getWebviewContent(
                                 option.classList.add('selected');
                                 checkAudioSelectionMismatch();
                             }
-                            try { updateStep2Button(); updateExportButton(); } catch (e) {}
+                            try { updateStep2Button(); updateExportButton(); updateCharacterAudioControls(); } catch (e) {}
                         });
                     });
 
@@ -1465,6 +1761,11 @@ function getWebviewContent(
                     if (selectedAudioMode) {
                         options.includeAudio = true;
                         options.includeTimestamps = selectedAudioMode === 'audio-timestamps';
+                        options.consolidateByCharacter = selectedAudioMode === 'audio-by-character';
+                        if (options.consolidateByCharacter) {
+                            const fmtEl = document.getElementById('characterAudioFormat');
+                            options.consolidatedAudioFormat = (fmtEl && fmtEl.value) ? fmtEl.value : 'flac';
+                        }
                     }
                     vscode.postMessage({
                         command: 'export',