OpenLAIR · bbsngg · Apr 23, 2026 · Apr 12, 2026 · Apr 14, 2026 · Apr 23, 2026
diff --git a/server/index.js b/server/index.js
@@ -72,6 +72,7 @@ import computeRoutes from './routes/compute.js';
 import newsRoutes from './routes/news.js';
 import autoResearchRoutes from './routes/auto-research.js';
 import referencesRoutes from './routes/references.js';
+import quickQaRoutes from './routes/quick-qa.js';
 import { initializeDatabase, sessionDb, tagDb } from './database/db.js';
 import { validateApiKey, authenticateToken, authenticateWebSocket } from './middleware/auth.js';
 import { IS_PLATFORM } from './constants/config.js';
@@ -531,6 +532,8 @@ app.use('/api/auto-research', authenticateToken, autoResearchRoutes);
 // References (literature library) API Routes (protected)
 app.use('/api/references', authenticateToken, referencesRoutes);
 
+app.use('/api/quick-qa', authenticateToken, quickQaRoutes);
+
 // Agent API Routes (uses API key authentication)
 app.use('/api/agent', agentRoutes);
 

diff --git a/server/routes/quick-qa.js b/server/routes/quick-qa.js
@@ -0,0 +1,196 @@
+/**
+ * Quick Q&A Route
+ *
+ * Provides lightweight endpoints for inline Q&A in markdown preview mode:
+ * - Fast mode: quick haiku answer via SSE streaming
+ * - Think mode: detailed sonnet analysis via SSE streaming
+ * - Deep Research mode: comprehensive sonnet report via SSE streaming
+ */
+
+import { Router } from 'express';
+import { query } from '@anthropic-ai/claude-agent-sdk';
+import { readFileSync } from 'fs';
+import { join, dirname, resolve, relative, isAbsolute, sep } from 'path';
+import { fileURLToPath } from 'url';
+import { projectDb } from '../database/db.js';
+
+const __filename = fileURLToPath(import.meta.url);
+const __dirname = dirname(__filename);
+
+const router = Router();
+
+// In-flight queries keyed by queryId -> AbortController, so POST /abort can cancel them
+const activeQueries = new Map();
+
+// Set the SDK stream-close timeout (presumably milliseconds — confirm) once at module load to avoid per-request races
+process.env.CLAUDE_CODE_STREAM_CLOSE_TIMEOUT = '300000';
+
+/**
+ * Check that projectPath is, or lies inside, a registered project directory.
+ * @returns {string|null} The resolved absolute path, or null if invalid.
+ */
+function validateProjectPath(projectPath) {
+  if (!projectPath || typeof projectPath !== 'string') return null;
+  const resolved = resolve(projectPath);
+  const allProjects = projectDb.getAllProjects() || [];
+  const isKnown = allProjects.some((p) => {
+    if (typeof p?.path !== 'string' || p.path === '') return false;
+    // '' means the same directory; '..', '../…' or an absolute result means outside the project.
+    const rel = relative(resolve(p.path), resolved);
+    return rel === '' || (rel !== '..' && !rel.startsWith(`..${sep}`) && !isAbsolute(rel));
+  });
+  return isKnown ? resolved : null;
+}
+
+const FAST_SYSTEM_PROMPT = `You are a helpful assistant providing quick, concise answers about text selected from markdown documents. Keep responses brief and direct. Use markdown formatting in your response when appropriate.`;
+const THINK_SYSTEM_PROMPT = `You are a deep-thinking assistant. Provide a detailed, well-reasoned analysis with thorough explanations. Break down concepts, explore implications, and provide comprehensive insights. Use markdown formatting with clear structure (headings, lists, etc.).`;
+
+// Load the inno-deep-research skill as the Deep Research system prompt (uses sonnet model)
+let RESEARCH_SYSTEM_PROMPT;
+try {
+  const skillPath = join(__dirname, '../../skills/inno-deep-research/SKILL.md');
+  // Strip YAML frontmatter (between --- markers); an empty remainder is rejected so the fallback applies
+  const stripped = readFileSync(skillPath, 'utf8').replace(/^---[\s\S]*?---\s*/, '').trim();
+  if (!stripped) throw new Error('skill file has no prompt body');
+  RESEARCH_SYSTEM_PROMPT = stripped;
+  console.log('[QuickQA] Loaded inno-deep-research skill for Deep Research mode');
+} catch (err) {
+  console.warn('[QuickQA] Could not load inno-deep-research skill, using fallback:', err.message);
+  RESEARCH_SYSTEM_PROMPT = `You are a comprehensive research assistant. Provide a thorough research report that includes: overview and background, key concepts, current state of knowledge, different perspectives, related work, and conclusions. Use markdown formatting with clear structure, headings, and well-organized sections.`;
+}
+
+const MODE_CONFIG = Object.freeze({
+  __proto__: null, // no inherited keys: a client-sent mode such as 'constructor' resolves to undefined
+  fast: { model: 'haiku', systemPrompt: FAST_SYSTEM_PROMPT },
+  think: { model: 'sonnet', systemPrompt: THINK_SYSTEM_PROMPT },
+  research: { model: 'sonnet', systemPrompt: RESEARCH_SYSTEM_PROMPT },
+});
+
+/** Build the user prompt for the given mode; any mode other than 'think'/'research' gets the fast prompt. */
+function buildPrompt(selectedText, question, mode) {
+  const hasQuestion = Boolean(question);
+  switch (mode) {
+    case 'think':
+      if (hasQuestion) return `Please think deeply and provide a detailed, well-reasoned analysis of the following text, focusing on this question: ${question}\n\nSelected text:\n"""\n${selectedText}\n"""`;
+      return `Please think deeply and provide a detailed, well-reasoned analysis of the following text. Break down the concepts, explore implications, and provide thorough explanations.\n\nSelected text:\n"""\n${selectedText}\n"""`;
+    case 'research':
+      if (hasQuestion) return `Please conduct a comprehensive deep research on the following topic/text, focusing on: ${question}\n\nProvide a thorough research report with: 1) Overview and background 2) Key concepts 3) Current state of knowledge 4) Different perspectives 5) Related work 6) Conclusions.\n\nSelected text:\n"""\n${selectedText}\n"""`;
+      return `Please conduct a comprehensive deep research on the following topic/text. Provide a thorough research report with: 1) Overview and background 2) Key concepts 3) Current state of knowledge 4) Different perspectives 5) Related work 6) Conclusions.\n\nSelected text:\n"""\n${selectedText}\n"""`;
+    default:
+      // fast
+      if (hasQuestion) return `The user has selected the following text from a markdown document and has a question about it.\n\nSelected text:\n"""\n${selectedText}\n"""\n\nUser's question: ${question}\n\nPlease provide a concise, direct answer. Keep it brief and focused.`;
+      return `The user has selected the following text from a markdown document and wants a quick explanation.\n\nSelected text:\n"""\n${selectedText}\n"""\n\nPlease provide a concise explanation of this text. Keep it brief and focused.`;
+  }
+}
+
+/**
+ * Shared SSE query handler for all modes (fast, think, research).
+ * Streams `data:` events of type 'text' / 'error', then a final 'done' carrying fullContent.
+ */
+async function handleQueryRequest(req, res) {
+  const { selectedText, question, projectPath, mode: requestedMode } = req.body ?? {};
+
+  if (typeof selectedText !== 'string' || selectedText.length < 2) {
+    return res.status(400).json({ error: 'Selected text must be at least 2 characters' });
+  }
+
+  // mode is client input that ends up in the X-Query-Id header: accept only MODE_CONFIG's own keys.
+  const mode = typeof requestedMode === 'string' && Object.hasOwn(MODE_CONFIG, requestedMode) ? requestedMode : 'fast';
+  const config = MODE_CONFIG[mode];
+  const queryId = `quick-qa-${mode}-${Date.now()}-${Math.random().toString(36).slice(2, 8)}`;
+
+  // Validate projectPath to prevent path traversal
+  const validatedCwd = validateProjectPath(projectPath) || process.cwd();
+
+  // Set up SSE
+  res.setHeader('Content-Type', 'text/event-stream');
+  res.setHeader('Cache-Control', 'no-cache');
+  res.setHeader('Connection', 'keep-alive');
+  res.setHeader('X-Query-Id', queryId);
+  res.flushHeaders();
+
+  const abortController = new AbortController();
+  activeQueries.set(queryId, abortController);
+
+  // Clean up on client disconnect
+  res.on('close', () => {
+    if (res.writableFinished) return;
+    abortController.abort();
+    activeQueries.delete(queryId);
+  });
+
+  let hasStreamedContent = false;
+  let fullContent = '';
+
+  try {
+    const conversation = query({
+      prompt: buildPrompt(selectedText, question, mode),
+      options: {
+        cwd: validatedCwd,
+        model: config.model,
+        systemPrompt: config.systemPrompt,
+        tools: [],
+        allowedTools: [],
+        settingSources: [],
+        permissionMode: 'default',
+        abortController, // lets /abort and client disconnects cancel the SDK run itself
+      },
+    });
+
+    for await (const message of conversation) {
+      if (abortController.signal.aborted) break;
+      if (message.type === 'assistant' && message.message?.content) {
+        for (const block of message.message.content) {
+          if (block.type !== 'text' || !block.text) continue;
+          hasStreamedContent = true;
+          fullContent += block.text;
+          res.write(`data: ${JSON.stringify({ type: 'text', content: block.text })}\n\n`);
+        }
+      }
+      if (message.type === 'result') {
+        if (message.subtype === 'success' && message.result && !hasStreamedContent) {
+          fullContent = message.result;
+          res.write(`data: ${JSON.stringify({ type: 'text', content: message.result })}\n\n`);
+        } else if (message.subtype !== 'success') {
+          const errMsg = Array.isArray(message.errors) ? message.errors.join('\n') : 'Query failed';
+          res.write(`data: ${JSON.stringify({ type: 'error', message: errMsg })}\n\n`);
+        }
+      }
+    }
+    res.write(`data: ${JSON.stringify({ type: 'done', fullContent })}\n\n`);
+  } catch (error) {
+    if (error.name === 'AbortError') {
+      // A cancelled run still ends the stream with 'done' and the text produced so far.
+      res.write(`data: ${JSON.stringify({ type: 'done', fullContent })}\n\n`);
+    } else {
+      console.error(`[QuickQA/${mode}] Error:`, error.message);
+      res.write(`data: ${JSON.stringify({ type: 'error', message: error.message })}\n\n`);
+    }
+  } finally {
+    activeQueries.delete(queryId);
+    res.end();
+  }
+}
+
+/**
+ * POST /api/quick-qa — unified endpoint for all modes. Pass { mode: 'fast' | 'think' | 'research' } in body.
+ * The async handler's rejection is forwarded to next() so a pre-stream failure reaches Express error handling.
+ */
+router.post('/', (req, res, next) => handleQueryRequest(req, res).catch(next));
+
+/**
+ * POST /api/quick-qa/abort
+ * Cancels the in-flight query named by `queryId` in the request body.
+ */
+router.post('/abort', (req, res) => {
+  const { queryId } = req.body;
+  if (!activeQueries.has(queryId)) {
+    res.json({ success: false, message: 'Query not found' });
+    return;
+  }
+  activeQueries.get(queryId).abort();
+  activeQueries.delete(queryId);
+  return res.json({ success: true });
+});
+
+export default router;