From fbc071fe36982c6720cc3e778a2ec93b03bb1c7d Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Sun, 17 May 2026 16:24:52 -0700
Subject: [PATCH 01/18] Fix the on-prem graphrag-ui image build

- Supply the build context the UI image requires so its workflow
  build no longer fails.

Refs: GML-2093
---
 .github/workflows/onprem-build-nightly.yaml | 5 +++++
 .github/workflows/onprem-build-test.yaml    | 5 +++++
 .github/workflows/onprem-build.yaml         | 5 +++++
 3 files changed, 15 insertions(+)

diff --git a/.github/workflows/onprem-build-nightly.yaml b/.github/workflows/onprem-build-nightly.yaml
index 92b7c3c..fbde147 100644
--- a/.github/workflows/onprem-build-nightly.yaml
+++ b/.github/workflows/onprem-build-nightly.yaml
@@ -77,6 +77,11 @@ jobs:
       with:
         context: graphrag-ui/
         file: ./graphrag-ui/Dockerfile
+        # The UI Dockerfile reads VERSION from a named ``repo`` context;
+        # docker/build-push-action interprets undeclared contexts as image
+        # refs and tries to pull docker.io/library/repo:latest otherwise.
+        build-contexts: |
+          repo=.
         push: true
         tags: |
            ${{ env.IMAGE }}
diff --git a/.github/workflows/onprem-build-test.yaml b/.github/workflows/onprem-build-test.yaml
index 40d2914..8e1f9b0 100644
--- a/.github/workflows/onprem-build-test.yaml
+++ b/.github/workflows/onprem-build-test.yaml
@@ -63,6 +63,11 @@ jobs:
       with:
         context: graphrag-ui/
         file: ./graphrag-ui/Dockerfile
+        # The UI Dockerfile reads VERSION from a named ``repo`` context;
+        # docker/build-push-action interprets undeclared contexts as image
+        # refs and tries to pull docker.io/library/repo:latest otherwise.
+        build-contexts: |
+          repo=.
         push: true
         tags: |
           tigergraph/graphrag-ui:${{steps.get-image.outputs.IMAGE}}
diff --git a/.github/workflows/onprem-build.yaml b/.github/workflows/onprem-build.yaml
index 9fb26a4..4a32251 100644
--- a/.github/workflows/onprem-build.yaml
+++ b/.github/workflows/onprem-build.yaml
@@ -82,6 +82,11 @@ jobs:
       with:
         context: graphrag-ui/
         file: ./graphrag-ui/Dockerfile
+        # The UI Dockerfile reads VERSION from a named ``repo`` context;
+        # docker/build-push-action interprets undeclared contexts as image
+        # refs and tries to pull docker.io/library/repo:latest otherwise.
+        build-contexts: |
+          repo=.
         push: true
         tags: |
           tigergraph/graphrag-ui:${{steps.get-image.outputs.IMAGE}}

From a0e2fbdca8001d72752edc5283b7523fa5da3a19 Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Mon, 18 May 2026 22:45:36 -0700
Subject: [PATCH 02/18] Consolidate v1.4.1 patch: scoped :latest tagging +
 cleaner login response

- Skip the :latest image tag on builds from non-main branches so
  backport rebuilds don't overwrite the most recently published image
- Reject invalid credentials cleanly and include the signed-in
  username in the login response

Refs: GML-2094
---
 .github/workflows/onprem-build.yaml | 29 ++++++++++++++++++++++-------
 graphrag/app/routers/ui.py          | 20 +++++++++++++++++++-
 2 files changed, 41 insertions(+), 8 deletions(-)

diff --git a/.github/workflows/onprem-build.yaml b/.github/workflows/onprem-build.yaml
index 4a32251..d28dfd4 100644
--- a/.github/workflows/onprem-build.yaml
+++ b/.github/workflows/onprem-build.yaml
@@ -43,7 +43,22 @@ jobs:
         echo "IMAGE=$IMAGE" >> $GITHUB_OUTPUT
         VERSION=$(cat VERSION)
         echo "VERSION=$VERSION" >> $GITHUB_OUTPUT
- 
+
+    # Only builds triggered from main update the :latest tag. Manual
+    # rebuilds of older release branches (e.g. release_1.3.1) skip
+    # :latest so a backport build doesn't overwrite the most recent
+    # published image.
+    - name: Decide whether to update :latest
+      id: latest-check
+      run: |
+        if [ "${GITHUB_REF}" = "refs/heads/main" ]; then
+          echo "push_latest=true" >> $GITHUB_OUTPUT
+          echo "Building from main — :latest will be updated."
+        else
+          echo "push_latest=false" >> $GITHUB_OUTPUT
+          echo "Not on main (ref=${GITHUB_REF}) — :latest will be left as-is."
+        fi
+
     - name: Build and push Docker image GraphRAG
       uses: docker/build-push-action@v5
       with:
@@ -53,8 +68,8 @@ jobs:
         tags: |
           tigergraph/graphrag:${{steps.get-image.outputs.IMAGE}}
           tigergraph/graphrag:${{steps.get-image.outputs.VERSION}}
-          tigergraph/graphrag:latest
- 
+          ${{ steps.latest-check.outputs.push_latest == 'true' && 'tigergraph/graphrag:latest' || '' }}
+
     - name: Build and push Docker image ECC
       uses: docker/build-push-action@v5
       with:
@@ -64,7 +79,7 @@ jobs:
         tags: |
           tigergraph/graphrag-ecc:${{steps.get-image.outputs.IMAGE}}
           tigergraph/graphrag-ecc:${{steps.get-image.outputs.VERSION}}
-          tigergraph/graphrag-ecc:latest
+          ${{ steps.latest-check.outputs.push_latest == 'true' && 'tigergraph/graphrag-ecc:latest' || '' }}
 
     - name: Build and push Docker image chat-history
       uses: docker/build-push-action@v5
@@ -75,8 +90,8 @@ jobs:
         tags: |
           tigergraph/chat-history:${{steps.get-image.outputs.IMAGE}}
           tigergraph/chat-history:${{steps.get-image.outputs.VERSION}}
-          tigergraph/chat-history:latest
-     
+          ${{ steps.latest-check.outputs.push_latest == 'true' && 'tigergraph/chat-history:latest' || '' }}
+
     - name: Build and push Docker image graphrag-ui
       uses: docker/build-push-action@v5
       with:
@@ -91,7 +106,7 @@ jobs:
         tags: |
           tigergraph/graphrag-ui:${{steps.get-image.outputs.IMAGE}}
           tigergraph/graphrag-ui:${{steps.get-image.outputs.VERSION}}
-          tigergraph/graphrag-ui:latest
+          ${{ steps.latest-check.outputs.push_latest == 'true' && 'tigergraph/graphrag-ui:latest' || '' }}
 
 #    - name: Set SSH key
 #      run: |
diff --git a/graphrag/app/routers/ui.py b/graphrag/app/routers/ui.py
index ff27e57..ebf32ae 100644
--- a/graphrag/app/routers/ui.py
+++ b/graphrag/app/routers/ui.py
@@ -49,6 +49,7 @@
 from fastapi.security import HTTPBasic, HTTPBasicCredentials
 from fastapi.security.http import HTTPBase
 from pyTigerGraph import TigerGraphConnection
+from pyTigerGraph.common.exception import TigerGraphException
 from tools.validation_utils import MapQuestionToSchemaException
 
 from common.config import db_config, graphrag_config, embedding_service, llm_config, service_status, get_chat_config, get_completion_config, get_embedding_config, get_multimodal_config, validate_graphname, get_llm_service, resolve_llm_services
@@ -357,6 +358,18 @@ def auth(usr: str, password: str, conn=None) -> tuple[list[str], TigerGraphConne
             status_code=status.HTTP_401_UNAUTHORIZED,
             detail="Incorrect username or password",
         )
+    except TigerGraphException as e:
+        # pyTigerGraph wraps auth rejections as a TigerGraphException
+        # ("Authentication failed.", ...) rather than HTTPError. Convert
+        # that class explicitly so the client sees a clean 401, not a
+        # generic 500.
+        msg = (str(e.args[0]) if e.args else str(e)).lower()
+        if "authentic" in msg or "token" in msg or "password" in msg:
+            raise HTTPException(
+                status_code=status.HTTP_401_UNAUTHORIZED,
+                detail="Authentication failed",
+            )
+        raise
     except Exception as e:
         raise e
     return graphs, conn
@@ -392,7 +405,12 @@ def login(auth: Annotated[list[str], Depends(ui_basic_auth)]):
     except Exception as e:
         logger.warning(f"Failed to fetch roles at login: {e}")
         global_roles, graph_roles = [], {}
-    return {"graphs": graphs, "roles": global_roles, "graph_roles": graph_roles}
+    return {
+        "graphs": graphs,
+        "roles": global_roles,
+        "graph_roles": graph_roles,
+        "username": creds.username,
+    }
 
 
 def _read_local_version(component: str) -> dict:

From cc2adf58ec7b6d1350e76baa2d070ec20ea6a36f Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Thu, 21 May 2026 16:10:57 -0700
Subject: [PATCH 03/18] Add token login option with API token / Secret choice

- Login keeps Username / Password as the default and adds a "Use token
  login" option offering API Token or Secret.
- API tokens authenticate as bearer tokens; username/password and
  Secret use basic auth. The backend accepts both schemes everywhere.
- The signed-in username and roles are resolved from TigerGraph after
  login, so the UI shows the real user for chat history, traces, and
  conversation ownership.
- Knowledge-graph rebuilds run under the signed-in user's credentials,
  including token logins.
- Connections always authenticate as the caller; a configured static
  token no longer overrides the per-user identity, and token
  acquisition is automatic.
- Login inputs no longer clip underscores on Chrome / macOS.

Refs: GML-2094
---
 CHANGELOG.md                                  |  12 +
 README.md                                     |   6 +-
 common/config.py                              |   5 +-
 common/db/connections.py                      | 109 +----
 docs/tutorials/configs/server_config.json     |   1 -
 .../configs/server_config.json.gemini         |   1 -
 .../configs/server_config.json.openai         |   1 -
 graphrag-ui/src/actions/ActionProvider.tsx    |   2 +-
 .../src/components/CustomChatMessage.tsx      |   8 +-
 graphrag-ui/src/components/Interact.tsx       |   4 +-
 graphrag-ui/src/components/Login.tsx          | 285 +++++++-----
 graphrag-ui/src/components/SideMenu.tsx       |   8 +-
 graphrag-ui/src/hooks/useIdleTimeout.ts       |   4 +-
 graphrag-ui/src/hooks/useRoles.ts             |   4 +-
 graphrag-ui/src/main.tsx                      |   2 +-
 graphrag-ui/src/pages/Setup.tsx               |  76 ++--
 graphrag-ui/src/pages/TraceLogs.tsx           |   4 +-
 .../src/pages/setup/CustomizePrompts.tsx      |   8 +-
 graphrag-ui/src/pages/setup/GraphDBConfig.tsx |  14 +-
 .../src/pages/setup/GraphRAGConfig.tsx        |   8 +-
 graphrag-ui/src/pages/setup/IngestGraph.tsx   |  62 +--
 graphrag-ui/src/pages/setup/KGAdmin.tsx       |  42 +-
 graphrag-ui/src/pages/setup/LLMConfig.tsx     |  14 +-
 graphrag-ui/src/pages/setup/SetupLayout.tsx   |   4 +-
 graphrag/app/routers/ui.py                    | 421 +++++++++++++-----
 25 files changed, 642 insertions(+), 463 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index b4c1d94..0a13c82 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,17 @@
 # Changelog
 
+## [1.4.1]
+
+### Added
+- **Token login** — the sign-in page adds a "Use token login" option with a choice of API Token or Secret, alongside the default username / password. The signed-in username and roles are resolved from TigerGraph after login so the UI shows the real user.
+
+### Changed
+- **Every request authenticates as the signed-in user**, end to end — graph operations, chat history, traces, and knowledge-graph rebuilds all run under the caller's identity (username / password, secret, or API token).
+- **TigerGraph token handling is automatic** — an API token is obtained from the caller's credentials only when the database requires one. The service's own background connections use a static `apiToken` instead when one is configured. The `getToken` config option is no longer needed and is now ignored.
+
+### Removed
+- **A configured static `apiToken` no longer overrides per-user credentials.** It is used only for the service's background operations; interactive requests always authenticate as the signed-in user.
+
 ## [1.4.0]
 
 ### Added
diff --git a/README.md b/README.md
index ce4f10d..01e44be 100644
--- a/README.md
+++ b/README.md
@@ -423,7 +423,7 @@ For examples of how to ingest documents through the backend API, refer to the **
 ## More Detailed Configurations
 
 ### DB configuration
-Copy the below into `configs/server_config.json` and edit the `hostname` and `getToken` fields to match your database's configuration. If token authentication is enabled in TigerGraph, set `getToken` to `true`. Set the timeout, memory threshold, and thread limit parameters as desired to control how much of the database's resources are consumed when answering a question.
+Copy the below into `configs/server_config.json` and edit the `hostname` field to match your database's configuration. Token authentication is handled automatically — an API token is obtained from the username/password when the database requires one, unless a static `apiToken` is configured. Set the timeout, memory threshold, and thread limit parameters as desired to control how much of the database's resources are consumed when answering a question.
 
 ```json
 {
@@ -433,7 +433,6 @@ Copy the below into `configs/server_config.json` and edit the `hostname` and `ge
         "gsPort": "14240",
         "username": "tigergraph",
         "password": "tigergraph",
-        "getToken": false,
         "default_timeout": 300,
         "default_mem_threshold": 5000,
         "default_thread_limit": 8
@@ -448,9 +447,8 @@ Copy the below into `configs/server_config.json` and edit the `hostname` and `ge
 | `gsPort` | string | `"14240"` | GSQL port for TigerGraph admin operations. |
 | `username` | string | `"tigergraph"` | TigerGraph database username. |
 | `password` | string | `"tigergraph"` | TigerGraph database password. |
-| `getToken` | bool | `false` | Set to `true` if token authentication is enabled on TigerGraph. |
 | `graphname` | string | `""` | Default graph name. Usually left empty (selected at runtime). |
-| `apiToken` | string | `""` | Pre-generated API token. If set, token-based auth is used instead of username/password. |
+| `apiToken` | string | `""` | Optional pre-generated token for the service's background operations. Interactive requests always authenticate as the signed-in user. |
 | `default_timeout` | int | `300` | Default query timeout in seconds. |
 | `default_mem_threshold` | int | `5000` | Memory threshold (MB) for query execution. |
 | `default_thread_limit` | int | `8` | Max threads for query execution. |
diff --git a/common/config.py b/common/config.py
index dd59ad1..a18fe4d 100644
--- a/common/config.py
+++ b/common/config.py
@@ -532,6 +532,9 @@ def _build_embedding_store(graphname: str = "") -> TigerGraphEmbeddingStore:
     ``embedding_service`` for the model) so the result reflects the
     current config.
     """
+    # A static apiToken stays a service-side credential here; otherwise
+    # pyTigerGraph mints a REST++ token from the service username/password
+    # on demand, so no explicit getToken() is needed.
     conn = TigerGraphConnection(
         host=db_config.get("hostname", "http://tigergraph"),
         username=db_config.get("username", "tigergraph"),
@@ -541,8 +544,6 @@ def _build_embedding_store(graphname: str = "") -> TigerGraphEmbeddingStore:
         graphname=graphname or db_config.get("graphname", ""),
         apiToken=db_config.get("apiToken", ""),
     )
-    if not db_config.get("apiToken") and db_config.get("getToken"):
-        conn.getToken()
 
     store = TigerGraphEmbeddingStore(
         conn,
diff --git a/common/db/connections.py b/common/db/connections.py
index fab87c3..8b0840c 100644
--- a/common/db/connections.py
+++ b/common/db/connections.py
@@ -120,94 +120,31 @@ def get_db_connection_pwd_manual(
     return conn
 
 def elevate_db_connection_to_token(host, username, password, graphname, async_conn: bool = False) -> TigerGraphConnectionProxy:
-    # If a pre-existing apiToken is provided in config, use it directly
-    # and skip the getToken() call to avoid conflicts.
-    static_token = db_config.get("apiToken", "")
-
-    if static_token:
-        LogWriter.info("Using pre-configured apiToken from db_config")
-        if async_conn:
-            conn = AsyncTigerGraphConnection(
-                host=host,
-                username=username,
-                password=password,
-                graphname=graphname,
-                apiToken=static_token,
-                restppPort=db_config.get("restppPort", "9000"),
-                gsPort=db_config.get("gsPort", "14240"),
-            )
-        else:
-            conn = TigerGraphConnection(
-                host=host,
-                username=username,
-                password=password,
-                graphname=graphname,
-                apiToken=static_token,
-                restppPort=db_config.get("restppPort", "9000"),
-                gsPort=db_config.get("gsPort", "14240"),
-            )
-        return conn
-
-    conn = TigerGraphConnection(
-        host=host,
-        username=username,
-        password=password,
-        graphname=graphname,
-        restppPort=db_config.get("restppPort", "9000"),
-        gsPort=db_config.get("gsPort", "14240")
-    )
-    
-    if db_config.get("getToken"):
-        try:
-            apiToken = conn.getToken()[0]
-        except HTTPError:
-            LogWriter.error("Failed to get token")
-            raise HTTPException(
-                status_code=status.HTTP_401_UNAUTHORIZED,
-                detail="Incorrect username or password",
-                headers={"WWW-Authenticate": "Basic"},
-            )
-        except TigerGraphException as e:
-            LogWriter.error(f"Failed to get token: {e}")
-            raise HTTPException(
-                status_code=status.HTTP_503_SERVICE_UNAVAILABLE,
-                detail="Failed to get token - is the database running?"
-            )
+    # pyTigerGraph determines on its own whether a REST++ token is needed
+    # and mints one from the username/password when so; we just build the
+    # connection with the caller's credentials.
+    if async_conn:
+        conn = AsyncTigerGraphConnection(
+            host=host,
+            username=username,
+            password=password,
+            graphname=graphname,
+            restppPort=db_config.get("restppPort", "9000"),
+            gsPort=db_config.get("gsPort", "14240")
+        )
 
-        if async_conn:
-            conn = AsyncTigerGraphConnection(
-                host=host,
-                username=username,
-                password=password,
-                graphname=graphname,
-                apiToken=apiToken,
-                restppPort=db_config.get("restppPort", "9000"),
-                gsPort=db_config.get("gsPort", "14240")
-            )
-        else:
-            conn = TigerGraphConnection(
-                host=db_config["hostname"],
-                username=username,
-                password=password,
-                graphname=graphname,
-                apiToken=apiToken,
-                restppPort=db_config.get("restppPort", "9000"),
-                gsPort=db_config.get("gsPort", "14240")
-            )
+        # temp fix for path
+        if conn.restppPort == conn.gsPort and "/restpp" not in conn.restppUrl:
+            conn.restppUrl = conn.restppUrl+"/restpp"
     else:
-        if async_conn:
-            conn = AsyncTigerGraphConnection(
-                host=host,
-                username=username,
-                password=password,
-                graphname=graphname,
-                restppPort=db_config.get("restppPort", "9000"),
-                gsPort=db_config.get("gsPort", "14240")
-            )
-
-            # temp fix for path
-            if conn.restppPort == conn.gsPort and "/restpp" not in conn.restppUrl:
-                conn.restppUrl = conn.restppUrl+"/restpp"
+        conn = TigerGraphConnection(
+            host=host,
+            username=username,
+            password=password,
+            graphname=graphname,
+            restppPort=db_config.get("restppPort", "9000"),
+            gsPort=db_config.get("gsPort", "14240")
+        )
 
     return conn
 
diff --git a/docs/tutorials/configs/server_config.json b/docs/tutorials/configs/server_config.json
index da46e28..2ee25f4 100644
--- a/docs/tutorials/configs/server_config.json
+++ b/docs/tutorials/configs/server_config.json
@@ -3,7 +3,6 @@
     "hostname": "http://tigergraph",
     "restppPort": "14240",
     "gsPort": "14240",
-    "getToken": false,
     "default_timeout": 300,
     "default_mem_threshold": 5000,
     "default_thread_limit": 8
diff --git a/docs/tutorials/configs/server_config.json.gemini b/docs/tutorials/configs/server_config.json.gemini
index 1e8740e..7a2da90 100644
--- a/docs/tutorials/configs/server_config.json.gemini
+++ b/docs/tutorials/configs/server_config.json.gemini
@@ -3,7 +3,6 @@
     "hostname": "http://tigergraph",
     "restppPort": "14240",
     "gsPort": "14240",
-    "getToken": false,
     "default_timeout": 300,
     "default_mem_threshold": 5000,
     "default_thread_limit": 8
diff --git a/docs/tutorials/configs/server_config.json.openai b/docs/tutorials/configs/server_config.json.openai
index da46e28..2ee25f4 100644
--- a/docs/tutorials/configs/server_config.json.openai
+++ b/docs/tutorials/configs/server_config.json.openai
@@ -3,7 +3,6 @@
     "hostname": "http://tigergraph",
     "restppPort": "14240",
     "gsPort": "14240",
-    "getToken": false,
     "default_timeout": 300,
     "default_mem_threshold": 5000,
     "default_thread_limit": 8
diff --git a/graphrag-ui/src/actions/ActionProvider.tsx b/graphrag-ui/src/actions/ActionProvider.tsx
index c73c182..22fee0b 100644
--- a/graphrag-ui/src/actions/ActionProvider.tsx
+++ b/graphrag-ui/src/actions/ActionProvider.tsx
@@ -89,7 +89,7 @@ const ActionProvider: React.FC<ActionProviderProps> = ({
   const { sendMessage, lastMessage, readyState } = useWebSocket(WS_URL, {
     onOpen: () => {
       // Send authentication credentials
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       console.log("Sending credentials, length:", creds ? creds.length : 0);
       queryGraphragWs2(creds!);
 
diff --git a/graphrag-ui/src/components/CustomChatMessage.tsx b/graphrag-ui/src/components/CustomChatMessage.tsx
index 43937ef..4043c24 100755
--- a/graphrag-ui/src/components/CustomChatMessage.tsx
+++ b/graphrag-ui/src/components/CustomChatMessage.tsx
@@ -105,7 +105,7 @@ const AuthenticatedImage: FC<{ src: string; alt: string }> = ({ src, alt }) => {
     const fetchImage = async () => {
       try {
         // Get credentials from sessionStorage (same pattern as Interact.tsx and SideMenu.tsx)
-        const creds = sessionStorage.getItem("creds");
+        const creds = sessionStorage.getItem("auth");
         if (!creds) {
           console.error("No credentials found in sessionStorage");
           setError(true);
@@ -119,7 +119,7 @@ const AuthenticatedImage: FC<{ src: string; alt: string }> = ({ src, alt }) => {
         // Fetch image with authentication header
         const response = await fetch(src, {
           headers: {
-            Authorization: `Basic ${creds}`,
+            Authorization: creds!,
           },
           credentials: 'include', // Include credentials in CORS requests
         });
@@ -259,7 +259,7 @@ export const CustomChatMessage: FC<IChatbotMessageProps> = ({
                 // HTTPBasic returns 401 + ``WWW-Authenticate: Basic`` and
                 // the browser pops up its native auth dialog. Better to
                 // tell the user to sign in again than to flash that popup.
-                const creds = sessionStorage.getItem("creds");
+                const creds = sessionStorage.getItem("auth");
                 if (!creds) {
                   await alert("Your session has expired. Please log in again.");
                   return;
@@ -270,7 +270,7 @@ export const CustomChatMessage: FC<IChatbotMessageProps> = ({
                 try {
                   const probe = await fetch(`/ui/trace/${messageId}`, {
                     method: "GET",
-                    headers: { Authorization: `Basic ${creds}` },
+                    headers: { Authorization: creds! },
                   });
                   if (!probe.ok) {
                     await alert("Trace log not found.");
diff --git a/graphrag-ui/src/components/Interact.tsx b/graphrag-ui/src/components/Interact.tsx
index ae93539..f5fff48 100644
--- a/graphrag-ui/src/components/Interact.tsx
+++ b/graphrag-ui/src/components/Interact.tsx
@@ -39,14 +39,14 @@ export const Interactions: FC<Interactions> = ({
   const canViewTrace = isSuperuser || isGlobalDesigner || isGraphAdmin;
 
   const sendFeedback = async (action: Feedback, message: Message) => {
-    const creds = sessionStorage.getItem("creds");
+    const creds = sessionStorage.getItem("auth");
     setFeedback(action);
     message.feedback = action;
     await fetch(`${GRAPHRAG_URL}/ui/feedback`, {
       method: "POST",
       body: JSON.stringify(message),
       headers: {
-        Authorization: `Basic ${creds}`,
+        Authorization: creds!,
         "Content-Type": "application/json",
       },
     });
diff --git a/graphrag-ui/src/components/Login.tsx b/graphrag-ui/src/components/Login.tsx
index d753124..170c712 100644
--- a/graphrag-ui/src/components/Login.tsx
+++ b/graphrag-ui/src/components/Login.tsx
@@ -1,100 +1,116 @@
 "use client";
 
-import { useContext, createContext, useState, useEffect } from "react";
+import { useState, useEffect } from "react";
 import { useNavigate } from "react-router-dom";
 import { useTranslation } from "react-i18next";
 
-import { zodResolver } from "@hookform/resolvers/zod";
-import { useForm } from "react-hook-form";
-import { z } from "zod";
-
 import { Button } from "@/components/ui/button";
-import {
-  Form,
-  FormControl,
-  FormField,
-  FormItem,
-  FormDescription,
-  FormMessage,
-} from "@/components/ui/form";
 import { Input } from "@/components/ui/input";
 
 import { LANGUAGES } from "../constants";
 
-const formSchema = z.object({
-  email: z.string().min(2, {
-    message: "Username must be at least 2 characters.",
-  }),
-  password: z.string().min(2, {
-    message: "Password must be at least 2 characters.",
-  }),
-});
-
+// TigerGraph's native sentinel for secret-based auth. pyTigerGraph
+// handles this directly when sent as plain username/password.
+const SECRET_USERNAME = "__GSQL__secret";
 
 const WS_URL = "/ui/ui-login";
 
+type TokenType = "apiToken" | "secret";
+
+// Style applied to every credential input so Chrome on macOS doesn't
+// clip descenders / underscores when rendering long values.
+const INPUT_CLIP_FIX: React.CSSProperties = {
+  WebkitAppearance: "none",
+  appearance: "none",
+  lineHeight: "1.5",
+};
+
+const INPUT_STYLE = "dark:border-[#3D3D3D] h-14 py-3 dark:bg-shadeA";
+
 export function Login() {
   const { i18n, t } = useTranslation();
-  const [user, setUser] = useState("");
-  const [token, setToken] = useState(sessionStorage.getItem("site") || "");
+  const [useTokenLogin, setUseTokenLogin] = useState(false);
+  const [tokenType, setTokenType] = useState<TokenType>("apiToken");
+  const [email, setEmail] = useState("");
+  const [password, setPassword] = useState("");
+  const [tokenValue, setTokenValue] = useState("");
   const [hint, setHint] = useState("");
+  const [submitting, setSubmitting] = useState(false);
   const navigate = useNavigate();
 
   useEffect(() => {
-    const parseStore = JSON.parse(sessionStorage.getItem("site") || "{}");
-    setToken(parseStore);
-  }, []);
-
-  const loginAction = async (data: z.infer<typeof formSchema>) => {
-    const creds = btoa(`${data.email}:${data.password}`);
-    const username = data.email;
+    setHint("");
+  }, [useTokenLogin, tokenType, email, password, tokenValue]);
+
+  const loginAction = async (e: React.FormEvent) => {
+    e.preventDefault();
+
+    // Build the full Authorization header value. API tokens use
+    // ``Bearer <token>``; classic user/pass and TG ``__GSQL__secret``
+    // logins use ``Basic <b64>``. Backend resolves the real TG
+    // identity from SHOW USER and returns it in the response.
+    let authHeader: string;
+    let typedUsername = "";
+    if (useTokenLogin) {
+      const value = tokenValue.trim();
+      if (value.length < 8) {
+        setHint(
+          tokenType === "apiToken"
+            ? "Please enter an API token."
+            : "Please enter a secret."
+        );
+        return;
+      }
+      if (tokenType === "apiToken") {
+        authHeader = `Bearer ${value}`;
+      } else {
+        authHeader = `Basic ${btoa(`${SECRET_USERNAME}:${value}`)}`;
+      }
+    } else {
+      const username = email.trim();
+      if (username.length < 2 || password.length < 2) {
+        setHint("Please enter your username and password.");
+        return;
+      }
+      authHeader = `Basic ${btoa(`${username}:${password}`)}`;
+      typedUsername = username;
+    }
 
+    setSubmitting(true);
     try {
-      const res = await fetch("/ui/ui-login", {
+      const res = await fetch(WS_URL, {
         method: "POST",
-        headers: {
-          Authorization: `Basic ${creds}`,
-        },
+        headers: { Authorization: authHeader },
       });
 
       if (res.ok) {
         const data = await res.json();
-        sessionStorage.setItem("creds", creds);
+        sessionStorage.setItem("auth", authHeader);
         sessionStorage.setItem("site", JSON.stringify(data));
-        setUser(username);
-        sessionStorage.setItem("username", username);
+        // Server-resolved username works in every mode; fall back to
+        // the typed value for classic logins on older backends.
+        const resolved =
+          (typeof data.username === "string" && data.username) ||
+          typedUsername;
+        if (resolved) sessionStorage.setItem("username", resolved);
+        else sessionStorage.removeItem("username");
         navigate("/chat");
       } else if (res.status === 401 || res.status === 403) {
-        setHint("Invalid credentials");
-        navigate("/");
+        setHint(
+          useTokenLogin ? "Invalid or unauthorized token." : "Invalid credentials."
+        );
       } else {
         setHint(`Server error (${res.status}). Please try again later.`);
-        navigate("/");
       }
     } catch {
       setHint("Unable to connect to the server. Please try again later.");
-      navigate("/");
+    } finally {
+      setSubmitting(false);
     }
   };
 
-  const logOut = () => {
-    setUser("");
-    setToken("");
-    sessionStorage.removeItem("site");
-    navigate("/");
-  };
-
-  const form = useForm<z.infer<typeof formSchema>>({
-    resolver: zodResolver(formSchema),
-    defaultValues: {
-      email: "",
-      password: "",
-    },
-  });
-
   const onChangeLang = (e: React.ChangeEvent<HTMLSelectElement>) => {
-    const lang_code = e.target.value;
-    i18n.changeLanguage(lang_code);
+    i18n.changeLanguage(e.target.value);
   };
 
   return (
@@ -106,70 +122,101 @@ export function Login() {
         <br />
         TigerGraph GraphRAG
       </h1>
-      <h4 className="text-center mb-10 text-black dark:text-[#D9D9D9]">
+      <h4 className="text-center mb-8 text-black dark:text-[#D9D9D9]">
         {t("login")}
       </h4>
 
-      <Form {...form}>
-        <form onSubmit={form.handleSubmit(loginAction)}>
-          <FormField
-            control={form.control}
-            name="email"
-            render={({ field }) => (
-              <>
-                <FormItem className="mb-5">
-                  <FormControl>
-                    <Input
-                      placeholder={t("username")}
-                      {...field}
-                      className="dark:border-[#3D3D3D] py-6 dark:bg-shadeA"
-                    />
-                  </FormControl>
-                  <FormDescription></FormDescription>
-                  <FormMessage />
-                </FormItem>
-              </>
-            )}
-          />
-          <FormField
-            control={form.control}
-            name="password"
-            render={({ field }) => (
-              <>
-                <FormItem className="mb-5">
-                  <FormControl>
-                    <Input
-                      placeholder={t("password")}
-                      type="password"
-                      {...field}
-                      className="dark:border-[#3D3D3D] py-6 dark:bg-shadeA"
-                    />
-                  </FormControl>
-                  <FormDescription></FormDescription>
-                  <FormMessage />
-                </FormItem>
-              </>
-            )}
+      <form onSubmit={loginAction}>
+        {useTokenLogin ? (
+          <>
+            <div className="mb-5">
+              <label htmlFor="tokenType" className="block text-sm font-medium mb-2 text-black dark:text-[#D9D9D9]">
+                Credential type
+              </label>
+              <select id="tokenType"
+                value={tokenType}
+                onChange={(e) => setTokenType(e.target.value as TokenType)}
+                className="block w-full h-14 px-3 rounded-md border border-input bg-background dark:border-[#3D3D3D] dark:bg-shadeA text-sm"
+              >
+                <option value="apiToken">API Token</option>
+                <option value="secret">Secret</option>
+              </select>
+            </div>
+            <div className="mb-5">
+              <Input
+                placeholder={
+                  tokenType === "apiToken" ? "API Token" : "Secret"
+                }
+                type="password"
+                value={tokenValue}
+                onChange={(e) => setTokenValue(e.target.value)}
+                autoComplete="off"
+                className={INPUT_STYLE}
+                style={INPUT_CLIP_FIX}
+              />
+            </div>
+          </>
+        ) : (
+          <>
+            <div className="mb-5">
+              <Input
+                placeholder={t("username")}
+                value={email}
+                onChange={(e) => setEmail(e.target.value)}
+                autoComplete="username"
+                className={INPUT_STYLE}
+                style={INPUT_CLIP_FIX}
+              />
+            </div>
+            <div className="mb-5">
+              <Input
+                placeholder={t("password")}
+                type="password"
+                value={password}
+                onChange={(e) => setPassword(e.target.value)}
+                autoComplete="current-password"
+                className={INPUT_STYLE}
+                style={INPUT_CLIP_FIX}
+              />
+            </div>
+          </>
+        )}
+
+        <div className="flex items-center space-x-2 mb-2">
+          <input
+            type="checkbox"
+            id="useTokenLogin"
+            className="rounded border-gray-300 dark:border-[#3D3D3D]"
+            checked={useTokenLogin}
+            onChange={(e) => {
+              setUseTokenLogin(e.target.checked);
+              setTokenValue("");
+              setPassword("");
+            }}
           />
-          {/* <a href="#" className="text-xs text-right block">
-            {t("forgotPassword")}
-          </a> */}
-          <Button type="submit" className="gradient w-full text-white mt-10">
-            {t("submit")}
-          </Button>
-
-          { <div className="inline-flex items-center justify-center w-full">
-            <hr className="w-full h-px my-8 border-0 bg-gray-200 dark:bg-gray-700" />
-            <span className="absolute px-3 text-xs bg-background dark:border-[#3D3D3D] text-gray-900 -translate-x-1/2 left-1/2 dark:text-white">
-              {hint}
-            </span>
-          </div> }
-
-          {/* <a href="#" className="text-xs text-center block !text-tigerOrange">
-            {t("signUp")}
-          </a> */}
-        </form>
-      </Form>
+          <label
+            htmlFor="useTokenLogin"
+            className="text-sm text-black dark:text-[#D9D9D9] cursor-pointer"
+          >
+            Use token login
+          </label>
+        </div>
+
+        <Button
+          type="submit"
+          disabled={submitting}
+          className="gradient w-full text-white mt-6"
+        >
+          {submitting ? "Signing in…" : t("submit")}
+        </Button>
+
+        <div className="inline-flex items-center justify-center w-full">
+          <hr className="w-full h-px my-8 border-0 bg-gray-200 dark:bg-gray-700" />
+          <span className="absolute px-3 text-xs bg-background dark:border-[#3D3D3D] text-gray-900 -translate-x-1/2 left-1/2 dark:text-white">
+            {hint}
+          </span>
+        </div>
+      </form>
 
       <select
         defaultValue={i18n.language}
diff --git a/graphrag-ui/src/components/SideMenu.tsx b/graphrag-ui/src/components/SideMenu.tsx
index 79fe501..e2c3134 100644
--- a/graphrag-ui/src/components/SideMenu.tsx
+++ b/graphrag-ui/src/components/SideMenu.tsx
@@ -95,7 +95,7 @@ const SideMenu = ({
 
   const fetchHistory2 = useCallback(async () => {
     setConversationId([]);
-    const creds = sessionStorage.getItem("creds");
+    const creds = sessionStorage.getItem("auth");
     const username = sessionStorage.getItem("username");
 
     if (!username) {
@@ -109,7 +109,7 @@ const SideMenu = ({
     const settings = {
       method: 'GET',
       headers: {
-        Authorization: `Basic ${creds}`,
+        Authorization: creds!,
         "Content-Type": "application/json",
       }
     }
@@ -209,7 +209,7 @@ const SideMenu = ({
       setExpandedConversations(prev => new Set([...prev, id]));
 
       // Store conversation data for the chat component
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       if (!creds) {
         return;
       }
@@ -217,7 +217,7 @@ const SideMenu = ({
       const settings = {
         method: 'GET',
         headers: {
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
           "Content-Type": "application/json",
         }
       }
diff --git a/graphrag-ui/src/hooks/useIdleTimeout.ts b/graphrag-ui/src/hooks/useIdleTimeout.ts
index 0b54892..76b66d3 100644
--- a/graphrag-ui/src/hooks/useIdleTimeout.ts
+++ b/graphrag-ui/src/hooks/useIdleTimeout.ts
@@ -14,7 +14,7 @@ export function useIdleTimeout(timeoutMs: number = DEFAULT_TIMEOUT_MS) {
   const timerRef = useRef<ReturnType<typeof setTimeout> | null>(null);
 
   const handleTimeout = useCallback(() => {
-    const creds = sessionStorage.getItem("creds");
+    const creds = sessionStorage.getItem("auth");
     if (!creds) return; // Not logged in, nothing to do
 
     sessionStorage.clear();
@@ -27,7 +27,7 @@ export function useIdleTimeout(timeoutMs: number = DEFAULT_TIMEOUT_MS) {
       clearTimeout(timerRef.current);
     }
     // Only set timer if user is logged in
-    if (sessionStorage.getItem("creds")) {
+    if (sessionStorage.getItem("auth")) {
       timerRef.current = setTimeout(handleTimeout, timeoutMs);
     }
   }, [handleTimeout, timeoutMs]);
diff --git a/graphrag-ui/src/hooks/useRoles.ts b/graphrag-ui/src/hooks/useRoles.ts
index b9fd578..f6b2432 100644
--- a/graphrag-ui/src/hooks/useRoles.ts
+++ b/graphrag-ui/src/hooks/useRoles.ts
@@ -34,7 +34,7 @@ export function useRoles(refreshKey?: unknown): RolesState {
   );
 
   const loadRoles = useCallback(async () => {
-    const creds = sessionStorage.getItem("creds");
+    const creds = sessionStorage.getItem("auth");
     if (!creds) {
       setUserRoles([]);
       setGraphRoles({});
@@ -58,7 +58,7 @@ export function useRoles(refreshKey?: unknown): RolesState {
     // Fallback: fetch from backend (for sessions created before login returned roles)
     try {
       const response = await fetch("/ui/roles", {
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
       if (!response.ok) {
         setUserRoles([]);
diff --git a/graphrag-ui/src/main.tsx b/graphrag-ui/src/main.tsx
index 1788c05..69a77e5 100755
--- a/graphrag-ui/src/main.tsx
+++ b/graphrag-ui/src/main.tsx
@@ -20,7 +20,7 @@ import "./components/i18n";
 
 /** Redirect to login if no credentials in session. */
 const RequireAuth = ({ children }: { children: any }) => {
-  if (!sessionStorage.getItem("creds")) {
+  if (!sessionStorage.getItem("auth")) {
     return <Navigate to="/" replace />;
   }
   return children;
diff --git a/graphrag-ui/src/pages/Setup.tsx b/graphrag-ui/src/pages/Setup.tsx
index f1a8d79..e660478 100644
--- a/graphrag-ui/src/pages/Setup.tsx
+++ b/graphrag-ui/src/pages/Setup.tsx
@@ -103,9 +103,9 @@ const [activeTab, setActiveTab] = useState("upload");
     if (!ingestGraphName) return;
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const response = await fetch(`/ui/${ingestGraphName}/uploads/list`, {
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
       const data = await safeJson(response);
       setUploadedFiles(data.files || []);
@@ -152,13 +152,13 @@ const [activeTab, setActiveTab] = useState("upload");
     setUploadMessage("Uploading files...");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const formData = new FormData();
       filesArray.forEach((file) => formData.append("files", file));
 
       const response = await fetch(`/ui/${ingestGraphName}/uploads?overwrite=true`, {
         method: "POST",
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
         body: formData,
       });
 
@@ -201,7 +201,7 @@ const [activeTab, setActiveTab] = useState("upload");
     setUploadMessage("Total size exceeds limit. Uploading files one by one...");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       let uploadedCount = 0;
       let failedCount = 0;
       const totalFiles = filesArray.length;
@@ -219,7 +219,7 @@ const [activeTab, setActiveTab] = useState("upload");
         try {
           const response = await fetch(`/ui/${ingestGraphName}/uploads?overwrite=true`, {
             method: "POST",
-            headers: { Authorization: `Basic ${creds}` },
+            headers: { Authorization: creds! },
             body: formData,
           });
 
@@ -274,13 +274,13 @@ const [activeTab, setActiveTab] = useState("upload");
     console.log("Deleting file:", filename);
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
 
       // Delete original file
       const url = `/ui/${ingestGraphName}/uploads?filename=${encodeURIComponent(filename)}`;
       const response = await fetch(url, {
           method: "DELETE",
-          headers: { Authorization: `Basic ${creds}` },
+          headers: { Authorization: creds! },
         });
       const data = await response.json();
       setUploadMessage(`✅ ${data.message}`);
@@ -302,10 +302,10 @@ const [activeTab, setActiveTab] = useState("upload");
     if (!shouldDelete) return;
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const response = await fetch(`/ui/${ingestGraphName}/uploads`, {
         method: "DELETE",
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
       const data = await response.json();
       
@@ -324,9 +324,9 @@ const [activeTab, setActiveTab] = useState("upload");
     if (!ingestGraphName) return;
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const response = await fetch(`/ui/${ingestGraphName}/cloud/list`, {
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
       const data = await response.json();
       setDownloadedFiles(data.files || []);
@@ -346,7 +346,7 @@ const [activeTab, setActiveTab] = useState("upload");
     setDownloadMessage("Downloading files from cloud storage...");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       
       // Prepare request body based on provider
       let requestBody: any = { provider: cloudProvider };
@@ -397,7 +397,7 @@ const [activeTab, setActiveTab] = useState("upload");
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(requestBody),
       });
@@ -438,13 +438,13 @@ const [activeTab, setActiveTab] = useState("upload");
     if (!ingestGraphName) return;
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       
       // Delete original file
       const url = `/ui/${ingestGraphName}/cloud/delete?filename=${encodeURIComponent(filename)}`;
       const response = await fetch(url, {
           method: "DELETE",
-          headers: { Authorization: `Basic ${creds}` },
+          headers: { Authorization: creds! },
         }
       );
       const data = await response.json();
@@ -463,10 +463,10 @@ const [activeTab, setActiveTab] = useState("upload");
     if (!shouldDelete) return;
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const response = await fetch(`/ui/${ingestGraphName}/cloud/delete`, {
         method: "DELETE",
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
       const data = await response.json();
       setDownloadMessage(`✅ ${data.message}`);
@@ -486,7 +486,7 @@ const [activeTab, setActiveTab] = useState("upload");
     setIsIngesting(true);
     setIngestMessage("Ingesting documents into knowledge graph...");
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const folderPath = sourceType === "uploaded" ? `uploads/${ingestGraphName}` : `downloaded_files_cloud/${ingestGraphName}`;
       
       // Use existing ingestJobData if available, otherwise construct from folder path
@@ -505,7 +505,7 @@ const [activeTab, setActiveTab] = useState("upload");
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify({
           load_job_id: jobData.load_job_id,
@@ -548,7 +548,7 @@ const [activeTab, setActiveTab] = useState("upload");
     setIngestMessage("Step 1/2: Creating ingest job...");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
 
       // Step 1: Create ingest job
       const createIngestConfig = {
@@ -564,7 +564,7 @@ const [activeTab, setActiveTab] = useState("upload");
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(createIngestConfig),
       });
@@ -602,7 +602,7 @@ const [activeTab, setActiveTab] = useState("upload");
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(loadingInfo),
       });
@@ -644,7 +644,7 @@ const [activeTab, setActiveTab] = useState("upload");
     console.log("fileCount:", fileCount);
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
 
       // Call create_ingest to process files
       const createIngestConfig = {
@@ -662,7 +662,7 @@ const [activeTab, setActiveTab] = useState("upload");
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(createIngestConfig),
       });
@@ -742,7 +742,7 @@ const [activeTab, setActiveTab] = useState("upload");
     setIsIngesting(true);
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       let loadingInfo: any = {};
 
       if (skipBDAProcessing) {
@@ -796,7 +796,7 @@ const [activeTab, setActiveTab] = useState("upload");
           method: "POST",
           headers: {
             "Content-Type": "application/json",
-            Authorization: `Basic ${creds}`,
+            Authorization: creds!,
           },
           body: JSON.stringify(createIngestConfig),
         });
@@ -824,7 +824,7 @@ const [activeTab, setActiveTab] = useState("upload");
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(loadingInfo),
       });
@@ -860,11 +860,11 @@ const [activeTab, setActiveTab] = useState("upload");
     }
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const statusResponse = await fetch(`/ui/${graphName}/rebuild_status`, {
         method: "GET",
         headers: {
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
       });
 
@@ -931,13 +931,13 @@ const [activeTab, setActiveTab] = useState("upload");
     setRefreshMessage("Verifying rebuild status...");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
 
       // Final status check to prevent race conditions
       const statusCheckResponse = await fetch(`/ui/${refreshGraphName}/rebuild_status`, {
         method: "GET",
         headers: {
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
       });
 
@@ -957,7 +957,7 @@ const [activeTab, setActiveTab] = useState("upload");
       const response = await fetch(`/ui/${refreshGraphName}/rebuild_graph`, {
         method: "POST",
         headers: {
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
       });
 
@@ -1017,10 +1017,10 @@ const [activeTab, setActiveTab] = useState("upload");
         setRefreshGraphName(store.graphs[0]);
       }
     }
-    const creds = sessionStorage.getItem("creds");
+    const creds = sessionStorage.getItem("auth");
     if (!creds) return;
     fetch("/ui/list_graphs", {
-      headers: { Authorization: `Basic ${creds}` },
+      headers: { Authorization: creds! },
     })
       .then((r) => (r.ok ? r.json() : null))
       .then((data) => {
@@ -1063,7 +1063,7 @@ const [activeTab, setActiveTab] = useState("upload");
 
     try {
       // Get credentials from sessionStorage
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       if (!creds) {
         throw new Error("Not authenticated. Please login first.");
       }
@@ -1073,7 +1073,7 @@ const [activeTab, setActiveTab] = useState("upload");
       const createResponse = await fetch(`/ui/${graphName}/create_graph`, {
         method: "POST",
         headers: {
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
       });
 
@@ -1105,7 +1105,7 @@ const [activeTab, setActiveTab] = useState("upload");
       const initResponse = await fetch(`/ui/${graphName}/initialize_graph`, {
         method: "POST",
         headers: {
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
       });
 
diff --git a/graphrag-ui/src/pages/TraceLogs.tsx b/graphrag-ui/src/pages/TraceLogs.tsx
index d5f0a0e..821059b 100644
--- a/graphrag-ui/src/pages/TraceLogs.tsx
+++ b/graphrag-ui/src/pages/TraceLogs.tsx
@@ -736,7 +736,7 @@ const TraceLogs: FC<TraceLogsProps> = ({ messageIdProp, onClose }) => {
       setLoading(false);
       return;
     }
-    const creds = sessionStorage.getItem("creds");
+    const creds = sessionStorage.getItem("auth");
     // Skip the API call when there are no creds — sending ``Basic null``
     // makes FastAPI's HTTPBasic challenge with ``WWW-Authenticate: Basic``
     // which triggers the browser's native auth popup. Better to show
@@ -748,7 +748,7 @@ const TraceLogs: FC<TraceLogsProps> = ({ messageIdProp, onClose }) => {
     }
     setLoading(true);
     fetch(`/ui/trace/${messageId}`, {
-      headers: { Authorization: `Basic ${creds}` },
+      headers: { Authorization: creds! },
     })
       .then((res) => {
         if (!res.ok) throw new Error("Not found");
diff --git a/graphrag-ui/src/pages/setup/CustomizePrompts.tsx b/graphrag-ui/src/pages/setup/CustomizePrompts.tsx
index 92142e6..6c83d7a 100644
--- a/graphrag-ui/src/pages/setup/CustomizePrompts.tsx
+++ b/graphrag-ui/src/pages/setup/CustomizePrompts.tsx
@@ -68,13 +68,13 @@ const CustomizePrompts = () => {
     setSaveMessageType("");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const query = selectedGraph ? `?graphname=${encodeURIComponent(selectedGraph)}` : "";
       const response = await fetch(`/ui/prompts${query}`, {
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify({
           prompt_type: promptId,
@@ -110,10 +110,10 @@ const CustomizePrompts = () => {
     setIsLoading(true);
     const effectiveGraph = graphname ?? selectedGraph;
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const query = effectiveGraph ? `?graphname=${encodeURIComponent(effectiveGraph)}` : "";
       const response = await fetch(`/ui/prompts${query}`, {
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
 
       if (!response.ok) {
diff --git a/graphrag-ui/src/pages/setup/GraphDBConfig.tsx b/graphrag-ui/src/pages/setup/GraphDBConfig.tsx
index 1d478cd..dabf97f 100644
--- a/graphrag-ui/src/pages/setup/GraphDBConfig.tsx
+++ b/graphrag-ui/src/pages/setup/GraphDBConfig.tsx
@@ -49,9 +49,9 @@ const GraphDBConfig = () => {
   const fetchConfig = async () => {
     setIsLoading(true);
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const response = await fetch("/ui/config", {
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
 
       if (!response.ok) {
@@ -99,7 +99,7 @@ const GraphDBConfig = () => {
     setConnectionTested(false);
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const testConfig: any = {
         hostname: effective(hostname, "hostname"),
         restppPort: effective(restppPort, "restppPort"),
@@ -116,7 +116,7 @@ const GraphDBConfig = () => {
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(testConfig),
       });
@@ -150,7 +150,7 @@ const GraphDBConfig = () => {
     setMessageType("");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const effectiveHostname = effective(hostname, "hostname");
       const effectiveUsername = effective(username, "username");
       const dbConfigData: any = {
@@ -172,7 +172,7 @@ const GraphDBConfig = () => {
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(dbConfigData),
       });
@@ -196,7 +196,7 @@ const GraphDBConfig = () => {
           
           setTimeout(() => {
             // Clear sessionStorage and redirect to login
-            sessionStorage.removeItem("creds");
+            sessionStorage.removeItem("auth");
             alert(reason);
             window.location.href = "/"; // Redirect to root (login page)
           }, 2000); // Give user 2 seconds to see the success message
diff --git a/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx b/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx
index 962f505..2e439ca 100644
--- a/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx
+++ b/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx
@@ -109,7 +109,7 @@ const GraphRAGConfig = () => {
     setIsLoading(true);
     const effectiveScope = scope ?? configScope;
     const effectiveGraph = graphname ?? selectedGraph;
-    const creds = sessionStorage.getItem("creds");
+    const creds = sessionStorage.getItem("auth");
     const params = new URLSearchParams();
     if (effectiveGraph) params.set("graphname", effectiveGraph);
     if (effectiveScope === "graph") params.set("scope", "graph");
@@ -134,7 +134,7 @@ const GraphRAGConfig = () => {
     for (let attempt = 1; attempt <= maxAttempts; attempt++) {
       try {
         const response = await fetch(url, {
-          headers: { Authorization: `Basic ${creds}` },
+          headers: { Authorization: creds! },
         });
         lastStatus = response.status;
         if (!response.ok) {
@@ -190,7 +190,7 @@ const GraphRAGConfig = () => {
     setMessageType("");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       
       // Build current UI state — only include non-empty fields
       const currentChunkerConfig: any = {};
@@ -321,7 +321,7 @@ const GraphRAGConfig = () => {
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(graphragConfigData),
       });
diff --git a/graphrag-ui/src/pages/setup/IngestGraph.tsx b/graphrag-ui/src/pages/setup/IngestGraph.tsx
index 69197be..f91dfe2 100644
--- a/graphrag-ui/src/pages/setup/IngestGraph.tsx
+++ b/graphrag-ui/src/pages/setup/IngestGraph.tsx
@@ -95,9 +95,9 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     if (!ingestGraphName) return;
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const response = await fetch(`/ui/${ingestGraphName}/uploads/list`, {
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
       const data = await response.json();
       setUploadedFiles(data.files || []);
@@ -153,7 +153,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     setIngestMessage("");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const formData = new FormData();
       filesArray.forEach((file) => formData.append("files", file));
 
@@ -161,7 +161,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
         `/ui/${ingestGraphName}/uploads?overwrite=true`,
         {
           method: "POST",
-          headers: { Authorization: `Basic ${creds}` },
+          headers: { Authorization: creds! },
           body: formData,
         }
       );
@@ -205,7 +205,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     setIngestMessage("");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       let uploadedCount = 0;
       let failedCount = 0;
       const totalFiles = filesArray.length;
@@ -229,7 +229,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
             `/ui/${ingestGraphName}/uploads?overwrite=true`,
             {
               method: "POST",
-              headers: { Authorization: `Basic ${creds}` },
+              headers: { Authorization: creds! },
               body: formData,
             }
           );
@@ -283,12 +283,12 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     if (!ingestGraphName) return;
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const response = await fetch(
         `/ui/${ingestGraphName}/uploads?filename=${encodeURIComponent(filename)}`,
         {
           method: "DELETE",
-          headers: { Authorization: `Basic ${creds}` },
+          headers: { Authorization: creds! },
         }
       );
       const data = await response.json();
@@ -309,10 +309,10 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     if (!shouldDelete) return;
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const response = await fetch(`/ui/${ingestGraphName}/uploads`, {
         method: "DELETE",
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
       const data = await response.json();
       setUploadMessage(`✅ ${data.message}`);
@@ -327,9 +327,9 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     if (!ingestGraphName) return;
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const response = await fetch(`/ui/${ingestGraphName}/cloud/list`, {
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
       const data = await response.json();
       setDownloadedFiles(data.files || []);
@@ -349,7 +349,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     setDownloadMessage("Downloading files from cloud storage...");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
 
       // Prepare request body based on provider
       let requestBody: any = { provider: cloudProvider };
@@ -400,7 +400,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(requestBody),
       });
@@ -440,14 +440,14 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     if (!ingestGraphName) return;
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const response = await fetch(
         `/ui/${ingestGraphName}/cloud/delete?filename=${encodeURIComponent(
           filename
         )}`,
         {
           method: "DELETE",
-          headers: { Authorization: `Basic ${creds}` },
+          headers: { Authorization: creds! },
         }
       );
       const data = await response.json();
@@ -468,10 +468,10 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     if (!shouldDelete) return;
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const response = await fetch(`/ui/${ingestGraphName}/cloud/delete`, {
         method: "DELETE",
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
       const data = await response.json();
       setDownloadMessage(`✅ ${data.message}`);
@@ -489,7 +489,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     setIsIngesting(true);
     setIngestMessage("Ingesting documents into knowledge graph...");
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const folderPath = sourceType === "uploaded" ? `uploads/${ingestGraphName}` : `downloaded_files_cloud/${ingestGraphName}`;
 
       // If no cached job from a prior create_ingest, run it now. The
@@ -506,7 +506,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
             method: "POST",
             headers: {
               "Content-Type": "application/json",
-              Authorization: `Basic ${creds}`,
+              Authorization: creds!,
             },
             body: JSON.stringify({
               data_source: "server",
@@ -536,7 +536,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify({
           load_job_id: jobData.load_job_id,
@@ -578,7 +578,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     setIngestMessage("Step 1/2: Creating ingest job...");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
 
       const createIngestConfig = {
         data_source: "server",
@@ -591,7 +591,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(createIngestConfig),
       });
@@ -626,7 +626,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
           method: "POST",
           headers: {
             "Content-Type": "application/json",
-            Authorization: `Basic ${creds}`,
+            Authorization: creds!,
           },
           body: JSON.stringify(loadingInfo),
         });
@@ -666,7 +666,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     console.log("fileCount:", fileCount);
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
 
       const createIngestConfig = {
         data_source: "server",
@@ -681,7 +681,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(createIngestConfig),
       });
@@ -772,7 +772,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     setIsIngesting(true);
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       let loadingInfo: any = {};
 
       if (skipBDAProcessing) {
@@ -832,7 +832,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
             method: "POST",
             headers: {
               "Content-Type": "application/json",
-              Authorization: `Basic ${creds}`,
+              Authorization: creds!,
             },
             body: JSON.stringify(createIngestConfig),
           }
@@ -867,7 +867,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(loadingInfo),
       });
@@ -915,10 +915,10 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
         setIngestGraphName(store.graphs[0]);
       }
     }
-    const creds = sessionStorage.getItem("creds");
+    const creds = sessionStorage.getItem("auth");
     if (!creds) return;
     fetch("/ui/list_graphs", {
-      headers: { Authorization: `Basic ${creds}` },
+      headers: { Authorization: creds! },
     })
       .then((r) => (r.ok ? r.json() : null))
       .then((data) => {
diff --git a/graphrag-ui/src/pages/setup/KGAdmin.tsx b/graphrag-ui/src/pages/setup/KGAdmin.tsx
index 19b8ae8..f4b6f61 100644
--- a/graphrag-ui/src/pages/setup/KGAdmin.tsx
+++ b/graphrag-ui/src/pages/setup/KGAdmin.tsx
@@ -330,10 +330,10 @@ const KGAdmin = () => {
         setRefreshGraphName(store.graphs[0]);
       }
     }
-    const creds = sessionStorage.getItem("creds");
+    const creds = sessionStorage.getItem("auth");
     if (!creds) return;
     fetch("/ui/list_graphs", {
-      headers: { Authorization: `Basic ${creds}` },
+      headers: { Authorization: creds! },
     })
       .then((r) => (r.ok ? r.json() : null))
       .then((data) => {
@@ -376,9 +376,9 @@ const KGAdmin = () => {
     if (isExtractingSchema || draftProposal) {
       setSchemaSource("samples");
     }
-    const creds = sessionStorage.getItem("creds");
+    const creds = sessionStorage.getItem("auth");
     if (!creds) return;
-    fetch(`/ui/config`, { headers: { Authorization: `Basic ${creds}` } })
+    fetch(`/ui/config`, { headers: { Authorization: creds! } })
       .then((r) => (r.ok ? r.json() : null))
       .then((data) => {
         const cfg = data?.graphrag_config || {};
@@ -396,7 +396,7 @@ const KGAdmin = () => {
     // downstream parser would still drop reserved/structural names,
     // just without the inline message.
     fetch(`/ui/schema_reserved_names`, {
-      headers: { Authorization: `Basic ${creds}` },
+      headers: { Authorization: creds! },
     })
       .then((r) => (r.ok ? r.json() : null))
       .then((data) => {
@@ -474,7 +474,7 @@ const KGAdmin = () => {
     // user isn't logged out mid-extraction.
     pauseIdleTimer();
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       if (!creds) throw new Error("Not authenticated. Please login first.");
 
       // Step 1/2: upload + convert. Returns the saved filenames so we
@@ -485,7 +485,7 @@ const KGAdmin = () => {
         `/ui/${graphName}/convert_sample_files`,
         {
           method: "POST",
-          headers: { Authorization: `Basic ${creds}` },
+          headers: { Authorization: creds! },
           body: form,
         }
       );
@@ -504,7 +504,7 @@ const KGAdmin = () => {
         {
           method: "POST",
           headers: {
-            Authorization: `Basic ${creds}`,
+            Authorization: creds!,
             "Content-Type": "application/json",
           },
           body: JSON.stringify({
@@ -591,9 +591,9 @@ const KGAdmin = () => {
     setPrecheckRunning(true);
     setPrecheckMessage("");
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const eligResp = await fetch(`/ui/${graphName}/check_init_eligibility`, {
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
       const elig = await eligResp.json();
       if (!eligResp.ok) {
@@ -637,7 +637,7 @@ const KGAdmin = () => {
           {
             method: "POST",
             headers: {
-              Authorization: `Basic ${creds}`,
+              Authorization: creds!,
               "Content-Type": "application/json",
             },
             body: JSON.stringify({
@@ -695,7 +695,7 @@ const KGAdmin = () => {
     pauseIdleTimer();
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       if (!creds) {
         throw new Error("Not authenticated. Please login first.");
       }
@@ -703,7 +703,7 @@ const KGAdmin = () => {
       setStatusMessage("Step 1/2: Creating graph...");
       const createResponse = await fetch(`/ui/${graphName}/create_graph`, {
         method: "POST",
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
 
       const createData = await createResponse.json();
@@ -756,7 +756,7 @@ const KGAdmin = () => {
       const initResponse = await fetch(`/ui/${graphName}/initialize_graph`, {
         method: "POST",
         headers: {
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
           "Content-Type": "application/json",
         },
         body: JSON.stringify(initBody),
@@ -810,7 +810,7 @@ const KGAdmin = () => {
         try {
           statusResp = await fetch(
             `/ui/${graphName}/initialize_status`,
-            { headers: { Authorization: `Basic ${creds}` } }
+            { headers: { Authorization: creds! } }
           );
         } catch {
           // Transient network blip — retry on the next tick rather
@@ -863,7 +863,7 @@ const KGAdmin = () => {
           await fetch("/ui/prompts", {
             method: "POST",
             headers: {
-              Authorization: `Basic ${creds}`,
+              Authorization: creds!,
               "Content-Type": "application/json",
             },
             body: JSON.stringify({
@@ -921,10 +921,10 @@ const KGAdmin = () => {
     }
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const statusResponse = await fetch(`/ui/${graphName}/rebuild_status`, {
         method: "GET",
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
 
       if (statusResponse.ok) {
@@ -1003,12 +1003,12 @@ const KGAdmin = () => {
     setRefreshMessage("Verifying rebuild status...");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
 
       // Final status check to prevent race conditions
       const statusCheckResponse = await fetch(`/ui/${refreshGraphName}/rebuild_status`, {
         method: "GET",
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
 
       if (statusCheckResponse.ok) {
@@ -1026,7 +1026,7 @@ const KGAdmin = () => {
 
       const response = await fetch(`/ui/${refreshGraphName}/rebuild_graph`, {
         method: "POST",
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
 
       if (!response.ok) {
diff --git a/graphrag-ui/src/pages/setup/LLMConfig.tsx b/graphrag-ui/src/pages/setup/LLMConfig.tsx
index a33379c..1013c7d 100644
--- a/graphrag-ui/src/pages/setup/LLMConfig.tsx
+++ b/graphrag-ui/src/pages/setup/LLMConfig.tsx
@@ -175,13 +175,13 @@ const LLMConfig = () => {
     const effectiveScope = scope ?? configScope;
     const effectiveGraph = graphname ?? selectedGraph;
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const params = new URLSearchParams();
       if (effectiveGraph) params.set("graphname", effectiveGraph);
       if (effectiveScope === "graph") params.set("scope", "graph");
       const queryString = params.toString() ? `?${params.toString()}` : "";
       const response = await fetch(`/ui/config${queryString}`, {
-        headers: { Authorization: `Basic ${creds}` },
+        headers: { Authorization: creds! },
       });
 
       if (!response.ok) {
@@ -480,7 +480,7 @@ const LLMConfig = () => {
     setMessageType("");
 
     try {
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       let llmConfigData: any;
 
       // Graph admin saving chatbot config
@@ -503,7 +503,7 @@ const LLMConfig = () => {
           method: "POST",
           headers: {
             "Content-Type": "application/json",
-            Authorization: `Basic ${creds}`,
+            Authorization: creds!,
           },
           body: JSON.stringify(llmConfigData),
         });
@@ -527,7 +527,7 @@ const LLMConfig = () => {
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(llmConfigData),
       });
@@ -614,14 +614,14 @@ const LLMConfig = () => {
         if (useCustomChatbot && !chatbotModelName.trim()) { failValidation("Chatbot Model is required when not inheriting from completion"); return; }
       }
       
-      const creds = sessionStorage.getItem("creds");
+      const creds = sessionStorage.getItem("auth");
       const llmConfigData = buildLLMConfigPayload();
 
       const response = await fetch("/ui/config/llm/test", {
         method: "POST",
         headers: {
           "Content-Type": "application/json",
-          Authorization: `Basic ${creds}`,
+          Authorization: creds!,
         },
         body: JSON.stringify(llmConfigData),
       });
diff --git a/graphrag-ui/src/pages/setup/SetupLayout.tsx b/graphrag-ui/src/pages/setup/SetupLayout.tsx
index 31cf93f..7720e4e 100644
--- a/graphrag-ui/src/pages/setup/SetupLayout.tsx
+++ b/graphrag-ui/src/pages/setup/SetupLayout.tsx
@@ -23,9 +23,9 @@ const SetupLayout = () => {
   // checks. Falls back to empty silently if the endpoint is unreachable.
   const [version, setVersion] = useState<string>("");
   useEffect(() => {
-    const creds = sessionStorage.getItem("creds");
+    const creds = sessionStorage.getItem("auth");
     if (!creds) return;
-    fetch("/ui/version", { headers: { Authorization: `Basic ${creds}` } })
+    fetch("/ui/version", { headers: { Authorization: creds! } })
       .then((r) => (r.ok ? r.json() : null))
       .then((data) => {
         const v = data?.graphrag?.version;
diff --git a/graphrag/app/routers/ui.py b/graphrag/app/routers/ui.py
index ebf32ae..27bc954 100644
--- a/graphrag/app/routers/ui.py
+++ b/graphrag/app/routers/ui.py
@@ -38,6 +38,7 @@
     Body,
     Depends,
     File,
+    Header,
     HTTPException,
     Path,
     Request,
@@ -46,8 +47,7 @@
     WebSocketDisconnect,
     status,
 )
-from fastapi.security import HTTPBasic, HTTPBasicCredentials
-from fastapi.security.http import HTTPBase
+from fastapi.security import HTTPBasicCredentials
 from pyTigerGraph import TigerGraphConnection
 from pyTigerGraph.common.exception import TigerGraphException
 from tools.validation_utils import MapQuestionToSchemaException
@@ -141,7 +141,6 @@ def _save_trace_log(message_id: str, conversation_id: str, user_query: str, resp
 use_cypher = os.getenv("USE_CYPHER", "false").lower() == "true"
 route_prefix = "/ui"  # APIRouter's prefix doesn't work with the websocket, so it has to be done here
 router = APIRouter(tags=["UI"])
-security = HTTPBasic()
 llm_config_lock = asyncio.Lock()
 
 # Cache for user role lookups (avoids repeated GSQL calls)
@@ -162,24 +161,44 @@ def _normalize_roles(raw_roles: str) -> list[str]:
     return [r.strip().lower() for r in re.split(r"[,\s]+", cleaned) if r.strip()]
 
 
-def _parse_user_roles_detail(user_info: str, username: str) -> tuple[list[str], dict[str, list[str]]]:
+def _parse_user_roles_detail(user_info: str) -> tuple[list[str], dict[str, list[str]], str]:
+    """Single-pass parser for ``SHOW USER`` output. Returns
+    ``(global_roles, graph_roles, current_user)`` where ``current_user``
+    is the username flagged by TG's ``*`` marker (the effective user
+    for the session that ran the call). Roles are extracted only from
+    that ``*``-marked block.
+
+    Returning the resolved user lets callers handle the case where the
+    login name was a sentinel like ``__GSQL__secret`` and the real
+    identity is whoever the secret belongs to.
+    """
     global_roles: list[str] = []
     graph_roles: dict[str, list[str]] = {}
+    current_user = ""
     is_user_section = False
     for line in user_info.splitlines():
-        line_stripped = line.strip()
+        line_stripped = line.lstrip()
+        # Capture the leading marker (``*`` for current user, ``-`` for
+        # the other users, possibly absent on a header) so we can pick
+        # the right block.
         match = re.match(
-            r"^[\*\-]?\s*\-?\s*(Name|User Name|User)\s*:\s*(.+)$",
+            r"^([\*\-])?\s*-?\s*(?:Name|User Name|User)\s*:\s*(.+)$",
             line_stripped,
             re.IGNORECASE,
         )
         if match:
-            current_name = match.group(2).strip()
-            is_user_section = current_name == username
+            marker = match.group(1)
+            name = match.group(2).strip()
+            if marker == "*":
+                current_user = name
+                is_user_section = True
+            else:
+                is_user_section = False
             continue
         if not is_user_section:
             continue
 
+        line_stripped = line_stripped.strip()
         roles_match = re.match(
             r"^[\*\-]?\s*\-?\s*(Global Roles|Roles)\s*:\s*(.+)$",
             line_stripped,
@@ -200,15 +219,26 @@ def _parse_user_roles_detail(user_info: str, username: str) -> tuple[list[str],
             if roles:
                 graph_roles[graph_name] = roles
 
-    return global_roles, graph_roles
+    return global_roles, graph_roles, current_user
 
 
-def _parse_user_roles(user_info: str, username: str) -> list[str]:
-    global_roles, _ = _parse_user_roles_detail(user_info, username)
+def _parse_user_roles(user_info: str, username: str = "") -> list[str]:
+    """Return the global roles of the ``*``-marked user in ``SHOW USER``
+    output; ``username`` is ignored and kept only for back-compat."""
+    global_roles, _, _ = _parse_user_roles_detail(user_info)
     return global_roles
 
-def _get_user_role_details(username: str, password: str) -> tuple[list[str], dict[str, list[str]]]:
-    """Get user roles with short TTL cache to avoid repeated GSQL calls."""
+def _get_user_role_details(
+    username: str, password: str
+) -> tuple[list[str], dict[str, list[str]], str]:
+    """Get user roles + resolved username with a short TTL cache.
+
+    Returns ``(global_roles, graph_roles, resolved_username)`` where
+    ``resolved_username`` is the user TG marks as current in ``SHOW
+    USER`` output. For sentinel logins (e.g. ``__GSQL__secret``) this
+    is the secret's owner; for classic user/password logins it matches
+    the input.
+    """
     pwd_hash = hashlib.sha256(password.encode()).hexdigest()[:16]
     cache_key = (username, pwd_hash)
     now = time.time()
@@ -218,14 +248,28 @@ def _get_user_role_details(username: str, password: str) -> tuple[list[str], dic
         if cached and (now - cached[0]) < _ROLE_CACHE_TTL:
             return cached[1]
 
-    conn = TigerGraphConnection(
-        host=db_config.get("hostname"),
-        username=username,
-        password=password,
-        gsPort=db_config.get("gsPort"),
-        restppPort=db_config.get("restppPort"),
-        graphname="",
-    )
+    # Mirror the auth() dispatch — API-token logins build the
+    # connection with ``apiToken``; secret logins
+    # (``__GSQL__secret``) and classic user/password both go through
+    # the username/password slots (pyTigerGraph routes the secret
+    # case natively).
+    if username == _UI_TOKEN_SENTINEL:
+        conn = TigerGraphConnection(
+            host=db_config.get("hostname"),
+            gsPort=db_config.get("gsPort"),
+            restppPort=db_config.get("restppPort"),
+            graphname="",
+            apiToken=password,
+        )
+    else:
+        conn = TigerGraphConnection(
+            host=db_config.get("hostname"),
+            username=username,
+            password=password,
+            gsPort=db_config.get("gsPort"),
+            restppPort=db_config.get("restppPort"),
+            graphname="",
+        )
 
     # Transient GSQL hiccups when the role-cache TTL expires were
     # surfacing as 403 "Unable to verify user roles" banners on the
@@ -235,7 +279,10 @@ def _get_user_role_details(username: str, password: str) -> tuple[list[str], dic
     for attempt in range(2):
         try:
             user_info = conn.gsql("SHOW USER")
-            result = _parse_user_roles_detail(user_info, username)
+            roles, graph_roles, resolved = _parse_user_roles_detail(user_info)
+            if not resolved:
+                resolved = username
+            result = (roles, graph_roles, resolved)
             with _role_cache_lock:
                 _role_cache[cache_key] = (now, result)
             return result
@@ -248,7 +295,7 @@ def _get_user_role_details(username: str, password: str) -> tuple[list[str], dic
 
 
 def _get_user_roles(username: str, password: str) -> list[str]:
-    global_roles, _ = _get_user_role_details(username, password)
+    global_roles, _, _ = _get_user_role_details(username, password)
     return global_roles
 
 def _require_roles(credentials: HTTPBasicCredentials, allowed_roles: set[str]) -> list[str]:
@@ -289,7 +336,7 @@ def _require_prompt_access(credentials: HTTPBasicCredentials, graphname: str | N
     if graphname:
         validate_graphname(graphname)
     try:
-        global_roles, graph_roles = _get_user_role_details(credentials.username, credentials.password)
+        global_roles, graph_roles, _ = _get_user_role_details(credentials.username, credentials.password)
     except Exception as e:
         logger.error(f"Failed to resolve user roles: {e}")
         raise HTTPException(status_code=403, detail="Unable to verify user roles.")
@@ -306,7 +353,7 @@ def _resolve_llm_config_access(
     if graphname:
         validate_graphname(graphname)
     try:
-        global_roles, graph_roles = _get_user_role_details(
+        global_roles, graph_roles, _ = _get_user_role_details(
             credentials.username, credentials.password
         )
     except Exception as e:
@@ -343,11 +390,103 @@ def _ecc_jobs_running(graphs: list[str], auth_header: str) -> bool:
     return False
 
 
+_UI_TOKEN_SENTINEL = "__graphrag_token__"
+
+
+def _parse_auth_header(authorization: str | None) -> HTTPBasicCredentials:
+    """Parse an ``Authorization`` header value into ``HTTPBasicCredentials``.
+
+    ``Basic <b64>`` must decode to ``username:password``; the password may
+    itself contain ``:``. ``Bearer <token>`` maps to the synthetic
+    ``(_UI_TOKEN_SENTINEL, token)`` pair that downstream code dispatches
+    on for API-token logins. Raises ``HTTPException`` (401) when the
+    header is missing, malformed, or uses any other scheme.
+    """
+    if not authorization:
+        raise HTTPException(
+            status_code=status.HTTP_401_UNAUTHORIZED,
+            detail="Missing Authorization header",
+            headers={"WWW-Authenticate": "Basic"},
+        )
+    scheme, _, value = authorization.partition(" ")
+    scheme = scheme.strip().lower()
+    value = value.strip()
+    if scheme == "basic" and value:
+        try:
+            decoded = base64.b64decode(value).decode()
+            username, sep, password = decoded.partition(":")
+        except Exception:
+            sep = ""
+        # No ":" means the payload is not a user:password pair (RFC 7617).
+        if not sep:
+            raise HTTPException(
+                status_code=status.HTTP_401_UNAUTHORIZED,
+                detail="Malformed Basic credentials",
+                headers={"WWW-Authenticate": "Basic"},
+            )
+        return HTTPBasicCredentials(username=username, password=password)
+    if scheme == "bearer" and value:
+        return HTTPBasicCredentials(username=_UI_TOKEN_SENTINEL, password=value)
+    raise HTTPException(
+        status_code=status.HTTP_401_UNAUTHORIZED,
+        detail="Unsupported Authorization scheme",
+        headers={"WWW-Authenticate": "Basic"},
+    )
+
+
+def _chat_history_auth_header(creds: HTTPBasicCredentials) -> str:
+    """Return the ``Basic`` header value used when proxying to chat-history.
+
+    Sentinel logins (``__graphrag_token__`` / ``__GSQL__secret``) are
+    rewritten to the TG-resolved username so conversations are filed
+    under the real identity; chat-history is noted to key on the
+    username only. If role lookup fails or resolves nothing, the login
+    name is used unchanged. The password is forwarded as received.
+    """
+    try:
+        _, _, owner = _get_user_role_details(creds.username, creds.password)
+    except Exception:
+        owner = ""
+    pair = f"{owner or creds.username}:{creds.password}"
+    token = base64.b64encode(pair.encode()).decode()
+    return "Basic " + token
+
+
+def _ecc_auth_header(creds: HTTPBasicCredentials) -> str:
+    """Return the ``Authorization`` value to send along to ECC.
+
+    The ``__graphrag_token__`` sentinel marks an API-token login, so its
+    token is forwarded as ``Bearer <token>``. Any other login (classic
+    user/password or ``__GSQL__secret``) is re-encoded as ``Basic``
+    from the username/password pair.
+    """
+    is_token_login = creds.username == _UI_TOKEN_SENTINEL
+    if is_token_login:
+        return f"Bearer {creds.password}"
+    # Everything else travels as a standard Basic credential pair.
+    userpass = f"{creds.username}:{creds.password}".encode()
+    return f"Basic {base64.b64encode(userpass).decode()}"
+
+
 def auth(usr: str, password: str, conn=None) -> tuple[list[str], TigerGraphConnection]:
     if conn is None:
-        conn = TigerGraphConnection(
-            host=db_config["hostname"], graphname="", username=usr, password=password
-        )
+        # Three Basic-auth shapes share the wire:
+        #   * regular ``user:password`` → classic mode
+        #   * ``__graphrag_token__:<jwt>`` → API token mode; pass the
+        #     token to pyTigerGraph as ``apiToken``
+        #   * ``__GSQL__secret:<secret>`` → TigerGraph's native secret
+        #     convention; pyTigerGraph already understands it when sent
+        #     as plain username/password, so no special handling here.
+        if usr == _UI_TOKEN_SENTINEL:
+            conn = TigerGraphConnection(
+                host=db_config["hostname"], graphname="",
+                apiToken=password,
+            )
+        else:
+            conn = TigerGraphConnection(
+                host=db_config["hostname"], graphname="",
+                username=usr, password=password,
+            )
 
     try:
         graph_list = conn.listGraphs()
@@ -376,17 +515,41 @@ def auth(usr: str, password: str, conn=None) -> tuple[list[str], TigerGraphConne
 
 
 def ws_basic_auth(auth_info: str, graphname=None):
-    auth_info = base64.b64decode(auth_info.encode()).decode()
-    auth_info = auth_info.split(":")
-    username = auth_info[0]
-    password = auth_info[1]
-    conn = get_db_connection_pwd_manual(graphname, username, password)
-    return auth(username, password, conn)
+    """Authenticate a WebSocket / internal call from a full Authorization
+    header value (``Basic <b64>`` or ``Bearer <token>``; the scheme prefix
+    is required). Returns ``auth()``'s result; bad headers raise 401."""
+    creds = _parse_auth_header(auth_info)
+    if creds.username == _UI_TOKEN_SENTINEL:
+        # API-token logins: build a TG connection directly with the
+        # token; ``get_db_connection_pwd_manual`` only handles
+        # username/password.
+        conn = TigerGraphConnection(
+            host=db_config["hostname"],
+            graphname=graphname or "",
+            apiToken=creds.password,
+            restppPort=db_config.get("restppPort", "9000"),
+            gsPort=db_config.get("gsPort", "14240"),
+        )
+    else:
+        conn = get_db_connection_pwd_manual(
+            graphname, creds.username, creds.password
+        )
+    return auth(creds.username, creds.password, conn)
+
+
+def ui_creds(
+    authorization: Annotated[str | None, Header()] = None,
+) -> HTTPBasicCredentials:
+    """FastAPI dependency: parse ``Authorization`` (Basic or Bearer)
+    via ``_parse_auth_header``; no TigerGraph connection is built here.
+    """
+    parsed = _parse_auth_header(authorization)
+    return parsed
 
 
 def ui_basic_auth(
-    creds: Annotated[HTTPBasicCredentials, Depends(security)],
-) -> list[str]:
+    creds: Annotated[HTTPBasicCredentials, Depends(ui_creds)],
+) -> tuple[list[str], HTTPBasicCredentials]:
     """
     1) Try authenticating with DB.
     2) Get list of graphs user has access to
@@ -399,17 +562,23 @@ def ui_basic_auth(
 def login(auth: Annotated[list[str], Depends(ui_basic_auth)]):
     graphs = auth[0]
     creds = auth[1]
-    # Fetch roles at login so frontend doesn't need separate /roles calls
+    # Fetch roles + resolved username at login so the frontend doesn't
+    # need separate /roles or /whoami calls. ``resolved`` differs from
+    # ``creds.username`` only when the caller logged in via a sentinel
+    # (e.g. ``__GSQL__secret``), in which case ``resolved`` is the
+    # user the secret belongs to.
     try:
-        global_roles, graph_roles = _get_user_role_details(creds.username, creds.password)
+        global_roles, graph_roles, resolved = _get_user_role_details(
+            creds.username, creds.password
+        )
     except Exception as e:
         logger.warning(f"Failed to fetch roles at login: {e}")
-        global_roles, graph_roles = [], {}
+        global_roles, graph_roles, resolved = [], {}, creds.username
     return {
         "graphs": graphs,
         "roles": global_roles,
         "graph_roles": graph_roles,
-        "username": creds.username,
+        "username": resolved or creds.username,
     }
 
 
@@ -538,12 +707,11 @@ def add_feedback(
     creds: Annotated[tuple[list[str], HTTPBasicCredentials], Depends(ui_basic_auth)],
 ):
     creds = creds[1]
-    auth = base64.b64encode(f"{creds.username}:{creds.password}".encode()).decode()
     try:
         res = httpx.post(
             f"{graphrag_config['chat_history_api']}/conversation",
             json=message.model_dump(),
-            headers={"Authorization": f"Basic {auth}"},
+            headers={"Authorization": _chat_history_auth_header(creds)},
         )
         res.raise_for_status()
     except Exception as e:
@@ -588,11 +756,17 @@ def get_trace_log(
     # Per-user segregation. Legacy files (saved before this fix) have no
     # "username" field and therefore can't pass this check — they will 404
     # for everyone and age out via the existing 30-day cleanup.
+    # Compare against the TG-resolved username so sentinel logins (e.g.
+    # ``__GSQL__secret``) can still read their own traces.
     owner = data.get("username")
-    if owner != creds[1].username:
+    try:
+        _, _, resolved = _get_user_role_details(creds[1].username, creds[1].password)
+    except Exception:
+        resolved = creds[1].username
+    if owner != (resolved or creds[1].username):
         logger.warning(
-            "User %r attempted to read trace owned by %r (message_id=%s)",
-            creds[1].username, owner, message_id,
+            "User %r (resolved=%r) attempted to read trace owned by %r (message_id=%s)",
+            creds[1].username, resolved, owner, message_id,
         )
         raise HTTPException(status_code=404, detail="Trace log not found")
 
@@ -613,7 +787,9 @@ def create_graph(
     try:
         # Extract credentials from the dependency (same pattern as other endpoints)
         creds = creds[1]
-        auth = base64.b64encode(f"{creds.username}:{creds.password}".encode()).decode()
+        auth = "Basic " + base64.b64encode(
+            f"{creds.username}:{creds.password}".encode()
+        ).decode()
         _, conn = ws_basic_auth(auth, graphname)
 
         # Create the graph using GSQL
@@ -739,7 +915,7 @@ def _build_proposal_from_live_schema(
     return SchemaProposal(vertices=vertices, edges=edges)
 
 
-def _check_init_eligibility(auth_b64: str, graphname: str) -> dict:
+def _check_init_eligibility(auth_header: str, graphname: str) -> dict:
     """Introspect *graphname* and categorize its current schema state.
 
     Returns a dict with key ``state`` set to one of:
@@ -766,7 +942,7 @@ def _check_init_eligibility(auth_b64: str, graphname: str) -> dict:
     structural_e = {t.casefold() for t in GRAPHRAG_STRUCTURAL_EDGE_TYPES}
 
     try:
-        _, conn = ws_basic_auth(auth_b64, graphname)
+        _, conn = ws_basic_auth(auth_header, graphname)
     except Exception:
         # Graph doesn't exist (or auth failed mid-flight); treat as empty
         # so the create_graph + init path handles it.
@@ -829,15 +1005,15 @@ def check_init_eligibility(
         }
     """
     cred_obj = creds[1]
-    auth_b64 = base64.b64encode(
+    auth_header = "Basic " + base64.b64encode(
         f"{cred_obj.username}:{cred_obj.password}".encode()
     ).decode()
-    result = _check_init_eligibility(auth_b64, graphname)
+    result = _check_init_eligibility(auth_header, graphname)
     # Include edge endpoint pairs so the UI can show "FILED_BY (Filing → Company)"
     # alongside each edge name in the description-edit dialog.
     if result.get("state") == "user_types_present" and result.get("user_edge_types"):
         try:
-            _, conn = ws_basic_auth(auth_b64, graphname)
+            _, conn = ws_basic_auth(auth_header, graphname)
             from common.db.schema_utils import read_existing_schema
             existing = read_existing_schema(conn)
             pairs_map: dict[str, list[list[str]]] = {}
@@ -1016,13 +1192,13 @@ def init_graph(
             detail="schema_gsql and use_existing_schema are mutually exclusive.",
         )
     cred_obj = creds[1]
-    auth_b64 = base64.b64encode(
+    auth_header = "Basic " + base64.b64encode(
         f"{cred_obj.username}:{cred_obj.password}".encode()
     ).decode()
 
     # Pre-flight eligibility check: introspect the live schema and
     # decide whether to proceed, reject, or adopt existing types.
-    eligibility = _check_init_eligibility(auth_b64, graphname)
+    eligibility = _check_init_eligibility(auth_header, graphname)
     if eligibility["state"] == "structural_present":
         raise HTTPException(
             status_code=409,
@@ -1078,7 +1254,7 @@ def _run_init():
                 graphname, state="running",
                 message="Initializing structural schema",
             )
-            _, conn = ws_basic_auth(auth_b64, graphname)
+            _, conn = ws_basic_auth(auth_header, graphname)
             LogWriter.info(f"Initializing graph: {graphname}")
             resp = supportai.init_supportai(conn, graphname)
             schema_res, index_res, query_res = resp[0], resp[1], resp[2]
@@ -1451,20 +1627,20 @@ async def forceupdate(
     
     # Extract credentials from the dependency
     creds = creds[1]
-    auth = base64.b64encode(f"{creds.username}:{creds.password}".encode()).decode()
+    auth_header = _ecc_auth_header(creds)
 
     ecc_base = graphrag_config.get("ecc", "http://graphrag-ecc:8001")
     ecc_update_url = f"{ecc_base}/{graphname}/graphrag/consistency_update"
     ecc_status_url = f"{ecc_base}/{graphname}/graphrag/rebuild_status"
-    
+
     LogWriter.info(f"Sending ECC rebuild request to: {ecc_update_url}")
-    
+
     # Background task to trigger rebuild, monitor completion, and release lock
     async def rebuild_and_monitor():
         try:
             # Step 1: Trigger the ECC rebuild (non-blocking)
             async with httpx.AsyncClient(timeout=30.0) as client:
-                response = await client.get(ecc_update_url, headers={"Authorization": f"Basic {auth}"})
+                response = await client.get(ecc_update_url, headers={"Authorization": auth_header})
                 if response.status_code not in [200, 202]:
                     LogWriter.error(f"ECC rebuild trigger failed for {graphname}: {response.status_code} - {response.text}")
                     return
@@ -1483,8 +1659,8 @@ async def rebuild_and_monitor():
                 try:
                     async with httpx.AsyncClient(timeout=10.0) as client:
                         status_response = await client.get(
-                            ecc_status_url, 
-                            headers={"Authorization": f"Basic {auth}"}
+                            ecc_status_url,
+                            headers={"Authorization": auth_header}
                         )
                     
                     if status_response.status_code == 200:
@@ -1535,7 +1711,7 @@ def get_rebuild_status(
     """
     # Extract credentials from the dependency
     creds = creds[1]
-    auth = base64.b64encode(f"{creds.username}:{creds.password}".encode()).decode()
+    auth_header = _ecc_auth_header(creds)
 
     try:
         ecc_status_url = (
@@ -1543,10 +1719,10 @@ def get_rebuild_status(
             + f"/{graphname}/graphrag/rebuild_status"
         )
         LogWriter.info(f"Checking ECC status at: {ecc_status_url}")
-        
+
         response = httpx.get(
             ecc_status_url,
-            headers={"Authorization": f"Basic {auth}"},
+            headers={"Authorization": auth_header},
             timeout=30.0
         )
         
@@ -1608,7 +1784,9 @@ def create_ingest(
     try:
         # Extract credentials from the dependency (same pattern as other endpoints)
         creds = creds[1]
-        auth = base64.b64encode(f"{creds.username}:{creds.password}".encode()).decode()
+        auth = "Basic " + base64.b64encode(
+            f"{creds.username}:{creds.password}".encode()
+        ).decode()
         _, conn = ws_basic_auth(auth, graphname)
 
         # Create the ingest configuration
@@ -1658,7 +1836,9 @@ def ingest(
     try:
         # Extract credentials from the dependency (same pattern as other endpoints)
         creds = creds[1]
-        auth = base64.b64encode(f"{creds.username}:{creds.password}".encode()).decode()
+        auth = "Basic " + base64.b64encode(
+            f"{creds.username}:{creds.password}".encode()
+        ).decode()
         _, conn = ws_basic_auth(auth, graphname)
 
         # Run the ingestion
@@ -1699,7 +1879,9 @@ async def serve_image_from_vertex(
     try:
         # Extract credentials from the dependency (same pattern as graph_query and other endpoints)
         creds = creds[1]
-        auth = base64.b64encode(f"{creds.username}:{creds.password}".encode()).decode()
+        auth = "Basic " + base64.b64encode(
+            f"{creds.username}:{creds.password}".encode()
+        ).decode()
         _, conn = ws_basic_auth(auth, graphname)
         
         LogWriter.info(f"Serving image {image_id} from graph {graphname}")
@@ -1746,12 +1928,11 @@ async def get_user_conversations(
     creds: Annotated[tuple[list[str], HTTPBasicCredentials], Depends(ui_basic_auth)],
 ):
     creds = creds[1]
-    auth = base64.b64encode(f"{creds.username}:{creds.password}".encode()).decode()
     try:
         async with httpx.AsyncClient() as client:
             res = await client.get(
                 f"{graphrag_config['chat_history_api']}/user/{user_id}",
-                headers={"Authorization": f"Basic {auth}"},
+                headers={"Authorization": _chat_history_auth_header(creds)},
             )
             res.raise_for_status()
     except Exception as e:
@@ -1766,9 +1947,9 @@ async def get_user_conversations(
 
 @router.get(route_prefix + "/roles")
 async def get_user_roles(
-    credentials: Annotated[HTTPBasicCredentials, Depends(security)]
+    credentials: Annotated[HTTPBasicCredentials, Depends(ui_creds)]
 ):
-    roles, graph_roles = _get_user_role_details(
+    roles, graph_roles, _ = _get_user_role_details(
         credentials.username, credentials.password
     )
     return {"roles": roles, "graph_roles": graph_roles}
@@ -1780,12 +1961,11 @@ async def get_conversation_contents(
     creds: Annotated[tuple[list[str], HTTPBasicCredentials], Depends(ui_basic_auth)],
 ):
     creds = creds[1]
-    auth = base64.b64encode(f"{creds.username}:{creds.password}".encode()).decode()
     try:
         async with httpx.AsyncClient() as client:
             res = await client.get(
                 f"{graphrag_config['chat_history_api']}/conversation/{conversation_id}",
-                headers={"Authorization": f"Basic {auth}"},
+                headers={"Authorization": _chat_history_auth_header(creds)},
             )
             res.raise_for_status()
     except Exception as e:
@@ -1802,12 +1982,11 @@ async def get_conversation_feedback(
     creds: Annotated[tuple[list[str], HTTPBasicCredentials], Depends(ui_basic_auth)],
 ):
     creds = creds[1]
-    auth = base64.b64encode(f"{creds.username}:{creds.password}".encode()).decode()
     try:
         async with httpx.AsyncClient() as client:
             res = await client.get(
                 f"{graphrag_config['chat_history_api']}/get_feedback",
-                headers={"Authorization": f"Basic {auth}"},
+                headers={"Authorization": _chat_history_auth_header(creds)},
             )
             res.raise_for_status()
     except httpx.HTTPStatusError as e:
@@ -1830,12 +2009,11 @@ async def delete_conversation(
 ):
     """Delete a conversation and all its messages."""
     creds = creds[1]
-    auth = base64.b64encode(f"{creds.username}:{creds.password}".encode()).decode()
     try:
         async with httpx.AsyncClient() as client:
             res = await client.delete(
                 f"{graphrag_config['chat_history_api']}/conversation/{conversation_id}",
-                headers={"Authorization": f"Basic {auth}"},
+                headers={"Authorization": _chat_history_auth_header(creds)},
             )
             res.raise_for_status()
     except httpx.HTTPStatusError as e:
@@ -1934,20 +2112,22 @@ async def run_agent(
     return resp
 
 
-async def load_conversation_history(conversation_id: str, usr_auth: str) -> list[dict[str, str]]:
+async def load_conversation_history(
+    conversation_id: str, usr_creds: HTTPBasicCredentials
+) -> list[dict[str, str]]:
     """
     Load conversation history from the chat history service.
     Returns a list of dicts with 'query', 'response', 'create_ts', and 'update_ts' keys.
     """
     if not conversation_id or conversation_id == "new":
         return []
-    
+
     ch = graphrag_config.get("chat_history_api")
     if ch is None:
         LogWriter.info("chat-history not enabled, returning empty history")
         return []
-    
-    headers = {"Authorization": f"Basic {usr_auth}"}
+
+    headers = {"Authorization": _chat_history_auth_header(usr_creds)}
     try:
         async with httpx.AsyncClient() as client:
             res = await client.get(
@@ -1982,10 +2162,12 @@ async def load_conversation_history(conversation_id: str, usr_auth: str) -> list
         return []
 
 
-async def write_message_to_history(message: Message, usr_auth: str):
+async def write_message_to_history(
+    message: Message, usr_creds: HTTPBasicCredentials
+):
     ch = graphrag_config.get("chat_history_api")
     if ch is not None:
-        headers = {"Authorization": f"Basic {usr_auth}"}
+        headers = {"Authorization": _chat_history_auth_header(usr_creds)}
         try:
             async with httpx.AsyncClient() as client:
                 res = await client.post(
@@ -2008,11 +2190,13 @@ async def graph_query(
     conversation_id: str | None = None,
 ):
     creds = creds[1]
-    auth = base64.b64encode(f"{creds.username}:{creds.password}".encode()).decode()
-    _, conn = ws_basic_auth(auth, graphname)
+    auth_header = "Basic " + base64.b64encode(
+        f"{creds.username}:{creds.password}".encode()
+    ).decode()
+    _, conn = ws_basic_auth(auth_header, graphname)
     try:
         # Load conversation history if conversation_id is provided
-        conversation_history = await load_conversation_history(conversation_id, auth) if conversation_id else []
+        conversation_history = await load_conversation_history(conversation_id, creds) if conversation_id else []
 
         # Use provided conversation ID or generate new one
         if not conversation_id or conversation_id == "new":
@@ -2040,7 +2224,7 @@ async def graph_query(
             role=Role.USER,
         )
         # save message
-        await write_message_to_history(message, auth)
+        await write_message_to_history(message, creds)
         prev_id = message.message_id
 
         # generate response and keep track of response time
@@ -2063,7 +2247,7 @@ async def graph_query(
             response_type=resp.response_type,
             query_sources=resp.query_sources,
         )
-        await write_message_to_history(message, auth)
+        await write_message_to_history(message, creds)
         await asyncio.to_thread(_save_trace_log, message.message_id, convo_id, data, resp, elapsed, creds.username)
         prev_id = message.message_id
 
@@ -2084,9 +2268,10 @@ async def chat(
 ):
     """
     WebSocket endpoint for chat functionality with conversation history support.
-    
+
     Expected message flow:
-    1. Authentication (base64 encoded username:password)
+    1. Authentication: full Authorization header value, ``Basic <b64>``
+       or ``Bearer <token>``.
     2. RAG pattern (e.g., "hybridsearch", "similaritysearch", etc.)
     3. Conversation ID (or "new" for new conversation)
     4. User messages
@@ -2116,8 +2301,17 @@ async def chat(
         usr_auth = await asyncio.wait_for(websocket.receive_text(), timeout=10.0)
         logger.info(f"Received authentication data, length: {len(usr_auth)}")
         _, conn = ws_basic_auth(usr_auth, graphname)
-        # Extract the authenticated username for trace-log ownership tracking.
-        ws_username = base64.b64decode(usr_auth.encode()).decode().split(":", 1)[0]
+        # Extract the authenticated username for trace-log ownership
+        # tracking. For sentinel logins (API token / secret) this is
+        # the sentinel itself; we resolve to the real TG identity below.
+        usr_creds = _parse_auth_header(usr_auth)
+        try:
+            _, _, ws_username = _get_user_role_details(
+                usr_creds.username, usr_creds.password
+            )
+        except Exception:
+            ws_username = usr_creds.username
+        ws_username = ws_username or usr_creds.username
         logger.info("Authentication successful")
     except asyncio.TimeoutError:
         logger.error("WebSocket authentication timeout - no credentials received")
@@ -2149,7 +2343,7 @@ async def chat(
     )
     
     # Load conversation history if not a new conversation
-    conversation_history = await load_conversation_history(conversation_id, usr_auth)
+    conversation_history = await load_conversation_history(conversation_id, usr_creds)
     
     # Use provided conversation ID or generate new one
     if conversation_id == "new" or not conversation_id:
@@ -2180,7 +2374,7 @@ async def chat(
                 role=Role.USER,
             )
             # save message
-            await write_message_to_history(message, usr_auth)
+            await write_message_to_history(message, usr_creds)
             prev_id = message.message_id
 
             # generate response and keep track of response time
@@ -2203,7 +2397,7 @@ async def chat(
                 response_type=resp.response_type,
                 query_sources=resp.query_sources,
             )
-            await write_message_to_history(message, usr_auth)
+            await write_message_to_history(message, usr_creds)
             await asyncio.to_thread(_save_trace_log, message.message_id, convo_id, data, resp, elapsed, ws_username)
             prev_id = message.message_id
 
@@ -2449,7 +2643,7 @@ async def clear_uploaded_files(
 @router.post(route_prefix + "/{graphname}/cloud/download")
 async def download_from_cloud(
     graphname: ValidGraphName,
-    credentials: Annotated[HTTPBase, Depends(security)],
+    credentials: Annotated[HTTPBasicCredentials, Depends(ui_creds)],
     request_body: dict = Body(...),
 ):
     """
@@ -2678,7 +2872,7 @@ async def download_from_cloud(
 @router.get(route_prefix + "/{graphname}/cloud/list")
 async def list_cloud_downloads(
     graphname: ValidGraphName,
-    credentials: Annotated[HTTPBase, Depends(security)],
+    credentials: Annotated[HTTPBasicCredentials, Depends(ui_creds)],
 ):
     """
     List downloaded files from cloud storage for a specific graph.
@@ -2725,7 +2919,7 @@ async def list_cloud_downloads(
 @router.delete(route_prefix + "/{graphname}/cloud/delete")
 async def delete_cloud_downloads(
     graphname: ValidGraphName,
-    credentials: Annotated[HTTPBase, Depends(security)],
+    credentials: Annotated[HTTPBasicCredentials, Depends(ui_creds)],
     filename: str = None,
 ):
     """
@@ -2812,7 +3006,7 @@ async def delete_cloud_downloads(
 @router.post(f"{route_prefix}/config/llm")
 async def save_llm_config(
     request: Request,
-    credentials: Annotated[HTTPBasicCredentials, Depends(security)],
+    credentials: Annotated[HTTPBasicCredentials, Depends(ui_creds)],
     llm_config_data: dict = Body(...)
 ):
     """
@@ -2822,9 +3016,7 @@ async def save_llm_config(
         graphname = llm_config_data.get("graphname")
         llm_access_mode = _resolve_llm_config_access(credentials, graphname)
         graphs = auth(credentials.username, credentials.password)[0]
-        auth_header = "Basic " + base64.b64encode(
-            f"{credentials.username}:{credentials.password}".encode()
-        ).decode()
+        auth_header = _ecc_auth_header(credentials)
         if _ecc_jobs_running(graphs, auth_header):
             raise HTTPException(
                 status_code=409,
@@ -2923,7 +3115,7 @@ async def save_llm_config(
 @router.post(f"{route_prefix}/config/llm/test")
 async def test_llm_config(
     request: Request,
-    credentials: Annotated[HTTPBasicCredentials, Depends(security)],
+    credentials: Annotated[HTTPBasicCredentials, Depends(ui_creds)],
     llm_test_config: dict = Body(...)
 ):
     """
@@ -3268,7 +3460,7 @@ def _strip_auth(config: dict) -> dict:
 
 @router.get(f"{route_prefix}/config")
 async def get_config(
-    credentials: Annotated[HTTPBasicCredentials, Depends(security)],
+    credentials: Annotated[HTTPBasicCredentials, Depends(ui_creds)],
     graphname: str | None = None,
     scope: str | None = None,
 ):
@@ -3358,7 +3550,7 @@ async def get_config(
 @router.post(f"{route_prefix}/config/db/test")
 async def test_db_connection(
     request: Request,
-    credentials: Annotated[HTTPBasicCredentials, Depends(security)],
+    credentials: Annotated[HTTPBasicCredentials, Depends(ui_creds)],
     db_test_config: dict = Body(...)
 ):
     """
@@ -3379,10 +3571,9 @@ async def test_db_connection(
             restppPort=db_test_config["restppPort"],
             graphname="",
         )
-        
-        if db_test_config.get("getToken", False):
-            test_conn.getToken()
 
+        # listGraphs() exercises the credentials; pyTigerGraph mints a
+        # REST++ token on demand if the instance requires one.
         test_conn.listGraphs()
         
         return {
@@ -3403,7 +3594,7 @@ async def test_db_connection(
 @router.post(f"{route_prefix}/config/db")
 async def save_db_config(
     request: Request,
-    credentials: Annotated[HTTPBasicCredentials, Depends(security)],
+    credentials: Annotated[HTTPBasicCredentials, Depends(ui_creds)],
     db_config_data: dict = Body(...)
 ):
     """
@@ -3412,9 +3603,7 @@ async def save_db_config(
     try:
         _require_roles(credentials, {"superuser"})
         graphs = auth(credentials.username, credentials.password)[0]
-        auth_header = "Basic " + base64.b64encode(
-            f"{credentials.username}:{credentials.password}".encode()
-        ).decode()
+        auth_header = _ecc_auth_header(credentials)
         if _ecc_jobs_running(graphs, auth_header):
             raise HTTPException(
                 status_code=409,
@@ -3448,7 +3637,7 @@ async def save_db_config(
 @router.post(f"{route_prefix}/config/graphrag")
 async def save_graphrag_config(
     request: Request,
-    credentials: Annotated[HTTPBasicCredentials, Depends(security)],
+    credentials: Annotated[HTTPBasicCredentials, Depends(ui_creds)],
     graphrag_config_data: dict = Body(...)
 ):
     """
@@ -3458,9 +3647,7 @@ async def save_graphrag_config(
     try:
         _require_roles(credentials, {"superuser", "globaldesigner"})
         graphs = auth(credentials.username, credentials.password)[0]
-        auth_header = "Basic " + base64.b64encode(
-            f"{credentials.username}:{credentials.password}".encode()
-        ).decode()
+        auth_header = _ecc_auth_header(credentials)
         if _ecc_jobs_running(graphs, auth_header):
             raise HTTPException(
                 status_code=409,
@@ -3587,7 +3774,7 @@ def split_prompt_template(prompt_content: str, prompt_type: str) -> dict:
 
 @router.get(f"{route_prefix}/prompts")
 async def get_prompts(
-    credentials: Annotated[HTTPBasicCredentials, Depends(security)],
+    credentials: Annotated[HTTPBasicCredentials, Depends(ui_creds)],
     graphname: str | None = None,
 ):
     """
@@ -3678,7 +3865,7 @@ def _get_prompt(prompt_type: str) -> dict:
 
 @router.post(f"{route_prefix}/prompts")
 async def save_prompts(
-    credentials: Annotated[HTTPBasicCredentials, Depends(security)],
+    credentials: Annotated[HTTPBasicCredentials, Depends(ui_creds)],
     prompt_data: dict = Body(...)
 ):
     """

From 61a3459350d7e54575972df8688a75c6fb1e4a10 Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Tue, 26 May 2026 14:00:13 -0700
Subject: [PATCH 04/18] docs: note Windows config override for repo-root docker
 compose

- Document that Windows developers must replace the top-level config
  symlinks with real copies before running docker compose from the
  repo root.
---
 README.md | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/README.md b/README.md
index 01e44be..c6854a4 100644
--- a/README.md
+++ b/README.md
@@ -1022,6 +1022,12 @@ First, make sure that all your LLM service provider configuration files are work
 docker compose up -d --build
 ```
 
+> **Windows developers:** the repo's top-level `configs/nginx.conf` and `configs/server_config.json` are symlinks intended for POSIX shells and don't resolve on Windows. Before running `docker compose up -d` from the repo root, overwrite them with the tutorial copies:
+> ```sh
+> cp docs/tutorials/configs/nginx.conf configs/nginx.conf
+> cp docs/tutorials/configs/server_config.json configs/server_config.json
+> ```
+
 If you want to use Weights And Biases for logging the test results, your WandB API key needs to be set in an environment variable on the host machine.
 
 ```sh

From 9ea81316ba8c5fe4b9910b00aa9a6987b8431a2e Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Wed, 3 Jun 2026 13:41:05 -0700
Subject: [PATCH 05/18] Document Ingestion dialog: state sync, conflict prompt,
 filename rendering
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Closing and reopening the dialog mid-conversion reflects the server-side operation state — the Ingest button, status messages, and uploaded files list all match what the server is actually doing
- Filename collisions on upload are detected pre-flight; a styled prompt names the conflicting files and lets the user choose Replace or Cancel before any bytes cross the wire
- Sample documents used for schema extraction land alongside regular uploads so they remain visible after the extraction completes
- The Initialize Knowledge Graph dialog's Close button stays clickable during initialization, matching the rest of the admin dialogs
- Long filenames truncate with a hover tooltip and keep the delete button visible

Refs: GML-2095, GML-2096
---
 CHANGELOG.md                                  |   6 +
 common/utils/graph_locks.py                   |  27 +-
 common/utils/text_extractors.py               |   4 +-
 .../src/components/ui/confirm-dialog.tsx      |   2 +-
 graphrag-ui/src/pages/Setup.tsx               |  33 +-
 graphrag-ui/src/pages/setup/IngestGraph.tsx   |  85 ++-
 graphrag-ui/src/pages/setup/KGAdmin.tsx       |  32 +-
 graphrag-ui/src/utils/uploadConflicts.ts      |  65 +++
 graphrag/app/routers/ui.py                    | 524 ++++++++++++------
 graphrag/tests/test_v1_4_1_uploads_schema.py  | 454 +++++++++++++++
 10 files changed, 1053 insertions(+), 179 deletions(-)
 create mode 100644 graphrag-ui/src/utils/uploadConflicts.ts
 create mode 100644 graphrag/tests/test_v1_4_1_uploads_schema.py

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 0a13c82..f4af23e 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -4,10 +4,16 @@
 
 ### Added
 - **Token login** — the sign-in page adds a "Use token login" option with a choice of API Token or Secret, alongside the default username / password. The signed-in username and roles are resolved from TigerGraph after login so the UI shows the real user.
+- **Pre-flight upload conflict check** — a new endpoint reports which planned filenames already exist before the bytes are sent. The upload dialog uses it to prompt the user once with the conflicting names and offer Replace or Cancel; large files no longer have to cross the wire twice when a collision is hit.
 
 ### Changed
 - **Every request authenticates as the signed-in user**, end to end — graph operations, chat history, traces, and knowledge-graph rebuilds all run under the caller's identity (username / password, secret, or API token).
 - **TigerGraph token handling is automatic** — an api token is obtained from the caller's credentials only when the database requires one, unless a static api token is configured. The `getToken` config option is no longer needed and is now ignored.
+- **Sample documents are visible in the upload dialog after schema extraction.** Earlier, files used for schema extraction landed in a hidden per-request subdirectory and disappeared from the dialog. They now live alongside regular uploads, and overwriting one drops the cached extract so the next ingest sees the new bytes.
+- **Schema extraction requires an explicit sample list.** The endpoint no longer treats a missing or empty `filenames` field as "use every JSONL in the temp folder," which silently mixed in stale samples from prior sessions. Callers must name each sample explicitly.
+- **One schema extraction at a time per graph.** Concurrent attempts on the same graph are rejected with 409 instead of racing on the shared sample folder.
+- **Document Ingestion dialog reflects server-side state on reopen.** Closing the dialog mid-conversion and reopening it no longer leaves the *Ingest* button incorrectly enabled. The dialog asks the server which operation, if any, currently holds the graph lock, and polls until that operation completes — so the button stays disabled, the uploaded files list re-populates, and the next upload doesn't collide with the prior conversion.
+- **Conflict prompts use the app's styled dialog** instead of the browser default. Choosing *Cancel* now aborts the upload cleanly — the button and status message reset right away.
 
 ### Removed
 - **A configured static `apiToken` no longer overrides per-user credentials.** It is used only for the service's background operations; interactive requests always authenticate as the signed-in user.
diff --git a/common/utils/graph_locks.py b/common/utils/graph_locks.py
index 9d09b5b..684a30b 100644
--- a/common/utils/graph_locks.py
+++ b/common/utils/graph_locks.py
@@ -14,6 +14,10 @@
 _graph_locks: Dict[str, threading.Lock] = {}
 _locks_dict_lock = threading.Lock()
 
+# Records the operation currently holding each graph's lock so the UI can
+# reflect long-running work when a dialog remounts.
+_current_operations: Dict[str, str] = {}
+
 # Global rebuild lock (only one rebuild at a time across all graphs)
 # Use asyncio.Lock for async operations
 _rebuild_lock: Optional[asyncio.Lock] = None
@@ -41,36 +45,49 @@ def get_graph_lock(graphname: str) -> threading.Lock:
 def acquire_graph_lock(graphname: str, operation: str = "operation") -> bool:
     """
     Try to acquire lock for a graph. Returns True if acquired, False if already locked.
-    
+
     Args:
         graphname: Name of the graph to lock
-        operation: Description of the operation (for logging)
+        operation: Description of the operation (for logging and status reporting)
     """
     lock = get_graph_lock(graphname)
     acquired = lock.acquire(blocking=False)
-    
+
     if acquired:
+        _current_operations[graphname] = operation
         logger.info(f"Lock acquired for graph '{graphname}' - {operation}")
     else:
         logger.warning(f"Lock already held for graph '{graphname}' - {operation} blocked")
-    
+
     return acquired
 
 
 def release_graph_lock(graphname: str, operation: str = "operation"):
     """
     Release the lock for a graph.
-    
+
     Args:
         graphname: Name of the graph to unlock
         operation: Description of the operation (for logging)
     """
     lock = get_graph_lock(graphname)
     if lock.locked():
+        _current_operations.pop(graphname, None)
         lock.release()
         logger.info(f"Lock released for graph '{graphname}' - {operation} completed")
 
 
+def get_current_operation(graphname: str) -> Optional[str]:
+    """Return the operation name currently holding ``graphname``'s lock,
+    or ``None`` if the lock is free. Used by status endpoints so the UI
+    can reflect long-running work that's still in flight on the server.
+    """
+    lock = _graph_locks.get(graphname)
+    if lock is None or not lock.locked():
+        return None
+    return _current_operations.get(graphname)
+
+
 def raise_if_locked(graphname: str, operation: str = "operation"):
     """
     Try to acquire lock or raise HTTPException with 409 Conflict status.
diff --git a/common/utils/text_extractors.py b/common/utils/text_extractors.py
index d8df543..aeb6031 100644
--- a/common/utils/text_extractors.py
+++ b/common/utils/text_extractors.py
@@ -258,7 +258,9 @@ async def _process_folder_async(self, folder_path, graphname, temp_folder, max_c
         def safe_walk(path):
             try:
                 for item in path.iterdir():
-                    if item.name.startswith(('.', '~', '$')) or 'BROMIUM' in item.name.upper():
+                    # ``_schema_*`` subdirs hold sample-doc staging
+                    # and must not be re-ingested as regular documents.
+                    if item.name.startswith(('.', '~', '$', '_schema_')) or 'BROMIUM' in item.name.upper():
                         continue
                     if item.is_file():
                         yield item
diff --git a/graphrag-ui/src/components/ui/confirm-dialog.tsx b/graphrag-ui/src/components/ui/confirm-dialog.tsx
index 3e3269a..34ead0d 100644
--- a/graphrag-ui/src/components/ui/confirm-dialog.tsx
+++ b/graphrag-ui/src/components/ui/confirm-dialog.tsx
@@ -37,7 +37,7 @@ export function ConfirmDialog({ message, onConfirm, onCancel }: ConfirmDialogPro
         onClick={(e) => e.stopPropagation()}
         style={{ pointerEvents: 'auto' }}
       >
-        <p className="mb-4 text-black dark:text-white text-left">{message}</p>
+        <p className="mb-4 text-black dark:text-white text-left whitespace-pre-line">{message}</p>
         <div className="flex justify-center gap-2">
           <button
             className="px-4 py-2 bg-gray-200 dark:bg-gray-700 text-black dark:text-white rounded hover:bg-gray-300 dark:hover:bg-gray-600 transition-colors cursor-pointer"
diff --git a/graphrag-ui/src/pages/Setup.tsx b/graphrag-ui/src/pages/Setup.tsx
index e660478..fce8d44 100644
--- a/graphrag-ui/src/pages/Setup.tsx
+++ b/graphrag-ui/src/pages/Setup.tsx
@@ -21,6 +21,7 @@ import {
 } from "@/components/ui/select";
 import { useConfirm } from "@/hooks/useConfirm";
 import { safeJson } from "@/utils/safeJson";
+import { resolveUploadConflicts } from "@/utils/uploadConflicts";
 
 const DEFAULT_MAX_UPLOAD_SIZE_MB = 100;
 const envUploadLimit = Number(import.meta.env.VITE_MAX_UPLOAD_SIZE_MB);
@@ -153,10 +154,21 @@ const [activeTab, setActiveTab] = useState("upload");
 
     try {
       const creds = sessionStorage.getItem("auth");
+      const queryString = await resolveUploadConflicts(
+        ingestGraphName,
+        filesArray.map((f) => f.name),
+        creds!,
+        confirm
+      );
+      if (queryString === null) {
+        setUploadMessage("Upload cancelled.");
+        setIsUploading(false);
+        return;
+      }
       const formData = new FormData();
       filesArray.forEach((file) => formData.append("files", file));
 
-      const response = await fetch(`/ui/${ingestGraphName}/uploads?overwrite=true`, {
+      const response = await fetch(`/ui/${ingestGraphName}/uploads${queryString}`, {
         method: "POST",
         headers: { Authorization: creds! },
         body: formData,
@@ -202,6 +214,19 @@ const [activeTab, setActiveTab] = useState("upload");
 
     try {
       const creds = sessionStorage.getItem("auth");
+      // Pre-flight the whole batch once so the user only sees a single
+      // conflict prompt covering every collision in the upload set.
+      const queryString = await resolveUploadConflicts(
+        ingestGraphName,
+        filesArray.map((f) => f.name),
+        creds!,
+        confirm
+      );
+      if (queryString === null) {
+        setUploadMessage("Upload cancelled.");
+        setIsUploading(false);
+        return;
+      }
       let uploadedCount = 0;
       let failedCount = 0;
       const totalFiles = filesArray.length;
@@ -210,14 +235,14 @@ const [activeTab, setActiveTab] = useState("upload");
       for (let i = 0; i < filesArray.length; i++) {
         const file = filesArray[i];
         const fileNumber = i + 1;
-        
+
         setUploadMessage(`Uploading file ${fileNumber}/${totalFiles}: ${file.name} (${formatBytes(file.size)})...`);
-        
+
         const formData = new FormData();
         formData.append("files", file);
 
         try {
-          const response = await fetch(`/ui/${ingestGraphName}/uploads?overwrite=true`, {
+          const response = await fetch(`/ui/${ingestGraphName}/uploads${queryString}`, {
             method: "POST",
             headers: { Authorization: creds! },
             body: formData,
diff --git a/graphrag-ui/src/pages/setup/IngestGraph.tsx b/graphrag-ui/src/pages/setup/IngestGraph.tsx
index f91dfe2..4c3d8e1 100644
--- a/graphrag-ui/src/pages/setup/IngestGraph.tsx
+++ b/graphrag-ui/src/pages/setup/IngestGraph.tsx
@@ -20,6 +20,7 @@ import {
 } from "@/components/ui/select";
 import { useConfirm } from "@/hooks/useConfirm";
 import { pingIdleTimer } from "@/hooks/useIdleTimeout";
+import { resolveUploadConflicts } from "@/utils/uploadConflicts";
 
 interface IngestGraphProps {
   isModal?: boolean;
@@ -154,11 +155,22 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
 
     try {
       const creds = sessionStorage.getItem("auth");
+      const queryString = await resolveUploadConflicts(
+        ingestGraphName,
+        filesArray.map((f) => f.name),
+        creds!,
+        confirm
+      );
+      if (queryString === null) {
+        setUploadMessage("Upload cancelled.");
+        setIsUploading(false);
+        return;
+      }
       const formData = new FormData();
       filesArray.forEach((file) => formData.append("files", file));
 
       const response = await fetch(
-        `/ui/${ingestGraphName}/uploads?overwrite=true`,
+        `/ui/${ingestGraphName}/uploads${queryString}`,
         {
           method: "POST",
           headers: { Authorization: creds! },
@@ -206,6 +218,19 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
 
     try {
       const creds = sessionStorage.getItem("auth");
+      // Pre-flight the whole batch once so the user only sees a single
+      // conflict prompt covering every collision in the upload set.
+      const queryString = await resolveUploadConflicts(
+        ingestGraphName,
+        filesArray.map((f) => f.name),
+        creds!,
+        confirm
+      );
+      if (queryString === null) {
+        setUploadMessage("Upload cancelled.");
+        setIsUploading(false);
+        return;
+      }
       let uploadedCount = 0;
       let failedCount = 0;
       const totalFiles = filesArray.length;
@@ -226,7 +251,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
 
         try {
           const response = await fetch(
-            `/ui/${ingestGraphName}/uploads?overwrite=true`,
+            `/ui/${ingestGraphName}/uploads${queryString}`,
             {
               method: "POST",
               headers: { Authorization: creds! },
@@ -957,6 +982,52 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     }
   }, [ingestGraphName]);
 
+  // Sync upload / ingest in-flight state from the server. The Radix
+  // Dialog unmounts this component when closed, so all local state
+  // (isUploading / isProcessingFiles / isIngesting / uploadedFiles)
+  // is lost across open/close cycles. On mount, and every 5s while
+  // mounted, ask the backend which operation — if any — currently
+  // holds the graph lock and adopt that; when it goes from busy to
+  // idle, refresh the file list.
+  const lastServerOpRef = useRef<string | null>(null);
+  useEffect(() => {
+    if (!ingestGraphName) return;
+    let cancelled = false;
+    lastServerOpRef.current = null;
+
+    const sync = async () => {
+      try {
+        const creds = sessionStorage.getItem("auth");
+        if (!creds) return;
+        const r = await fetch(`/ui/${ingestGraphName}/upload_status`, {
+          headers: { Authorization: creds },
+        });
+        if (!r.ok || cancelled) return;
+        const d = await r.json();
+        if (cancelled) return;
+        const op: string | null = d?.operation || null;
+        setIsProcessingFiles(
+          op === "create_ingest" || op === "upload_files"
+        );
+        setIsIngesting(op === "ingest");
+        if (lastServerOpRef.current && !op) {
+          // Server-side work just finished — refresh the file list.
+          fetchUploadedFiles();
+        }
+        lastServerOpRef.current = op;
+      } catch {
+        /* leave local state alone on transient errors */
+      }
+    };
+
+    sync();
+    const id = setInterval(sync, 5000);
+    return () => {
+      cancelled = true;
+      clearInterval(id);
+    };
+  }, [ingestGraphName]);
+
   return (
     <div className={isModal ? "" : "p-8"}>
       <div className={isModal ? "" : "max-w-5xl mx-auto"}>
@@ -1152,7 +1223,10 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
                           key={index}
                           className="flex items-center justify-between p-2 bg-gray-50 dark:bg-shadeA rounded"
                         >
-                          <span className="text-sm text-black dark:text-white truncate flex-1">
+                          <span
+                            className="text-sm text-black dark:text-white truncate flex-1 min-w-0"
+                            title={file.filename}
+                          >
                             {file.filename}
                           </span>
                           <Button
@@ -1486,7 +1560,10 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
                           key={index}
                           className="flex justify-between items-center p-2 bg-gray-50 dark:bg-shadeA rounded text-sm"
                         >
-                          <span className="text-black dark:text-white truncate flex-1">
+                          <span
+                            className="text-black dark:text-white truncate flex-1 min-w-0"
+                            title={file.name}
+                          >
                             {file.name}
                           </span>
                           <Button
diff --git a/graphrag-ui/src/pages/setup/KGAdmin.tsx b/graphrag-ui/src/pages/setup/KGAdmin.tsx
index f4b6f61..564d49f 100644
--- a/graphrag-ui/src/pages/setup/KGAdmin.tsx
+++ b/graphrag-ui/src/pages/setup/KGAdmin.tsx
@@ -21,6 +21,7 @@ import {
 } from "@/components/ui/select";
 import { useConfirm } from "@/hooks/useConfirm";
 import { useAlert } from "@/hooks/useAlert";
+import { resolveUploadConflicts } from "@/utils/uploadConflicts";
 import { useNavigate } from "react-router-dom";
 import IngestGraph from "./IngestGraph";
 
@@ -477,12 +478,25 @@ const KGAdmin = () => {
       const creds = sessionStorage.getItem("auth");
       if (!creds) throw new Error("Not authenticated. Please login first.");
 
-      // Step 1/2: upload + convert. Returns the saved filenames so we
-      // know exactly which JSONLs to feed to the LLM in step 2.
+      // Step 1/2: upload + convert. Pre-flight the planned upload so
+      // the user only sees a conflict prompt for filenames that already
+      // live on the server. Returns the saved filenames so we know
+      // exactly which JSONLs to feed to the LLM in step 2.
+      const queryString = await resolveUploadConflicts(
+        graphName,
+        sampleFiles.map((f) => f.name),
+        creds!,
+        confirm
+      );
+      if (queryString === null) {
+        setStatusMessage("Schema extraction cancelled.");
+        setStatusType("");
+        return;
+      }
       const form = new FormData();
       sampleFiles.forEach((f) => form.append("files", f));
       const convertResp = await fetch(
-        `/ui/${graphName}/convert_sample_files`,
+        `/ui/${graphName}/convert_sample_files${queryString}`,
         {
           method: "POST",
           headers: { Authorization: creds! },
@@ -495,6 +509,14 @@ const KGAdmin = () => {
           convertData.detail || `Conversion failed: ${convertResp.statusText}`
         );
       }
+      if (convertData.status === "conflict") {
+        // Defensive: surface the server's conflict message instead of
+        // continuing into the LLM step with no converted samples.
+        throw new Error(
+          convertData.message ||
+            "Some sample filenames already exist on the server."
+        );
+      }
 
       // Step 2/2: LLM call. The status flip now reflects the real
       // backend phase change, not a timer.
@@ -508,7 +530,6 @@ const KGAdmin = () => {
             "Content-Type": "application/json",
           },
           body: JSON.stringify({
-            request_id: convertData.request_id || "",
             filenames: convertData.saved_files || [],
             vertex_hints: vertexHints,
             edge_hints: edgeHints,
@@ -2191,7 +2212,6 @@ const KGAdmin = () => {
                   <Button
                     variant="outline"
                     onClick={() => handleInitializeDialogChange(false)}
-                    disabled={isInitializing}
                     className="dark:border-[#3D3D3D]"
                   >
                     Close
@@ -2361,7 +2381,7 @@ const KGAdmin = () => {
           }}
         >
           <DialogContent
-            className="sm:max-w-[700px] bg-white dark:bg-background border-gray-300 dark:border-[#3D3D3D] max-h-[80vh] overflow-y-auto"
+            className="sm:max-w-[760px] bg-white dark:bg-background border-gray-300 dark:border-[#3D3D3D] max-h-[80vh] overflow-y-auto"
             onInteractOutside={(e) => e.preventDefault()}
           >
             <DialogHeader>
diff --git a/graphrag-ui/src/utils/uploadConflicts.ts b/graphrag-ui/src/utils/uploadConflicts.ts
new file mode 100644
index 0000000..dc10460
--- /dev/null
+++ b/graphrag-ui/src/utils/uploadConflicts.ts
@@ -0,0 +1,65 @@
+import { safeJson } from "./safeJson";
+
+/**
+ * Pre-flight the planned upload to detect filename collisions, then
+ * prompt the user once and resolve the chosen action into the query
+ * string for the subsequent ``POST /uploads`` (or
+ * ``POST /convert_sample_files``) call.
+ *
+ * Three outcomes:
+ *   * No conflicts → ``""`` (just send the upload as-is)
+ *   * User chose Replace → ``"?overwrite=true"``
+ *   * User cancelled → ``null`` (caller should abort the upload)
+ *
+ * If the pre-flight endpoint is unreachable or returns an error,
+ * falls back to ``"?overwrite=true"`` so the upload still proceeds.
+ *
+ * ``confirm`` is supplied by the caller (typically the ``useConfirm``
+ * hook) so the prompt uses the app's styled dialog instead of the
+ * browser default.
+ */
+export async function resolveUploadConflicts(
+  graphName: string,
+  filenames: string[],
+  creds: string,
+  confirm: (message: string) => Promise<boolean>
+): Promise<string | null> {
+  const OVERWRITE = "?overwrite=true";
+  if (filenames.length === 0) return "";
+
+  let clashing: string[] = [];
+  try {
+    const resp = await fetch(`/ui/${graphName}/uploads/check`, {
+      method: "POST",
+      headers: { Authorization: creds, "Content-Type": "application/json" },
+      body: JSON.stringify({ filenames }),
+    });
+    if (!resp.ok) {
+      // Pre-flight returned an error status — fall back so the upload proceeds.
+      return OVERWRITE;
+    }
+    const payload = await safeJson(resp);
+    clashing = Array.isArray(payload?.conflicts) ? payload.conflicts : [];
+  } catch {
+    // The request (or reading its response) threw — same fallback as above.
+    return OVERWRITE;
+  }
+
+  if (clashing.length === 0) return "";
+
+  // Singular/plural wording for the prompt.
+  const single = clashing.length === 1;
+  const noun = `file${single ? "" : "s"}`;
+  const verb = single ? "exists" : "exist";
+  const pronoun = single ? "it" : "them";
+  const bullets = clashing.map((n) => `  •  ${n}`).join("\n");
+  const prompt =
+    `${clashing.length} ${noun} already ${verb} on the server:\n\n` +
+    `${bullets}\n\n` +
+    `Replace ${pronoun}?\n` +
+    `Cancel will abort the upload.`;
+
+  // Confirmed → overwrite on the server; declined → caller aborts.
+  const replaceChosen = await confirm(prompt);
+  return replaceChosen ? OVERWRITE : null;
+}
diff --git a/graphrag/app/routers/ui.py b/graphrag/app/routers/ui.py
index 27bc954..1551cfa 100644
--- a/graphrag/app/routers/ui.py
+++ b/graphrag/app/routers/ui.py
@@ -60,7 +60,7 @@
 from common.logs.log import req_id_cv
 from common.logs.logwriter import LogWriter
 from common.metrics.prometheus_metrics import metrics as pmetrics
-from common.utils.graph_locks import acquire_graph_lock, release_graph_lock, acquire_rebuild_lock, release_rebuild_lock, get_rebuilding_graph
+from common.utils.graph_locks import acquire_graph_lock, release_graph_lock, acquire_rebuild_lock, release_rebuild_lock, get_rebuilding_graph, get_current_operation
 from supportai import supportai
 from common.py_schemas.schemas import (
     AgentProgess,
@@ -1372,24 +1372,61 @@ def get_initialize_status(
     return _get_init_state(graphname)
 
 
+def _sweep_legacy_schema_subdirs(graphname: str) -> None:
+    """Delete leftover ``_schema_<id>/`` staging directories from both the
+    graph's upload folder and its ``ingestion_temp`` folder. A directory
+    that cannot be removed is logged as a warning and the sweep continues.
+    """
+    for parent in (
+        os.path.join("uploads", graphname),
+        os.path.join("uploads", "ingestion_temp", graphname),
+    ):
+        if not os.path.isdir(parent):
+            continue
+        for entry in os.listdir(parent):
+            stale = os.path.join(parent, entry)
+            if not (entry.startswith("_schema_") and os.path.isdir(stale)):
+                continue
+            try:
+                shutil.rmtree(stale)
+            except OSError as exc:
+                logger.warning(
+                    f"Could not remove legacy schema subdir {stale}: {exc}"
+                )
+
+
 @router.post(route_prefix + "/{graphname}/convert_sample_files")
 async def convert_sample_files(
     graphname: ValidGraphName,
     creds: Annotated[tuple[list[str], HTTPBasicCredentials], Depends(ui_basic_auth)],
     files: Annotated[list[UploadFile], File(description="Sample documents (≤5)")],
+    overwrite: bool = False,
+    skip: str | None = None,
 ):
     """
     Step 1/2 of the sample-doc schema extraction flow:
 
-    Save uploaded sample files into a fresh per-request subdirectory
-    under ``uploads/<graphname>/_schema_<request_id>/`` and convert
-    each to JSONL under
-    ``uploads/ingestion_temp/<graphname>/_schema_<request_id>/``.
-    Returns the list of saved filenames and the ``request_id`` so the
-    caller can pass both to ``POST /ui/<graph>/extract_schema_from_jsonl``.
+    Save uploaded sample files to ``uploads/<graphname>/`` and convert
+    each to JSONL under ``uploads/ingestion_temp/<graphname>/``. Files
+    are persisted so the Ingest Document dialog can reuse them, and
+    the JSONL cache means a subsequent Ingest run won't re-convert.
 
-    Each sample-upload request is isolated so stale files from prior
-    sessions can't be re-converted or pollute the resulting schema.
+    Returns the list of saved filenames so the caller can pass them
+    to ``POST /ui/<graph>/extract_schema_from_jsonl``.
+
+    Collision handling mirrors ``POST /uploads``:
+      * ``overwrite=false`` (default) and any filename already exists →
+        ``{"status": "conflict", "existing_files": [...]}`` is returned
+        and nothing is written. Pre-flight via ``POST /uploads/check``
+        before sending bytes to avoid re-uploading on conflict.
+      * ``overwrite=true`` replaces the existing file (and its cached
+        JSONL) before re-converting.
+      * ``skip`` is a comma-separated list of filenames to drop from the
+        incoming set silently — useful when the user chose "skip" on a
+        conflict prompt for a subset of files.
+
+    Concurrent schema-extraction requests against the same graph are
+    rejected with 409 — only one runs at a time.
 
     No LLM call. Caps come from ``graphrag_config``:
       * ``schema_max_sample_files`` (default 5) — file count
@@ -1402,69 +1439,121 @@ async def convert_sample_files(
     max_total_mb = int(graphrag_config.get("schema_max_total_mb", 50))
     max_total_bytes = max_total_mb * 1024 * 1024
 
-    if len(files) > max_files:
+    skip_set: set[str] = set()
+    if skip:
+        skip_set = {os.path.basename(s.strip()) for s in skip.split(",") if s.strip()}
+
+    accepted = [f for f in files if os.path.basename(f.filename or "") not in skip_set]
+    if len(accepted) > max_files:
         raise HTTPException(
             status_code=400,
-            detail=f"Too many files: got {len(files)}, max is {max_files}.",
+            detail=f"Too many files: got {len(accepted)}, max is {max_files}.",
         )
-    if not files:
+    if not accepted:
         raise HTTPException(status_code=400, detail="No files supplied.")
 
-    request_id = uuid.uuid4().hex[:12]
-    request_subdir = f"_schema_{request_id}"
-    upload_dir = os.path.join("uploads", graphname, request_subdir)
-    os.makedirs(upload_dir, exist_ok=True)
-    temp_folder = os.path.join("uploads", "ingestion_temp", graphname, request_subdir)
-    os.makedirs(temp_folder, exist_ok=True)
-
-    saved_basenames: list[str] = []
-    total_bytes = 0
-    for f in files:
-        data = await f.read()
-        total_bytes += len(data)
-        if total_bytes > max_total_bytes:
-            raise HTTPException(
-                status_code=400,
-                detail=(
-                    f"Total upload exceeds {max_total_mb} MB cap."
-                ),
+    acquired = await asyncio.to_thread(
+        acquire_graph_lock, graphname, "schema_extraction"
+    )
+    if not acquired:
+        raise HTTPException(
+            status_code=409,
+            detail=(
+                f"Graph '{graphname}' is already running schema extraction "
+                "or another ingest operation. Please wait and try again."
+            ),
+        )
+
+    try:
+        _sweep_legacy_schema_subdirs(graphname)
+
+        upload_dir = os.path.join("uploads", graphname)
+        os.makedirs(upload_dir, exist_ok=True)
+        temp_folder = os.path.join("uploads", "ingestion_temp", graphname)
+        os.makedirs(temp_folder, exist_ok=True)
+
+        if not overwrite:
+            existing = [
+                name
+                for name in (
+                    os.path.basename(f.filename or "") or "sample" for f in accepted
+                )
+                if os.path.exists(os.path.join(upload_dir, name))
+            ]
+            if existing:
+                return {
+                    "status": "conflict",
+                    "message": (
+                        "Some files already exist. Resend with overwrite=true "
+                        "to replace them, or with skip=<filename,...> to drop "
+                        "specific files from the upload set."
+                    ),
+                    "existing_files": existing,
+                }
+
+        # Pass 1: read and validate everything before touching disk so a
+        # rejected request never leaves a partially-written batch behind.
+        pending: dict[str, bytes] = {}
+        total_bytes = 0
+        for f in accepted:
+            data = await f.read()
+            total_bytes += len(data)
+            if total_bytes > max_total_bytes:
+                raise HTTPException(
+                    status_code=400,
+                    detail=f"Total upload exceeds {max_total_mb} MB cap.",
+                )
+            safe_name = os.path.basename(f.filename or "") or "sample"  # never ""
+            if safe_name in pending:
+                raise HTTPException(
+                    status_code=400,
+                    detail=(
+                        f"Duplicate filename '{safe_name}' in upload set. "
+                        "Rename one of the files and try again."
+                    ),
+                )
+            pending[safe_name] = data
+
+        # Pass 2: persist. On overwrite, drop the cached JSONL first so
+        # the new bytes are re-converted instead of reusing a stale one.
+        for safe_name, data in pending.items():
+            stem = os.path.splitext(safe_name)[0]
+            cached_jsonl = os.path.join(temp_folder, f"{stem}.jsonl")
+            if overwrite and os.path.exists(cached_jsonl):
+                try:
+                    os.remove(cached_jsonl)
+                except OSError as exc:
+                    logger.warning(
+                        f"Could not remove cached jsonl {cached_jsonl}: {exc}"
+                    )
+            with open(os.path.join(upload_dir, safe_name), "wb") as out:
+                out.write(data)
+        saved_basenames: list[str] = list(pending)
+
+        extractor = TextExtractor()
+        try:
+            result = await extractor._process_folder_async(
+                upload_dir, graphname, temp_folder
             )
-        safe_name = os.path.basename(f.filename or "sample")
-        if safe_name in saved_basenames:
+        except Exception as exc:
             raise HTTPException(
                 status_code=400,
-                detail=(
-                    f"Duplicate filename '{safe_name}' in upload set. "
-                    "Rename one of the files and try again."
-                ),
+                detail=f"Text extraction failed: {exc}",
             )
-        target = os.path.join(upload_dir, safe_name)
-        with open(target, "wb") as out:
-            out.write(data)
-        saved_basenames.append(safe_name)
 
-    extractor = TextExtractor()
-    try:
-        result = await extractor._process_folder_async(
-            upload_dir, graphname, temp_folder
+        LogWriter.info(
+            f"Converted sample files for {graphname}: "
+            f"{len(accepted)} uploaded, {result.get('num_documents', 0)} docs in JSONL"
         )
-    except Exception as exc:
-        raise HTTPException(
-            status_code=400,
-            detail=f"Text extraction failed: {exc}",
-        )
-
-    LogWriter.info(
-        f"Converted sample files for {graphname} (request {request_id}): "
-        f"{len(files)} uploaded, {result.get('num_documents', 0)} docs in JSONL"
-    )
-    return {
-        "status": "success",
-        "graphname": graphname,
-        "request_id": request_id,
-        "saved_files": list(saved_basenames),
-        "num_documents": result.get("num_documents", 0),
-    }
+        return {
+            "status": "success",
+            "graphname": graphname,
+            "saved_files": list(saved_basenames),
+            "skipped_files": sorted(skip_set),
+            "num_documents": result.get("num_documents", 0),
+        }
+    finally:
+        await asyncio.to_thread(release_graph_lock, graphname, "schema_extraction")
 
 
 @router.post(route_prefix + "/{graphname}/extract_schema_from_jsonl")
@@ -1482,39 +1571,49 @@ def extract_schema_from_jsonl(
     form-mode editor.
 
     Body:
-        ``{"request_id": "<id>", "filenames": ["report1.pdf", "report2.docx"]}``
-    ``request_id`` (returned by ``convert_sample_files``) selects the
-    per-request subdirectory under
-    ``uploads/ingestion_temp/<graphname>/_schema_<request_id>/`` so
-    only the JSONLs belonging to this sample-upload session feed the
-    LLM. If ``request_id`` is absent, the endpoint falls back to the
-    legacy per-graph temp folder for backward compatibility.
-    """
-    request_id = ""
+        ``{"filenames": ["report1.pdf", "report2.docx"]}``
+    The endpoint reads ``uploads/ingestion_temp/<graphname>/<stem>.jsonl``
+    for each listed name. ``filenames`` is required and must be a
+    non-empty list — every sample file the caller wants fed to the
+    schema-extraction LLM must be named explicitly.
+
+    Concurrent schema-extraction requests against the same graph are
+    rejected with 409 — only one runs at a time.
+    """
+    requested = []
     if isinstance(payload, dict):
-        request_id = str(payload.get("request_id") or "")
-    if request_id and not re.fullmatch(r"[A-Za-z0-9_-]+", request_id):
-        raise HTTPException(status_code=400, detail="Invalid request_id")
-    if request_id:
-        temp_folder = os.path.join(
-            "uploads", "ingestion_temp", graphname, f"_schema_{request_id}"
-        )
-    else:
-        temp_folder = os.path.join("uploads", "ingestion_temp", graphname)
-    if not os.path.isdir(temp_folder):
+        requested = payload.get("filenames") or []
+    if not requested:
         raise HTTPException(
             status_code=400,
             detail=(
-                f"No converted JSONLs found for graph {graphname}. "
-                "Run convert_sample_files first."
+                "No sample files specified. Pass 'filenames' as a non-empty "
+                "list naming each previously-converted sample to feed the "
+                "schema-extraction LLM."
             ),
         )
 
-    requested = []
-    if isinstance(payload, dict):
-        requested = payload.get("filenames") or []
+    acquired = acquire_graph_lock(graphname, "schema_extraction")
+    if not acquired:
+        raise HTTPException(
+            status_code=409,
+            detail=(
+                f"Graph '{graphname}' is already running schema extraction "
+                "or another ingest operation. Please wait and try again."
+            ),
+        )
+
+    try:
+        temp_folder = os.path.join("uploads", "ingestion_temp", graphname)
+        if not os.path.isdir(temp_folder):
+            raise HTTPException(
+                status_code=400,
+                detail=(
+                    f"No converted JSONLs found for graph {graphname}. "
+                    "Run convert_sample_files first."
+                ),
+            )
 
-    if requested:
         jsonl_paths = []
         missing_jsonls = []
         for name in requested:
@@ -1533,62 +1632,58 @@ def extract_schema_from_jsonl(
                     + ". Run convert_sample_files first for those files."
                 ),
             )
-    else:
-        jsonl_paths = [
-            os.path.join(temp_folder, fn)
-            for fn in os.listdir(temp_folder)
-            if fn.endswith(".jsonl")
-        ]
 
-    samples: list[dict] = []
-    for jp in jsonl_paths:
-        with open(jp, "r", encoding="utf-8") as jf:
-            for line in jf:
-                line = line.strip()
-                if not line:
-                    continue
-                try:
-                    samples.append(json.loads(line))
-                except json.JSONDecodeError:
-                    pass
+        samples: list[dict] = []
+        for jp in jsonl_paths:
+            with open(jp, "r", encoding="utf-8") as jf:
+                for line in jf:
+                    line = line.strip()
+                    if not line:
+                        continue
+                    try:
+                        samples.append(json.loads(line))
+                    except json.JSONDecodeError:
+                        pass
 
-    if not samples:
-        raise HTTPException(
-            status_code=400,
-            detail="No extractable text in the converted files.",
-        )
+        if not samples:
+            raise HTTPException(
+                status_code=400,
+                detail="No extractable text in the converted files.",
+            )
 
-    # Optional structured hints from the UI (TagInput chips). Each
-    # hint is ``{"name": str, "description": str}``. Backend ignores
-    # malformed entries silently — names are validated client-side.
-    vertex_hints = (payload or {}).get("vertex_hints") if isinstance(payload, dict) else None
-    edge_hints = (payload or {}).get("edge_hints") if isinstance(payload, dict) else None
+        # Optional structured hints from the UI (TagInput chips). Each
+        # hint is ``{"name": str, "description": str}``. Backend ignores
+        # malformed entries silently — names are validated client-side.
+        vertex_hints = (payload or {}).get("vertex_hints") if isinstance(payload, dict) else None
+        edge_hints = (payload or {}).get("edge_hints") if isinstance(payload, dict) else None
 
-    LogWriter.info(
-        f"Running schema extraction LLM for {graphname} "
-        f"({len(jsonl_paths)} JSONLs, {len(samples)} doc parts, "
-        f"{len(vertex_hints or [])} vertex hints, {len(edge_hints or [])} edge hints)"
-    )
-    llm_service = get_llm_service(get_completion_config(graphname))
-    gsql_text, rendered_prompt = schema_extraction_mod.extract_schema_gsql(
-        llm_service, samples,
-        vertex_hints=vertex_hints, edge_hints=edge_hints,
-    )
-    proposal = schema_utils_mod.parse_gsql_schema(gsql_text)
-    proposal.drop_dangling_pairs()
-    return {
-        "status": "success",
-        "graphname": graphname,
-        "schema_gsql": gsql_text,
-        "preview_gsql": schema_utils_mod.emit_preview_gsql(proposal),
-        "proposal": proposal.to_dict(),
-        "summary": schema_utils_mod.summarize(proposal),
-        # The fully-rendered prompt (default + suggested-types block).
-        # The UI saves this verbatim as the per-graph override after a
-        # successful initialize_graph so the addendum survives the
-        # session.
-        "rendered_prompt": rendered_prompt,
-    }
+        LogWriter.info(
+            f"Running schema extraction LLM for {graphname} "
+            f"({len(jsonl_paths)} JSONLs, {len(samples)} doc parts, "
+            f"{len(vertex_hints or [])} vertex hints, {len(edge_hints or [])} edge hints)"
+        )
+        llm_service = get_llm_service(get_completion_config(graphname))
+        gsql_text, rendered_prompt = schema_extraction_mod.extract_schema_gsql(
+            llm_service, samples,
+            vertex_hints=vertex_hints, edge_hints=edge_hints,
+        )
+        proposal = schema_utils_mod.parse_gsql_schema(gsql_text)
+        proposal.drop_dangling_pairs()
+        return {
+            "status": "success",
+            "graphname": graphname,
+            "schema_gsql": gsql_text,
+            "preview_gsql": schema_utils_mod.emit_preview_gsql(proposal),
+            "proposal": proposal.to_dict(),
+            "summary": schema_utils_mod.summarize(proposal),
+            # The fully-rendered prompt (default + suggested-types block).
+            # The UI saves this verbatim as the per-graph override after a
+            # successful initialize_graph so the addendum survives the
+            # session.
+            "rendered_prompt": rendered_prompt,
+        }
+    finally:
+        release_graph_lock(graphname, "schema_extraction")
 
 
 @router.post(route_prefix + "/{graphname}/rebuild_graph")
@@ -2426,6 +2521,37 @@ async def chat(
 # File Upload Functionality for Server +Multi
 # =====================================================
 
+@router.get(route_prefix + "/{graphname}/upload_status")
+async def get_upload_status(
+    graphname: ValidGraphName,
+    creds: Annotated[tuple[list[str], HTTPBasicCredentials], Depends(ui_basic_auth)],
+):
+    """Tell the caller which long-running operation, if any, currently
+    holds ``graphname``. The Document Ingestion dialog polls this on mount
+    and while it is open, so its Ingest button tracks server-side state
+    even after the dialog has been closed and reopened.
+
+    Response::
+
+        {
+          "graphname": str,
+          "processing": bool,   (true exactly when "operation" is not null)
+          "operation": "create_ingest" | "ingest" | "upload_files" |
+                       "schema_extraction" | "rebuild" | null
+        }
+    """
+    active_op = get_current_operation(graphname)
+    if active_op is None:
+        # Rebuilds are tracked by a separate (global) lock; fold it in here
+        # so the UI only has to poll this one endpoint.
+        if get_rebuilding_graph() == graphname:
+            active_op = "rebuild"
+    status = {"graphname": graphname}
+    status["processing"] = active_op is not None
+    status["operation"] = active_op
+    return status
+
+
 @router.get(route_prefix + "/{graphname}/uploads/list")
 async def list_uploaded_files(
     graphname: ValidGraphName,
@@ -2467,21 +2593,70 @@ async def list_uploaded_files(
         raise HTTPException(status_code=500, detail=f"Error listing files: {str(e)}")
 
 
+@router.post(route_prefix + "/{graphname}/uploads/check")
+async def check_upload_conflicts(
+    graphname: ValidGraphName,
+    creds: Annotated[tuple[list[str], HTTPBasicCredentials], Depends(ui_basic_auth)],
+    payload: Annotated[dict, Body(...)],
+):
+    """
+    Pre-flight a planned upload: given a list of filenames, return which
+    ones already exist for ``graphname``, so the client can prompt the
+    user once and resend the bytes with ``overwrite=true`` or
+    ``skip=<filename,...>`` instead of wasting upload bandwidth. Names are
+    reduced to their basename; non-strings and names whose basename is
+    empty, ``.`` or ``..`` are ignored.
+
+    Body:     ``{"filenames": ["report.pdf", "transactions.csv", ...]}``
+    Response: ``{"graphname": "<graphname>", "conflicts": ["report.pdf"]}``
+    Raises:   HTTPException 400 when ``filenames`` is not a list.
+    """
+    requested = payload.get("filenames") or []
+    if not isinstance(requested, list):
+        raise HTTPException(
+            status_code=400, detail="'filenames' must be a list of strings.",
+        )
+
+    upload_dir = os.path.join("uploads", graphname)
+    if not os.path.isdir(upload_dir):
+        return {"graphname": graphname, "conflicts": []}
+
+    conflicts = []
+    for name in requested:
+        safe_name = os.path.basename(name) if isinstance(name, str) else ""
+        if safe_name in ("", ".", ".."):  # would resolve to a directory
+            continue
+        if os.path.exists(os.path.join(upload_dir, safe_name)):
+            conflicts.append(safe_name)
+    return {"graphname": graphname, "conflicts": conflicts}
+
+
 @router.post(route_prefix + "/{graphname}/uploads")
 async def upload_files(
     graphname: ValidGraphName,
     creds: Annotated[tuple[list[str], HTTPBasicCredentials], Depends(ui_basic_auth)],
     files: list[UploadFile] = File(...),
     overwrite: bool = False,
+    skip: str | None = None,
 ):
     """
     Upload one or multiple files for a specific graphname.
     Files are stored in uploads/{graphname}/ directory.
-    
+
     Parameters:
     - graphname: The graph name to associate files with
     - files: List of files to upload
-    - overwrite: If False (default), will reject if files already exist
+    - overwrite: If False (default), will reject if any non-skipped file
+      already exists (all-or-nothing conflict response). If True, replace
+      existing files and drop their cached JSONLs so the next ingest
+      re-converts the new bytes.
+    - skip: Optional comma-separated list of filenames to silently drop
+      from the upload set. Used after the client prompts the user on a
+      pre-flight conflict and the user chose "skip" for a subset of
+      files.
+
+    Pre-flight via ``POST /uploads/check`` to avoid re-uploading bytes
+    when a collision is hit.
     """
     # Acquire graph lock
     acquired = await asyncio.to_thread(acquire_graph_lock, graphname, "upload_files")
@@ -2490,56 +2665,89 @@ async def upload_files(
             status_code=409,
             detail=f"Graph '{graphname}' is currently being processed by another operation. Please wait and try again."
         )
-    
+
     try:
         upload_dir = os.path.join("uploads", graphname)
         os.makedirs(upload_dir, exist_ok=True)
-        
+        temp_folder = os.path.join("uploads", "ingestion_temp", graphname)
+
+        skip_set: set[str] = set()
+        if skip:
+            skip_set = {
+                os.path.basename(s.strip()) for s in skip.split(",") if s.strip()
+            }
+        accepted = [
+            f for f in files
+            if os.path.basename(f.filename or "") not in skip_set
+        ]
+
         # Check for existing files if overwrite is False
         if not overwrite:
             existing_files = []
-            for file in files:
-                file_path = os.path.join(upload_dir, file.filename)
+            for file in accepted:
+                file_path = os.path.join(
+                    upload_dir, os.path.basename(file.filename or "")
+                )
                 if os.path.exists(file_path):
-                    existing_files.append(file.filename)
-            
+                    existing_files.append(os.path.basename(file.filename or ""))
+
             if existing_files:
                 return {
                     "status": "conflict",
-                    "message": "Some files already exist. Set overwrite=true to replace them.",
+                    "message": (
+                        "Some files already exist. Resend with overwrite=true "
+                        "to replace them, or with skip=<filename,...> to drop "
+                        "specific files from the upload set."
+                    ),
                     "existing_files": existing_files,
                 }
-        
+
         # Save uploaded files
         uploaded_files = []
         total_size = 0
-        
-        for file in files:
-            file_path = os.path.join(upload_dir, file.filename)
-            
+
+        for file in accepted:
+            safe_name = os.path.basename(file.filename or "")
+            file_path = os.path.join(upload_dir, safe_name)
+
+            # On overwrite, drop the cached JSONL so the next ingest
+            # re-converts the new bytes instead of silently reusing the
+            # stale extract.
+            if overwrite and os.path.isdir(temp_folder):
+                stem = os.path.splitext(safe_name)[0]
+                cached_jsonl = os.path.join(temp_folder, f"{stem}.jsonl")
+                if os.path.exists(cached_jsonl):
+                    try:
+                        os.remove(cached_jsonl)
+                    except OSError as exc:
+                        logger.warning(
+                            f"Could not remove cached jsonl {cached_jsonl}: {exc}"
+                        )
+
             # Write file to disk
             with open(file_path, "wb") as f:
                 content = await file.read()
                 f.write(content)
                 file_size = len(content)
                 total_size += file_size
-            
+
             uploaded_files.append({
-                "filename": file.filename,
+                "filename": safe_name,
                 "size": file_size,
                 "path": file_path,
             })
-            
-            logger.info(f"Uploaded file {file.filename} ({file_size} bytes) for graph {graphname}")
-        
+
+            logger.info(f"Uploaded file {safe_name} ({file_size} bytes) for graph {graphname}")
+
         return {
             "status": "success",
             "message": f"Successfully uploaded {len(uploaded_files)} file(s)",
             "graphname": graphname,
             "uploaded_files": uploaded_files,
+            "skipped_files": sorted(skip_set),
             "total_size": total_size,
         }
-    
+
     except HTTPException:
         raise
     except Exception as e:
diff --git a/graphrag/tests/test_v1_4_1_uploads_schema.py b/graphrag/tests/test_v1_4_1_uploads_schema.py
new file mode 100644
index 0000000..74ee10f
--- /dev/null
+++ b/graphrag/tests/test_v1_4_1_uploads_schema.py
@@ -0,0 +1,454 @@
+# Copyright (c) 2024-2026 TigerGraph, Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import io
+import os
+import shutil
+import sys
+import tempfile
+import unittest
+from pathlib import Path
+from unittest.mock import AsyncMock, MagicMock, patch
+
+from fastapi.testclient import TestClient
+from app.main import app
+
+# main.py uses ``import routers`` (absolute), so the module is registered
+# as ``routers.ui`` in sys.modules.  Alias it to ``app.routers.ui`` so the
+# @patch() targets resolve to the same module object.
+sys.modules.setdefault("app.routers.ui", sys.modules["routers.ui"])
+
+from app.routers.ui import _sweep_legacy_schema_subdirs
+from common.utils.graph_locks import (
+    acquire_graph_lock,
+    get_current_operation,
+    release_graph_lock,
+)
+
+
+GRAPH = "TestGraph"
+
+
+def _ok_auth():
+    """Stand-in return value for ``auth()``: one accessible graph plus dummy creds."""
+    return [GRAPH], MagicMock(username="testuser", password="testpass")
+
+
+class _ChdirTempDir:
+    """Run a test inside a throwaway working directory: entering creates
+    a temp dir and chdirs into it; exiting chdirs back and deletes it.
+    """
+
+    def __init__(self):
+        # Both attributes are filled in by __enter__.
+        self.tmp = self.prev = None
+
+    def __enter__(self):
+        self.prev = os.getcwd()
+        self.tmp = workdir = tempfile.mkdtemp(prefix="graphrag_v141_test_")
+        os.chdir(workdir)
+        return Path(workdir)
+
+    def __exit__(self, *exc):
+        os.chdir(self.prev)  # step out of the directory before removing it
+        shutil.rmtree(self.tmp, ignore_errors=True)
+
+
+class TestUploadsCheck(unittest.TestCase):
+    """``POST /ui/{graph}/uploads/check`` reports which of the planned
+    filenames already exist on disk for the graph. Each test runs in its
+    own temporary working directory via ``_ChdirTempDir``.
+    """
+
+    def setUp(self):
+        self.client = TestClient(app)
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_returns_conflicts_for_existing_files(self, _mock_auth):
+        with _ChdirTempDir() as tmp:
+            upload_dir = tmp / "uploads" / GRAPH
+            upload_dir.mkdir(parents=True)
+            (upload_dir / "report.pdf").write_bytes(b"old")
+            (upload_dir / "summary.docx").write_bytes(b"old")
+
+            resp = self.client.post(
+                f"/ui/{GRAPH}/uploads/check",
+                json={"filenames": ["report.pdf", "summary.docx", "new.csv"]},  # new.csv is not on disk
+                auth=("testuser", "testpass"),
+            )
+
+        self.assertEqual(resp.status_code, 200)
+        body = resp.json()
+        self.assertEqual(set(body["conflicts"]), {"report.pdf", "summary.docx"})
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_returns_empty_when_no_conflicts(self, _mock_auth):
+        with _ChdirTempDir() as tmp:
+            (tmp / "uploads" / GRAPH).mkdir(parents=True)  # directory exists but is empty
+
+            resp = self.client.post(
+                f"/ui/{GRAPH}/uploads/check",
+                json={"filenames": ["fresh.pdf"]},
+                auth=("testuser", "testpass"),
+            )
+
+        self.assertEqual(resp.status_code, 200)
+        self.assertEqual(resp.json()["conflicts"], [])
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_returns_empty_when_graph_dir_missing(self, _mock_auth):
+        with _ChdirTempDir():  # fresh cwd: no uploads/ tree at all
+            resp = self.client.post(
+                f"/ui/{GRAPH}/uploads/check",
+                json={"filenames": ["whatever.pdf"]},
+                auth=("testuser", "testpass"),
+            )
+
+        self.assertEqual(resp.status_code, 200)
+        self.assertEqual(resp.json()["conflicts"], [])
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_rejects_non_list_filenames(self, _mock_auth):
+        with _ChdirTempDir():
+            resp = self.client.post(
+                f"/ui/{GRAPH}/uploads/check",
+                json={"filenames": "report.pdf"},  # a bare string, not a list
+                auth=("testuser", "testpass"),
+            )
+
+        self.assertEqual(resp.status_code, 400)
+
+
+class TestUploadsOverwriteSkip(unittest.TestCase):
+    """``POST /ui/{graph}/uploads`` honours the ``overwrite`` and ``skip`` query parameters."""
+
+    def setUp(self):
+        self.client = TestClient(app)
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_overwrite_false_returns_conflict_envelope_on_collision(self, _mock_auth):
+        with _ChdirTempDir() as tmp:
+            (tmp / "uploads" / GRAPH).mkdir(parents=True)
+            (tmp / "uploads" / GRAPH / "report.pdf").write_bytes(b"old")
+
+            resp = self.client.post(
+                f"/ui/{GRAPH}/uploads",  # no overwrite/skip query parameters
+                files=[("files", ("report.pdf", io.BytesIO(b"new"), "application/pdf"))],
+                auth=("testuser", "testpass"),
+            )
+
+        self.assertEqual(resp.status_code, 200)  # the conflict is reported in the body, not the HTTP status
+        body = resp.json()
+        self.assertEqual(body["status"], "conflict")
+        self.assertIn("report.pdf", body["existing_files"])
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_overwrite_true_drops_cached_jsonl(self, _mock_auth):
+        with _ChdirTempDir() as tmp:
+            upload_dir = tmp / "uploads" / GRAPH
+            upload_dir.mkdir(parents=True)
+            (upload_dir / "report.pdf").write_bytes(b"old")
+            temp_folder = tmp / "uploads" / "ingestion_temp" / GRAPH
+            temp_folder.mkdir(parents=True)
+            (temp_folder / "report.jsonl").write_text("stale-extract")  # cached extract for report.pdf
+
+            resp = self.client.post(
+                f"/ui/{GRAPH}/uploads?overwrite=true",
+                files=[("files", ("report.pdf", io.BytesIO(b"new"), "application/pdf"))],
+                auth=("testuser", "testpass"),
+            )
+
+            self.assertEqual(resp.status_code, 200)
+            self.assertEqual(resp.json()["status"], "success")
+            # The uploaded file now holds the new bytes.
+            self.assertEqual((upload_dir / "report.pdf").read_bytes(), b"new")
+            # The cached extract with the same stem has been deleted.
+            self.assertFalse((temp_folder / "report.jsonl").exists())
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_skip_drops_listed_files_from_upload_set(self, _mock_auth):
+        with _ChdirTempDir() as tmp:
+            (tmp / "uploads" / GRAPH).mkdir(parents=True)
+            (tmp / "uploads" / GRAPH / "keep_me.pdf").write_bytes(b"old")
+
+            resp = self.client.post(
+                f"/ui/{GRAPH}/uploads?skip=keep_me.pdf",
+                files=[
+                    ("files", ("keep_me.pdf", io.BytesIO(b"new"), "application/pdf")),
+                    ("files", ("fresh.pdf", io.BytesIO(b"fresh"), "application/pdf")),
+                ],
+                auth=("testuser", "testpass"),
+            )
+
+            self.assertEqual(resp.status_code, 200)
+            body = resp.json()
+            self.assertEqual(body["status"], "success")
+            self.assertEqual(
+                [u["filename"] for u in body["uploaded_files"]],
+                ["fresh.pdf"],
+            )
+            # The skipped file still holds its original bytes on disk.
+            self.assertEqual(
+                (tmp / "uploads" / GRAPH / "keep_me.pdf").read_bytes(),
+                b"old",
+            )
+
+
+class TestExtractSchemaRequiresFilenames(unittest.TestCase):
+    """``POST /ui/{graph}/extract_schema_from_jsonl`` answers 400 when no
+    sample filenames are given and 409 when the graph lock is not acquired.
+    """
+
+    def setUp(self):
+        self.client = TestClient(app)
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_empty_filenames_returns_400(self, _mock_auth):
+        with _ChdirTempDir():
+            resp = self.client.post(
+                f"/ui/{GRAPH}/extract_schema_from_jsonl",
+                json={"filenames": []},  # key present, list empty
+                auth=("testuser", "testpass"),
+            )
+
+        self.assertEqual(resp.status_code, 400)
+        self.assertIn("non-empty", resp.json()["detail"].lower())
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_missing_filenames_returns_400(self, _mock_auth):
+        with _ChdirTempDir():
+            resp = self.client.post(
+                f"/ui/{GRAPH}/extract_schema_from_jsonl",
+                json={},  # key absent altogether
+                auth=("testuser", "testpass"),
+            )
+
+        self.assertEqual(resp.status_code, 400)
+        self.assertIn("non-empty", resp.json()["detail"].lower())
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    @patch("app.routers.ui.acquire_graph_lock", return_value=False)  # lock acquisition fails
+    def test_lock_held_returns_409(self, _mock_lock, _mock_auth):
+        with _ChdirTempDir():
+            resp = self.client.post(
+                f"/ui/{GRAPH}/extract_schema_from_jsonl",
+                json={"filenames": ["report.pdf"]},
+                auth=("testuser", "testpass"),
+            )
+
+        self.assertEqual(resp.status_code, 409)
+        self.assertIn("schema extraction", resp.json()["detail"].lower())
+
+
+class TestConvertSampleFiles(unittest.TestCase):
+    """``POST /ui/{graph}/convert_sample_files`` saves samples directly under
+    ``uploads/{graph}/`` and reports filename collisions as a conflict.
+    """
+
+    def setUp(self):
+        self.client = TestClient(app)
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_writes_to_flat_layout_and_returns_saved_files(self, _mock_auth):
+        async def _fake_process(self, folder, graphname, temp):  # replaces the real extractor call
+            stem = "report"
+            Path(temp).mkdir(parents=True, exist_ok=True)
+            Path(temp, f"{stem}.jsonl").write_text('{"text":"hello"}\n')
+            return {"num_documents": 1}
+
+        with _ChdirTempDir() as tmp, patch(
+            "app.routers.ui.TextExtractor._process_folder_async",
+            new=_fake_process,
+        ):
+            resp = self.client.post(
+                f"/ui/{GRAPH}/convert_sample_files",
+                files=[("files", ("report.pdf", io.BytesIO(b"x"), "application/pdf"))],
+                auth=("testuser", "testpass"),
+            )
+
+            self.assertEqual(resp.status_code, 200, resp.text)
+            body = resp.json()
+            self.assertEqual(body["status"], "success")
+            self.assertEqual(body["saved_files"], ["report.pdf"])
+            # The file sits directly in uploads/{graph}/, not in a _schema_* subdir.
+            self.assertTrue((tmp / "uploads" / GRAPH / "report.pdf").exists())
+            # The response carries no request_id field.
+            self.assertNotIn("request_id", body)
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_sweeps_legacy_schema_subdirs_on_entry(self, _mock_auth):
+        async def _fake_process(self, folder, graphname, temp):  # extractor stub that produces no documents
+            Path(temp).mkdir(parents=True, exist_ok=True)
+            return {"num_documents": 0}
+
+        with _ChdirTempDir() as tmp, patch(
+            "app.routers.ui.TextExtractor._process_folder_async",
+            new=_fake_process,
+        ):
+            stale_a = tmp / "uploads" / GRAPH / "_schema_old1"
+            stale_b = tmp / "uploads" / "ingestion_temp" / GRAPH / "_schema_old2"
+            stale_a.mkdir(parents=True)
+            stale_b.mkdir(parents=True)
+            (stale_a / "ghost.pdf").write_bytes(b"x")
+            (stale_b / "ghost.jsonl").write_text("x")
+
+            resp = self.client.post(
+                f"/ui/{GRAPH}/convert_sample_files",
+                files=[("files", ("fresh.pdf", io.BytesIO(b"y"), "application/pdf"))],
+                auth=("testuser", "testpass"),
+            )
+
+            self.assertEqual(resp.status_code, 200, resp.text)
+            self.assertFalse(stale_a.exists())  # legacy dir under uploads/{graph}/ removed
+            self.assertFalse(stale_b.exists())  # legacy dir under ingestion_temp/{graph}/ removed
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_returns_conflict_envelope_on_collision(self, _mock_auth):
+        with _ChdirTempDir() as tmp:
+            (tmp / "uploads" / GRAPH).mkdir(parents=True)
+            (tmp / "uploads" / GRAPH / "report.pdf").write_bytes(b"old")
+
+            resp = self.client.post(
+                f"/ui/{GRAPH}/convert_sample_files",
+                files=[("files", ("report.pdf", io.BytesIO(b"new"), "application/pdf"))],
+                auth=("testuser", "testpass"),
+            )
+
+            self.assertEqual(resp.status_code, 200)  # the conflict is reported in the body, not the HTTP status
+            body = resp.json()
+            self.assertEqual(body["status"], "conflict")
+            self.assertIn("report.pdf", body["existing_files"])
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    @patch("app.routers.ui.acquire_graph_lock", return_value=False)  # lock acquisition fails
+    def test_lock_held_returns_409(self, _mock_lock, _mock_auth):
+        with _ChdirTempDir():
+            resp = self.client.post(
+                f"/ui/{GRAPH}/convert_sample_files",
+                files=[("files", ("any.pdf", io.BytesIO(b"x"), "application/pdf"))],
+                auth=("testuser", "testpass"),
+            )
+
+        self.assertEqual(resp.status_code, 409)
+
+
+class TestLegacySubdirSweep(unittest.TestCase):
+    """``_sweep_legacy_schema_subdirs`` deletes ``_schema_*`` dirs, leaves
+    other subdirs alone, and copes with there being nothing to delete.
+    """
+
+    def test_removes_schema_subdirs_under_both_trees(self):
+        with _ChdirTempDir() as tmp:
+            uploads = tmp / "uploads"
+            legacy_upload = uploads / GRAPH / "_schema_x"
+            legacy_temp = uploads / "ingestion_temp" / GRAPH / "_schema_y"
+            unrelated = uploads / GRAPH / "regular_subdir"
+            for folder in (legacy_upload, legacy_temp, unrelated):
+                folder.mkdir(parents=True)
+                (folder / "file.bin").write_bytes(b"x")
+
+            _sweep_legacy_schema_subdirs(GRAPH)
+            self.assertFalse(legacy_upload.exists())
+            self.assertFalse(legacy_temp.exists())
+            # The subdir without the _schema_ prefix keeps its content.
+            self.assertTrue(unrelated.exists())
+            self.assertTrue((unrelated / "file.bin").exists())
+
+    def test_is_idempotent_when_no_subdirs_exist(self):
+        with _ChdirTempDir():
+            # Empty cwd: two consecutive sweeps must both return quietly.
+            for _ in range(2):
+                _sweep_legacy_schema_subdirs(GRAPH)
+
+
+class TestGraphLockOperationTracking(unittest.TestCase):
+    """``get_current_operation`` reports the operation name passed to
+    ``acquire_graph_lock`` while the lock is held, and ``None`` otherwise.
+    """
+
+    def setUp(self):
+        # Intended to guarantee the test graph's lock is free before each test.
+        release_graph_lock(GRAPH, "test_cleanup")
+
+    def tearDown(self):
+        release_graph_lock(GRAPH, "test_cleanup")  # frees any lock a test left held
+
+    def test_get_current_operation_none_when_unlocked(self):
+        self.assertIsNone(get_current_operation(GRAPH))
+
+    def test_get_current_operation_returns_op_name_while_held(self):
+        acquired = acquire_graph_lock(GRAPH, "create_ingest")  # not released here; left to tearDown
+        self.assertTrue(acquired)
+        self.assertEqual(get_current_operation(GRAPH), "create_ingest")
+
+    def test_release_clears_current_operation(self):
+        acquire_graph_lock(GRAPH, "ingest")
+        self.assertEqual(get_current_operation(GRAPH), "ingest")
+        release_graph_lock(GRAPH, "ingest")
+        self.assertIsNone(get_current_operation(GRAPH))
+
+
+class TestUploadStatusEndpoint(unittest.TestCase):
+    """``GET /ui/{graph}/upload_status`` reports whether the graph lock is
+    held and by which operation, so the Document Ingestion dialog can stay
+    in sync with server-side work still in flight after it was closed.
+    """
+
+    def setUp(self):
+        self.client = TestClient(app)
+        release_graph_lock(GRAPH, "test_cleanup")  # intended to start each test unlocked
+
+    def tearDown(self):
+        release_graph_lock(GRAPH, "test_cleanup")
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_processing_false_when_no_lock_held(self, _mock_auth):
+        resp = self.client.get(
+            f"/ui/{GRAPH}/upload_status", auth=("testuser", "testpass"),
+        )
+        self.assertEqual(resp.status_code, 200)
+        body = resp.json()
+        self.assertFalse(body["processing"])
+        self.assertIsNone(body["operation"])
+
+    @patch("app.routers.ui.auth", return_value=_ok_auth())
+    def test_processing_true_while_create_ingest_holds_lock(self, _mock_auth):
+        acquire_graph_lock(GRAPH, "create_ingest")  # take the lock directly; no ingest actually runs
+        try:
+            resp = self.client.get(
+                f"/ui/{GRAPH}/upload_status", auth=("testuser", "testpass"),
+            )
+        finally:
+            release_graph_lock(GRAPH, "create_ingest")  # release even if the request raises
+        self.assertEqual(resp.status_code, 200)
+        body = resp.json()
+        self.assertTrue(body["processing"])
+        self.assertEqual(body["operation"], "create_ingest")
+
+
+class TestTextExtractorSkipFilter(unittest.TestCase):
+    """``TextExtractor`` must skip ``_schema_*`` subdirs when walking a
+    folder so sample-doc staging is never re-ingested as regular
+    documents. Checked by scanning the module source for the literal.
+    """
+
+    def test_safe_walk_filter_includes_schema_prefix(self):
+        src = Path(__file__).resolve().parents[2] / "common" / "utils" / "text_extractors.py"
+        text = src.read_text(encoding="utf-8")  # don't depend on the locale encoding
+        # Accept either quote style so a formatter run cannot break this check.
+        self.assertRegex(text, r"""['"]_schema_['"]""")
+
+
+if __name__ == "__main__":
+    unittest.main()

From 679b515efb4d4a1748406317331a65fbe9b11c60 Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Wed, 3 Jun 2026 13:42:17 -0700
Subject: [PATCH 06/18] Embedding store: auto-recovery, in-UI status, graceful
 chat fallback

- The vector store reconnects automatically after a transient TigerGraph outage; retry backs off from 10 seconds to 5 minutes
- Chat stays available when vector search is unavailable; graph-traversal questions answer normally
- The Graph Database Configuration page shows the current vector store state and offers a Reconnect control when it is unavailable
- Test Connection reports the TigerGraph version and whether vector search will be available on the configured database
- Saving a new database configuration refreshes the in-page status so the operator sees whether the embedding store recovered on the new credentials

Refs: GML-2092
---
 CHANGELOG.md                                  |   2 +
 common/config.py                              |  35 +++++
 graphrag-ui/src/pages/setup/GraphDBConfig.tsx | 127 +++++++++++++++++-
 graphrag/app/routers/ui.py                    | 107 +++++++++++++--
 4 files changed, 256 insertions(+), 15 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index f4af23e..8c7bf58 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -14,6 +14,8 @@
 - **One schema extraction at a time per graph.** Concurrent attempts on the same graph are rejected with 409 instead of racing on the shared sample folder.
 - **Document Ingestion dialog reflects server-side state on reopen.** Closing the dialog mid-conversion and reopening it no longer leaves the *Ingest* button incorrectly enabled. The dialog asks the server which operation, if any, currently holds the graph lock, and polls until that operation completes — so the button stays disabled, the uploaded files list re-populates, and the next upload doesn't collide with the prior conversion.
 - **Conflict prompts use the app's styled dialog** instead of the browser default. Choosing *Cancel* now aborts the upload cleanly — the button and status message reset right away.
+- **The vector store recovers without a container restart.** When the initial connection to TigerGraph fails (e.g. cold start, transient network blip), the service used to stay broken until the operator restarted the container — chat connections were rejected silently with WebSocket close 1013. The vector store now retries automatically in the background (10s → 30s → 60s → 120s → 300s backoff), and a new ``POST /ui/admin/retry_embedding_store`` lets superusers force a retry immediately after fixing the underlying issue.
+- **Chat stays available when vector search is unavailable.** The chat WebSocket no longer closes hard with 1013 on vector-store failures. Instead it accepts the connection, surfaces a notice to the client, and lets graph-traversal questions answer normally — only questions that genuinely require a vector lookup fail, and they fail gracefully through the synthesizer.
 
 ### Removed
 - **A configured static `apiToken` no longer overrides per-user credentials.** It is used only for the service's background operations; interactive requests always authenticate as the signed-in user.
diff --git a/common/config.py b/common/config.py
index a18fe4d..170259e 100644
--- a/common/config.py
+++ b/common/config.py
@@ -632,8 +632,43 @@ def reset_embedding_store() -> None:
     threading.Thread(target=_init_embedding_store, daemon=True).start()
 
 
+def _retry_embedding_store_loop():
+    """Daemon-thread target: while the embedding store reports ``error``,
+    re-run its init periodically so a transient TigerGraph outage heals
+    without a container restart. The pause before each retry grows with
+    consecutive failures (10s → 30s → 60s → 120s → 300s cap).
+    """
+    import time
+    backoff = [10, 30, 60, 120, 300]
+    attempt = 0
+    while True:
+        # Hold off until the initial one-shot init has finished, whether
+        # it succeeded or failed; only then does the retry cadence start.
+        _embedding_store_ready.wait()
+        healthy = service_status["embedding_store"]["status"] != "error"
+        if not healthy:
+            time.sleep(backoff[min(attempt, len(backoff) - 1)])
+            attempt += 1
+            healthy = service_status["embedding_store"]["status"] != "error"
+        else:
+            time.sleep(backoff[-1])
+        if healthy:
+            attempt = 0
+            continue
+        logger.info(
+            f"Retrying embedding store init (attempt {attempt}, "
+            f"next backoff {backoff[min(attempt, len(backoff)-1)]}s)…"
+        )
+        _embedding_store_ready.clear()
+        _init_embedding_store()
+        if service_status["embedding_store"]["status"] == "ok":
+            logger.info("Embedding store init recovered.")
+            attempt = 0
+
+
 if os.getenv("INIT_EMBED_STORE", "true") == "true":
     threading.Thread(target=_init_embedding_store, daemon=True).start()
+    threading.Thread(target=_retry_embedding_store_loop, daemon=True).start()
 
 
 def reload_llm_config(new_llm_config: dict = None):
diff --git a/graphrag-ui/src/pages/setup/GraphDBConfig.tsx b/graphrag-ui/src/pages/setup/GraphDBConfig.tsx
index dabf97f..66015f5 100644
--- a/graphrag-ui/src/pages/setup/GraphDBConfig.tsx
+++ b/graphrag-ui/src/pages/setup/GraphDBConfig.tsx
@@ -1,7 +1,8 @@
 import React, { useState, useEffect } from "react";
-import { Server, Save, CheckCircle2 } from "lucide-react";
+import { Server, Save, CheckCircle2, AlertCircle, RefreshCw, Loader2 } from "lucide-react";
 import { Input } from "@/components/ui/input";
 import { Button } from "@/components/ui/button";
+import { safeJson } from "@/utils/safeJson";
 
 const GraphDBConfig = () => {
   // Default values for fields — shown as placeholders, used if user leaves field empty
@@ -41,6 +42,65 @@ const GraphDBConfig = () => {
   const [message, setMessage] = useState("");
   const [messageType, setMessageType] = useState<"success" | "error" | "">("");
 
+  // Vector store status — fetched from /ui/admin/embedding_store_status
+  // on page entry and again after a save, so the operator can see an
+  // outage and force an immediate retry after fixing TigerGraph.
+  const [storeStatus, setStoreStatus] = useState<"ok" | "initializing" | "error" | "unknown">("unknown");
+  const [storeError, setStoreError] = useState<string | null>(null);
+  const [isRetryingStore, setIsRetryingStore] = useState(false);
+  const [retryMessage, setRetryMessage] = useState("");
+
+  const fetchStoreStatus = async () => {
+    try {
+      const creds = sessionStorage.getItem("auth");
+      if (!creds) return;
+      const r = await fetch("/ui/admin/embedding_store_status", {
+        headers: { Authorization: creds },
+      });
+      if (!r.ok) return;
+      const data = await safeJson(r);
+      setStoreStatus(data?.status || "unknown");
+      setStoreError(data?.error || null);
+    } catch {
+      // Ignore — leave previous status visible.
+    }
+  };
+
+  // One-shot status check on page entry — vector-store outages are
+  // rare and the background retry loop self-heals; if the operator
+  // needs to force recovery they click Reconnect Vector Store (shown
+  // only on error).
+  useEffect(() => {
+    fetchStoreStatus();
+  }, []);
+
+  // Force an immediate embedding-store re-init on the backend and mirror
+  // the returned status / error into the indicator and the retry message.
+  const handleRetryEmbeddingStore = async () => {
+    setIsRetryingStore(true);
+    setRetryMessage("");
+    try {
+      const creds = sessionStorage.getItem("auth");
+      if (!creds) throw new Error("Not signed in."); // never send "null" as the header
+      const r = await fetch("/ui/admin/retry_embedding_store", {
+        method: "POST", headers: { Authorization: creds },
+      });
+      // NOTE(review): data is presumably null for non-JSON bodies — hence `?.` (as in fetchStoreStatus).
+      const data = await safeJson(r);
+      if (!r.ok) throw new Error(data?.detail || `Retry failed: ${r.statusText}`);
+      const status = data?.status || "unknown";
+      setStoreStatus(status);
+      setStoreError(data?.error || null);
+      setRetryMessage(
+        status === "ok" ? "✅ Vector store reconnected." : `⚠️ Retry attempted, store still ${status}.`
+      );
+    } catch (err: any) {
+      setRetryMessage(`❌ ${err.message || "Retry failed."}`);
+    } finally {
+      setIsRetryingStore(false);
+    }
+  };
+
   useEffect(() => {
     fetchConfig();
   }, []);
@@ -125,7 +185,15 @@ const GraphDBConfig = () => {
 
       if (response.ok && result.status === "success") {
         setConnectionTested(true);
-        setMessage("Connection successful! You can now save the configuration.");
+        const versionBit = result.tg_version
+          ? ` (TigerGraph ${result.tg_version})`
+          : "";
+        const vectorBit = result.vector_details
+          ? `\nVector Store: ${result.vector_supported ? "✓" : "⚠️"} ${result.vector_details}`
+          : "";
+        setMessage(
+          `Connection successful${versionBit}. You can now save the configuration.${vectorBit}`
+        );
         setMessageType("success");
       } else {
         setMessage(result.message || "Connection test failed");
@@ -204,6 +272,13 @@ const GraphDBConfig = () => {
           // Update originals after successful save (only if no redirect)
           setOriginalHostname(effectiveHostname);
           setOriginalUsername(effectiveUsername);
+          // Reflect the just-triggered embedding-store re-init in the
+          // indicator. Background init typically lands within a few
+          // seconds; re-check at 3s and 8s so the operator sees the real
+          // outcome (ok or error) without navigating away.
+          fetchStoreStatus();
+          setTimeout(fetchStoreStatus, 3000);
+          setTimeout(fetchStoreStatus, 8000);
         }
       } else {
         setMessage(result.detail || "Failed to save configuration");
@@ -459,7 +534,7 @@ const GraphDBConfig = () => {
 
                 {message && (
                   <div
-                    className={`p-4 rounded-lg ${
+                    className={`p-4 rounded-lg whitespace-pre-line ${
                       messageType === "success"
                         ? "bg-green-50 dark:bg-green-900/20 text-green-800 dark:text-green-200"
                         : "bg-red-50 dark:bg-red-900/20 text-red-800 dark:text-red-200"
@@ -493,11 +568,57 @@ const GraphDBConfig = () => {
                       Enter password or API token to test connection
                     </p>
                   )}
+
+                  <div className="ml-auto flex items-center gap-2">
+                    {storeStatus === "error" ? (
+                      <Button
+                        onClick={handleRetryEmbeddingStore}
+                        disabled={isRetryingStore}
+                        variant="outline"
+                        className="dark:border-[#3D3D3D] text-red-700 dark:text-red-300 border-red-300 dark:border-red-900"
+                      >
+                        {isRetryingStore ? (
+                          <Loader2 className="h-4 w-4 mr-2 animate-spin" />
+                        ) : (
+                          <RefreshCw className="h-4 w-4 mr-2" />
+                        )}
+                        {isRetryingStore ? "Reconnecting…" : "Reconnect Vector Store"}
+                      </Button>
+                    ) : (
+                      <span
+                        className="text-sm text-gray-700 dark:text-gray-300 inline-flex items-center gap-1.5"
+                        title={
+                          storeStatus === "ok"
+                            ? "Vector store connected"
+                            : storeStatus === "initializing"
+                            ? "Vector store initializing"
+                            : "Vector store status unavailable"
+                        }
+                      >
+                        Vector Store
+                        {storeStatus === "ok" && (
+                          <CheckCircle2 className="h-4 w-4 text-green-600 dark:text-green-400" />
+                        )}
+                        {storeStatus === "initializing" && (
+                          <Loader2 className="h-4 w-4 text-blue-600 dark:text-blue-400 animate-spin" />
+                        )}
+                        {storeStatus === "unknown" && (
+                          <AlertCircle className="h-4 w-4 text-gray-400" />
+                        )}
+                      </span>
+                    )}
+                  </div>
                 </div>
               </div>
             </div>
             </div>
           </fieldset>
+
+          {storeStatus === "error" && (storeError || retryMessage) && (
+            <div className="mt-4 px-4 py-2 rounded-lg bg-red-50 dark:bg-red-900/20 text-red-700 dark:text-red-300 text-sm break-words">
+              {retryMessage || storeError}
+            </div>
+          )}
         </div>
       </div>
     </div>
diff --git a/graphrag/app/routers/ui.py b/graphrag/app/routers/ui.py
index 1551cfa..ab9c5f0 100644
--- a/graphrag/app/routers/ui.py
+++ b/graphrag/app/routers/ui.py
@@ -661,6 +661,37 @@ def get_version():
     }
 
 
+@router.get(f"{route_prefix}/admin/embedding_store_status")
+def embedding_store_status(
+    creds: Annotated[tuple[list[str], HTTPBasicCredentials], Depends(ui_basic_auth)],
+):
+    """Return the current vector-store status without re-running init.
+    Used by the Graph Database Config page to poll status; only routed
+    through nginx's ``/ui/`` path so the UI can reach it.
+    """
+    _require_roles(creds[1], {"superuser", "globaldesigner"})
+    return service_status["embedding_store"]
+
+
+@router.post(f"{route_prefix}/admin/retry_embedding_store")
+def retry_embedding_store_now(
+    creds: Annotated[tuple[list[str], HTTPBasicCredentials], Depends(ui_basic_auth)],
+):
+    """Re-run the embedding-store init right now. Use after fixing the
+    underlying issue (e.g. TigerGraph just came back up) instead of
+    waiting for the background retry loop to wake.
+
+    Restricted to superuser / globaldesigner — the call holds the
+    request thread while the init runs (typically <1s when TG is
+    reachable, longer if it isn't).
+    """
+    _require_roles(creds[1], {"superuser", "globaldesigner"})
+    from common.config import _init_embedding_store, _embedding_store_ready
+    _embedding_store_ready.clear()
+    _init_embedding_store()
+    return service_status["embedding_store"]
+
+
 @router.get(f"{route_prefix}/list_graphs")
 def list_graphs(auth: Annotated[list[str], Depends(ui_basic_auth)]):
     """Return the live list of graphs the authenticated user has access
@@ -2374,21 +2405,29 @@ async def chat(
     # Embedding store unavailable: WebSocket routes can't return an
     # HTTPException — ASGI requires the handshake to be sent (or the
     # connection explicitly closed) before the callable returns.
-    # Accept, surface the error to the client, then close with a
-    # well-defined status code (1013 = Try Again Later).
-    if service_status["embedding_store"]["error"]:
+    await websocket.accept()
+
+    # If the embedding store is currently unavailable, advise the
+    # client up-front. The chat still proceeds: agent paths that rely
+    # on graph traversal (generate_function / generate_cypher /
+    # entity-relationship retrieval) work without vector search, and
+    # the auto-mode selector skips vector retrievers downstream. Only
+    # questions that genuinely require a vector lookup return a
+    # graceful per-question error through the synthesizer.
+    if service_status["embedding_store"]["status"] != "ok":
         try:
-            await websocket.accept()
             await websocket.send_json({
+                "notice": "vector_search_unavailable",
+                "status": service_status["embedding_store"]["status"],
                 "error": service_status["embedding_store"]["error"],
-                "code": "embedding_store_unavailable",
+                "message": (
+                    "Vector search is currently unavailable; graph "
+                    "traversal questions still work and the service "
+                    "will recover automatically."
+                ),
             })
-            await websocket.close(code=1013, reason="Embedding store unavailable")
         except Exception:
             pass
-        return
-
-    await websocket.accept()
 
     # AUTH with proper error handling and timeout
     try:
@@ -3763,6 +3802,11 @@ async def test_db_connection(
 ):
     """
     Test database connection with provided credentials from UI.
+
+    Also probes vector-search capability (TigerGraph version and whether
+    the ``gds.vector`` package is installed) so the operator knows
+    upfront whether saving this configuration will yield a working
+    vector store, not just a reachable database.
     """
     try:
         _require_roles(credentials, {"superuser"})
@@ -3783,12 +3827,51 @@ async def test_db_connection(
         # listGraphs() exercises the credentials; pyTigerGraph mints a
         # REST++ token on demand if the instance requires one.
         test_conn.listGraphs()
-        
+
+        # Vector capability probe — separate from the auth/reachability
+        # check so version / GDS results report independently.
+        # Hard requirement is TG version >= 4.2; the GDS package is
+        # installed automatically by the embedding-store init on first
+        # use if missing, so its absence is informational, not a
+        # failure.
+        tg_version = ""
+        vector_supported = False
+        vector_details = ""
+        try:
+            tg_version = str(test_conn.getVer())
+            ver_parts = tg_version.split(".")
+            major = int(ver_parts[0]) if ver_parts and ver_parts[0].isdigit() else 0
+            minor = int(ver_parts[1]) if len(ver_parts) > 1 and ver_parts[1].isdigit() else 0
+            if major < 4 or (major == 4 and minor < 2):
+                vector_supported = False
+                vector_details = (
+                    f"TigerGraph {tg_version} does not support vector search "
+                    "(4.2 or later required)."
+                )
+            else:
+                vector_supported = True
+                try:
+                    sub_packages = test_conn.gsql("SHOW PACKAGE gds")
+                except Exception:
+                    sub_packages = ""
+                if "- vector" in str(sub_packages):
+                    vector_details = "GDS installed."
+                else:
+                    vector_details = (
+                        "GDS will be installed automatically on first init "
+                        "(may take a few minutes)."
+                    )
+        except Exception as vec_err:
+            vector_details = f"Vector capability probe failed: {vec_err}"
+
         return {
             "status": "success",
-            "message": "Connection successful"
+            "message": "Connection successful",
+            "tg_version": tg_version,
+            "vector_supported": vector_supported,
+            "vector_details": vector_details,
         }
-        
+
     except HTTPException:
         raise
     except Exception as e:

From f60d76a68386aedb003799fc0c068fad7ecf0079 Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Wed, 3 Jun 2026 11:48:18 -0700
Subject: [PATCH 07/18] Pre-install per-graph vector utility queries at graph
 init

Triggers TigerGraphEmbeddingStore.__init__'s install_vector_queries() at the end of init_supportai by building the per-graph store there, so the first chat question doesn't pay the install cost. The store wrapper's existing idempotent check stays as the safety net for graphs created outside the init path.

Refs: GML-2099
---
 graphrag/app/supportai/supportai.py | 20 ++++++++++++++++++++
 1 file changed, 20 insertions(+)

diff --git a/graphrag/app/supportai/supportai.py b/graphrag/app/supportai/supportai.py
index f38eba9..df09942 100644
--- a/graphrag/app/supportai/supportai.py
+++ b/graphrag/app/supportai/supportai.py
@@ -142,6 +142,26 @@ def init_supportai(conn: TigerGraphConnection, graphname: str) -> tuple[dict, di
     )
     logger.info(f"Done installing supportai query all with status {query_res}")
 
+    # Pre-install the per-graph utility vector queries (get_topk_similar,
+    # get_topk_closest, etc.) so the first chat request doesn't pay the
+    # install cost. ``TigerGraphEmbeddingStore.__init__`` runs the
+    # install when bound to a graph whose schema has ``Dimension=``;
+    # the embedding-store wrapper itself is idempotent and the install
+    # is a no-op when the queries already exist.
+    try:
+        from common.config import get_embedding_store
+        get_embedding_store(graphname)
+        logger.info(
+            f"Per-graph vector utility queries ready for {graphname}"
+        )
+    except Exception as exc:
+        # Non-fatal — the chat path will install them on first use as
+        # before; just log so the operator sees the slip.
+        logger.warning(
+            f"Could not pre-install vector utility queries for "
+            f"{graphname}: {exc}"
+        )
+
     return schema_res, index_res, query_res
 
 

From 0eb6a88771160906a07b0443bdfc3ff2159ee7a8 Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Wed, 3 Jun 2026 10:50:44 -0700
Subject: [PATCH 08/18] Bump VERSION to 1.4.1

Refs: GML-2093
---
 VERSION | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/VERSION b/VERSION
index 88c5fb8..347f583 100644
--- a/VERSION
+++ b/VERSION
@@ -1 +1 @@
-1.4.0
+1.4.1

From 7476b7fff4aaff0a18753d9cf9132c9618f8f080 Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Wed, 3 Jun 2026 14:26:40 -0700
Subject: [PATCH 09/18] Pin pyTigerGraph to 2.0.4+

Earlier 2.0.x patches handed back an empty REST++ token from the auth helper on TigerGraph 4.2 instances, breaking embedding-store init in graphrag-ecc whenever its image was built before 2026-05-19. The 2.0.4 release restored correct token issuance.

Refs: GML-2093
---
 common/requirements.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/common/requirements.txt b/common/requirements.txt
index f4d5ac6..a52f992 100644
--- a/common/requirements.txt
+++ b/common/requirements.txt
@@ -140,7 +140,7 @@ python-multipart==0.0.20
 python-iso639==2025.2.18
 python-magic==0.4.27
 pyTigerDriver==1.0.15
-pyTigerGraph>=2.0.3
+pyTigerGraph>=2.0.4
 pytz==2025.2
 PyYAML==6.0.2
 rapidfuzz==3.13.0

From 9453d9e0c292f9668a95d9bbc32119dac145af62 Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Wed, 3 Jun 2026 17:07:19 -0700
Subject: [PATCH 10/18] Keep the query_guidance partial out of the editable
 query_generation prompt

The runtime supplies {query_guidance} as a partial; the operator who edits the query_generation prompt in the UI must not be able to delete or rename it. The split marker now matches the {query_guidance} line so the placeholder lands in the template-variables block alongside {vertices}, {format_instructions}, and the rest.

Refs: GML-2093
---
 graphrag/app/routers/ui.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/graphrag/app/routers/ui.py b/graphrag/app/routers/ui.py
index ab9c5f0..6073dfb 100644
--- a/graphrag/app/routers/ui.py
+++ b/graphrag/app/routers/ui.py
@@ -4029,6 +4029,10 @@ async def save_graphrag_config(
         r'(?ms)^#######\s*-Data-.*$',
     ],
     "query_generation": [
+        # ``{query_guidance}`` is a runtime-supplied partial — the user
+        # must not be able to delete it from the editable body, so the
+        # template-variables block starts at that placeholder line.
+        r'(?m)^\{query_guidance\}\s*$',
         r'(?ms)^##\s*Inputs\b.*$',
         r'(?ms)^\{format_instructions\}.*$',
     ],

From bde609df841f1098aac01f083c8fd1f26dfe85d3 Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Wed, 3 Jun 2026 20:23:56 -0700
Subject: [PATCH 11/18] Speed up and tune image description on PDF ingestion

- Run more image-description requests in parallel during PDF ingestion, and raise the AWS Bedrock connection-pool default so concurrent multimodal and embedding calls do not back up
- Skip and exclude images below a configurable minimum size, as well as any image the multimodal model flags as decorative, so the graph stays free of useless Image vertices
- Add per-graph and global toggles on the GraphRAG Configuration page to turn image description on/off and adjust the minimum image size
- Ask the multimodal model to describe each image in the document's own language so the alt-text matches the surrounding chunk for retrieval

Refs: GML-2097
---
 CHANGELOG.md                                  |  2 +
 README.md                                     | 14 +++++
 common/embeddings/embedding_services.py       |  2 +-
 common/llm_services/aws_bedrock_service.py    |  2 +-
 common/utils/image_data_extractor.py          | 63 +++++++++++++++++--
 common/utils/text_extractors.py               | 58 +++++++++++++++--
 .../src/pages/setup/GraphRAGConfig.tsx        | 46 +++++++++++++-
 7 files changed, 173 insertions(+), 14 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 8c7bf58..a42d941 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -16,6 +16,8 @@
 - **Conflict prompts use the app's styled dialog** instead of the browser default. Choosing *Cancel* now aborts the upload cleanly — the button and status message reset right away.
 - **The vector store recovers without a container restart.** When the initial connection to TigerGraph fails (e.g. cold start, transient network blip), the service used to stay broken until the operator restarted the container — chat connections were rejected silently with WebSocket close 1013. The vector store now retries automatically in the background (10s → 30s → 60s → 120s → 300s backoff), and a new ``POST /ui/admin/retry_embedding_store`` lets superusers force a retry immediately after fixing the underlying issue.
 - **Chat stays available when vector search is unavailable.** The chat WebSocket no longer closes hard with 1013 on vector-store failures. Instead it accepts the connection, surfaces a notice to the client, and lets graph-traversal questions answer normally — only questions that genuinely require a vector lookup fail, and they fail gracefully through the synthesizer.
+- **PDF ingestion is faster on image-heavy documents.** Image-description workers now run with a larger parallel pool, and tiny decorative images skip the multimodal LLM entirely. On AWS Bedrock deployments the connection pool default is also raised so concurrent describe calls no longer queue behind a 20-connection cap.
+- **Image description is tunable per graph or globally.** Two new `graphrag_config` keys — `extract_images` and `min_image_dim_px` — control whether the multimodal LLM is invoked on extracted images and the smallest image dimension that goes to the LLM (smaller images skip the call). Both are editable from the *GraphRAG Configuration* page in the UI, globally or per graph. Disabling does not alter the Image vertex type or loading job, so re-enabling later requires no schema change. The multimodal describe pass now reuses `default_concurrency` instead of a separate knob, so one setting tunes parallelism across the pipeline.
 
 ### Removed
 - **A configured static `apiToken` no longer overrides per-user credentials.** It is used only for the service's background operations; interactive requests always authenticate as the signed-in user.
diff --git a/README.md b/README.md
index c6854a4..739c699 100644
--- a/README.md
+++ b/README.md
@@ -498,6 +498,8 @@ Copy the below code into `configs/server_config.json`. You shouldn’t need to c
 | `doc_process_switch` | bool | `true` | Enable/disable document processing during knowledge graph build. |
 | `entity_extraction_switch` | bool | same as `doc_process_switch` | Enable/disable entity extraction during knowledge graph build. |
 | `community_detection_switch` | bool | same as `entity_extraction_switch` | Enable/disable community detection during knowledge graph build. |
+| `extract_images` | bool | `true` | Run the multimodal LLM on images extracted from documents to generate alt-text. Set to `false` to skip the image-description pass entirely — much faster, at the cost of losing image content from retrieval. Configurable per graph. |
+| `min_image_dim_px` | int | `100` | Smallest side (in px) an image must have to be sent to the multimodal LLM. Smaller images are tagged "decorative image" without an LLM call. Configurable per graph. |
 | `load_batch_size` | int | `500` | Batch size for document loading. |
 | `upsert_delay` | int | `0` | Delay in seconds between loading batches. |
 | `default_concurrency` | int | `10` | Base concurrency level for parallel processing. Configurable per graph. |
@@ -771,12 +773,19 @@ In addition to the `AZURE_OPENAI_ENDPOINT`, `AZURE_OPENAI_API_KEY`, and `azure_d
             "model_kwargs": {
                 "temperature": 0,
             },
+            "boto3_config": {
+                "max_pool_connections": 50,
+                "read_timeout": 300,
+                "retries": 5
+            },
             "prompt_path": "./common/prompts/aws_bedrock_claude3haiku/"
         }
     }
 }
 ```
 
+`boto3_config` is optional (the defaults shown above are also the built-in defaults). Raise `max_pool_connections` if `default_concurrency` in `graphrag_config` is set above `50`. The same block can be set on `embedding_service` when using Bedrock embeddings.
+
 #### Ollama
 
 ```json
@@ -983,6 +992,11 @@ When customizing:
 - **`reuse_embedding: true`** skips re-embedding identical text — major saving on re-ingest of unchanged documents.
 - **Choose `llm_model` thoughtfully** — entity / relationship extraction tolerates cheaper / faster models (Haiku, Nova-lite, Flash); response synthesis benefits from stronger ones (Sonnet, GPT-4-class). The `multimodal_service` is independent — set it to a vision-capable model only when you actually ingest images.
 - **`load_batch_size`** and **`upsert_delay`** control ingestion pressure on TigerGraph. Defaults are fine for most loads; lower the batch size if you see write timeouts.
+- **Image-description speed.** On image-heavy documents, every image is sent to the multimodal LLM, which dominates ingest time. Tune via `graphrag_config` (global or per graph) — both knobs are also editable from the *GraphRAG Configuration* page in the UI:
+    - `extract_images` (default `true`) — set to `false` to skip image description entirely.
+    - `min_image_dim_px` (default `100`) — smaller images are tagged "decorative image" without an LLM call.
+    - The multimodal describe pass sizes its per-PDF worker pool from `default_concurrency` — raise it to parallelize more describe calls; lower it if the multimodal provider's rate limit is hit.
+    - AWS Bedrock users can further tune connection pool sizing via `boto3_config` in `llm_config`.
 
 ### 7. A working tuning loop
 
diff --git a/common/embeddings/embedding_services.py b/common/embeddings/embedding_services.py
index 6f170d0..e032c54 100644
--- a/common/embeddings/embedding_services.py
+++ b/common/embeddings/embedding_services.py
@@ -209,7 +209,7 @@ def __init__(self, config):
 
         boto3_config = config.get("boto3_config", {})
         client_config = botocore.config.Config(
-            max_pool_connections=boto3_config.get("max_pool_connections", 20),
+            max_pool_connections=boto3_config.get("max_pool_connections", 50),
             read_timeout=boto3_config.get("read_timeout", 300),
             retries={"max_attempts": boto3_config.get("retries", 5)},
         )
diff --git a/common/llm_services/aws_bedrock_service.py b/common/llm_services/aws_bedrock_service.py
index ce6056c..4e6096f 100644
--- a/common/llm_services/aws_bedrock_service.py
+++ b/common/llm_services/aws_bedrock_service.py
@@ -93,7 +93,7 @@ def __init__(self, config):
 
         boto3_config = config.get("boto3_config", {})
         client_config = botocore.config.Config(
-            max_pool_connections=boto3_config.get("max_pool_connections", 20),
+            max_pool_connections=boto3_config.get("max_pool_connections", 50),
             read_timeout=boto3_config.get("read_timeout", 300),
             retries={"max_attempts": boto3_config.get("retries", 5)},
         )
diff --git a/common/utils/image_data_extractor.py b/common/utils/image_data_extractor.py
index 575264a..5ffd189 100644
--- a/common/utils/image_data_extractor.py
+++ b/common/utils/image_data_extractor.py
@@ -1,6 +1,7 @@
 import base64
 import io
 import logging
+import os
 from langchain_core.messages import HumanMessage, SystemMessage
 from common.config import get_llm_service, get_multimodal_config
 
@@ -9,6 +10,54 @@
 _multimodal_client = None
 _multimodal_provider = None
 
+
+def _graphrag_cfg(graphname=None) -> dict:
+    try:
+        from common.config import get_graphrag_config
+        return get_graphrag_config(graphname) or {}
+    except Exception:
+        return {}
+
+
+def should_extract_images(graphname=None) -> bool:
+    """Whether to run the multimodal LLM on extracted images. Resolved from
+    per-graph or global ``graphrag_config.extract_images``; defaults to True."""
+    cfg = _graphrag_cfg(graphname)
+    if "extract_images" in cfg:
+        return bool(cfg["extract_images"])
+    return True
+
+
+def min_image_dim_px(graphname=None) -> int:
+    """Smallest side (in px) an image must have to be sent to the LLM.
+    Resolved from per-graph or global ``graphrag_config.min_image_dim_px``;
+    defaults to 100."""
+    cfg = _graphrag_cfg(graphname)
+    try:
+        return int(cfg.get("min_image_dim_px", 100))
+    except (TypeError, ValueError):
+        return 100
+
+
+def image_describe_workers(graphname=None) -> int:
+    """Per-PDF thread-pool size for the multimodal describe pass.
+    Reuses ``graphrag_config.default_concurrency`` (defaults to 10) so
+    deployments only tune one concurrency knob."""
+    cfg = _graphrag_cfg(graphname)
+    try:
+        return max(1, int(cfg.get("default_concurrency", 10)))
+    except (TypeError, ValueError):
+        return 10
+
+
+def is_decorative(description: str) -> bool:
+    """Return True when the multimodal LLM replied with the bare
+    "decorative image" sentinel. Case, surrounding whitespace, wrapping
+    quotes / backticks / asterisks and ``.`` / ``!`` are all ignored."""
+    if not description:
+        return False
+    return description.strip(" \t\r\n\"'`*.!“”‘’").lower() == "decorative image"
+
 def _get_client():
     global _multimodal_client, _multimodal_provider
     if _multimodal_client is None and get_multimodal_config():
@@ -38,7 +87,6 @@ def describe_image_with_llm(file_path):
     """
     try:
         from PIL import Image as PILImage
-        import os
         import time
 
         client = _get_client()
@@ -72,10 +120,15 @@ def describe_image_with_llm(file_path):
                             "or branding mark, identified by name. Do NOT describe "
                             "layout, background color, decorative styling, slide "
                             "templates, or generic visual impressions — those add "
-                            "no retrieval value. If the image is purely decorative "
-                            "(no text, no data, no diagram), reply with just "
-                            "\"decorative image\" and nothing else. Respond as a "
-                            "SINGLE plain-text paragraph — no markdown headings, no "
+                            "no retrieval value. Write the description in the same "
+                            "language as the text inside the image; if the image "
+                            "has no text, infer the document's language from any "
+                            "visible labels, captions, or branding and match that. "
+                            "Default to English only if no language signal is "
+                            "present. If the image is purely decorative (no text, "
+                            "no data, no diagram), reply with just \"decorative "
+                            "image\" and nothing else. Respond as a SINGLE "
+                            "plain-text paragraph — no markdown headings, no "
                             "bullet lists, no blank lines. The reply is used "
                             "verbatim as the alt-text inside `![alt](url)`."
                         ),
diff --git a/common/utils/text_extractors.py b/common/utils/text_extractors.py
index aeb6031..cee0419 100644
--- a/common/utils/text_extractors.py
+++ b/common/utils/text_extractors.py
@@ -453,7 +453,15 @@ def _extract_pdf_with_images_as_docs(file_path, base_doc_id, graphname=None):
     try:
         import pymupdf4llm
         from PIL import Image as PILImage
-        from common.utils.image_data_extractor import describe_image_with_llm
+        from common.utils.image_data_extractor import (
+            describe_image_with_llm,
+            image_describe_workers,
+            is_decorative,
+            min_image_dim_px,
+            should_extract_images,
+        )
+
+        _is_decorative = is_decorative
 
         # Ensure clean slate - remove folder if it exists from failed previous run
         if image_output_folder.exists():
@@ -537,19 +545,30 @@ def _extract_pdf_with_images_as_docs(file_path, base_doc_id, graphname=None):
         # mutate the same shared string and must run in deterministic
         # order. Concurrency cap is intentionally small to stay below
         # Bedrock's per-account throttle.
-        image_workers = int(os.environ.get("PDF_IMAGE_CONCURRENCY", "8"))
+        image_workers = image_describe_workers(graphname)
+        extract_images_enabled = should_extract_images(graphname)
+        min_dim = min_image_dim_px(graphname)
 
         def _describe_and_encode(img_ref: dict) -> dict:
             """Run on a worker thread. Returns one of:
               * ``{"ok": True, "img_ref", "description", "image_base64",
                   "width", "height"}``
+              * ``{"ok": True, "img_ref", "skip": True}`` for decorative
+                or too-small images that should be dropped from the JSONL
               * ``{"ok": False, "img_ref", "error"}``
             Never raises.
             """
             try:
                 img_path = Path(img_ref["path"])
-                description = describe_image_with_llm(str(img_path))
                 pil_image = PILImage.open(img_path)
+                too_small = (
+                    pil_image.width < min_dim or pil_image.height < min_dim
+                )
+                if not extract_images_enabled or too_small:
+                    return {"ok": True, "skip": True, "img_ref": img_ref}
+                description = describe_image_with_llm(str(img_path))
+                if _is_decorative(description):
+                    return {"ok": True, "skip": True, "img_ref": img_ref}
                 if pil_image.mode != "RGB":
                     pil_image = pil_image.convert("RGB")
                 buffer = io.BytesIO()
@@ -595,6 +614,16 @@ def _describe_and_encode(img_ref: dict) -> dict:
                     )
                 continue
 
+            if d.get("skip"):
+                skipped_path = img_ref.get("path", "")
+                if skipped_path:
+                    markdown_content = re.sub(
+                        r'!\[.*?\]\(' + re.escape(skipped_path) + r'\)',
+                        "",
+                        markdown_content,
+                    )
+                continue
+
             image_id = img_ref["image_id"]
             markdown_content = insert_description_by_id(
                 markdown_content, image_id, d["description"]
@@ -660,12 +689,29 @@ def _extract_standalone_image_as_doc(file_path, base_doc_id, graphname=None):
     """
     try:
         from PIL import Image as PILImage
-        from common.utils.image_data_extractor import describe_image_with_llm
+        from common.utils.image_data_extractor import (
+            describe_image_with_llm,
+            is_decorative,
+            min_image_dim_px,
+            should_extract_images,
+        )
 
         pil_image = PILImage.open(file_path)
-        if pil_image.width < 100 or pil_image.height < 100:
-            pass
+        min_dim = min_image_dim_px(graphname)
+        if not should_extract_images(graphname) or (
+            pil_image.width < min_dim or pil_image.height < min_dim
+        ):
+            logger.info(
+                f"Skipping standalone image {file_path}: decorative or below "
+                f"min dimension ({min_dim}px)"
+            )
+            return []
         description = describe_image_with_llm(str(Path(file_path).absolute()))
+        if is_decorative(description):
+            logger.info(
+                f"Skipping standalone image {file_path}: LLM marked as decorative"
+            )
+            return []
         buffer = io.BytesIO()
         if pil_image.mode != 'RGB':
             pil_image = pil_image.convert('RGB')
diff --git a/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx b/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx
index 2e439ca..aa24821 100644
--- a/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx
+++ b/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx
@@ -39,6 +39,8 @@ const GraphRAGConfig = () => {
   const [loadBatchSize, setLoadBatchSize] = useState("500");
   const [upsertDelay, setUpsertDelay] = useState("0");
   const [maxConcurrency, setMaxConcurrency] = useState("10");
+  const [extractImages, setExtractImages] = useState(true);
+  const [minImageDimPx, setMinImageDimPx] = useState("100");
 
   // Schema-aware initialization (Phase 1 sample-doc path)
   const [schemaMaxSampleFiles, setSchemaMaxSampleFiles] = useState("5");
@@ -91,6 +93,8 @@ const GraphRAGConfig = () => {
     setLoadBatchSize(String(graphragConfig.load_batch_size ?? 500));
     setUpsertDelay(String(graphragConfig.upsert_delay ?? 0));
     setMaxConcurrency(String(graphragConfig.default_concurrency ?? 10));
+    setExtractImages(graphragConfig.extract_images ?? true);
+    setMinImageDimPx(String(graphragConfig.min_image_dim_px ?? 100));
     setSchemaMaxSampleFiles(String(graphragConfig.schema_max_sample_files ?? 5));
     setSchemaMaxTotalMb(String(graphragConfig.schema_max_total_mb ?? 50));
     setStrictMode(graphragConfig.strict_mode ?? false);
@@ -215,6 +219,8 @@ const GraphRAGConfig = () => {
         load_batch_size: parseInt(loadBatchSize),
         upsert_delay: parseInt(upsertDelay),
         default_concurrency: parseInt(maxConcurrency),
+        extract_images: extractImages,
+        min_image_dim_px: parseInt(minImageDimPx),
         schema_max_sample_files: parseInt(schemaMaxSampleFiles),
         schema_max_total_mb: parseInt(schemaMaxTotalMb),
         strict_mode: strictMode,
@@ -242,6 +248,8 @@ const GraphRAGConfig = () => {
         load_batch_size: 500,
         upsert_delay: 0,
         default_concurrency: 10,
+        extract_images: true,
+        min_image_dim_px: 100,
         schema_max_sample_files: 5,
         schema_max_total_mb: 50,
         strict_mode: false,
@@ -789,10 +797,46 @@ const GraphRAGConfig = () => {
                       onChange={(e) => setMaxConcurrency(e.target.value)}
                     />
                     <p className="text-xs text-gray-500 dark:text-gray-400 mt-1">
-                      Max concurrent workers for graph queries, LLM, and embedding calls
+                      Maximum LLM, embedding, and graph database requests running at the same time.
                     </p>
                   </div>
                 </div>
+
+                <div className="mt-6">
+                  <div className="flex items-center space-x-2">
+                    <input
+                      type="checkbox"
+                      id="extractImages"
+                      className="rounded border-gray-300 dark:border-[#3D3D3D]"
+                      checked={extractImages}
+                      onChange={(e) => setExtractImages(e.target.checked)}
+                    />
+                    <label htmlFor="extractImages" className="text-sm font-medium text-black dark:text-white">
+                      Generate image descriptions during PDF ingestion
+                    </label>
+                  </div>
+                  <p className="text-xs text-gray-600 dark:text-[#D9D9D9] mt-1 ml-6">
+                    Sends each extracted image to the multimodal LLM for alt-text. Disable to skip image content entirely.
+                  </p>
+                </div>
+
+                <div className="mt-4 max-w-sm">
+                  <label className="block text-sm font-medium mb-2 text-black dark:text-white">
+                    Min Image Dimension
+                  </label>
+                  <Input
+                    type="number"
+                    min="0"
+                    className="dark:border-[#3D3D3D] dark:bg-background"
+                    placeholder="100"
+                    value={minImageDimPx}
+                    onChange={(e) => setMinImageDimPx(e.target.value)}
+                    disabled={!extractImages}
+                  />
+                  <p className="text-xs text-gray-500 dark:text-gray-400 mt-1">
+                    Smallest side (in px) an image must have to be described.
+                  </p>
+                </div>
               </div>
             )}
           </div>

From 3f9fa40bf3a963f5db7d417f86701e316129a547 Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Thu, 4 Jun 2026 09:58:29 -0700
Subject: [PATCH 12/18] Fall back to hybrid search when community search misses
 or fails

- Auto-selected community search now retries once with hybrid search when it returns no community summaries or the retriever raises, instead of short-circuiting to "couldn't find"
- Manual community search remains unchanged so user picks are not second-guessed

Refs: GML-2098
---
 CHANGELOG.md                           |  1 +
 graphrag/app/agent/agent_graph.py      | 64 +++++++++++++++++++-------
 graphrag/app/agent/method_selector.py  | 46 +++++++++---------
 graphrag/tests/test_method_selector.py | 19 ++++----
 4 files changed, 83 insertions(+), 47 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index a42d941..a50cf0b 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -18,6 +18,7 @@
 - **Chat stays available when vector search is unavailable.** The chat WebSocket no longer closes hard with 1013 on vector-store failures. Instead it accepts the connection, surfaces a notice to the client, and lets graph-traversal questions answer normally — only questions that genuinely require a vector lookup fail, and they fail gracefully through the synthesizer.
 - **PDF ingestion is faster on image-heavy documents.** Image-description workers now run with a larger parallel pool, and tiny decorative images skip the multimodal LLM entirely. On AWS Bedrock deployments the connection pool default is also raised so concurrent describe calls no longer queue behind a 20-connection cap.
 - **Image description is tunable per graph or globally.** Two new `graphrag_config` keys — `extract_images` and `min_image_dim_px` — control whether the multimodal LLM is invoked on extracted images and the smallest image dimension that goes to the LLM (smaller images skip the call). Both are editable from the *GraphRAG Configuration* page in the UI, globally or per graph. Disabling does not alter the Image vertex type or loading job, so re-enabling later requires no schema change. The multimodal describe pass now reuses `default_concurrency` instead of a separate knob, so one setting tunes parallelism across the pipeline.
+- **Community search falls back to hybrid search when it returns nothing or fails.** Auto-selected community queries that miss (no relevant community summaries) or hit a retriever error are now retried once with hybrid graph-hop search before returning a "couldn't find" answer. Manually-picked community search is unchanged.
 
 ### Removed
 - **A configured static `apiToken` no longer overrides per-user credentials.** It is used only for the service's background operations; interactive requests always authenticate as the signed-in user.
diff --git a/graphrag/app/agent/agent_graph.py b/graphrag/app/agent/agent_graph.py
index 921fa8e..1c2925e 100644
--- a/graphrag/app/agent/agent_graph.py
+++ b/graphrag/app/agent/agent_graph.py
@@ -561,11 +561,12 @@ def supportai_search(self, state):
            auto-selection regardless of configuration — manual users still get
            the best vector method when the structured-data path has exhausted
            its retries.
-        2. **In-lane fallback.** After the first chunk-based retriever runs, if
-           it returned fewer than `top_k` chunks (signal: insufficient context),
-           runs a second method per `INLANE_FALLBACK_TABLE` and uses its context
-           for downstream generation. Single retry only; skipped for manual
-           mode and community search.
+        2. **In-lane fallback.** After the first retriever runs, if it returned
+           insufficient context or raised an exception, runs a second method
+           per `INLANE_FALLBACK_TABLE` and uses its context for downstream
+           generation. Single retry only; skipped for manual mode. Insufficient
+           is defined per method: chunk-based methods need at least `top_k`
+           chunks; community needs at least one community summary.
         3. **Out-of-corpus short-circuit.** If after all retrieval attempts the
            result is still empty, marks the context so `generate_answer`
            returns an honest "couldn't find" message instead of letting the
@@ -604,37 +605,68 @@ def supportai_search(self, state):
         state["chosen_retriever_source"] = chosen_source
         self._record_selection_metric(method, chosen_source)
 
-        # First retrieval attempt
-        result_state = self._dispatch_retriever(method, state)
+        # First retrieval attempt. Catch exceptions so a transient retriever
+        # failure becomes an in-lane fallback rather than a 500 — the user
+        # gets the same outcome as "returned empty," and any method with an
+        # entry in INLANE_FALLBACK_TABLE is eligible.
+        retriever_error: Optional[Exception] = None
+        try:
+            result_state = self._dispatch_retriever(method, state)
+        except Exception as exc:  # noqa: BLE001
+            retriever_error = exc
+            logger.warning(
+                f"Retriever {method} raised: {exc}; "
+                "treating as empty result for fallback consideration"
+            )
+            result_state = dict(state)
+            result_state["context"] = {
+                "function_call": None,
+                "result": {"final_retrieval": {}},
+            }
+            result_state["lookup_source"] = "supportai"
 
-        # In-lane fallback (Feature 2) — chunk-based methods only, single retry,
-        # skipped for manual users so we don't second-guess their pick.
+        # In-lane fallback — a single retry through INLANE_FALLBACK_TABLE.
+        # Skipped for manual users so we don't second-guess their pick.
         ctx = result_state.get("context") if isinstance(result_state.get("context"), dict) else {}
         result = ctx.get("result") if isinstance(ctx.get("result"), dict) else {}
         final_retrieval = result.get("final_retrieval") if isinstance(result, dict) else None
         top_k = self._graphrag_cfg.get("top_k", 5)
         can_inlane_fallback = (
             chosen_source != "manual"
-            and method in CHUNK_BASED_METHODS
+            and method in INLANE_FALLBACK_TABLE
             and not result_state.get("inlane_fallback_attempted")
-            and has_insufficient_context(final_retrieval, method, top_k)
+            and (retriever_error is not None
+                 or has_insufficient_context(final_retrieval, method, top_k))
         )
         if can_inlane_fallback:
             fallback_method = INLANE_FALLBACK_TABLE.get(method)
             if fallback_method:
                 label_old = self._METHOD_DISPLAY_NAMES.get(method, method)
                 label_new = self._METHOD_DISPLAY_NAMES.get(fallback_method, fallback_method)
-                self.emit_progress(
-                    f"Insufficient context from {label_old} search, trying {label_new} search"
-                )
+                if retriever_error is not None:
+                    fallback_reason = f"fallback from {label_old} (search failed)"
+                    progress = (
+                        f"{label_old} search did not complete, trying {label_new} search"
+                    )
+                else:
+                    fallback_reason = (
+                        f"fallback from {label_old} (returned insufficient context)"
+                    )
+                    progress = (
+                        f"Insufficient context from {label_old} search, trying {label_new} search"
+                    )
+                self.emit_progress(progress)
                 result_state["inlane_fallback_attempted"] = True
                 result_state["inlane_fallback_from"] = method
-                # Update the active method/source for the second pass.
                 method = fallback_method
                 chosen_source = "inlane_fallback"
-                chosen_reason = f"fallback from {label_old} (returned fewer than top_k chunks)"
+                chosen_reason = fallback_reason
                 self._record_selection_metric(method, chosen_source)
                 result_state = self._dispatch_retriever(method, result_state)
+        elif retriever_error is not None:
+            # No fallback path available — re-raise so the caller sees the
+            # original failure instead of an empty-result short-circuit.
+            raise retriever_error
 
         # Mirror the (final) choice onto the context dict so it lands on
         # GraphRAGResponse.query_sources without further plumbing.
diff --git a/graphrag/app/agent/method_selector.py b/graphrag/app/agent/method_selector.py
index 15d46ad..724c735 100644
--- a/graphrag/app/agent/method_selector.py
+++ b/graphrag/app/agent/method_selector.py
@@ -55,27 +55,26 @@
 FALLBACK_METHOD = METHOD_HYBRID
 
 
-# In-lane fallback table: when a chunk-based method returns insufficient context,
-# try this method instead. Subset-aware — never falls back to a method whose
-# results are a strict subset of the failing method's seeds (e.g., similarity is
-# a subset of contextual/hybrid, so we don't fall back to it from those).
+# In-lane fallback table: when a retriever returns insufficient context (or
+# raises), try this method instead. Subset-aware — never falls back to a method
+# whose results are a strict subset of the failing method's seeds (e.g.,
+# similarity is a subset of contextual/hybrid, so we don't fall back to it from
+# those).
 #
-# The table fires once per question. Community is the terminal step from hybrid
-# because its retrieval surface (community summaries) is fundamentally different
-# from chunk retrieval — when chunk-based search finds little, thematic
-# summaries may still cover the question.
+# The table fires once per question. Community falls back to hybrid so that
+# thematic questions that miss (no relevant community summaries) still get a
+# chance at the entity-driven graph-hop retriever before short-circuiting to
+# "couldn't find."
 INLANE_FALLBACK_TABLE = {
     METHOD_SIMILARITY: METHOD_HYBRID,    # point lookup → graph-hop expansion
     METHOD_CONTEXTUAL: METHOD_HYBRID,    # sibling expansion thin → try graph hops
     METHOD_HYBRID: METHOD_COMMUNITY,     # entity-driven thin → try thematic summaries
-    # No fallback FROM community — its top-k semantics differ; the in-lane
-    # trigger doesn't apply, and falling back to a chunk method when community
-    # missed is a different problem (handled by router_fallback / out-of-corpus).
+    METHOD_COMMUNITY: METHOD_HYBRID,     # no relevant communities → try entity-driven graph hops
 }
 
 
 def has_insufficient_context(retrieval_dict, method: str, top_k: int) -> bool:
-    """Decide whether a chunk-based retriever returned fewer items than asked.
+    """Decide whether a retriever returned too little context to answer from.
 
     Args:
         retrieval_dict: the `final_retrieval` dict from the retriever output, or None.
@@ -83,19 +82,22 @@ def has_insufficient_context(retrieval_dict, method: str, top_k: int) -> bool:
         top_k: the requested number of chunks for this retrieval.
 
     Returns:
-        True if the result is "insufficient" — i.e., the method is chunk-based and
-        the retrieved count is strictly below `top_k`. Empty results count as
-        insufficient. Returns False for community search (different semantics) and
-        for any non-dict input.
-
-    Note: this is the trigger for the in-lane fallback in supportai_search.
-    Community search is excluded because its top_k caps community summaries, not
-    chunks, and a small number of returned summaries doesn't mean "no context."
+        True if the result is "insufficient":
+          * For chunk-based methods: fewer than `top_k` chunks returned.
+          * For community search: zero communities returned (top_k caps
+            community summaries, not chunks, so any non-empty result counts
+            as having some context).
+          * For any unknown method or non-dict input: True if missing / malformed,
+            otherwise False.
+
+    This is the trigger for the in-lane fallback in supportai_search.
     """
-    if method not in CHUNK_BASED_METHODS:
-        return False
     if not isinstance(retrieval_dict, dict):
         return True  # empty / malformed → insufficient
+    if method == METHOD_COMMUNITY:
+        return len(retrieval_dict) == 0
+    if method not in CHUNK_BASED_METHODS:
+        return False
     return len(retrieval_dict) < top_k
 
 
diff --git a/graphrag/tests/test_method_selector.py b/graphrag/tests/test_method_selector.py
index 6f6f975..bdcd238 100644
--- a/graphrag/tests/test_method_selector.py
+++ b/graphrag/tests/test_method_selector.py
@@ -329,10 +329,10 @@ def test_hybrid_falls_back_to_community(self):
         # Different retrieval surface (community summaries vs chunks).
         self.assertEqual(INLANE_FALLBACK_TABLE[METHOD_HYBRID], METHOD_COMMUNITY)
 
-    def test_community_has_no_fallback(self):
-        # Community's top-k semantics differ; the in-lane trigger doesn't fire
-        # for it, so a fallback entry would be unused.
-        self.assertNotIn(METHOD_COMMUNITY, INLANE_FALLBACK_TABLE)
+    def test_community_falls_back_to_hybrid(self):
+        # When community search misses (no relevant summaries) or fails, try
+        # the entity-driven graph-hop retriever before giving up.
+        self.assertEqual(INLANE_FALLBACK_TABLE[METHOD_COMMUNITY], METHOD_HYBRID)
 
     def test_no_self_fallback(self):
         # A method should never fall back to itself.
@@ -365,11 +365,12 @@ def test_above_top_k_is_sufficient(self):
         above = {f"chunk{i}": "text" for i in range(7)}
         self.assertFalse(has_insufficient_context(above, METHOD_HYBRID, top_k=5))
 
-    def test_community_always_returns_false(self):
-        """Community has different top_k semantics (community summaries, not
-        chunks). It should never trigger the insufficient-context path."""
-        self.assertFalse(has_insufficient_context({}, METHOD_COMMUNITY, top_k=5))
-        self.assertFalse(has_insufficient_context(None, METHOD_COMMUNITY, top_k=5))
+    def test_empty_community_is_insufficient(self):
+        """Community returning zero summaries is treated as insufficient so the
+        in-lane fallback can fire. A non-empty result is sufficient regardless
+        of the top_k cap (community top_k counts summaries, not chunks)."""
+        self.assertTrue(has_insufficient_context({}, METHOD_COMMUNITY, top_k=5))
+        self.assertTrue(has_insufficient_context(None, METHOD_COMMUNITY, top_k=5))
         partial = {f"comm{i}": "summary" for i in range(2)}
         self.assertFalse(has_insufficient_context(partial, METHOD_COMMUNITY, top_k=5))
 

From 628298013df77687f10bfccdd93d2f8c18618214 Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Thu, 4 Jun 2026 10:12:16 -0700
Subject: [PATCH 13/18] Harden v1.4.1 paths surfaced by code review

- Ensure the decorative-image marker stays in English even when document descriptions are localized, so decorative images are still recognized and kept out of the JSONL
- Release the image file handle on every exit path of the PDF image-description worker (including skipped images), preventing handle build-up on image-heavy PDFs
- Serialize embedding-store rebuilds across the background retry loop, the manual retry endpoint, and the db-config reload so concurrent calls cannot stomp shared state
- Send the vector-search-unavailable notice only to authenticated chat clients, and drop the raw error string from it
- Wrap the API-token TigerGraph connection the same way the password path does so version checks work for token logins
- Block the GraphRAG Configuration save button when the page failed to load the current config, so a stale reference cannot strip valid overrides
- Cancel in-flight GraphRAG Configuration fetches when the scope or graph changes so the latest selection always wins
- Prevent the Document Ingestion dialog from re-enabling the Ingest button between a click and the server registering the job, removing the double-submit window
- Cancel pending GraphDB redirect/refresh timers when the page is left so they cannot run on an unrelated page

Refs: GML-2092, GML-2094, GML-2095, GML-2097
---
 common/config.py                              | 26 ++++++---
 common/utils/image_data_extractor.py          | 10 ++--
 common/utils/text_extractors.py               | 43 +++++++-------
 graphrag-ui/src/pages/setup/GraphDBConfig.tsx | 24 ++++++--
 .../src/pages/setup/GraphRAGConfig.tsx        | 25 +++++++-
 graphrag-ui/src/pages/setup/IngestGraph.tsx   | 37 +++++++++++-
 graphrag/app/routers/ui.py                    | 57 +++++++++++--------
 7 files changed, 157 insertions(+), 65 deletions(-)

diff --git a/common/config.py b/common/config.py
index 170259e..cd51d6a 100644
--- a/common/config.py
+++ b/common/config.py
@@ -519,6 +519,11 @@ def get_llm_service(service_config: dict) -> LLM_Model:
 _embedding_store_ready = threading.Event()
 _embedding_stores: dict = {}
 _embedding_stores_lock = threading.Lock()
+# Serializes default-store init across the background retry loop, the manual
+# /ui/admin/retry_embedding_store endpoint, and reset_embedding_store callers
+# (db-config reload). Without it two _init_embedding_store threads could run
+# concurrently and stomp ``embedding_store`` + ``service_status``.
+_embedding_store_init_lock = threading.Lock()
 service_status["embedding_store"] = {
     "status": "initializing",
     "error": "Embedding store is still initializing",
@@ -560,16 +565,21 @@ def _init_embedding_store():
     """Background thread target. Builds the default embedding store
     without blocking module import — TigerGraph may be slow on first
     connect, and we don't want app startup to wait on it.
+
+    Serialized via ``_embedding_store_init_lock`` so concurrent calls
+    (initial startup + background retry loop + manual retry endpoint +
+    db-config reload) cannot stomp the shared globals.
     """
     global embedding_store
-    try:
-        embedding_store = _build_embedding_store()
-        service_status["embedding_store"] = {"status": "ok", "error": None}
-    except Exception as e:
-        service_status["embedding_store"] = {"status": "error", "error": str(e)}
-        logger.error(f"Failed to initialize embedding store: {e}")
-    finally:
-        _embedding_store_ready.set()
+    with _embedding_store_init_lock:
+        try:
+            embedding_store = _build_embedding_store()
+            service_status["embedding_store"] = {"status": "ok", "error": None}
+        except Exception as e:
+            service_status["embedding_store"] = {"status": "error", "error": str(e)}
+            logger.error(f"Failed to initialize embedding store: {e}")
+        finally:
+            _embedding_store_ready.set()
 
 
 def get_embedding_store(graphname: str | None = None, timeout: float = 0):
diff --git a/common/utils/image_data_extractor.py b/common/utils/image_data_extractor.py
index 5ffd189..95b4581 100644
--- a/common/utils/image_data_extractor.py
+++ b/common/utils/image_data_extractor.py
@@ -125,10 +125,12 @@ def describe_image_with_llm(file_path):
                             "has no text, infer the document's language from any "
                             "visible labels, captions, or branding and match that. "
                             "Default to English only if no language signal is "
-                            "present. If the image is purely decorative (no text, "
-                            "no data, no diagram), reply with just \"decorative "
-                            "image\" and nothing else. Respond as a SINGLE "
-                            "plain-text paragraph — no markdown headings, no "
+                            "present. EXCEPTION: if the image is purely decorative "
+                            "(no text, no data, no diagram), reply with exactly the "
+                            "English phrase \"decorative image\" (lowercase, no "
+                            "punctuation, no translation) and nothing else — this "
+                            "is a fixed sentinel, never localized. Respond as a "
+                            "SINGLE plain-text paragraph — no markdown headings, no "
                             "bullet lists, no blank lines. The reply is used "
                             "verbatim as the alt-text inside `![alt](url)`."
                         ),
diff --git a/common/utils/text_extractors.py b/common/utils/text_extractors.py
index cee0419..503acad 100644
--- a/common/utils/text_extractors.py
+++ b/common/utils/text_extractors.py
@@ -560,28 +560,27 @@ def _describe_and_encode(img_ref: dict) -> dict:
             """
             try:
                 img_path = Path(img_ref["path"])
-                pil_image = PILImage.open(img_path)
-                too_small = (
-                    pil_image.width < min_dim or pil_image.height < min_dim
-                )
-                if not extract_images_enabled or too_small:
-                    return {"ok": True, "skip": True, "img_ref": img_ref}
-                description = describe_image_with_llm(str(img_path))
-                if _is_decorative(description):
-                    return {"ok": True, "skip": True, "img_ref": img_ref}
-                if pil_image.mode != "RGB":
-                    pil_image = pil_image.convert("RGB")
-                buffer = io.BytesIO()
-                pil_image.save(buffer, format="JPEG", quality=95)
-                image_base64 = base64.b64encode(buffer.getvalue()).decode("utf-8")
-                return {
-                    "ok": True,
-                    "img_ref": img_ref,
-                    "description": description,
-                    "image_base64": image_base64,
-                    "width": pil_image.width,
-                    "height": pil_image.height,
-                }
+                with PILImage.open(img_path) as pil_image:
+                    too_small = (
+                        pil_image.width < min_dim or pil_image.height < min_dim
+                    )
+                    if not extract_images_enabled or too_small:
+                        return {"ok": True, "skip": True, "img_ref": img_ref}
+                    description = describe_image_with_llm(str(img_path))
+                    if _is_decorative(description):
+                        return {"ok": True, "skip": True, "img_ref": img_ref}
+                    rgb_image = pil_image if pil_image.mode == "RGB" else pil_image.convert("RGB")
+                    buffer = io.BytesIO()
+                    rgb_image.save(buffer, format="JPEG", quality=95)
+                    image_base64 = base64.b64encode(buffer.getvalue()).decode("utf-8")
+                    return {
+                        "ok": True,
+                        "img_ref": img_ref,
+                        "description": description,
+                        "image_base64": image_base64,
+                        "width": pil_image.width,
+                        "height": pil_image.height,
+                    }
             except Exception as img_error:  # noqa: BLE001 — keep going
                 return {"ok": False, "img_ref": img_ref, "error": img_error}
 
diff --git a/graphrag-ui/src/pages/setup/GraphDBConfig.tsx b/graphrag-ui/src/pages/setup/GraphDBConfig.tsx
index 66015f5..06e66af 100644
--- a/graphrag-ui/src/pages/setup/GraphDBConfig.tsx
+++ b/graphrag-ui/src/pages/setup/GraphDBConfig.tsx
@@ -1,4 +1,4 @@
-import React, { useState, useEffect } from "react";
+import React, { useState, useEffect, useRef } from "react";
 import { Server, Save, CheckCircle2, AlertCircle, RefreshCw, Loader2 } from "lucide-react";
 import { Input } from "@/components/ui/input";
 import { Button } from "@/components/ui/button";
@@ -74,6 +74,22 @@ const GraphDBConfig = () => {
     fetchStoreStatus();
   }, []);
 
+  // Track every setTimeout we schedule so we can cancel them on unmount.
+  // Otherwise a redirect/alert/refresh timer fires after the user navigates
+  // away, possibly wiping auth from a page they're now on.
+  const timeoutsRef = useRef<ReturnType<typeof setTimeout>[]>([]);
+  const scheduleTimeout = (fn: () => void, ms: number) => {
+    const id = setTimeout(fn, ms);
+    timeoutsRef.current.push(id);
+    return id;
+  };
+  useEffect(() => {
+    return () => {
+      timeoutsRef.current.forEach(clearTimeout);
+      timeoutsRef.current = [];
+    };
+  }, []);
+
   const handleRetryEmbeddingStore = async () => {
     setIsRetryingStore(true);
     setRetryMessage("");
@@ -262,7 +278,7 @@ const GraphDBConfig = () => {
             ? "GraphDB hostname changed. Please relogin with the new credentials to connect to the new instance."
             : "GraphDB username changed. Please relogin with the new credentials.";
           
-          setTimeout(() => {
+          scheduleTimeout(() => {
             // Clear sessionStorage and redirect to login
             sessionStorage.removeItem("auth");
             alert(reason);
@@ -277,8 +293,8 @@ const GraphDBConfig = () => {
           // seconds; poll a second time so the operator sees the real
           // outcome (ok or error) without navigating away.
           fetchStoreStatus();
-          setTimeout(fetchStoreStatus, 3000);
-          setTimeout(fetchStoreStatus, 8000);
+          scheduleTimeout(fetchStoreStatus, 3000);
+          scheduleTimeout(fetchStoreStatus, 8000);
         }
       } else {
         setMessage(result.detail || "Failed to save configuration");
diff --git a/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx b/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx
index aa24821..dd618f8 100644
--- a/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx
+++ b/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx
@@ -60,6 +60,7 @@ const GraphRAGConfig = () => {
 
   const [isLoading, setIsLoading] = useState(false);
   const [isSaving, setIsSaving] = useState(false);
+  const [loadFailed, setLoadFailed] = useState(false);
   const [message, setMessage] = useState("");
   const [messageType, setMessageType] = useState<"success" | "error" | "">("");
 
@@ -70,11 +71,18 @@ const GraphRAGConfig = () => {
   // Track configs as loaded from API so we only save what's needed
   const loadedGlobalConfig = useRef<Record<string, any>>({});
   const loadedGraphOverrides = useRef<Record<string, any>>({});
+  // AbortController for in-flight fetchConfig. Toggling scope/graph rapidly
+  // would otherwise let the older request resolve last, leaving the UI
+  // showing the wrong scope's values.
+  const fetchAbortRef = useRef<AbortController | null>(null);
 
   useEffect(() => {
     const site = JSON.parse(sessionStorage.getItem("site") || "{}");
     setAvailableGraphs(site.graphs || []);
     fetchConfig();
+    return () => {
+      fetchAbortRef.current?.abort();
+    };
   }, []);
 
 
@@ -120,6 +128,12 @@ const GraphRAGConfig = () => {
     const queryString = params.toString() ? `?${params.toString()}` : "";
     const url = `/ui/config${queryString}`;
 
+    // Cancel any prior in-flight fetch; only the latest scope/graph
+    // selection should win.
+    fetchAbortRef.current?.abort();
+    const ac = new AbortController();
+    fetchAbortRef.current = ac;
+
     // Transient backend failures (cold start, brief upstream timeouts via
     // nginx, momentary 502/503/504) are common right after a service
     // restart and produced the intermittent "Failed to fetch configuration"
@@ -139,6 +153,7 @@ const GraphRAGConfig = () => {
       try {
         const response = await fetch(url, {
           headers: { Authorization: creds! },
+          signal: ac.signal,
         });
         lastStatus = response.status;
         if (!response.ok) {
@@ -168,9 +183,13 @@ const GraphRAGConfig = () => {
         // Clear any prior transient error banner on success.
         setMessage("");
         setMessageType("");
+        setLoadFailed(false);
         setIsLoading(false);
         return;
       } catch (error: any) {
+        // Superseded by a newer fetch — bail silently so the loading
+        // banner doesn't flicker an error for a request we cancelled.
+        if (error?.name === "AbortError") return;
         lastErr = error;
         if (attempt < maxAttempts && shouldRetry(lastStatus, error)) {
           await new Promise((r) => setTimeout(r, 500 * attempt));
@@ -185,6 +204,10 @@ const GraphRAGConfig = () => {
       `Failed to load configuration${lastStatus ? ` (HTTP ${lastStatus})` : ""}. Please retry.`
     );
     setMessageType("error");
+    // Block Save: the loaded reference is stale/empty, so diffing against it
+    // can silently strip valid overrides (per-graph mode) or save defaults
+    // over server state (global mode).
+    setLoadFailed(true);
     setIsLoading(false);
   };
 
@@ -1038,7 +1061,7 @@ const GraphRAGConfig = () => {
             </div>
           )}
 
-          <Button onClick={handleSave} disabled={isSaving} className="gradient text-white w-full">
+          <Button onClick={handleSave} disabled={isSaving || isLoading || loadFailed} title={loadFailed ? "Reload the page or click Retry to fetch the current configuration before saving" : undefined} className="gradient text-white w-full">
             {isSaving ? (
               <>
                 <Loader2 className="h-4 w-4 mr-2 animate-spin" />
diff --git a/graphrag-ui/src/pages/setup/IngestGraph.tsx b/graphrag-ui/src/pages/setup/IngestGraph.tsx
index 4c3d8e1..feb4bfe 100644
--- a/graphrag-ui/src/pages/setup/IngestGraph.tsx
+++ b/graphrag-ui/src/pages/setup/IngestGraph.tsx
@@ -193,6 +193,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
         setIsUploading(false);
 
         console.log("Calling handleCreateIngestAfterUpload from main upload...");
+        recentProcessClickRef.current = Date.now();
         setIsProcessingFiles(true);
         handleCreateIngestAfterUpload("uploaded", uploadedCount).catch((err) => {
           console.error("Error in background processing:", err);
@@ -288,6 +289,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
       await fetchUploadedFiles();
 
       console.log("Calling handleCreateIngestAfterUpload...");
+      recentProcessClickRef.current = Date.now();
       setIsProcessingFiles(true);
       try {
         await handleCreateIngestAfterUpload("uploaded", uploadedCount);
@@ -440,6 +442,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
         setDownloadMessage("✅ Successfully downloaded the files. Processing...");
         await fetchDownloadedFiles();
         setIsDownloading(false);
+        recentProcessClickRef.current = Date.now();
         setIsProcessingFiles(true);
         handleCreateIngestAfterUpload("downloaded", downloadCount).catch((err) => {
           console.error("Error in background processing:", err);
@@ -511,6 +514,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
       setIngestMessage("❌ Please select a graph");
       return;
     }
+    recentIngestClickRef.current = Date.now();
     setIsIngesting(true);
     setIngestMessage("Ingesting documents into knowledge graph...");
     try {
@@ -599,6 +603,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
     const folderPath = sourceType === "uploaded" ? `uploads/${ingestGraphName}` : `downloaded_files_cloud/${ingestGraphName}`;
     const fileCount = sourceType === "uploaded" ? uploadedFiles.length : downloadedFiles.length;
 
+    recentIngestClickRef.current = Date.now();
     setIsIngesting(true);
     setIngestMessage("Step 1/2: Creating ingest job...");
 
@@ -794,6 +799,7 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
       return;
     }
 
+    recentIngestClickRef.current = Date.now();
     setIsIngesting(true);
 
     try {
@@ -990,6 +996,15 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
   // that. While an operation is in flight, poll every 5s and clear
   // local state + refresh the file list once the server is idle.
   const lastServerOpRef = useRef<string | null>(null);
+  // Grace-window timestamps: a click sets local state to true before the
+  // server has registered the operation, so the next poll would otherwise
+  // immediately downgrade local state and re-enable the button — letting a
+  // quick second click double-POST. We hold local "true" until either the
+  // server acknowledges the op (then real completion drives the downgrade)
+  // or the grace window expires.
+  const recentIngestClickRef = useRef<number>(0);
+  const recentProcessClickRef = useRef<number>(0);
+  const POLL_GRACE_MS = 8000;
   useEffect(() => {
     if (!ingestGraphName) return;
     let cancelled = false;
@@ -1006,10 +1021,28 @@ const IngestGraph: React.FC<IngestGraphProps> = ({ isModal = false }) => {
         const d = await r.json();
         if (cancelled) return;
         const op: string | null = d?.operation || null;
+
+        const isIngestingFromServer = op === "ingest";
+        const isProcessingFromServer =
+          op === "create_ingest" || op === "upload_files";
+        const serverEverSawIngest = lastServerOpRef.current === "ingest";
+        const serverEverSawProcess =
+          lastServerOpRef.current === "create_ingest" ||
+          lastServerOpRef.current === "upload_files";
+        const now = Date.now();
+        const ingestClickFresh =
+          now - recentIngestClickRef.current < POLL_GRACE_MS;
+        const processClickFresh =
+          now - recentProcessClickRef.current < POLL_GRACE_MS;
+
+        setIsIngesting(
+          isIngestingFromServer ||
+            (ingestClickFresh && !serverEverSawIngest)
+        );
         setIsProcessingFiles(
-          op === "create_ingest" || op === "upload_files"
+          isProcessingFromServer ||
+            (processClickFresh && !serverEverSawProcess)
         );
-        setIsIngesting(op === "ingest");
         if (lastServerOpRef.current && !op) {
           // Server-side work just finished — refresh the file list.
           fetchUploadedFiles();
diff --git a/graphrag/app/routers/ui.py b/graphrag/app/routers/ui.py
index 6073dfb..7a2d3d1 100644
--- a/graphrag/app/routers/ui.py
+++ b/graphrag/app/routers/ui.py
@@ -60,6 +60,7 @@
 from common.logs.log import req_id_cv
 from common.logs.logwriter import LogWriter
 from common.metrics.prometheus_metrics import metrics as pmetrics
+from common.metrics.tg_proxy import TigerGraphConnectionProxy
 from common.utils.graph_locks import acquire_graph_lock, release_graph_lock, acquire_rebuild_lock, release_rebuild_lock, get_rebuilding_graph, get_current_operation
 from supportai import supportai
 from common.py_schemas.schemas import (
@@ -522,14 +523,22 @@ def ws_basic_auth(auth_info: str, graphname=None):
     if creds.username == _UI_TOKEN_SENTINEL:
         # API-token logins: build a TG connection directly with the
         # token; ``get_db_connection_pwd_manual`` only handles
-        # username/password.
-        conn = TigerGraphConnection(
+        # username/password. Mirror the customizeHeader + Proxy wrap
+        # used by the password path so downstream code that depends on
+        # proxy-only attributes (e.g. version checks) works the same
+        # for token logins.
+        raw_conn = TigerGraphConnection(
             host=db_config["hostname"],
             graphname=graphname or "",
             apiToken=creds.password,
             restppPort=db_config.get("restppPort", "9000"),
             gsPort=db_config.get("gsPort", "14240"),
         )
+        raw_conn.customizeHeader(
+            timeout=db_config.get("default_timeout", 60) * 1000,
+            responseSize=5000000,
+        )
+        conn = TigerGraphConnectionProxy(raw_conn, auth_mode="token")
     else:
         conn = get_db_connection_pwd_manual(
             graphname, creds.username, creds.password
@@ -2407,34 +2416,34 @@ async def chat(
     # connection explicitly closed) before the callable returns.
     await websocket.accept()
 
-    # If the embedding store is currently unavailable, advise the
-    # client up-front. The chat still proceeds: agent paths that rely
-    # on graph traversal (generate_function / generate_cypher /
-    # entity-relationship retrieval) work without vector search, and
-    # the auto-mode selector skips vector retrievers downstream. Only
-    # questions that genuinely require a vector lookup return a
-    # graceful per-question error through the synthesizer.
-    if service_status["embedding_store"]["status"] != "ok":
-        try:
-            await websocket.send_json({
-                "notice": "vector_search_unavailable",
-                "status": service_status["embedding_store"]["status"],
-                "error": service_status["embedding_store"]["error"],
-                "message": (
-                    "Vector search is currently unavailable; graph "
-                    "traversal questions still work and the service "
-                    "will recover automatically."
-                ),
-            })
-        except Exception:
-            pass
-
     # AUTH with proper error handling and timeout
     try:
         logger.info(f"WebSocket connected, waiting for authentication for graph: {graphname}")
         usr_auth = await asyncio.wait_for(websocket.receive_text(), timeout=10.0)
         logger.info(f"Received authentication data, length: {len(usr_auth)}")
         _, conn = ws_basic_auth(usr_auth, graphname)
+
+        # If the embedding store is currently unavailable, advise the
+        # client now that the caller is authenticated. The chat still
+        # proceeds: agent paths that rely on graph traversal
+        # (generate_function / generate_cypher / entity-relationship
+        # retrieval) work without vector search, and the auto-mode
+        # selector skips vector retrievers downstream. Only questions
+        # that genuinely require a vector lookup return a graceful
+        # per-question error through the synthesizer.
+        if service_status["embedding_store"]["status"] != "ok":
+            try:
+                await websocket.send_json({
+                    "notice": "vector_search_unavailable",
+                    "status": service_status["embedding_store"]["status"],
+                    "message": (
+                        "Vector search is currently unavailable; graph "
+                        "traversal questions still work and the service "
+                        "will recover automatically."
+                    ),
+                })
+            except Exception:
+                pass
         # Extract the authenticated username for trace-log ownership
         # tracking. For sentinel logins (API token / secret) this is
         # the sentinel itself; we resolve to the real TG identity below.

From bbdd0807601466403f129205a62fa5554344f2b0 Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Thu, 4 Jun 2026 12:22:06 -0700
Subject: [PATCH 14/18] Tighten v1.4.1 auth, upload, and config-save paths

- Make the GraphRAG Configuration save return early with an error message when the page is still loading, failed to load its baseline, or the caller isn't signed in, so a programmatic save cannot overwrite server state without a current reference
- Schema-extraction conversion only walks the files in the current request, no longer re-converting unrelated files that already live in the per-graph upload directory
- Reject Basic auth payloads that omit the colon separator, instead of letting them silently become empty-password login attempts
- Use the full SHA-256 hex as the role-cache key suffix so two distinct API tokens with the same hash prefix cannot share cached identity

Refs: GML-2092, GML-2094, GML-2095, GML-2096
---
 README.md                                     |   2 +-
 common/utils/text_extractors.py               |  13 +-
 .../src/pages/setup/GraphRAGConfig.tsx        |  16 ++-
 graphrag/app/routers/ui.py                    | 119 +++++++++++-------
 4 files changed, 94 insertions(+), 56 deletions(-)

diff --git a/README.md b/README.md
index 739c699..c368979 100644
--- a/README.md
+++ b/README.md
@@ -784,7 +784,7 @@ In addition to the `AZURE_OPENAI_ENDPOINT`, `AZURE_OPENAI_API_KEY`, and `azure_d
 }
 ```
 
-`boto3_config` is optional (the defaults shown above are also the built-in defaults). Raise `max_pool_connections` if `PDF_IMAGE_CONCURRENCY` is set above `50`. The same block can be set on `embedding_service` when using Bedrock embeddings.
+`boto3_config` is optional (the defaults shown above are also the built-in defaults). The same block can be set on `embedding_service` when using Bedrock embeddings.
 
 #### Ollama
 
diff --git a/common/utils/text_extractors.py b/common/utils/text_extractors.py
index 503acad..7858979 100644
--- a/common/utils/text_extractors.py
+++ b/common/utils/text_extractors.py
@@ -537,14 +537,11 @@ def _extract_pdf_with_images_as_docs(file_path, base_doc_id, graphname=None):
                 "position": 0
             }]
         # Phase 1 — describe + base64-encode every image in parallel.
-        # Each worker hits Bedrock for the description and reads the
-        # image off disk, so they're I/O-bound; a small thread pool
-        # cuts wall-clock proportionally for image-heavy PDFs.
-        # Markdown mutations stay in phase 2 (next loop) because
-        # insert_description_by_id / replace_path_with_tg_protocol
-        # mutate the same shared string and must run in deterministic
-        # order. Concurrency cap is intentionally small to stay below
-        # Bedrock's per-account throttle.
+        # Each worker is I/O-bound (one multimodal request + a disk read),
+        # so a thread pool cuts wall-clock proportionally for image-heavy
+        # PDFs. Markdown mutations stay in phase 2 because
+        # insert_description_by_id / replace_path_with_tg_protocol mutate
+        # the same shared string and must run in deterministic order.
         image_workers = image_describe_workers(graphname)
         extract_images_enabled = should_extract_images(graphname)
         min_dim = min_image_dim_px(graphname)
diff --git a/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx b/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx
index dd618f8..2228690 100644
--- a/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx
+++ b/graphrag-ui/src/pages/setup/GraphRAGConfig.tsx
@@ -212,13 +212,25 @@ const GraphRAGConfig = () => {
   };
 
   const handleSave = async () => {
+    // Hard guards — the button's disabled prop is cosmetic; this is the
+    // runtime check, since handleSave can also be invoked programmatically.
+    if (isLoading || loadFailed) {
+      setMessage("Reload the current configuration before saving.");
+      setMessageType("error");
+      return;
+    }
+    const creds = sessionStorage.getItem("auth");
+    if (!creds) {
+      setMessage("Not signed in. Please sign in again.");
+      setMessageType("error");
+      return;
+    }
+
     setIsSaving(true);
     setMessage("");
     setMessageType("");
 
     try {
-      const creds = sessionStorage.getItem("auth");
-      
       // Build current UI state — only include non-empty fields
       const currentChunkerConfig: any = {};
       if (chunkSize !== "") currentChunkerConfig.chunk_size = parseInt(chunkSize);
diff --git a/graphrag/app/routers/ui.py b/graphrag/app/routers/ui.py
index 7a2d3d1..9e1df27 100644
--- a/graphrag/app/routers/ui.py
+++ b/graphrag/app/routers/ui.py
@@ -21,6 +21,7 @@
 import os
 import re
 import shutil
+import tempfile
 import threading
 import time
 import traceback
@@ -240,7 +241,12 @@ def _get_user_role_details(
     is the secret's owner; for classic user/password logins it matches
     the input.
     """
-    pwd_hash = hashlib.sha256(password.encode()).hexdigest()[:16]
+    # Use the full SHA-256 hex (64 chars). Token logins share the
+    # ``_UI_TOKEN_SENTINEL`` username, so the hash is the only thing
+    # distinguishing one token from another in the cache key — a
+    # truncated hash would let two distinct tokens whose hash prefixes
+    # collide serve each other's cached roles.
+    pwd_hash = hashlib.sha256(password.encode()).hexdigest()
     cache_key = (username, pwd_hash)
     now = time.time()
 
@@ -418,13 +424,23 @@ def _parse_auth_header(authorization: str | None) -> HTTPBasicCredentials:
     if scheme == "basic" and value:
         try:
             decoded = base64.b64decode(value).decode()
-            username, _, password = decoded.partition(":")
         except Exception:
             raise HTTPException(
                 status_code=status.HTTP_401_UNAUTHORIZED,
                 detail="Malformed Basic credentials",
                 headers={"WWW-Authenticate": "Basic"},
             )
+        # RFC 7617: Basic payload MUST be ``user-id ":" password``. Reject
+        # payloads with no colon outright — partition silently produces an
+        # empty password otherwise, which would turn a malformed header
+        # into an empty-password login attempt.
+        if ":" not in decoded:
+            raise HTTPException(
+                status_code=status.HTTP_401_UNAUTHORIZED,
+                detail="Malformed Basic credentials",
+                headers={"WWW-Authenticate": "Basic"},
+            )
+        username, _, password = decoded.partition(":")
         return HTTPBasicCredentials(username=username, password=password)
     if scheme == "bearer" and value:
         return HTTPBasicCredentials(username=_UI_TOKEN_SENTINEL, password=value)
@@ -1533,53 +1549,66 @@ async def convert_sample_files(
 
         saved_basenames: list[str] = []
         total_bytes = 0
-        for f in accepted:
-            data = await f.read()
-            total_bytes += len(data)
-            if total_bytes > max_total_bytes:
-                raise HTTPException(
-                    status_code=400,
-                    detail=f"Total upload exceeds {max_total_mb} MB cap.",
+        # Conversion runs over a request-scoped staging directory so the
+        # schema-extraction step only sees the just-uploaded files — not
+        # whatever else already lives in the per-graph upload directory.
+        staging_dir = tempfile.mkdtemp(prefix=f"sample_convert_{graphname}_")
+        try:
+            for f in accepted:
+                data = await f.read()
+                total_bytes += len(data)
+                if total_bytes > max_total_bytes:
+                    raise HTTPException(
+                        status_code=400,
+                        detail=f"Total upload exceeds {max_total_mb} MB cap.",
+                    )
+                safe_name = os.path.basename(f.filename or "sample")
+                if safe_name in saved_basenames:
+                    raise HTTPException(
+                        status_code=400,
+                        detail=(
+                            f"Duplicate filename '{safe_name}' in upload set. "
+                            "Rename one of the files and try again."
+                        ),
+                    )
+
+                # On overwrite, drop the cached JSONL so the new bytes
+                # are re-converted instead of silently reusing the stale
+                # extract.
+                if overwrite:
+                    stem = os.path.splitext(safe_name)[0]
+                    cached_jsonl = os.path.join(temp_folder, f"{stem}.jsonl")
+                    if os.path.exists(cached_jsonl):
+                        try:
+                            os.remove(cached_jsonl)
+                        except OSError as exc:
+                            logger.warning(
+                                f"Could not remove cached jsonl {cached_jsonl}: {exc}"
+                            )
+
+                # Persist the file in the per-graph upload directory so
+                # it's visible in the upload dialog later, and stage a
+                # copy in the request-private staging directory so the
+                # conversion step only walks the current batch.
+                target = os.path.join(upload_dir, safe_name)
+                with open(target, "wb") as out:
+                    out.write(data)
+                with open(os.path.join(staging_dir, safe_name), "wb") as out:
+                    out.write(data)
+                saved_basenames.append(safe_name)
+
+            extractor = TextExtractor()
+            try:
+                result = await extractor._process_folder_async(
+                    staging_dir, graphname, temp_folder
                 )
-            safe_name = os.path.basename(f.filename or "sample")
-            if safe_name in saved_basenames:
+            except Exception as exc:
                 raise HTTPException(
                     status_code=400,
-                    detail=(
-                        f"Duplicate filename '{safe_name}' in upload set. "
-                        "Rename one of the files and try again."
-                    ),
+                    detail=f"Text extraction failed: {exc}",
                 )
-
-            # On overwrite, drop the cached JSONL so the new bytes
-            # are re-converted instead of silently reusing the stale
-            # extract.
-            if overwrite:
-                stem = os.path.splitext(safe_name)[0]
-                cached_jsonl = os.path.join(temp_folder, f"{stem}.jsonl")
-                if os.path.exists(cached_jsonl):
-                    try:
-                        os.remove(cached_jsonl)
-                    except OSError as exc:
-                        logger.warning(
-                            f"Could not remove cached jsonl {cached_jsonl}: {exc}"
-                        )
-
-            target = os.path.join(upload_dir, safe_name)
-            with open(target, "wb") as out:
-                out.write(data)
-            saved_basenames.append(safe_name)
-
-        extractor = TextExtractor()
-        try:
-            result = await extractor._process_folder_async(
-                upload_dir, graphname, temp_folder
-            )
-        except Exception as exc:
-            raise HTTPException(
-                status_code=400,
-                detail=f"Text extraction failed: {exc}",
-            )
+        finally:
+            shutil.rmtree(staging_dir, ignore_errors=True)
 
         LogWriter.info(
             f"Converted sample files for {graphname}: "

From 801dade63fee44ccc5132326d6a00e2b28e1aeb6 Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Thu, 4 Jun 2026 14:44:19 -0700
Subject: [PATCH 15/18] Pass the sample filenames to the conversion walk
 instead of staging

- Restrict the sample-doc conversion to just the files in the current
  request by passing their basenames to the extractor, instead of
  staging duplicates into a request-scoped temp directory
- Drop the now-unused staging dir scaffold and the tempfile import

Refs: GML-2095, GML-2096
---
 common/utils/text_extractors.py |  12 +++-
 graphrag/app/routers/ui.py      | 104 +++++++++++++++-----------------
 2 files changed, 58 insertions(+), 58 deletions(-)

diff --git a/common/utils/text_extractors.py b/common/utils/text_extractors.py
index 7858979..4459f60 100644
--- a/common/utils/text_extractors.py
+++ b/common/utils/text_extractors.py
@@ -236,10 +236,16 @@ def _write_to_jsonl(self, jsonl_file, doc_entries):
                 json_line = json.dumps(doc_data, ensure_ascii=False)
                 f.write(json_line + '\n')
 
-    async def _process_folder_async(self, folder_path, graphname, temp_folder, max_concurrent=10):
+    async def _process_folder_async(self, folder_path, graphname, temp_folder, filenames=None, max_concurrent=10):
         """
         Async version of process_folder for parallel file processing.
         Creates one JSONL file per input file.
+
+        When *filenames* is supplied, only files whose basename appears
+        in that list are processed; everything else in the folder is
+        ignored. This lets a caller (e.g. the sample-doc schema-extraction
+        flow) reuse a shared upload directory without re-converting
+        files that belong to a previous request.
         """
         logger.info(f"Processing local folder ASYNC: {folder_path} for graph: {graphname} (max_concurrent={max_concurrent})")
 
@@ -255,6 +261,8 @@ async def _process_folder_async(self, folder_path, graphname, temp_folder, max_c
         os.makedirs(temp_folder, exist_ok=True)
         logger.info(f"Saving processed documents to: {temp_folder}")
 
+        allowed_basenames = set(filenames) if filenames is not None else None
+
         def safe_walk(path):
             try:
                 for item in path.iterdir():
@@ -276,6 +284,8 @@ def safe_walk(path):
             if file_path.is_file():
                 if file_path.name.startswith(('.', '~', '$')) or 'BROMIUM' in file_path.name.upper():
                     continue
+                if allowed_basenames is not None and file_path.name not in allowed_basenames:
+                    continue
                 file_ext = file_path.suffix.lower()
                 if file_ext == '.jsonl':
                     dest = os.path.join(temp_folder, file_path.name)
diff --git a/graphrag/app/routers/ui.py b/graphrag/app/routers/ui.py
index 9e1df27..c0d5426 100644
--- a/graphrag/app/routers/ui.py
+++ b/graphrag/app/routers/ui.py
@@ -21,7 +21,6 @@
 import os
 import re
 import shutil
-import tempfile
 import threading
 import time
 import traceback
@@ -1549,66 +1548,57 @@ async def convert_sample_files(
 
         saved_basenames: list[str] = []
         total_bytes = 0
-        # Conversion runs over a request-scoped staging directory so the
-        # schema-extraction step only sees the just-uploaded files — not
-        # whatever else already lives in the per-graph upload directory.
-        staging_dir = tempfile.mkdtemp(prefix=f"sample_convert_{graphname}_")
-        try:
-            for f in accepted:
-                data = await f.read()
-                total_bytes += len(data)
-                if total_bytes > max_total_bytes:
-                    raise HTTPException(
-                        status_code=400,
-                        detail=f"Total upload exceeds {max_total_mb} MB cap.",
-                    )
-                safe_name = os.path.basename(f.filename or "sample")
-                if safe_name in saved_basenames:
-                    raise HTTPException(
-                        status_code=400,
-                        detail=(
-                            f"Duplicate filename '{safe_name}' in upload set. "
-                            "Rename one of the files and try again."
-                        ),
-                    )
-
-                # On overwrite, drop the cached JSONL so the new bytes
-                # are re-converted instead of silently reusing the stale
-                # extract.
-                if overwrite:
-                    stem = os.path.splitext(safe_name)[0]
-                    cached_jsonl = os.path.join(temp_folder, f"{stem}.jsonl")
-                    if os.path.exists(cached_jsonl):
-                        try:
-                            os.remove(cached_jsonl)
-                        except OSError as exc:
-                            logger.warning(
-                                f"Could not remove cached jsonl {cached_jsonl}: {exc}"
-                            )
-
-                # Persist the file in the per-graph upload directory so
-                # it's visible in the upload dialog later, and stage a
-                # copy in the request-private staging directory so the
-                # conversion step only walks the current batch.
-                target = os.path.join(upload_dir, safe_name)
-                with open(target, "wb") as out:
-                    out.write(data)
-                with open(os.path.join(staging_dir, safe_name), "wb") as out:
-                    out.write(data)
-                saved_basenames.append(safe_name)
-
-            extractor = TextExtractor()
-            try:
-                result = await extractor._process_folder_async(
-                    staging_dir, graphname, temp_folder
+        for f in accepted:
+            data = await f.read()
+            total_bytes += len(data)
+            if total_bytes > max_total_bytes:
+                raise HTTPException(
+                    status_code=400,
+                    detail=f"Total upload exceeds {max_total_mb} MB cap.",
                 )
-            except Exception as exc:
+            safe_name = os.path.basename(f.filename or "sample")
+            if safe_name in saved_basenames:
                 raise HTTPException(
                     status_code=400,
-                    detail=f"Text extraction failed: {exc}",
+                    detail=(
+                        f"Duplicate filename '{safe_name}' in upload set. "
+                        "Rename one of the files and try again."
+                    ),
                 )
-        finally:
-            shutil.rmtree(staging_dir, ignore_errors=True)
+
+            # On overwrite, drop the cached JSONL so the new bytes
+            # are re-converted instead of silently reusing the stale
+            # extract.
+            if overwrite:
+                stem = os.path.splitext(safe_name)[0]
+                cached_jsonl = os.path.join(temp_folder, f"{stem}.jsonl")
+                if os.path.exists(cached_jsonl):
+                    try:
+                        os.remove(cached_jsonl)
+                    except OSError as exc:
+                        logger.warning(
+                            f"Could not remove cached jsonl {cached_jsonl}: {exc}"
+                        )
+
+            target = os.path.join(upload_dir, safe_name)
+            with open(target, "wb") as out:
+                out.write(data)
+            saved_basenames.append(safe_name)
+
+        extractor = TextExtractor()
+        try:
+            # Restrict the conversion walk to just this request's files
+            # so unrelated files that already live in ``upload_dir`` from
+            # earlier uploads are not re-converted.
+            result = await extractor._process_folder_async(
+                upload_dir, graphname, temp_folder,
+                filenames=saved_basenames,
+            )
+        except Exception as exc:
+            raise HTTPException(
+                status_code=400,
+                detail=f"Text extraction failed: {exc}",
+            )
 
         LogWriter.info(
             f"Converted sample files for {graphname}: "

From 8cb28887a49e3778e8bed68b7a3334fe13a8436c Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Fri, 5 Jun 2026 09:30:40 -0700
Subject: [PATCH 16/18] Redirect to the sign-in page when the chat WebSocket
 opens without session auth

- Send the user back to the sign-in page when the chat WebSocket opens
  without credentials in session storage, instead of sending a "null"
  auth header and letting the server close the connection silently
  (mirrors the same defensive check used elsewhere in the chat UI)

Refs: GML-2094
---
 graphrag-ui/src/actions/ActionProvider.tsx | 19 +++++++++++++------
 1 file changed, 13 insertions(+), 6 deletions(-)

diff --git a/graphrag-ui/src/actions/ActionProvider.tsx b/graphrag-ui/src/actions/ActionProvider.tsx
index 22fee0b..196a5b4 100644
--- a/graphrag-ui/src/actions/ActionProvider.tsx
+++ b/graphrag-ui/src/actions/ActionProvider.tsx
@@ -88,13 +88,20 @@ const ActionProvider: React.FC<ActionProviderProps> = ({
   );
   const { sendMessage, lastMessage, readyState } = useWebSocket(WS_URL, {
     onOpen: () => {
-      // Send authentication credentials
+      // Defensive: the route guard normally ensures ``auth`` is set
+      // before the chat page mounts, but idle-timeout expiry mid-session
+      // or a logout from another tab can clear it before the WebSocket
+      // (re)opens. Without this check we'd send "null" as the auth
+      // header and the server would close the WebSocket with no
+      // user-actionable message.
       const creds = sessionStorage.getItem("auth");
-      console.log("Sending credentials, length:", creds ? creds.length : 0);
-      queryGraphragWs2(creds!);
-
-      // Send RAG pattern
-      //sendMessage(selectedRagPattern);
+      if (!creds) {
+        console.error("No auth credentials available; redirecting to login");
+        alert("Your session has expired. Please log in again.");
+        window.location.href = "/";
+        return;
+      }
+      queryGraphragWs2(creds);
 
       // Send conversation ID (or "new" for new conversation)
       const conversationId = conversationManager.getCurrentConversationId();

From a449a404f7a0b0175a6ef480a711f513eeb5f16d Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Fri, 5 Jun 2026 09:48:30 -0700
Subject: [PATCH 17/18] Show underscores in extracted-schema name and
 description inputs

- Wrap the four schema-edit name and description inputs in a styled
  container so the inner input has no height constraint, mirroring
  the pattern already used by the graph-name combo box. macOS browsers
  otherwise clip the underscore character at the bottom of a height-
  constrained input element.

Refs: GML-2096
---
 graphrag-ui/src/pages/setup/KGAdmin.tsx | 182 ++++++++++++++----------
 1 file changed, 104 insertions(+), 78 deletions(-)

diff --git a/graphrag-ui/src/pages/setup/KGAdmin.tsx b/graphrag-ui/src/pages/setup/KGAdmin.tsx
index 564d49f..b84490e 100644
--- a/graphrag-ui/src/pages/setup/KGAdmin.tsx
+++ b/graphrag-ui/src/pages/setup/KGAdmin.tsx
@@ -25,6 +25,16 @@ import { resolveUploadConflicts } from "@/utils/uploadConflicts";
 import { useNavigate } from "react-router-dom";
 import IngestGraph from "./IngestGraph";
 
+// Same trick used in Login.tsx — Chrome / Safari on macOS clip the
+// underscore descender inside ``<input>`` even when CSS says there is
+// room. Disabling the native input rendering with ``appearance: none``
+// and pinning an explicit line-height makes the underscore render.
+const INPUT_CLIP_FIX: React.CSSProperties = {
+  WebkitAppearance: "none",
+  appearance: "none",
+  lineHeight: "1.5",
+};
+
 const KGAdmin = () => {
   const [confirm, confirmDialog, isConfirmDialogOpen] = useConfirm();
   const [showAlert, alertDialog] = useAlert();
@@ -1547,24 +1557,28 @@ const KGAdmin = () => {
                                   >
                                     {collapsedVertices.has(vIdx) ? "▶" : "▼"}
                                   </button>
-                                  <Input
-                                    placeholder="VertexName"
-                                    value={v.name}
-                                    onChange={(e) =>
-                                      setDraftProposal((p) =>
-                                        p
-                                          ? {
-                                              ...p,
-                                              vertices: p.vertices.map((vv, i) =>
-                                                i === vIdx ? { ...vv, name: e.target.value } : vv
-                                              ),
-                                            }
-                                          : p
-                                      )
-                                    }
-                                    disabled={isInitializing || isExtractingSchema}
-                                    className="flex-1 h-8 text-sm dark:border-[#3D3D3D] dark:bg-shadeA"
-                                  />
+                                  <div className="flex-1 flex h-7 items-center rounded-md border border-input bg-background dark:border-[#3D3D3D] dark:bg-shadeA px-3 focus-within:ring-2 focus-within:ring-ring focus-within:ring-offset-2 ring-offset-background">
+                                    <input
+                                      type="text"
+                                      placeholder="VertexName"
+                                      value={v.name}
+                                      onChange={(e) =>
+                                        setDraftProposal((p) =>
+                                          p
+                                            ? {
+                                                ...p,
+                                                vertices: p.vertices.map((vv, i) =>
+                                                  i === vIdx ? { ...vv, name: e.target.value } : vv
+                                                ),
+                                              }
+                                            : p
+                                        )
+                                      }
+                                      disabled={isInitializing || isExtractingSchema}
+                                      className="flex-1 bg-transparent outline-none border-0 p-0 text-sm text-black dark:text-white placeholder:text-muted-foreground disabled:opacity-50"
+                                      style={INPUT_CLIP_FIX}
+                                    />
+                                  </div>
                                   {collapsedVertices.has(vIdx) && (
                                     <span className="text-xs text-gray-500 dark:text-gray-400 truncate max-w-[40%]">
                                       {v.attributes.length} attr{v.attributes.length === 1 ? "" : "s"}
@@ -1589,26 +1603,30 @@ const KGAdmin = () => {
                                   </button>
                                 </div>
                                 {!collapsedVertices.has(vIdx) && (<>
-                                <Input
-                                  placeholder="Description (1 sentence)"
-                                  value={v.description}
-                                  onChange={(e) =>
-                                    setDraftProposal((p) =>
-                                      p
-                                        ? {
-                                            ...p,
-                                            vertices: p.vertices.map((vv, i) =>
-                                              i === vIdx
-                                                ? { ...vv, description: e.target.value }
-                                                : vv
-                                            ),
-                                          }
-                                        : p
-                                    )
-                                  }
-                                  disabled={isInitializing || isExtractingSchema}
-                                  className="h-8 text-sm dark:border-[#3D3D3D] dark:bg-shadeA"
-                                />
+                                <div className="flex h-7 items-center rounded-md border border-input bg-background dark:border-[#3D3D3D] dark:bg-shadeA px-3 focus-within:ring-2 focus-within:ring-ring focus-within:ring-offset-2 ring-offset-background">
+                                  <input
+                                    type="text"
+                                    placeholder="Description (1 sentence)"
+                                    value={v.description}
+                                    onChange={(e) =>
+                                      setDraftProposal((p) =>
+                                        p
+                                          ? {
+                                              ...p,
+                                              vertices: p.vertices.map((vv, i) =>
+                                                i === vIdx
+                                                  ? { ...vv, description: e.target.value }
+                                                  : vv
+                                              ),
+                                            }
+                                          : p
+                                      )
+                                    }
+                                    disabled={isInitializing || isExtractingSchema}
+                                    className="flex-1 bg-transparent outline-none border-0 p-0 text-sm text-black dark:text-white placeholder:text-muted-foreground disabled:opacity-50"
+                                    style={INPUT_CLIP_FIX}
+                                  />
+                                </div>
                                 <div className="text-xs text-gray-500 dark:text-gray-400">
                                   Attributes ({v.attributes.length}); primary key <code>id</code> auto-added
                                   {attributesCollapsed && (
@@ -1823,26 +1841,30 @@ const KGAdmin = () => {
                                   >
                                     {collapsedEdges.has(eIdx) ? "▶" : "▼"}
                                   </button>
-                                  <Input
-                                    placeholder="EDGE_NAME"
-                                    value={e.name}
-                                    onChange={(ev) =>
-                                      setDraftProposal((p) =>
-                                        p
-                                          ? {
-                                              ...p,
-                                              edges: p.edges.map((ee, i) =>
-                                                i === eIdx
-                                                  ? { ...ee, name: ev.target.value }
-                                                  : ee
-                                              ),
-                                            }
-                                          : p
-                                      )
-                                    }
-                                    disabled={isInitializing || isExtractingSchema}
-                                    className="flex-1 h-8 text-sm dark:border-[#3D3D3D] dark:bg-shadeA"
-                                  />
+                                  <div className="flex-1 flex h-7 items-center rounded-md border border-input bg-background dark:border-[#3D3D3D] dark:bg-shadeA px-3 focus-within:ring-2 focus-within:ring-ring focus-within:ring-offset-2 ring-offset-background">
+                                    <input
+                                      type="text"
+                                      placeholder="EDGE_NAME"
+                                      value={e.name}
+                                      onChange={(ev) =>
+                                        setDraftProposal((p) =>
+                                          p
+                                            ? {
+                                                ...p,
+                                                edges: p.edges.map((ee, i) =>
+                                                  i === eIdx
+                                                    ? { ...ee, name: ev.target.value }
+                                                    : ee
+                                                ),
+                                              }
+                                            : p
+                                        )
+                                      }
+                                      disabled={isInitializing || isExtractingSchema}
+                                      className="flex-1 bg-transparent outline-none border-0 p-0 text-sm text-black dark:text-white placeholder:text-muted-foreground disabled:opacity-50"
+                                      style={INPUT_CLIP_FIX}
+                                    />
+                                  </div>
                                   {collapsedEdges.has(eIdx) && (
                                     <span className="text-xs text-gray-500 dark:text-gray-400 truncate max-w-[40%]">
                                       {e.pairs.length} pair{e.pairs.length === 1 ? "" : "s"}, {e.attributes.length} attr
@@ -1868,26 +1890,30 @@ const KGAdmin = () => {
                                   </button>
                                 </div>
                                 {!collapsedEdges.has(eIdx) && (<>
-                                <Input
-                                  placeholder="Description (1 sentence)"
-                                  value={e.description}
-                                  onChange={(ev) =>
-                                    setDraftProposal((p) =>
-                                      p
-                                        ? {
-                                            ...p,
-                                            edges: p.edges.map((ee, i) =>
-                                              i === eIdx
-                                                ? { ...ee, description: ev.target.value }
-                                                : ee
-                                            ),
-                                          }
-                                        : p
-                                    )
-                                  }
-                                  disabled={isInitializing || isExtractingSchema}
-                                  className="h-8 text-sm dark:border-[#3D3D3D] dark:bg-shadeA"
-                                />
+                                <div className="flex h-7 items-center rounded-md border border-input bg-background dark:border-[#3D3D3D] dark:bg-shadeA px-3 focus-within:ring-2 focus-within:ring-ring focus-within:ring-offset-2 ring-offset-background">
+                                  <input
+                                    type="text"
+                                    placeholder="Description (1 sentence)"
+                                    value={e.description}
+                                    onChange={(ev) =>
+                                      setDraftProposal((p) =>
+                                        p
+                                          ? {
+                                              ...p,
+                                              edges: p.edges.map((ee, i) =>
+                                                i === eIdx
+                                                  ? { ...ee, description: ev.target.value }
+                                                  : ee
+                                              ),
+                                            }
+                                          : p
+                                      )
+                                    }
+                                    disabled={isInitializing || isExtractingSchema}
+                                    className="flex-1 bg-transparent outline-none border-0 p-0 text-sm text-black dark:text-white placeholder:text-muted-foreground disabled:opacity-50"
+                                    style={INPUT_CLIP_FIX}
+                                  />
+                                </div>
                                 <div className="text-xs text-gray-500 dark:text-gray-400">
                                   Endpoints (FROM → TO):
                                 </div>

From b6e64fe284700ab42cd9701dca92b9a7bc31a935 Mon Sep 17 00:00:00 2001
From: Chengbiao Jin <chengbiao.jin@tigergraph.com>
Date: Fri, 5 Jun 2026 11:43:46 -0700
Subject: [PATCH 18/18] Improve answer fidelity for multilingual numeric-heavy
 questions

- Synthesizer prompt: answer in the question's language, quote exact
  values verbatim, list candidates before stating a max / min /
  comparison conclusion
- Multimodal image-describe prompt: for time-series charts, transcribe
  every (period, value) pair instead of summarizing the trend
- README tuning guideline: document raising chunk_size to keep large
  statistical tables whole on table-heavy corpora
---
 README.md                            |  3 ++-
 common/llm_services/base_llm.py      |  3 +++
 common/utils/image_data_extractor.py | 40 +++++++++++++++-------------
 3 files changed, 27 insertions(+), 19 deletions(-)

diff --git a/README.md b/README.md
index c368979..4e85aff 100644
--- a/README.md
+++ b/README.md
@@ -923,8 +923,9 @@ A bad answer at step 4 is rarely fixed by editing the response prompt; usually i
 | Answers miss context that's clearly in the source | chunks too small or no overlap | raise `chunk_size`; bump `overlap_size` (default 1/8 of `chunk_size`); lower `threshold` (`semantic`) |
 | Tables / figures get fragmented | wrong chunker for the source | use `markdown` for markdown / docs converted to markdown; use `html` for HTML pages with structure; use `regex` with a custom `pattern` for structured logs |
 | Cross-section reasoning fails | no overlap | increase `overlap_size` to ~25% of `chunk_size` |
+| Long tables get split mid-row and the answer loses column headers | `chunk_size` (default `2048`) is smaller than the table's serialized length | raise `chunker_config.chunk_size` to fit the largest table whole — for table-heavy regulator / industry reports, **`4096`–`8192` is often the right range** |
 
-Default starting point for prose: `chunker: "semantic"`, `threshold: 0.95`, `chunker_config.method: "percentile"`. Move to `markdown` chunker with `chunk_size: 2048` and `overlap_size: 256` if your source is markdown-heavy and table integrity matters.
+Default starting point for prose: `chunker: "semantic"`, `threshold: 0.95`, `chunker_config.method: "percentile"`. Move to `markdown` chunker with `chunk_size: 2048` and `overlap_size: 256` if your source is markdown-heavy and table integrity matters. For corpora dominated by large statistical tables (regulatory reports, fiscal yearbooks, multi-year financial summaries), start with `markdown`/`html` chunker and `chunk_size: 8192` so each table stays in one chunk.
 
 ### 3. Extraction — make the graph clean before tuning retrieval
 
diff --git a/common/llm_services/base_llm.py b/common/llm_services/base_llm.py
index bf24588..e5f04dc 100644
--- a/common/llm_services/base_llm.py
+++ b/common/llm_services/base_llm.py
@@ -498,6 +498,9 @@ def chatbot_response_prompt(self):
 - **Tables**: every row, including the header, starts on a new line.
 - **Output as JSON** — escape characters as needed so the response is valid JSON. Include every field required by the format instructions; set unknown fields to empty.
 - Treat context keys as citations only when asked; otherwise do NOT include citations in the final answer.
+- **Match the question's language.** Write the entire response (titles, bullet labels, prose, numeric formatting) in the same language the user asked in. Keep proper-noun terms (BSI, DeFi, GDP, etc.) in their original script.
+- **Quote exact values from the source.** Numbers, units, time periods, and named entities must appear verbatim — do not round, approximate, or translate units. If the source says `10,678億円`, write `10,678億円`, not `about 1 trillion yen`.
+- **For comparison or "which is the highest" questions, list each candidate's value before stating the conclusion.** Show the working — do not jump directly to a one-line answer.
 
 ## Inputs
 - **Question**: {question}
diff --git a/common/utils/image_data_extractor.py b/common/utils/image_data_extractor.py
index 95b4581..6be929c 100644
--- a/common/utils/image_data_extractor.py
+++ b/common/utils/image_data_extractor.py
@@ -115,24 +115,28 @@ def describe_image_with_llm(file_path):
                             "captions, and footnotes; (2) the data and structure of "
                             "any chart, graph, or table — name the chart type, the "
                             "axes / columns, and the values or trend the chart "
-                            "actually shows; (3) the entities, relationships, or "
-                            "process steps in any diagram or flowchart; (4) any logo "
-                            "or branding mark, identified by name. Do NOT describe "
-                            "layout, background color, decorative styling, slide "
-                            "templates, or generic visual impressions — those add "
-                            "no retrieval value. Write the description in the same "
-                            "language as the text inside the image; if the image "
-                            "has no text, infer the document's language from any "
-                            "visible labels, captions, or branding and match that. "
-                            "Default to English only if no language signal is "
-                            "present. EXCEPTION: if the image is purely decorative "
-                            "(no text, no data, no diagram), reply with exactly the "
-                            "English phrase \"decorative image\" (lowercase, no "
-                            "punctuation, no translation) and nothing else — this "
-                            "is a fixed sentinel, never localized. Respond as a "
-                            "SINGLE plain-text paragraph — no markdown headings, no "
-                            "bullet lists, no blank lines. The reply is used "
-                            "verbatim as the alt-text inside `![alt](url)`."
+                            "actually shows. For time-series charts (line / bar / "
+                            "stacked bar with a time-period axis), TRANSCRIBE every "
+                            "(period, value) pair you can read in the format "
+                            "`period: value; period: value; …` — do not summarize "
+                            "the trend in place of the values; (3) the entities, "
+                            "relationships, or process steps in any diagram or "
+                            "flowchart; (4) any logo or branding mark, identified by "
+                            "name. Do NOT describe layout, background color, "
+                            "decorative styling, slide templates, or generic visual "
+                            "impressions — those add no retrieval value. Write the "
+                            "description in the same language as the text inside the "
+                            "image; if the image has no text, infer the document's "
+                            "language from any visible labels, captions, or branding "
+                            "and match that. Default to English only if no language "
+                            "signal is present. EXCEPTION: if the image is purely "
+                            "decorative (no text, no data, no diagram), reply with "
+                            "exactly the English phrase \"decorative image\" "
+                            "(lowercase, no punctuation, no translation) and nothing "
+                            "else — this is a fixed sentinel, never localized. "
+                            "Respond as a SINGLE plain-text paragraph — no markdown "
+                            "headings, no bullet lists, no blank lines. The reply is "
+                            "used verbatim as the alt-text inside `![alt](url)`."
                         ),
                     },
                     _build_image_content_block(image_base64, "image/jpeg"),