From 7c72097dacc5dbd48ab4532bb2b19ae533818b08 Mon Sep 17 00:00:00 2001
From: michael-wojcik <5386199+michael-wojcik@users.noreply.github.com>
Date: Tue, 5 May 2026 17:05:49 -0400
Subject: [PATCH 1/8] feat: add fixture-parity capture-provenance convention
 for hook stdin captures

Establishes pact-plugin/tests/fixtures/wake_lifecycle/ as the canonical
location for hook PostToolUse stdin captures, with a `_meta` sibling-key
provenance convention (capture_session_id, capture_date, capture_method,
issue_ref).

Structural defense against the failure class that produced #620: hand-
constructed fixtures diverged from the production payload shape, so tests
stayed green while production was broken. The README mandates the convention
for future hook-stdin fixtures.

Initial fixtures cite #612 (logging-shim capture from session pact-56ce3a2a
on 2026-05-02): TaskCreate production-nested shape, TaskUpdate flat shape
(fossilized for future regression backstop), and the broken pre-#620
legacy shape preserved as a regression backstop.

Refs: #612, #620
---
 .../tests/fixtures/wake_lifecycle/README.md   | 70 +++++++++++++++++++
 .../task_create_legacy_fixture_shape.json     | 18 +++++
 .../task_create_production_shape.json         | 27 +++++++
 .../task_update_production_shape.json         | 22 ++++++
 4 files changed, 137 insertions(+)
 create mode 100644 pact-plugin/tests/fixtures/wake_lifecycle/README.md
 create mode 100644 pact-plugin/tests/fixtures/wake_lifecycle/task_create_legacy_fixture_shape.json
 create mode 100644 pact-plugin/tests/fixtures/wake_lifecycle/task_create_production_shape.json
 create mode 100644 pact-plugin/tests/fixtures/wake_lifecycle/task_update_production_shape.json

diff --git a/pact-plugin/tests/fixtures/wake_lifecycle/README.md b/pact-plugin/tests/fixtures/wake_lifecycle/README.md
new file mode 100644
index 00000000..a8450bd6
--- /dev/null
+++ b/pact-plugin/tests/fixtures/wake_lifecycle/README.md
@@ -0,0 +1,70 @@
+# wake_lifecycle hook stdin fixtures
+
+Captured `PostToolUse` stdin payloads for the
+`pact-plugin/hooks/wake_lifecycle_emitter.py` hook. These fixtures fossilize
+the **production** shape of `tool_response` for `TaskCreate` and `TaskUpdate`
+so tests cannot silently drift away from what the platform actually delivers.
+
+Background: between PR #603 (regression introduction) and #620 (fix), every
+test in `test_inbox_wake_lifecycle_emitter.py` used a hand-constructed flat
+`tool_response: {"id": "..."}` payload. Production `TaskCreate` `tool_response`
+is **nested** (`tool_response.task.id`) per #612's logging-shim capture from
+session `pact-56ce3a2a` on 2026-05-02. The hook silently returned `None` on
+every TaskCreate while tests stayed green. This directory exists to make that
+class of failure structurally impossible going forward.
+
+## Capture-provenance convention (MANDATORY)
+
+Every fixture in this directory MUST be a JSON object with a sibling
+top-level `_meta` key documenting where the payload came from:
+
+```json
+{
+  "_meta": {
+    "capture_session_id": "pact-56ce3a2a",
+    "capture_date": "2026-05-02",
+    "capture_method": "logging-shim",
+    "issue_ref": "#612"
+  },
+  "tool_name": "TaskCreate",
+  "tool_input": { "...": "..." },
+  "tool_response": { "task": { "id": "...", "...": "..." } }
+}
+```
+
+`_meta` is a sibling top-level key. It is NOT nested inside `tool_input` or
+`tool_response`. Tests read it for diagnostic context and strip it before
+piping the payload through the hook, so the hook receives what the platform
+actually sends (the hook itself also ignores unknown top-level keys).
+
+### `_meta` fields
+
+| Field                 | Required | Purpose                                                                    |
+| --------------------- | -------- | -------------------------------------------------------------------------- |
+| `capture_session_id`  | Yes      | PACT session ID where the payload was captured (e.g., `pact-56ce3a2a`).    |
+| `capture_date`        | Yes      | ISO-8601 date of capture (e.g., `2026-05-02`).                             |
+| `capture_method`      | Yes      | How it was captured: `logging-shim`, `manual-stdin-redirect`, or `legacy`. |
+| `issue_ref`           | Yes      | Issue or PR that justifies preserving this fixture (e.g., `#612`).         |
+| `notes`               | No       | Free-form notes (e.g., "preserved as regression backstop").                |
+
+### `capture_method` values
+
+- `logging-shim` — payload was captured by an in-hook stdin logger writing
+  the raw stdin bytes to a side-channel file. Highest fidelity; preferred for
+  any new fixture covering platform-shape behavior.
+- `manual-stdin-redirect` — payload was captured by tee-ing the hook's
+  stdin into a file during a real PACT session. Equivalent fidelity to
+  logging-shim; noted separately for traceability.
+- `legacy` — payload predates the convention and was hand-constructed, so
+  `capture_session_id` may be `n/a` and `capture_date` approximate. Permitted
+  ONLY for backward-compat regression backstops (i.e., tests that intentionally
+  assert behavior on the broken pre-fix shape). Never use `legacy` for new shape-resilience fixtures.
+
+## Future hooks
+
+This convention applies to **all future hook-stdin fixtures**, not just
+wake_lifecycle. When adding fixtures for another hook (e.g., the
+`peer_inject` SubagentStart payload referenced by the audit-test addendum
+on PR B / #628), create a sibling subdirectory with its own README and
+mirror this convention. The provenance-capture discipline IS the structural
+defense against the failure class that #620 surfaced.
diff --git a/pact-plugin/tests/fixtures/wake_lifecycle/task_create_legacy_fixture_shape.json b/pact-plugin/tests/fixtures/wake_lifecycle/task_create_legacy_fixture_shape.json
new file mode 100644
index 00000000..200da5b6
--- /dev/null
+++ b/pact-plugin/tests/fixtures/wake_lifecycle/task_create_legacy_fixture_shape.json
@@ -0,0 +1,18 @@
+{
+  "_meta": {
+    "capture_session_id": "n/a",
+    "capture_date": "pre-2026-05-02",
+    "capture_method": "legacy",
+    "issue_ref": "#620",
+    "notes": "Legacy hand-constructed TaskCreate fixture preserved for regression backstop. This is the FLAT tool_response.id shape that test fixtures used between PR #603 and #620; it does NOT match production. Kept here so a test can assert the function still extracts a task_id from this shape (the fix is additive — flat fallback remains, nested probe is added ahead of it). DO NOT use this shape for new tests; new tests MUST use task_create_production_shape.json."
+  },
+  "tool_name": "TaskCreate",
+  "session_id": "synthetic-legacy",
+  "cwd": "/tmp/proj",
+  "tool_input": {
+    "taskId": "5"
+  },
+  "tool_response": {
+    "id": "5"
+  }
+}
diff --git a/pact-plugin/tests/fixtures/wake_lifecycle/task_create_production_shape.json b/pact-plugin/tests/fixtures/wake_lifecycle/task_create_production_shape.json
new file mode 100644
index 00000000..2ecf7ef6
--- /dev/null
+++ b/pact-plugin/tests/fixtures/wake_lifecycle/task_create_production_shape.json
@@ -0,0 +1,27 @@
+{
+  "_meta": {
+    "capture_session_id": "pact-56ce3a2a",
+    "capture_date": "2026-05-02",
+    "capture_method": "logging-shim",
+    "issue_ref": "#612",
+    "notes": "Captured TaskCreate PostToolUse stdin showing the nested tool_response.task.id production shape. This is the shape every TaskCreate has carried since PR #603, but tests prior to #620 used the legacy flat shape (see task_create_legacy_fixture_shape.json) and the divergence stayed undetected because _extract_task_id silently returned None."
+  },
+  "tool_name": "TaskCreate",
+  "session_id": "pact-56ce3a2a",
+  "cwd": "/Users/mj/Sites/collab/PACT-prompt",
+  "tool_input": {
+    "subject": "First active teammate task",
+    "description": "Initial work item dispatched to a teammate.",
+    "activeForm": "Working on first item"
+  },
+  "tool_response": {
+    "task": {
+      "id": "5",
+      "subject": "First active teammate task",
+      "status": "pending",
+      "owner": "backend-coder",
+      "blockedBy": [],
+      "blocks": []
+    }
+  }
+}
diff --git a/pact-plugin/tests/fixtures/wake_lifecycle/task_update_production_shape.json b/pact-plugin/tests/fixtures/wake_lifecycle/task_update_production_shape.json
new file mode 100644
index 00000000..29e580bd
--- /dev/null
+++ b/pact-plugin/tests/fixtures/wake_lifecycle/task_update_production_shape.json
@@ -0,0 +1,22 @@
+{
+  "_meta": {
+    "capture_session_id": "pact-56ce3a2a",
+    "capture_date": "2026-05-02",
+    "capture_method": "logging-shim",
+    "issue_ref": "#612",
+    "notes": "Captured TaskUpdate PostToolUse stdin showing the FLAT tool_response.id shape. TaskUpdate is currently flat in production (unlike TaskCreate which is nested). Fossilized here so a future platform shape change is caught by the parametrized shape-resilience test rather than silently regressing. The hook's flat-shape probe MUST keep working for this payload."
+  },
+  "tool_name": "TaskUpdate",
+  "session_id": "pact-56ce3a2a",
+  "cwd": "/Users/mj/Sites/collab/PACT-prompt",
+  "tool_input": {
+    "taskId": "5",
+    "status": "completed"
+  },
+  "tool_response": {
+    "id": "5",
+    "subject": "First active teammate task",
+    "status": "completed",
+    "owner": "backend-coder"
+  }
+}

From d151d876bfbd7ba0f4f718fc342b8f38d5a9ae94 Mon Sep 17 00:00:00 2001
From: michael-wojcik <5386199+michael-wojcik@users.noreply.github.com>
Date: Tue, 5 May 2026 17:06:04 -0400
Subject: [PATCH 2/8] fix: extend _extract_task_id to probe nested
 tool_response.task.id (#620)

Production TaskCreate `tool_response` is nested (`tool_response.task.id`)
per #612 logging-shim evidence. The prior flat-only probe returned None
on every TaskCreate, killing the auto-Arm path on the first 0->1 active-
task transition since #603 merged. Manual `/PACT:watch-inbox` continued
to work, masking the regression.

Extends `_extract_task_id` with three-block precedence: tool_input -->
tool_response.task (nested, NEW) --> tool_response (flat, fallback).
Public contract unchanged; signature widened to `dict[str, Any] | None`
to make the pre-existing None-input defense honest. Docstring enumerates
all 8 probe paths in precedence order and documents the WHY (cites
#612 + capture session pact-56ce3a2a 2026-05-02).

Tests:
  - New TestExtractTaskIdShapeResilience class with 7 named methods
    pinning behavior across input-side, nested-response, and flat-
    response paths plus failure modes (unknown shape, empty dicts,
    non-string ids, None input).
  - End-to-end regression test piping the captured production fixture
    through the full hook entry-point asserts an Arm directive is
    emitted.
  - 12 existing TaskCreate fixture stubs rewritten from flat to nested
    shape to match production going forward.

Counter-test-by-revert verified: cardinality {3} on revert (the named
#620 regression test, the end-to-end fixture test, and the
None-input-defense test that fossilizes the isinstance guard).

Refs: #620, #612, PR #603
---
 pact-plugin/hooks/wake_lifecycle_emitter.py   |  52 +++++-
 .../test_inbox_wake_lifecycle_emitter.py      | 156 ++++++++++++++++--
 2 files changed, 191 insertions(+), 17 deletions(-)

diff --git a/pact-plugin/hooks/wake_lifecycle_emitter.py b/pact-plugin/hooks/wake_lifecycle_emitter.py
index ce5dec5c..17db4f76 100644
--- a/pact-plugin/hooks/wake_lifecycle_emitter.py
+++ b/pact-plugin/hooks/wake_lifecycle_emitter.py
@@ -142,16 +142,42 @@ def _is_lead_session(input_data: dict[str, Any], team_name: str) -> bool:
     return raw_session_id == lead_session_id
 
 
-def _extract_task_id(input_data: dict[str, Any]) -> str | None:
+def _extract_task_id(input_data: dict[str, Any] | None) -> str | None:
     """
     Pull the task_id out of the PostToolUse payload.
 
     PostToolUse stdin shape carries the original tool_input under
-    "tool_input" and the tool's response under "tool_response". Both
-    TaskCreate and TaskUpdate accept/return a task with an `id` field.
-    Defensively probe both paths; return None if neither yields a
-    string id.
+    "tool_input" and the tool's response under "tool_response".
+    TaskCreate's tool_response is nested — the created task is wrapped
+    under a "task" key (`tool_response.task.id`) — while TaskUpdate's
+    tool_response is flat (`tool_response.id`). Probe in precedence
+    order, returning the first non-empty string match:
+
+      1. tool_input.taskId
+      2. tool_input.task_id
+      3. tool_response.task.id
+      4. tool_response.task.taskId
+      5. tool_response.task.task_id
+      6. tool_response.id
+      7. tool_response.taskId
+      8. tool_response.task_id
+
+    WHY the nested `tool_response.task.*` probes precede the flat
+    `tool_response.*` probes: production-typical TaskCreate payloads
+    are nested (per #612 logging-shim capture from session
+    pact-56ce3a2a on 2026-05-02). Placing nested probes first means
+    the production-common case hits the first matching probe; the
+    flat probes remain as fallback for TaskUpdate and for legacy/test
+    fixture shapes.
+
+    Returns None if no probe matches a non-empty string. Defensive
+    against `input_data is None`, non-dict sub-payloads, and
+    non-string ids — the caller (`_decide_directive`) exits cleanly
+    when this returns None.
     """
+    if not isinstance(input_data, dict):
+        return None
+
     tool_input = input_data.get("tool_input") or {}
     if isinstance(tool_input, dict):
         tid = tool_input.get("taskId") or tool_input.get("task_id")
@@ -160,7 +186,21 @@ def _extract_task_id(input_data: dict[str, Any]) -> str | None:
 
     tool_response = input_data.get("tool_response") or {}
     if isinstance(tool_response, dict):
-        tid = tool_response.get("id") or tool_response.get("taskId") or tool_response.get("task_id")
+        nested_task = tool_response.get("task") or {}
+        if isinstance(nested_task, dict):
+            tid = (
+                nested_task.get("id")
+                or nested_task.get("taskId")
+                or nested_task.get("task_id")
+            )
+            if isinstance(tid, str) and tid:
+                return tid
+
+        tid = (
+            tool_response.get("id")
+            or tool_response.get("taskId")
+            or tool_response.get("task_id")
+        )
         if isinstance(tid, str) and tid:
             return tid
 
diff --git a/pact-plugin/tests/test_inbox_wake_lifecycle_emitter.py b/pact-plugin/tests/test_inbox_wake_lifecycle_emitter.py
index 36464eb2..3f635f8f 100644
--- a/pact-plugin/tests/test_inbox_wake_lifecycle_emitter.py
+++ b/pact-plugin/tests/test_inbox_wake_lifecycle_emitter.py
@@ -132,7 +132,7 @@ def test_missing_team_name_exits_zero_with_suppress(tmp_path):
         "session_id": "abc",
         "cwd": "/tmp/x",
         "tool_input": {"taskId": "1"},
-        "tool_response": {"id": "1"},
+        "tool_response": {"task": {"id": "1"}},
     })
     rc, out, _ = _run_emitter(payload, env_extra=_pact_session_env(tmp_path, "t"))
     assert rc == 0
@@ -198,7 +198,7 @@ def test_arm_emitted_on_first_task_create(tmp_path):
         "session_id": sid,
         "cwd": pdir,
         "tool_input": {"taskId": "task-1"},
-        "tool_response": {"id": "task-1"},
+        "tool_response": {"task": {"id": "task-1"}},
     }
     out = _emit_output(payload, home)
     hso = out["hookSpecificOutput"]
@@ -213,7 +213,7 @@ def test_arm_includes_idempotency_clause(tmp_path):
     _write_task(home, team, "1", status="pending", owner="x")
     out = _emit_output({
         "tool_name": "TaskCreate", "session_id": sid, "cwd": pdir,
-        "tool_input": {"taskId": "1"}, "tool_response": {"id": "1"},
+        "tool_input": {"taskId": "1"}, "tool_response": {"task": {"id": "1"}},
     }, home)
     additional = out["hookSpecificOutput"]["additionalContext"]
     # Case-insensitive — directive prose capitalizes 'Idempotent' but
@@ -251,7 +251,7 @@ def test_arm_directive_contains_precondition_phrase(tmp_path):
     _write_task(home, team, "1", status="pending", owner="x")
     out = _emit_output({
         "tool_name": "TaskCreate", "session_id": sid, "cwd": pdir,
-        "tool_input": {"taskId": "1"}, "tool_response": {"id": "1"},
+        "tool_input": {"taskId": "1"}, "tool_response": {"task": {"id": "1"}},
     }, home)
     assert "First active teammate task created" in out["hookSpecificOutput"]["additionalContext"]
 
@@ -279,7 +279,7 @@ def test_no_op_on_second_active_task_create(tmp_path):
     _write_task(home, team, "new", status="in_progress", owner="y")
     out = _emit_output({
         "tool_name": "TaskCreate", "session_id": sid, "cwd": pdir,
-        "tool_input": {"taskId": "new"}, "tool_response": {"id": "new"},
+        "tool_input": {"taskId": "new"}, "tool_response": {"task": {"id": "new"}},
     }, home)
     assert out == {"suppressOutput": True}
 
@@ -297,7 +297,7 @@ def test_no_op_on_create_of_signal_task(tmp_path):
     )
     out = _emit_output({
         "tool_name": "TaskCreate", "session_id": sid, "cwd": pdir,
-        "tool_input": {"taskId": "sig-1"}, "tool_response": {"id": "sig-1"},
+        "tool_input": {"taskId": "sig-1"}, "tool_response": {"task": {"id": "sig-1"}},
     }, home)
     assert out == {"suppressOutput": True}
 
@@ -309,7 +309,7 @@ def test_no_op_on_create_owned_by_exempt_agent(tmp_path):
     _write_task(home, team, "sec-1", status="in_progress", owner="secretary")
     out = _emit_output({
         "tool_name": "TaskCreate", "session_id": sid, "cwd": pdir,
-        "tool_input": {"taskId": "sec-1"}, "tool_response": {"id": "sec-1"},
+        "tool_input": {"taskId": "sec-1"}, "tool_response": {"task": {"id": "sec-1"}},
     }, home)
     assert out == {"suppressOutput": True}
 
@@ -487,7 +487,7 @@ def test_no_emit_when_session_id_does_not_match_lead(tmp_path):
         "session_id": teammate_sid,
         "cwd": pdir,
         "tool_input": {"taskId": "task-x"},
-        "tool_response": {"id": "task-x"},
+        "tool_response": {"task": {"id": "task-x"}},
     }
     out = _emit_output(payload, home)
     assert out == {"suppressOutput": True}, (
@@ -514,7 +514,7 @@ def test_no_emit_when_team_config_missing(tmp_path):
     _write_task(home, team, "task-x", status="in_progress", owner="x")
     payload = {
         "tool_name": "TaskCreate", "session_id": sid, "cwd": pdir,
-        "tool_input": {"taskId": "task-x"}, "tool_response": {"id": "task-x"},
+        "tool_input": {"taskId": "task-x"}, "tool_response": {"task": {"id": "task-x"}},
     }
     out = _emit_output(payload, home)
     assert out == {"suppressOutput": True}
@@ -604,7 +604,7 @@ def test_count_active_tasks_called_on_taskcreate():
             "tool_name": "TaskCreate",
             "session_id": "sid", "cwd": "/tmp/p",
             "tool_input": {"taskId": "1"},
-            "tool_response": {"id": "1"},
+            "tool_response": {"task": {"id": "1"}},
         }, "team-x")
         assert mock_count.call_count >= 1
 
@@ -640,7 +640,7 @@ def test_oversized_stdin_payload_fails_open_with_suppress(tmp_path):
         "session_id": sid,
         "cwd": pdir,
         "tool_input": {"taskId": "task-cap", "filler": filler},
-        "tool_response": {"id": "task-cap"},
+        "tool_response": {"task": {"id": "task-cap"}},
     }
     payload_bytes = json.dumps(payload_dict).encode("utf-8")
     assert len(payload_bytes) > 1024 * 1024, (
@@ -671,3 +671,137 @@ def test_emitter_documents_payload_size_cap_constant():
     import wake_lifecycle_emitter as emitter
     assert isinstance(emitter._MAX_PAYLOAD_BYTES, int)
     assert 64 * 1024 <= emitter._MAX_PAYLOAD_BYTES <= 16 * 1024 * 1024
+
+
+# ---------- Shape-resilience for _extract_task_id (#620) ----------
+
+FIXTURES_DIR = Path(__file__).resolve().parent / "fixtures" / "wake_lifecycle"
+
+
+class TestExtractTaskIdShapeResilience:
+    """Pin _extract_task_id behavior across every shape it must handle.
+
+    Production `TaskCreate` `tool_response` is **nested**
+    (`tool_response.task.id`) per #612's logging-shim capture; production
+    `TaskUpdate` `tool_response` is **flat** (`tool_response.id`). The
+    regression in #620 was that the function only probed the flat shape,
+    so every TaskCreate returned None and the auto-Arm path was dead.
+
+    This class fossilizes the precedence + shape-resilience contract.
+    Test #1 is the counter-test-by-revert for the #620 fix: reverting
+    the nested-task probe makes it fail.
+    """
+
+    @staticmethod
+    def _extract(input_data):
+        sys.path.insert(0, str(HOOK_DIR))
+        import wake_lifecycle_emitter as emitter
+        return emitter._extract_task_id(input_data)
+
+    def test_taskcreate_production_nested_task_shape(self):
+        """The #620 regression test. Pipes the production TaskCreate
+        shape (`tool_response.task.id`) and asserts the id is extracted.
+        Counter-test-by-revert: revert the nested-task probe and this
+        fails — the function returns None, replicating the bug."""
+        result = self._extract({"tool_response": {"task": {"id": "5"}}})
+        assert result == "5"
+
+    def test_taskupdate_production_flat_shape(self):
+        """Fossilizes the working TaskUpdate shape. The flat fallback
+        must keep working alongside the new nested probe."""
+        result = self._extract({"tool_response": {"id": "5"}})
+        assert result == "5"
+
+    def test_tool_input_taskid_priority(self):
+        """When both `tool_input.taskId` and a tool_response id are
+        present, `tool_input` wins. Pins the precedence so a future
+        reorder breaks this test rather than silently inverting."""
+        result = self._extract({
+            "tool_input": {"taskId": "from-input"},
+            "tool_response": {"task": {"id": "from-response"}},
+        })
+        assert result == "from-input"
+
+    def test_unknown_shape_returns_none(self):
+        """Fail-open on unknown shape: an unrecognized `tool_response`
+        sub-key returns None, allowing the caller to suppressOutput
+        cleanly without crashing."""
+        result = self._extract(
+            {"tool_response": {"unexpected_key": {"id": "lost"}}}
+        )
+        assert result is None
+
+    @pytest.mark.parametrize(
+        "payload",
+        [
+            {"tool_input": {}, "tool_response": {}},
+            {},
+        ],
+        ids=["both-empty-dicts", "fully-empty-input"],
+    )
+    def test_empty_dicts_return_none(self, payload):
+        """No id anywhere → None. Covers both the empty-sub-dicts and
+        the fully-empty-input shapes."""
+        assert self._extract(payload) is None
+
+    @pytest.mark.parametrize(
+        "bad_id",
+        [5, None, ["x"], {"nested": "value"}, True],
+        ids=["int", "none", "list", "dict", "bool"],
+    )
+    def test_non_string_id_returns_none(self, bad_id):
+        """Only string ids are accepted. Pins the type discipline so
+        a future relaxation (e.g., `str(tid)` coercion) breaks loudly.
+
+        Probes both the nested and the flat path so a non-string id
+        in either position is rejected."""
+        # Nested path
+        assert self._extract({"tool_response": {"task": {"id": bad_id}}}) is None
+        # Flat path
+        assert self._extract({"tool_response": {"id": bad_id}}) is None
+
+    def test_none_input_data_returns_none(self):
+        """Defensive against malformed stdin: `_extract_task_id(None)`
+        returns None rather than raising. The caller relies on this
+        fail-soft behavior to keep `_decide_directive` exit-clean."""
+        assert self._extract(None) is None
+
+
+def test_arm_emitted_on_captured_production_taskcreate_payload(tmp_path):
+    """End-to-end #620 regression: pipe the captured production
+    TaskCreate stdin (from `fixtures/wake_lifecycle/task_create_production_shape.json`)
+    through the full hook entry-point and assert an Arm directive is
+    emitted. Counter-test-by-revert: revert the nested-task probe and
+    `_extract_task_id` returns None on this payload → the
+    `if not _extract_task_id(...)` guard exits → no Arm emit → this
+    test fails. The hand-crafted unit test
+    `test_taskcreate_production_nested_task_shape` covers the same
+    failure mode at the function level; this test additionally
+    exercises the full subprocess pipe so a regression in the hook's
+    main() wiring (e.g., re-introducing a flat-only probe somewhere
+    downstream) is also caught."""
+    fixture = json.loads(
+        (FIXTURES_DIR / "task_create_production_shape.json").read_text(encoding="utf-8")
+    )
+    # Strip the diagnostic _meta sibling; the hook would tolerate it,
+    # but pipe a clean payload to mirror what the platform actually
+    # sends.
+    fixture.pop("_meta", None)
+
+    home = tmp_path / "home"; home.mkdir()
+    sid = fixture["session_id"]
+    pdir = fixture["cwd"]
+    team = "team-prod"
+    _write_session_context(home, sid, pdir, team)
+    task_id = fixture["tool_response"]["task"]["id"]
+    _write_task(home, team, task_id, status="pending", owner="backend-coder")
+
+    out = _emit_output(fixture, home)
+    hso = out.get("hookSpecificOutput")
+    assert hso is not None, (
+        f"Expected Arm directive on captured production TaskCreate; "
+        f"got {out!r}. If `out == {{'suppressOutput': True}}`, the "
+        f"nested-task probe in _extract_task_id is missing — see #620."
+    )
+    assert hso["hookEventName"] == "PostToolUse"
+    assert "Skill(\"PACT:watch-inbox\")" in hso["additionalContext"]

From 76c6a9a0a271646f78575a544d5fba1609320983 Mon Sep 17 00:00:00 2001
From: michael-wojcik <5386199+michael-wojcik@users.noreply.github.com>
Date: Tue, 5 May 2026 17:06:45 -0400
Subject: [PATCH 3/8] chore: bump version 4.0.0 -> 4.0.1

Patch release for #620 watch-inbox Arm regression fix.
---
 .claude-plugin/marketplace.json        | 2 +-
 README.md                              | 2 +-
 pact-plugin/.claude-plugin/plugin.json | 2 +-
 pact-plugin/README.md                  | 2 +-
 4 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/.claude-plugin/marketplace.json b/.claude-plugin/marketplace.json
index 2fa8f6cd..04519712 100644
--- a/.claude-plugin/marketplace.json
+++ b/.claude-plugin/marketplace.json
@@ -12,7 +12,7 @@
       "name": "PACT",
       "source": "./pact-plugin",
       "description": "Orchestration harness that turns Claude Code into a coordinated team of specialist AI agents",
-      "version": "4.0.0",
+      "version": "4.0.1",
       "author": {
         "name": "Synaptic-Labs-AI"
       },
diff --git a/README.md b/README.md
index ed6897de..5670220a 100644
--- a/README.md
+++ b/README.md
@@ -504,7 +504,7 @@ When installed as a plugin, PACT lives in your plugin cache:
 │   └── cache/
 │       └── pact-plugin/
 │           └── PACT/
-│               └── 4.0.0/     # Plugin version
+│               └── 4.0.1/     # Plugin version
 │                   ├── agents/
 │                   ├── commands/
 │                   ├── skills/
diff --git a/pact-plugin/.claude-plugin/plugin.json b/pact-plugin/.claude-plugin/plugin.json
index 75e06345..5f8a7dcc 100644
--- a/pact-plugin/.claude-plugin/plugin.json
+++ b/pact-plugin/.claude-plugin/plugin.json
@@ -1,6 +1,6 @@
 {
   "name": "PACT",
-  "version": "4.0.0",
+  "version": "4.0.1",
   "description": "Orchestration harness that turns Claude Code into a coordinated team of specialist AI agents",
   "author": {
     "name": "Synaptic-Labs-AI",
diff --git a/pact-plugin/README.md b/pact-plugin/README.md
index ea96a26e..3f055a1c 100644
--- a/pact-plugin/README.md
+++ b/pact-plugin/README.md
@@ -1,6 +1,6 @@
 # PACT — Orchestration Harness for Claude Code
 
-> **Version**: 4.0.0
+> **Version**: 4.0.1
 
 Turn a single Claude Code session into a managed team of specialist AI agents that prepare, design, build, and test your code systematically.
 

From d355b828aeca5540c711c7f8e655997b54c6657e Mon Sep 17 00:00:00 2001
From: michael-wojcik <5386199+michael-wojcik@users.noreply.github.com>
Date: Tue, 5 May 2026 17:12:32 -0400
Subject: [PATCH 4/8] test: generalize plugin.json version guardrail (4.0.0 ->
 EXPECTED_VERSION constant)

The v4.0.0 release added test_plugin_json_version_is_4_0_0 as a one-shot
guardrail to verify the BREAKING bump landed. With v4.0.1 it would have
needed bumping again; instead, generalize to a module-top EXPECTED_VERSION
constant so future bumps update one location.

Also scrubs planning-artifact identifiers (C1/C9/C11) from the module
docstring per the agent-consumed-docs current-state-only convention;
the docstring now describes what the tests assert today rather than
which planning commits brought them in.

Refs: #620
---
 .../tests/test_plugin_json_orchestrator.py    | 26 +++++++++----------
 1 file changed, 13 insertions(+), 13 deletions(-)

diff --git a/pact-plugin/tests/test_plugin_json_orchestrator.py b/pact-plugin/tests/test_plugin_json_orchestrator.py
index 4113c15b..99ad072a 100644
--- a/pact-plugin/tests/test_plugin_json_orchestrator.py
+++ b/pact-plugin/tests/test_plugin_json_orchestrator.py
@@ -1,14 +1,11 @@
 """
-plugin.json registers pact-orchestrator agent (13-entry list under v4.0.0).
+plugin.json structural invariants for the PACT plugin.
 
-C1 adds `./agents/pact-orchestrator.md` to the `agents` array; C9 drops
-`./commands/bootstrap.md` and `./commands/teammate-bootstrap.md`; C11 bumps
-the version to 4.0.0. These tests assert all three are landed.
-
-Marker discipline (C2): tests against production already on disk (C1: 13-entry
-agents array including pact-orchestrator) are plain tests. Tests dependent on
-C9 (drop bootstrap commands) and C11 (version bump) carry xfail-strict and flip
-in C10 as their dependent commits land.
+Pins the current plugin version, the 13-entry alphabetized `agents` array
+(12 teammates + orchestrator), and the absence of the removed bootstrap
+commands (`bootstrap.md` and `teammate-bootstrap.md`) which are no longer
+registered now that the orchestrator persona is delivered via the
+`--agent` flag.
 """
 import json
 from pathlib import Path
@@ -20,6 +17,8 @@
     Path(__file__).parent.parent / ".claude-plugin" / "plugin.json"
 )
 
+EXPECTED_VERSION = "4.0.1"
+
 EXPECTED_AGENTS = {
     "./agents/pact-architect.md",
     "./agents/pact-auditor.md",
@@ -47,9 +46,10 @@ def plugin_json():
     return json.loads(PLUGIN_JSON_PATH.read_text())
 
 
-def test_plugin_json_version_is_4_0_0(plugin_json):
-    assert plugin_json["version"] == "4.0.0", (
-        f"plugin.json version should be 4.0.0 (BREAKING), got {plugin_json['version']}"
+def test_plugin_json_version_is_pinned_to_current_release(plugin_json):
+    assert plugin_json["version"] == EXPECTED_VERSION, (
+        f"plugin.json version should be {EXPECTED_VERSION}, got {plugin_json['version']}. "
+        "Update EXPECTED_VERSION at the top of this file when bumping the plugin version."
     )
 
 
@@ -86,7 +86,7 @@ def test_plugin_json_agents_alphabetized(plugin_json):
 
 
 def test_plugin_json_drops_bootstrap_commands(plugin_json):
-    """C9 removes bootstrap commands — replaced by --agent flag."""
+    """Bootstrap commands are not registered; orchestrator persona is delivered via --agent."""
     commands = set(plugin_json.get("commands", []))
     leaked = REMOVED_COMMANDS & commands
     assert not leaked, (

From fd2c3a20cc58e8bc3dc3d1bc3952e5e881910039 Mon Sep 17 00:00:00 2001
From: michael-wojcik <5386199+michael-wojcik@users.noreply.github.com>
Date: Tue, 5 May 2026 17:52:57 -0400
Subject: [PATCH 5/8] fix: harden _extract_task_id (drop unreachable
 None-defense + reject whitespace-only ids)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Two coupled review-driven hardenings on the extractor:

D2-a: drop the dict[str, Any] | None signature widening + isinstance
top-level guard. main() at L327 pre-filters non-dicts; the guard tested
an unreachable production branch (#538-adjacent capability-without-
consumer). Per-sub-dict isinstance guards on tool_input/tool_response
are kept — main() does NOT pre-filter sub-fields, so they catch
malformed-but-dict shapes that are reachable. The matching
test_none_input_data_returns_none case is dropped from the regression
class; counter-test-by-revert cardinality on the #620 contract goes
{3} -> {2} (named regression test + end-to-end fixture test still hold).

F5: reject whitespace-only ids at all 3 probe sites by adding `.strip()`
to the existing isinstance(tid, str) and tid check. Previously
`{tool_response: {id: '   '}}` returned `'   '` (truthy whitespace),
which would fail downstream TaskStop with semantically-empty id.
Strengthening is symmetric across input-side, nested-response, and
flat-response probes; cascading-fallthrough invariant verified
(whitespace at higher-precedence falls through to next valid probe
rather than short-circuiting to None). New
TestExtractTaskIdShapeResilience::test_whitespace_only_id_returns_none,
parametrized over 5 whitespace shapes, pins the contract.

Also adds test_all_wake_lifecycle_fixtures_carry_meta_provenance: a
top-level enforcement test that globs tests/fixtures/wake_lifecycle/
and asserts each fixture carries the README-mandated _meta provenance
(capture_session_id, capture_date, capture_method, issue_ref). Closes
the README-discipline-only gap surfaced by the test-engineer's
adversarial-coverage review of PR #638.

Refs: #620, #638
---
 pact-plugin/hooks/wake_lifecycle_emitter.py   | 23 +++---
 .../test_inbox_wake_lifecycle_emitter.py      | 70 +++++++++++++++++--
 2 files changed, 76 insertions(+), 17 deletions(-)

diff --git a/pact-plugin/hooks/wake_lifecycle_emitter.py b/pact-plugin/hooks/wake_lifecycle_emitter.py
index 17db4f76..f9126eb8 100644
--- a/pact-plugin/hooks/wake_lifecycle_emitter.py
+++ b/pact-plugin/hooks/wake_lifecycle_emitter.py
@@ -142,7 +142,7 @@ def _is_lead_session(input_data: dict[str, Any], team_name: str) -> bool:
     return raw_session_id == lead_session_id
 
 
-def _extract_task_id(input_data: dict[str, Any] | None) -> str | None:
+def _extract_task_id(input_data: dict[str, Any]) -> str | None:
     """
     Pull the task_id out of the PostToolUse payload.
 
@@ -151,7 +151,8 @@ def _extract_task_id(input_data: dict[str, Any] | None) -> str | None:
     TaskCreate's tool_response is nested — the created task is wrapped
     under a "task" key (`tool_response.task.id`) — while TaskUpdate's
     tool_response is flat (`tool_response.id`). Probe in precedence
-    order, returning the first non-empty string match:
+    order, returning the first match whose value is a string that is
+    non-empty after `.strip()`:
 
       1. tool_input.taskId
       2. tool_input.task_id
@@ -170,18 +171,16 @@ def _extract_task_id(input_data: dict[str, Any] | None) -> str | None:
     flat probes remain as fallback for TaskUpdate and for legacy/test
     fixture shapes.
 
-    Returns None if no probe matches a non-empty string. Defensive
-    against `input_data is None`, non-dict sub-payloads, and
-    non-string ids — the caller (`_decide_directive`) exits cleanly
-    when this returns None.
+    Returned values are guaranteed non-empty after strip — a
+    whitespace-only id (e.g. `"   "`) would propagate to a TaskStop
+    call with a syntactically-valid-but-semantically-empty id and
+    fail downstream; rejecting at the source is cheaper. Returns
+    None if no probe matches.
     """
-    if not isinstance(input_data, dict):
-        return None
-
     tool_input = input_data.get("tool_input") or {}
     if isinstance(tool_input, dict):
         tid = tool_input.get("taskId") or tool_input.get("task_id")
-        if isinstance(tid, str) and tid:
+        if isinstance(tid, str) and tid.strip():
             return tid
 
     tool_response = input_data.get("tool_response") or {}
@@ -193,7 +192,7 @@ def _extract_task_id(input_data: dict[str, Any] | None) -> str | None:
                 or nested_task.get("taskId")
                 or nested_task.get("task_id")
             )
-            if isinstance(tid, str) and tid:
+            if isinstance(tid, str) and tid.strip():
                 return tid
 
         tid = (
@@ -201,7 +200,7 @@ def _extract_task_id(input_data: dict[str, Any] | None) -> str | None:
             or tool_response.get("taskId")
             or tool_response.get("task_id")
         )
-        if isinstance(tid, str) and tid:
+        if isinstance(tid, str) and tid.strip():
             return tid
 
     return None
diff --git a/pact-plugin/tests/test_inbox_wake_lifecycle_emitter.py b/pact-plugin/tests/test_inbox_wake_lifecycle_emitter.py
index 3f635f8f..78d8c050 100644
--- a/pact-plugin/tests/test_inbox_wake_lifecycle_emitter.py
+++ b/pact-plugin/tests/test_inbox_wake_lifecycle_emitter.py
@@ -677,6 +677,49 @@ def test_emitter_documents_payload_size_cap_constant():
 
 FIXTURES_DIR = Path(__file__).resolve().parent / "fixtures" / "wake_lifecycle"
 
+_REQUIRED_META_FIELDS = {
+    "capture_session_id",
+    "capture_date",
+    "capture_method",
+    "issue_ref",
+}
+
+
+def test_all_wake_lifecycle_fixtures_carry_meta_provenance():
+    """Convention enforcement for `tests/fixtures/wake_lifecycle/`: every
+    JSON fixture MUST have a top-level `_meta` dict carrying the four
+    required provenance fields. The README in that directory documents
+    the convention; this test enforces it so a future contributor cannot
+    silently add an un-provenanced fixture and weaken the structural
+    defense against the #612-class shape-divergence regression.
+
+    To extend this enforcement to a sibling fixture subdirectory (e.g.,
+    a future `tests/fixtures/peer_inject/`), add a new test function
+    that points at the new dir, or refactor this function to parametrize
+    over a list of provenance-required fixture roots.
+    """
+    fixture_paths = sorted(FIXTURES_DIR.glob("*.json"))
+    assert fixture_paths, (
+        f"No JSON fixtures found in {FIXTURES_DIR}; convention is moot "
+        f"if the directory is empty — verify the test is pointed at the "
+        f"right path."
+    )
+    for fixture_path in fixture_paths:
+        data = json.loads(fixture_path.read_text(encoding="utf-8"))
+        assert "_meta" in data, (
+            f"{fixture_path.name}: missing top-level `_meta` sibling key. "
+            f"See {FIXTURES_DIR.name}/README.md for the convention."
+        )
+        meta = data["_meta"]
+        assert isinstance(meta, dict), (
+            f"{fixture_path.name}: `_meta` must be a dict, got {type(meta).__name__}"
+        )
+        missing = _REQUIRED_META_FIELDS - set(meta.keys())
+        assert not missing, (
+            f"{fixture_path.name}: `_meta` missing required fields: {missing}. "
+            f"Required: {_REQUIRED_META_FIELDS}."
+        )
+
 
 class TestExtractTaskIdShapeResilience:
     """Pin _extract_task_id behavior across every shape it must handle.
@@ -760,11 +803,28 @@ def test_non_string_id_returns_none(self, bad_id):
         # Flat path
         assert self._extract({"tool_response": {"id": bad_id}}) is None
 
-    def test_none_input_data_returns_none(self):
-        """Defensive against malformed stdin: `_extract_task_id(None)`
-        returns None rather than raising. The caller relies on this
-        fail-soft behavior to keep `_decide_directive` exit-clean."""
-        assert self._extract(None) is None
+    @pytest.mark.parametrize(
+        "whitespace_id",
+        ["   ", "\t", "\n", " \t\n ", " "],
+        ids=["spaces", "tab", "newline", "mixed-whitespace", "nbsp"],
+    )
+    def test_whitespace_only_id_returns_none(self, whitespace_id):
+        """Adversarial: a whitespace-only id is a string and truthy
+        (passes `isinstance(tid, str) and tid`), but downstream
+        `count_active_tasks` would silently fail to find a task by
+        whitespace id — masking the real failure mode. The hook's
+        `.strip()` handling rejects whitespace-only ids upfront so the
+        function returns None and `_decide_directive` exits cleanly.
+
+        Counter-test-by-revert: removing the `.strip()` handling makes
+        this test fail (the function returns the whitespace string).
+        Probes both the nested and the flat path so the discipline
+        applies symmetrically.
+        """
+        # Nested path
+        assert self._extract({"tool_response": {"task": {"id": whitespace_id}}}) is None
+        # Flat path
+        assert self._extract({"tool_response": {"id": whitespace_id}}) is None
 
 
 def test_arm_emitted_on_captured_production_taskcreate_payload(tmp_path):

From 950459447b782f5ef6919b01c326ff3907816826 Mon Sep 17 00:00:00 2001
From: michael-wojcik <5386199+michael-wojcik@users.noreply.github.com>
Date: Tue, 5 May 2026 17:53:10 -0400
Subject: [PATCH 6/8] test: align version pinning with sibling pattern +
 tighten README assertions
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Two version-pinning test refinements driven by PR #638 architect +
test-engineer reviews:

D4-a: replace the EXPECTED_VERSION = "4.0.1" literal in
test_plugin_json_orchestrator.py with json.loads(plugin.json)["version"]
dynamic-source pattern matching sibling test_plugin_version_bump.py:23.
Also drops the now-misleading "Update EXPECTED_VERSION when bumping"
comment — with dynamic-source, plugin.json itself is the source of
truth and there is nothing to update at this site. The structural-
existence-check role is documented in the test docstring; cross-file
drift detection is owned by sibling test_plugin_version_bump.py.

option-b: tighten test_root_readme_version + test_pact_plugin_readme_version
in test_plugin_version_bump.py with a word-bounded regex instead of plain
substring search. _TARGET_VERSION_PATTERN compiles
`(?<![\d.])` + re.escape(TARGET_VERSION) + `(?![\d.])` once at module
load. Closes the substring-match edge case where '4.0.1' would falsely
match '4.0.10' in a README. test_marketplace_json_version is left
untouched (set-membership comparison is already exact).

Refs: #638
---
 .../tests/test_plugin_json_orchestrator.py      | 15 ++++++++++-----
 pact-plugin/tests/test_plugin_version_bump.py   | 17 +++++++++++++----
 2 files changed, 23 insertions(+), 9 deletions(-)

diff --git a/pact-plugin/tests/test_plugin_json_orchestrator.py b/pact-plugin/tests/test_plugin_json_orchestrator.py
index 99ad072a..0c512e5a 100644
--- a/pact-plugin/tests/test_plugin_json_orchestrator.py
+++ b/pact-plugin/tests/test_plugin_json_orchestrator.py
@@ -17,7 +17,7 @@
     Path(__file__).parent.parent / ".claude-plugin" / "plugin.json"
 )
 
-EXPECTED_VERSION = "4.0.1"
+EXPECTED_VERSION = json.loads(PLUGIN_JSON_PATH.read_text(encoding="utf-8"))["version"]
 
 EXPECTED_AGENTS = {
     "./agents/pact-architect.md",
@@ -47,10 +47,15 @@ def plugin_json():
 
 
 def test_plugin_json_version_is_pinned_to_current_release(plugin_json):
-    assert plugin_json["version"] == EXPECTED_VERSION, (
-        f"plugin.json version should be {EXPECTED_VERSION}, got {plugin_json['version']}. "
-        "Update EXPECTED_VERSION at the top of this file when bumping the plugin version."
-    )
+    """Structural existence-check that plugin.json carries a version string.
+
+    EXPECTED_VERSION is sourced dynamically from plugin.json at module
+    load, so this assertion is structurally tautological and serves as a
+    schema-level guard ("the `version` key exists and equals itself").
+    Cross-file version drift across plugin.json/marketplace.json/READMEs
+    is caught by sibling test_plugin_version_bump.py.
+    """
+    assert plugin_json["version"] == EXPECTED_VERSION
 
 
 def test_plugin_json_has_13_agents(plugin_json):
diff --git a/pact-plugin/tests/test_plugin_version_bump.py b/pact-plugin/tests/test_plugin_version_bump.py
index ed67d1ad..d7ac2ce7 100644
--- a/pact-plugin/tests/test_plugin_version_bump.py
+++ b/pact-plugin/tests/test_plugin_version_bump.py
@@ -12,6 +12,7 @@
 """
 
 import json
+import re
 from pathlib import Path
 
 import pytest
@@ -23,6 +24,12 @@
 TARGET_VERSION = json.loads(PLUGIN_JSON_PATH.read_text(encoding="utf-8"))[
     "version"
 ]
+# Word-boundary pattern so e.g. "4.0.1" does NOT match "4.0.10" as a
+# substring. The negative-lookbehind/lookahead exclude digits and dots
+# on either side, so the version must appear as a self-contained token.
+_TARGET_VERSION_PATTERN = re.compile(
+    r"(?<![\d.])" + re.escape(TARGET_VERSION) + r"(?![\d.])"
+)
 
 
 # ---------- 4-file version invariants ----------
@@ -48,16 +55,18 @@ def test_marketplace_json_version():
 def test_root_readme_version():
     p = REPO_ROOT / "README.md"
     text = p.read_text(encoding="utf-8")
-    assert TARGET_VERSION in text, (
-        f"root README.md missing target version literal {TARGET_VERSION}"
+    assert _TARGET_VERSION_PATTERN.search(text), (
+        f"root README.md missing target version literal {TARGET_VERSION} "
+        f"as a word-bounded token (not a digit/dot-adjacent substring)"
     )
 
 
 def test_pact_plugin_readme_version():
     p = REPO_ROOT / "pact-plugin" / "README.md"
     text = p.read_text(encoding="utf-8")
-    assert TARGET_VERSION in text, (
-        f"pact-plugin/README.md missing version literal {TARGET_VERSION}"
+    assert _TARGET_VERSION_PATTERN.search(text), (
+        f"pact-plugin/README.md missing version literal {TARGET_VERSION} "
+        f"as a word-bounded token (not a digit/dot-adjacent substring)"
     )
 
 

From f2c8b3087421eb5b5fed2893bafe0b03af666c6a Mon Sep 17 00:00:00 2001
From: michael-wojcik <5386199+michael-wojcik@users.noreply.github.com>
Date: Tue, 5 May 2026 18:06:13 -0400
Subject: [PATCH 7/8] test: clean up pre-existing Pyright unused-var warnings
 (5 sites)

Latent unused-import + 4 unused-vars in test_inbox_wake_lifecycle_emitter.py
and test_plugin_version_bump.py, surfaced by Pyright re-analysis after
PR #638's edits to those files. Pre-existing in main; not introduced
by review remediation. Bundled here for cleanliness.

  test_plugin_version_bump.py:
    L18  drop unused `import pytest` (no @pytest.fixture / @pytest.mark
         / pytest.raises in this file)

  test_inbox_wake_lifecycle_emitter.py:
    L46  drop unused `team_name` param from `_pact_session_env`; 3 callers
         updated (L117/L123/L137). Internal helper, all callers pass the
         literal "t", body never references it.
    L436 drop unused `tmp_path` fixture from
         `test_is_terminal_status_update_matches_completed_and_deleted`
         signature; the test is in-memory predicate-only.
    L582 drop `result =` LHS in
         `test_count_active_tasks_called_on_terminal_status_taskupdate`;
         assertion is on `mock_count.call_count`, the call is for side
         effects.
    L603 same pattern in `test_count_active_tasks_called_on_taskcreate`.

L543 sibling occurrence is deferred to #640 (suite-wide unused-var/
import scrub).

Refs: #638
---
 .../tests/test_inbox_wake_lifecycle_emitter.py     | 14 +++++++-------
 pact-plugin/tests/test_plugin_version_bump.py      |  2 --
 2 files changed, 7 insertions(+), 9 deletions(-)

diff --git a/pact-plugin/tests/test_inbox_wake_lifecycle_emitter.py b/pact-plugin/tests/test_inbox_wake_lifecycle_emitter.py
index 78d8c050..f63d6a63 100644
--- a/pact-plugin/tests/test_inbox_wake_lifecycle_emitter.py
+++ b/pact-plugin/tests/test_inbox_wake_lifecycle_emitter.py
@@ -43,7 +43,7 @@ def _run_emitter(stdin_payload: str | bytes, env_extra: dict | None = None) -> t
     return proc.returncode, proc.stdout.decode("utf-8"), proc.stderr.decode("utf-8")
 
 
-def _pact_session_env(tmp_path: Path, team_name: str) -> dict:
+def _pact_session_env(tmp_path: Path) -> dict:
     """
     Build env vars + on-disk pact-session-context so the emitter's
     pact_context.init() resolves the team_name from the synthesized
@@ -114,13 +114,13 @@ def test_hooks_json_registers_emitter_under_post_tool_use():
 # ---------- Fail-open paths ----------
 
 def test_malformed_stdin_exits_zero_with_suppress(tmp_path):
-    rc, out, _ = _run_emitter(b"\x00not-json\xff", env_extra=_pact_session_env(tmp_path, "t"))
+    rc, out, _ = _run_emitter(b"\x00not-json\xff", env_extra=_pact_session_env(tmp_path))
     assert rc == 0
     assert json.loads(out) == {"suppressOutput": True}
 
 
 def test_non_dict_stdin_exits_zero_with_suppress(tmp_path):
-    rc, out, _ = _run_emitter("[]", env_extra=_pact_session_env(tmp_path, "t"))
+    rc, out, _ = _run_emitter("[]", env_extra=_pact_session_env(tmp_path))
     assert rc == 0
     assert json.loads(out) == {"suppressOutput": True}
 
@@ -134,7 +134,7 @@ def test_missing_team_name_exits_zero_with_suppress(tmp_path):
         "tool_input": {"taskId": "1"},
         "tool_response": {"task": {"id": "1"}},
     })
-    rc, out, _ = _run_emitter(payload, env_extra=_pact_session_env(tmp_path, "t"))
+    rc, out, _ = _run_emitter(payload, env_extra=_pact_session_env(tmp_path))
     assert rc == 0
     assert json.loads(out) == {"suppressOutput": True}
 
@@ -433,7 +433,7 @@ def test_teardown_emitted_on_status_deleted_at_post_zero(tmp_path):
     assert "Skill(\"PACT:unwatch-inbox\")" in hso["additionalContext"]
 
 
-def test_is_terminal_status_update_matches_completed_and_deleted(tmp_path):
+def test_is_terminal_status_update_matches_completed_and_deleted():
     """Direct unit test on the terminal-status predicate. The behavioral
     contract is "task transitioned to a terminal status" — both
     `completed` and `deleted` are terminal."""
@@ -579,7 +579,7 @@ def test_count_active_tasks_called_on_terminal_status_taskupdate():
     from unittest.mock import patch
     with patch.object(emitter, "_is_lead_session", return_value=True), \
          patch.object(emitter, "count_active_tasks", return_value=0) as mock_count:
-        result = emitter._decide_directive({
+        emitter._decide_directive({
             "tool_name": "TaskUpdate",
             "session_id": "sid", "cwd": "/tmp/p",
             "tool_input": {"taskId": "1", "status": "completed"},
@@ -600,7 +600,7 @@ def test_count_active_tasks_called_on_taskcreate():
     with patch.object(emitter, "_is_lead_session", return_value=True), \
          patch.object(emitter, "_extract_task_id", return_value="1"), \
          patch.object(emitter, "count_active_tasks", return_value=1) as mock_count:
-        result = emitter._decide_directive({
+        emitter._decide_directive({
             "tool_name": "TaskCreate",
             "session_id": "sid", "cwd": "/tmp/p",
             "tool_input": {"taskId": "1"},
diff --git a/pact-plugin/tests/test_plugin_version_bump.py b/pact-plugin/tests/test_plugin_version_bump.py
index d7ac2ce7..4238c4e4 100644
--- a/pact-plugin/tests/test_plugin_version_bump.py
+++ b/pact-plugin/tests/test_plugin_version_bump.py
@@ -15,8 +15,6 @@
 import re
 from pathlib import Path
 
-import pytest
-
 REPO_ROOT = Path(__file__).resolve().parent.parent.parent
 PLUGIN_JSON_PATH = (
     REPO_ROOT / "pact-plugin" / ".claude-plugin" / "plugin.json"

From 4e9178d084e5e79e626ca9f4af64d3ddeec654ab Mon Sep 17 00:00:00 2001
From: michael-wojcik <5386199+michael-wojcik@users.noreply.github.com>
Date: Tue, 5 May 2026 18:19:25 -0400
Subject: [PATCH 8/8] test: drop tautological plugin.json version test
 (post-D4-a)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

After D4-a (Commit 95045944) made EXPECTED_VERSION dynamic-source
(`json.loads(plugin.json)["version"]`), the
`test_plugin_json_version_is_pinned_to_current_release` test in
test_plugin_json_orchestrator.py asserts plugin.json's version
equals plugin.json's version — structurally tautological, catches
nothing. Cross-file drift detection is owned by
test_plugin_version_bump.py (which checks plugin.json against
marketplace.json + both READMEs).

Drop the no-op test rather than carry it. Drops:
  - test_plugin_json_version_is_pinned_to_current_release
  - EXPECTED_VERSION module-level computation (orphan after the
    test goes)

Keeps:
  - plugin_json fixture (5 sibling tests consume it)
  - import json + PLUGIN_JSON_PATH (fixture needs both)
  - all 5 surviving tests (13-entry agents array invariants +
    bootstrap-commands-absent invariant)

Module docstring rewritten to lead with the surviving 13-entry
agents array claim + bootstrap-commands-absent invariant + cross-ref
to test_plugin_version_bump.py for version-pinning ownership.

Refs: #638
---
 .../tests/test_plugin_json_orchestrator.py    | 24 ++++---------------
 1 file changed, 5 insertions(+), 19 deletions(-)

diff --git a/pact-plugin/tests/test_plugin_json_orchestrator.py b/pact-plugin/tests/test_plugin_json_orchestrator.py
index 0c512e5a..2320379d 100644
--- a/pact-plugin/tests/test_plugin_json_orchestrator.py
+++ b/pact-plugin/tests/test_plugin_json_orchestrator.py
@@ -1,11 +1,11 @@
 """
 plugin.json structural invariants for the PACT plugin.
 
-Pins the pinned plugin version, the 13-entry alphabetized `agents` array
-(12 teammates + orchestrator), and the absence of the removed bootstrap
-commands (`bootstrap.md` and `teammate-bootstrap.md`) which are no longer
-registered now that the orchestrator persona is delivered via the
-`--agent` flag.
+Pins the 13-entry alphabetized `agents` array (12 teammates + orchestrator)
+and the absence of the removed bootstrap commands (`bootstrap.md` and
+`teammate-bootstrap.md`) which are no longer registered now that the
+orchestrator persona is delivered via the `--agent` flag. Cross-file
+version-consistency is owned by sibling test_plugin_version_bump.py.
 """
 import json
 from pathlib import Path
@@ -17,8 +17,6 @@
     Path(__file__).parent.parent / ".claude-plugin" / "plugin.json"
 )
 
-EXPECTED_VERSION = json.loads(PLUGIN_JSON_PATH.read_text(encoding="utf-8"))["version"]
-
 EXPECTED_AGENTS = {
     "./agents/pact-architect.md",
     "./agents/pact-auditor.md",
@@ -46,18 +44,6 @@ def plugin_json():
     return json.loads(PLUGIN_JSON_PATH.read_text())
 
 
-def test_plugin_json_version_is_pinned_to_current_release(plugin_json):
-    """Structural existence-check that plugin.json carries a version string.
-
-    EXPECTED_VERSION is sourced dynamically from plugin.json at module
-    load, so this assertion is structurally tautological and serves as a
-    schema-level guard ("the `version` key exists and equals itself").
-    Cross-file version drift across plugin.json/marketplace.json/READMEs
-    is caught by sibling test_plugin_version_bump.py.
-    """
-    assert plugin_json["version"] == EXPECTED_VERSION
-
-
 def test_plugin_json_has_13_agents(plugin_json):
     agents = plugin_json.get("agents", [])
     assert len(agents) == 13, (