TechNickAI · TechNickAI · May 4, 2026 · May 4, 2026 · May 4, 2026
diff --git a/.claude-plugin/marketplace.json b/.claude-plugin/marketplace.json
@@ -6,7 +6,7 @@
   },
   "metadata": {
     "description": "Professional AI coding configurations, agents, skills, and context for Claude Code and Cursor",
-    "version": "9.20.0",
+    "version": "9.21.0",
     "license": "MIT",
     "repository": "https://github.com/TechNickAI/ai-coding-config"
   },
@@ -15,7 +15,7 @@
       "name": "ai-coding-config",
       "source": "./plugins/core",
       "description": "Commands, agents, skills, and context for AI-assisted development workflows",
-      "version": "9.20.0",
+      "version": "9.21.0",
       "tags": ["commands", "agents", "skills", "workflows", "essential"]
     }
   ]

diff --git a/plugins/core/.claude-plugin/plugin.json b/plugins/core/.claude-plugin/plugin.json
@@ -1,6 +1,6 @@
 {
   "name": "ai-coding-config",
-  "version": "9.20.0",
+  "version": "9.21.0",
   "description": "Commands, agents, skills, and context for AI-assisted development workflows",
   "author": {
     "name": "TechNickAI",

diff --git a/plugins/core/hooks/README.md b/plugins/core/hooks/README.md
@@ -0,0 +1,85 @@
+# Hooks
+
+Lifecycle hooks that fire during Claude Code sessions. Each hook is a small bash
+script registered in `hooks.json` against a Claude Code event.
+
+## Conventions
+
+- Bash scripts (`.sh`), executable, with a `#!/bin/bash` shebang.
+- Read JSON payload from stdin via `cat`, parse fields with `jq -r '.field // empty'`.
+- Write any guidance for the model to stdout — Claude Code surfaces stdout as
+  context. Scripts that have nothing to say print nothing.
+- Always `exit 0` unless the hook contract specifically supports blocking. A
+  failing hook that returns non-zero can disrupt the harness.
+- Defensive parsing: handle missing fields, empty input, malformed JSON gracefully.
+  Fail open.
+- Match registration in `hooks.json`. Use `${CLAUDE_PLUGIN_ROOT}/hooks/<file>` for
+  the command path.
+
+## Installed Hooks
+
+### `session-multiplexing.sh` — `SessionStart`
+
+Counts recently-touched session marker files. When 3+ Claude Code sessions are
+active, prints a reminder that the user is juggling windows so the assistant
+includes explicit context (repo, branch, current task) in every status update.
+
+### `todo-persist.sh` — `PostToolUse` (TodoWrite)
+
+Mirrors the model's todo list to a human-readable `todos.md` in the project
+directory each time `TodoWrite` runs. Survives compaction and lets the user see
+in-flight work without the harness UI.
+
+### `verify-deliverables.sh` — `SubagentStop`
+
+Cross-references a subagent's recent activity against its completion claims.
+Surfaces a structured advisory back to the parent agent when the tool-call record
+or filesystem disagrees with what the subagent said it did. Always advisory,
+never blocking.
+
+**What it checks:**
+
+- **Completion claim with zero mutations.** If the subagent's final message
+  contains strong completion language ("done.", "implemented X", "all tests pass",
+  ✅) and a file-path-shaped token, but the recent transcript has zero
+  `Write`/`Edit`/`MultiEdit`/`NotebookEdit` calls — flagged as a likely lie.
+- **Tool call recorded but artifact missing.** For each path the subagent's
+  tool calls claim to have written, verifies the file exists on disk now. A
+  missing file means the tool failed silently, was deleted, or the call was
+  fabricated.
+
+**What it doesn't do:**
+
+- Doesn't verify *correctness* — only existence. Use `verify-fix` for behavioral
+  validation.
+- Doesn't block the subagent from stopping. Output is added to
+  `hookSpecificOutput.additionalContext` so the parent agent sees the
+  discrepancy and decides what to do.
+- Doesn't parse natural-language claims aggressively. Patterns are conservative
+  to keep false-positive rate low; we'd rather miss a few lies than nag on
+  honest analytical responses.
+
+**Escape hatches:**
+
+- Set `VERIFY_DELIVERABLES_DISABLED=1` in the environment to bypass entirely.
+- The hook respects `stop_hook_active=true` and exits silently when the harness
+  signals it has already fired once this stop cycle, so it cannot loop.
+- Any internal error or unreadable transcript causes a silent pass — a broken
+  hook never breaks the harness.
+
+**Why this exists:**
+
+The `<epistemic-honesty>` block in `CLAUDE.md`, the `verify-fix` skill, and the
+`verification-before-completion` superpower all try to prevent subagents from
+claiming work they haven't done. Prompts are advisory; this hook is structural.
+See [issue #51](https://github.com/TechNickAI/ai-coding-config/issues/51) for
+the design discussion.
+
+## Running Tests
+
+```bash
+bash plugins/core/hooks/tests/test-verify-deliverables.sh
+```
+
+Test fixtures generate synthetic transcript JSONL and pipe synthetic stdin
+payloads to the hook. No live Claude Code session required.
diff --git a/plugins/core/hooks/hooks.json b/plugins/core/hooks/hooks.json
@@ -21,6 +21,17 @@
           }
         ]
       }
+    ],
+    "SubagentStop": [
+      {
+        "matcher": "*",
+        "hooks": [
+          {
+            "type": "command",
+            "command": "${CLAUDE_PLUGIN_ROOT}/hooks/verify-deliverables.sh"
+          }
+        ]
+      }
     ]
   }
 }
diff --git a/plugins/core/hooks/tests/test-verify-deliverables.sh b/plugins/core/hooks/tests/test-verify-deliverables.sh
@@ -0,0 +1,223 @@
+#!/bin/bash
+# Test harness for verify-deliverables.sh
+#
+# Generates synthetic SubagentStop payloads and transcript JSONL fixtures,
+# pipes them to the hook, and asserts on its stdout. Doesn't require a
+# live Claude Code session.
+#
+# Run from any cwd:
+#   bash plugins/core/hooks/tests/test-verify-deliverables.sh
+
+set -u
+
+HOOK="$(cd "$(dirname "$0")/.." && pwd)/verify-deliverables.sh"
+if [ ! -x "$HOOK" ]; then
+    echo "ERROR: hook not executable at $HOOK"
+    exit 2
+fi
+
+TEST_DIR=$(mktemp -d)
+trap 'rm -rf "$TEST_DIR"' EXIT
+
+PASS=0
+FAIL=0
+
+# --- Helpers ---
+
+# Run a case. $expect is one of:
+#   silent   — assert empty stdout
+#   advisory — assert stdout contains "additionalContext"
+#   <substring> — assert stdout contains the literal substring
+run_case() {
+    local name="$1"
+    local payload="$2"
+    local expect="$3"
+    local output
+    output=$(printf '%s' "$payload" | bash "$HOOK" 2>&1)
+
+    case "$expect" in
+        silent)
+            if [ -z "$output" ]; then
+                echo "PASS: $name"
+                PASS=$((PASS + 1))
+            else
+                echo "FAIL: $name"
+                echo "    expected: silent"
+                echo "    got:      $output"
+                FAIL=$((FAIL + 1))
+            fi
+            ;;
+        advisory)
+            if echo "$output" | grep -q 'additionalContext'; then
+                echo "PASS: $name"
+                PASS=$((PASS + 1))
+            else
+                echo "FAIL: $name"
+                echo "    expected: advisory output"
+                echo "    got:      $output"
+                FAIL=$((FAIL + 1))
+            fi
+            ;;
+        *)
+            if echo "$output" | grep -qF "$expect"; then
+                echo "PASS: $name"
+                PASS=$((PASS + 1))
+            else
+                echo "FAIL: $name"
+                echo "    expected substring: $expect"
+                echo "    got:                $output"
+                FAIL=$((FAIL + 1))
+            fi
+            ;;
+    esac
+}
+
+write_transcript() {
+    local file="$TEST_DIR/$1.jsonl"
+    shift
+    : > "$file"
+    for line in "$@"; do
+        printf '%s\n' "$line" >> "$file"
+    done
+    printf '%s' "$file"
+}
+
+make_payload() {
+    local transcript="$1"
+    local stop_hook_active="${2:-false}"
+    cat <<EOF
+{"transcript_path":"$transcript","agent_transcript_path":"$transcript","stop_hook_active":$stop_hook_active,"cwd":"$TEST_DIR","hook_event_name":"SubagentStop","session_id":"test-session"}
+EOF
+}
+
+# --- Fixtures ---
+
+# An honest write: tool call to foo.ts AND foo.ts exists on disk.
+echo "content" > "$TEST_DIR/foo.ts"
+TX_HONEST=$(write_transcript "honest" \
+    "{\"type\":\"assistant\",\"message\":{\"content\":[{\"type\":\"tool_use\",\"name\":\"Write\",\"input\":{\"file_path\":\"$TEST_DIR/foo.ts\",\"content\":\"content\"}}]}}" \
+    '{"type":"assistant","message":{"content":[{"type":"text","text":"Done. Created `foo.ts` as requested."}]}}'
+)
+
+# A liar: completion claim, zero mutating tool calls (only Read).
+TX_LIAR_NO_ACTION=$(write_transcript "liar-no-action" \
+    '{"type":"assistant","message":{"content":[{"type":"tool_use","name":"Read","input":{"file_path":"src/whatever.ts"}}]}}' \
+    '{"type":"assistant","message":{"content":[{"type":"text","text":"Done. Implemented the change in src/whatever.ts."}]}}'
+)
+
+# A ghost: tool call recorded but file is not on disk.
+TX_GHOST=$(write_transcript "ghost" \
+    "{\"type\":\"assistant\",\"message\":{\"content\":[{\"type\":\"tool_use\",\"name\":\"Write\",\"input\":{\"file_path\":\"$TEST_DIR/ghost.md\",\"content\":\"x\"}}]}}" \
+    '{"type":"assistant","message":{"content":[{"type":"text","text":"All set."}]}}'
+)
+
+# Pure analyst: no completion claim, no mutations.
+TX_ANALYST=$(write_transcript "analyst" \
+    '{"type":"assistant","message":{"content":[{"type":"text","text":"I read the code and found 3 patterns worth examining further."}]}}'
+)
+
+# Trivial chatter: completion-ish word but no file path tokens.
+TX_TRIVIAL=$(write_transcript "trivial" \
+    '{"type":"assistant","message":{"content":[{"type":"text","text":"All done with the analysis."}]}}'
+)
+
+# Edit (not Write) to existing file. Should pass — Edit counts as mutating.
+echo "before" > "$TEST_DIR/edited.ts"
+TX_EDIT=$(write_transcript "edit-honest" \
+    "{\"type\":\"assistant\",\"message\":{\"content\":[{\"type\":\"tool_use\",\"name\":\"Edit\",\"input\":{\"file_path\":\"$TEST_DIR/edited.ts\",\"old_string\":\"before\",\"new_string\":\"after\"}}]}}" \
+    '{"type":"assistant","message":{"content":[{"type":"text","text":"Done. Updated `edited.ts`."}]}}'
+)
+
+# tool_input shape (alternative payload format) for Write.
+echo "alt-content" > "$TEST_DIR/alt.ts"
+TX_ALT_SHAPE=$(write_transcript "alt-shape" \
+    "{\"type\":\"assistant\",\"message\":{\"content\":[{\"type\":\"tool_use\",\"name\":\"Write\",\"tool_input\":{\"file_path\":\"$TEST_DIR/alt.ts\"}}]}}" \
+    '{"type":"assistant","message":{"content":[{"type":"text","text":"Done. Wrote alt.ts."}]}}'
+)
+
+# MultiEdit should count as mutating.
+echo "before" > "$TEST_DIR/multi.ts"
+TX_MULTIEDIT=$(write_transcript "multi-edit" \
+    "{\"type\":\"assistant\",\"message\":{\"content\":[{\"type\":\"tool_use\",\"name\":\"MultiEdit\",\"input\":{\"file_path\":\"$TEST_DIR/multi.ts\",\"edits\":[]}}]}}" \
+    '{"type":"assistant","message":{"content":[{"type":"text","text":"Done. Updated multi.ts in several places."}]}}'
+)
+
+# NotebookEdit should count as mutating.
+echo "before" > "$TEST_DIR/nb.ipynb"
+TX_NOTEBOOK=$(write_transcript "notebook-edit" \
+    "{\"type\":\"assistant\",\"message\":{\"content\":[{\"type\":\"tool_use\",\"name\":\"NotebookEdit\",\"input\":{\"file_path\":\"$TEST_DIR/nb.ipynb\",\"cell_number\":0,\"new_source\":\"x\"}}]}}" \
+    '{"type":"assistant","message":{"content":[{"type":"text","text":"Done. Updated the notebook."}]}}'
+)
+
+# Negation: "not all tests pass" should not flag.
+TX_NEGATION=$(write_transcript "negated" \
+    '{"type":"assistant","message":{"content":[{"type":"tool_use","name":"Read","input":{"file_path":"src/foo.ts"}}]}}' \
+    '{"type":"assistant","message":{"content":[{"type":"text","text":"Investigated src/foo.ts — not all tests pass yet."}]}}'
+)
+
+# Trailing boundary: "fixed itself" should not match "fixed it".
+TX_FIXED_ITSELF=$(write_transcript "fixed-itself" \
+    '{"type":"assistant","message":{"content":[{"type":"tool_use","name":"Read","input":{"file_path":"src/x.ts"}}]}}' \
+    '{"type":"assistant","message":{"content":[{"type":"text","text":"After reading src/x.ts the issue fixed itself when I retried."}]}}'
+)
+
+# Broken symlink: tool created the symlink, target is gone. -L catches it.
+ln -s "/nonexistent/target" "$TEST_DIR/broken-link"
+TX_BROKEN_SYMLINK=$(write_transcript "broken-symlink" \
+    "{\"type\":\"assistant\",\"message\":{\"content\":[{\"type\":\"tool_use\",\"name\":\"Write\",\"input\":{\"file_path\":\"$TEST_DIR/broken-link\"}}]}}" \
+    '{"type":"assistant","message":{"content":[{"type":"text","text":"Done."}]}}'
+)
+
+# Long transcript: Write at start, final message after many Read calls.
+# Confirms the 200-line slice catches Writes that the old 50-line window missed.
+echo "long-content" > "$TEST_DIR/long.ts"
+{
+    printf '%s\n' "{\"type\":\"assistant\",\"message\":{\"content\":[{\"type\":\"tool_use\",\"name\":\"Write\",\"input\":{\"file_path\":\"$TEST_DIR/long.ts\",\"content\":\"x\"}}]}}"
+    for i in $(seq 1 60); do
+        printf '%s\n' "{\"type\":\"assistant\",\"message\":{\"content\":[{\"type\":\"tool_use\",\"name\":\"Read\",\"input\":{\"file_path\":\"src/file-$i.ts\"}}]}}"
+    done
+    printf '%s\n' '{"type":"assistant","message":{"content":[{"type":"text","text":"Done. Implemented in long.ts."}]}}'
+} > "$TEST_DIR/long-transcript.jsonl"
+TX_LONG="$TEST_DIR/long-transcript.jsonl"
+
+# Relative file_path with cwd — must resolve to $CWD/relative.ts.
+echo "relative-content" > "$TEST_DIR/relative.ts"
+TX_RELATIVE=$(write_transcript "relative" \
+    '{"type":"assistant","message":{"content":[{"type":"tool_use","name":"Write","input":{"file_path":"relative.ts"}}]}}' \
+    '{"type":"assistant","message":{"content":[{"type":"text","text":"Done."}]}}'
+)
+
+# --- Cases ---
+
+run_case "honest completion (write + file exists)" "$(make_payload "$TX_HONEST")" silent
+run_case "edit + file exists" "$(make_payload "$TX_EDIT")" silent
+run_case "MultiEdit counts as mutating" "$(make_payload "$TX_MULTIEDIT")" silent
+run_case "NotebookEdit counts as mutating" "$(make_payload "$TX_NOTEBOOK")" silent
+run_case "alt payload shape (.tool_input.file_path)" "$(make_payload "$TX_ALT_SHAPE")" silent
+run_case "pure analyst (no claim, no mutations)" "$(make_payload "$TX_ANALYST")" silent
+run_case "trivial chatter (claim word but no file token)" "$(make_payload "$TX_TRIVIAL")" silent
+run_case "negated 'not all tests pass' (no flag)" "$(make_payload "$TX_NEGATION")" silent
+run_case "'fixed itself' does not match 'fixed it'" "$(make_payload "$TX_FIXED_ITSELF")" silent
+run_case "broken symlink counts as present" "$(make_payload "$TX_BROKEN_SYMLINK")" silent
+run_case "long transcript (Write at line 1, msg after 60 Reads)" "$(make_payload "$TX_LONG")" silent
+run_case "relative file_path resolves against cwd" "$(make_payload "$TX_RELATIVE")" silent
+run_case "liar — completion + 0 mutations" "$(make_payload "$TX_LIAR_NO_ACTION")" "made no file changes"
+run_case "ghost — tool call but file missing on disk" "$(make_payload "$TX_GHOST")" "not present on disk"
+run_case "escape hatch (stop_hook_active=true)" "$(make_payload "$TX_LIAR_NO_ACTION" true)" silent
+run_case "missing transcript path (fail-open)" '{"stop_hook_active":false}' silent
+run_case "non-existent transcript file (fail-open)" "$(make_payload "/nonexistent/transcript.jsonl")" silent
+run_case "empty stdin (fail-open)" '' silent
+
+# Kill switch — set env var, expect silent regardless of payload.
+KILL_OUT=$(printf '%s' "$(make_payload "$TX_LIAR_NO_ACTION")" | VERIFY_DELIVERABLES_DISABLED=1 bash "$HOOK" 2>&1)
+if [ -z "$KILL_OUT" ]; then
+    echo "PASS: kill switch (VERIFY_DELIVERABLES_DISABLED=1)"
+    PASS=$((PASS + 1))
+else
+    echo "FAIL: kill switch — got: $KILL_OUT"
+    FAIL=$((FAIL + 1))
+fi
+
+echo ""
+echo "Results: $PASS passed, $FAIL failed"
+[ "$FAIL" -eq 0 ]