From b56f8308c5ae7cb2de7d67c7b7825f8ef41744d8 Mon Sep 17 00:00:00 2001 From: "John T. Myers" <9696606+johntmyers@users.noreply.github.com> Date: Thu, 2 Apr 2026 12:54:59 -0700 Subject: [PATCH 1/9] fix(security): update OSS dependencies to remediate 3 high-severity CVEs (#737) - tar 0.4.44 -> 0.4.45 (CVE-2026-33055: PAX size header skip) - aws-lc-rs 1.16.1 -> 1.16.2 / aws-lc-sys 0.38.0 -> 0.39.1 (BDSA-2026-5232: name constraints bypass in certificate validation) - Pygments 2.19.2 -> 2.20.0 (BDSA-2026-5113 / CVE-2026-4539: catastrophic regex backtracking) --- Cargo.lock | 26 +++++++++++++------------- uv.lock | 6 +++--- 2 files changed, 16 insertions(+), 16 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 8f827bc88..7d20c9bd8 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -125,7 +125,7 @@ version = "1.1.5" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "40c48f72fd53cd289104fc64099abca73db4166ad86ea0b4341abe65af83dadc" dependencies = [ - "windows-sys 0.61.2", + "windows-sys 0.60.2", ] [[package]] @@ -136,7 +136,7 @@ checksum = "291e6a250ff86cd4a820112fb8898808a366d8f9f58ce16d1f538353ad55747d" dependencies = [ "anstyle", "once_cell_polyfill", - "windows-sys 0.61.2", + "windows-sys 0.60.2", ] [[package]] @@ -232,9 +232,9 @@ dependencies = [ [[package]] name = "aws-lc-rs" -version = "1.16.1" +version = "1.16.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "94bffc006df10ac2a68c83692d734a465f8ee6c5b384d8545a636f81d858f4bf" +checksum = "a054912289d18629dc78375ba2c3726a3afe3ff71b4edba9dedfca0e3446d1fc" dependencies = [ "aws-lc-sys", "untrusted 0.7.1", @@ -243,9 +243,9 @@ dependencies = [ [[package]] name = "aws-lc-sys" -version = "0.38.0" +version = "0.39.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4321e568ed89bb5a7d291a7f37997c2c0df89809d7b6d12062c81ddb54aa782e" +checksum = "83a25cf98105baa966497416dbd42565ce3a8cf8dbfd59803ec9ad46f3126399" dependencies = [ "cc", "cmake", @@ 
-1283,7 +1283,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "39cab71617ae0d63f51a36d69f866391735b51691dbda63cf6f96d042b63efeb" dependencies = [ "libc", - "windows-sys 0.61.2", + "windows-sys 0.52.0", ] [[package]] @@ -2691,7 +2691,7 @@ version = "0.50.3" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "7957b9740744892f114936ab4a57b3f487491bbeafaf8083688b16841a4240e5" dependencies = [ - "windows-sys 0.61.2", + "windows-sys 0.59.0", ] [[package]] @@ -4044,7 +4044,7 @@ dependencies = [ "errno", "libc", "linux-raw-sys 0.12.1", - "windows-sys 0.61.2", + "windows-sys 0.52.0", ] [[package]] @@ -4519,7 +4519,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "3a766e1110788c36f4fa1c2b71b387a7815aa65f88ce0229841826633d93723e" dependencies = [ "libc", - "windows-sys 0.61.2", + "windows-sys 0.60.2", ] [[package]] @@ -4902,9 +4902,9 @@ dependencies = [ [[package]] name = "tar" -version = "0.4.44" +version = "0.4.45" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1d863878d212c87a19c1a610eb53bb01fe12951c0501cf5a0d65f724914a667a" +checksum = "22692a6476a21fa75fdfc11d452fda482af402c008cdbaf3476414e122040973" dependencies = [ "filetime", "libc", @@ -4930,7 +4930,7 @@ dependencies = [ "getrandom 0.4.2", "once_cell", "rustix 1.1.4", - "windows-sys 0.61.2", + "windows-sys 0.52.0", ] [[package]] diff --git a/uv.lock b/uv.lock index 687a035ae..38a03ce29 100644 --- a/uv.lock +++ b/uv.lock @@ -637,11 +637,11 @@ wheels = [ [[package]] name = "pygments" -version = "2.19.2" +version = "2.20.0" source = { registry = "https://pypi.org/simple" } -sdist = { url = "https://files.pythonhosted.org/packages/b0/77/a5b8c569bf593b0140bde72ea885a803b82086995367bf2037de0159d924/pygments-2.19.2.tar.gz", hash = "sha256:636cb2477cec7f8952536970bc533bc43743542f70392ae026374600add5b887", size = 4968631, upload-time = "2025-06-21T13:39:12.283Z" } +sdist = { url = 
"https://files.pythonhosted.org/packages/c3/b2/bc9c9196916376152d655522fdcebac55e66de6603a76a02bca1b6414f6c/pygments-2.20.0.tar.gz", hash = "sha256:6757cd03768053ff99f3039c1a36d6c0aa0b263438fcab17520b30a303a82b5f", size = 4955991, upload-time = "2026-03-29T13:29:33.898Z" } wheels = [ - { url = "https://files.pythonhosted.org/packages/c7/21/705964c7812476f378728bdf590ca4b771ec72385c533964653c68e86bdc/pygments-2.19.2-py3-none-any.whl", hash = "sha256:86540386c03d588bb81d44bc3928634ff26449851e99741617ecb9037ee5ec0b", size = 1225217, upload-time = "2025-06-21T13:39:07.939Z" }, + { url = "https://files.pythonhosted.org/packages/f4/7e/a72dd26f3b0f4f2bf1dd8923c85f7ceb43172af56d63c7383eb62b332364/pygments-2.20.0-py3-none-any.whl", hash = "sha256:81a9e26dd42fd28a23a2d169d86d7ac03b46e2f8b59ed4698fb4785f946d0176", size = 1231151, upload-time = "2026-03-29T13:29:30.038Z" }, ] [[package]] From 8887d7c66ac6589617e70776e2c7e2104a9a81e6 Mon Sep 17 00:00:00 2001 From: "John T. Myers" <9696606+johntmyers@users.noreply.github.com> Date: Thu, 2 Apr 2026 14:30:51 -0700 Subject: [PATCH 2/9] fix(sandbox): harden seccomp filter to block dangerous syscalls (#740) --- architecture/sandbox.md | 46 ++++- architecture/security-policy.md | 29 ++- .../src/sandbox/linux/seccomp.rs | 182 ++++++++++++++++++ 3 files changed, 248 insertions(+), 9 deletions(-) diff --git a/architecture/sandbox.md b/architecture/sandbox.md index c870708dd..c5e212f85 100644 --- a/architecture/sandbox.md +++ b/architecture/sandbox.md @@ -24,7 +24,7 @@ All paths are relative to `crates/openshell-sandbox/src/`. 
| `sandbox/mod.rs` | Platform abstraction -- dispatches to Linux or no-op | | `sandbox/linux/mod.rs` | Linux composition: Landlock then seccomp | | `sandbox/linux/landlock.rs` | Filesystem isolation via Landlock LSM (ABI V1) | -| `sandbox/linux/seccomp.rs` | Syscall filtering via BPF on `SYS_socket` | +| `sandbox/linux/seccomp.rs` | Syscall filtering via BPF: socket domain blocks, dangerous syscall blocks, conditional flag blocks | | `bypass_monitor.rs` | Background `/dev/kmsg` reader for iptables bypass detection events | | `sandbox/linux/netns.rs` | Network namespace creation, veth pair setup, bypass detection iptables rules, cleanup on drop | | `l7/mod.rs` | L7 types (`L7Protocol`, `TlsMode`, `EnforcementMode`, `L7EndpointConfig`), config parsing, validation, access preset expansion, deprecated `tls` value handling | @@ -451,13 +451,7 @@ Kernel-level error behavior (e.g., Landlock ABI unavailable) depends on `Landloc **File:** `crates/openshell-sandbox/src/sandbox/linux/seccomp.rs` -Seccomp blocks socket creation for specific address families. The filter targets a single syscall (`SYS_socket`) and inspects argument 0 (the domain). - -**Always blocked** (regardless of network mode): -- `AF_NETLINK`, `AF_PACKET`, `AF_BLUETOOTH`, `AF_VSOCK` - -**Additionally blocked in `Block` mode** (no proxy): -- `AF_INET`, `AF_INET6` +Seccomp provides three layers of syscall restriction: socket domain blocks, unconditional syscall blocks, and conditional syscall blocks. The filter uses a default-allow policy (`SeccompAction::Allow`) with targeted rules that return `Errno(EPERM)`. **Skipped entirely** in `Allow` mode. @@ -465,8 +459,44 @@ Setup: 1. `prctl(PR_SET_NO_NEW_PRIVS, 1)` -- required before seccomp 2. 
`seccompiler::apply_filter()` with default action `Allow` and per-rule action `Errno(EPERM)` +#### Socket domain blocks + +| Domain | Always blocked | Additionally blocked in Block mode | +|--------|:-:|:-:| +| `AF_PACKET` | Yes | | +| `AF_BLUETOOTH` | Yes | | +| `AF_VSOCK` | Yes | | +| `AF_INET` | | Yes | +| `AF_INET6` | | Yes | +| `AF_NETLINK` | | Yes | + In `Proxy` mode, `AF_INET`/`AF_INET6` are allowed because the sandboxed process needs to connect to the proxy over the veth pair. The network namespace ensures it can only reach the proxy's IP (`10.200.0.1`). +#### Unconditional syscall blocks + +These syscalls are blocked entirely (EPERM for any invocation): + +| Syscall | Reason | +|---------|--------| +| `memfd_create` | Fileless binary execution bypasses Landlock filesystem restrictions | +| `ptrace` | Cross-process memory inspection and code injection | +| `bpf` | Kernel BPF program loading | +| `process_vm_readv` | Cross-process memory read | +| `io_uring_setup` | Async I/O subsystem with extensive CVE history | +| `mount` | Filesystem mount could subvert Landlock or overlay writable paths | + +#### Conditional syscall blocks + +These syscalls are only blocked when specific flag patterns are present: + +| Syscall | Condition | Reason | +|---------|-----------|--------| +| `execveat` | `AT_EMPTY_PATH` flag set (arg4) | Fileless execution from an anonymous fd | +| `unshare` | `CLONE_NEWUSER` flag set (arg0) | User namespace creation enables privilege escalation | +| `seccomp` | operation == `SECCOMP_SET_MODE_FILTER` (arg0) | Prevents sandboxed code from replacing the active filter | + +Conditional blocks use `MaskedEq` for flag checks (bit-test) and `Eq` for exact-value matches. This allows normal use of these syscalls while blocking the dangerous flag combinations. 
+ ### Network namespace isolation **File:** `crates/openshell-sandbox/src/sandbox/linux/netns.rs` diff --git a/architecture/security-policy.md b/architecture/security-policy.md index 555ba67a5..01eb96f94 100644 --- a/architecture/security-policy.md +++ b/architecture/security-policy.md @@ -850,6 +850,10 @@ The response includes an `X-OpenShell-Policy` header and `Connection: close`. Se ## Seccomp Filter Details +The seccomp filter uses a default-allow policy (`SeccompAction::Allow`) with targeted rules that return `EPERM`. It provides three layers of protection: socket domain blocks, unconditional syscall blocks, and conditional syscall blocks. See `crates/openshell-sandbox/src/sandbox/linux/seccomp.rs`. + +### Blocked socket domains + Regardless of network mode, certain socket domains are always blocked: | Domain | Constant | Reason | @@ -861,7 +865,30 @@ Regardless of network mode, certain socket domains are always blocked: In proxy mode (which is always active), `AF_INET` (2) and `AF_INET6` (10) are allowed so the sandbox process can reach the proxy. -The seccomp filter uses a default-allow policy (`SeccompAction::Allow`) with specific `socket()` syscall rules that return `EPERM` when the first argument (domain) matches a blocked value. See `crates/openshell-sandbox/src/sandbox/linux/seccomp.rs`. 
+### Blocked syscalls + +These syscalls are blocked unconditionally (EPERM for any invocation): + +| Syscall | NR (x86-64) | Reason | +|---------|-------------|--------| +| `memfd_create` | 319 | Fileless binary execution bypasses Landlock filesystem restrictions | +| `ptrace` | 101 | Cross-process memory inspection and code injection | +| `bpf` | 321 | Kernel BPF program loading | +| `process_vm_readv` | 310 | Cross-process memory read | +| `io_uring_setup` | 425 | Async I/O subsystem with extensive CVE history | +| `mount` | 165 | Filesystem mount could subvert Landlock or overlay writable paths | + +### Conditionally blocked syscalls + +These syscalls are blocked only when specific flag patterns are present in their arguments: + +| Syscall | NR (x86-64) | Condition | Reason | +|---------|-------------|-----------|--------| +| `execveat` | 322 | `AT_EMPTY_PATH` (0x1000) set in flags (arg4) | Fileless execution from an anonymous fd | +| `unshare` | 272 | `CLONE_NEWUSER` (0x10000000) set in flags (arg0) | User namespace creation enables privilege escalation | +| `seccomp` | 317 | operation == `SECCOMP_SET_MODE_FILTER` (1) in arg0 | Prevents sandboxed code from replacing the active filter | + +Flag checks use `MaskedEq` (`(arg & mask) == mask`) to detect the flag bit regardless of other bits. The `seccomp` syscall check uses `Eq` for exact value comparison on the operation argument. --- diff --git a/crates/openshell-sandbox/src/sandbox/linux/seccomp.rs b/crates/openshell-sandbox/src/sandbox/linux/seccomp.rs index 6c9d8307b..e23447498 100644 --- a/crates/openshell-sandbox/src/sandbox/linux/seccomp.rs +++ b/crates/openshell-sandbox/src/sandbox/linux/seccomp.rs @@ -2,6 +2,15 @@ // SPDX-License-Identifier: Apache-2.0 //! Seccomp syscall filtering. +//! +//! The filter uses a default-allow policy with targeted blocks: +//! +//! 1. **Socket domain blocks** -- prevent raw/kernel sockets that bypass the proxy +//! 2. 
**Unconditional syscall blocks** -- block syscalls that enable sandbox escape +//! (fileless exec, ptrace, BPF, cross-process memory access, io_uring, mount) +//! 3. **Conditional syscall blocks** -- block dangerous flag combinations on otherwise +//! needed syscalls (execveat+AT_EMPTY_PATH, unshare+CLONE_NEWUSER, +//! seccomp+SET_MODE_FILTER) use crate::policy::{NetworkMode, SandboxPolicy}; use miette::{IntoDiagnostic, Result}; @@ -13,6 +22,9 @@ use std::collections::BTreeMap; use std::convert::TryInto; use tracing::debug; +/// Value of `SECCOMP_SET_MODE_FILTER` (linux/seccomp.h). +const SECCOMP_SET_MODE_FILTER: u64 = 1; + pub fn apply(policy: &SandboxPolicy) -> Result<()> { if matches!(policy.network.mode, NetworkMode::Allow) { return Ok(()); @@ -37,6 +49,7 @@ pub fn apply(policy: &SandboxPolicy) -> Result<()> { fn build_filter(allow_inet: bool) -> Result { let mut rules: BTreeMap> = BTreeMap::new(); + // --- Socket domain blocks --- let mut blocked_domains = vec![libc::AF_PACKET, libc::AF_BLUETOOTH, libc::AF_VSOCK]; if !allow_inet { blocked_domains.push(libc::AF_INET); @@ -49,6 +62,51 @@ fn build_filter(allow_inet: bool) -> Result { add_socket_domain_rule(&mut rules, domain)?; } + // --- Unconditional syscall blocks --- + // These syscalls are blocked entirely (empty rule vec = unconditional EPERM). + + // Fileless binary execution via memfd bypasses Landlock filesystem restrictions. + rules.entry(libc::SYS_memfd_create).or_default(); + // Cross-process memory inspection and code injection. + rules.entry(libc::SYS_ptrace).or_default(); + // Kernel BPF program loading. + rules.entry(libc::SYS_bpf).or_default(); + // Cross-process memory read. + rules.entry(libc::SYS_process_vm_readv).or_default(); + // Async I/O subsystem with extensive CVE history. + rules.entry(libc::SYS_io_uring_setup).or_default(); + // Filesystem mount could subvert Landlock or overlay writable paths. 
+ rules.entry(libc::SYS_mount).or_default(); + + // --- Conditional syscall blocks --- + + // execveat with AT_EMPTY_PATH enables fileless execution from an anonymous fd. + add_masked_arg_rule( + &mut rules, + libc::SYS_execveat, + 4, // flags argument + libc::AT_EMPTY_PATH as u64, + )?; + + // unshare with CLONE_NEWUSER allows creating user namespaces to escalate privileges. + add_masked_arg_rule( + &mut rules, + libc::SYS_unshare, + 0, // flags argument + libc::CLONE_NEWUSER as u64, + )?; + + // seccomp(SECCOMP_SET_MODE_FILTER) would let sandboxed code replace the active filter. + let condition = SeccompCondition::new( + 0, // operation argument + SeccompCmpArgLen::Dword, + SeccompCmpOp::Eq, + SECCOMP_SET_MODE_FILTER, + ) + .into_diagnostic()?; + let rule = SeccompRule::new(vec![condition]).into_diagnostic()?; + rules.entry(libc::SYS_seccomp).or_default().push(rule); + let arch = std::env::consts::ARCH .try_into() .map_err(|_| miette::miette!("Unsupported architecture for seccomp"))?; @@ -74,3 +132,127 @@ fn add_socket_domain_rule(rules: &mut BTreeMap>, domain: i rules.entry(libc::SYS_socket).or_default().push(rule); Ok(()) } + +/// Block a syscall when a specific bit pattern is set in an argument. +/// +/// Uses `MaskedEq` to check `(arg & flag_bit) == flag_bit`, which triggers +/// EPERM when the flag is present regardless of other bits in the argument. 
+fn add_masked_arg_rule( + rules: &mut BTreeMap>, + syscall: i64, + arg_index: u8, + flag_bit: u64, +) -> Result<()> { + let condition = SeccompCondition::new( + arg_index, + SeccompCmpArgLen::Dword, + SeccompCmpOp::MaskedEq(flag_bit), + flag_bit, + ) + .into_diagnostic()?; + let rule = SeccompRule::new(vec![condition]).into_diagnostic()?; + rules.entry(syscall).or_default().push(rule); + Ok(()) +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn build_filter_proxy_mode_compiles() { + let filter = build_filter(true); + assert!(filter.is_ok(), "build_filter(true) should succeed"); + } + + #[test] + fn build_filter_block_mode_compiles() { + let filter = build_filter(false); + assert!(filter.is_ok(), "build_filter(false) should succeed"); + } + + #[test] + fn add_masked_arg_rule_creates_entry() { + let mut rules: BTreeMap> = BTreeMap::new(); + let result = add_masked_arg_rule(&mut rules, libc::SYS_execveat, 4, 0x1000); + assert!(result.is_ok()); + assert!( + rules.contains_key(&libc::SYS_execveat), + "should have an entry for SYS_execveat" + ); + assert_eq!( + rules[&libc::SYS_execveat].len(), + 1, + "should have exactly one rule" + ); + } + + #[test] + fn unconditional_blocks_present_in_filter() { + let mut rules: BTreeMap> = BTreeMap::new(); + + // Simulate what build_filter does for unconditional blocks + rules.entry(libc::SYS_memfd_create).or_default(); + rules.entry(libc::SYS_ptrace).or_default(); + rules.entry(libc::SYS_bpf).or_default(); + rules.entry(libc::SYS_process_vm_readv).or_default(); + rules.entry(libc::SYS_io_uring_setup).or_default(); + rules.entry(libc::SYS_mount).or_default(); + + // Unconditional blocks have an empty Vec (no conditions = always match) + for syscall in [ + libc::SYS_memfd_create, + libc::SYS_ptrace, + libc::SYS_bpf, + libc::SYS_process_vm_readv, + libc::SYS_io_uring_setup, + libc::SYS_mount, + ] { + assert!( + rules.contains_key(&syscall), + "syscall {syscall} should be in the rules map" + ); + assert!( + 
rules[&syscall].is_empty(), + "syscall {syscall} should have empty rules (unconditional block)" + ); + } + } + + #[test] + fn conditional_blocks_have_rules() { + // Build a real filter and verify the conditional syscalls have rule entries + // (non-empty Vec means conditional match) + let mut rules: BTreeMap> = BTreeMap::new(); + + add_masked_arg_rule( + &mut rules, + libc::SYS_execveat, + 4, + libc::AT_EMPTY_PATH as u64, + ) + .unwrap(); + add_masked_arg_rule(&mut rules, libc::SYS_unshare, 0, libc::CLONE_NEWUSER as u64).unwrap(); + + let condition = SeccompCondition::new( + 0, + SeccompCmpArgLen::Dword, + SeccompCmpOp::Eq, + SECCOMP_SET_MODE_FILTER, + ) + .unwrap(); + let rule = SeccompRule::new(vec![condition]).unwrap(); + rules.entry(libc::SYS_seccomp).or_default().push(rule); + + for syscall in [libc::SYS_execveat, libc::SYS_unshare, libc::SYS_seccomp] { + assert!( + rules.contains_key(&syscall), + "syscall {syscall} should be in the rules map" + ); + assert!( + !rules[&syscall].is_empty(), + "syscall {syscall} should have conditional rules" + ); + } + } +} From 77e55ea989d144b8761875a6c566d9289dac460b Mon Sep 17 00:00:00 2001 From: "John T. Myers" <9696606+johntmyers@users.noreply.github.com> Date: Thu, 2 Apr 2026 15:06:32 -0700 Subject: [PATCH 3/9] test(e2e): replace flaky Python live policy update tests with Rust (#742) Remove test_live_policy_update_and_logs and test_live_policy_update_from_empty_network_policies from the Python e2e suite. Both used a manual 90s poll loop against GetSandboxPolicyStatus that flaked in CI with 'Policy v2 was not loaded within 90s'. Add e2e/rust/tests/live_policy_update.rs with two replacement tests that exercise the same policy lifecycle (version bumping, hash idempotency, policy list history) through the CLI using the built-in --wait flag for reliable synchronization. 
--- e2e/python/test_sandbox_policy.py | 260 +--------------- e2e/rust/tests/live_policy_update.rs | 423 +++++++++++++++++++++++++++ 2 files changed, 424 insertions(+), 259 deletions(-) create mode 100644 e2e/rust/tests/live_policy_update.rs diff --git a/e2e/python/test_sandbox_policy.py b/e2e/python/test_sandbox_policy.py index 625fe8da0..092f99784 100644 --- a/e2e/python/test_sandbox_policy.py +++ b/e2e/python/test_sandbox_policy.py @@ -314,9 +314,7 @@ def log_message(self, *args): {"connect_status": connect_resp.strip(), "http_status": 0} ) - request = ( - f"{method} {path} HTTP/1.1\r\nHost: {target_host}\r\nConnection: close\r\n\r\n" - ) + request = f"{method} {path} HTTP/1.1\r\nHost: {target_host}\r\nConnection: close\r\n\r\n" conn.sendall(request.encode()) data = b"" @@ -1348,262 +1346,6 @@ def test_l7_rule_without_query_matcher_allows_any_query_params( assert "connect-server-ok" in resp["body"] -# ============================================================================= -# Live policy update + log streaming tests -# -# LPU-1: Create sandbox, verify initial policy is v1 -# LPU-2: Set the same policy again -> unchanged (no new version) -# LPU-3: Push a different policy -> new version loaded, verify connectivity -# LPU-4: Push v2 again -> unchanged -# LPU-5: Fetch logs (one-shot + streaming) and verify both sources appear -# ============================================================================= - - -def test_live_policy_update_and_logs( - sandbox: Callable[..., Sandbox], - sandbox_client: SandboxClient, -) -> None: - """End-to-end: live policy update lifecycle with log verification.""" - from openshell._proto import openshell_pb2, sandbox_pb2 - - # --- Setup: two distinct policies --- - # Policy A: python can reach api.anthropic.com - policy_a = _base_policy( - network_policies={ - "anthropic": sandbox_pb2.NetworkPolicyRule( - name="anthropic", - endpoints=[ - sandbox_pb2.NetworkEndpoint(host="api.anthropic.com", port=443), - ], - 
binaries=[sandbox_pb2.NetworkBinary(path="/**")], - ), - }, - ) - # Policy B: python can reach api.anthropic.com AND example.com - policy_b = _base_policy( - network_policies={ - "anthropic": sandbox_pb2.NetworkPolicyRule( - name="anthropic", - endpoints=[ - sandbox_pb2.NetworkEndpoint(host="api.anthropic.com", port=443), - ], - binaries=[sandbox_pb2.NetworkBinary(path="/**")], - ), - "example": sandbox_pb2.NetworkPolicyRule( - name="example", - endpoints=[ - sandbox_pb2.NetworkEndpoint(host="example.com", port=443), - ], - binaries=[sandbox_pb2.NetworkBinary(path="/**")], - ), - }, - ) - - spec = datamodel_pb2.SandboxSpec(policy=policy_a) - stub = sandbox_client._stub - - with sandbox(spec=spec, delete_on_exit=True) as sb: - sandbox_name = sb.sandbox.name - - # --- LPU-1: Initial policy should be version 1 --- - status_resp = stub.GetSandboxPolicyStatus( - openshell_pb2.GetSandboxPolicyStatusRequest(name=sandbox_name, version=0) - ) - assert status_resp.revision.version >= 1, "Initial policy should be at least v1" - initial_version = status_resp.revision.version - initial_hash = status_resp.revision.policy_hash - - # --- LPU-2: Set the same policy -> no new version --- - update_resp = stub.UpdateConfig( - openshell_pb2.UpdateConfigRequest( - name=sandbox_name, - policy=policy_a, - ) - ) - assert update_resp.version == initial_version, ( - f"Same policy should return existing version {initial_version}, " - f"got {update_resp.version}" - ) - assert update_resp.policy_hash == initial_hash - - # --- LPU-3: Push policy B -> new version --- - update_resp = stub.UpdateConfig( - openshell_pb2.UpdateConfigRequest( - name=sandbox_name, - policy=policy_b, - ) - ) - new_version = update_resp.version - assert new_version > initial_version, ( - f"Different policy should create new version > {initial_version}, " - f"got {new_version}" - ) - assert update_resp.policy_hash != initial_hash - - # Wait for the sandbox to load the new policy (poll loop is 30s default). 
- import time - - deadline = time.time() + 90 - loaded = False - while time.time() < deadline: - status_resp = stub.GetSandboxPolicyStatus( - openshell_pb2.GetSandboxPolicyStatusRequest( - name=sandbox_name, version=new_version - ) - ) - status = status_resp.revision.status - if status == openshell_pb2.POLICY_STATUS_LOADED: - loaded = True - break - if status == openshell_pb2.POLICY_STATUS_FAILED: - pytest.fail( - f"Policy v{new_version} failed to load: " - f"{status_resp.revision.load_error}" - ) - time.sleep(2) - assert loaded, f"Policy v{new_version} was not loaded within 90s" - - # Verify the new policy works: example.com should now be allowed - result = sb.exec_python(_proxy_connect(), args=("example.com", 443)) - assert result.exit_code == 0, result.stderr - assert "200" in result.stdout, ( - f"example.com should be allowed after policy update, got: {result.stdout}" - ) - - # --- LPU-4: Push policy B again -> unchanged --- - update_resp = stub.UpdateConfig( - openshell_pb2.UpdateConfigRequest( - name=sandbox_name, - policy=policy_b, - ) - ) - assert update_resp.version == new_version, ( - f"Same policy B should return existing version {new_version}, " - f"got {update_resp.version}" - ) - - # --- LPU-5: Verify policy history --- - list_resp = stub.ListSandboxPolicies( - openshell_pb2.ListSandboxPoliciesRequest(name=sandbox_name, limit=10) - ) - versions = [r.version for r in list_resp.revisions] - assert new_version in versions - assert initial_version in versions - - # Only one version should be Loaded - loaded_count = sum( - 1 - for r in list_resp.revisions - if r.status == openshell_pb2.POLICY_STATUS_LOADED - ) - assert loaded_count == 1, ( - f"Expected exactly 1 loaded version, got {loaded_count}: " - f"{[(r.version, r.status) for r in list_resp.revisions]}" - ) - - # --- LPU-6: Fetch logs (one-shot) and verify both sources --- - # Resolve sandbox ID for log RPCs - get_resp = stub.GetSandbox(openshell_pb2.GetSandboxRequest(name=sandbox_name)) - sandbox_id 
= get_resp.sandbox.id - - logs_resp = stub.GetSandboxLogs( - openshell_pb2.GetSandboxLogsRequest(sandbox_id=sandbox_id, lines=500) - ) - assert logs_resp.buffer_total > 0, "Expected some logs in the buffer" - - sources = {log.source or "gateway" for log in logs_resp.logs} - assert "gateway" in sources, ( - f"Expected gateway logs in response, got sources: {sources}" - ) - # Sandbox logs may take a moment to arrive via the push stream. - # If they're present, verify the source tag. - if "sandbox" in sources: - sandbox_logs = [l for l in logs_resp.logs if l.source == "sandbox"] - assert len(sandbox_logs) > 0 - # Verify structured fields are present on at least one sandbox log - has_fields = any(len(l.fields) > 0 for l in sandbox_logs) - # Not all sandbox logs have fields (e.g., "Starting sandbox" doesn't), - # so we just check at least one does if there are CONNECT logs - connect_logs = [l for l in sandbox_logs if "CONNECT" in l.message] - if connect_logs: - assert has_fields, "CONNECT logs should have structured fields" - - -def test_live_policy_update_from_empty_network_policies( - sandbox: Callable[..., Sandbox], - sandbox_client: SandboxClient, -) -> None: - """End-to-end: add the first network rule to a running sandbox.""" - from openshell._proto import openshell_pb2, sandbox_pb2 - - initial_policy = _base_policy() - updated_policy = _base_policy( - network_policies={ - "example": sandbox_pb2.NetworkPolicyRule( - name="example", - endpoints=[ - sandbox_pb2.NetworkEndpoint(host="example.com", port=443), - ], - binaries=[sandbox_pb2.NetworkBinary(path="/**")], - ), - }, - ) - - spec = datamodel_pb2.SandboxSpec(policy=initial_policy) - stub = sandbox_client._stub - - with sandbox(spec=spec, delete_on_exit=True) as sb: - sandbox_name = sb.sandbox.name - - denied = sb.exec_python(_proxy_connect(), args=("example.com", 443)) - assert denied.exit_code == 0, denied.stderr - assert "403" in denied.stdout, denied.stdout - - initial_status = stub.GetSandboxPolicyStatus( - 
openshell_pb2.GetSandboxPolicyStatusRequest(name=sandbox_name, version=0) - ) - initial_version = initial_status.revision.version - - update_resp = stub.UpdateConfig( - openshell_pb2.UpdateConfigRequest( - name=sandbox_name, - policy=updated_policy, - ) - ) - new_version = update_resp.version - assert new_version > initial_version, ( - f"Adding the first network rule should create a new version > {initial_version}, " - f"got {new_version}" - ) - - import time - - deadline = time.time() + 90 - loaded = False - while time.time() < deadline: - status_resp = stub.GetSandboxPolicyStatus( - openshell_pb2.GetSandboxPolicyStatusRequest( - name=sandbox_name, version=new_version - ) - ) - status = status_resp.revision.status - if status == openshell_pb2.POLICY_STATUS_LOADED: - loaded = True - break - if status == openshell_pb2.POLICY_STATUS_FAILED: - pytest.fail( - f"Policy v{new_version} failed to load: " - f"{status_resp.revision.load_error}" - ) - time.sleep(2) - - assert loaded, f"Policy v{new_version} was not loaded within 90s" - - allowed = sb.exec_python(_proxy_connect(), args=("example.com", 443)) - assert allowed.exit_code == 0, allowed.stderr - assert "200" in allowed.stdout, allowed.stdout - - # ============================================================================= # Forward proxy tests (plain HTTP, non-CONNECT) # ============================================================================= diff --git a/e2e/rust/tests/live_policy_update.rs b/e2e/rust/tests/live_policy_update.rs new file mode 100644 index 000000000..c60b29548 --- /dev/null +++ b/e2e/rust/tests/live_policy_update.rs @@ -0,0 +1,423 @@ +// SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved. +// SPDX-License-Identifier: Apache-2.0 + +//! E2E tests for live policy updates on a running sandbox. +//! +//! Covers the full round-trip: +//! - Create sandbox with policy A +//! - Verify initial policy version via `policy get` +//! 
- Push same policy A again -> no version bump (idempotent) +//! - Push different policy B -> new version, `--wait` for sandbox to load it +//! - Verify policy history via `policy list` +//! +//! These tests replace the Python e2e tests `test_live_policy_update_and_logs` +//! and `test_live_policy_update_from_empty_network_policies`, which were flaky +//! due to hard-coded 90s poll timeouts. The Rust tests use the CLI's built-in +//! `--wait` flag for reliable synchronization. +//! +//! Note: the removed Python tests also covered `GetSandboxLogs` RPC and +//! verified actual proxy connectivity after policy update. Those are tracked +//! as follow-up coverage gaps -- the proxy enforcement path is covered by the +//! existing L4/L7/SSRF Python e2e tests, and log fetching needs a dedicated +//! test. + +#![cfg(feature = "e2e")] + +use std::fmt::Write as _; +use std::io::Write; +use std::process::Stdio; + +use openshell_e2e::harness::binary::openshell_cmd; +use openshell_e2e::harness::output::{extract_field, strip_ansi}; +use openshell_e2e::harness::sandbox::SandboxGuard; +use tempfile::NamedTempFile; + +// --------------------------------------------------------------------------- +// Policy YAML builders +// --------------------------------------------------------------------------- + +/// Build a policy YAML that allows any binary to reach the given hosts on +/// port 443. +/// +/// NOTE: The indentation in the format string is load-bearing YAML structure. 
+fn write_policy(hosts: &[&str]) -> Result { + let mut file = NamedTempFile::new().map_err(|e| format!("create temp policy file: {e}"))?; + + let mut network_rules = String::new(); + for (i, host) in hosts.iter().enumerate() { + let _ = write!( + network_rules, + r#" rule_{i}: + name: rule_{i} + endpoints: + - host: {host} + port: 443 + binaries: + - path: "/**" +"# + ); + } + + let policy = format!( + r"version: 1 + +filesystem_policy: + include_workdir: true + read_only: + - /usr + - /lib + - /proc + - /dev/urandom + - /app + - /etc + - /var/log + read_write: + - /sandbox + - /tmp + - /dev/null + +landlock: + compatibility: best_effort + +process: + run_as_user: sandbox + run_as_group: sandbox + +network_policies: +{network_rules}" + ); + + file.write_all(policy.as_bytes()) + .map_err(|e| format!("write temp policy file: {e}"))?; + file.flush() + .map_err(|e| format!("flush temp policy file: {e}"))?; + Ok(file) +} + +/// Build a minimal policy YAML with no network rules. +fn write_empty_network_policy() -> Result { + let mut file = NamedTempFile::new().map_err(|e| format!("create temp policy file: {e}"))?; + + let policy = r"version: 1 + +filesystem_policy: + include_workdir: true + read_only: + - /usr + - /lib + - /proc + - /dev/urandom + - /app + - /etc + - /var/log + read_write: + - /sandbox + - /tmp + - /dev/null + +landlock: + compatibility: best_effort + +process: + run_as_user: sandbox + run_as_group: sandbox +"; + + file.write_all(policy.as_bytes()) + .map_err(|e| format!("write temp policy file: {e}"))?; + file.flush() + .map_err(|e| format!("flush temp policy file: {e}"))?; + Ok(file) +} + +// --------------------------------------------------------------------------- +// CLI helpers +// --------------------------------------------------------------------------- + +struct CliResult { + success: bool, + output: String, + exit_code: Option, +} + +/// Run an `openshell` CLI command and return the result. 
+async fn run_cli(args: &[&str]) -> CliResult { + let mut cmd = openshell_cmd(); + cmd.args(args).stdout(Stdio::piped()).stderr(Stdio::piped()); + + let output = cmd.output().await.expect("spawn openshell command"); + let stdout = String::from_utf8_lossy(&output.stdout).to_string(); + let stderr = String::from_utf8_lossy(&output.stderr).to_string(); + let combined = strip_ansi(&format!("{stdout}{stderr}")); + + CliResult { + success: output.status.success(), + output: combined, + exit_code: output.status.code(), + } +} + +/// Extract the policy version number from `policy get` output. +/// +/// Uses the shared `extract_field` helper to find `Version: ` or +/// `Revision: ` in CLI tabular output. +fn extract_version(output: &str) -> Option<u32> { + extract_field(output, "Version") + .or_else(|| extract_field(output, "Revision")) + .and_then(|v| v.parse::<u32>().ok()) +} + +/// Extract the policy hash from `policy get` output. +fn extract_hash(output: &str) -> Option<String> { + extract_field(output, "Hash") + .or_else(|| extract_field(output, "Policy hash")) +} + +/// Check that a version number appears in `policy list` output as a +/// distinct field value (not just a substring of some other number). +/// +/// Looks for the version number preceded by whitespace or at the start +/// of a line, to avoid matching "2" inside "12" or timestamps. +fn list_output_contains_version(output: &str, version: u32) -> bool { + let v = version.to_string(); + output.lines().any(|line| { + line.split_whitespace() + .any(|word| word == v || word.starts_with(&format!("{v} "))) + }) +} + +// --------------------------------------------------------------------------- +// Tests +// --------------------------------------------------------------------------- + +/// Test the full live policy update lifecycle: +/// +/// 1. Create sandbox with `--keep` +/// 2. Set policy A, verify initial version >= 1 +/// 3. Push same policy A -> version unchanged (idempotent) +/// 4. 
Push policy B (adds example.com) with `--wait` -> new version +/// 5. Push policy B again -> idempotent +/// 6. Verify policy list shows both versions +#[tokio::test] +#[allow(clippy::too_many_lines)] +async fn live_policy_update_round_trip() { + // --- Write two distinct policy files --- + let policy_a = write_policy(&["api.anthropic.com"]).expect("write policy A"); + let policy_b = + write_policy(&["api.anthropic.com", "example.com"]).expect("write policy B"); + + let policy_a_path = policy_a + .path() + .to_str() + .expect("policy A path should be utf-8") + .to_string(); + let policy_b_path = policy_b + .path() + .to_str() + .expect("policy B path should be utf-8") + .to_string(); + + // --- Create a long-running sandbox --- + let mut guard = SandboxGuard::create_keep( + &["sh", "-c", "echo Ready && sleep infinity"], + "Ready", + ) + .await + .expect("create keep sandbox"); + + // --- Set initial policy A --- + let r = run_cli(&[ + "policy", "set", &guard.name, "--policy", &policy_a_path, "--wait", "--timeout", "120", + ]) + .await; + assert!( + r.success, + "policy set A should succeed (exit {:?}):\n{}", + r.exit_code, r.output + ); + + // --- Verify initial policy version --- + let r = run_cli(&["policy", "get", &guard.name]).await; + assert!( + r.success, + "policy get should succeed (exit {:?}):\n{}", + r.exit_code, r.output + ); + + let initial_version = extract_version(&r.output) + .unwrap_or_else(|| panic!("could not parse version from policy get output:\n{}", r.output)); + assert!( + initial_version >= 1, + "initial policy version should be >= 1, got {initial_version}" + ); + + let initial_hash = extract_hash(&r.output); + + // --- Push same policy A again -> should be idempotent --- + let r = run_cli(&[ + "policy", "set", &guard.name, "--policy", &policy_a_path, "--wait", "--timeout", "120", + ]) + .await; + assert!( + r.success, + "policy set A (repeat) should succeed (exit {:?}):\n{}", + r.exit_code, r.output + ); + + let r = run_cli(&["policy", 
"get", &guard.name]).await; + assert!(r.success, "policy get after repeat should succeed:\n{}", r.output); + + let repeat_version = extract_version(&r.output) + .unwrap_or_else(|| panic!("could not parse version after repeat:\n{}", r.output)); + assert_eq!( + repeat_version, initial_version, + "same policy should not bump version: expected {initial_version}, got {repeat_version}" + ); + + if let (Some(ih), Some(rh)) = (&initial_hash, &extract_hash(&r.output)) { + assert_eq!(ih, rh, "same policy should produce same hash"); + } + + // --- Push policy B -> should create new version --- + let r = run_cli(&[ + "policy", "set", &guard.name, "--policy", &policy_b_path, "--wait", "--timeout", "120", + ]) + .await; + assert!( + r.success, + "policy set B should succeed (exit {:?}):\n{}", + r.exit_code, r.output + ); + + let r = run_cli(&["policy", "get", &guard.name]).await; + assert!(r.success, "policy get after B should succeed:\n{}", r.output); + + let new_version = extract_version(&r.output) + .unwrap_or_else(|| panic!("could not parse version after B:\n{}", r.output)); + assert!( + new_version > initial_version, + "different policy should bump version: expected > {initial_version}, got {new_version}" + ); + + if let (Some(ih), Some(nh)) = (&initial_hash, &extract_hash(&r.output)) { + assert_ne!(ih, nh, "different policy should produce different hash"); + } + + // --- Push policy B again -> idempotent --- + let r = run_cli(&[ + "policy", "set", &guard.name, "--policy", &policy_b_path, "--wait", "--timeout", "120", + ]) + .await; + assert!( + r.success, + "policy set B (repeat) should succeed (exit {:?}):\n{}", + r.exit_code, r.output + ); + + let r = run_cli(&["policy", "get", &guard.name]).await; + assert!(r.success, "policy get after B repeat should succeed:\n{}", r.output); + + let repeat_b_version = extract_version(&r.output) + .unwrap_or_else(|| panic!("could not parse version after B repeat:\n{}", r.output)); + assert_eq!( + repeat_b_version, new_version, + "same 
policy B should not bump version: expected {new_version}, got {repeat_b_version}" + ); + + // --- Verify policy list shows revision history --- + let r = run_cli(&["policy", "list", &guard.name]).await; + assert!( + r.success, + "policy list should succeed (exit {:?}):\n{}", + r.exit_code, r.output + ); + + // Both versions should appear in the list output. + assert!( + list_output_contains_version(&r.output, new_version), + "policy list should contain version {new_version}:\n{}", + r.output + ); + assert!( + list_output_contains_version(&r.output, initial_version), + "policy list should contain initial version {initial_version}:\n{}", + r.output + ); + + guard.cleanup().await; +} + +/// Test live policy update from an initially empty network policy: +/// +/// 1. Create sandbox with `--keep` +/// 2. Set policy with no network rules +/// 3. Push policy with a network rule using `--wait` +/// 4. Verify the version bumped +#[tokio::test] +async fn live_policy_update_from_empty_network_policies() { + let empty_policy = write_empty_network_policy().expect("write empty network policy"); + let full_policy = write_policy(&["example.com"]).expect("write full policy"); + + let empty_path = empty_policy + .path() + .to_str() + .expect("empty policy path should be utf-8") + .to_string(); + let full_path = full_policy + .path() + .to_str() + .expect("full policy path should be utf-8") + .to_string(); + + // Create sandbox with empty network policy. + let mut guard = SandboxGuard::create_keep( + &["sh", "-c", "echo Ready && sleep infinity"], + "Ready", + ) + .await + .expect("create keep sandbox"); + + // Set initial empty policy. 
+ let r = run_cli(&[ + "policy", "set", &guard.name, "--policy", &empty_path, "--wait", "--timeout", "120", + ]) + .await; + assert!( + r.success, + "policy set (empty) should succeed (exit {:?}):\n{}", + r.exit_code, r.output + ); + + let r = run_cli(&["policy", "get", &guard.name]).await; + assert!(r.success, "policy get (empty) should succeed:\n{}", r.output); + + let initial_version = extract_version(&r.output) + .unwrap_or_else(|| panic!("could not parse version from empty policy:\n{}", r.output)); + + // Push policy with network rules. + let r = run_cli(&[ + "policy", "set", &guard.name, "--policy", &full_path, "--wait", "--timeout", "120", + ]) + .await; + assert!( + r.success, + "policy set (full) should succeed (exit {:?}):\n{}", + r.exit_code, r.output + ); + + let r = run_cli(&["policy", "get", &guard.name]).await; + assert!(r.success, "policy get (full) should succeed:\n{}", r.output); + + let new_version = extract_version(&r.output).unwrap_or_else(|| { + panic!( + "could not parse version after adding network rules:\n{}", + r.output + ) + }); + assert!( + new_version > initial_version, + "adding network rules should create new version > {initial_version}, got {new_version}" + ); + + guard.cleanup().await; +} From eea495e6b9002dc611cf73daa893fb13a1a24dce Mon Sep 17 00:00:00 2001 From: "John T. Myers" <9696606+johntmyers@users.noreply.github.com> Date: Thu, 2 Apr 2026 20:32:59 -0700 Subject: [PATCH 4/9] fix: remediate 9 security findings from external audit (OS-15 through OS-23) (#744) * fix(install): restrict tar extraction to expected binary member Prevents CWE-22 path traversal by extracting only the expected APP_NAME member instead of the full archive contents. Adds --no-same-owner and --no-same-permissions for defense-in-depth. OS-20 * fix(deploy): quote registry credentials in YAML heredocs Wraps username/password values with a yaml_quote helper to prevent YAML injection from special characters in registry credentials (CWE-94). 
Applied to all three heredoc blocks that emit registries.yaml auth. OS-23 * fix(server): redact session token in SSH tunnel rate-limit log Logs only the last 4 characters of bearer tokens to prevent credential exposure in log aggregation systems (CWE-532). OS-18 * fix(server): escape gateway_display in auth connect page Applies html_escape() to the Host/X-Forwarded-Host header value before rendering it into the HTML template, preventing HTML injection (CWE-79). OS-17 * fix(server): prevent XSS via code param with validation and proper JS escaping Adds server-side validation rejecting confirmation codes that do not match the CLI-generated format, replaces manual JS string escaping with serde_json serialization (handling U+2028/U+2029 line terminators), and adds a Content-Security-Policy header with nonce-based script-src. OS-16 * fix(sandbox): add byte cap and idle timeout to streaming inference relay Prevents resource exhaustion from upstream inference endpoints that stream indefinitely or hold connections open. Adds a 32 MiB total body limit and 30-second per-chunk idle timeout (CWE-400). OS-21 * fix(policy): narrow port field from u32 to u16 to reject invalid values Prevents meaningless port values >65535 from being accepted in policy YAML definitions. The proto field remains uint32 (protobuf has no u16) with validation at the conversion boundary. OS-22 * fix(deps): migrate from archived serde_yaml to serde_yml Replaces serde_yaml 0.9 (archived, RUSTSEC-2024-0320) with serde_yml 0.0.12, a maintained API-compatible fork. All import sites updated across openshell-policy, openshell-sandbox, and openshell-router. OS-19 * fix(server): re-validate sandbox-submitted security_notes and cap hit_count The gateway now re-runs security heuristics on proposed policy chunks instead of trusting sandbox-provided security_notes, validates host wildcards, caps hit_count at 100, and clamps confidence to [0,1]. 
The TUI approve-all path is updated to use ApproveAllDraftChunks RPC which respects the security_notes filtering gate (CWE-284, confused deputy). OS-15 * chore: apply cargo fmt and update Cargo.lock for serde_yml --------- Co-authored-by: John Myers --- Cargo.lock | 45 +++++-- Cargo.toml | 2 +- crates/openshell-policy/Cargo.toml | 2 +- crates/openshell-policy/src/lib.rs | 39 ++++-- crates/openshell-router/Cargo.toml | 2 +- crates/openshell-router/src/config.rs | 2 +- crates/openshell-sandbox/Cargo.toml | 2 +- crates/openshell-sandbox/src/opa.rs | 2 +- crates/openshell-sandbox/src/proxy.rs | 33 ++++- crates/openshell-server/src/auth.rs | 139 +++++++++++++++++----- crates/openshell-server/src/grpc.rs | 64 ++++++++-- crates/openshell-server/src/ssh_tunnel.rs | 11 +- crates/openshell-tui/src/lib.rs | 75 ++++++------ deploy/docker/cluster-entrypoint.sh | 21 +++- install.sh | 2 +- 15 files changed, 326 insertions(+), 115 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 7d20c9bd8..852d97a0c 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -125,7 +125,7 @@ version = "1.1.5" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "40c48f72fd53cd289104fc64099abca73db4166ad86ea0b4341abe65af83dadc" dependencies = [ - "windows-sys 0.60.2", + "windows-sys 0.61.2", ] [[package]] @@ -136,7 +136,7 @@ checksum = "291e6a250ff86cd4a820112fb8898808a366d8f9f58ce16d1f538353ad55747d" dependencies = [ "anstyle", "once_cell_polyfill", - "windows-sys 0.60.2", + "windows-sys 0.61.2", ] [[package]] @@ -1283,7 +1283,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "39cab71617ae0d63f51a36d69f866391735b51691dbda63cf6f96d042b63efeb" dependencies = [ "libc", - "windows-sys 0.52.0", + "windows-sys 0.61.2", ] [[package]] @@ -2497,6 +2497,16 @@ dependencies = [ "vcpkg", ] +[[package]] +name = "libyml" +version = "0.0.5" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = 
"3302702afa434ffa30847a83305f0a69d6abd74293b6554c18ec85c7ef30c980" +dependencies = [ + "anyhow", + "version_check", +] + [[package]] name = "linux-raw-sys" version = "0.4.15" @@ -2691,7 +2701,7 @@ version = "0.50.3" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "7957b9740744892f114936ab4a57b3f487491bbeafaf8083688b16841a4240e5" dependencies = [ - "windows-sys 0.59.0", + "windows-sys 0.61.2", ] [[package]] @@ -2902,7 +2912,7 @@ dependencies = [ "miette", "openshell-core", "serde", - "serde_yaml", + "serde_yml", ] [[package]] @@ -2922,7 +2932,7 @@ dependencies = [ "reqwest", "serde", "serde_json", - "serde_yaml", + "serde_yml", "tempfile", "thiserror 2.0.18", "tokio", @@ -2958,7 +2968,7 @@ dependencies = [ "rustls-pemfile", "seccompiler", "serde_json", - "serde_yaml", + "serde_yml", "sha2 0.10.9", "temp-env", "tempfile", @@ -4044,7 +4054,7 @@ dependencies = [ "errno", "libc", "linux-raw-sys 0.12.1", - "windows-sys 0.52.0", + "windows-sys 0.61.2", ] [[package]] @@ -4348,6 +4358,21 @@ dependencies = [ "unsafe-libyaml", ] +[[package]] +name = "serde_yml" +version = "0.0.12" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "59e2dd588bf1597a252c3b920e0143eb99b0f76e4e082f4c92ce34fbc9e71ddd" +dependencies = [ + "indexmap 2.13.0", + "itoa", + "libyml", + "memchr", + "ryu", + "serde", + "version_check", +] + [[package]] name = "serdect" version = "0.4.2" @@ -4519,7 +4544,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "3a766e1110788c36f4fa1c2b71b387a7815aa65f88ce0229841826633d93723e" dependencies = [ "libc", - "windows-sys 0.60.2", + "windows-sys 0.61.2", ] [[package]] @@ -4930,7 +4955,7 @@ dependencies = [ "getrandom 0.4.2", "once_cell", "rustix 1.1.4", - "windows-sys 0.52.0", + "windows-sys 0.61.2", ] [[package]] diff --git a/Cargo.toml b/Cargo.toml index 4fecf1940..08b699d47 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -64,7 +64,7 @@ nix = { version = "0.29", features = ["signal", 
"process", "user", "fs", "term"] # Serialization serde = { version = "1", features = ["derive"] } serde_json = "1" -serde_yaml = "0.9" +serde_yml = "0.0.12" # HTTP client reqwest = { version = "0.12", default-features = false, features = ["json", "rustls-tls"] } diff --git a/crates/openshell-policy/Cargo.toml b/crates/openshell-policy/Cargo.toml index 311bb4e86..f26136c6b 100644 --- a/crates/openshell-policy/Cargo.toml +++ b/crates/openshell-policy/Cargo.toml @@ -13,7 +13,7 @@ repository.workspace = true [dependencies] openshell-core = { path = "../openshell-core" } serde = { workspace = true } -serde_yaml = { workspace = true } +serde_yml = { workspace = true } miette = { workspace = true } [lints] diff --git a/crates/openshell-policy/src/lib.rs b/crates/openshell-policy/src/lib.rs index 7adb4dfda..9cf543bdf 100644 --- a/crates/openshell-policy/src/lib.rs +++ b/crates/openshell-policy/src/lib.rs @@ -82,11 +82,12 @@ struct NetworkEndpointDef { #[serde(default, skip_serializing_if = "String::is_empty")] host: String, /// Single port (backwards compat). Mutually exclusive with `ports`. + /// Uses `u16` to reject invalid values >65535 at parse time. #[serde(default, skip_serializing_if = "is_zero")] - port: u32, + port: u16, /// Multiple ports. When non-empty, this endpoint covers all listed ports. #[serde(default, skip_serializing_if = "Vec::is_empty")] - ports: Vec, + ports: Vec, #[serde(default, skip_serializing_if = "String::is_empty")] protocol: String, #[serde(default, skip_serializing_if = "String::is_empty")] @@ -101,7 +102,7 @@ struct NetworkEndpointDef { allowed_ips: Vec, } -fn is_zero(v: &u32) -> bool { +fn is_zero(v: &u16) -> bool { *v == 0 } @@ -169,10 +170,10 @@ fn to_proto(raw: PolicyFile) -> SandboxPolicy { .map(|e| { // Normalize port/ports: ports takes precedence, else // single port is promoted to ports array. 
- let normalized_ports = if !e.ports.is_empty() { - e.ports + let normalized_ports: Vec = if !e.ports.is_empty() { + e.ports.into_iter().map(u32::from).collect() } else if e.port > 0 { - vec![e.port] + vec![u32::from(e.port)] } else { vec![] }; @@ -285,10 +286,12 @@ fn from_proto(policy: &SandboxPolicy) -> PolicyFile { .map(|e| { // Use compact form: if ports has exactly 1 element, // emit port (scalar). If >1, emit ports (array). + // Proto uses u32; YAML uses u16. Clamp at boundary. + let clamp = |v: u32| -> u16 { v.min(65535) as u16 }; let (port, ports) = if e.ports.len() > 1 { - (0, e.ports.clone()) + (0, e.ports.iter().map(|&p| clamp(p)).collect()) } else { - (e.ports.first().copied().unwrap_or(e.port), vec![]) + (clamp(e.ports.first().copied().unwrap_or(e.port)), vec![]) }; NetworkEndpointDef { host: e.host.clone(), @@ -358,7 +361,7 @@ fn from_proto(policy: &SandboxPolicy) -> PolicyFile { /// Parse a sandbox policy from a YAML string. pub fn parse_sandbox_policy(yaml: &str) -> Result { - let raw: PolicyFile = serde_yaml::from_str(yaml) + let raw: PolicyFile = serde_yml::from_str(yaml) .into_diagnostic() .wrap_err("failed to parse sandbox policy YAML")?; Ok(to_proto(raw)) @@ -371,7 +374,7 @@ pub fn parse_sandbox_policy(yaml: &str) -> Result { /// and is round-trippable through `parse_sandbox_policy`. 
pub fn serialize_sandbox_policy(policy: &SandboxPolicy) -> Result { let yaml_repr = from_proto(policy); - serde_yaml::to_string(&yaml_repr) + serde_yml::to_string(&yaml_repr) .into_diagnostic() .wrap_err("failed to serialize policy to YAML") } @@ -1207,4 +1210,20 @@ network_policies: proto2.network_policies["test"].endpoints[0].host ); } + + #[test] + fn rejects_port_above_65535() { + let yaml = r#" +version: 1 +network_policies: + test: + endpoints: + - host: example.com + port: 70000 +"#; + assert!( + parse_sandbox_policy(yaml).is_err(), + "port >65535 should fail to parse" + ); + } } diff --git a/crates/openshell-router/Cargo.toml b/crates/openshell-router/Cargo.toml index dc8e9c924..e4c3d5ea7 100644 --- a/crates/openshell-router/Cargo.toml +++ b/crates/openshell-router/Cargo.toml @@ -19,7 +19,7 @@ serde_json = { workspace = true } thiserror = { workspace = true } tracing = { workspace = true } tokio = { workspace = true } -serde_yaml = { workspace = true } +serde_yml = { workspace = true } uuid = { workspace = true } [dev-dependencies] diff --git a/crates/openshell-router/src/config.rs b/crates/openshell-router/src/config.rs index 52c22da9f..b531e091d 100644 --- a/crates/openshell-router/src/config.rs +++ b/crates/openshell-router/src/config.rs @@ -75,7 +75,7 @@ impl RouterConfig { path.display() )) })?; - let config: Self = serde_yaml::from_str(&content).map_err(|e| { + let config: Self = serde_yml::from_str(&content).map_err(|e| { RouterError::Internal(format!( "failed to parse router config {}: {e}", path.display() diff --git a/crates/openshell-sandbox/Cargo.toml b/crates/openshell-sandbox/Cargo.toml index 68e696e95..e8e7e2c97 100644 --- a/crates/openshell-sandbox/Cargo.toml +++ b/crates/openshell-sandbox/Cargo.toml @@ -60,7 +60,7 @@ ipnet = "2" # Serialization serde_json = { workspace = true } -serde_yaml = { workspace = true } +serde_yml = { workspace = true } # Logging tracing = { workspace = true } diff --git a/crates/openshell-sandbox/src/opa.rs 
b/crates/openshell-sandbox/src/opa.rs index f1df12ff4..f1c0ad293 100644 --- a/crates/openshell-sandbox/src/opa.rs +++ b/crates/openshell-sandbox/src/opa.rs @@ -511,7 +511,7 @@ fn parse_process_policy(val: ®orus::Value) -> ProcessPolicy { /// Preprocess YAML policy data: parse, normalize, validate, expand access presets, return JSON. fn preprocess_yaml_data(yaml_str: &str) -> Result { - let mut data: serde_json::Value = serde_yaml::from_str(yaml_str) + let mut data: serde_json::Value = serde_yml::from_str(yaml_str) .map_err(|e| miette::miette!("failed to parse YAML data: {e}"))?; // Normalize port → ports for all endpoints so Rego always sees "ports" array. diff --git a/crates/openshell-sandbox/src/proxy.rs b/crates/openshell-sandbox/src/proxy.rs index a7df76e2f..9e87450d4 100644 --- a/crates/openshell-sandbox/src/proxy.rs +++ b/crates/openshell-sandbox/src/proxy.rs @@ -23,6 +23,12 @@ use tracing::{debug, info, warn}; const MAX_HEADER_BYTES: usize = 8192; const INFERENCE_LOCAL_HOST: &str = "inference.local"; +/// Maximum total bytes for a streaming inference response body (32 MiB). +const MAX_STREAMING_BODY: usize = 32 * 1024 * 1024; + +/// Idle timeout per chunk when relaying streaming inference responses. +const CHUNK_IDLE_TIMEOUT: std::time::Duration = std::time::Duration::from_secs(30); + /// Result of a proxy CONNECT policy decision. struct ConnectDecision { action: NetworkAction, @@ -1045,18 +1051,35 @@ async fn route_inference_request( let header_bytes = format_http_response_header(resp.status, &resp_headers); write_all(tls_client, &header_bytes).await?; - // Stream body chunks as they arrive from the upstream. + // Stream body chunks with byte cap and idle timeout. 
+ let mut total_bytes: usize = 0; loop { - match resp.next_chunk().await { - Ok(Some(chunk)) => { + match tokio::time::timeout(CHUNK_IDLE_TIMEOUT, resp.next_chunk()).await { + Ok(Ok(Some(chunk))) => { + total_bytes += chunk.len(); + if total_bytes > MAX_STREAMING_BODY { + warn!( + total_bytes = total_bytes, + limit = MAX_STREAMING_BODY, + "streaming response exceeded byte limit, truncating" + ); + break; + } let encoded = format_chunk(&chunk); write_all(tls_client, &encoded).await?; } - Ok(None) => break, - Err(e) => { + Ok(Ok(None)) => break, + Ok(Err(e)) => { warn!(error = %e, "error reading upstream response chunk"); break; } + Err(_) => { + warn!( + idle_timeout_secs = CHUNK_IDLE_TIMEOUT.as_secs(), + "streaming response chunk idle timeout, closing" + ); + break; + } } } diff --git a/crates/openshell-server/src/auth.rs b/crates/openshell-server/src/auth.rs index 5a3229ffa..b896d062c 100644 --- a/crates/openshell-server/src/auth.rs +++ b/crates/openshell-server/src/auth.rs @@ -22,11 +22,28 @@ use axum::{ response::{Html, IntoResponse}, routing::get, }; +use http::header; use serde::Deserialize; use std::sync::Arc; use crate::ServerState; +/// Validate that a confirmation code matches the CLI-generated format. +/// +/// Codes are 3 alphanumeric characters, a dash, then 4 alphanumeric characters +/// (e.g., "AB7-X9KM"). The CLI generates these from the charset `[A-Z2-9]`. +fn is_valid_code(code: &str) -> bool { + let bytes = code.as_bytes(); + bytes.len() == 8 + && bytes[3] == b'-' + && bytes[..3] + .iter() + .all(|b| b.is_ascii_uppercase() || b.is_ascii_digit()) + && bytes[4..] + .iter() + .all(|b| b.is_ascii_uppercase() || b.is_ascii_digit()) +} + #[derive(Deserialize)] struct ConnectParams { callback_port: u16, @@ -54,6 +71,15 @@ async fn auth_connect( Query(params): Query, headers: HeaderMap, ) -> impl IntoResponse { + // Reject codes that don't match the CLI-generated format to prevent + // reflected XSS via crafted URLs. 
+ if !is_valid_code(¶ms.code) { + return Html( + "

Invalid confirmation code format.

".to_string(), + ) + .into_response(); + } + let cf_token = headers .get("cookie") .and_then(|v| v.to_str().ok()) @@ -68,14 +94,34 @@ async fn auth_connect( .and_then(|v| v.to_str().ok()) .map_or_else(|| state.config.bind_address.to_string(), String::from); + let safe_gateway = html_escape(&gateway_display); + match cf_token { - Some(token) => Html(render_connect_page( - &gateway_display, - params.callback_port, - &token, - &params.code, - )), - None => Html(render_waiting_page(params.callback_port, &params.code)), + Some(token) => { + let nonce = uuid::Uuid::new_v4().to_string(); + let csp = format!( + "default-src 'none'; script-src 'nonce-{nonce}'; style-src 'unsafe-inline'; connect-src http://127.0.0.1:*" + ); + ( + [(header::CONTENT_SECURITY_POLICY, csp)], + Html(render_connect_page( + &safe_gateway, + params.callback_port, + &token, + &params.code, + &nonce, + )), + ) + .into_response() + } + None => { + let csp = "default-src 'none'; style-src 'unsafe-inline'".to_string(); + ( + [(header::CONTENT_SECURITY_POLICY, csp)], + Html(render_waiting_page(params.callback_port, &params.code)), + ) + .into_response() + } } } @@ -104,22 +150,27 @@ fn render_connect_page( callback_port: u16, cf_token: &str, code: &str, + nonce: &str, ) -> String { - // Escape the token for safe embedding in a JS string literal. - let escaped_token = cf_token - .replace('\\', "\\\\") - .replace('\'', "\\'") - .replace('"', "\\\"") - .replace('<', "\\x3c") - .replace('>', "\\x3e"); + // Use JSON serialization for JS-safe string embedding — handles all + // edge cases including \n, \r, U+2028, U+2029 that break JS string + // literals. serde_json::to_string produces a quoted JSON string + // (e.g., "value") which is a valid JS string literal. + // + // We additionally escape < and > to \u003c / \u003e because while + // they're valid in JSON, they're dangerous inside an HTML <script> + // block (a literal </script> would close the script element before the JS parser runs). 
+ let json_token = serde_json::to_string(cf_token) + .unwrap_or_else(|_| "\"\"".to_string()) + .replace('<', "\\u003c") + .replace('>', "\\u003e"); + let json_code = serde_json::to_string(code) + .unwrap_or_else(|_| "\"\"".to_string()) + .replace('<', "\\u003c") + .replace('>', "\\u003e"); - // Escape the code the same way (it's alphanumeric + dash, but be safe). - let escaped_code = code - .replace('\\', "\\\\") - .replace('\'', "\\'") - .replace('"', "\\\"") - .replace('<', "\\x3c") - .replace('>', "\\x3e"); + // HTML-safe version of the code for display in the page body. + let html_code = html_escape(code); let version = openshell_core::VERSION; @@ -250,7 +301,7 @@ fn render_connect_page(
Connect to Gateway
Confirmation Code
-
{escaped_code}
+
{html_code}
Verify this matches the code shown in your terminal
@@ -271,9 +322,9 @@ fn render_connect_page(
- ", "ABC-1234"); - // < and > should be escaped + let html = render_connect_page( + "gw", + 1234, + "token", + "ABC-1234", + "nonce", + ); + // < and > should be escaped via JSON encoding (\u003c) assert!(!html.contains("