From 5bba1b726711aa7720ce27156692ad8ae3140efb Mon Sep 17 00:00:00 2001
From: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
Date: Wed, 24 Jun 2026 09:43:23 -0300
Subject: [PATCH 1/9] feat(wxc_common): add the sandbox execution interfaces
 (SandboxBackend / SandboxProcess / Runner)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Introduce the shared, no-pty execution surface that the containment backends
and a future in-process library build on. Purely additive: no existing code
path uses these yet, so behavior is unchanged.

- `SandboxProcess` — a handle to a running sandboxed child: `take_stdin` /
  `take_stdout` / `take_stderr`, `try_wait`, `id`, `kill` (process-tree), and
  `wait` (drains any untaken stdio, honors `scriptTimeout`), plus stdout/stderr
  closers for abandoning a backgrounded-descendant-held read without a kill.
- `SandboxBackend` — `validate` + `spawn(request, logger, StdioMode) ->
  SandboxProcess` + a `diagnose_exit` hook; `StdioMode::{Pipes, Inherit}`.
- `Runner<B>` — the generic adapter bridging any `SandboxBackend` to the
  run-to-completion `ScriptRunner` (spawn `Inherit`, then `wait`).
- `StreamCloser`, `group_kill` (Unix leader-first SIGKILL of the child's group),
  and `wait_with_timeout` (adaptive 1ms->50ms backoff poll).
- `interruptible_reader` (Unix self-pipe + `poll`) and the Windows pipe helpers
  in `process_util` (`InterruptiblePipeReader` / `PipeReadCanceller` /
  `create_std_pipes`) for out-of-band-cancelable streaming reads.
- `FailurePhase::Timeout` so a timeout is distinguishable from other failures.

The library backends and executor binaries are migrated onto this surface in a
follow-up PR, and the importable `mxc-sdk` crate is built on top of it.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
Signed-off-by: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
---
 src/core/wxc_common/Cargo.toml                |   2 +-
 .../wxc_common/src/interruptible_reader.rs    | 293 +++++++++++
 src/core/wxc_common/src/lib.rs                |   5 +
 src/core/wxc_common/src/models.rs             |   5 +
 src/core/wxc_common/src/process_util.rs       | 227 ++++++++-
 src/core/wxc_common/src/sandbox_process.rs    | 475 ++++++++++++++++++
 6 files changed, 1005 insertions(+), 2 deletions(-)
 create mode 100644 src/core/wxc_common/src/interruptible_reader.rs
 create mode 100644 src/core/wxc_common/src/sandbox_process.rs
diff --git a/src/core/wxc_common/Cargo.toml b/src/core/wxc_common/Cargo.toml
index e6dcf35b8..bca51a80f 100644
--- a/src/core/wxc_common/Cargo.toml
+++ b/src/core/wxc_common/Cargo.toml
@@ -28,7 +28,7 @@ windows-core = { workspace = true }
 widestring = { workspace = true }
 winreg = { workspace = true }
 
-[target.'cfg(target_os = "linux")'.dependencies]
+[target.'cfg(unix)'.dependencies]
 libc = { workspace = true }
 
 [dev-dependencies]
diff --git a/src/core/wxc_common/src/interruptible_reader.rs b/src/core/wxc_common/src/interruptible_reader.rs
new file mode 100644
index 000000000..1cc01bb11
--- /dev/null
+++ b/src/core/wxc_common/src/interruptible_reader.rs
@@ -0,0 +1,293 @@
+// Copyright (c) Microsoft Corporation.
+// Licensed under the MIT License.
+
+//! A Unix pipe reader whose `read` can be cancelled out-of-band.
+//!
+//! The in-tree Unix backends (Seatbelt, Bubblewrap) hand the caller the child's
+//! raw stdout/stderr pipe, where a blocking `read` only ends at EOF — when every
+//! write end closes. A backgrounded descendant that inherited the pipe can hold
+//! its write end open past the foreground command's exit, leaving such a read
+//! parked indefinitely. [`InterruptibleReader`] wraps the pipe so a separate
+//! [`ReadCanceller`] (a [`StreamCloser`]) can make that read return EOF
+//! (`Ok(0)`) promptly, without killing the child.
+//!
+//! It uses a self-pipe + `poll(2)`: the read fd is set non-blocking and the
+//! reader blocks in `poll` on both the data pipe and the read end of a
+//! self-pipe; cancellation writes a byte to the self-pipe (waking the `poll`)
+//! and sets a flag so later reads short-circuit to EOF.
+
+use std::io::{self, Read};
+use std::os::fd::{AsRawFd, FromRawFd, OwnedFd, RawFd};
+use std::sync::atomic::{AtomicBool, Ordering};
+use std::sync::Arc;
+
+use crate::sandbox_process::StreamCloser;
+
+/// Cancellation state shared between an [`InterruptibleReader`] and the
+/// [`ReadCanceller`]s minted from it: the write end of the self-pipe used to
+/// wake the reader's `poll`, plus a flag so a read after cancellation returns
+/// EOF without touching the data pipe.
+struct CancelState {
+    cancelled: AtomicBool,
+    /// Write end of the self-pipe; one byte here wakes the reader's `poll`.
+    wake_w: OwnedFd,
+}
+
+impl CancelState {
+    /// Mark cancelled (once) and nudge the reader's `poll` awake.
+    fn cancel(&self) {
+        // Flag first so a read that wakes observes EOF, then wake the poll. If
+        // we were already cancelled, do nothing — `close` is idempotent.
+        if self.cancelled.swap(true, Ordering::Release) {
+            return;
+        }
+        // A single byte makes `poll` return. The self-pipe write end is
+        // non-blocking, so this never blocks; ignore the result — `EAGAIN`
+        // (a wake byte is already pending) and `EPIPE` (the reader's end has
+        // been dropped) are both fine.
+        let byte = [0u8; 1];
+        // SAFETY: `wake_w` is a valid, owned, non-blocking pipe write fd; the
+        // buffer is a valid 1-byte local.
+        unsafe {
+            libc::write(self.wake_w.as_raw_fd(), byte.as_ptr().cast(), 1);
+        }
+    }
+}
+
+/// A [`StreamCloser`] for an [`InterruptibleReader`]. Cloneable and `Send +
+/// Sync` so several may be held (and fired from any thread); all share one
+/// cancellation state, and `close` is idempotent.
+#[derive(Clone)]
+pub struct ReadCanceller(Arc<CancelState>);
+
+impl StreamCloser for ReadCanceller {
+    fn close(&self) {
+        self.0.cancel();
+    }
+}
+
+/// A readable pipe whose `read` can be cancelled via a [`ReadCanceller`].
+///
+/// Implements [`Read`]: it blocks in `poll(2)` on the data pipe and a self-pipe
+/// and returns the next chunk, real EOF (`Ok(0)`), or — once a paired
+/// [`ReadCanceller::close`] fires — a prompt cancellation EOF (`Ok(0)`).
+pub struct InterruptibleReader {
+    /// The child's stdout/stderr pipe, set non-blocking.
+    fd: OwnedFd,
+    /// Read end of the self-pipe; readable once cancellation writes its byte.
+    wake_r: OwnedFd,
+    state: Arc<CancelState>,
+}
+
+impl InterruptibleReader {
+    /// Wrap an owned readable pipe `fd` so its reads can be cancelled out-of-band.
+    /// Sets `fd` non-blocking and creates the close-on-exec self-pipe for wakeups.
+    ///
+    /// # Errors
+    ///
+    /// Returns the underlying [`io::Error`] if the self-pipe cannot be created
+    /// or configured, or if `fd` cannot be switched to non-blocking mode.
+    pub fn new(fd: OwnedFd) -> io::Result<Self> {
+        set_nonblocking(fd.as_raw_fd())?;
+        let mut fds = [0 as RawFd; 2];
+        // SAFETY: `fds` is a valid 2-element array for `pipe` to fill.
+        if unsafe { libc::pipe(fds.as_mut_ptr()) } < 0 {
+            return Err(io::Error::last_os_error());
+        }
+        // SAFETY: `pipe` succeeded, so both fds are freshly owned by us.
+        let wake_r = unsafe { OwnedFd::from_raw_fd(fds[0]) };
+        let wake_w = unsafe { OwnedFd::from_raw_fd(fds[1]) };
+        // SAFETY: both fds are open. FD_CLOEXEC keeps them out of later-spawned children.
+        if fds.iter().any(|&w| unsafe { libc::fcntl(w, libc::F_SETFD, libc::FD_CLOEXEC) } < 0) {
+            return Err(io::Error::last_os_error());
+        }
+        // Non-blocking write end so `cancel` never stalls; read end is only polled.
+        set_nonblocking(wake_w.as_raw_fd())?;
+        Ok(Self {
+            fd,
+            wake_r,
+            state: Arc::new(CancelState {
+                cancelled: AtomicBool::new(false),
+                wake_w,
+            }),
+        })
+    }
+
+    /// Mint a closer that EOFs this reader's `read` on demand. Several closers
+    /// may be minted; they share one cancellation state.
+    pub fn canceller(&self) -> ReadCanceller {
+        ReadCanceller(Arc::clone(&self.state))
+    }
+}
+
+/// Wrap an optional child pipe end into an [`InterruptibleReader`] plus a
+/// [`ReadCanceller`] for its [`StreamCloser`]. `None` (inherited stdio) stays
+/// `None` for both. Convenience for the Unix backends, which hold `ChildStdout`
+/// / `ChildStderr` (both `Into<OwnedFd>`).
+///
+/// # Errors
+///
+/// Propagates any [`io::Error`] from [`InterruptibleReader::new`].
+pub fn wrap_pipe<T: Into<OwnedFd>>(
+    pipe: Option<T>,
+) -> io::Result<(Option<InterruptibleReader>, Option<ReadCanceller>)> {
+    // Inherited stdio (`None`) has nothing to wrap: both halves stay `None`.
+    let Some(reader) = pipe.map(|p| InterruptibleReader::new(p.into())).transpose()? else {
+        return Ok((None, None));
+    };
+    let closer = reader.canceller();
+    Ok((Some(reader), Some(closer)))
+}
+
+impl Read for InterruptibleReader {
+    fn read(&mut self, buf: &mut [u8]) -> io::Result<usize> {
+        // A zero-length read must return `Ok(0)` immediately (the `Read`
+        // contract), never block in `poll`.
+        if buf.is_empty() {
+            return Ok(0);
+        }
+        // Already cancelled: report EOF without touching the data pipe.
+        if self.state.cancelled.load(Ordering::Acquire) {
+            return Ok(0);
+        }
+        loop {
+            let mut poll_fds = [
+                libc::pollfd {
+                    fd: self.fd.as_raw_fd(),
+                    events: libc::POLLIN,
+                    revents: 0,
+                },
+                libc::pollfd {
+                    fd: self.wake_r.as_raw_fd(),
+                    events: libc::POLLIN,
+                    revents: 0,
+                },
+            ];
+            // SAFETY: `poll_fds` is a valid 2-element array of pollfds; both
+            // fds are owned and live for the duration of the call.
+            let rc = unsafe { libc::poll(poll_fds.as_mut_ptr(), 2, -1) };
+            if rc < 0 {
+                let err = io::Error::last_os_error();
+                if err.kind() == io::ErrorKind::Interrupted {
+                    continue;
+                }
+                return Err(err);
+            }
+
+            // Cancellation wins over any pending data so a held-open pipe is
+            // abandoned promptly.
+            if self.state.cancelled.load(Ordering::Acquire) || poll_fds[1].revents != 0 {
+                return Ok(0);
+            }
+
+            if poll_fds[0].revents != 0 {
+                // SAFETY: `fd` is owned and `buf` is a valid writable slice.
+                let n =
+                    unsafe { libc::read(self.fd.as_raw_fd(), buf.as_mut_ptr().cast(), buf.len()) };
+                if n >= 0 {
+                    return Ok(n as usize);
+                }
+                let err = io::Error::last_os_error();
+                match err.raw_os_error() {
+                    // Spurious readiness (nothing buffered, yet a writer is still
+                    // open, so this is not EOF): loop and re-poll.
+                    Some(libc::EAGAIN) => continue,
+                    _ if err.kind() == io::ErrorKind::Interrupted => continue,
+                    _ => return Err(err),
+                }
+            }
+        }
+    }
+}
+
+/// Add `O_NONBLOCK` to `fd`'s file-status flags.
+fn set_nonblocking(fd: RawFd) -> io::Result<()> {
+    // SAFETY: `fd` is a valid open fd; `F_GETFL` only reads its status flags.
+    let current = unsafe { libc::fcntl(fd, libc::F_GETFL) };
+    if current < 0 {
+        return Err(io::Error::last_os_error());
+    }
+    // SAFETY: as above; `F_SETFL` only rewrites the fd's status flags.
+    match unsafe { libc::fcntl(fd, libc::F_SETFL, current | libc::O_NONBLOCK) } {
+        rc if rc < 0 => Err(io::Error::last_os_error()),
+        _ => Ok(()),
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use std::io::Write;
+    use std::time::{Duration, Instant};
+
+    /// Build an `InterruptibleReader` over a fresh pipe, returning it plus the
+    /// write end so a test can feed it bytes.
+    fn reader_with_writer() -> (InterruptibleReader, OwnedFd) {
+        let mut fds = [0 as RawFd; 2];
+        assert!(unsafe { libc::pipe(fds.as_mut_ptr()) } == 0, "pipe");
+        let read_end = unsafe { OwnedFd::from_raw_fd(fds[0]) };
+        let write_end = unsafe { OwnedFd::from_raw_fd(fds[1]) };
+        let reader = InterruptibleReader::new(read_end).expect("wrap reader");
+        (reader, write_end)
+    }
+
+    #[test]
+    fn reads_data_then_eof_on_writer_close() {
+        let (mut reader, write_end) = reader_with_writer();
+        let mut writer = std::fs::File::from(write_end);
+        writer.write_all(b"hello").expect("write");
+        drop(writer); // close write end -> EOF after the data
+
+        let mut buf = [0u8; 16];
+        let n = reader.read(&mut buf).expect("read data");
+        assert_eq!(&buf[..n], b"hello");
+        assert_eq!(reader.read(&mut buf).expect("read eof"), 0);
+    }
+
+    #[test]
+    fn zero_length_read_returns_ok_zero_without_blocking() {
+        // The write end stays open, so a normal read would block; a zero-length
+        // read must still return Ok(0) immediately per the `Read` contract.
+        let (mut reader, _write_end) = reader_with_writer();
+        let mut empty: [u8; 0] = [];
+        assert_eq!(reader.read(&mut empty).expect("zero-length read"), 0);
+    }
+
+    #[test]
+    fn close_unblocks_a_parked_read_without_writer_close() {
+        // The write end stays open for the whole test, so a plain read would
+        // block forever; the canceller must EOF it promptly.
+        let (reader, _write_end) = reader_with_writer();
+        let canceller = reader.canceller();
+        let mut reader = reader;
+
+        let handle = std::thread::spawn(move || {
+            let mut buf = [0u8; 16];
+            let start = Instant::now();
+            let n = reader.read(&mut buf).expect("read returns");
+            (n, start.elapsed())
+        });
+
+        std::thread::sleep(Duration::from_millis(50));
+        canceller.close();
+
+        let (n, elapsed) = handle.join().expect("reader thread");
+        assert_eq!(n, 0, "cancelled read reports EOF");
+        assert!(
+            elapsed < Duration::from_secs(5),
+            "read should return promptly after close, took {elapsed:?}"
+        );
+    }
+
+    #[test]
+    fn close_is_idempotent_and_reads_stay_eof() {
+        let (mut reader, _write_end) = reader_with_writer();
+        let canceller = reader.canceller();
+        canceller.close();
+        canceller.close(); // second call is a no-op
+
+        let mut buf = [0u8; 16];
+        assert_eq!(reader.read(&mut buf).expect("eof"), 0);
+        assert_eq!(reader.read(&mut buf).expect("still eof"), 0);
+    }
+}
diff --git a/src/core/wxc_common/src/lib.rs b/src/core/wxc_common/src/lib.rs
index f6af283b6..9165e7441 100644
--- a/src/core/wxc_common/src/lib.rs
+++ b/src/core/wxc_common/src/lib.rs
@@ -14,6 +14,7 @@ pub mod logger;
 pub mod microvm_staging;
 pub mod models;
 pub mod mxc_error;
+pub mod sandbox_process;
 pub mod script_runner;
 pub mod state_aware_backend;
 pub mod state_aware_dispatch;
@@ -40,6 +41,10 @@ pub mod process_util;
 #[cfg(target_os = "windows")]
 pub mod string_util;
 
+// Unix-specific modules (shared by the Seatbelt and Bubblewrap backends).
+#[cfg(unix)]
+pub mod interruptible_reader;
+
 // Linux-specific modules
 #[cfg(target_os = "linux")]
 pub mod linux_proxy_coordinator;
diff --git a/src/core/wxc_common/src/models.rs b/src/core/wxc_common/src/models.rs
index c5ff37e6d..29a41f21e 100644
--- a/src/core/wxc_common/src/models.rs
+++ b/src/core/wxc_common/src/models.rs
@@ -592,6 +592,11 @@ pub enum FailurePhase {
     LaunchFailed,
     /// The process was created but exited with a non-zero code.
     ProcessExited,
+    /// The process was force-terminated because it exceeded `scriptTimeout`.
+    /// Distinct from [`ProcessExited`] (it did not exit on its own) so callers
+    /// can detect a timeout uniformly across backends rather than inferring it
+    /// from `exit_code == -1` (which collides with other failures).
+    Timeout,
     /// The selected containment backend is unavailable on this host: the API is
     /// missing, or present but not usable (e.g. feature-disabled). Distinct from
     /// [`LaunchFailed`] so callers can fall back to a lower tier rather than
diff --git a/src/core/wxc_common/src/process_util.rs b/src/core/wxc_common/src/process_util.rs
index 14605e059..2c89f56dc 100644
--- a/src/core/wxc_common/src/process_util.rs
+++ b/src/core/wxc_common/src/process_util.rs
@@ -2,8 +2,11 @@
 // Licensed under the MIT License.
 
 use std::path::PathBuf;
+use std::sync::{Arc, Mutex, Weak};
+use std::time::Duration;
 
 use crate::error::WxcError;
+use crate::sandbox_process::StreamCloser;
 use crate::string_util;
 
 use windows::Win32::Foundation::{
@@ -11,12 +14,234 @@ use windows::Win32::Foundation::{
     HLOCAL, WAIT_OBJECT_0,
 };
 use windows::Win32::Security::{DeriveCapabilitySidsFromName, PSID, SECURITY_ATTRIBUTES};
-use windows::Win32::Storage::FileSystem::ReadFile;
+use windows::Win32::Storage::FileSystem::{ReadFile, WriteFile};
 use windows::Win32::System::Pipes::CreatePipe;
 use windows::Win32::System::Threading::WaitForSingleObject;
+use windows::Win32::System::IO::CancelIoEx;
 use windows_core::BOOL;
 use windows_core::PCWSTR;
 
+/// A readable end of an anonymous pipe (e.g. the child's stdout/stderr),
+/// owning the handle and closing it on drop. Implements [`std::io::Read`]
+/// via `ReadFile`; a broken pipe (all write ends closed) reads as EOF.
+/// `Send` so it can be handed to a reader thread.
+pub struct PipeReader(SendOwnedHandle);
+
+impl PipeReader {
+    /// Take ownership of `handle` (invalidating the source `OwnedHandle`).
+    pub fn new(mut handle: OwnedHandle) -> Self {
+        Self(SendOwnedHandle::take(&mut handle))
+    }
+}
+
+impl std::io::Read for PipeReader {
+    fn read(&mut self, buf: &mut [u8]) -> std::io::Result<usize> {
+        use windows::Win32::Foundation::ERROR_BROKEN_PIPE;
+        let mut read: u32 = 0;
+        // SAFETY: `self.0` owns a valid pipe handle for the lifetime of this
+        // `PipeReader`; `buf`/`read` are valid local out-params for the call.
+        match unsafe { ReadFile(self.0.get(), Some(buf), Some(&mut read), None) } {
+            Ok(()) => Ok(read as usize),
+            // Write ends all closed: normal end-of-stream, report EOF.
+            Err(e) if e.code() == ERROR_BROKEN_PIPE.to_hresult() => Ok(0),
+            Err(e) => Err(std::io::Error::other(e)),
+        }
+    }
+}
+
+/// Cancellation state shared between an [`InterruptiblePipeReader`] and its
+/// [`PipeReadCanceller`]s. Owns the pipe handle — closed only when the **last**
+/// reference drops, so a canceller's `CancelIoEx` can never race a closed (and
+/// possibly reused) handle — plus the [`ReadGate`] the reader and cancellers
+/// hand off through.
+struct CancelablePipe {
+    handle: SendOwnedHandle,
+    gate: Mutex<ReadGate>,
+}
+
+/// Reader/canceller handshake, guarded by [`CancelablePipe::gate`].
+///
+/// `CancelIoEx` is *edge-triggered*: it aborts only I/O already pending when it
+/// is called. A bare `cancelled` flag + a single `CancelIoEx` therefore has a
+/// lost-wakeup race — a `close` landing between a read's flag check and its
+/// `ReadFile` entering the kernel cancels nothing and never retries, parking the
+/// read until real EOF. The mutex closes that race by ordering "a read is
+/// starting" against "cancel requested": a racing `close` either sees the read
+/// has not started (and the read then observes `cancelled`) or sees `reading`
+/// and keeps issuing `CancelIoEx` until the read is aborted.
+#[derive(Default)]
+struct ReadGate {
+    /// Set once `close` has been called; a read observing it returns EOF instead
+    /// of issuing (or while abandoning) a `ReadFile`.
+    cancelled: bool,
+    /// True while a read is in — or about to enter — its blocking `ReadFile`, so
+    /// `close` knows to keep issuing `CancelIoEx` until that read is aborted.
+    reading: bool,
+}
+
+impl CancelablePipe {
+    /// Lock the gate, tolerating a poisoned mutex (the guarded data is two
+    /// bools with no broken invariant on panic).
+    fn lock(&self) -> std::sync::MutexGuard<'_, ReadGate> {
+        self.gate
+            .lock()
+            .unwrap_or_else(|poisoned| poisoned.into_inner())
+    }
+}
+
+// SAFETY: the only non-`Sync` field is a process-global Windows HANDLE whose
+// value is copied for `ReadFile` / `CancelIoEx`; issuing `CancelIoEx` from one
+// thread to abort a `ReadFile` blocked on another is the documented, supported
+// way to interrupt synchronous pipe I/O, and the reader/canceller handshake is
+// serialised by `gate`. So sharing `&CancelablePipe` across threads is sound.
+unsafe impl Sync for CancelablePipe {}
+
+/// A readable pipe end (e.g. the child's stdout/stderr) whose blocking
+/// `ReadFile` can be cancelled out-of-band via a [`PipeReadCanceller`] —
+/// reporting EOF — without closing the child or its other streams. A broken
+/// pipe (all write ends closed) still reads as EOF as usual. `Send` so it can
+/// be handed to a reader thread. Single-reader: at most one thread may `read` it
+/// at a time (any number of cancellers may fire concurrently).
+pub struct InterruptiblePipeReader(Arc<CancelablePipe>);
+
+impl InterruptiblePipeReader {
+    /// Take ownership of `handle` (invalidating the source `OwnedHandle`).
+    pub fn new(mut handle: OwnedHandle) -> Self {
+        Self(Arc::new(CancelablePipe {
+            handle: SendOwnedHandle::take(&mut handle),
+            gate: Mutex::new(ReadGate::default()),
+        }))
+    }
+
+    /// Mint a closer that EOFs this reader's `read` on demand. Several closers
+    /// may be minted; they share one cancellation state. The closer holds only a
+    /// [`Weak`] reference, so it never keeps the read handle open past this
+    /// reader's lifetime.
+    pub fn canceller(&self) -> PipeReadCanceller {
+        PipeReadCanceller(Arc::downgrade(&self.0))
+    }
+}
+
+impl std::io::Read for InterruptiblePipeReader {
+    fn read(&mut self, buf: &mut [u8]) -> std::io::Result<usize> {
+        use windows::Win32::Foundation::{ERROR_BROKEN_PIPE, ERROR_OPERATION_ABORTED};
+        // Announce the read under the gate. A `close` that already fired, or an
+        // empty `buf` (a zero-byte `ReadFile` would still park until data), yields
+        // `Ok(0)` at once; else mark `reading` so a racing `close` keeps cancelling.
+        {
+            let mut gate = self.0.lock();
+            if gate.cancelled || buf.is_empty() {
+                return Ok(0);
+            }
+            gate.reading = true;
+        }
+        let mut read: u32 = 0;
+        // SAFETY: the `Arc` keeps the pipe handle valid for this call;
+        // `buf`/`read` are valid local out-params.
+        let result = unsafe { ReadFile(self.0.handle.get(), Some(buf), Some(&mut read), None) };
+        let cancelled = {
+            let mut gate = self.0.lock();
+            gate.reading = false;
+            gate.cancelled
+        };
+        // If `close` fired while this read was in flight, drop any
+        // completed-but-undelivered chunk and report EOF — matching the Unix
+        // reader, which never delivers data once cancelled.
+        if cancelled {
+            return Ok(0);
+        }
+        match result {
+            Ok(()) => Ok(read as usize),
+            // Write ends all closed: normal end-of-stream, report EOF.
+            Err(e) if e.code() == ERROR_BROKEN_PIPE.to_hresult() => Ok(0),
+            // A canceller's `CancelIoEx` aborted this read: report EOF.
+            Err(e) if e.code() == ERROR_OPERATION_ABORTED.to_hresult() => Ok(0),
+            Err(e) => Err(std::io::Error::other(e)),
+        }
+    }
+}
+
+/// A [`StreamCloser`] for an [`InterruptiblePipeReader`]. Cloneable and
+/// `Send + Sync` so a watchdog thread can hold and fire it; all clones share
+/// one cancellation state and [`close`](StreamCloser::close) is idempotent.
+/// Holds a [`Weak`] reference so a stored canceller never keeps the reader's
+/// data-pipe handle open after the reader is dropped.
+#[derive(Clone)]
+pub struct PipeReadCanceller(Weak<CancelablePipe>);
+
+impl StreamCloser for PipeReadCanceller {
+    fn close(&self) {
+        // Upgrade to a temporary strong ref for the duration of the cancel. If
+        // the reader has already been dropped there is nothing to cancel (and
+        // its handle is already closed), so this is a no-op.
+        let Some(pipe) = self.0.upgrade() else {
+            return;
+        };
+        // Mark cancelled once (so reads short-circuit to EOF), then abort an
+        // in-flight read. Because `CancelIoEx` is edge-triggered, retry while a
+        // read is in its announce→`ReadFile` window (`reading == true`): the next
+        // iteration catches the `ReadFile` once it enters the kernel. The reader
+        // clears `reading` when its `ReadFile` returns (aborted or with data),
+        // which bounds the loop; if no read is in progress it exits at once.
+        {
+            let mut gate = pipe.lock();
+            if gate.cancelled {
+                return;
+            }
+            gate.cancelled = true;
+        }
+        loop {
+            // SAFETY: the upgraded `Arc` keeps the handle valid; `CancelIoEx`
+            // with a null overlapped aborts all outstanding synchronous I/O on
+            // it. Ignore the result — a benign no-op (ERROR_NOT_FOUND) when none
+            // is pending.
+            unsafe {
+                let _ = CancelIoEx(pipe.handle.get(), None);
+            }
+            if !pipe.lock().reading {
+                return;
+            }
+            std::thread::sleep(Duration::from_millis(1));
+        }
+    }
+}
+
+/// A writable end of an anonymous pipe (e.g. the child's stdin), owning the
+/// handle and closing it on drop (which sends EOF to the child). Implements
+/// [`std::io::Write`] via `WriteFile`. `Send`.
+pub struct PipeWriter(SendOwnedHandle);
+
+impl PipeWriter {
+    /// Take ownership of `handle` (invalidating the source `OwnedHandle`).
+    pub fn new(mut handle: OwnedHandle) -> Self {
+        Self(SendOwnedHandle::take(&mut handle))
+    }
+}
+
+impl std::io::Write for PipeWriter {
+    fn write(&mut self, buf: &[u8]) -> std::io::Result<usize> {
+        use windows::Win32::Foundation::ERROR_BROKEN_PIPE;
+        let mut written: u32 = 0;
+        // SAFETY: `self.0` owns a valid pipe handle for the lifetime of this
+        // `PipeWriter`; `buf`/`written` are valid local params for the call.
+        match unsafe { WriteFile(self.0.get(), Some(buf), Some(&mut written), None) } {
+            Ok(()) => Ok(written as usize),
+            // The read end is gone (child exited / closed its stdin): surface the
+            // standard `BrokenPipe` kind so callers' graceful handling fires
+            // instead of an opaque OS error.
+            Err(e) if e.code() == ERROR_BROKEN_PIPE.to_hresult() => {
+                Err(std::io::Error::from(std::io::ErrorKind::BrokenPipe))
+            }
+            Err(e) => Err(std::io::Error::other(e)),
+        }
+    }
+
+    fn flush(&mut self) -> std::io::Result<()> {
+        // Anonymous pipes are not buffered on the writer side.
+        Ok(())
+    }
+}
+
 const BUFFER_SIZE: u32 = 4096;
 const MAX_OUTPUT_CHARS: usize = 1024 * 1024;
 
diff --git a/src/core/wxc_common/src/sandbox_process.rs b/src/core/wxc_common/src/sandbox_process.rs
new file mode 100644
index 000000000..957507456
--- /dev/null
+++ b/src/core/wxc_common/src/sandbox_process.rs
@@ -0,0 +1,475 @@
+// Copyright (c) Microsoft Corporation.
+// Licensed under the MIT License.
+
+//! Handle-based ("streaming") sandbox execution.
+//!
+//! [`ScriptRunner`](crate::script_runner::ScriptRunner) owns the whole
+//! lifecycle (spawn → wait → drain → return), which is fine for fire-and-
+//! forget runs but cannot expose the running child. This module adds the
+//! interface for the other model: spawn the sandboxed process and hand the
+//! caller a [`SandboxProcess`] handle they can write to, read from, wait on,
+//! and kill while it runs.
+//!
+//! As with [`ScriptRunner`](crate::script_runner::ScriptRunner), the traits
+//! live in `wxc_common` (the cross-platform foundation) while the
+//! implementations live in the per-backend crates — `wxc_common` must not
+//! depend on any `backends/*` crate.
+
+use std::io::{Read, Write};
+
+use crate::logger::Logger;
+use crate::models::{ExecutionRequest, FailurePhase, ScriptResponse};
+use crate::script_runner::ScriptRunner;
+
+/// A handle to a running sandboxed process.
+///
+/// Modelled on [`std::process::Child`]: the caller may `take_*` the std
+/// streams to drive them directly (and is then responsible for draining any
+/// stream they take, to avoid the child blocking on a full pipe), then
+/// [`wait`](SandboxProcess::wait) for exit or [`kill`](SandboxProcess::kill)
+/// it.
+///
+/// Any stdout/stderr stream the caller does **not** take is drained and
+/// discarded internally by [`wait`](SandboxProcess::wait) so the child can
+/// never block on a full pipe.
+///
+/// No pty is ever allocated; the streams are ordinary pipes.
+///
+/// # Abandoning a held-open stream (stdout/stderr closers)
+///
+/// A read on a taken stdout/stderr only ends at EOF — when **every** write end
+/// closes. A backgrounded descendant that inherited the pipe can hold its write
+/// end open long after the foreground command exits, so a caller blocked on
+/// such a read would hang until that descendant finally exits. A plain
+/// [`kill`](SandboxProcess::kill) would unblock it but also tear the descendant
+/// down, defeating any grace window for backgrounded work.
+///
+/// [`stdout_closer`](SandboxProcess::stdout_closer) /
+/// [`stderr_closer`](SandboxProcess::stderr_closer) hand back a
+/// [`StreamCloser`] for exactly this case: calling
+/// [`close`](StreamCloser::close) makes an in-flight or subsequent read on that
+/// stream return EOF (`Ok(0)`) promptly **without** terminating the child.
+///
+/// # Pipe-deadlock contract (read both ends concurrently)
+///
+/// stdout and stderr are independent OS pipes with bounded kernel buffers. If
+/// one is left undrained while the child keeps writing to it, the child blocks
+/// on the full pipe — and if the reader is meanwhile blocked waiting on the
+/// *other* stream (or on the child to exit), the two deadlock. So both ends
+/// must be consumed **concurrently**, never one fully then the other:
+///
+/// - **Implementors** of [`wait`](SandboxProcess::wait) must drain the
+///   not-taken stdout and stderr on separate threads (or non-blocking I/O)
+///   before/while waiting on the child — not sequentially. The in-tree
+///   backends spawn one reader thread per stream.
+/// - **Callers** that `take_stdout()` *and* `take_stderr()` and read them to
+///   EOF must likewise read them on separate threads; reading one to EOF
+///   before touching the other can hang on output-heavy children. Taking only
+///   one stream (leaving the other for `wait()` to drain) is always safe.
+pub trait SandboxProcess: Send {
+    /// Take ownership of the child's stdin so the caller can write to it.
+    /// Returns `None` if already taken. Drop the writer to send EOF.
+    fn take_stdin(&mut self) -> Option<Box<dyn Write + Send>>;
+
+    /// Take ownership of the child's stdout for live reading. Returns `None`
+    /// if already taken. A taken stream is **not** drained by
+    /// [`wait`](SandboxProcess::wait).
+    fn take_stdout(&mut self) -> Option<Box<dyn Read + Send>>;
+
+    /// Take ownership of the child's stderr for live reading. Returns `None`
+    /// if already taken. A taken stream is **not** drained by
+    /// [`wait`](SandboxProcess::wait).
+    fn take_stderr(&mut self) -> Option<Box<dyn Read + Send>>;
+
+    /// Non-blocking exit check. `Ok(Some(code))` if the child has exited,
+    /// `Ok(None)` if it is still running.
+    fn try_wait(&mut self) -> std::io::Result<Option<i32>>;
+
+    /// The OS process id of the sandboxed child (its PID on Unix, process id
+    /// on Windows). Useful for external monitoring or a caller-driven process
+    /// tree kill.
+    ///
+    /// Only meaningful while the child is alive. On Unix the PID may be reused
+    /// by an unrelated process once the child has been reaped (by
+    /// [`wait`](SandboxProcess::wait)), so do not act on it after waiting.
+    fn id(&self) -> u32;
+
+    /// Request termination of the sandboxed process **and its descendants**
+    /// (a process-tree kill). On Unix the child leads its own process group
+    /// and this signals the whole group (an immediate `SIGKILL`, no graceful
+    /// `SIGTERM` first); on Windows it terminates the job
+    /// object the child is assigned to. Reaping happens in
+    /// [`wait`](SandboxProcess::wait).
+    fn kill(&mut self) -> std::io::Result<()>;
+
+    /// Block until the child exits (honouring the request's `scriptTimeout`,
+    /// where `0` means wait forever) and return its exit code.
+    ///
+    /// Any stdout/stderr the caller did not `take_*` is drained and discarded
+    /// while waiting so the child can never block on a full pipe. If the
+    /// timeout elapses, the child and its tree are killed and
+    /// [`ErrorKind::TimedOut`](std::io::ErrorKind::TimedOut) is returned.
+    ///
+    /// Implementors must drain the not-taken stdout and stderr **concurrently**
+    /// (not one then the other) — see the type-level pipe-deadlock contract.
+    fn wait(&mut self) -> std::io::Result<i32>;
+
+    /// A closer that EOFs the stdout stream returned by
+    /// [`take_stdout`](SandboxProcess::take_stdout), on demand, **without**
+    /// killing the child — for abandoning a stream a backgrounded descendant is
+    /// holding open past the foreground command's exit (a plain
+    /// [`kill`](SandboxProcess::kill) would also take that descendant down).
+    ///
+    /// Intended for a stream the caller has **taken** and is reading:
+    /// [`close`](StreamCloser::close) abandons that read, and may be called
+    /// concurrently with it. [`wait`](SandboxProcess::wait) already cancels its
+    /// own internal safety-drain of any *not-taken* stream once the child exits,
+    /// so a closer is only useful on a taken stream — firing one on a not-taken
+    /// stream while the child is still producing output would stall the child on
+    /// a full pipe. Returns `None` when the stream is not interruptible — e.g.
+    /// inherited stdio ([`StdioMode::Inherit`]), where the caller never reads
+    /// from a handle stream. The default returns `None`.
+    fn stdout_closer(&self) -> Option<Box<dyn StreamCloser>> {
+        None
+    }
+
+    /// A closer for the stderr stream — see
+    /// [`stdout_closer`](SandboxProcess::stdout_closer). The default returns
+    /// `None`.
+    fn stderr_closer(&self) -> Option<Box<dyn StreamCloser>> {
+        None
+    }
+}
+
+/// Abandons reads on one of a [`SandboxProcess`]'s standard streams: a call to
+/// [`close`](StreamCloser::close) makes an in-flight or subsequent read on the
+/// corresponding [`take_stdout`](SandboxProcess::take_stdout) /
+/// [`take_stderr`](SandboxProcess::take_stderr) stream return EOF (`Ok(0)`)
+/// promptly, **without** terminating the child.
+///
+/// Obtained from [`stdout_closer`](SandboxProcess::stdout_closer) /
+/// [`stderr_closer`](SandboxProcess::stderr_closer). `Send + Sync` so a
+/// watchdog thread (separate from the one blocked on the read) can hold and
+/// fire it.
+pub trait StreamCloser: Send + Sync {
+    /// Promptly EOF the stream this closer was minted for. Idempotent and safe
+    /// to call after the reader has already reached EOF or been dropped.
+    fn close(&self);
+}
+
+/// Start a background drain for a stream the caller did not take: the thread
+/// copies `reader` into a sink until EOF (or a read error) so the child can't
+/// block on a full pipe. Yields `None` when there is no reader to drain.
+pub fn spawn_discard<R: Read + Send + 'static>(
+    reader: Option<R>,
+) -> Option<std::thread::JoinHandle<()>> {
+    let mut stream = reader?;
+    let drain = move || {
+        let _ = std::io::copy(&mut stream, &mut std::io::sink());
+    };
+    Some(std::thread::spawn(drain))
+}
+
+/// Wait for a [`spawn_discard`] drain thread to finish, ignoring its result.
+/// Does nothing when no thread was started (`None`).
+pub fn join_discard(handle: Option<std::thread::JoinHandle<()>>) {
+    // `map` runs the join only for `Some`; the join outcome is discarded.
+    let _ = handle.map(std::thread::JoinHandle::join);
+}
+
+/// Empty `slot` and box its stream for [`SandboxProcess::take_stdout`] /
+/// [`SandboxProcess::take_stderr`]; yields `None` if it was already taken.
+pub fn take_boxed_read<R: Read + Send + 'static>(
+    slot: &mut Option<R>,
+) -> Option<Box<dyn Read + Send>> {
+    let stream = slot.take()?;
+    Some(Box::new(stream))
+}
+
+/// Empty `slot` and box its writer for [`SandboxProcess::take_stdin`]; `None` once taken.
+pub fn take_boxed_write<W: Write + Send + 'static>(
+    slot: &mut Option<W>,
+) -> Option<Box<dyn Write + Send>> {
+    let sink = slot.take()?;
+    Some(Box::new(sink))
+}
+
+/// Produce a boxed [`StreamCloser`] from a clone of the stored canceller, for
+/// [`SandboxProcess::stdout_closer`] / [`SandboxProcess::stderr_closer`].
+/// Yields `None` when no canceller is stored (non-streamed stdio).
+pub fn boxed_closer<C: StreamCloser + Clone + 'static>(
+    canceller: &Option<C>,
+) -> Option<Box<dyn StreamCloser>> {
+    // The stored canceller stays in place; the caller gets its own clone.
+    let cloned = canceller.as_ref()?.clone();
+    Some(Box::new(cloned))
+}
+
+/// Finish [`wait`](SandboxProcess::wait)'s internal drain of a not-taken
+/// stdout/stderr: cancel the drain thread's read, then join it, so the join
+/// itself can never block.
+///
+/// Why cancel first: a backgrounded descendant can hold the pipe's write end
+/// open past the foreground child's exit, which would keep the discard
+/// [`io::copy`](std::io::copy) — and thus `wait()` — from ever returning under a
+/// wait-forever (`scriptTimeout == 0`) timeout. The drained output is thrown
+/// away anyway, so cutting it short loses nothing.
+///
+/// Call *after* the child has exited (so its own output has drained normally).
+/// When the caller took the stream (`drain` is `None`) nothing is joined and
+/// `canceller` is left alone: firing it could cut off a read the caller is
+/// still doing.
+pub fn cancel_and_join_discard<C: StreamCloser>(
+    drain: Option<std::thread::JoinHandle<()>>,
+    canceller: &Option<C>,
+) {
+    // Fire the canceller only when a drain thread actually exists.
+    if let (Some(_), Some(closer)) = (drain.as_ref(), canceller.as_ref()) {
+        closer.close();
+    }
+    join_discard(drain);
+}
+
+/// Kill a Unix child's whole process group with `SIGKILL`. The backends make
+/// the child a group leader (`setsid()` / `process_group(0)`), so `-pid`
+/// addresses that group — never the host's — i.e. the leader and every descendant.
+///
+/// There is no graceful `SIGTERM` step: it's unreliable (a `/bin/sh -c …` wrapper
+/// parked in a foreground `wait` defers it and finishes the script) and sandboxed
+/// code isn't owed a cleanup window. The **leader is signalled before the group**:
+/// a `-pid`-only sweep races — the kernel can kill a descendant first, waking the
+/// shell to run one more command (seen as post-timeout output on the Inherit
+/// path) before its own signal lands. Both `kill(2)` results are ignored and
+/// `Ok(())` is always returned; the caller reaps the direct child afterwards.
+#[cfg(unix)]
+pub fn group_kill(child: &mut std::process::Child) -> std::io::Result<()> {
+    // The child is unreaped, so its pid (== pgid) can't have been recycled.
+    let leader = child.id() as i32;
+    // Order matters: the leader's own pid first, then the negated pid (the group).
+    for target in [leader, -leader] {
+        // SAFETY: `kill(2)` takes only plain integers; no memory is shared.
+        let _ = unsafe { libc::kill(target, libc::SIGKILL) };
+    }
+    Ok(())
+}
+
+/// Failure outcome of [`wait_with_timeout`]: the deadline passed before the
+/// child exited (`Timeout`), or the wait itself failed (`Io`).
+#[cfg(unix)]
+pub enum WaitError {
+    Timeout,
+    Io(std::io::Error),
+}
+
+/// Wait for `child` to exit. `None` blocks until exit; with a timeout we poll
+/// (rather than add an async runtime), starting at `MIN_POLL` and doubling up to
+/// `MAX_POLL`, so a quick child is detected within ~a millisecond while a long
+/// run settles to an inexpensive cadence. Each sleep is clamped to the time left
+/// so sub-interval timeouts fire on time. A timeout too large to represent as a
+/// deadline is treated as "no timeout". Shared by the Unix backends.
+#[cfg(unix)]
+pub fn wait_with_timeout(
+    child: &mut std::process::Child,
+    timeout: Option<std::time::Duration>,
+) -> Result<std::process::ExitStatus, WaitError> {
+    use std::time::{Duration, Instant};
+    // Poll interval: starts at the floor and doubles per idle tick up to the cap,
+    // trading low exit-detection latency for short runs against cheap long runs.
+    const MIN_POLL: Duration = Duration::from_millis(1);
+    const MAX_POLL: Duration = Duration::from_millis(50);
+
+    // `checked_add`, not `+`: a deadline too far out to represent must not panic.
+    let Some(deadline) = timeout.and_then(|d| Instant::now().checked_add(d)) else {
+        return child.wait().map_err(WaitError::Io);
+    };
+    let mut interval = MIN_POLL;
+    loop {
+        match child.try_wait() {
+            Ok(Some(status)) => return Ok(status),
+            Ok(None) => {
+                let now = Instant::now();
+                if now >= deadline {
+                    return Err(WaitError::Timeout);
+                }
+                std::thread::sleep((deadline - now).min(interval));
+                interval = (interval * 2).min(MAX_POLL);
+            }
+            Err(error) => return Err(WaitError::Io(error)),
+        }
+    }
+}
+
+/// How a [`SandboxBackend`] wires the sandboxed child's standard streams.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum StdioMode {
+    /// stdin/stdout/stderr are fresh pipes the caller drives via the handle's
+    /// `take_*` accessors (the `mxc` library / streaming path). The child sees
+    /// no TTY and leads its own process group so it can be tree-terminated.
+    Pipes,
+    /// The child inherits the current process's stdin/stdout/stderr (the CLI
+    /// executor path): its output goes straight to the binary's own stdio, so
+    /// the child sees a TTY exactly when the binary does. The returned handle's
+    /// `take_*` all return `None`; [`wait`](SandboxProcess::wait) just waits.
+    Inherit,
+}
+
+/// A containment backend that spawns a sandboxed process and hands back a
+/// [`SandboxProcess`] handle — the single entry point for starting a sandbox.
+///
+/// The caller picks how the child's stdio is wired ([`StdioMode`]) and then
+/// drives the handle: stream it ([`StdioMode::Pipes`]) or just
+/// [`wait`](SandboxProcess::wait) ([`StdioMode::Inherit`]). The `mxc` library
+/// calls this directly with [`StdioMode::Pipes`]; the CLI executor binaries
+/// reach it through the [`Runner`] bridge.
+pub trait SandboxBackend {
+    /// Backend-specific validation, run before [`spawn`](SandboxBackend::spawn)
+    /// and on dry-run. Override to reject unsupported policies; default accepts.
+    fn validate(&self, _request: &ExecutionRequest) -> Result<(), ScriptResponse> {
+        Ok(())
+    }
+
+    /// Apply this backend's containment and spawn the sandboxed process with
+    /// stdio wired per `stdio`, returning a handle. On a validation or spawn
+    /// failure returns a [`ScriptResponse`] carrying the error.
+    fn spawn(
+        &mut self,
+        request: &ExecutionRequest,
+        logger: &mut Logger,
+        stdio: StdioMode,
+    ) -> Result<Box<dyn SandboxProcess>, ScriptResponse>;
+
+    /// Optional post-exit diagnostics for the run-to-completion (binary) path:
+    /// when the child exits non-zero, return a more actionable error message
+    /// (e.g. a known AppContainer filesystem-permission failure). Default: none.
+    /// The streaming/library path does not call this.
+    fn diagnose_exit(&self, _request: &ExecutionRequest, _exit_code: i32) -> Option<String> {
+        None
+    }
+}
+
+/// The single run-to-completion bridge: adapts any [`SandboxBackend`] to the
+/// [`ScriptRunner`] contract the executor binaries (`wxc-exec` / `lxc-exec` /
+/// `mxc-exec-mac`) dispatch over.
+///
+/// It spawns the child with [`StdioMode::Inherit`] — so the sandboxed process
+/// reads/writes the binary's own stdio directly (a TTY when the binary has
+/// one) — and [`wait`](SandboxProcess::wait)s for exit, mapping the outcome to
+/// a [`ScriptResponse`]. The child streams straight to the binary's stdio, so
+/// `standard_out`/`standard_err` stay empty (the binaries' printing of them is a
+/// no-op) unless [`SandboxBackend::diagnose_exit`] supplies a message.
+///
+/// This is the *only* run-to-completion logic for these backends; the backends
+/// themselves expose just [`SandboxBackend::spawn`].
+pub struct Runner<B>(B);
+
+impl<B> Runner<B> {
+    /// Wrap a [`SandboxBackend`] so it can be dispatched as a [`ScriptRunner`].
+    pub fn new(backend: B) -> Self {
+        Self(backend)
+    }
+}
+
+impl<B: SandboxBackend> ScriptRunner for Runner<B> {
+    fn validate_runner(&self, request: &ExecutionRequest) -> Result<(), ScriptResponse> {
+        self.0.validate(request)
+    }
+
+    fn execute(&mut self, request: &ExecutionRequest, logger: &mut Logger) -> ScriptResponse {
+        let mut process = match self.0.spawn(request, logger, StdioMode::Inherit) {
+            Err(spawn_failure) => return spawn_failure,
+            Ok(process) => process,
+        };
+        let exit_code = match process.wait() {
+            Ok(code) => code,
+            Err(e) if e.kind() == std::io::ErrorKind::TimedOut => {
+                return ScriptResponse {
+                    exit_code: -1,
+                    error_message: format!("script timed out after {}ms", request.script_timeout),
+                    failure_phase: FailurePhase::Timeout,
+                    ..Default::default()
+                };
+            }
+            Err(e) => return ScriptResponse::error(&format!("wait failed: {e}")),
+        };
+        if exit_code == 0 {
+            return ScriptResponse {
+                exit_code,
+                failure_phase: FailurePhase::None,
+                ..Default::default()
+            };
+        }
+        let mut response = ScriptResponse {
+            exit_code,
+            failure_phase: FailurePhase::ProcessExited,
+            ..Default::default()
+        };
+        // A non-zero exit may get a backend-supplied, more actionable message.
+        if let Some(msg) = self.0.diagnose_exit(request, exit_code) {
+            logger.log_line(&format!("Error: Launch diagnostic: {msg}"));
+            response.standard_err.push_str(&msg);
+            response.error_message = msg;
+        }
+        response
+    }
+}
+
+#[cfg(all(test, unix))]
+mod tests {
+    use super::{wait_with_timeout, WaitError};
+    use std::process::Command;
+    use std::time::{Duration, Instant};
+
+    #[test]
+    fn wait_with_timeout_detects_quick_exit_promptly() {
+        // A child that exits almost immediately is reaped well before a generous
+        // deadline -- the adaptive poll starts in the millisecond range, so the
+        // detection latency is small (the old fixed 50ms tick was the worst case).
+        let mut child = Command::new("true").spawn().expect("spawn true");
+        let start = Instant::now();
+        let status = match wait_with_timeout(&mut child, Some(Duration::from_secs(10))) {
+            Ok(status) => status,
+            Err(_) => panic!("a quick child must exit, not time out"),
+        };
+        assert!(status.success(), "`true` exits 0");
+        assert!(
+            start.elapsed() < Duration::from_secs(1),
+            "quick exit should be detected promptly, took {:?}",
+            start.elapsed()
+        );
+    }
+
+    #[test]
+    fn wait_with_timeout_fires_at_the_deadline() {
+        // A long-running child hits the timeout branch at (not before) the
+        // deadline, even though the deadline is shorter than the poll cap.
+        let mut child = Command::new("sleep")
+            .arg("30")
+            .spawn()
+            .expect("spawn sleep");
+        let start = Instant::now();
+        let result = wait_with_timeout(&mut child, Some(Duration::from_millis(200)));
+        let elapsed = start.elapsed();
+        let _ = child.kill();
+        let _ = child.wait();
+        assert!(matches!(result, Err(WaitError::Timeout)), "should time out");
+        assert!(
+            elapsed >= Duration::from_millis(200),
+            "must not fire before the deadline, fired at {elapsed:?}"
+        );
+        assert!(
+            elapsed < Duration::from_secs(2),
+            "should fire near the deadline, fired at {elapsed:?}"
+        );
+    }
+
+    #[test]
+    fn wait_with_timeout_without_deadline_waits_for_exit() {
+        // A `None` timeout blocks until the child exits.
+        let mut child = Command::new("true").spawn().expect("spawn true");
+        let status = match wait_with_timeout(&mut child, None) {
+            Ok(status) => status,
+            Err(_) => panic!("blocking wait must return the exit status"),
+        };
+        assert!(status.success());
+    }
+}

From 93eafce4faa4483487d4f2116372558071ba7d32 Mon Sep 17 00:00:00 2001
From: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
Date: Wed, 24 Jun 2026 09:52:19 -0300
Subject: [PATCH 2/9] refactor(backends): unify the library backends on
 SandboxBackend + route binaries via Runner
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Migrate the three in-process backends — Seatbelt (macOS), Bubblewrap (Linux),
and Windows ProcessContainer (AppContainer + BaseContainer) — onto the
SandboxBackend / SandboxProcess interfaces added in the previous PR, and route
the executor binaries (wxc-exec, lxc-exec, mxc-exec-mac) through the generic
Runner<B> adapter. The old per-backend run-to-completion logic is removed; each
backend now exposes only spawn(), and Runner provides the single ScriptRunner
the binaries dispatch on (spawn StdioMode::Inherit, then wait).

Each backend gains a streaming handle with whole-process-tree termination
(Unix process-group SIGKILL; Windows job-object terminate) and a uniform
io::ErrorKind::TimedOut on scriptTimeout.

Intentional behavior changes for existing binaries (call-outs for review):
- Seatbelt now always env_clear()s the child (previously only when process.env
  was non-empty), aligning the binary with the SDK's documented "host env is
  not inherited" contract.
- Seatbelt resolves an empty process.cwd to a policy read-write path (or "/")
  instead of the launcher's cwd.
- Seatbelt/Bubblewrap inherit the executor's own stdio (StdioMode::Inherit) —
  Seatbelt no longer allocates a private pty, and Bubblewrap no longer forces
  stdin to /dev/null or post-exit-captures stdout/stderr (it streams live).
- BaseContainer now places the child in a UiJobObject for tree-kill (it had
  none before); the child is created suspended, assigned to the job, then
  resumed so no descendant can escape the kill window.
- kill() is a no-op once the child has been reaped, so it never signals a
  recycled pid/process-group.

The macOS Seatbelt characterization suite is updated to assert the new env/cwd/
streaming/timeout behavior; the LXC and Seatbelt backend docs are updated to
match. The default LXC path keeps its native pty and is unaffected.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
Signed-off-by: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
---
 docs/lxc-support/lxc-backend.md               |   2 +-
 docs/macos-support/seatbelt-backend.md        |  15 +
 src/Cargo.lock                                |   1 -
 .../common/src/appcontainer_runner.rs         | 713 ++++++++++++-----
 .../common/src/base_container_runner.rs       | 695 +++++++++++++----
 .../appcontainer/common/src/dispatcher.rs     |  15 +-
 .../appcontainer/common/src/job_object.rs     |  20 +-
 .../common/src/network_manager.rs             | 198 ++---
 src/backends/appcontainer/common/src/probe.rs |   2 +-
 .../bubblewrap/common/src/bwrap_runner.rs     | 390 ++++++---
 src/backends/seatbelt/common/Cargo.toml       |   4 -
 .../seatbelt/common/src/profile_builder.rs    |  14 +-
 .../seatbelt/common/src/seatbelt_runner.rs    | 738 +++++++++++-------
 src/core/lxc/src/main.rs                      |   4 +-
 src/core/mxc_darwin/src/main.rs               |   3 +-
 src/core/wxc/src/main.rs                      |   3 +-
 .../tests/e2e_seatbelt_characterization.rs    |  83 +-
 17 files changed, 1961 insertions(+), 939 deletions(-)

diff --git a/docs/lxc-support/lxc-backend.md b/docs/lxc-support/lxc-backend.md
index 32c20d3b5..b94cd2861 100644
--- a/docs/lxc-support/lxc-backend.md
+++ b/docs/lxc-support/lxc-backend.md
@@ -91,7 +91,7 @@ The `process.cwd` and `process.env` fields from the standard schema are honored
 | `process.cwd` | `cd -- "$1" && exec /bin/sh -c "$2"` wrapper prelude, with the cwd passed as a positional argument | Empty string preserves the container default cwd. A nonexistent or non-permitted path surfaces as a generic non-zero exit (typically `1`, from `cd`'s own status); callers needing strong cwd validation should pre-check the path. The positional-arg trick means cwd values with spaces, quotes, `$vars`, or backticks pass through verbatim with no shell escaping. |
 | `process.env` | Each `KEY=VAL` entry becomes a repeated `--set-var=KEY=VAL` flag to `lxc-attach` | Malformed entries — those without `=` (e.g. `"BADENTRY"`) or with an empty key (e.g. `"=foo"`) — are silently skipped. Embedded `=` in the value (e.g. `"X=a=b=c"`) is preserved. |
 
-**Replace semantics.** When `process.env` is non-empty, `lxc-exec` also passes `--clear-env` to `lxc-attach` so the host environment does **not** leak into the sandbox, regardless of how many entries survive the malformed-skip. This matches the Seatbelt backend's `env_clear()`-on-non-empty contract and is the posture `lxc-attach(1)` recommends for sandbox-spawn callers. If a variable is set in both the host and `process.env`, the `process.env` value wins.
+**Replace semantics.** When `process.env` is non-empty, `lxc-exec` also passes `--clear-env` to `lxc-attach` so the host environment does **not** leak into the sandbox, regardless of how many entries survive the malformed-skip. This is the posture `lxc-attach(1)` recommends for sandbox-spawn callers. If a variable is set in both the host and `process.env`, the `process.env` value wins.
 
 When `process.env` is empty (or absent), the legacy keep-env behavior is preserved and the host environment is inherited.
 
diff --git a/docs/macos-support/seatbelt-backend.md b/docs/macos-support/seatbelt-backend.md
index dd2ad0b69..039dd0761 100644
--- a/docs/macos-support/seatbelt-backend.md
+++ b/docs/macos-support/seatbelt-backend.md
@@ -207,6 +207,21 @@ SDK rejects it with a clear error, mirroring the Linux behavior.
 | `ui.clipboard: "none"` (default) | `(deny mach-lookup (global-name "com.apple.pasteboard.1"))` |
 | `ui.injection: false` (default) | `(deny iokit-open (iokit-user-client-class "IOHIDLibUserClient"))` |
 
+### Process environment
+
+The host environment is **never** inherited — the sandboxed child always starts
+from a cleared environment, so host secrets (cloud credentials, API tokens) can
+never leak into untrusted code. `PATH` defaults to `/usr/bin:/bin:/usr/sbin:/sbin`,
+and each `process.env` entry adds to / overrides that baseline. (This is
+unconditional; it applies whether or not `process.env` is provided.)
+
+### Working directory
+
+If `process.cwd` is omitted it resolves to `readwritePaths[0]`, else
+`readonlyPaths[0]`, else `/`; a `~`/`~/…` default is tilde-expanded the same way
+the sandbox profile expands policy paths. `PWD` is exported to the resolved
+directory so the child's `getcwd()` takes its fast `$PWD` path.
+
 ## Usage
 
 ### Command line
diff --git a/src/Cargo.lock b/src/Cargo.lock
index a4397660b..cead9eaad 100644
--- a/src/Cargo.lock
+++ b/src/Cargo.lock
@@ -1906,7 +1906,6 @@ name = "seatbelt_common"
 version = "0.7.0"
 dependencies = [
  "libc",
- "mxc_pty",
  "wxc_common",
 ]
 
diff --git a/src/backends/appcontainer/common/src/appcontainer_runner.rs b/src/backends/appcontainer/common/src/appcontainer_runner.rs
index cf7aba8ad..cd2edd00b 100644
--- a/src/backends/appcontainer/common/src/appcontainer_runner.rs
+++ b/src/backends/appcontainer/common/src/appcontainer_runner.rs
@@ -6,7 +6,7 @@ use std::ptr;
 
 use windows::Win32::Foundation::{
     CloseHandle, GetLastError, LocalFree, SetHandleInformation, ERROR_ALREADY_EXISTS, HANDLE,
-    HANDLE_FLAG_INHERIT, HLOCAL, WAIT_FAILED, WAIT_OBJECT_0, WAIT_TIMEOUT,
+    HANDLE_FLAG_INHERIT, HLOCAL, WAIT_OBJECT_0, WAIT_TIMEOUT,
 };
 use windows::Win32::Security::Authorization::ConvertSidToStringSidW;
 use windows::Win32::Security::Isolation::{
@@ -35,8 +35,15 @@ use crate::process_mitigation;
 use wxc_common::error::WxcError;
 use wxc_common::logger::Logger;
 use wxc_common::models::{ExecutionRequest, NetworkEnforcementMode, NetworkPolicy, ScriptResponse};
-use wxc_common::process_util::{get_capability_sid_from_name, OwnedHandle, SidAndAttributes};
-use wxc_common::script_runner::{get_timeout_milliseconds, ScriptRunner};
+use wxc_common::process_util::{
+    create_std_pipes, get_capability_sid_from_name, InterruptiblePipeReader, OwnedHandle,
+    PipeReadCanceller, PipeWriter, SendOwnedHandle, SidAndAttributes,
+};
+use wxc_common::sandbox_process::{
+    boxed_closer, cancel_and_join_discard, spawn_discard, take_boxed_read, take_boxed_write,
+    SandboxBackend, SandboxProcess, StdioMode, StreamCloser,
+};
+use wxc_common::script_runner::get_timeout_milliseconds;
 use wxc_common::{string_util, ui_policy};
 
 /// `UpdateProcThreadAttribute` value for
@@ -147,20 +154,25 @@ fn build_explicit_entries(
         .collect();
 
     if let Some(addr) = proxy_address {
-        // Strip existing proxy vars before injecting ours.
-        entries.retain(|(key, _)| {
-            !PROXY_VAR_NAMES
-                .iter()
-                .any(|name| key.eq_ignore_ascii_case(name))
-        });
-        let proxy_url = addr.to_url();
-        entries.push(("HTTP_PROXY".to_string(), proxy_url.clone()));
-        entries.push(("HTTPS_PROXY".to_string(), proxy_url));
+        inject_proxy_vars(&mut entries, addr);
     }
 
     entries
 }
 
+/// Make `addr` the only proxy configuration in `entries`: existing proxy
+/// variables (matched ASCII case-insensitively) are dropped, then `HTTP_PROXY`
+/// and `HTTPS_PROXY` are appended with the proxy URL.
+fn inject_proxy_vars(entries: &mut Vec<(String, String)>, addr: &wxc_common::models::ProxyAddress) {
+    let is_proxy_var =
+        |key: &str| PROXY_VAR_NAMES.iter().any(|name| key.eq_ignore_ascii_case(name));
+    entries.retain(|(key, _)| !is_proxy_var(key));
+    let url = addr.to_url();
+    let http = ("HTTP_PROXY".to_string(), url.clone());
+    let https = ("HTTPS_PROXY".to_string(), url);
+    entries.extend([http, https]);
+}
+
 /// RAII guard that frees capability SID pointers via `LocalFree` on drop.
 /// Ensures SIDs are freed regardless of the error return path.
 struct CapabilitySidGuard(Vec<*mut core::ffi::c_void>);
@@ -415,12 +427,18 @@ impl AppContainerScriptRunner {
         }
     }
 
-    /// Core implementation of `run_internal`, returning `Result` for ergonomic error handling.
-    fn run_internal_impl(
+    /// Set up the AppContainer and create the sandboxed child **suspended**,
+    /// returning a [`SpawnedChild`] the caller resumes and then either waits on
+    /// (run-to-completion) or wraps in a streaming handle. When `capture` is set
+    /// the child's stdio is wired to pipes the caller drives (the streaming
+    /// path); otherwise the child inherits the parent's std handles / console
+    /// (the run-to-completion path).
+    fn spawn_suspended(
         &self,
         request: &ExecutionRequest,
         logger: &mut Logger,
-    ) -> Result<ScriptResponse, WxcError> {
+        capture: bool,
+    ) -> Result<SpawnedChild, WxcError> {
         // --- Validate permissiveLearningMode ---
         for cap in &request.policy.capabilities {
             if cap == "permissiveLearningMode" {
@@ -434,8 +452,9 @@ impl AppContainerScriptRunner {
                 }
                 #[cfg(not(debug_assertions))]
                 {
-                    return Ok(ScriptResponse::error(
-                        "SECURITY: permissiveLearningMode not allowed in release builds",
+                    return Err(WxcError::Validation(
+                        "SECURITY: permissiveLearningMode not allowed in release builds"
+                            .to_string(),
                     ));
                 }
             }
@@ -495,10 +514,20 @@ impl AppContainerScriptRunner {
         // we forward our own std handles to the child via STARTF_USESTDHANDLES so the
         // child's output streams directly to the SDK in real time. Otherwise we use
         // console sharing (the ConPTY path).
-        let pipe_mode = !std::io::stdout().is_terminal() || !std::io::stderr().is_terminal();
+        //
+        // In capture mode (`StdioMode::Pipes`) we always take the pipe
+        // path — but instead of forwarding our own std handles we wire the
+        // child to capture pipes that the streaming handle reads from.
+        let pipe_mode =
+            capture || !std::io::stdout().is_terminal() || !std::io::stderr().is_terminal();
 
         if pipe_mode {
-            logger.log_line("STDIO mode: passthrough (forwarding parent handles to child)");
+            if capture {
+                logger
+                    .log_line("STDIO mode: capture (piping child output to the streaming handle)");
+            } else {
+                logger.log_line("STDIO mode: passthrough (forwarding parent handles to child)");
+            }
         }
 
         // --- Allocate and initialize attribute list ---
@@ -609,48 +638,86 @@ impl AppContainerScriptRunner {
             logger.log_line("Win32k mitigation applied to child process");
         }
 
-        // --- Setup handle passthrough (pipe mode only) ---
-        // Forward wxc-exec's own stdin/stdout/stderr handles to the child so the
-        // child's output streams directly to the SDK caller in real time.
-        // Handle list for PROC_THREAD_ATTRIBUTE_HANDLE_LIST. Must outlive CreateProcessW.
+        // --- Setup handle passthrough / capture (pipe mode only) ---
+        // In passthrough mode we forward wxc-exec's own std handles to the
+        // child so its output streams to the caller. In capture mode we wire
+        // the child to fresh capture pipes that the streaming handle reads from
+        // (the `mxc` library path). Handle list for
+        // PROC_THREAD_ATTRIBUTE_HANDLE_LIST. Must outlive CreateProcessW.
         let mut handle_list: Vec<HANDLE> = Vec::new();
 
         let h_stdin;
         let h_stdout;
         let h_stderr;
 
+        // Capture pipe read-ends (parent side): handed back to the caller in
+        // `SpawnedChild` to be read or drained. Child-side ends (stdin read,
+        // stdout/stderr write): kept alive until after CreateProcessW, then
+        // dropped so the read-ends observe EOF when the child exits.
+        let mut capture_reads: Option<(OwnedHandle, OwnedHandle)> = None;
+        let mut capture_child_ends: Vec<OwnedHandle> = Vec::new();
+        // Parent's stdin write-end; in capture mode it is handed to the caller
+        // so they can write to the child.
+        let mut captured_stdin_write: Option<OwnedHandle> = None;
+
         if pipe_mode {
-            h_stdin = unsafe { GetStdHandle(STD_INPUT_HANDLE) }
-                .map_err(|e| WxcError::Process(format!("GetStdHandle(STDIN): {e}")))?;
-            h_stdout = unsafe { GetStdHandle(STD_OUTPUT_HANDLE) }
-                .map_err(|e| WxcError::Process(format!("GetStdHandle(STDOUT): {e}")))?;
-            h_stderr = unsafe { GetStdHandle(STD_ERROR_HANDLE) }
-                .map_err(|e| WxcError::Process(format!("GetStdHandle(STDERR): {e}")))?;
-
-            if h_stdin.is_invalid() || h_stdin == HANDLE::default() {
-                return Err(WxcError::Process(
-                    "GetStdHandle(STDIN) returned null/invalid handle".to_string(),
-                ));
-            }
-            if h_stdout.is_invalid() || h_stdout == HANDLE::default() {
-                return Err(WxcError::Process(
-                    "GetStdHandle(STDOUT) returned null/invalid handle".to_string(),
-                ));
-            }
-            if h_stderr.is_invalid() || h_stderr == HANDLE::default() {
-                return Err(WxcError::Process(
-                    "GetStdHandle(STDERR) returned null/invalid handle".to_string(),
-                ));
-            }
+            if capture {
+                // create_std_pipes(false): read-end inheritable (child stdin),
+                // write-end non-inheritable (returned to the caller for writing).
+                let (stdin_read, stdin_write) = create_std_pipes(false)?;
+                // create_std_pipes(true): read-end non-inheritable (parent
+                // reads it), write-end inheritable (child writes to it).
+                let (stdout_read, stdout_write) = create_std_pipes(true)?;
+                let (stderr_read, stderr_write) = create_std_pipes(true)?;
+
+                h_stdin = stdin_read.get();
+                h_stdout = stdout_write.get();
+                h_stderr = stderr_write.get();
+
+                capture_child_ends.push(stdin_read);
+                capture_child_ends.push(stdout_write);
+                capture_child_ends.push(stderr_write);
+                captured_stdin_write = Some(stdin_write);
+                capture_reads = Some((stdout_read, stderr_read));
+            } else {
+                h_stdin = unsafe { GetStdHandle(STD_INPUT_HANDLE) }
+                    .map_err(|e| WxcError::Process(format!("GetStdHandle(STDIN): {e}")))?;
+                h_stdout = unsafe { GetStdHandle(STD_OUTPUT_HANDLE) }
+                    .map_err(|e| WxcError::Process(format!("GetStdHandle(STDOUT): {e}")))?;
+                h_stderr = unsafe { GetStdHandle(STD_ERROR_HANDLE) }
+                    .map_err(|e| WxcError::Process(format!("GetStdHandle(STDERR): {e}")))?;
+
+                if h_stdin.is_invalid() || h_stdin == HANDLE::default() {
+                    return Err(WxcError::Process(
+                        "GetStdHandle(STDIN) returned null/invalid handle".to_string(),
+                    ));
+                }
+                if h_stdout.is_invalid() || h_stdout == HANDLE::default() {
+                    return Err(WxcError::Process(
+                        "GetStdHandle(STDOUT) returned null/invalid handle".to_string(),
+                    ));
+                }
+                if h_stderr.is_invalid() || h_stderr == HANDLE::default() {
+                    return Err(WxcError::Process(
+                        "GetStdHandle(STDERR) returned null/invalid handle".to_string(),
+                    ));
+                }
 
-            // Ensure the handles are inheritable.
-            unsafe {
-                SetHandleInformation(h_stdin, HANDLE_FLAG_INHERIT.0, HANDLE_FLAG_INHERIT)
-                    .map_err(|e| WxcError::Process(format!("SetHandleInformation(STDIN): {e}")))?;
-                SetHandleInformation(h_stdout, HANDLE_FLAG_INHERIT.0, HANDLE_FLAG_INHERIT)
-                    .map_err(|e| WxcError::Process(format!("SetHandleInformation(STDOUT): {e}")))?;
-                SetHandleInformation(h_stderr, HANDLE_FLAG_INHERIT.0, HANDLE_FLAG_INHERIT)
-                    .map_err(|e| WxcError::Process(format!("SetHandleInformation(STDERR): {e}")))?;
+                // Ensure the handles are inheritable.
+                unsafe {
+                    SetHandleInformation(h_stdin, HANDLE_FLAG_INHERIT.0, HANDLE_FLAG_INHERIT)
+                        .map_err(|e| {
+                            WxcError::Process(format!("SetHandleInformation(STDIN): {e}"))
+                        })?;
+                    SetHandleInformation(h_stdout, HANDLE_FLAG_INHERIT.0, HANDLE_FLAG_INHERIT)
+                        .map_err(|e| {
+                            WxcError::Process(format!("SetHandleInformation(STDOUT): {e}"))
+                        })?;
+                    SetHandleInformation(h_stderr, HANDLE_FLAG_INHERIT.0, HANDLE_FLAG_INHERIT)
+                        .map_err(|e| {
+                            WxcError::Process(format!("SetHandleInformation(STDERR): {e}"))
+                        })?;
+                }
             }
 
             handle_list.push(h_stdin);
@@ -721,16 +788,7 @@ impl AppContainerScriptRunner {
             // Get clean default user env without inheriting process env vars.
             let mut entries = create_default_env_entries()?;
             if let Some(addr) = self.proxy_address.as_ref() {
-                // Strip any pre-existing proxy vars from the default block
-                // and inject our configured proxy.
-                entries.retain(|(key, _)| {
-                    !PROXY_VAR_NAMES
-                        .iter()
-                        .any(|name| key.eq_ignore_ascii_case(name))
-                });
-                let proxy_url = addr.to_url();
-                entries.push(("HTTP_PROXY".to_string(), proxy_url.clone()));
-                entries.push(("HTTPS_PROXY".to_string(), proxy_url));
+                inject_proxy_vars(&mut entries, addr);
             }
             encode_env_block(&entries)
         };
@@ -789,13 +847,17 @@ impl AppContainerScriptRunner {
             pi.dwProcessId
         ));
 
+        // The child has inherited the pipe handles, so close the parent's
+        // child-side ends now (otherwise the read-ends would never see EOF).
+        capture_child_ends.clear();
+
         let process_handle = OwnedHandle::new(pi.hProcess);
         let thread_handle = OwnedHandle::new(pi.hThread);
 
         // CRITICAL: child was created with CREATE_SUSPENDED. We must either
-        // successfully attach the Job Object and ResumeThread, OR TerminateProcess.
-        // Anything that returns an error in this block must terminate first.
-        let _job = match (|| -> Result<UiJobObject, WxcError> {
+        // successfully attach the Job Object, OR TerminateProcess. Anything
+        // that returns an error in this block must terminate first.
+        let job = match (|| -> Result<UiJobObject, WxcError> {
             let job = UiJobObject::new()?;
             let restrictions = ui_policy::resolve_ui_restrictions(
                 &request.policy.ui,
@@ -817,56 +879,22 @@ impl AppContainerScriptRunner {
             }
         };
 
-        // Resume the child now that UI restrictions are in place.
-        // ResumeThread returns the previous suspend count (or u32::MAX on failure).
-        let resume_result = unsafe { ResumeThread(thread_handle.get()) };
-        if resume_result == u32::MAX {
-            let err = unsafe { GetLastError() };
-            unsafe {
-                let _ = TerminateProcess(process_handle.get(), u32::MAX);
-            }
-            return Err(WxcError::Process(format!("ResumeThread failed: {:?}", err)));
-        }
-
-        // --- Wait for child process to exit ---
-        let timeout_ms = get_timeout_milliseconds(request.script_timeout);
-
-        let wait_result = unsafe { WaitForSingleObject(process_handle.get(), timeout_ms) };
-
-        match wait_result {
-            WAIT_OBJECT_0 => {}
-            WAIT_TIMEOUT => unsafe {
-                let _ = TerminateProcess(process_handle.get(), u32::MAX);
-                let _ = WaitForSingleObject(process_handle.get(), u32::MAX);
-            },
-            WAIT_FAILED => {
-                let err = unsafe { GetLastError() };
-                return Err(WxcError::Process(format!(
-                    "WaitForSingleObject failed: {:?}",
-                    err
-                )));
-            }
-            other => {
-                return Err(WxcError::Process(format!(
-                    "WaitForSingleObject returned unexpected value: {}",
-                    other.0
-                )));
-            }
-        }
-
-        // --- Get exit code ---
-        let mut exit_code: u32 = 0;
-        unsafe {
-            GetExitCodeProcess(process_handle.get(), &mut exit_code)
-                .map_err(|_| WxcError::Process("GetExitCodeProcess failed".into()))?;
-        }
+        let (stdout_read, stderr_read) = match capture_reads {
+            Some((out, err)) => (Some(out), Some(err)),
+            None => (None, None),
+        };
 
-        Ok(ScriptResponse {
-            exit_code: exit_code as i32,
-            standard_out: String::new(),
-            standard_err: String::new(),
-            error_message: String::new(),
-            ..Default::default()
+        // The child is still suspended; the caller must resume it via
+        // `SpawnedChild::resume` (which terminates the child if resuming fails).
+        Ok(SpawnedChild {
+            process: process_handle,
+            thread: thread_handle,
+            job,
+            pid: pi.dwProcessId,
+            stdin_write: captured_stdin_write,
+            stdout_read,
+            stderr_read,
+            timeout_ms: get_timeout_milliseconds(request.script_timeout),
         })
     }
 
@@ -895,13 +923,38 @@ impl AppContainerScriptRunner {
         }
         unsafe { string_util::sid_to_string(self.app_container_sid.0, "unknown-sid") }
     }
+}
 
-    /// Execute the script inside the AppContainer, converting errors to ScriptResponse.
-    fn run_internal(&mut self, request: &ExecutionRequest, logger: &mut Logger) -> ScriptResponse {
-        match self.run_internal_impl(request, logger) {
-            Ok(response) => response,
-            Err(e) => ScriptResponse::error(&e.to_string()),
+/// A sandboxed AppContainer child created **suspended** by
+/// [`AppContainerScriptRunner::spawn_suspended`]. The caller resumes it and
+/// then either runs it to completion (blocking) or wraps it in a streaming
+/// handle. Owns the process/thread/job handles and the parent-side pipe ends.
+struct SpawnedChild {
+    process: OwnedHandle,
+    thread: OwnedHandle,
+    job: UiJobObject,
+    /// OS process id of the child.
+    pid: u32,
+    /// Parent's stdin write-end (Some only when spawned for streaming).
+    stdin_write: Option<OwnedHandle>,
+    /// Parent's stdout/stderr read-ends (Some only in streaming mode).
+    stdout_read: Option<OwnedHandle>,
+    stderr_read: Option<OwnedHandle>,
+    timeout_ms: u32,
+}
+
+impl SpawnedChild {
+    /// Resume the suspended child, terminating it on failure.
+    fn resume(&self) -> Result<(), WxcError> {
+        let r = unsafe { ResumeThread(self.thread.get()) };
+        if r == u32::MAX {
+            let err = unsafe { GetLastError() };
+            unsafe {
+                let _ = TerminateProcess(self.process.get(), u32::MAX);
+            }
+            return Err(WxcError::Process(format!("ResumeThread failed: {:?}", err)));
         }
+        Ok(())
     }
 }
 
@@ -911,28 +964,74 @@ impl Default for AppContainerScriptRunner {
     }
 }
 
-impl ScriptRunner for AppContainerScriptRunner {
-    fn validate_runner(&self, request: &ExecutionRequest) -> Result<(), ScriptResponse> {
-        if !request.policy.denied_paths.is_empty() && self.filesystem_mode != FilesystemMode::Dacl {
-            return Err(ScriptResponse::error(
-                wxc_common::error::DENIED_PATHS_NOT_SUPPORTED_MSG,
-            ));
+/// Delete the AppContainer profile created via [`CreateAppContainerProfile`]
+/// and clear any BFS policy registered against it.
+///
+/// This is the explicit cleanup entry point used by `wxc-exec --delete`,
+/// kept next to the create/setup path on `AppContainerScriptRunner` so
+/// both ends of the profile lifecycle live in the same module.
+///
+/// The BFS-clear step is best-effort: it delegates to
+/// [`FileSystemBfsManager::clear_policy`], which resolves `bfscfg.exe`
+/// itself and logs (rather than fails) when the resolver returns no
+/// path. The profile delete is still attempted in that case.
+pub fn delete_app_container_profile(name: &str, logger: &mut Logger) -> bool {
+    crate::filesystem_bfs::FileSystemBfsManager::clear_policy(name, logger);
+
+    let wide_name: Vec<u16> = name.encode_utf16().chain(std::iter::once(0)).collect();
+    let hstring = windows::core::HSTRING::from_wide(&wide_name[..wide_name.len() - 1]);
+    match unsafe { DeleteAppContainerProfile(&hstring) } {
+        Ok(()) => {
+            logger.log_line(&format!("Deleted AppContainer profile: {}", name));
+            true
         }
-        if !request.policy.allowed_hosts.is_empty() || !request.policy.blocked_hosts.is_empty() {
-            return Err(ScriptResponse::error(
-                wxc_common::error::HOST_LISTS_NOT_SUPPORTED_MSG,
+        Err(e) => {
+            logger.log_line(&format!(
+                "Failed to delete AppContainer profile '{}': {}",
+                name, e
             ));
+            false
+        }
+    }
+}
+
+impl Drop for AppContainerScriptRunner {
+    fn drop(&mut self) {
+        if !self.app_container_sid.0.is_null() {
+            unsafe {
+                // AppContainer SIDs from CreateAppContainerProfile /
+                // DeriveAppContainerSidFromAppContainerName must be freed with FreeSid.
+                windows::Win32::Security::FreeSid(self.app_container_sid);
+            }
+            self.app_container_sid = PSID(ptr::null_mut());
         }
-        Ok(())
     }
+}
+
+// ───────────────────────────────────────────────────────────────────────────
+// Shared setup/teardown + streaming (handle-based) execution
+// ───────────────────────────────────────────────────────────────────────────
 
-    fn execute(&mut self, request: &ExecutionRequest, logger: &mut Logger) -> ScriptResponse {
+/// Per-run resources (firewall + filesystem policy) built by
+/// [`AppContainerScriptRunner::prepare`]. `spawn` tears them down itself if the
+/// launch fails; otherwise they move into `AppContainerSandboxProcess`.
+struct Prepared {
+    network_manager: crate::network_manager::NetworkManager,
+    bfs_manager: crate::filesystem_bfs::FileSystemBfsManager,
+}
+
+impl AppContainerScriptRunner {
+    /// Set up the AppContainer for a run: initialise the SID, configure BFS
+    /// filesystem policy, and start network enforcement. Shared by both stdio
+    /// modes of [`SandboxBackend::spawn`].
+    fn prepare(
+        &mut self,
+        request: &ExecutionRequest,
+        logger: &mut Logger,
+    ) -> Result<Prepared, ScriptResponse> {
         use crate::filesystem_bfs::FileSystemBfsManager;
-        use crate::launch_diagnostics::diagnose_process_exit;
         use crate::network_manager::NetworkManager;
-        use wxc_common::models::FailurePhase;
 
-        // Apply experimental features when flag is set
         if request.experimental_enabled {
             if let Some(ref test) = request.experimental.test {
                 logger.log_line(&format!(
@@ -943,21 +1042,18 @@ impl ScriptRunner for AppContainerScriptRunner {
         }
 
         if let Err(e) = self.initialize(request) {
-            return ScriptResponse::error(&e.to_string());
+            return Err(ScriptResponse::error(&e.to_string()));
         }
 
         let principal_id = self.get_principal_id();
         logger.log_line(&format!("AppContainerSID: {principal_id}"));
 
-        // Resolve `bfscfg.exe` by absolute path so probe and execution
-        // agree on the binary — defeats executable-search-order
-        // hijacking (see `fallback_detector::find_bfscfg_exe`). Only
-        // resolve when we actually plan to use BFS; Tier 3 (DACL) hosts
-        // legitimately may not have `bfscfg.exe` installed.
+        // Resolve `bfscfg.exe` by absolute path (defeats search-order
+        // hijacking); only needed in BFS mode.
         let bfscfg_path = if self.filesystem_mode == FilesystemMode::Bfs {
             match crate::fallback_detector::find_bfscfg_exe() {
                 Ok(p) => p,
-                Err(e) => return ScriptResponse::error(&e.to_string()),
+                Err(e) => return Err(ScriptResponse::error(&e.to_string())),
             }
         } else {
             None
@@ -981,7 +1077,7 @@ impl ScriptRunner for AppContainerScriptRunner {
                 } else {
                     e.to_string()
                 };
-                return ScriptResponse::error(&msg);
+                return Err(ScriptResponse::error(&msg));
             }
         }
 
@@ -1005,92 +1101,283 @@ impl ScriptRunner for AppContainerScriptRunner {
                 self.proxy_address = network_manager.proxy_address().cloned();
             }
             Err(err) => {
-                return ScriptResponse::error(&err.to_string());
+                return Err(ScriptResponse::error(&err.to_string()));
             }
         }
 
-        let mut response = match std::panic::catch_unwind(std::panic::AssertUnwindSafe(|| {
-            self.run_internal(request, logger)
-        })) {
-            Ok(r) => r,
-            Err(_) => ScriptResponse::error("Unknown error during script execution."),
-        };
+        Ok(Prepared {
+            network_manager,
+            bfs_manager,
+        })
+    }
 
-        // Post-failure diagnostics: if the child failed, check for known
-        // environment issues and enrich the error message.
-        if response.exit_code != 0 {
-            response.failure_phase = FailurePhase::ProcessExited;
-            if let Some(diag) = diagnose_process_exit(
-                &request.script_code,
-                &request.policy.readonly_paths,
-                &request.policy.readwrite_paths,
-                response.exit_code as u32,
-            ) {
-                logger.log_line(&format!(
-                    "Error: Launch diagnostic [{}]: {}",
-                    diag.kind, diag.message
-                ));
-                if !response.error_message.is_empty() {
-                    response.extended_error = response.error_message.clone();
-                }
-                response.error_message = diag.message.clone();
-                response.standard_err.push_str(&diag.message);
+    /// Stop network enforcement and, in BFS mode, remove the filesystem policy
+    /// unless `preserve_policy` is set. `spawn` calls this when a launch fails.
+    fn teardown(&self, prepared: &mut Prepared, preserve_policy: bool, logger: &mut Logger) {
+        prepared.network_manager.stop_all(!preserve_policy, logger);
+        if self.filesystem_mode == FilesystemMode::Bfs
+            && prepared.bfs_manager.configured()
+            && !preserve_policy
+        {
+            prepared.bfs_manager.remove_configuration(logger);
+        }
+    }
+}
+
+impl SandboxBackend for AppContainerScriptRunner {
+    fn validate(&self, request: &ExecutionRequest) -> Result<(), ScriptResponse> {
+        if !request.policy.denied_paths.is_empty() && self.filesystem_mode != FilesystemMode::Dacl {
+            return Err(ScriptResponse::error(
+                wxc_common::error::DENIED_PATHS_NOT_SUPPORTED_MSG,
+            ));
+        }
+        if !request.policy.allowed_hosts.is_empty() || !request.policy.blocked_hosts.is_empty() {
+            return Err(ScriptResponse::error(
+                wxc_common::error::HOST_LISTS_NOT_SUPPORTED_MSG,
+            ));
+        }
+        Ok(())
+    }
+
+    fn spawn(
+        &mut self,
+        request: &ExecutionRequest,
+        logger: &mut Logger,
+        stdio: StdioMode,
+    ) -> Result<Box<dyn SandboxProcess>, ScriptResponse> {
+        use wxc_common::validator::validate_common;
+
+        validate_common(request)?;
+        self.validate(request)?;
+
+        let mut prepared = self.prepare(request, logger)?;
+
+        // Pipes → capture pipes the caller drives; Inherit → the child inherits
+        // the binary's own std handles / console (a TTY when the binary has one).
+        let capture = stdio == StdioMode::Pipes;
+        let child = match self.spawn_suspended(request, logger, capture) {
+            Ok(c) => c,
+            Err(e) => {
+                self.teardown(&mut prepared, request.lifecycle.preserve_policy, logger);
+                return Err(ScriptResponse::error(&e.to_string()));
             }
+        };
+        if let Err(e) = child.resume() {
+            self.teardown(&mut prepared, request.lifecycle.preserve_policy, logger);
+            return Err(ScriptResponse::error(&e.to_string()));
+        }
+
+        Ok(Box::new(AppContainerSandboxProcess::new(
+            child,
+            prepared,
+            self.filesystem_mode,
+            request,
+        )))
+    }
+
+    fn diagnose_exit(&self, request: &ExecutionRequest, exit_code: i32) -> Option<String> {
+        crate::launch_diagnostics::diagnose_process_exit(
+            &request.script_code,
+            &request.policy.readonly_paths,
+            &request.policy.readwrite_paths,
+            exit_code as u32,
+        )
+        .map(|diag| diag.message)
+    }
+}
+
+/// A running AppContainer-sandboxed process exposed as a [`SandboxProcess`].
+/// Owns the process/job handles, the parent-side pipes, and the per-run
+/// firewall/filesystem policy, which it tears down once the child exits.
+struct AppContainerSandboxProcess {
+    process: SendOwnedHandle,
+    _thread: SendOwnedHandle,
+    job: crate::job_object::UiJobObject,
+    pid: u32,
+    stdin: Option<PipeWriter>,
+    stdout: Option<InterruptiblePipeReader>,
+    stderr: Option<InterruptiblePipeReader>,
+    /// Cancellers for the stdout/stderr reads, kept so the `SandboxProcess`
+    /// closers can mint a [`StreamCloser`] even after the stream is taken.
+    stdout_canceller: Option<PipeReadCanceller>,
+    stderr_canceller: Option<PipeReadCanceller>,
+    prepared: Prepared,
+    filesystem_mode: FilesystemMode,
+    preserve_policy: bool,
+    timeout_ms: u32,
+    teardown_done: bool,
+}
+
+// SAFETY: the fields are Windows HANDLEs / handle-owning managers and owned
+// strings. HANDLEs are process-global and safe to use from any single thread,
+// and this handle is owned exclusively by the caller (not shared), so it is
+// only ever touched from one thread at a time.
+//
+// The one historically thread-affine field was the `NetworkManager` inside
+// `prepared`: it used to cache an STA `INetFwPolicy2` interface plus its
+// `CoInitializeEx` state and reuse them at teardown, which is unsound when
+// `wait()`/`kill()`/`Drop` run on a different thread (e.g. a tokio
+// `spawn_blocking` worker) than `spawn`. That no longer happens: each firewall
+// apply/remove is apartment-self-contained (it opens its own COM apartment,
+// creates a fresh interface, and uninitializes — all on whichever thread runs
+// it), so no COM interface or apartment state is moved across threads. The only
+// remaining OS state the manager keeps is the process-global Winsock refcount,
+// which is thread-agnostic. Moving this handle across threads is therefore
+// sound.
+unsafe impl Send for AppContainerSandboxProcess {}
+
+impl AppContainerSandboxProcess {
+    fn new(
+        mut child: SpawnedChild,
+        prepared: Prepared,
+        filesystem_mode: FilesystemMode,
+        request: &ExecutionRequest,
+    ) -> Self {
+        let process = SendOwnedHandle::take(&mut child.process);
+        let thread = SendOwnedHandle::take(&mut child.thread);
+        let stdin = child.stdin_write.take().map(PipeWriter::new);
+        let stdout = child.stdout_read.take().map(InterruptiblePipeReader::new);
+        let stderr = child.stderr_read.take().map(InterruptiblePipeReader::new);
+        let stdout_canceller = stdout.as_ref().map(InterruptiblePipeReader::canceller);
+        let stderr_canceller = stderr.as_ref().map(InterruptiblePipeReader::canceller);
+        Self {
+            process,
+            _thread: thread,
+            job: child.job,
+            pid: child.pid,
+            stdin,
+            stdout,
+            stderr,
+            stdout_canceller,
+            stderr_canceller,
+            prepared,
+            filesystem_mode,
+            preserve_policy: request.lifecycle.preserve_policy,
+            timeout_ms: child.timeout_ms,
+            teardown_done: false,
         }
+    }
 
-        network_manager.stop_all(!request.lifecycle.preserve_policy, logger);
+    fn run_teardown(&mut self) {
+        if self.teardown_done {
+            return;
+        }
+        self.teardown_done = true;
+        let mut logger = Logger::new(wxc_common::logger::Mode::Buffer);
+        self.prepared
+            .network_manager
+            .stop_all(!self.preserve_policy, &mut logger);
         if self.filesystem_mode == FilesystemMode::Bfs
-            && bfs_manager.configured()
-            && !request.lifecycle.preserve_policy
+            && self.prepared.bfs_manager.configured()
+            && !self.preserve_policy
         {
-            bfs_manager.remove_configuration(logger);
+            self.prepared.bfs_manager.remove_configuration(&mut logger);
         }
-
-        response
     }
 }
 
-/// Delete the AppContainer profile created via [`CreateAppContainerProfile`]
-/// and clear any BFS policy registered against it.
-///
-/// This is the explicit cleanup entry point used by `wxc-exec --delete`,
-/// kept next to the create/setup path on `AppContainerScriptRunner` so
-/// both ends of the profile lifecycle live in the same module.
-///
-/// The BFS-clear step is best-effort: it delegates to
-/// [`FileSystemBfsManager::clear_policy`], which resolves `bfscfg.exe`
-/// itself and logs (rather than fails) when the resolver returns no
-/// path. The profile delete is still attempted in that case.
-pub fn delete_app_container_profile(name: &str, logger: &mut Logger) -> bool {
-    crate::filesystem_bfs::FileSystemBfsManager::clear_policy(name, logger);
+impl SandboxProcess for AppContainerSandboxProcess {
+    fn take_stdin(&mut self) -> Option<Box<dyn std::io::Write + Send>> {
+        take_boxed_write(&mut self.stdin)
+    }
 
-    let wide_name: Vec<u16> = name.encode_utf16().chain(std::iter::once(0)).collect();
-    let hstring = windows::core::HSTRING::from_wide(&wide_name[..wide_name.len() - 1]);
-    match unsafe { DeleteAppContainerProfile(&hstring) } {
-        Ok(()) => {
-            logger.log_line(&format!("Deleted AppContainer profile: {}", name));
-            true
+    fn take_stdout(&mut self) -> Option<Box<dyn std::io::Read + Send>> {
+        take_boxed_read(&mut self.stdout)
+    }
+
+    fn take_stderr(&mut self) -> Option<Box<dyn std::io::Read + Send>> {
+        take_boxed_read(&mut self.stderr)
+    }
+
+    fn stdout_closer(&self) -> Option<Box<dyn StreamCloser>> {
+        boxed_closer(&self.stdout_canceller)
+    }
+
+    fn stderr_closer(&self) -> Option<Box<dyn StreamCloser>> {
+        boxed_closer(&self.stderr_canceller)
+    }
+
+    fn try_wait(&mut self) -> std::io::Result<Option<i32>> {
+        match unsafe { WaitForSingleObject(self.process.get(), 0) } {
+            WAIT_OBJECT_0 => {
+                let mut code: u32 = 0;
+                if unsafe { GetExitCodeProcess(self.process.get(), &mut code) }.is_err() {
+                    return Err(std::io::Error::other("GetExitCodeProcess failed"));
+                }
+                Ok(Some(code as i32))
+            }
+            WAIT_TIMEOUT => Ok(None),
+            _ => Err(std::io::Error::other("WaitForSingleObject failed")),
         }
-        Err(e) => {
-            logger.log_line(&format!(
-                "Failed to delete AppContainer profile '{}': {}",
-                name, e
-            ));
-            false
+    }
+
+    fn id(&self) -> u32 {
+        self.pid
+    }
+
+    fn kill(&mut self) -> std::io::Result<()> {
+        // Terminate the whole job: the child and every descendant assigned to
+        // it die together (tree-kill).
+        self.job.terminate(u32::MAX);
+        Ok(())
+    }
+
+    fn wait(&mut self) -> std::io::Result<i32> {
+        // Close our copy of any not-taken stdin so the child sees EOF and can
+        // exit reliably (an interactive command would otherwise block waiting
+        // for input).
+        self.stdin.take();
+
+        // Drain (and discard) any not-taken streams concurrently to avoid the
+        // child blocking on a full pipe buffer.
+        let stdout_thread = spawn_discard(self.stdout.take());
+        let stderr_thread = spawn_discard(self.stderr.take());
+
+        let result = match unsafe { WaitForSingleObject(self.process.get(), self.timeout_ms) } {
+            WAIT_OBJECT_0 => {
+                let mut code: u32 = 0;
+                if unsafe { GetExitCodeProcess(self.process.get(), &mut code) }.is_err() {
+                    Err(std::io::Error::other("GetExitCodeProcess failed"))
+                } else {
+                    Ok(code as i32)
+                }
+            }
+            WAIT_TIMEOUT => Err(std::io::Error::new(
+                std::io::ErrorKind::TimedOut,
+                format!("script timed out after {}ms", self.timeout_ms),
+            )),
+            _ => Err(std::io::Error::other("WaitForSingleObject failed")),
+        };
+
+        // Tree-kill the job so any backgrounded descendant dies *before*
+        // `run_teardown()` removes the firewall / BFS enforcement (keyed to the
+        // shared AppContainer package SID) — upholding the same invariant as
+        // `Drop`. The foreground child has already exited on the success path; on
+        // a timeout or wait failure this also terminates it. Then reap the root
+        // (immediate once it has exited) before releasing the pipe drains — and
+        // killing the tree closes the descendant's pipe write-ends, so the drains
+        // can finish.
+        let _ = self.kill();
+        unsafe {
+            let _ = WaitForSingleObject(self.process.get(), u32::MAX);
         }
+        cancel_and_join_discard(stdout_thread, &self.stdout_canceller);
+        cancel_and_join_discard(stderr_thread, &self.stderr_canceller);
+        self.run_teardown();
+        result
     }
 }
 
-impl Drop for AppContainerScriptRunner {
+impl Drop for AppContainerSandboxProcess {
     fn drop(&mut self) {
-        if !self.app_container_sid.0.is_null() {
-            unsafe {
-                // AppContainer SIDs from CreateAppContainerProfile /
-                // DeriveAppContainerSidFromAppContainerName must be freed with FreeSid.
-                windows::Win32::Security::FreeSid(self.app_container_sid);
-            }
-            self.app_container_sid = PSID(ptr::null_mut());
+        // Kill the tree and reap before tearing down firewall/filesystem
+        // policy, so an abandoned-but-running sandbox cannot outlive its
+        // enforcement (or leak as an orphan). `kill()` terminates the job.
+        let _ = self.kill();
+        unsafe {
+            let _ = WaitForSingleObject(self.process.get(), u32::MAX);
         }
+        self.run_teardown();
     }
 }
 
@@ -1272,7 +1559,7 @@ mod tests {
 
     use super::{AppContainerScriptRunner, FilesystemMode};
     use wxc_common::models::ExecutionRequest;
-    use wxc_common::script_runner::ScriptRunner;
+    use wxc_common::sandbox_process::SandboxBackend;
 
     #[test]
     fn validate_runner_rejects_denied_paths_in_bfs_mode() {
@@ -1281,7 +1568,7 @@ mod tests {
         request.policy.denied_paths = vec!["C:\\secret".into()];
 
         let err = runner
-            .validate_runner(&request)
+            .validate(&request)
             .expect_err("BFS mode must reject deniedPaths");
         assert!(
             err.error_message.contains("deniedPaths"),
@@ -1297,7 +1584,7 @@ mod tests {
         request.policy.denied_paths = vec!["C:\\secret".into()];
 
         assert!(
-            runner.validate_runner(&request).is_ok(),
+            runner.validate(&request).is_ok(),
             "DACL mode supports deniedPaths and should not error"
         );
     }
@@ -1309,7 +1596,7 @@ mod tests {
         request.policy.allowed_hosts = vec!["example.com".into()];
 
         let err = runner
-            .validate_runner(&request)
+            .validate(&request)
             .expect_err("allowedHosts is not yet supported");
         assert!(err.error_message.contains("allowedHosts"));
     }
@@ -1321,7 +1608,7 @@ mod tests {
         request.policy.blocked_hosts = vec!["bad.example.com".into()];
 
         let err = runner
-            .validate_runner(&request)
+            .validate(&request)
             .expect_err("blockedHosts is not yet supported");
         assert!(err.error_message.contains("blockedHosts"));
     }
@@ -1330,6 +1617,6 @@ mod tests {
     fn validate_runner_accepts_empty_policy() {
         let runner = AppContainerScriptRunner::new();
         let request = ExecutionRequest::default();
-        assert!(runner.validate_runner(&request).is_ok());
+        assert!(runner.validate(&request).is_ok());
     }
 }
diff --git a/src/backends/appcontainer/common/src/base_container_runner.rs b/src/backends/appcontainer/common/src/base_container_runner.rs
index f5e6c2527..073f9be19 100644
--- a/src/backends/appcontainer/common/src/base_container_runner.rs
+++ b/src/backends/appcontainer/common/src/base_container_runner.rs
@@ -16,7 +16,7 @@ use std::ptr;
 
 use windows::Win32::Foundation::{
     CloseHandle, GetLastError, SetHandleInformation, ERROR_CALL_NOT_IMPLEMENTED, E_NOTIMPL, HANDLE,
-    HANDLE_FLAG_INHERIT, WAIT_FAILED, WAIT_TIMEOUT,
+    HANDLE_FLAG_INHERIT, WAIT_OBJECT_0, WAIT_TIMEOUT,
 };
 use windows::Win32::System::Console::{
     GetStdHandle, STD_ERROR_HANDLE, STD_INPUT_HANDLE, STD_OUTPUT_HANDLE,
@@ -30,6 +30,7 @@ use windows::Win32::System::Threading::{
 };
 use windows_core::PCWSTR;
 
+use crate::job_object::UiJobObject;
 use crate::launch_diagnostics::{
     diagnose_create_process_failure, diagnose_environment_not_supported, diagnose_process_exit,
     is_environment_not_supported,
@@ -48,10 +49,20 @@ use wxc_common::models::{
     ExecutionRequest, FailurePhase, NetworkEnforcementMode, NetworkPolicy, ProxyAddress,
     ScriptResponse,
 };
-use wxc_common::script_runner::{get_timeout_milliseconds, ScriptRunner};
+use wxc_common::process_util::{
+    create_std_pipes, InterruptiblePipeReader, OwnedHandle, PipeReadCanceller, PipeWriter,
+    SendOwnedHandle,
+};
+use wxc_common::sandbox_process::{
+    boxed_closer, cancel_and_join_discard, spawn_discard, take_boxed_read, take_boxed_write,
+    SandboxBackend, SandboxProcess, StdioMode, StreamCloser,
+};
+use wxc_common::script_runner::get_timeout_milliseconds;
 use wxc_common::string_util;
 
-use windows::Win32::System::Threading::CREATE_UNICODE_ENVIRONMENT;
+use windows::Win32::System::Threading::{
+    ResumeThread, CREATE_SUSPENDED, CREATE_UNICODE_ENVIRONMENT,
+};
 
 /// Serialize `KEY=VALUE` pairs into a double-null-terminated UTF-16 environment block.
 ///
@@ -101,7 +112,7 @@ const SANDBOX_CAP_CREATE_PROCESS_IN_SANDBOX: u64 = 0x0000_0000_0000_0001;
 
 /// True when a Win32 error code signals the BaseContainer feature is not
 /// enabled on this build (symbol present, capability gated off).
-pub(crate) fn is_api_not_implemented(err: u32) -> bool {
+fn is_api_not_implemented(err: u32) -> bool {
     err == ERROR_CALL_NOT_IMPLEMENTED.0 || err == E_NOTIMPL.0 as u32
 }
 
@@ -532,51 +543,23 @@ impl BaseContainerRunner {
     }
 }
 
-impl ScriptRunner for BaseContainerRunner {
-    fn validate_runner(&self, request: &ExecutionRequest) -> Result<(), ScriptResponse> {
-        if !request.policy.denied_paths.is_empty() {
-            return Err(ScriptResponse::error(
-                wxc_common::error::DENIED_PATHS_NOT_SUPPORTED_MSG,
-            ));
-        }
-        if !request.policy.allowed_hosts.is_empty() || !request.policy.blocked_hosts.is_empty() {
-            return Err(ScriptResponse::error(
-                wxc_common::error::HOST_LISTS_NOT_SUPPORTED_MSG,
-            ));
-        }
-        Self::is_base_container_api_present().map_err(|e| {
-            let hint = if !request.experimental_enabled {
-                format!(
-                    "BaseContainer API unavailable: {e}\n\
-                     Hint: Config schema version '{}' requires the BaseContainer backend, \
-                     but this OS build does not support it. \
-                     Use schema version '0.4.0-alpha' to fall back to AppContainer.",
-                    request.schema_version
-                )
-            } else {
-                format!(
-                    "BaseContainer API unavailable: {e}\n\
-                     Hint: --experimental requested BaseContainer, but this OS build \
-                     does not support it. Remove --experimental to use the AppContainer \
-                     backend, or use an OS build with BaseContainer support."
-                )
-            };
-            ScriptResponse {
-                // Symbol absent: report BackendUnavailable, not a hard error.
-                failure_phase: FailurePhase::BackendUnavailable,
-                ..ScriptResponse::error(&hint)
-            }
-        })
-    }
-
-    fn execute(&mut self, request: &ExecutionRequest, logger: &mut Logger) -> ScriptResponse {
+impl BaseContainerRunner {
+    /// Set up and launch the BaseContainer child, returning a [`BaseChild`] the
+    /// caller runs to completion (blocking) or wraps in a streaming handle. When
+    /// `capture` is set the child's stdio is wired to pipes the caller drives
+    /// (the streaming path); otherwise the child inherits the parent's std
+    /// handles / console (the run-to-completion path).
+    fn spawn_base(
+        &mut self,
+        request: &ExecutionRequest,
+        logger: &mut Logger,
+        capture: bool,
+    ) -> Result<BaseChild, ScriptResponse> {
         let _ = writeln!(
             logger,
             "{EMOJI_SECTION} SECTION: Backend runner 'BaseContainer'"
         );
 
-        let run_start = std::time::Instant::now();
-
         // Launch builtin test proxy if requested (before building spec so we have the port).
         let mut request = request.clone();
         if request.policy.network_proxy.builtin_test_server {
@@ -586,9 +569,9 @@ impl ScriptRunner for BaseContainerRunner {
                     request.policy.network_proxy.address = Some(addr);
                 }
                 Err(e) => {
-                    return ScriptResponse::error(&format!(
+                    return Err(ScriptResponse::error(&format!(
                         "Failed to start builtin test proxy: {e}"
-                    ));
+                    )));
                 }
             }
         }
@@ -626,7 +609,7 @@ impl ScriptRunner for BaseContainerRunner {
         // 2. Dynamically load the API from processmodel.dll.
         let create_process_in_sandbox = match Self::load_api() {
             Ok(f) => f,
-            Err(e) => return ScriptResponse::error(&e),
+            Err(e) => return Err(ScriptResponse::error(&e)),
         };
         let _ = writeln!(
             logger,
@@ -714,60 +697,123 @@ impl ScriptRunner for BaseContainerRunner {
         // If wxc-exec's stdout or stderr is not a terminal (i.e., piped by the SDK),
         // we forward our own std handles to the child via STARTF_USESTDHANDLES so the
         // child's output streams directly to the SDK in real time.
-        let pipe_mode = !std::io::stdout().is_terminal() || !std::io::stderr().is_terminal();
+        //
+        // In capture mode (`StdioMode::Pipes`) we always take the pipe
+        // path and wire the child to capture pipes that the streaming handle
+        // reads from.
+        let pipe_mode =
+            capture || !std::io::stdout().is_terminal() || !std::io::stderr().is_terminal();
 
         if pipe_mode {
-            let _ = writeln!(
-                logger,
-                "STDIO mode: passthrough (forwarding parent handles to child)"
-            );
+            if capture {
+                let _ = writeln!(
+                    logger,
+                    "STDIO mode: capture (piping child output to the streaming handle)"
+                );
+            } else {
+                let _ = writeln!(
+                    logger,
+                    "STDIO mode: passthrough (forwarding parent handles to child)"
+                );
+            }
         }
 
-        // --- Retrieve parent std handles for passthrough (pipe mode only) ---
+        // --- Retrieve / create std handles (pipe mode only) ---
         let mut h_stdin = HANDLE::default();
         let mut h_stdout = HANDLE::default();
         let mut h_stderr = HANDLE::default();
 
+        // Capture pipe read-ends (parent side) kept alive until after the wait;
+        // child-side ends kept alive until after process creation.
+        let mut capture_reads: Option<(OwnedHandle, OwnedHandle)> = None;
+        let mut capture_child_ends: Vec<OwnedHandle> = Vec::new();
+        // Parent's stdin write-end; in capture mode it is handed to the caller
+        // so they can write to the child.
+        let mut captured_stdin_write: Option<OwnedHandle> = None;
+
         if pipe_mode {
-            h_stdin = match unsafe { GetStdHandle(STD_INPUT_HANDLE) } {
-                Ok(h) => h,
-                Err(e) => return ScriptResponse::error(&format!("GetStdHandle(STDIN): {e}")),
-            };
-            h_stdout = match unsafe { GetStdHandle(STD_OUTPUT_HANDLE) } {
-                Ok(h) => h,
-                Err(e) => return ScriptResponse::error(&format!("GetStdHandle(STDOUT): {e}")),
-            };
-            h_stderr = match unsafe { GetStdHandle(STD_ERROR_HANDLE) } {
-                Ok(h) => h,
-                Err(e) => return ScriptResponse::error(&format!("GetStdHandle(STDERR): {e}")),
-            };
+            if capture {
+                let (stdin_read, stdin_write) = match create_std_pipes(false) {
+                    Ok(p) => p,
+                    Err(e) => return Err(ScriptResponse::error(&format!("stdin pipe: {e}"))),
+                };
+                let (stdout_read, stdout_write) = match create_std_pipes(true) {
+                    Ok(p) => p,
+                    Err(e) => return Err(ScriptResponse::error(&format!("stdout pipe: {e}"))),
+                };
+                let (stderr_read, stderr_write) = match create_std_pipes(true) {
+                    Ok(p) => p,
+                    Err(e) => return Err(ScriptResponse::error(&format!("stderr pipe: {e}"))),
+                };
 
-            if h_stdin.is_invalid() || h_stdin == HANDLE::default() {
-                return ScriptResponse::error("GetStdHandle(STDIN) returned null/invalid handle");
-            }
-            if h_stdout.is_invalid() || h_stdout == HANDLE::default() {
-                return ScriptResponse::error("GetStdHandle(STDOUT) returned null/invalid handle");
-            }
-            if h_stderr.is_invalid() || h_stderr == HANDLE::default() {
-                return ScriptResponse::error("GetStdHandle(STDERR) returned null/invalid handle");
-            }
+                h_stdin = stdin_read.get();
+                h_stdout = stdout_write.get();
+                h_stderr = stderr_write.get();
 
-            // Ensure the handles are inheritable.
-            unsafe {
-                if let Err(e) =
-                    SetHandleInformation(h_stdin, HANDLE_FLAG_INHERIT.0, HANDLE_FLAG_INHERIT)
-                {
-                    return ScriptResponse::error(&format!("SetHandleInformation(STDIN): {e}"));
+                capture_child_ends.push(stdin_read);
+                capture_child_ends.push(stdout_write);
+                capture_child_ends.push(stderr_write);
+                captured_stdin_write = Some(stdin_write);
+                capture_reads = Some((stdout_read, stderr_read));
+            } else {
+                h_stdin = match unsafe { GetStdHandle(STD_INPUT_HANDLE) } {
+                    Ok(h) => h,
+                    Err(e) => {
+                        return Err(ScriptResponse::error(&format!("GetStdHandle(STDIN): {e}")))
+                    }
+                };
+                h_stdout = match unsafe { GetStdHandle(STD_OUTPUT_HANDLE) } {
+                    Ok(h) => h,
+                    Err(e) => {
+                        return Err(ScriptResponse::error(&format!("GetStdHandle(STDOUT): {e}")))
+                    }
+                };
+                h_stderr = match unsafe { GetStdHandle(STD_ERROR_HANDLE) } {
+                    Ok(h) => h,
+                    Err(e) => {
+                        return Err(ScriptResponse::error(&format!("GetStdHandle(STDERR): {e}")))
+                    }
+                };
+
+                if h_stdin.is_invalid() || h_stdin == HANDLE::default() {
+                    return Err(ScriptResponse::error(
+                        "GetStdHandle(STDIN) returned null/invalid handle",
+                    ));
                 }
-                if let Err(e) =
-                    SetHandleInformation(h_stdout, HANDLE_FLAG_INHERIT.0, HANDLE_FLAG_INHERIT)
-                {
-                    return ScriptResponse::error(&format!("SetHandleInformation(STDOUT): {e}"));
+                if h_stdout.is_invalid() || h_stdout == HANDLE::default() {
+                    return Err(ScriptResponse::error(
+                        "GetStdHandle(STDOUT) returned null/invalid handle",
+                    ));
                 }
-                if let Err(e) =
-                    SetHandleInformation(h_stderr, HANDLE_FLAG_INHERIT.0, HANDLE_FLAG_INHERIT)
-                {
-                    return ScriptResponse::error(&format!("SetHandleInformation(STDERR): {e}"));
+                if h_stderr.is_invalid() || h_stderr == HANDLE::default() {
+                    return Err(ScriptResponse::error(
+                        "GetStdHandle(STDERR) returned null/invalid handle",
+                    ));
+                }
+
+                // Ensure the handles are inheritable.
+                unsafe {
+                    if let Err(e) =
+                        SetHandleInformation(h_stdin, HANDLE_FLAG_INHERIT.0, HANDLE_FLAG_INHERIT)
+                    {
+                        return Err(ScriptResponse::error(&format!(
+                            "SetHandleInformation(STDIN): {e}"
+                        )));
+                    }
+                    if let Err(e) =
+                        SetHandleInformation(h_stdout, HANDLE_FLAG_INHERIT.0, HANDLE_FLAG_INHERIT)
+                    {
+                        return Err(ScriptResponse::error(&format!(
+                            "SetHandleInformation(STDOUT): {e}"
+                        )));
+                    }
+                    if let Err(e) =
+                        SetHandleInformation(h_stderr, HANDLE_FLAG_INHERIT.0, HANDLE_FLAG_INHERIT)
+                    {
+                        return Err(ScriptResponse::error(&format!(
+                            "SetHandleInformation(STDERR): {e}"
+                        )));
+                    }
                 }
             }
         }
@@ -805,11 +851,17 @@ impl ScriptRunner for BaseContainerRunner {
             .as_ref()
             .map(|b| b.as_ptr() as *const c_void)
             .unwrap_or(ptr::null());
-        let creation_flags = if env_block.is_some() {
-            CREATE_UNICODE_ENVIRONMENT.0
-        } else {
-            0
-        };
+        // Create the child suspended so its main thread cannot spawn any
+        // descendant before we've assigned it to the job object below; it is
+        // resumed right after the assignment. If the sandbox create API ignores
+        // CREATE_SUSPENDED on a given build, the child starts running anyway and
+        // the later resume is a harmless no-op.
+        let creation_flags = CREATE_SUSPENDED.0
+            | if env_block.is_some() {
+                CREATE_UNICODE_ENVIRONMENT.0
+            } else {
+                0
+            };
 
         let _ = writeln!(logger, "launching: {}", request.script_code);
         let _ = writeln!(logger, "identity: {identity}");
@@ -829,13 +881,13 @@ impl ScriptRunner for BaseContainerRunner {
                 "Error: Pre-launch diagnostic [{}]: {}",
                 diag.kind, diag.message
             );
-            return ScriptResponse {
+            return Err(ScriptResponse {
                 exit_code: -1,
                 error_message: diag.message.clone(),
                 standard_err: diag.message,
                 failure_phase: FailurePhase::LaunchFailed,
                 ..Default::default()
-            };
+            });
         }
 
         // 4. Call Experimental_CreateProcessInSandbox.
@@ -902,9 +954,10 @@ impl ScriptRunner for BaseContainerRunner {
                     diag.kind, diag.message
                 );
 
-                // Retry without the environment block.
+                // Retry without the environment block, but keep the child
+                // suspended (resumed after job assignment).
                 current_env_ptr = ptr::null();
-                current_creation_flags = 0;
+                current_creation_flags = CREATE_SUSPENDED.0;
                 continue;
             }
 
@@ -960,107 +1013,405 @@ impl ScriptRunner for BaseContainerRunner {
                 FailurePhase::LaunchFailed
             };
 
-            return ScriptResponse {
+            return Err(ScriptResponse {
                 exit_code: -1,
                 error_message: diag.message.clone(),
                 standard_err: diag.message,
                 extended_error,
                 failure_phase,
                 ..Default::default()
-            };
+            });
         }
 
         let _ = writeln!(logger, "process created (PID: {})", pi.dwProcessId);
 
-        let _ = writeln!(logger, "{EMOJI_SECTION} SECTION: Wait for exit");
+        // Child has inherited the pipe handles; close the parent's child-side
+        // ends so the read-ends observe EOF when the child exits.
+        capture_child_ends.clear();
 
-        // 5. Wait for the child process to exit.
-        let timeout_ms = get_timeout_milliseconds(request.script_timeout);
-        let mut exit_code: u32 = u32::MAX;
+        let (stdout_read, stderr_read) = match capture_reads {
+            Some((out, err)) => (Some(out), Some(err)),
+            None => (None, None),
+        };
 
-        unsafe {
-            let wait_result = WaitForSingleObject(pi.hProcess, timeout_ms);
-            if wait_result == WAIT_FAILED {
-                let err = GetLastError();
-                let _ = CloseHandle(pi.hProcess);
-                let _ = CloseHandle(pi.hThread);
-                return ScriptResponse::error(&format!("WaitForSingleObject failed: {err:?}"));
-            } else if wait_result == WAIT_TIMEOUT {
-                let _ = writeln!(logger, "process timed out, terminating...");
-                let _ = TerminateProcess(pi.hProcess, u32::MAX);
-                let _ = WaitForSingleObject(pi.hProcess, 5000);
+        // Assign the child to a job object so the streaming handle's `kill()`
+        // (and the timeout / `Drop` paths) can tree-kill it — the child plus
+        // every descendant it spawns after assignment. This backend *is* a
+        // security boundary, so fail **closed**: if the job cannot be created
+        // or the process cannot be assigned, terminate the just-launched child
+        // and reject the spawn rather than run a sandbox that cannot be
+        // reliably torn down. (Previously this was best-effort: a failed
+        // assignment left `job = None`, after which `kill()`/timeout/`Drop`
+        // could only `TerminateProcess` the root and no descendant was
+        // tree-killed at all.)
+        //
+        // The child was created suspended (CREATE_SUSPENDED) and is resumed only
+        // after this assignment, so no descendant it spawns can escape the job.
+        // If the create API ignores CREATE_SUSPENDED on a given build the child
+        // is already running; it is a shell that has not yet run the user
+        // command, so the pre-assignment window is empty in practice and the
+        // later resume is a harmless no-op.
+        let job = match UiJobObject::new().and_then(|job| {
+            // Pass the raw handle — `assign_process` borrows it and does not
+            // take ownership. Wrapping it in a temporary `OwnedHandle` here
+            // would close `pi.hProcess` when the temporary dropped, leaving the
+            // owned handle on the `BaseChild` below pointing at a closed (and
+            // possibly reused) handle. Sole ownership stays with that field.
+            job.assign_process(pi.hProcess)?;
+            Ok(job)
+        }) {
+            Ok(job) => job,
+            Err(e) => {
+                let _ = writeln!(
+                    logger,
+                    "Error: BaseContainer job-object setup failed ({e}); terminating \
+                     the child and failing closed — a sandbox that cannot be \
+                     tree-killed must not run."
+                );
+                // The child exists (suspended unless CREATE_SUSPENDED was ignored)
+                // and there is no job to tree-kill through, so terminate the root
+                // directly and reap it before tearing down sandbox / proxy state,
+                // upholding the same "enforcement never outlives a live child"
+                // invariant as the normal teardown paths.
+                unsafe {
+                    let _ = TerminateProcess(pi.hProcess, u32::MAX);
+                    let _ = WaitForSingleObject(pi.hProcess, u32::MAX);
+                    let _ = CloseHandle(pi.hProcess);
+                    let _ = CloseHandle(pi.hThread);
+                }
+                if request.lifecycle.destroy_on_exit {
+                    run_sandbox_cleanup(
+                        &identity,
+                        &sid_string,
+                        request.policy.network_proxy.is_enabled(),
+                        logger,
+                    );
+                    sandbox_tracking::unregister_ctrl_c_cleanup();
+                }
+                self.proxy_coordinator.stop(logger);
+
+                const JOB_SETUP_FAILED_MSG: &str =
+                    "BaseContainer sandbox could not be placed in a job object, so it \
+                     could not be reliably terminated; the launch was rejected to \
+                     avoid running an uncontainable sandbox.";
+                return Err(ScriptResponse {
+                    exit_code: -1,
+                    error_message: JOB_SETUP_FAILED_MSG.to_string(),
+                    standard_err: JOB_SETUP_FAILED_MSG.to_string(),
+                    extended_error: format!("BaseContainer job-object setup failed: {e}"),
+                    failure_phase: FailurePhase::LaunchFailed,
+                    ..Default::default()
+                });
             }
+        };
 
-            let _ = GetExitCodeProcess(pi.hProcess, &mut exit_code);
+        // The child was created suspended; now that it is in the job object (so
+        // every descendant it spawns is captured), resume its main thread. If the
+        // create API ignored CREATE_SUSPENDED the thread is already running and
+        // this is a harmless no-op.
+        // SAFETY: `pi.hThread` is the just-created, still-owned main-thread
+        // handle; `ResumeThread` only adjusts its suspend count.
+        unsafe {
+            ResumeThread(pi.hThread);
+        }
 
-            let _ = CloseHandle(pi.hProcess);
-            let _ = CloseHandle(pi.hThread);
+        // Hand ownership to the caller via `BaseChild`, which performs
+        // sandbox/proxy teardown after the child exits. `job` is always present
+        // here (we failed closed above); the `Option` and the root-only fallback
+        // in `kill()` remain purely as defense-in-depth.
+        Ok(BaseChild {
+            process: OwnedHandle::new(pi.hProcess),
+            thread: OwnedHandle::new(pi.hThread),
+            pid: pi.dwProcessId,
+            job: Some(job),
+            stdin_write: captured_stdin_write,
+            stdout_read,
+            stderr_read,
+            timeout_ms: get_timeout_milliseconds(request.script_timeout),
+            destroy_on_exit: request.lifecycle.destroy_on_exit,
+            proxy_enabled: request.policy.network_proxy.is_enabled(),
+            identity,
+            sid_string,
+            proxy_coordinator: std::mem::take(&mut self.proxy_coordinator),
+        })
+    }
+}
+
+/// A BaseContainer child launched by [`BaseContainerRunner::spawn_base`]. The
+/// child is created suspended and resumed once it is in its job object; this
+/// owns the process handle, the parent-side pipe ends, and the per-run
+/// proxy/sandbox state it tears down once the child exits.
+struct BaseChild {
+    process: OwnedHandle,
+    thread: OwnedHandle,
+    pid: u32,
+    /// Job object the child is assigned to, used to tree-kill it. Always
+    /// `Some` on a successfully spawned child (`spawn_base` fails closed when
+    /// the job cannot be set up); the `Option` is retained so `kill()` can keep
+    /// a root-only fallback as defense-in-depth.
+    job: Option<UiJobObject>,
+    stdin_write: Option<OwnedHandle>,
+    stdout_read: Option<OwnedHandle>,
+    stderr_read: Option<OwnedHandle>,
+    timeout_ms: u32,
+    destroy_on_exit: bool,
+    proxy_enabled: bool,
+    identity: String,
+    sid_string: String,
+    proxy_coordinator: ProxyCoordinator,
+}
+
+impl SandboxBackend for BaseContainerRunner {
+    fn validate(&self, request: &ExecutionRequest) -> Result<(), ScriptResponse> {
+        if !request.policy.denied_paths.is_empty() {
+            return Err(ScriptResponse::error(
+                wxc_common::error::DENIED_PATHS_NOT_SUPPORTED_MSG,
+            ));
+        }
+        if !request.policy.allowed_hosts.is_empty() || !request.policy.blocked_hosts.is_empty() {
+            return Err(ScriptResponse::error(
+                wxc_common::error::HOST_LISTS_NOT_SUPPORTED_MSG,
+            ));
         }
+        Self::is_base_container_api_present().map_err(|e| {
+            let hint = if !request.experimental_enabled {
+                format!(
+                    "BaseContainer API unavailable: {e}\n\
+                     Hint: Config schema version '{}' requires the BaseContainer backend, \
+                     but this OS build does not support it. \
+                     Use schema version '0.4.0-alpha' to fall back to AppContainer.",
+                    request.schema_version
+                )
+            } else {
+                format!(
+                    "BaseContainer API unavailable: {e}\n\
+                     Hint: --experimental requested BaseContainer, but this OS build \
+                     does not support it. Remove --experimental to use the AppContainer \
+                     backend, or use an OS build with BaseContainer support."
+                )
+            };
+            ScriptResponse {
+                // Symbol absent: report BackendUnavailable, not a hard error.
+                failure_phase: FailurePhase::BackendUnavailable,
+                ..ScriptResponse::error(&hint)
+            }
+        })
+    }
 
-        let _ = writeln!(logger, "process exited with code {exit_code}");
+    fn spawn(
+        &mut self,
+        request: &ExecutionRequest,
+        logger: &mut Logger,
+        stdio: StdioMode,
+    ) -> Result<Box<dyn SandboxProcess>, ScriptResponse> {
+        use wxc_common::validator::validate_common;
+
+        validate_common(request)?;
+        self.validate(request)?;
+
+        // Pipes → capture pipes the caller drives; Inherit → the child inherits
+        // the binary's own std handles / console (a TTY when the binary has one).
+        let capture = stdio == StdioMode::Pipes;
+        let child = self.spawn_base(request, logger, capture)?;
+        Ok(Box::new(BaseContainerSandboxProcess::from_child(child)))
+    }
 
-        // 6. Sandbox cleanup: delete AppContainer profile and tracking entry.
-        //    Deferred if a network proxy is configured (proxy state can't be cleaned up yet).
-        if request.lifecycle.destroy_on_exit {
+    fn diagnose_exit(&self, request: &ExecutionRequest, exit_code: i32) -> Option<String> {
+        diagnose_process_exit(
+            &request.script_code,
+            &request.policy.readonly_paths,
+            &request.policy.readwrite_paths,
+            exit_code as u32,
+        )
+        .map(|diag| diag.message)
+    }
+}
+
+/// A running BaseContainer-sandboxed process exposed as a [`SandboxProcess`].
+/// Owns the process handle, the parent-side pipes, and the per-run proxy /
+/// sandbox state, which it tears down once the child exits.
+struct BaseContainerSandboxProcess {
+    process: SendOwnedHandle,
+    _thread: SendOwnedHandle,
+    job: Option<UiJobObject>,
+    pid: u32,
+    stdin: Option<PipeWriter>,
+    stdout: Option<InterruptiblePipeReader>,
+    stderr: Option<InterruptiblePipeReader>,
+    /// Cancellers for the stdout/stderr reads, kept so the `SandboxProcess`
+    /// closers can mint a [`StreamCloser`] even after the stream is taken.
+    stdout_canceller: Option<PipeReadCanceller>,
+    stderr_canceller: Option<PipeReadCanceller>,
+    timeout_ms: u32,
+    destroy_on_exit: bool,
+    proxy_enabled: bool,
+    identity: String,
+    sid_string: String,
+    proxy_coordinator: ProxyCoordinator,
+    teardown_done: bool,
+}
+
+// SAFETY: the fields are Windows HANDLEs / handle-owning managers and owned
+// strings. HANDLEs are process-wide rather than tied to the thread that
+// opened them, and this value is owned exclusively by the caller (never
+// shared), so moving it to another thread is sound.
+unsafe impl Send for BaseContainerSandboxProcess {}
+
+impl BaseContainerSandboxProcess {
+    fn from_child(mut child: BaseChild) -> Self {
+        let process = SendOwnedHandle::take(&mut child.process);
+        let thread = SendOwnedHandle::take(&mut child.thread);
+        let stdin = child.stdin_write.take().map(PipeWriter::new);
+        let stdout = child.stdout_read.take().map(InterruptiblePipeReader::new);
+        let stderr = child.stderr_read.take().map(InterruptiblePipeReader::new);
+        let stdout_canceller = stdout.as_ref().map(InterruptiblePipeReader::canceller);
+        let stderr_canceller = stderr.as_ref().map(InterruptiblePipeReader::canceller);
+        Self {
+            process,
+            _thread: thread,
+            job: child.job.take(),
+            pid: child.pid,
+            stdin,
+            stdout,
+            stderr,
+            stdout_canceller,
+            stderr_canceller,
+            timeout_ms: child.timeout_ms,
+            destroy_on_exit: child.destroy_on_exit,
+            proxy_enabled: child.proxy_enabled,
+            identity: std::mem::take(&mut child.identity),
+            sid_string: std::mem::take(&mut child.sid_string),
+            proxy_coordinator: std::mem::take(&mut child.proxy_coordinator),
+            teardown_done: false,
+        }
+    }
+
+    fn run_teardown(&mut self) {
+        if self.teardown_done {
+            return;
+        }
+        self.teardown_done = true;
+        let mut logger = Logger::new(wxc_common::logger::Mode::Buffer);
+        if self.destroy_on_exit {
             run_sandbox_cleanup(
-                &identity,
-                &sid_string,
-                request.policy.network_proxy.is_enabled(),
-                logger,
+                &self.identity,
+                &self.sid_string,
+                self.proxy_enabled,
+                &mut logger,
             );
-            // Unregister so a late Ctrl+C doesn't double-cleanup.
             sandbox_tracking::unregister_ctrl_c_cleanup();
         }
+        self.proxy_coordinator.stop(&mut logger);
+    }
+}
 
-        let _ = writeln!(
-            logger,
-            "{EMOJI_SECTION} SECTION: Done ({:.3}s)",
-            run_start.elapsed().as_secs_f64()
-        );
+impl SandboxProcess for BaseContainerSandboxProcess {
+    fn take_stdin(&mut self) -> Option<Box<dyn std::io::Write + Send>> {
+        take_boxed_write(&mut self.stdin)
+    }
 
-        // Stop the builtin test proxy if it was started.
-        self.proxy_coordinator.stop(logger);
+    fn take_stdout(&mut self) -> Option<Box<dyn std::io::Read + Send>> {
+        take_boxed_read(&mut self.stdout)
+    }
 
-        //
-        // Diagnose the application failure (FailurePhase::ProcessExited).
-        //
-        let (error_message, failure_phase) = if exit_code != 0 {
-            if let Some(diag) = diagnose_process_exit(
-                &request.script_code,
-                &request.policy.readonly_paths,
-                &request.policy.readwrite_paths,
-                exit_code,
-            ) {
-                let _ = writeln!(
-                    logger,
-                    "Error: Launch diagnostic [{}]: {}",
-                    diag.kind, diag.message
-                );
-                (diag.message, FailurePhase::ProcessExited)
-            } else {
-                (String::new(), FailurePhase::ProcessExited)
+    fn take_stderr(&mut self) -> Option<Box<dyn std::io::Read + Send>> {
+        take_boxed_read(&mut self.stderr)
+    }
+
+    fn stdout_closer(&self) -> Option<Box<dyn StreamCloser>> {
+        boxed_closer(&self.stdout_canceller)
+    }
+
+    fn stderr_closer(&self) -> Option<Box<dyn StreamCloser>> {
+        boxed_closer(&self.stderr_canceller)
+    }
+
+    fn try_wait(&mut self) -> std::io::Result<Option<i32>> {
+        match unsafe { WaitForSingleObject(self.process.get(), 0) } {
+            WAIT_OBJECT_0 => {
+                let mut code: u32 = 0;
+                if unsafe { GetExitCodeProcess(self.process.get(), &mut code) }.is_err() {
+                    return Err(std::io::Error::other("GetExitCodeProcess failed"));
+                }
+                Ok(Some(code as i32))
             }
-        } else {
-            (String::new(), FailurePhase::None)
-        };
+            WAIT_TIMEOUT => Ok(None),
+            _ => Err(std::io::Error::other("WaitForSingleObject failed")),
+        }
+    }
+
+    fn id(&self) -> u32 {
+        self.pid
+    }
 
-        // Merge diagnostic error into stderr field if present.
-        // In passthrough mode, stdout/stderr already went directly to the SDK caller,
-        // so standard_out/standard_err in ScriptResponse will be empty.
-        let final_stderr = if error_message.is_empty() {
-            String::new()
+    fn kill(&mut self) -> std::io::Result<()> {
+        // Tree-kill via the job object when the child was successfully assigned
+        // to one; otherwise fall back to terminating the root process.
+        if let Some(job) = &self.job {
+            job.terminate(u32::MAX);
         } else {
-            error_message.clone()
+            unsafe {
+                let _ = TerminateProcess(self.process.get(), u32::MAX);
+            }
+        }
+        Ok(())
+    }
+
+    fn wait(&mut self) -> std::io::Result<i32> {
+        // Close our copy of any not-taken stdin so the child sees EOF and can
+        // exit reliably (an interactive command would otherwise block waiting
+        // for input).
+        self.stdin.take();
+
+        // Drain (and discard) any not-taken streams concurrently to avoid the
+        // child blocking on a full pipe buffer.
+        let stdout_thread = spawn_discard(self.stdout.take());
+        let stderr_thread = spawn_discard(self.stderr.take());
+
+        let result = match unsafe { WaitForSingleObject(self.process.get(), self.timeout_ms) } {
+            WAIT_OBJECT_0 => {
+                let mut code: u32 = 0;
+                if unsafe { GetExitCodeProcess(self.process.get(), &mut code) }.is_err() {
+                    Err(std::io::Error::other("GetExitCodeProcess failed"))
+                } else {
+                    Ok(code as i32)
+                }
+            }
+            WAIT_TIMEOUT => Err(std::io::Error::new(
+                std::io::ErrorKind::TimedOut,
+                format!("script timed out after {}ms", self.timeout_ms),
+            )),
+            _ => Err(std::io::Error::other("WaitForSingleObject failed")),
         };
 
-        ScriptResponse {
-            exit_code: exit_code as i32,
-            standard_out: String::new(),
-            standard_err: final_stderr,
-            error_message,
-            failure_phase,
-            ..Default::default()
+        // Tree-kill (the job when assigned, else the root) so any backgrounded
+        // descendant dies *before* `run_teardown()` stops the proxy / sandbox
+        // enforcement — upholding the same invariant as `Drop`. The foreground
+        // child has already exited on the success path; on a timeout or wait
+        // failure this also terminates it. The root is then reaped before the
+        // pipe drains are cancelled and joined; killing the tree also closes
+        // the descendants' pipe write-ends, so the drains can finish.
+        let _ = self.kill();
+        unsafe {
+            let _ = WaitForSingleObject(self.process.get(), u32::MAX);
+        }
+        cancel_and_join_discard(stdout_thread, &self.stdout_canceller);
+        cancel_and_join_discard(stderr_thread, &self.stderr_canceller);
+        self.run_teardown();
+        result
+    }
+}
+
+impl Drop for BaseContainerSandboxProcess {
+    fn drop(&mut self) {
+        // Kill and reap before tearing down proxy / sandbox state, so an
+        // abandoned-but-running sandbox cannot outlive its enforcement (or
+        // leak as an orphan).
+        let _ = self.kill();
+        unsafe {
+            let _ = WaitForSingleObject(self.process.get(), u32::MAX);
         }
+        self.run_teardown();
     }
 }
 
@@ -1319,7 +1670,7 @@ mod tests {
 
     // ---- validate_runner: unsupported policy fields surface as errors. ----
 
-    use wxc_common::script_runner::ScriptRunner;
+    use wxc_common::sandbox_process::SandboxBackend;
 
     #[test]
     fn validate_runner_rejects_denied_paths() {
@@ -1328,7 +1679,7 @@ mod tests {
         request.policy.denied_paths = vec!["C:\\secret".into()];
 
         let err = runner
-            .validate_runner(&request)
+            .validate(&request)
             .expect_err("BaseContainer does not yet support deniedPaths");
         assert!(
             err.error_message.contains("deniedPaths"),
@@ -1344,7 +1695,7 @@ mod tests {
         request.policy.allowed_hosts = vec!["example.com".into()];
 
         let err = runner
-            .validate_runner(&request)
+            .validate(&request)
             .expect_err("allowedHosts is not yet supported");
         assert!(err.error_message.contains("allowedHosts"));
     }
@@ -1356,7 +1707,7 @@ mod tests {
         request.policy.blocked_hosts = vec!["bad.example.com".into()];
 
         let err = runner
-            .validate_runner(&request)
+            .validate(&request)
             .expect_err("blockedHosts is not yet supported");
         assert!(err.error_message.contains("blockedHosts"));
     }
@@ -1370,7 +1721,7 @@ mod tests {
         // the policy-field checks above don't fire. Skip when the host doesn't
         // expose the API.
         if BaseContainerRunner::is_base_container_api_present().is_ok() {
-            assert!(runner.validate_runner(&request).is_ok());
+            assert!(runner.validate(&request).is_ok());
         }
     }
 }
diff --git a/src/backends/appcontainer/common/src/dispatcher.rs b/src/backends/appcontainer/common/src/dispatcher.rs
index 6e85c09fa..48f62fedb 100644
--- a/src/backends/appcontainer/common/src/dispatcher.rs
+++ b/src/backends/appcontainer/common/src/dispatcher.rs
@@ -75,6 +75,7 @@ use crate::fallback_detector::{self, FallbackError, IsolationTier};
 use wxc_common::error::WxcError;
 use wxc_common::filesystem_dacl::{DaclError, DaclManager, RO_MASK, RW_MASK};
 use wxc_common::models::ExecutionRequest;
+use wxc_common::sandbox_process::Runner;
 use wxc_common::script_runner::ScriptRunner;
 
 /// Result of a successful dispatch decision: a phased handle holding a
@@ -287,7 +288,7 @@ pub fn dispatch_with_fallback(request: &ExecutionRequest) -> Result<Dispatched,
             // opaque principal `Experimental_CreateProcessInSandbox`
             // actually runs the child under; a mismatch would render
             // the ACEs inert and silently un-enforce `deniedPaths`.
-            let runner: Box<dyn ScriptRunner> = Box::new(BaseContainerRunner::new());
+            let runner: Box<dyn ScriptRunner> = Box::new(Runner::new(BaseContainerRunner::new()));
             (runner, None)
         }
         IsolationTier::AppContainerBfs => {
@@ -297,9 +298,9 @@ pub fn dispatch_with_fallback(request: &ExecutionRequest) -> Result<Dispatched,
             // common no-deny case skips both costs.
             let denied = paths_to_pathbufs(&request.policy.denied_paths);
             if denied.is_empty() {
-                let runner: Box<dyn ScriptRunner> = Box::new(
+                let runner: Box<dyn ScriptRunner> = Box::new(Runner::new(
                     AppContainerScriptRunner::with_filesystem_mode(FilesystemMode::Bfs),
-                );
+                ));
                 (runner, None)
             } else {
                 let sid =
@@ -308,12 +309,12 @@ pub fn dispatch_with_fallback(request: &ExecutionRequest) -> Result<Dispatched,
                 // Hand the derived SID string to the runner so it does
                 // not re-run `ConvertSidToStringSidW` for the firewall
                 // principal-id lookup.
-                let runner: Box<dyn ScriptRunner> = Box::new(
+                let runner: Box<dyn ScriptRunner> = Box::new(Runner::new(
                     AppContainerScriptRunner::with_filesystem_mode_and_sid_string(
                         FilesystemMode::Bfs,
                         sid,
                     ),
-                );
+                ));
                 (runner, mgr)
             }
         }
@@ -342,12 +343,12 @@ pub fn dispatch_with_fallback(request: &ExecutionRequest) -> Result<Dispatched,
             let denied = paths_to_pathbufs(&request.policy.denied_paths);
             let sid = derive_sid_string(&container_name(request)).map_err(DispatchError::Sid)?;
             let mgr = build_t3_dacl(&sid, &readwrite, &readonly, &denied)?;
-            let runner: Box<dyn ScriptRunner> = Box::new(
+            let runner: Box<dyn ScriptRunner> = Box::new(Runner::new(
                 AppContainerScriptRunner::with_filesystem_mode_and_sid_string(
                     FilesystemMode::Dacl,
                     sid,
                 ),
-            );
+            ));
             (runner, Some(mgr))
         }
     };
diff --git a/src/backends/appcontainer/common/src/job_object.rs b/src/backends/appcontainer/common/src/job_object.rs
index fa83b48ff..2080d7ade 100644
--- a/src/backends/appcontainer/common/src/job_object.rs
+++ b/src/backends/appcontainer/common/src/job_object.rs
@@ -19,10 +19,11 @@ use std::sync::OnceLock;
 use windows::Win32::Foundation::{CloseHandle, HANDLE};
 use windows::Win32::System::JobObjects::{
     AssignProcessToJobObject, CreateJobObjectW, JobObjectBasicUIRestrictions,
-    SetInformationJobObject, JOBOBJECT_BASIC_UI_RESTRICTIONS, JOB_OBJECT_UILIMIT,
-    JOB_OBJECT_UILIMIT_DESKTOP, JOB_OBJECT_UILIMIT_DISPLAYSETTINGS, JOB_OBJECT_UILIMIT_EXITWINDOWS,
-    JOB_OBJECT_UILIMIT_GLOBALATOMS, JOB_OBJECT_UILIMIT_HANDLES, JOB_OBJECT_UILIMIT_READCLIPBOARD,
-    JOB_OBJECT_UILIMIT_SYSTEMPARAMETERS, JOB_OBJECT_UILIMIT_WRITECLIPBOARD,
+    SetInformationJobObject, TerminateJobObject, JOBOBJECT_BASIC_UI_RESTRICTIONS,
+    JOB_OBJECT_UILIMIT, JOB_OBJECT_UILIMIT_DESKTOP, JOB_OBJECT_UILIMIT_DISPLAYSETTINGS,
+    JOB_OBJECT_UILIMIT_EXITWINDOWS, JOB_OBJECT_UILIMIT_GLOBALATOMS, JOB_OBJECT_UILIMIT_HANDLES,
+    JOB_OBJECT_UILIMIT_READCLIPBOARD, JOB_OBJECT_UILIMIT_SYSTEMPARAMETERS,
+    JOB_OBJECT_UILIMIT_WRITECLIPBOARD,
 };
 use windows::Win32::System::SystemServices::JOB_OBJECT_UILIMIT_IME;
 use windows_core::PCWSTR;
@@ -273,6 +274,17 @@ impl UiJobObject {
         unsafe { AssignProcessToJobObject(self.handle, process_handle) }
             .map_err(|e| WxcError::Process(format!("AssignProcessToJobObject: {e}")))
     }
+
+    /// Terminate every process currently assigned to this job (the sandboxed
+    /// child and all of its descendants) with the given exit code. Used to
+    /// tree-kill a running sandbox. Best-effort: errors are ignored since the
+    /// processes may already have exited.
+    pub fn terminate(&self, exit_code: u32) {
+        // SAFETY: `self.handle` is a valid job handle owned by this struct.
+        unsafe {
+            let _ = TerminateJobObject(self.handle, exit_code);
+        }
+    }
 }
 
 impl Drop for UiJobObject {
diff --git a/src/backends/appcontainer/common/src/network_manager.rs b/src/backends/appcontainer/common/src/network_manager.rs
index 1f7c2b732..9abb2c342 100644
--- a/src/backends/appcontainer/common/src/network_manager.rs
+++ b/src/backends/appcontainer/common/src/network_manager.rs
@@ -28,20 +28,80 @@ pub enum DefaultPolicy {
     Block,
 }
 
+/// `RPC_E_CHANGED_MODE`: `CoInitializeEx` returns this when COM is already
+/// initialized on the calling thread with a *different* apartment model. The
+/// existing initialization is reused and must **not** be balanced by our own
+/// `CoUninitialize`.
+const RPC_E_CHANGED_MODE: u32 = 0x8001_0106;
+
+/// RAII guard for a per-call COM apartment on the **current** thread.
+///
+/// Every firewall operation creates one of these, does all of its COM work
+/// (`CoCreateInstance`, interface use, release) while it is alive, and lets it
+/// drop — running the matching `CoUninitialize` — before returning. Because no
+/// COM interface or apartment state is ever cached on [`NetworkManager`] across
+/// calls, teardown (`remove_firewall_rules`) can run on a *different* thread
+/// than setup (`apply_firewall_rules`) without ever using an interface from
+/// another apartment or pairing `CoInitializeEx`/`CoUninitialize` across
+/// threads. That self-containment is what makes the `unsafe impl Send` on the
+/// owning sandbox handle sound.
+struct ComApartment {
+    /// Whether *this* guard performed the initialization that it must balance
+    /// with `CoUninitialize`. `false` when COM was already initialized on this
+    /// thread under a different model (`RPC_E_CHANGED_MODE`).
+    owns_init: bool,
+}
+
+impl ComApartment {
+    /// Join (or initialize) an apartment-threaded COM apartment for the current
+    /// thread. `S_OK`/`S_FALSE` both count as an initialization this guard must
+    /// balance; `RPC_E_CHANGED_MODE` reuses an existing apartment without
+    /// taking ownership of its teardown.
+    fn new() -> Result<Self, WxcError> {
+        // SAFETY: `CoInitializeEx` is always safe to call; the matching
+        // `CoUninitialize` runs in `Drop` on this same thread when we own it.
+        let hr = unsafe { CoInitializeEx(None, COINIT_APARTMENTTHREADED) };
+        if hr.is_ok() {
+            Ok(Self { owns_init: true })
+        } else if hr.0 as u32 == RPC_E_CHANGED_MODE {
+            Ok(Self { owns_init: false })
+        } else {
+            Err(WxcError::Firewall(format!(
+                "CoInitializeEx failed: 0x{:08X}",
+                hr.0 as u32
+            )))
+        }
+    }
+}
+
+impl Drop for ComApartment {
+    fn drop(&mut self) {
+        if self.owns_init {
+            // SAFETY: balances the `CoInitializeEx` in `new` on the same thread.
+            unsafe { CoUninitialize() };
+        }
+    }
+}
+
 pub struct NetworkManager {
-    fw_policy: Option<INetFwPolicy2>,
     created_rule_names: Vec<String>,
-    com_initialized: bool,
     wsa_initialized: bool,
     proxy_coordinator: ProxyCoordinator,
 }
 
+/// Invariant context for creating firewall rules within a single
+/// `apply_firewall_rules` call: the firewall interface (valid only for the
+/// current COM apartment / thread) and the AppContainer principal the rules are
+/// scoped to. Bundled so the rule helpers stay within the argument-count lint.
+struct RuleContext<'a> {
+    fw_policy: &'a INetFwPolicy2,
+    principal_id: &'a str,
+}
+
 impl NetworkManager {
     pub fn new() -> Self {
         Self {
-            fw_policy: None,
             created_rule_names: Vec::new(),
-            com_initialized: false,
             wsa_initialized: false,
             proxy_coordinator: ProxyCoordinator::new(),
         }
@@ -84,7 +144,13 @@ impl NetworkManager {
             return Ok(true);
         }
 
-        self.initialize_firewall(logger)?;
+        // Open a COM apartment and create the firewall interface for the
+        // duration of *this* call only — nothing is cached on `self`. See
+        // [`ComApartment`] for why this self-containment matters.
+        let _com = ComApartment::new()?;
+        let fw_policy: INetFwPolicy2 =
+            unsafe { CoCreateInstance(&NetFwPolicy2, None, CLSCTX_INPROC_SERVER) }
+                .map_err(|e| WxcError::Firewall(format!("Failed to create NetFwPolicy2: {e}")))?;
         self.ensure_wsa_initialized(logger)?;
 
         let now = std::time::SystemTime::now()
@@ -100,43 +166,35 @@ impl NetworkManager {
             sanitized_principal_id.truncate(MAX_PRINCIPAL_ID_LEN);
         }
         let rule_prefix = format!("WXC_{}_{}", sanitized_principal_id, millis);
+        let ctx = RuleContext {
+            fw_policy: &fw_policy,
+            principal_id,
+        };
 
         if default_policy == DefaultPolicy::Block {
             let block_all_name = format!("{}_BlockAll", rule_prefix);
-            if !self.create_rule(
-                &block_all_name,
-                principal_id,
-                NET_FW_ACTION_BLOCK,
-                "",
-                logger,
-            )? {
+            if !self.create_rule(&ctx, &block_all_name, NET_FW_ACTION_BLOCK, "", logger)? {
                 return Ok(false);
             }
             self.created_rule_names.push(block_all_name);
             self.process_host_list(
+                &ctx,
                 &policy.allowed_hosts,
                 &rule_prefix,
-                principal_id,
                 NET_FW_ACTION_ALLOW,
                 "Allow",
                 logger,
             )?;
         } else {
             let allow_all_name = format!("{}_AllowAll", rule_prefix);
-            if !self.create_rule(
-                &allow_all_name,
-                principal_id,
-                NET_FW_ACTION_ALLOW,
-                "*",
-                logger,
-            )? {
+            if !self.create_rule(&ctx, &allow_all_name, NET_FW_ACTION_ALLOW, "*", logger)? {
                 return Ok(false);
             }
             self.created_rule_names.push(allow_all_name);
             self.process_host_list(
+                &ctx,
                 &policy.blocked_hosts,
                 &rule_prefix,
-                principal_id,
                 NET_FW_ACTION_BLOCK,
                 "Block",
                 logger,
@@ -148,9 +206,9 @@ impl NetworkManager {
 
     fn process_host_list(
         &mut self,
+        ctx: &RuleContext,
         hosts: &[String],
         rule_prefix: &str,
-        principal_id: &str,
         action: NET_FW_ACTION,
         action_name: &str,
         logger: &mut Logger,
@@ -169,7 +227,7 @@ impl NetworkManager {
             };
 
             let rule_name = format!("{}_{}_{}", rule_prefix, action_name, index);
-            match self.create_rule(&rule_name, principal_id, action, &ip_address, logger) {
+            match self.create_rule(ctx, &rule_name, action, &ip_address, logger) {
                 Ok(true) => {
                     self.created_rule_names.push(rule_name);
                 }
@@ -236,13 +294,19 @@ impl NetworkManager {
     }
 
     pub fn remove_firewall_rules(&mut self, logger: &mut Logger) -> Result<bool, WxcError> {
-        let fw_policy = match &self.fw_policy {
-            Some(p) => p.clone(),
-            None => {
-                logger.log_line("Firewall policy not initialized");
-                return Ok(false);
-            }
-        };
+        if self.created_rule_names.is_empty() {
+            return Ok(true);
+        }
+
+        // Re-acquire a fresh firewall interface in its own apartment on the
+        // current thread. Windows Firewall rules persist by name independently
+        // of the COM client that created them, so removal does not need (and
+        // must not reuse) the interface or apartment `apply_firewall_rules`
+        // used — which may have run on a different thread. See [`ComApartment`].
+        let _com = ComApartment::new()?;
+        let fw_policy: INetFwPolicy2 =
+            unsafe { CoCreateInstance(&NetFwPolicy2, None, CLSCTX_INPROC_SERVER) }
+                .map_err(|e| WxcError::Firewall(format!("Failed to create NetFwPolicy2: {e}")))?;
 
         let rules = unsafe { fw_policy.Rules() }
             .map_err(|e| WxcError::Firewall(format!("Failed to get firewall rules: {}", e)))?;
@@ -255,60 +319,10 @@ impl NetworkManager {
             }
         }
         self.created_rule_names.clear();
-        Ok(all_success)
-    }
-
-    fn initialize_firewall(&mut self, _logger: &mut Logger) -> Result<(), WxcError> {
-        if self.fw_policy.is_some() {
-            return Ok(());
-        }
-
-        let hr = unsafe { CoInitializeEx(None, COINIT_APARTMENTTHREADED) };
-        // CoInitializeEx returns HRESULT directly in windows 0.58
-        if hr.is_ok() {
-            self.com_initialized = true;
-        } else {
-            // RPC_E_CHANGED_MODE (0x80010106) means COM is already initialized
-            // with a different threading model — that's acceptable.
-            let code = hr.0 as u32;
-            if code == 0x80010106 {
-                self.com_initialized = false;
-            } else {
-                return Err(WxcError::Firewall(format!(
-                    "CoInitializeEx failed: 0x{:08X}",
-                    code
-                )));
-            }
-        }
-
-        match unsafe {
-            CoCreateInstance::<_, INetFwPolicy2>(&NetFwPolicy2, None, CLSCTX_INPROC_SERVER)
-        } {
-            Ok(policy) => {
-                self.fw_policy = Some(policy);
-                Ok(())
-            }
-            Err(e) => {
-                if self.com_initialized {
-                    unsafe { CoUninitialize() };
-                    self.com_initialized = false;
-                }
-                Err(WxcError::Firewall(format!(
-                    "Failed to create NetFwPolicy2: {}",
-                    e
-                )))
-            }
-        }
-    }
-
-    fn cleanup_firewall(&mut self) {
-        if let Some(policy) = self.fw_policy.take() {
-            drop(policy);
-        }
-        if self.com_initialized {
-            unsafe { CoUninitialize() };
-            self.com_initialized = false;
+        if !all_success {
+            logger.log_line("Warning: some firewall rules could not be removed");
         }
+        Ok(all_success)
     }
 
     fn ensure_wsa_initialized(&mut self, _logger: &mut Logger) -> Result<(), WxcError> {
@@ -336,18 +350,13 @@ impl NetworkManager {
 
     fn create_rule(
         &self,
+        ctx: &RuleContext,
         rule_name: &str,
-        principal_id: &str,
         action: NET_FW_ACTION,
         remote_addresses: &str,
         _logger: &mut Logger,
     ) -> Result<bool, WxcError> {
-        let fw_policy = self
-            .fw_policy
-            .as_ref()
-            .ok_or_else(|| WxcError::Firewall("Firewall policy not initialized".into()))?;
-
-        let rules = unsafe { fw_policy.Rules() }
+        let rules = unsafe { ctx.fw_policy.Rules() }
             .map_err(|e| WxcError::Firewall(format!("Failed to get firewall rules: {}", e)))?;
 
         let rule: windows::Win32::NetworkManagement::WindowsFirewall::INetFwRule =
@@ -366,7 +375,7 @@ impl NetworkManager {
                 .map_err(|e| WxcError::Firewall(format!("put_Description failed: {}", e)))?;
 
             rule3
-                .SetLocalAppPackageId(&BSTR::from(principal_id))
+                .SetLocalAppPackageId(&BSTR::from(ctx.principal_id))
                 .map_err(|e| WxcError::Firewall(format!("put_LocalAppPackageId failed: {}", e)))?;
 
             rule.SetDirection(NET_FW_RULE_DIR_OUT)
@@ -411,7 +420,10 @@ impl Default for NetworkManager {
 
 impl Drop for NetworkManager {
     fn drop(&mut self) {
-        self.cleanup_firewall();
+        // No COM state is cached across calls (each firewall op is
+        // apartment-self-contained), so there is nothing COM-related to undo
+        // here. Only the process-global Winsock refcount — which is
+        // thread-agnostic — needs balancing.
         self.cleanup_wsa();
     }
 }
@@ -528,9 +540,7 @@ mod tests {
     #[test]
     fn test_default_creates_new_manager() {
         let mgr = NetworkManager::default();
-        assert!(mgr.fw_policy.is_none());
         assert!(mgr.created_rule_names.is_empty());
-        assert!(!mgr.com_initialized);
         assert!(!mgr.wsa_initialized);
     }
 
diff --git a/src/backends/appcontainer/common/src/probe.rs b/src/backends/appcontainer/common/src/probe.rs
index c0eb3dec6..8d0be7023 100644
--- a/src/backends/appcontainer/common/src/probe.rs
+++ b/src/backends/appcontainer/common/src/probe.rs
@@ -63,7 +63,7 @@ pub struct ProbeFacts {
 }
 
 /// Host support for enforcing sandbox UI restrictions.
-#[derive(Serialize, Debug)]
+#[derive(Serialize, Debug, Clone)]
 #[serde(rename_all = "camelCase")]
 pub struct UiCapabilitySupport {
     /// Whether the host can block reads from the clipboard.
diff --git a/src/backends/bubblewrap/common/src/bwrap_runner.rs b/src/backends/bubblewrap/common/src/bwrap_runner.rs
index ba888e98f..2c297872b 100644
--- a/src/backends/bubblewrap/common/src/bwrap_runner.rs
+++ b/src/backends/bubblewrap/common/src/bwrap_runner.rs
@@ -26,20 +26,24 @@
 //! without root.
 
 use std::fmt::Write as FmtWrite;
-use std::process::{Command, Stdio};
-use std::time::{Duration, Instant};
+use std::os::unix::process::CommandExt;
+use std::process::{Child, ChildStdin, Command, Stdio};
+use std::time::Duration;
 
 use lxc_common::network_iptables::NetworkIptablesManager;
+use wxc_common::interruptible_reader::{wrap_pipe, InterruptibleReader, ReadCanceller};
 use wxc_common::linux_proxy_coordinator::LinuxProxyCoordinator;
 use wxc_common::logger::Logger;
 use wxc_common::models::{ExecutionRequest, NetworkEnforcementMode, ScriptResponse};
-use wxc_common::script_runner::ScriptRunner;
+use wxc_common::sandbox_process::{
+    boxed_closer, cancel_and_join_discard, group_kill, spawn_discard, take_boxed_read,
+    take_boxed_write, wait_with_timeout, SandboxBackend, SandboxProcess, StdioMode, StreamCloser,
+    WaitError,
+};
+use wxc_common::validator::validate_common;
 
 use crate::bwrap_command;
 
-/// Polling interval for timeout enforcement.
-const POLL_INTERVAL_MS: u64 = 500;
-
 /// Bubblewrap sandbox runner. Uses only shared `ContainerPolicy` fields —
 /// no backend-specific config struct required.
 #[derive(Default)]
@@ -62,8 +66,8 @@ impl BubblewrapScriptRunner {
     }
 }
 
-impl ScriptRunner for BubblewrapScriptRunner {
-    fn validate_runner(&self, request: &ExecutionRequest) -> Result<(), ScriptResponse> {
+impl SandboxBackend for BubblewrapScriptRunner {
+    fn validate(&self, request: &ExecutionRequest) -> Result<(), ScriptResponse> {
         // User-input validation runs before the environmental `bwrap`
         // probe so config errors are reported deterministically even on
         // hosts without bwrap installed.
@@ -85,14 +89,6 @@ impl ScriptRunner for BubblewrapScriptRunner {
             ));
         }
 
-        // Reject timeouts smaller than our polling interval.
-        if request.script_timeout > 0 && u64::from(request.script_timeout) < POLL_INTERVAL_MS {
-            return Err(ScriptResponse::error(&format!(
-                "script_timeout {}ms is below the minimum of {}ms",
-                request.script_timeout, POLL_INTERVAL_MS
-            )));
-        }
-
         if !Self::is_bwrap_available() {
             return Err(ScriptResponse::error(
                 "Bubblewrap (bwrap) is not installed or not on PATH. \
@@ -103,16 +99,34 @@ impl ScriptRunner for BubblewrapScriptRunner {
         Ok(())
     }
 
-    fn execute(&mut self, request: &ExecutionRequest, logger: &mut Logger) -> ScriptResponse {
+    fn spawn(
+        &mut self,
+        request: &ExecutionRequest,
+        logger: &mut Logger,
+        stdio: StdioMode,
+    ) -> Result<Box<dyn SandboxProcess>, ScriptResponse> {
+        validate_common(request)?;
+        self.validate(request)?;
+        let child = self.spawn_bwrap(request, logger, stdio)?;
+        Ok(Box::new(BubblewrapSandboxProcess::new(child)))
+    }
+}
+
+impl BubblewrapScriptRunner {
+    /// Set up networking and spawn `bwrap`, returning a [`BwrapChild`] wrapped
+    /// by the [`SandboxProcess`] handle. With [`StdioMode::Pipes`] the child's
+    /// stdio is piped (the caller drives it); with [`StdioMode::Inherit`] it
+    /// inherits the binary's stdio (a TTY when the binary has one). Only in
+    /// `Pipes` mode is bwrap placed in its own process group (for tree-kill).
+    fn spawn_bwrap(
+        &self,
+        request: &ExecutionRequest,
+        logger: &mut Logger,
+        stdio: StdioMode,
+    ) -> Result<BwrapChild, ScriptResponse> {
         // 1. Start the network proxy if configured. Must happen before
         //    arg-building so the proxy's loopback address can be injected as
         //    HTTP_PROXY / HTTPS_PROXY into the sandbox environment.
-        //
-        //    Pass the request's `default_network_policy` through so that a
-        //    config of `{ defaultPolicy: "block", proxy: {...}, allowedHosts:
-        //    [] }` actually denies-by-default at the proxy layer (otherwise
-        //    the empty allow list + no iptables + no --unshare-net would let
-        //    everything through).
         let mut proxy = LinuxProxyCoordinator::new();
         if request.policy.network_proxy.is_enabled() {
             if let Err(err) = proxy.start(
@@ -123,10 +137,10 @@ impl ScriptRunner for BubblewrapScriptRunner {
                 request.policy.default_network_policy.clone(),
                 logger,
             ) {
-                return ScriptResponse::error(&format!(
+                return Err(ScriptResponse::error(&format!(
                     "Bubblewrap: failed to start network proxy: {}",
                     err
-                ));
+                )));
             }
         }
 
@@ -148,7 +162,7 @@ impl ScriptRunner for BubblewrapScriptRunner {
             request.container_id.clone()
         };
 
-        let mut fw_manager = if needs_iptables {
+        let fw_manager = if needs_iptables {
             let _ = writeln!(
                 logger,
                 "Bubblewrap: applying iptables rules for host-level network filtering"
@@ -158,16 +172,16 @@ impl ScriptRunner for BubblewrapScriptRunner {
                 Ok(true) => {}
                 Ok(false) => {
                     proxy.stop(logger);
-                    return ScriptResponse::error(
+                    return Err(ScriptResponse::error(
                         "Bubblewrap: failed to apply iptables firewall rules.",
-                    );
+                    ));
                 }
                 Err(e) => {
                     proxy.stop(logger);
-                    return ScriptResponse::error(&format!(
+                    return Err(ScriptResponse::error(&format!(
                         "Bubblewrap: network policy error: {}",
                         e
-                    ));
+                    )));
                 }
             }
             Some(mgr)
@@ -178,77 +192,253 @@ impl ScriptRunner for BubblewrapScriptRunner {
         // 4. Spawn `bwrap`.
         let mut command = Command::new("bwrap");
         command.args(&args);
-        command
-            .stdin(Stdio::null())
-            .stdout(Stdio::piped())
-            .stderr(Stdio::piped());
+        match stdio {
+            StdioMode::Pipes => {
+                command
+                    .stdin(Stdio::piped())
+                    .stdout(Stdio::piped())
+                    .stderr(Stdio::piped());
+            }
+            StdioMode::Inherit => {
+                // The child (bwrap, PID 1 of the sandbox) inherits the binary's
+                // stdio directly — a TTY when the binary has one.
+                command
+                    .stdin(Stdio::inherit())
+                    .stdout(Stdio::inherit())
+                    .stderr(Stdio::inherit());
+            }
+        }
+        // Pipes mode: put bwrap in its own process group so a timeout / `kill()`
+        // can tree-kill it with a single `killpg` without touching the host's
+        // group. Inherit mode keeps bwrap in the executor's group (so it retains
+        // the controlling terminal and can't be SIGTTIN-stopped reading it); it's
+        // PID 1 of the new pid namespace (`--unshare-pid`), so killing the root
+        // process alone tears the whole sandbox down.
+        let group = stdio == StdioMode::Pipes;
+        if group {
+            command.process_group(0);
+        }
 
         let mut child = match command.spawn() {
             Ok(process) => process,
             Err(error) => {
+                let mut fw_manager = fw_manager;
                 cleanup_iptables(&mut fw_manager, logger);
                 proxy.stop(logger);
-                return ScriptResponse::error(&format!(
+                return Err(ScriptResponse::error(&format!(
                     "Bubblewrap: failed to spawn bwrap: {}",
                     error
-                ));
+                )));
             }
         };
 
-        // 5. Drain stdout/stderr in background threads to avoid pipe-buffer
-        //    deadlock.
-        let stdout_handle = child
-            .stdout
-            .take()
-            .map(|r| std::thread::spawn(move || read_to_string(r)));
-        let stderr_handle = child
-            .stderr
-            .take()
-            .map(|r| std::thread::spawn(move || read_to_string(r)));
-
-        // 6. Wait with optional timeout.
+        let (stdin, stdout, stderr) = match stdio {
+            StdioMode::Pipes => (child.stdin.take(), child.stdout.take(), child.stderr.take()),
+            StdioMode::Inherit => (None, None, None),
+        };
+        // Wrap the pipe reads so the caller can abandon a stream a backgrounded
+        // descendant is holding open (see `SandboxProcess::stdout_closer`)
+        // without killing the child. On failure, tear down the per-run network
+        // state we already set up before returning the error.
+        let (stdout, stdout_canceller, stderr, stderr_canceller) =
+            match (wrap_pipe(stdout), wrap_pipe(stderr)) {
+                (Ok((out, out_canceller)), Ok((err, err_canceller))) => {
+                    (out, out_canceller, err, err_canceller)
+                }
+                (out_result, err_result) => {
+                    let _ = child.kill();
+                    let _ = child.wait();
+                    let mut fw_manager = fw_manager;
+                    cleanup_iptables(&mut fw_manager, logger);
+                    proxy.stop(logger);
+                    let error = out_result.err().or(err_result.err());
+                    return Err(ScriptResponse::error(&format!(
+                        "Bubblewrap: failed to wrap stdio pipes: {}",
+                        error.map_or_else(|| "unknown error".to_string(), |e| e.to_string()),
+                    )));
+                }
+            };
         let timeout = if request.script_timeout == 0 {
             None
         } else {
             Some(Duration::from_millis(u64::from(request.script_timeout)))
         };
 
-        let exit_status = match wait_with_timeout(&mut child, timeout) {
-            Ok(status) => status,
+        Ok(BwrapChild {
+            child,
+            stdin,
+            stdout,
+            stderr,
+            stdout_canceller,
+            stderr_canceller,
+            group,
+            proxy,
+            fw_manager,
+            timeout,
+        })
+    }
+}
+
+/// A spawned `bwrap` sandbox: the child process, its parent-side pipe ends,
+/// and the per-run network proxy / iptables state torn down once it exits.
+struct BwrapChild {
+    child: Child,
+    stdin: Option<ChildStdin>,
+    stdout: Option<InterruptibleReader>,
+    stderr: Option<InterruptibleReader>,
+    /// Cancellers for the stdout/stderr reads, kept so the `SandboxProcess`
+    /// closers can mint a [`StreamCloser`] even after the stream is taken.
+    stdout_canceller: Option<ReadCanceller>,
+    stderr_canceller: Option<ReadCanceller>,
+    /// `true` when bwrap leads its own process group (`Pipes` mode), so
+    /// termination signals the whole group; `false` for `Inherit` mode, where
+    /// killing bwrap (pid 1 of the namespace) alone tears the sandbox down.
+    group: bool,
+    proxy: LinuxProxyCoordinator,
+    fw_manager: Option<NetworkIptablesManager>,
+    timeout: Option<Duration>,
+}
+
+impl BwrapChild {
+    /// Tear down per-run network state (iptables rules + proxy). Idempotent at
+    /// the manager level.
+    fn cleanup(&mut self, logger: &mut Logger) {
+        cleanup_iptables(&mut self.fw_manager, logger);
+        self.proxy.stop(logger);
+    }
+}
+
+/// A running `bwrap` sandbox exposed as a [`SandboxProcess`]. Wraps the spawned
+/// [`BwrapChild`] (child, pipes, and per-run network state), tearing the network
+/// state down once the child exits.
+struct BubblewrapSandboxProcess {
+    inner: BwrapChild,
+    teardown_done: bool,
+}
+
+impl BubblewrapSandboxProcess {
+    fn new(child: BwrapChild) -> Self {
+        Self {
+            inner: child,
+            teardown_done: false,
+        }
+    }
+
+    fn run_teardown(&mut self) {
+        if self.teardown_done {
+            return;
+        }
+        self.teardown_done = true;
+        let mut logger = Logger::new(wxc_common::logger::Mode::Buffer);
+        self.inner.cleanup(&mut logger);
+    }
+}
+
+impl SandboxProcess for BubblewrapSandboxProcess {
+    fn take_stdin(&mut self) -> Option<Box<dyn std::io::Write + Send>> {
+        take_boxed_write(&mut self.inner.stdin)
+    }
+
+    fn take_stdout(&mut self) -> Option<Box<dyn std::io::Read + Send>> {
+        take_boxed_read(&mut self.inner.stdout)
+    }
+
+    fn take_stderr(&mut self) -> Option<Box<dyn std::io::Read + Send>> {
+        take_boxed_read(&mut self.inner.stderr)
+    }
+
+    fn stdout_closer(&self) -> Option<Box<dyn StreamCloser>> {
+        boxed_closer(&self.inner.stdout_canceller)
+    }
+
+    fn stderr_closer(&self) -> Option<Box<dyn StreamCloser>> {
+        boxed_closer(&self.inner.stderr_canceller)
+    }
+
+    fn try_wait(&mut self) -> std::io::Result<Option<i32>> {
+        Ok(self
+            .inner
+            .child
+            .try_wait()?
+            .map(|status| status.code().unwrap_or(-1)))
+    }
+
+    fn id(&self) -> u32 {
+        self.inner.child.id()
+    }
+
+    fn kill(&mut self) -> std::io::Result<()> {
+        // No-op once the child has exited and been reaped: its pid/pgid can be
+        // recycled, so signaling it could hit an unrelated process (group). A
+        // reaped `Child` returns its cached status here without a syscall.
+        if self.inner.child.try_wait()?.is_some() {
+            return Ok(());
+        }
+        if self.inner.group {
+            // Pipes mode: bwrap leads its own process group — tree-kill it.
+            group_kill(&mut self.inner.child)
+        } else {
+            // Inherit mode: bwrap shares the executor's group (no
+            // `process_group(0)`), so a group-kill would hit the executor.
+            // bwrap is pid 1 of the sandbox pid namespace, so killing the root
+            // alone tears the whole namespace (every descendant) down.
+            self.inner.child.kill()
+        }
+    }
+
+    fn wait(&mut self) -> std::io::Result<i32> {
+        // Close our copy of any not-taken stdin so the child sees EOF.
+        self.inner.stdin.take();
+
+        // Drain (and discard) any not-taken stdout/stderr concurrently so the
+        // child can't block on a full pipe (taken streams are the caller's
+        // responsibility).
+        let stdout_thread = spawn_discard(self.inner.stdout.take());
+        let stderr_thread = spawn_discard(self.inner.stderr.take());
+
+        let result = match wait_with_timeout(&mut self.inner.child, self.inner.timeout) {
+            Ok(status) => Ok(status.code().unwrap_or(-1)),
             Err(WaitError::Timeout) => {
-                let _ = child.kill();
-                let _ = child.wait();
-                cleanup_iptables(&mut fw_manager, logger);
-                proxy.stop(logger);
-                return ScriptResponse {
-                    exit_code: -1,
-                    standard_out: join_reader(stdout_handle),
-                    standard_err: join_reader(stderr_handle),
-                    error_message: format!(
-                        "Bubblewrap: script timed out after {}ms",
-                        request.script_timeout
-                    ),
-                    ..Default::default()
-                };
+                // Tree-kill so descendants die too and release any stdout/stderr
+                // pipe write-ends (else the drain threads below could block).
+                // `kill()` group-kills in Pipes mode, and in Inherit mode kills
+                // bwrap (pid 1 of the namespace), which tears the sandbox down.
+                let _ = self.kill();
+                let _ = self.inner.child.wait();
+                Err(std::io::Error::new(
+                    std::io::ErrorKind::TimedOut,
+                    "Bubblewrap: script timed out",
+                ))
             }
             Err(WaitError::Io(error)) => {
-                cleanup_iptables(&mut fw_manager, logger);
-                proxy.stop(logger);
-                return ScriptResponse::error(&format!("Bubblewrap: wait failed: {}", error));
+                // The child may still be alive; kill+reap it before
+                // `run_teardown()` removes the iptables/proxy enforcement out
+                // from under it.
+                let _ = self.kill();
+                let _ = self.inner.child.wait();
+                Err(std::io::Error::other(format!(
+                    "Bubblewrap: wait failed: {error}"
+                )))
             }
         };
 
-        // 7. Collect output and clean up.
-        cleanup_iptables(&mut fw_manager, logger);
-        proxy.stop(logger);
+        cancel_and_join_discard(stdout_thread, &self.inner.stdout_canceller);
+        cancel_and_join_discard(stderr_thread, &self.inner.stderr_canceller);
+        self.run_teardown();
+        result
+    }
+}
 
-        ScriptResponse {
-            exit_code: exit_status.code().unwrap_or(-1),
-            standard_out: join_reader(stdout_handle),
-            standard_err: join_reader(stderr_handle),
-            error_message: String::new(),
-            ..Default::default()
-        }
+impl Drop for BubblewrapSandboxProcess {
+    fn drop(&mut self) {
+        // Kill and reap the child *before* removing network enforcement —
+        // otherwise an abandoned-but-running sandbox would keep egressing after
+        // its iptables/proxy rules were torn down, and the child would leak as
+        // a zombie. `kill()` group-kills in Pipes mode and kills bwrap (PID 1 of
+        // the pid namespace) alone in Inherit mode; then we reap.
+        let _ = self.kill();
+        let _ = self.inner.child.wait();
+        self.run_teardown();
     }
 }
 
@@ -276,48 +466,6 @@ fn cleanup_iptables(manager: &mut Option<NetworkIptablesManager>, logger: &mut L
     }
 }
 
-// -- I/O helpers (mirrors seatbelt_runner) --------------------------------
-
-fn read_to_string<R: std::io::Read>(mut reader: R) -> String {
-    let mut buffer = String::new();
-    let _ = reader.read_to_string(&mut buffer);
-    buffer
-}
-
-fn join_reader(handle: Option<std::thread::JoinHandle<String>>) -> String {
-    match handle {
-        Some(h) => h.join().unwrap_or_default(),
-        None => String::new(),
-    }
-}
-
-enum WaitError {
-    Timeout,
-    Io(std::io::Error),
-}
-
-fn wait_with_timeout(
-    child: &mut std::process::Child,
-    timeout: Option<Duration>,
-) -> Result<std::process::ExitStatus, WaitError> {
-    let Some(deadline) = timeout.map(|d| Instant::now() + d) else {
-        return child.wait().map_err(WaitError::Io);
-    };
-
-    loop {
-        match child.try_wait() {
-            Ok(Some(status)) => return Ok(status),
-            Ok(None) => {
-                if Instant::now() >= deadline {
-                    return Err(WaitError::Timeout);
-                }
-                std::thread::sleep(Duration::from_millis(POLL_INTERVAL_MS));
-            }
-            Err(e) => return Err(WaitError::Io(e)),
-        }
-    }
-}
-
 #[cfg(test)]
 mod tests {
     use super::*;
@@ -340,7 +488,7 @@ mod tests {
         req.experimental_enabled = false;
 
         let runner = BubblewrapScriptRunner::new();
-        let err = runner.validate_runner(&req).unwrap_err();
+        let err = runner.validate(&req).unwrap_err();
         assert!(
             err.error_message.contains("builtinTestServer")
                 && err.error_message.contains("--experimental"),
@@ -357,7 +505,7 @@ mod tests {
         req.script_code = String::new();
 
         let runner = BubblewrapScriptRunner::new();
-        let err = runner.validate_runner(&req).unwrap_err();
+        let err = runner.validate(&req).unwrap_err();
         assert!(err.error_message.contains("script_code is empty"));
     }
 }
diff --git a/src/backends/seatbelt/common/Cargo.toml b/src/backends/seatbelt/common/Cargo.toml
index 378e6fda1..fb7029ae6 100644
--- a/src/backends/seatbelt/common/Cargo.toml
+++ b/src/backends/seatbelt/common/Cargo.toml
@@ -12,7 +12,3 @@ wxc_common = { workspace = true }
 
 [target.'cfg(target_os = "macos")'.dependencies]
 libc = { workspace = true }
-# Pty bridge is shared with the LXC backend via mxc_pty; that crate owns
-# the openpty + pre_exec (setsid + TIOCSCTTY) plumbing and the libc/nix
-# deps that go with it.
-mxc_pty = { workspace = true }
diff --git a/src/backends/seatbelt/common/src/profile_builder.rs b/src/backends/seatbelt/common/src/profile_builder.rs
index effb4c03d..df4ae160f 100644
--- a/src/backends/seatbelt/common/src/profile_builder.rs
+++ b/src/backends/seatbelt/common/src/profile_builder.rs
@@ -59,11 +59,11 @@ pub fn build_profile(request: &ExecutionRequest) -> Result<String, String> {
     // Filesystem — read-only system paths every process needs.
     out.push_str(SYSTEM_READ_ALLOW);
 
-    // Pseudo-terminal access — the seatbelt runner attaches the inner
-    // shell to a freshly-allocated pty (see `mxc_pty::run_with_pty`) so
-    // callers can stream output and the shell sees a real TTY. Without
-    // these rules, `isatty()` / `tcgetattr()` / `ttyname()` fail with
-    // EPERM because the kernel calls block on the secondary fd.
+    // Pseudo-terminal access — when the executor binary runs under a pty
+    // the sandboxed shell inherits that TTY, so it sees a real terminal
+    // and calls `isatty()` / `tcgetattr()` / `ttyname()` against it.
+    // Without these rules, those calls fail with EPERM because the sandbox
+    // denies the underlying kernel calls on the secondary fd.
     out.push_str(TTY_ALLOW);
 
     // Policy-derived allow rules.
@@ -136,7 +136,7 @@ const SYSTEM_READ_ALLOW: &str = "\
 /// at startup, and read access to `/dev/fd` for the `/dev/stdout` etc.
 /// indirection some tools use.
 const TTY_ALLOW: &str = "\
-;; --- pseudo-terminal access (pty bridge in mxc_pty::run_with_pty) ---
+;; --- pseudo-terminal access (inherited TTY when run under a pty) ---
 (allow file-read* file-write* file-ioctl
     (literal \"/dev/tty\")
     (regex #\"^/dev/ttys[0-9]+$\"))
@@ -422,7 +422,7 @@ fn write_extra_seatbelt_rules(out: &mut String, request: &ExecutionRequest) {
 
 /// Expand a leading `~` or `~/` to the current user's home directory.
 /// Returns an error if `HOME` is not set and the path requires expansion.
-fn expand_tilde(path: &str) -> Result<String, String> {
+pub(crate) fn expand_tilde(path: &str) -> Result<String, String> {
     if path == "~" || path.starts_with("~/") {
         let home = std::env::var("HOME").map_err(|_| {
             format!("HOME environment variable not set; cannot expand '{path}' in seatbelt profile")
diff --git a/src/backends/seatbelt/common/src/seatbelt_runner.rs b/src/backends/seatbelt/common/src/seatbelt_runner.rs
index 1c6f63655..49db23aff 100644
--- a/src/backends/seatbelt/common/src/seatbelt_runner.rs
+++ b/src/backends/seatbelt/common/src/seatbelt_runner.rs
@@ -7,9 +7,11 @@
 //! The sandbox is applied via `sandbox_init()` inside `Command::pre_exec`,
 //! then `/bin/sh` is exec'd directly. The child inherits the parent's
 //! Mach bootstrap namespace so both CLI commands and GUI applications
-//! (when `guiAccess = true`) work correctly. The exec path uses
-//! [`mxc_pty::run_with_pty`] so the inner shell sees a real TTY and the
-//! host can stream its output as it arrives.
+//! (when `guiAccess = true`) work correctly. The exec path returns a
+//! `SandboxProcess` whose stdio follows the requested `StdioMode`:
+//! `Inherit` gives the child the host's own stdio (a real TTY when the
+//! binary runs under a pty), while `Pipes` exposes stdout/stderr/stdin
+//! handles the caller can stream.
 //!
 //! For apps that require LaunchServices (`launchMethod: "open"`), the runner
 //! writes a sandbox helper script and launches the target app via `open -n -W`,
@@ -23,12 +25,17 @@ use std::fmt::Write as FmtWrite;
 use std::fs;
 use std::os::unix::process::CommandExt;
 use std::process::{Command, Stdio};
-use std::time::{Duration, Instant};
+use std::time::Duration;
 
-use mxc_pty::{run_with_pty, PtyOptions, PtyOutcome};
+use wxc_common::interruptible_reader::{wrap_pipe, InterruptibleReader, ReadCanceller};
 use wxc_common::logger::Logger;
 use wxc_common::models::{ExecutionRequest, LaunchMethod, ScriptResponse};
-use wxc_common::script_runner::ScriptRunner;
+use wxc_common::sandbox_process::{
+    boxed_closer, cancel_and_join_discard, group_kill, spawn_discard, take_boxed_read,
+    take_boxed_write, wait_with_timeout, SandboxBackend, SandboxProcess, StdioMode, StreamCloser,
+    WaitError,
+};
+use wxc_common::validator::validate_common;
 
 use crate::profile_builder::build_profile;
 
@@ -65,10 +72,8 @@ impl SeatbeltScriptRunner {
     }
 }
 
-const POLL_INTERVAL_MS: u64 = 500;
-
-impl ScriptRunner for SeatbeltScriptRunner {
-    fn validate_runner(&self, request: &ExecutionRequest) -> Result<(), ScriptResponse> {
+impl SandboxBackend for SeatbeltScriptRunner {
+    fn validate(&self, request: &ExecutionRequest) -> Result<(), ScriptResponse> {
         // Seatbelt cannot filter network by hostname — reject blockedHosts
         // rather than silently allowing traffic the user expects to be denied.
         if !request.policy.blocked_hosts.is_empty() {
@@ -80,40 +85,27 @@ impl ScriptRunner for SeatbeltScriptRunner {
             ));
         }
 
-        // Reject timeouts that are too small for our polling interval to
-        // enforce accurately.
-        if request.script_timeout > 0 && u64::from(request.script_timeout) < POLL_INTERVAL_MS {
-            return Err(error_response(format!(
-                "scriptTimeout {}ms is below the minimum of {}ms",
-                request.script_timeout, POLL_INTERVAL_MS
-            )));
-        }
-
         Ok(())
     }
 
-    fn execute(&mut self, request: &ExecutionRequest, logger: &mut Logger) -> ScriptResponse {
-        // 1. Build the Seatbelt profile from the policy.
-        let profile = match build_profile(request) {
-            Ok(p) => p,
-            Err(e) => {
-                return ScriptResponse {
-                    exit_code: -1,
-                    standard_out: String::new(),
-                    standard_err: String::new(),
-                    error_message: e,
-                    ..Default::default()
-                }
-            }
-        };
+    fn spawn(
+        &mut self,
+        request: &ExecutionRequest,
+        logger: &mut Logger,
+        stdio: StdioMode,
+    ) -> Result<Box<dyn SandboxProcess>, ScriptResponse> {
+        validate_common(request)?;
+        self.validate(request)?;
 
-        // Determine launch method from seatbelt config.
+        // Build the Seatbelt profile from the policy.
+        let profile = build_profile(request).map_err(error_response)?;
+
+        // Determine launch method + GUI access from the seatbelt config.
         let launch_method = request
             .seatbelt
             .as_ref()
             .map(|s| s.launch_method.clone())
             .unwrap_or_default();
-
         let gui_access = request
             .seatbelt
             .as_ref()
@@ -121,252 +113,388 @@ impl ScriptRunner for SeatbeltScriptRunner {
             .unwrap_or(false);
 
         match launch_method {
-            LaunchMethod::Exec => self.execute_exec(&profile, request, gui_access, logger),
-            LaunchMethod::Open => self.execute_open(&profile, request, logger),
+            LaunchMethod::Exec => spawn_exec(&profile, request, gui_access, stdio, logger),
+            LaunchMethod::Open => spawn_open(&profile, request, stdio, logger),
         }
     }
 }
 
-impl SeatbeltScriptRunner {
-    /// Standard execution path: fork → sandbox_init → exec.
-    /// When `gui_access` is true, stdio is inherited for GUI app compatibility.
-    fn execute_exec(
-        &self,
-        profile: &str,
-        request: &ExecutionRequest,
-        gui_access: bool,
-        logger: &mut Logger,
-    ) -> ScriptResponse {
-        let mut command = match build_sandbox_command(profile, &request.script_code, logger) {
-            Ok(cmd) => cmd,
-            Err(resp) => return resp,
-        };
-
-        // Environment setup.
-        if !request.env.is_empty() {
-            command.env_clear();
-            for kv in &request.env {
-                if let Some((key, value)) = kv.split_once('=') {
-                    command.env(key, value);
-                }
-            }
-        }
+/// Exec launch path: fork → sandbox_init → exec `/bin/sh -c <script>`. With
+/// [`StdioMode::Pipes`] the child gets pipes and leads its own session (so the
+/// caller can tree-terminate via the process group); with
+/// [`StdioMode::Inherit`] it inherits the process's stdio (a TTY when the
+/// binary has one) and stays in the binary's session. `gui_access` apps require
+/// inherited stdio and cannot stream.
+fn spawn_exec(
+    profile: &str,
+    request: &ExecutionRequest,
+    gui_access: bool,
+    stdio: StdioMode,
+    logger: &mut Logger,
+) -> Result<Box<dyn SandboxProcess>, ScriptResponse> {
+    if gui_access && stdio == StdioMode::Pipes {
+        return Err(error_response(
+            "Seatbelt guiAccess requires inherited stdio and cannot stream over pipes".to_string(),
+        ));
+    }
 
-        if !request.working_directory.is_empty() {
-            command.current_dir(&request.working_directory);
+    // Pipes → own session (setsid) so a process-group tree-kill never touches
+    // the host. Inherit/GUI → keep the binary's session and controlling
+    // terminal so the child sees a TTY exactly when the binary does.
+    let new_session = stdio == StdioMode::Pipes;
+    // Inherit mode with a finite timeout: put the child in its own process group
+    // (same session, so it keeps the controlling terminal) so the timeout branch
+    // can tree-kill its descendants instead of only the direct `/bin/sh`. A
+    // backgrounded group reading the inherited TTY can be SIGTTIN-stopped, so
+    // this is limited to timeout-bounded runs, which are inherently
+    // non-interactive.
+    let new_group = stdio == StdioMode::Inherit && timeout_from(request).is_some();
+    let mut command = build_sandbox_command(
+        profile,
+        &request.script_code,
+        new_session,
+        new_group,
+        logger,
+    )?;
+
+    // Always start from a cleared environment so untrusted sandboxed code never
+    // inherits the host's env.
+    apply_clean_environment(&mut command, request);
+
+    // Working directory. Also export `PWD` so the child's `getcwd()` uses its
+    // fast `$PWD` path (a single stat) instead of walking parent directories
+    // the sandbox may not let it read — which otherwise leaks
+    // "getcwd: ... Operation not permitted" to stderr.
+    let cwd = resolve_working_directory(request);
+    command.current_dir(&cwd);
+    command.env("PWD", &cwd);
+
+    match stdio {
+        StdioMode::Pipes => {
+            command
+                .stdin(Stdio::piped())
+                .stdout(Stdio::piped())
+                .stderr(Stdio::piped());
         }
-
-        if gui_access {
-            // GUI apps need inherited stdio for window interaction.
+        StdioMode::Inherit => {
+            // The child inherits the binary's stdio directly (a TTY when the
+            // binary has one) — no separate pty bridge.
             command
                 .stdin(Stdio::inherit())
                 .stdout(Stdio::inherit())
                 .stderr(Stdio::inherit());
+        }
+    }
 
-            // Spawn manually — run_with_pty is not appropriate for GUI mode.
-            let mut child = match command.spawn() {
-                Ok(process) => process,
-                Err(error) => {
-                    let msg = if error.kind() == std::io::ErrorKind::PermissionDenied {
-                        format!(
-                            "failed to spawn sandboxed process (sandbox_init likely rejected \
-                             the profile — check stderr for details): {error}"
-                        )
-                    } else {
-                        format!("failed to spawn sandboxed process: {error}")
-                    };
-                    return error_response(msg);
-                }
-            };
-
-            let timeout = if request.script_timeout == 0 {
-                None
-            } else {
-                Some(Duration::from_millis(u64::from(request.script_timeout)))
-            };
-
-            match wait_with_timeout(&mut child, timeout) {
-                Ok(status) => ScriptResponse {
-                    exit_code: status.code().unwrap_or(-1),
-                    ..Default::default()
-                },
-                Err(WaitError::Timeout) => {
-                    let _ = child.kill();
-                    let _ = child.wait();
-                    ScriptResponse {
-                        exit_code: -1,
-                        error_message: format!(
-                            "Seatbelt: process timed out after {}ms",
-                            request.script_timeout
-                        ),
-                        ..Default::default()
-                    }
-                }
-                Err(WaitError::Io(error)) => error_response(format!("wait failed: {error}")),
+    let mut child = command
+        .spawn()
+        .map_err(|error| error_response(spawn_error(&error)))?;
+
+    let (stdin, stdout, stderr) = match stdio {
+        StdioMode::Pipes => (child.stdin.take(), child.stdout.take(), child.stderr.take()),
+        StdioMode::Inherit => (None, None, None),
+    };
+
+    // Wrap the pipe reads so the caller can abandon a stream a backgrounded
+    // descendant is holding open (see `SandboxProcess::stdout_closer`), without
+    // killing the child. On failure, don't orphan the already-spawned sandboxed
+    // process — kill and reap it before returning the error.
+    let (stdout, stdout_canceller, stderr, stderr_canceller) =
+        match (wrap_pipe(stdout), wrap_pipe(stderr)) {
+            (Ok((out, out_canceller)), Ok((err, err_canceller))) => {
+                (out, out_canceller, err, err_canceller)
             }
-        } else {
-            // CLI mode: hand off to the shared PTY bridge so the inner shell
-            // sees a real TTY and the host can stream output as it arrives.
-            let timeout = if request.script_timeout == 0 {
-                None
-            } else {
-                Some(Duration::from_millis(u64::from(request.script_timeout)))
-            };
-
-            let options = PtyOptions {
-                timeout,
-                ..PtyOptions::default()
-            };
-
-            match run_with_pty(command, options) {
-                Ok(PtyOutcome::Exited(status)) => ScriptResponse {
-                    exit_code: status.code().unwrap_or(-1),
-                    ..Default::default()
-                },
-                Ok(PtyOutcome::TimedOut) => {
-                    let msg = format!(
-                        "Seatbelt: script timed out after {}ms",
-                        request.script_timeout
-                    );
-                    let _ = writeln!(logger, "{msg}");
-                    error_response(msg)
-                }
-                Err(error) => error_response(format!("Seatbelt: {error}")),
+            (out_result, err_result) => {
+                let _ = child.kill();
+                let _ = child.wait();
+                let error = out_result.err().or(err_result.err());
+                return Err(error_response(format!(
+                    "Seatbelt: failed to wrap stdio pipes: {}",
+                    error.map_or_else(|| "unknown error".to_string(), |e| e.to_string()),
+                )));
             }
-        }
+        };
+
+    Ok(Box::new(SeatbeltSandboxProcess {
+        child,
+        stdin,
+        stdout,
+        stderr,
+        stdout_canceller,
+        stderr_canceller,
+        timeout: timeout_from(request),
+        group: new_session || new_group,
+        cleanup: Vec::new(),
+    }))
+}
+
+/// LaunchServices launch path: write a sandbox helper + `.command` file and run
+/// it in Terminal.app via `open -n -W`. Required for Apple system apps with
+/// Launch Constraints (e.g. Terminal.app). The sandboxed shell runs inside
+/// Terminal, not as our child, so there are no pipes to stream — only the
+/// `open -W` waiter — and [`StdioMode::Pipes`] is rejected.
+fn spawn_open(
+    profile: &str,
+    request: &ExecutionRequest,
+    stdio: StdioMode,
+    logger: &mut Logger,
+) -> Result<Box<dyn SandboxProcess>, ScriptResponse> {
+    if stdio == StdioMode::Pipes {
+        return Err(error_response(
+            "Seatbelt launchMethod 'open' launches Terminal.app and cannot stream over pipes"
+                .to_string(),
+        ));
     }
 
-    /// LaunchServices execution path: write a sandbox helper, launch via
-    /// `open -n -W`. Required for Apple system apps with Launch Constraints
-    /// (e.g. Terminal.app).
-    fn execute_open(
-        &self,
-        profile: &str,
-        request: &ExecutionRequest,
-        logger: &mut Logger,
-    ) -> ScriptResponse {
-        let _ = writeln!(
-            logger,
-            "Seatbelt: using LaunchServices (open) launch method"
-        );
-
-        // 1. Write the profile to a secure temp file.
-        let profile_path = match write_secure_temp_file("mxc_sb_profile_", profile, 0o600) {
-            Ok(p) => p,
-            Err(e) => return error_response(format!("failed to write profile: {e}")),
-        };
+    let _ = writeln!(
+        logger,
+        "Seatbelt: using LaunchServices (open) launch method"
+    );
 
-        // 2. Build environment exports for the helper script.
-        let mut env_exports = String::new();
-        for kv in &request.env {
-            if let Some((key, value)) = kv.split_once('=') {
-                // Validate key is a safe shell identifier to prevent injection.
-                if !key.chars().all(|c| c.is_ascii_alphanumeric() || c == '_')
-                    || key.is_empty()
-                    || key.starts_with(|c: char| c.is_ascii_digit())
-                {
-                    continue; // Skip invalid env var names
-                }
-                // Shell-escape the value.
-                let escaped = value.replace('\'', "'\\''");
-                let _ = writeln!(env_exports, "export {key}='{escaped}'");
+    // 1. Write the profile to a secure temp file.
+    let profile_path = match write_secure_temp_file("mxc_sb_profile_", profile, 0o600) {
+        Ok(p) => p,
+        Err(e) => return Err(error_response(format!("failed to write profile: {e}"))),
+    };
+
+    // 2. Build environment exports for the helper script.
+    let mut env_exports = String::new();
+    for kv in &request.env {
+        if let Some((key, value)) = kv.split_once('=') {
+            // Validate key is a safe shell identifier to prevent injection.
+            if !key.chars().all(|c| c.is_ascii_alphanumeric() || c == '_')
+                || key.is_empty()
+                || key.starts_with(|c: char| c.is_ascii_digit())
+            {
+                continue; // Skip invalid env var names
             }
+            // Shell-escape the value.
+            let escaped = value.replace('\'', "'\\''");
+            let _ = writeln!(env_exports, "export {key}='{escaped}'");
         }
+    }
 
-        // 3. Create the sandbox helper script.
-        // This script is executed inside the terminal app. It:
-        //   a) Calls sandbox-exec with the profile file to sandbox the shell
-        //   b) Execs the user's command inside the sandbox
-        let script_code = &request.script_code;
-        let helper_content = format!(
-            "#!/bin/sh\n\
-             # MXC Seatbelt sandbox helper — auto-generated, do not edit.\n\
-             {env_exports}\
-             exec /usr/bin/sandbox-exec -f '{profile_path}' /bin/sh -c 'clear; {script_escaped}'\n",
-            profile_path = profile_path,
-            script_escaped = script_code.replace('\'', "'\\''"),
-        );
-
-        let helper_path = match write_secure_temp_file("mxc_sb_helper_", &helper_content, 0o700) {
-            Ok(p) => p,
-            Err(e) => {
-                let _ = fs::remove_file(&profile_path);
-                return error_response(format!("failed to write helper script: {e}"));
-            }
-        };
+    // 3. Create the sandbox helper script.
+    // This script is executed inside the terminal app. It:
+    //   a) Calls sandbox-exec with the profile file to sandbox the shell
+    //   b) Execs the user's command inside the sandbox
+    let script_code = &request.script_code;
+    let helper_content = format!(
+        "#!/bin/sh\n\
+         # MXC Seatbelt sandbox helper — auto-generated, do not edit.\n\
+         {env_exports}\
+         exec /usr/bin/sandbox-exec -f '{profile_path}' /bin/sh -c 'clear; {script_escaped}'\n",
+        profile_path = profile_path,
+        script_escaped = script_code.replace('\'', "'\\''"),
+    );
+
+    let helper_path = match write_secure_temp_file("mxc_sb_helper_", &helper_content, 0o700) {
+        Ok(p) => p,
+        Err(e) => {
+            let _ = fs::remove_file(&profile_path);
+            return Err(error_response(format!(
+                "failed to write helper script: {e}"
+            )));
+        }
+    };
 
-        // 4. Create the .command file that Terminal will execute.
-        let command_content = format!("#!/bin/sh\nexec '{}'\n", helper_path);
-        let command_path = match write_secure_temp_file("mxc_sb_launch_", &command_content, 0o700) {
-            Ok(p) => {
-                // Rename to .command extension so Terminal recognizes it.
-                let new_path = format!("{p}.command");
-                if let Err(e) = fs::rename(&p, &new_path) {
-                    let _ = fs::remove_file(&p);
-                    let _ = fs::remove_file(&profile_path);
-                    let _ = fs::remove_file(&helper_path);
-                    return error_response(format!("failed to rename to .command: {e}"));
-                }
-                new_path
-            }
-            Err(e) => {
+    // 4. Create the .command file that Terminal will execute.
+    let command_content = format!("#!/bin/sh\nexec '{}'\n", helper_path);
+    let command_path = match write_secure_temp_file("mxc_sb_launch_", &command_content, 0o700) {
+        Ok(p) => {
+            // Rename to .command extension so Terminal recognizes it.
+            let new_path = format!("{p}.command");
+            if let Err(e) = fs::rename(&p, &new_path) {
+                let _ = fs::remove_file(&p);
                 let _ = fs::remove_file(&profile_path);
                 let _ = fs::remove_file(&helper_path);
-                return error_response(format!("failed to write .command file: {e}"));
+                return Err(error_response(format!("failed to rename to .command: {e}")));
             }
-        };
+            new_path
+        }
+        Err(e) => {
+            let _ = fs::remove_file(&profile_path);
+            let _ = fs::remove_file(&helper_path);
+            return Err(error_response(format!(
+                "failed to write .command file: {e}"
+            )));
+        }
+    };
 
-        let _ = writeln!(logger, "Seatbelt: launching via: open -n -W {command_path}");
+    let _ = writeln!(logger, "Seatbelt: launching via: open -n -W {command_path}");
+
+    // 5. Launch via `open -n -W`.
+    let child = match Command::new("open")
+        .args(["-n", "-W", "-a", "Terminal", &command_path])
+        .stdin(Stdio::null())
+        .stdout(Stdio::null())
+        .stderr(Stdio::null())
+        .spawn()
+    {
+        Ok(c) => c,
+        Err(e) => {
+            cleanup_files(&[&profile_path, &helper_path, &command_path]);
+            return Err(error_response(format!("failed to launch via open: {e}")));
+        }
+    };
 
-        // 5. Launch via `open -n -W`.
-        let mut child = match Command::new("open")
-            .args(["-n", "-W", "-a", "Terminal", &command_path])
-            .stdin(Stdio::null())
-            .stdout(Stdio::null())
-            .stderr(Stdio::null())
-            .spawn()
-        {
-            Ok(c) => c,
-            Err(e) => {
-                cleanup_files(&[&profile_path, &helper_path, &command_path]);
-                return error_response(format!("failed to launch via open: {e}"));
-            }
-        };
+    // The `open -W` process is the thing to wait on; the sandboxed shell runs
+    // inside Terminal. No streamable stdio; the temp files are removed once the
+    // handle's `wait()` (or drop) runs.
+    Ok(Box::new(SeatbeltSandboxProcess {
+        child,
+        stdin: None,
+        stdout: None,
+        stderr: None,
+        stdout_canceller: None,
+        stderr_canceller: None,
+        timeout: timeout_from(request),
+        group: false,
+        cleanup: vec![profile_path, helper_path, command_path],
+    }))
+}
+
+/// A running Seatbelt-sandboxed process: the child plus, for the pipes path,
+/// its parent-side pipe ends. See [`SandboxProcess`] for the contract.
+struct SeatbeltSandboxProcess {
+    child: std::process::Child,
+    /// Pipe ends — `Some` only for [`StdioMode::Pipes`]; `None` for inherited
+    /// stdio / Open mode (the streams are the binary's own, or detached). The
+    /// reads are wrapped so they can be cancelled out-of-band (see the
+    /// `*_canceller` fields).
+    stdin: Option<std::process::ChildStdin>,
+    stdout: Option<InterruptibleReader>,
+    stderr: Option<InterruptibleReader>,
+    /// Cancellers for the stdout/stderr reads (`Some` alongside the pipe ends),
+    /// kept so [`stdout_closer`](SandboxProcess::stdout_closer) /
+    /// [`stderr_closer`](SandboxProcess::stderr_closer) can mint closers even
+    /// after the stream has been taken.
+    stdout_canceller: Option<ReadCanceller>,
+    stderr_canceller: Option<ReadCanceller>,
+    timeout: Option<Duration>,
+    /// The child leads its own process group (`setsid` for Pipes, `setpgid` for
+    /// timed Inherit), so `kill` signals the whole group; `false` for untimed Inherit / Open.
+    group: bool,
+    /// Temp files to remove once the child exits (Open mode); empty otherwise.
+    cleanup: Vec<String>,
+}
+
+impl SeatbeltSandboxProcess {
+    /// Remove the Open-mode temp files (profile / helper / `.command`) once the
+    /// child has exited. Idempotent — drains `cleanup` — so it is safe to call
+    /// from both `wait()` and `drop`.
+    fn run_cleanup(&mut self) {
+        if self.cleanup.is_empty() {
+            return;
+        }
+        let files = std::mem::take(&mut self.cleanup);
+        let refs: Vec<&str> = files.iter().map(String::as_str).collect();
+        cleanup_files(&refs);
+    }
+}
+
+impl SandboxProcess for SeatbeltSandboxProcess {
+    fn take_stdin(&mut self) -> Option<Box<dyn std::io::Write + Send>> {
+        take_boxed_write(&mut self.stdin)
+    }
+
+    fn take_stdout(&mut self) -> Option<Box<dyn std::io::Read + Send>> {
+        take_boxed_read(&mut self.stdout)
+    }
+
+    fn take_stderr(&mut self) -> Option<Box<dyn std::io::Read + Send>> {
+        take_boxed_read(&mut self.stderr)
+    }
+
+    fn stdout_closer(&self) -> Option<Box<dyn StreamCloser>> {
+        boxed_closer(&self.stdout_canceller)
+    }
+
+    fn stderr_closer(&self) -> Option<Box<dyn StreamCloser>> {
+        boxed_closer(&self.stderr_canceller)
+    }
+
+    fn try_wait(&mut self) -> std::io::Result<Option<i32>> {
+        Ok(self
+            .child
+            .try_wait()?
+            .map(|status| status.code().unwrap_or(-1)))
+    }
+
+    fn id(&self) -> u32 {
+        self.child.id()
+    }
 
-        // 6. Wait for the terminal to close.
-        let timeout = if request.script_timeout == 0 {
-            None
+    fn kill(&mut self) -> std::io::Result<()> {
+        // No-op once the child has exited and been reaped: its pid/pgid can be
+        // recycled, so signaling it could hit an unrelated process (group). A
+        // reaped `Child` returns its cached status here without a syscall.
+        if self.child.try_wait()?.is_some() {
+            return Ok(());
+        }
+        if self.group {
+            // The child leads its own process group — signal the whole group so
+            // sandboxed descendants are terminated too.
+            group_kill(&mut self.child)
         } else {
-            Some(Duration::from_millis(u64::from(request.script_timeout)))
-        };
+            // Untimed inherited / Open mode: a single process sharing the binary's
+            // process group, so signal just it (a group-kill would hit the
+            // binary itself).
+            self.child.kill()
+        }
+    }
+
+    fn wait(&mut self) -> std::io::Result<i32> {
+        // Close our copy of any not-taken stdin so the child sees EOF and is
+        // not blocked waiting for input the caller never intends to send.
+        self.stdin.take();
 
-        let result = match wait_with_timeout(&mut child, timeout) {
-            Ok(status) => ScriptResponse {
-                exit_code: status.code().unwrap_or(-1),
-                ..Default::default()
-            },
+        // Drain (and discard) any not-taken stdout/stderr concurrently so the
+        // child can't block on a full pipe (taken streams are the caller's
+        // responsibility).
+        let stdout_thread = spawn_discard(self.stdout.take());
+        let stderr_thread = spawn_discard(self.stderr.take());
+
+        let result = match wait_with_timeout(&mut self.child, self.timeout) {
+            Ok(status) => Ok(status.code().unwrap_or(-1)),
             Err(WaitError::Timeout) => {
-                let _ = child.kill();
-                let _ = child.wait();
-                ScriptResponse {
-                    exit_code: -1,
-                    error_message: format!(
-                        "Seatbelt: terminal timed out after {}ms",
-                        request.script_timeout
-                    ),
-                    ..Default::default()
-                }
+                // Timed out — terminate now (`kill()` SIGKILLs the group or the
+                // lone child) and reap the zombie.
+                let _ = self.kill();
+                let _ = self.child.wait();
+                Err(std::io::Error::new(
+                    std::io::ErrorKind::TimedOut,
+                    "Seatbelt: process timed out",
+                ))
+            }
+            Err(WaitError::Io(error)) => {
+                // The child may still be running: kill+reap it (don't orphan
+                // the sandbox) before returning.
+                let _ = self.kill();
+                let _ = self.child.wait();
+                Err(std::io::Error::other(format!("wait failed: {error}")))
             }
-            Err(WaitError::Io(error)) => error_response(format!("wait failed: {error}")),
         };
 
-        // 7. Cleanup temp files.
-        cleanup_files(&[&profile_path, &helper_path, &command_path]);
-
+        cancel_and_join_discard(stdout_thread, &self.stdout_canceller);
+        cancel_and_join_discard(stderr_thread, &self.stderr_canceller);
+        self.run_cleanup();
         result
     }
 }
 
+impl Drop for SeatbeltSandboxProcess {
+    fn drop(&mut self) {
+        // Don't leak a running sandboxed process (and its group) or a zombie if
+        // the handle is dropped without `wait()`, and remove any temp files.
+        // `kill()` is idempotent (its `try_wait` guard no-ops once the child has
+        // exited).
+        let _ = self.kill();
+        let _ = self.child.wait();
+        self.run_cleanup();
+    }
+}
+
 /// Build a `Command` that applies the sandbox via `sandbox_init()` in
 /// `pre_exec`, then execs `/bin/sh -c <script>`. The child inherits the
 /// parent's Mach bootstrap namespace, so both CLI and GUI applications
@@ -381,6 +509,8 @@ impl SeatbeltScriptRunner {
 fn build_sandbox_command(
     profile: &str,
     script_code: &str,
+    new_session: bool,
+    new_group: bool,
     logger: &mut Logger,
 ) -> Result<Command, ScriptResponse> {
     let profile_cstr = CString::new(profile)
@@ -391,6 +521,38 @@ fn build_sandbox_command(
     let mut command = Command::new(DEFAULT_SHELL);
     command.arg("-c").arg(script_code);
 
+    // When requested (streaming path), put the child in its own session /
+    // process group via `setsid()` so a caller can tree-kill it with a single
+    // `killpg` without touching the host's process group. This runs before
+    // `sandbox_init` so the detach happens regardless of the profile.
+    //
+    // SAFETY: `setsid` is async-signal-safe and runs after fork(), before
+    // exec(); the child is not a process-group leader at this point, so it
+    // succeeds. Failure is non-fatal (the caller's negative-pid kill simply
+    // targets a group that does not exist).
+    if new_session {
+        unsafe {
+            command.pre_exec(|| {
+                libc::setsid();
+                Ok(())
+            });
+        }
+    } else if new_group {
+        // Inherit-with-timeout: a new process group within the *existing*
+        // session, so the child keeps the controlling terminal yet can be
+        // tree-killed via `killpg(pgid)` on timeout.
+        //
+        // SAFETY: `setpgid` is async-signal-safe and runs after fork(), before
+        // exec(); the child is not yet a group leader, so it succeeds. Failure
+        // is non-fatal (the timeout kill then targets the direct child only).
+        unsafe {
+            command.pre_exec(|| {
+                libc::setpgid(0, 0);
+                Ok(())
+            });
+        }
+    }
+
     // SAFETY: The closure runs after fork(), before exec(). We only call
     // sandbox_init with a pre-allocated CString — no Rust allocations
     // happen inside the closure. sandbox_init is used in this fork+exec
@@ -428,32 +590,70 @@ fn error_response(message: String) -> ScriptResponse {
     }
 }
 
-enum WaitError {
-    Timeout,
-    Io(std::io::Error),
+/// The optional run timeout — `None` when `scriptTimeout` is 0 (wait forever).
+fn timeout_from(request: &ExecutionRequest) -> Option<Duration> {
+    if request.script_timeout == 0 {
+        None
+    } else {
+        Some(Duration::from_millis(u64::from(request.script_timeout)))
+    }
 }
 
-/// Wait for `child` to exit, polling at `POLL_INTERVAL_MS` intervals if a
-/// timeout is set. We poll manually rather than adding an async runtime
-/// dependency since the runner is otherwise synchronous.
-fn wait_with_timeout(
-    child: &mut std::process::Child,
-    timeout: Option<Duration>,
-) -> Result<std::process::ExitStatus, WaitError> {
-    let Some(deadline) = timeout.map(|duration| Instant::now() + duration) else {
-        return child.wait().map_err(WaitError::Io);
-    };
+/// Message for a `Command::spawn` failure, calling out the likely cause
+/// (`sandbox_init` rejecting the profile) when the OS reports a permission
+/// error.
+fn spawn_error(error: &std::io::Error) -> String {
+    if error.kind() == std::io::ErrorKind::PermissionDenied {
+        format!(
+            "failed to spawn sandboxed process (sandbox_init likely rejected \
+             the profile — check stderr for details): {error}"
+        )
+    } else {
+        format!("failed to spawn sandboxed process: {error}")
+    }
+}
 
-    loop {
-        match child.try_wait() {
-            Ok(Some(status)) => return Ok(status),
-            Ok(None) => {
-                if Instant::now() >= deadline {
-                    return Err(WaitError::Timeout);
-                }
-                std::thread::sleep(Duration::from_millis(POLL_INTERVAL_MS));
-            }
-            Err(error) => return Err(WaitError::Io(error)),
+/// Resolve the working directory for the sandboxed child.
+///
+/// An explicit `working_directory` always wins. Otherwise — rather than
+/// inheriting the host process's cwd, which under the deny-by-default Seatbelt
+/// profile may be inaccessible and make `getcwd()` fail (leaking a
+/// "getcwd: ... Operation not permitted" line on the child's stderr) — we pick
+/// a directory the profile is guaranteed to allow: the first readwrite path,
+/// else the first readonly path, else `/` (always readable per the baseline).
+fn resolve_working_directory(request: &ExecutionRequest) -> String {
+    if !request.working_directory.is_empty() {
+        return request.working_directory.clone();
+    }
+    let default = request
+        .policy
+        .readwrite_paths
+        .first()
+        .or_else(|| request.policy.readonly_paths.first())
+        .cloned()
+        .unwrap_or_else(|| "/".to_string());
+    // The default may be a `~`/`~/…` policy path; expand it exactly as the
+    // sandbox profile does so `Command::current_dir` never gets a literal `~`
+    // (which would fail). Fall back to the unexpanded value if `HOME` is unset.
+    crate::profile_builder::expand_tilde(&default).unwrap_or(default)
+}
+
+/// Baseline `PATH` for the sandboxed child. We always start from a cleared
+/// environment (so the host process's env — cloud creds, API tokens — never
+/// leaks into untrusted sandboxed code), which means we must supply a default
+/// `PATH` for the `/bin/sh` wrapper and common tools to resolve.
+const DEFAULT_SANDBOX_PATH: &str = "/usr/bin:/bin:/usr/sbin:/sbin";
+
+/// Populate `command`'s environment from a cleared baseline: never inherit the
+/// host environment (matching the bubblewrap `--clearenv` and AppContainer
+/// clean-block behaviour). Sets a default `PATH`, then the request's vars
+/// (which may override `PATH`). `PWD` is set separately alongside the cwd.
+fn apply_clean_environment(command: &mut Command, request: &ExecutionRequest) {
+    command.env_clear();
+    command.env("PATH", DEFAULT_SANDBOX_PATH);
+    for kv in &request.env {
+        if let Some((key, value)) = kv.split_once('=') {
+            command.env(key, value);
         }
     }
 }
@@ -529,7 +729,7 @@ mod tests {
         let mut request = base_request();
         request.policy.blocked_hosts = vec!["evil.example.com".into()];
         let runner = SeatbeltScriptRunner::new();
-        let response = runner.validate_runner(&request).unwrap_err();
+        let response = runner.validate(&request).unwrap_err();
         assert_eq!(response.exit_code, -1);
         assert!(response.error_message.contains("blockedHosts"));
         assert!(response.error_message.contains("cannot be enforced"));
diff --git a/src/core/lxc/src/main.rs b/src/core/lxc/src/main.rs
index ad720514c..7c1bddf6f 100644
--- a/src/core/lxc/src/main.rs
+++ b/src/core/lxc/src/main.rs
@@ -19,6 +19,8 @@ use lxc_common::lxc_runner::LxcScriptRunner;
 use lxc_common::signal_cleanup;
 #[cfg(feature = "microvm")]
 use nanvix_runner::NanVixScriptRunner;
+#[cfg(target_os = "linux")]
+use wxc_common::sandbox_process::Runner;
 
 #[derive(Parser)]
 #[command(name = "lxc-exec", about = "Linux Container Executor")]
@@ -254,7 +256,7 @@ fn main() {
         ContainmentBackend::Bubblewrap => {
             #[cfg(target_os = "linux")]
             {
-                Box::new(BubblewrapScriptRunner::new())
+                Box::new(Runner::new(BubblewrapScriptRunner::new()))
             }
             #[cfg(not(target_os = "linux"))]
             {
diff --git a/src/core/mxc_darwin/src/main.rs b/src/core/mxc_darwin/src/main.rs
index b862a75b1..048ca3aca 100644
--- a/src/core/mxc_darwin/src/main.rs
+++ b/src/core/mxc_darwin/src/main.rs
@@ -125,8 +125,9 @@ fn main() {
 #[cfg(target_os = "macos")]
 fn run_seatbelt(request: &ExecutionRequest, logger: &mut Logger) -> ! {
     use seatbelt_common::seatbelt_runner::SeatbeltScriptRunner;
+    use wxc_common::sandbox_process::Runner;
 
-    let mut runner = SeatbeltScriptRunner::new();
+    let mut runner = Runner::new(SeatbeltScriptRunner::new());
     let run_start = Instant::now();
     let response = runner.run(request, logger);
     let run_elapsed = run_start.elapsed();
diff --git a/src/core/wxc/src/main.rs b/src/core/wxc/src/main.rs
index 018b38b0d..17a5011b7 100644
--- a/src/core/wxc/src/main.rs
+++ b/src/core/wxc/src/main.rs
@@ -26,6 +26,7 @@ use wxc_common::diagnostic::DiagnosticConfig;
 use wxc_common::logger::{Logger, Mode};
 use wxc_common::models::{ContainmentBackend, ExecutionRequest, ScriptResponse};
 use wxc_common::mxc_error::{MxcError, ResponseEnvelope};
+use wxc_common::sandbox_process::Runner;
 use wxc_common::script_runner::{handle_dry_run_exit, ScriptRunner};
 #[cfg(all(target_os = "windows", feature = "isolation_session"))]
 use wxc_common::state_aware_dispatch::dispatch_state_aware;
@@ -853,7 +854,7 @@ fn main() {
                     }
                 }
             } else {
-                Box::new(AppContainerScriptRunner::new())
+                Box::new(Runner::new(AppContainerScriptRunner::new()))
             }
         }
         ContainmentBackend::Wslc => {
diff --git a/src/testing/wxc_e2e_tests/tests/e2e_seatbelt_characterization.rs b/src/testing/wxc_e2e_tests/tests/e2e_seatbelt_characterization.rs
index 4ee0b5cff..228787eb0 100644
--- a/src/testing/wxc_e2e_tests/tests/e2e_seatbelt_characterization.rs
+++ b/src/testing/wxc_e2e_tests/tests/e2e_seatbelt_characterization.rs
@@ -3,17 +3,14 @@
 
 //! Seatbelt (macOS) executor **characterization** tests.
 //!
-//! These lock in the *current* run-to-completion behavior of the `mxc-exec-mac`
-//! executor before the unified `SandboxBackend`/`Runner` refactor (the risky
-//! part of the `mxc` library work) lands. They assert what the code does
-//! **today**, not what it ideally should do.
+//! These pin the run-to-completion behavior of the `mxc-exec-mac` executor
+//! under the unified `SandboxBackend`/`Runner` design, exercised end-to-end.
 //!
-//! Two of them — `inherits_host_env_when_process_env_empty` and
-//! `runs_in_launcher_cwd_when_process_cwd_empty` — pin behaviors that the
-//! unification was observed to change (it makes Seatbelt unconditionally
-//! `env_clear()` and rewrite the working directory). If a future refactor turns
-//! these RED, that is the signal to confirm the change is intentional and
-//! documented as a breaking change — not an accident.
+//! Two of them — `clears_host_env_when_process_env_empty` and
+//! `runs_in_first_readwrite_path_when_process_cwd_empty` — assert behaviors the
+//! unification deliberately changed from the pre-refactor executor: Seatbelt now
+//! unconditionally `env_clear()`s and resolves an empty working directory to a
+//! policy path. If they turn RED, the env/cwd model has drifted.
 //!
 //! They run in the existing macOS CI job (`cargo test --target
 //! aarch64-apple-darwin`) with no extra infrastructure: `sandbox-exec` needs no
@@ -92,33 +89,34 @@ fn seatbelt_streams_stdout() {
 
 /// CHARACTERIZES CURRENT BEHAVIOR (regression guard).
 ///
-/// With an empty `process.env`, the Seatbelt exec path does *not* clear the
-/// environment today, so the sandboxed child inherits the launcher's env. The
-/// unification refactor makes Seatbelt always `env_clear()` — which will turn
-/// this test RED. That is the intended early-warning signal.
+/// With an empty `process.env`, the Seatbelt exec path starts the child from a
+/// *cleared* environment (`env_clear()` plus a default `PATH`), so the
+/// launcher's environment — which may hold cloud creds / API tokens — never
+/// leaks into untrusted sandboxed code. This matches Bubblewrap's `--clearenv`
+/// model (see `bubblewrap_clears_host_env_by_default`); if it ever turns RED the
+/// env model has drifted.
 #[test]
-fn seatbelt_inherits_host_env_when_process_env_empty() {
+fn seatbelt_clears_host_env_when_process_env_empty() {
     if !has_platform_exec() {
         return;
     }
-    let marker = "CHAR_SEATBELT_ENV_INHERIT_4b7c2";
+    let marker = "CHAR_SEATBELT_ENV_CLEAR_4b7c2";
     let result = run_platform_config_value(
-        "seatbelt env inherit",
-        &config(
-            "env-inherit",
-            "printf 'MARKER=[%s]\\n' \"$MXC_CHAR_MARKER\"",
-        ),
+        "seatbelt env clear",
+        &config("env-clear", "printf 'MARKER=[%s]\\n' \"$MXC_CHAR_MARKER\""),
         &[("MXC_CHAR_MARKER", marker)],
         None,
     );
     assert_eq!(result.code, Some(0), "stderr: {}", result.stderr);
+    let out = result.combined_output();
     assert!(
-        result
-            .combined_output()
-            .contains(&format!("MARKER=[{marker}]")),
-        "expected the child to inherit MXC_CHAR_MARKER from the launcher \
-         (current Seatbelt behavior with empty process.env). Output:\n{}",
-        result.combined_output()
+        out.contains("MARKER=[]"),
+        "expected a cleared env (MARKER=[]); the child must not inherit the \
+         launcher's environment when process.env is empty. Output:\n{out}"
+    );
+    assert!(
+        !out.contains(marker),
+        "host env marker leaked into the sandbox. Output:\n{out}"
     );
 }
 
@@ -142,30 +140,31 @@ fn seatbelt_applies_requested_env() {
 
 /// CHARACTERIZES CURRENT BEHAVIOR (regression guard).
 ///
-/// With an empty `process.cwd`, the Seatbelt exec path does *not* change
-/// directory today, so the sandboxed child runs in the launcher's working
-/// directory. The unification refactor rewrites cwd to a policy path or `/` —
-/// which will turn this test RED.
+/// With an empty `process.cwd`, the Seatbelt exec path no longer inherits the
+/// launcher's working directory (which the deny-by-default profile may forbid,
+/// making the child's `getcwd()` fail and leak a "getcwd: Operation not
+/// permitted" line). Instead it resolves the cwd to the first readwrite policy
+/// path — a directory the profile is guaranteed to allow. `write_dir` is listed
+/// first, so the relative-path probe lands there, not in the launcher cwd.
 ///
 /// We observe the cwd by having the child create a file via a relative path
 /// (a shell redirection) and checking which directory it lands in — this
 /// avoids `pwd`/`realpath`, which the default Seatbelt profile denies for
-/// arbitrary temp paths. `write_dir` is a second writable policy path that is
-/// *not* the launcher cwd, so a refactor that rewrites cwd to a policy path
-/// would drop the probe there (or elsewhere) instead of in `launch_dir`.
+/// arbitrary temp paths. `launch_dir` is a second writable policy path that is
+/// *not* the resolved cwd, so the probe must not land there.
 #[test]
-fn seatbelt_runs_in_launcher_cwd_when_process_cwd_empty() {
+fn seatbelt_runs_in_first_readwrite_path_when_process_cwd_empty() {
     if !has_platform_exec() {
         return;
     }
     let write_dir = fs::canonicalize(unique_tempdir("cwd-write")).expect("canonicalize");
     let launch_dir = fs::canonicalize(unique_tempdir("cwd-launch")).expect("canonicalize");
-    let probe = "char_cwd_inherit_probe.txt";
-    let mut cfg = config("cwd-inherit", &format!("echo CHAR_OK > {probe}"));
+    let probe = "char_cwd_default_probe.txt";
+    let mut cfg = config("cwd-default", &format!("echo CHAR_OK > {probe}"));
     cfg["filesystem"] = json!({
         "readwritePaths": [write_dir.to_string_lossy(), launch_dir.to_string_lossy()]
     });
-    let result = run_platform_config_value("seatbelt cwd inherit", &cfg, &[], Some(&launch_dir));
+    let result = run_platform_config_value("seatbelt cwd default", &cfg, &[], Some(&launch_dir));
     let in_launch = launch_dir.join(probe).exists();
     let in_write = write_dir.join(probe).exists();
     let _ = fs::remove_dir_all(&launch_dir);
@@ -177,10 +176,10 @@ fn seatbelt_runs_in_launcher_cwd_when_process_cwd_empty() {
         result.combined_output()
     );
     assert!(
-        in_launch && !in_write,
-        "expected the probe in the launcher cwd {} (current behavior with empty \
-         process.cwd); in_launch={in_launch} in_write={in_write}\n{}",
-        launch_dir.display(),
+        in_write && !in_launch,
+        "expected the probe in the first readwrite policy path {} (resolved cwd \
+         with empty process.cwd); in_write={in_write} in_launch={in_launch}\n{}",
+        write_dir.display(),
         result.combined_output()
     );
 }

From 5ced2376211ae1e77968e9256920891fd17c6268 Mon Sep 17 00:00:00 2001
From: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
Date: Wed, 24 Jun 2026 09:57:13 -0300
Subject: [PATCH 3/9] feat(mxc-sdk): add the importable in-process sandbox
 library crate
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Add `mxc-sdk` (lib `mxc_sdk`), a Rust library for starting MXC sandboxes
in-process without a pty, built on the SandboxBackend interfaces and the
unified backends from the previous PRs. Callers stream a sandboxed process
without shelling out to the executor binaries or depending on the TypeScript
SDK.

Public surface (crate-owned types — `wxc_common` stays an implementation
detail):
- `build_request(&SandboxPolicy)` -> `SandboxRequest`, then `spawn_sandbox`
  -> `Sandbox`: a handle for bidirectional stdio (`take_stdin`/`take_stdout`/
  `take_stderr`), `try_wait`, `id`, `kill` (process-tree), and `wait` ->
  `WaitOutcome` (`Exited(i32)` | `TimedOut`), plus stdout/stderr closers.
- `Error` / `ErrorCode` mirror the wire-format error one-for-one.
- `mxc_sdk::policy` ports the SDK's config building (`createConfigFromPolicy`
  plus `available_tools_policy` / `user_profile_policy` /
  `temporary_files_policy`); `platform_support` ports `getPlatformSupport`.

Backends: Bubblewrap (Linux), Seatbelt (macOS), Windows ProcessContainer
(AppContainer + BaseContainer). Other backends and LXC return
`UnsupportedContainment` (LXC has no non-pty capture path); `dry_run` is
rejected for streaming spawns.

Adds `wxc_common::config_parser::load_request_from_value` so the crate maps a
config it already holds as JSON without a base64 round-trip. The in-crate
backend dispatch (`dispatch.rs`) and host probe (`platform.rs`) are marked
provisional — a follow-up moves them into a shared `mxc` engine crate that both
this library and the executor binaries call into.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
Signed-off-by: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
---
 .github/copilot-instructions.md          |    5 +-
 docs/sandbox-policy/v1/policy.md         |    4 +-
 src/Cargo.lock                           |   13 +
 src/Cargo.toml                           |    2 +
 src/core/mxc-sdk/Cargo.toml              |   27 +
 src/core/mxc-sdk/README.md               |  148 +++
 src/core/mxc-sdk/src/dispatch.rs         |  259 ++++++
 src/core/mxc-sdk/src/error.rs            |   97 ++
 src/core/mxc-sdk/src/lib.rs              |   76 ++
 src/core/mxc-sdk/src/platform.rs         |  100 ++
 src/core/mxc-sdk/src/policy.rs           | 1059 ++++++++++++++++++++++
 src/core/mxc-sdk/src/sandbox.rs          |  115 +++
 src/core/mxc-sdk/tests/sandbox.rs        |  308 +++++++
 src/core/mxc-sdk/tests/sdk_helpers.rs    |  245 +++++
 src/core/mxc-sdk/tests/streaming.rs      |  458 ++++++++++
 src/core/wxc_common/src/config_parser.rs |   21 +-
 16 files changed, 2931 insertions(+), 6 deletions(-)
 create mode 100644 src/core/mxc-sdk/Cargo.toml
 create mode 100644 src/core/mxc-sdk/README.md
 create mode 100644 src/core/mxc-sdk/src/dispatch.rs
 create mode 100644 src/core/mxc-sdk/src/error.rs
 create mode 100644 src/core/mxc-sdk/src/lib.rs
 create mode 100644 src/core/mxc-sdk/src/platform.rs
 create mode 100644 src/core/mxc-sdk/src/policy.rs
 create mode 100644 src/core/mxc-sdk/src/sandbox.rs
 create mode 100644 src/core/mxc-sdk/tests/sandbox.rs
 create mode 100644 src/core/mxc-sdk/tests/sdk_helpers.rs
 create mode 100644 src/core/mxc-sdk/tests/streaming.rs

diff --git a/.github/copilot-instructions.md b/.github/copilot-instructions.md
index 3ca324980..0bdfb55d9 100644
--- a/.github/copilot-instructions.md
+++ b/.github/copilot-instructions.md
@@ -173,7 +173,7 @@ The workspace is organized into five top-level directories under `src/`:
 
 | Directory | Purpose | Examples |
 |-----------|---------|----------|
-| `core/` | Cross-platform foundation + per-platform aggregator binaries | `wxc_common/`, `wxc/`, `lxc/`, `mxc_darwin/`, `mxc_pty/`, `mxc_build_common/`, `generated/` |
+| `core/` | Cross-platform foundation + per-platform aggregator binaries | `wxc_common/`, `wxc/`, `lxc/`, `mxc_darwin/`, `mxc-sdk/`, `mxc_pty/`, `mxc_build_common/`, `generated/` |
 | `backends/` | Backend-specific code (one subfolder per containment backend) | `appcontainer/common`, `windows_sandbox/{daemon,guest,common}`, `isolation_session/{bindings,common}`, `hyperlight/common`, `nanvix/{common,build_common,binaries,runner}`, `lxc/common`, `bubblewrap/common`, `wslc/common`, `seatbelt/common` |
 | `host/` | Host-side utilities | `wxc_host_prep/`, `wxc_winhttp_proxy_shim/` |
 | `testing/` | Test infrastructure crates | `wxc_e2e_tests/`, `wxc_test_driver/`, `wxc_test_proxy/`, `linux_test_proxy/`, `wxc_ui_probe/`, `fuzz/` |
@@ -182,7 +182,8 @@ The workspace is organized into five top-level directories under `src/`:
 - `wxc_common` is the **cross-platform foundation**: config parsing, models, errors, logger, `ScriptRunner` / `StatefulSandboxBackend` traits, state-aware dispatch helpers, validators, ids, ui-policy, encoding. Plus a few thin Windows API helpers shared by host tools and backends (`process_util`, `string_util`, `filesystem_dacl`, `diagnostic`). It must not depend on any `backends/*` crate.
 - Each Windows containment backend lives in its own `backends/*/common` crate (e.g. `appcontainer_common`, `windows_sandbox_common`, `isolation_session_common`, `hyperlight_common`, `nanvix_runner`). Backend crates depend on `wxc_common`; there are no cross-edges between backend crates.
 - `wxc` and `lxc` are thin binary crates that wire up CLI args (`clap`) and dispatch to `wxc_common` and the per-backend crates
-- `mxc_pty` is the shared pty bridge used by the unix-side backends (`lxc_common::lxc_bindings::attach_run` on Linux and `seatbelt_common::seatbelt_runner` on macOS) so the inner shell sees a real TTY and host stdio is streamed live
+- `mxc-sdk` is an **importable library** for starting sandboxes in-process without a pty: `spawn_sandbox` takes a `SandboxRequest` (from `build_request`), selects the host backend, and returns a `Sandbox` handle for persistent bidirectional stdio (`take_stdin`/`take_stdout`/`take_stderr`), `kill()`, and `wait()` (which drains and discards any untaken stdout/stderr and returns a `WaitOutcome` — `Exited(i32)` or `TimedOut` — as `io::Result`, reserving `Err` for an actual OS/wait failure). It additionally ports the SDK's config-building surface so callers don't need the TypeScript module: `mxc_sdk::policy` (`SandboxPolicy` + `build_request` → `SandboxRequest` (opaque wrapper mapping to the internal `ExecutionRequest`), the port of `createConfigFromPolicy`; plus `available_tools_policy`/`user_profile_policy`/`temporary_files_policy` discovery helpers) and `mxc_sdk::platform_support` (port of `getPlatformSupport`, using the in-process probe on Windows). It depends on the backend crates (cfg-split: appcontainer on Windows, bubblewrap on Linux, seatbelt on macOS) — so it can't live in `wxc_common`. The public surface is deliberately minimal (streaming only): the `dispatch` and `platform` modules are private and only their used items are re-exported at the crate root (`platform_support`, `PlatformSupport`); `policy` is the one public submodule (callers name `mxc_sdk::policy::{SandboxPolicy sections}`). The execution surface lives in `wxc_common::sandbox_process`: the `SandboxBackend` trait (`validate` + `spawn(request, logger, StdioMode) -> Box<dyn SandboxProcess>` + a `diagnose_exit` hook for enriching launch-failure exits) and the generic `Runner<B>` adapter that bridges any `SandboxBackend` to the run-to-completion `ScriptRunner` (by calling `spawn(StdioMode::Inherit)` then `wait()`). 
`StdioMode::Pipes` hands the caller live stdin/stdout/stderr (what `mxc-sdk` uses); `StdioMode::Inherit` lets the child inherit the host process's own stdio (what the executor binaries use, preserving the TTY under a pty). `SandboxBackend` is implemented for every library backend — Seatbelt (macOS), Bubblewrap (Linux), and Windows ProcessContainer (AppContainer + BaseContainer). The `wxc`/`lxc`/`mxc_darwin` executor binaries do **not** depend on `mxc-sdk`; they keep their own backend dispatch (sharing only the lower-level `appcontainer_common::dispatcher::dispatch_with_fallback`). The `mxc-sdk` in-crate backend dispatch (`dispatch.rs`) and host probing (`platform.rs`) are **provisional** — a follow-up will move them into a dedicated `mxc` engine crate that both `mxc-sdk` and the executor binaries call into.
+- `mxc_pty` is the shared pty bridge used by the LXC backend (`lxc_common::lxc_bindings::attach_run`) so the inner shell sees a real TTY and host stdio is streamed live. (Seatbelt and Bubblewrap no longer use it: they spawn directly and let the child inherit the host's stdio — a TTY when the executor binary runs under a pty — via `SandboxBackend::spawn(StdioMode::Inherit)`.)
 - `mxc_build_common` is a build-time helper crate — all Windows binary crates use it in their `build.rs` to embed VersionInfo (ProductName, FileDescription, copyright, version+commit). When adding a new Windows binary crate, add `mxc_build_common` as a build-dependency and call `mxc_build_common::embed_version_info()` from `build.rs`
 - `nanvix_build_common` is a **build-only** helper crate (never linked into the runtime): it stages NanVix binaries next to the executable and resolves the `NANVIX_BIN` prefetch directory. The `nanvix_binaries`, `wxc`, and `lxc` build scripts consume it as a `[build-dependencies]` entry. Runtime constants it needs (binary/snapshot filenames) stay in `nanvix_common`. Keep build-only file-staging logic here, not in `nanvix_common` (which is a runtime dependency of `nanvix_runner`).
 - Platform-specific modules use `#[cfg(target_os = "windows")]` / `#[cfg(target_os = "linux")]`
diff --git a/docs/sandbox-policy/v1/policy.md b/docs/sandbox-policy/v1/policy.md
index e7f12ced3..a4c1e8a5c 100644
--- a/docs/sandbox-policy/v1/policy.md
+++ b/docs/sandbox-policy/v1/policy.md
@@ -217,8 +217,8 @@ All flags default to `false` (no network access).
 |--------------------|-------------|
 | `allowOutbound`    | Allow outbound connections to the internet (HTTP, DNS, etc.). |
 | `allowLocalNetwork`| Allow connections to local networks. |
-| `allowedHosts`     | When set, ONLY these outbound hosts are reachable. Error if `allowOutbound` is not set. |
-| `blockedHosts`     | Hosts to block even when outbound is allowed. Error if `allowOutbound` is not set. |
+| `allowedHosts`     | When set, ONLY these outbound hosts are reachable. Host-filtering backends (Linux, macOS) accept this without `allowOutbound`; Windows ProcessContainer requires `allowOutbound`. |
+| `blockedHosts`     | Hosts to block even when outbound is allowed. As with `allowedHosts`, only Windows ProcessContainer requires `allowOutbound` to be set. |
 | `proxy`            | `{ builtinTestServer: true }` or `{ url: "..." }`. Routes all traffic through this proxy. Cannot be combined with other network flags. |
 
 Omitted = no network access.
diff --git a/src/Cargo.lock b/src/Cargo.lock
index cead9eaad..26ff4e3d1 100644
--- a/src/Cargo.lock
+++ b/src/Cargo.lock
@@ -1385,6 +1385,19 @@ dependencies = [
  "vmm-sys-util",
 ]
 
+[[package]]
+name = "mxc-sdk"
+version = "0.7.0"
+dependencies = [
+ "appcontainer_common",
+ "bwrap_common",
+ "libc",
+ "seatbelt_common",
+ "serde",
+ "serde_json",
+ "wxc_common",
+]
+
 [[package]]
 name = "mxc_build_common"
 version = "0.7.0"
diff --git a/src/Cargo.toml b/src/Cargo.toml
index 458fd2f28..84e7ba361 100644
--- a/src/Cargo.toml
+++ b/src/Cargo.toml
@@ -4,6 +4,7 @@ members = [
     "core/wxc_common",
     "core/lxc",
     "core/mxc_darwin",
+    "core/mxc-sdk",
     "core/mxc_pty",
     "core/mxc_build_common",
     "core/generated/base_container_specification",
@@ -102,6 +103,7 @@ libc = "0.2"
 nix = { version = "0.29", features = ["fs", "mount", "sched", "signal", "net", "process", "user", "term"] }
 lxc_common = { path = "backends/lxc/common" }
 bwrap_common = { path = "backends/bubblewrap/common" }
+seatbelt_common = { path = "backends/seatbelt/common" }
 wslc_common = { path = "backends/wslc/common" }
 isolation_session_bindings = { path = "backends/isolation_session/bindings" }
 mxc_pty = { path = "core/mxc_pty" }
diff --git a/src/core/mxc-sdk/Cargo.toml b/src/core/mxc-sdk/Cargo.toml
new file mode 100644
index 000000000..ce9a14260
--- /dev/null
+++ b/src/core/mxc-sdk/Cargo.toml
@@ -0,0 +1,27 @@
+[package]
+name = "mxc-sdk"
+version.workspace = true
+edition.workspace = true
+license.workspace = true
+description = "Importable library for starting MXC sandboxes in-process (no pty, streaming stdio)."
+
+[lib]
+name = "mxc_sdk"
+path = "src/lib.rs"
+
+[dependencies]
+wxc_common.workspace = true
+serde = { workspace = true }
+serde_json = { workspace = true }
+
+[target.'cfg(target_os = "windows")'.dependencies]
+appcontainer_common = { workspace = true }
+
+[target.'cfg(target_os = "linux")'.dependencies]
+bwrap_common = { workspace = true }
+
+[target.'cfg(target_os = "macos")'.dependencies]
+seatbelt_common = { workspace = true }
+
+[target.'cfg(target_os = "macos")'.dev-dependencies]
+libc = { workspace = true }
diff --git a/src/core/mxc-sdk/README.md b/src/core/mxc-sdk/README.md
new file mode 100644
index 000000000..b438956d9
--- /dev/null
+++ b/src/core/mxc-sdk/README.md
@@ -0,0 +1,148 @@
+# `mxc-sdk`
+
+An importable Rust library for starting [MXC](../../../README.md) sandboxes
+**in-process**, without ever allocating a pty.
+
+Build a `SandboxRequest` from a [`SandboxPolicy`], then hand it to
+[`spawn_sandbox`], which selects the right containment backend for the host
+and spawns the sandboxed process, returning a handle for live bidirectional
+stdio and termination.
+
+## Usage
+
+```rust,no_run
+use std::io::Read;
+use mxc_sdk::{build_request, spawn_sandbox, SandboxPolicy, WaitOutcome};
+
+// Describe what to restrict, turn it into a request, fill in the command.
+let policy = SandboxPolicy {
+    version: "0.7.0-alpha".to_string(),
+    filesystem: None,
+    network: None,
+    ui: None,
+    timeout_ms: Some(10_000),
+};
+let mut request = build_request(&policy, None)?;
+request.set_script("echo hello");
+
+let mut proc = spawn_sandbox(request)?;
+let mut stdout = proc.take_stdout().unwrap();
+let mut out = String::new();
+stdout.read_to_string(&mut out)?; // "hello\n"
+let outcome = proc.wait()?;       // drains/discards any untaken stream
+assert_eq!(outcome, WaitOutcome::Exited(0));
+# Ok::<(), Box<dyn std::error::Error>>(())
+```
+
+[`build_request`] is the Rust port of the SDK's `createConfigFromPolicy`. It
+resolves the host's containment backend (Seatbelt on macOS, Bubblewrap on
+Linux, ProcessContainer on Windows) and mirrors the SDK's field mapping and
+network validation, building the same wire config internally and running it
+through the shared parser. The returned [`SandboxRequest`] has an empty
+command line — set the command with [`SandboxRequest::set_script`] (and any
+working directory / env) before spawning.
+
+Filesystem-policy discovery helpers (ports of the SDK's `policy.ts`) are also
+available to feed a policy: [`available_tools_policy`] (PATH + tool/SDK env
+dirs), [`user_profile_policy`], and [`temporary_files_policy`].
+
+[`platform_support`] is the Rust port of `getPlatformSupport` — reports host
+support and the available containment backends.
+
+## Live stdio + kill (streaming)
+
+[`spawn_sandbox`] returns a [`Sandbox`] you can drive
+while it runs — persistent bidirectional stdio plus termination. No pty is
+allocated; the streams are ordinary pipes.
+
+```rust,no_run
+use std::io::{Read, Write};
+use mxc_sdk::{build_request, spawn_sandbox, SandboxPolicy, WaitOutcome};
+
+let policy = SandboxPolicy {
+    version: "0.7.0-alpha".to_string(),
+    filesystem: None,
+    network: None,
+    ui: None,
+    timeout_ms: None,
+};
+let mut request = build_request(&policy, None)?;
+request.set_script("cat"); // echoes stdin until EOF
+
+let mut proc = spawn_sandbox(request)?;
+let mut stdin = proc.take_stdin().unwrap();
+let mut stdout = proc.take_stdout().unwrap();
+
+stdin.write_all(b"hello\n")?;
+drop(stdin);                      // close -> child sees EOF
+let mut out = String::new();
+stdout.read_to_string(&mut out)?; // "hello\n"
+
+let outcome = proc.wait()?;       // any untaken stream is drained and discarded
+assert_eq!(outcome, WaitOutcome::Exited(0));
+# Ok::<(), Box<dyn std::error::Error>>(())
+```
+
+The handle is modelled on [`std::process::Child`]:
+
+- `take_stdin()` → `Box<dyn Write + Send>`, `take_stdout()` / `take_stderr()`
+  → `Box<dyn Read + Send>` (drive them yourself; you own draining any stream
+  you take, to avoid the child blocking on a full pipe).
+- `id()` returns the child's OS process id, for external monitoring or a
+  caller-driven process-tree kill.
+- `try_wait()` for a non-blocking exit check.
+- `kill()` terminates the sandboxed process **and its descendants** (a
+  process-tree kill): on Unix the child leads its own process group and the
+  whole group is signalled (an immediate `SIGKILL`, no graceful `SIGTERM`);
+  on Windows the child's job object is terminated.
+- `wait()` blocks until exit (honouring `scriptTimeout`, where `0` waits
+  forever), drains and discards any **untaken** stdout/stderr so the child
+  can't block on a full pipe, and returns a `WaitOutcome` —
+  `Exited(code)` or `TimedOut` if the timeout elapses (`Err` is reserved for an
+  actual OS/wait failure).
+- `stdout_closer()` / `stderr_closer()` → `Option<StreamCloser>`: a
+  closer that makes an in-flight or subsequent read on the taken stream return
+  EOF promptly **without** killing the child — for abandoning a stream a
+  backgrounded descendant is holding open past the foreground command's exit (a
+  plain `kill()` would also take that descendant down). Returns `None` for
+  non-streamed stdio.
+
+Streaming is implemented for **Seatbelt (macOS)**, **Bubblewrap (Linux)**, and
+**Windows ProcessContainer (AppContainer + BaseContainer)** — i.e. every
+backend the library supports.
+
+> **Windows note:** streaming does not use the AppContainer-BFS /
+> AppContainer-DACL fallback. Experimental / newer-schema configs that select
+> BaseContainer require the native BaseContainer API; on a host without it,
+> `spawn_sandbox` fails closed with a clear error rather than
+> falling back to an AppContainer tier.
+
+## Supported backends
+
+The backend is chosen by the `containment` field in the request (or the host
+default):
+
+| Host    | Backend(s)                                             |
+|---------|--------------------------------------------------------|
+| Linux   | Bubblewrap                                             |
+| macOS   | Seatbelt                                               |
+| Windows | ProcessContainer (AppContainer + BaseContainer)        |
+
+Any other backend (Windows Sandbox, IsolationSession, MicroVM, Hyperlight,
+WSLC, LXC) returns an [`Error`] with [`ErrorCode::UnsupportedContainment`]; drive the standalone
+executor binaries for those.
+
+## No pty
+
+The child's stdio is always wired to ordinary pipes — the library never
+allocates a pty (the executor binaries, by contrast, stream live: LXC via a
+pty, Seatbelt/Bubblewrap/AppContainer by inheriting the executor's stdio
+directly — a TTY when the executor has one). Output the caller doesn't
+take is drained and discarded by `wait()`.
+
+## Relationship to the executor binaries
+
+The `wxc-exec`, `lxc-exec`, and `mxc-exec-mac` binaries do not depend on this
+crate. It reuses the same backend crates they do, but selects between them
+directly (no BFS/DACL `dispatch_with_fallback`) and spawns its own streaming
+handles.
diff --git a/src/core/mxc-sdk/src/dispatch.rs b/src/core/mxc-sdk/src/dispatch.rs
new file mode 100644
index 000000000..607ec5758
--- /dev/null
+++ b/src/core/mxc-sdk/src/dispatch.rs
@@ -0,0 +1,259 @@
+// Copyright (c) Microsoft Corporation.
+// Licensed under the MIT License.
+
+//! Streaming backend dispatch for the `mxc-sdk` library.
+//!
+//! Spawns the right [`SandboxProcess`] for the request's containment backend.
+//! It lives here — rather than in `wxc_common` — because constructing a
+//! backend runner requires depending on the `backends/*` crates, and
+//! `wxc_common` must not (it is the cross-platform foundation those backends
+//! build on).
+//!
+//! Only the backends the `mxc-sdk` library officially supports are handled here:
+//! ProcessContainer (Windows AppContainer or native BaseContainer — no tier fallback),
+//! Bubblewrap (Linux), and Seatbelt (macOS). Every other backend — including
+//! the experimental ones (Windows Sandbox, IsolationSession, MicroVM,
+//! Hyperlight, WSLC) and LXC (no streaming path suitable for the library) —
+//! returns [`MxcError::unsupported_containment`]; callers that need those must
+//! drive the standalone executor binaries.
+//!
+//! **Provisional.** This in-crate backend selection is a temporary home. A
+//! follow-up will introduce a dedicated `mxc` engine crate that both `mxc-sdk`
+//! and the executor binaries call into; the selection/spawn logic here — and the
+//! host probing in `platform.rs` — moves there, leaving `mxc-sdk` a thin
+//! streaming wrapper over the engine.
+
+use wxc_common::logger::Logger;
+use wxc_common::models::{ContainmentBackend, ExecutionRequest, ScriptResponse};
+use wxc_common::mxc_error::MxcError;
+use wxc_common::sandbox_process::SandboxProcess;
+
+/// Compile-time host gate: `Ok(())` on Windows/Linux/macOS, otherwise an
+/// `unsupported_containment` error. Checked before backend selection so an
+/// unsupported OS reports a clear message rather than a backend-specific one
+/// (the default/abstract intent resolves to ProcessContainer on non-Linux/macOS hosts).
+fn ensure_host_supported() -> Result<(), MxcError> {
+    #[cfg(any(target_os = "windows", target_os = "linux", target_os = "macos"))]
+    {
+        Ok(())
+    }
+    #[cfg(not(any(target_os = "windows", target_os = "linux", target_os = "macos")))]
+    {
+        Err(MxcError::unsupported_containment(
+            "the mxc-sdk library has no sandbox backend for this host OS \
+             (supported: Windows, Linux, macOS)",
+        ))
+    }
+}
+
+// ---------------------------------------------------------------------------
+// Streaming (handle-based) spawn
+// ---------------------------------------------------------------------------
+
+/// Spawn a [`SandboxProcess`] handle for `request` on the current host.
+///
+/// Dispatches on `request.containment`, spawning the child with piped stdio; the
+/// handle can be written to, read from, waited on, and killed. Fails with
+/// `malformed_request` on `dry_run`; [`MxcError::unsupported_containment`] if unavailable here.
+pub fn spawn_runner(
+    request: &ExecutionRequest,
+    logger: &mut Logger,
+) -> Result<Box<dyn SandboxProcess>, MxcError> {
+    ensure_host_supported()?;
+    // `dry_run` means "validate, don't execute" — there is no process to
+    // stream, so reject it rather than silently ignoring it.
+    if request.dry_run {
+        return Err(MxcError::malformed_request(
+            "dry_run is not supported for streaming spawns",
+        ));
+    }
+    match &request.containment {
+        ContainmentBackend::Seatbelt => spawn_seatbelt(request, logger),
+        ContainmentBackend::Bubblewrap => spawn_bubblewrap(request, logger),
+        ContainmentBackend::ProcessContainer => spawn_process_container(request, logger),
+        other => Err(MxcError::unsupported_containment(format!(
+            "the mxc-sdk library does not yet support streaming for the '{}' backend",
+            other.wire_name()
+        ))),
+    }
+}
+
+/// Map a backend's `spawn` failure `ScriptResponse` to an
+/// [`MxcError`], preserving the `BackendUnavailable` phase (so callers can fall
+/// back to a lower tier) and folding any `extended_error` detail into the
+/// message — rather than flattening everything to a generic `BackendError`.
+fn map_spawn_error(resp: ScriptResponse) -> MxcError {
+    use wxc_common::models::FailurePhase;
+
+    let mut message = resp.error_message;
+    if !resp.extended_error.is_empty() {
+        if message.is_empty() {
+            message = resp.extended_error;
+        } else {
+            message = format!("{message} ({})", resp.extended_error); // "<message> (<detail>)"
+        }
+    }
+    match resp.failure_phase {
+        FailurePhase::BackendUnavailable => MxcError::backend_unavailable(message),
+        _ => MxcError::backend_error(message), // every other phase is a generic backend error
+    }
+}
+
+#[cfg(target_os = "linux")] // real implementation: Bubblewrap runner from `bwrap_common`
+fn spawn_bubblewrap(
+    request: &ExecutionRequest,
+    logger: &mut Logger,
+) -> Result<Box<dyn SandboxProcess>, MxcError> {
+    use wxc_common::sandbox_process::{SandboxBackend, StdioMode};
+    let mut runner = bwrap_common::bwrap_runner::BubblewrapScriptRunner::new();
+    runner
+        .spawn(request, logger, StdioMode::Pipes) // piped stdio: the streaming path
+        .map_err(map_spawn_error)
+}
+
+#[cfg(not(target_os = "linux"))] // stub so `spawn_runner` compiles on every host
+fn spawn_bubblewrap(
+    _request: &ExecutionRequest,
+    _logger: &mut Logger,
+) -> Result<Box<dyn SandboxProcess>, MxcError> {
+    Err(MxcError::unsupported_containment(
+        "Bubblewrap is only available on Linux",
+    ))
+}
+
+#[cfg(target_os = "macos")] // real implementation: Seatbelt runner from `seatbelt_common`
+fn spawn_seatbelt(
+    request: &ExecutionRequest,
+    logger: &mut Logger,
+) -> Result<Box<dyn SandboxProcess>, MxcError> {
+    use wxc_common::sandbox_process::{SandboxBackend, StdioMode};
+    let mut runner = seatbelt_common::seatbelt_runner::SeatbeltScriptRunner::new();
+    runner
+        .spawn(request, logger, StdioMode::Pipes) // piped stdio: the streaming path
+        .map_err(map_spawn_error)
+}
+
+#[cfg(not(target_os = "macos"))] // stub so `spawn_runner` compiles on every host
+fn spawn_seatbelt(
+    _request: &ExecutionRequest,
+    _logger: &mut Logger,
+) -> Result<Box<dyn SandboxProcess>, MxcError> {
+    Err(MxcError::unsupported_containment(
+        "Seatbelt is only available on macOS",
+    ))
+}
+
+#[cfg(target_os = "windows")]
+fn spawn_process_container(
+    request: &ExecutionRequest,
+    logger: &mut Logger,
+) -> Result<Box<dyn SandboxProcess>, MxcError> {
+    use appcontainer_common::appcontainer_runner::AppContainerScriptRunner;
+    use wxc_common::config_parser::is_base_container_version;
+    use wxc_common::sandbox_process::{SandboxBackend, StdioMode};
+
+    // Tier selection — the AppContainer fast path vs the native BaseContainer
+    // (OS sandbox API). Unlike the executor binaries' run-to-completion path,
+    // streaming does NOT route through `dispatch_with_fallback`: there is no
+    // AppContainer-BFS / AppContainer-DACL fallback for streaming.
+    //
+    // Why: `dispatch_with_fallback` yields a run-to-completion
+    // `Box<dyn ScriptRunner>` plus a `DaclManager` guard, neither of which
+    // fits the streaming handle (the DACL tier would require the returned
+    // `SandboxProcess` to own the guard so ACE restore outlives the child).
+    //
+    // Consequence (intentional, fail-closed): an experimental / newer-schema
+    // config on a host that lacks the native BaseContainer API fails here with
+    // a clear "BaseContainer API unavailable" error from
+    // `BaseContainerRunner`'s validation, whereas the binaries' fallback would
+    // drop to an AppContainer tier. Streaming therefore requires the native
+    // BaseContainer API for those configs.
+    let version_implies_base_container = is_base_container_version(&request.schema_version);
+    if request.experimental_enabled || version_implies_base_container {
+        let mut runner = appcontainer_common::base_container_runner::BaseContainerRunner::new();
+        return runner
+            .spawn(request, logger, StdioMode::Pipes)
+            .map_err(map_spawn_error);
+    }
+
+    let mut runner = AppContainerScriptRunner::new(); // neither flag set: plain AppContainer
+    runner
+        .spawn(request, logger, StdioMode::Pipes)
+        .map_err(map_spawn_error)
+}
+
+#[cfg(not(target_os = "windows"))] // stub so `spawn_runner` compiles on every host
+fn spawn_process_container(
+    _request: &ExecutionRequest,
+    _logger: &mut Logger,
+) -> Result<Box<dyn SandboxProcess>, MxcError> {
+    Err(MxcError::unsupported_containment(
+        "ProcessContainer (AppContainer / BaseContainer) is only available on Windows",
+    ))
+}
+
+#[cfg(test)]
+mod tests {
+    use super::spawn_runner;
+    use crate::policy::{build_request, SandboxPolicy};
+    use wxc_common::logger::{Logger, Mode};
+    use wxc_common::mxc_error::MxcErrorCode;
+
+    fn minimal_policy() -> SandboxPolicy { // version only; every optional section is `None`
+        SandboxPolicy {
+            version: "0.7.0-alpha".to_string(),
+            filesystem: None,
+            network: None,
+            ui: None,
+            timeout_ms: None,
+        }
+    }
+
+    #[test]
+    fn streaming_rejects_dry_run() {
+        // `dry_run` ("validate, don't execute") has no process to stream, so the
+        // streaming spawn rejects it. The public `SandboxRequest` can't set it,
+        // so drive the dispatch directly with the internal model.
+        let mut request = build_request(&minimal_policy(), None).expect("build_request");
+        request.inner.dry_run = true;
+        let mut logger = Logger::new(Mode::Buffer);
+        let err = match spawn_runner(&request.inner, &mut logger) {
+            Ok(_) => panic!("dry_run must be rejected"),
+            Err(e) => e,
+        };
+        assert_eq!(err.code, MxcErrorCode::MalformedRequest);
+    }
+
+    #[cfg(target_os = "macos")]
+    #[test]
+    fn streaming_rejects_gui_access() {
+        // A windowed (guiAccess) app needs inherited stdio, so it can't stream
+        // over pipes — the backend must reject it rather than drop the GUI cap.
+        let policy = SandboxPolicy {
+            version: "0.7.0-alpha".to_string(),
+            filesystem: Some(crate::policy::FilesystemSection {
+                readwrite_paths: vec!["/tmp".to_string()],
+                readonly_paths: vec![],
+                denied_paths: vec![],
+                clear_policy_on_exit: None,
+            }),
+            network: None,
+            ui: None,
+            timeout_ms: None,
+        };
+        let mut request = build_request(&policy, None).expect("build_request");
+        request.set_script("echo hi");
+        request
+            .inner
+            .seatbelt
+            .as_mut()
+            .expect("seatbelt config on macOS")
+            .gui_access = true; // flipped on the internal model, not through the policy
+        let mut logger = Logger::new(Mode::Buffer);
+        let err = match spawn_runner(&request.inner, &mut logger) {
+            Ok(_) => panic!("guiAccess must be rejected"),
+            Err(e) => e,
+        };
+        assert!(err.message.contains("guiAccess"), "got: {}", err.message);
+    }
+}
diff --git a/src/core/mxc-sdk/src/error.rs b/src/core/mxc-sdk/src/error.rs
new file mode 100644
index 000000000..02a3ffddc
--- /dev/null
+++ b/src/core/mxc-sdk/src/error.rs
@@ -0,0 +1,97 @@
+// Copyright (c) Microsoft Corporation.
+// Licensed under the MIT License.
+
+//! The SDK's own error type — a crate-owned facade over the internal
+//! `wxc_common` error, so the public API never exposes the foundation crate.
+
+use wxc_common::mxc_error::{MxcError, MxcErrorCode};
+
+/// Closed set of error codes the SDK can return. Mirrors the internal
+/// `MxcErrorCode` variant-for-variant; `as_str` gives the snake_case wire string.
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
+pub enum ErrorCode {
+    MalformedRequest,
+    UnsupportedContainment,
+    UnsupportedPhase,
+    BackendUnavailable,
+    MalformedId,
+    StaleId,
+    NotProvisioned,
+    NotStarted,
+    AlreadyStarted,
+    AlreadyStopped,
+    PolicyValidation,
+    BackendError,
+}
+
+impl ErrorCode {
+    /// Returns the wire-format (snake_case) name of this code, e.g. `"malformed_request"`.
+    pub fn as_str(self) -> &'static str {
+        match self {
+            Self::MalformedRequest => "malformed_request",
+            Self::UnsupportedContainment => "unsupported_containment",
+            Self::UnsupportedPhase => "unsupported_phase",
+            Self::BackendUnavailable => "backend_unavailable",
+            Self::MalformedId => "malformed_id",
+            Self::StaleId => "stale_id",
+            Self::NotProvisioned => "not_provisioned",
+            Self::NotStarted => "not_started",
+            Self::AlreadyStarted => "already_started",
+            Self::AlreadyStopped => "already_stopped",
+            Self::PolicyValidation => "policy_validation",
+            Self::BackendError => "backend_error",
+        }
+    }
+}
+
+impl std::fmt::Display for ErrorCode {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        f.write_str(self.as_str()) // Display text is exactly the wire-format string
+    }
+}
+
+impl From<MxcErrorCode> for ErrorCode {
+    fn from(code: MxcErrorCode) -> Self {
+        match code { // no wildcard arm: a new `MxcErrorCode` variant must be mapped here
+            MxcErrorCode::MalformedRequest => Self::MalformedRequest,
+            MxcErrorCode::UnsupportedContainment => Self::UnsupportedContainment,
+            MxcErrorCode::UnsupportedPhase => Self::UnsupportedPhase,
+            MxcErrorCode::BackendUnavailable => Self::BackendUnavailable,
+            MxcErrorCode::MalformedId => Self::MalformedId,
+            MxcErrorCode::StaleId => Self::StaleId,
+            MxcErrorCode::NotProvisioned => Self::NotProvisioned,
+            MxcErrorCode::NotStarted => Self::NotStarted,
+            MxcErrorCode::AlreadyStarted => Self::AlreadyStarted,
+            MxcErrorCode::AlreadyStopped => Self::AlreadyStopped,
+            MxcErrorCode::PolicyValidation => Self::PolicyValidation,
+            MxcErrorCode::BackendError => Self::BackendError,
+        }
+    }
+}
+
+/// An error returned by the SDK's fallible operations
+/// ([`build_request`](crate::build_request) / [`spawn_sandbox`](crate::spawn_sandbox)).
+#[derive(Debug, Clone, PartialEq, Eq)]
+pub struct Error {
+    /// Machine-readable category, drawn from the closed [`ErrorCode`] set.
+    pub code: ErrorCode,
+    /// A human-readable message describing this particular failure.
+    pub message: String,
+}
+
+impl std::fmt::Display for Error {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        write!(f, "{}: {}", self.code, self.message) // renders as "<wire code>: <message>"
+    }
+}
+
+impl std::error::Error for Error {} // leaf error: keeps the default `source()`
+
+impl From<MxcError> for Error {
+    fn from(error: MxcError) -> Self {
+        Self {
+            code: error.code.into(), // `MxcErrorCode` -> `ErrorCode`
+            message: error.message,
+        }
+    }
+}
diff --git a/src/core/mxc-sdk/src/lib.rs b/src/core/mxc-sdk/src/lib.rs
new file mode 100644
index 000000000..5ba317ef5
--- /dev/null
+++ b/src/core/mxc-sdk/src/lib.rs
@@ -0,0 +1,76 @@
+// Copyright (c) Microsoft Corporation.
+// Licensed under the MIT License.
+
+//! `mxc-sdk` — an importable library for starting MXC sandboxes in-process.
+//!
+//! Build a [`SandboxRequest`] from a [`SandboxPolicy`] with [`build_request`],
+//! then hand it to [`spawn_sandbox`]:
+//! it selects the right containment backend for the host and spawns the
+//! sandboxed process **without ever allocating a pty**, returning a
+//! [`Sandbox`] handle for live bidirectional stdio and termination.
+//!
+//! ```no_run
+//! use mxc_sdk::{build_request, spawn_sandbox, SandboxPolicy, WaitOutcome};
+//!
+//! // Turn a policy into a request, fill in the command, and spawn it.
+//! let policy = SandboxPolicy {
+//!     version: "0.7.0-alpha".to_string(),
+//!     filesystem: None,
+//!     network: None,
+//!     ui: None,
+//!     timeout_ms: None,
+//! };
+//! let mut request = build_request(&policy, None)?;
+//! request.set_script("echo hi");
+//! let mut proc = spawn_sandbox(request)?;
+//! match proc.wait()? {
+//!     WaitOutcome::Exited(code) => println!("exit={code}"),
+//!     WaitOutcome::TimedOut => println!("timed out"),
+//! }
+//! # Ok::<(), Box<dyn std::error::Error>>(())
+//! ```
+//!
+//! ## Backend support
+//!
+//! The selected backend is driven by the `containment` field in the request
+//! (or the host default). The library supports Bubblewrap (Linux), Seatbelt
+//! (macOS), and ProcessContainer — AppContainer and BaseContainer —
+//! (Windows). Other backends return an [`Error`] with
+//! [`ErrorCode::UnsupportedContainment`].
+//!
+//! ## No pty
+//!
+//! The child's stdio is always wired to ordinary pipes — the library never
+//! allocates a pty. Stream the handle's `take_stdout`/`take_stderr`, or let
+//! [`wait`](Sandbox::wait) drain and discard any untaken stream.
+
+mod dispatch;
+mod error;
+mod platform;
+pub mod policy;
+mod sandbox;
+
+use dispatch::spawn_runner;
+pub use platform::{platform_support, PlatformSupport};
+pub use policy::{
+    available_tools_policy, build_request, temporary_files_policy, user_profile_policy,
+    FilesystemPolicyResult, SandboxPolicy, SandboxRequest,
+};
+
+pub use error::{Error, ErrorCode};
+pub use sandbox::{Sandbox, StreamCloser, WaitOutcome};
+
+use wxc_common::logger::{Logger, Mode};
+
+/// Spawn a sandbox from a [`SandboxRequest`] built by [`build_request`] (with
+/// the command, and any working directory / env, filled in).
+///
+/// Returns a [`Sandbox`] handle for live bidirectional stdio and termination;
+/// no pty is allocated. Any stdout/stderr stream the caller does not `take_*` is
+/// drained and discarded by [`wait`](Sandbox::wait).
+pub fn spawn_sandbox(request: SandboxRequest) -> Result<Sandbox, Error> {
+    let mut logger = Logger::new(Mode::Buffer); // local buffer logger; not handed to the caller
+    spawn_runner(&request.inner, &mut logger)
+        .map(Sandbox::new)
+        .map_err(Error::from) // internal `MxcError` -> public SDK `Error`
+}
diff --git a/src/core/mxc-sdk/src/platform.rs b/src/core/mxc-sdk/src/platform.rs
new file mode 100644
index 000000000..5ea7be621
--- /dev/null
+++ b/src/core/mxc-sdk/src/platform.rs
@@ -0,0 +1,100 @@
+// Copyright (c) Microsoft Corporation.
+// Licensed under the MIT License.
+
+//! Host platform support detection — the Rust port of the SDK's
+//! `getPlatformSupport`.
+//!
+//! Reports whether MXC can run on the current host and which containment
+//! backends are available. This lets callers stop depending on the TypeScript
+//! SDK for platform discovery.
+//!
+//! **Provisional.** Like the backend dispatch in `dispatch.rs`, this host
+//! probing is a temporary home; it moves to the future `mxc` engine crate that
+//! both `mxc-sdk` and the executor binaries will share.
+
+/// Platform support information — the Rust analogue of the SDK
+/// `PlatformSupport` type. `Default` is "unsupported": no reason, no methods.
+#[derive(Debug, Clone, Default)]
+pub struct PlatformSupport {
+    /// Whether MXC is supported on the current host.
+    pub is_supported: bool,
+    /// Why the platform is unsupported, when `is_supported` is false.
+    pub reason: Option<String>,
+    /// Containment backends available on this host, by wire name
+    /// (e.g. `"seatbelt"`, `"bubblewrap"`, `"processcontainer"`).
+    pub available_methods: Vec<String>,
+}
+
+/// Detect MXC support on the current host.
+///
+/// Mirrors the SDK's `getPlatformSupport`, restricted to the backends the
+/// `mxc-sdk` library can actually run: macOS checks for `/usr/bin/sandbox-exec`,
+/// Linux runs `bwrap --version`, and Windows reports `processcontainer`
+/// unconditionally (no probe is run and no `wxc-exec --probe` is spawned).
+pub fn platform_support() -> PlatformSupport {
+    #[cfg(target_os = "macos")]
+    {
+        if std::path::Path::new("/usr/bin/sandbox-exec").exists() {
+            PlatformSupport {
+                is_supported: true,
+                available_methods: vec!["seatbelt".to_string()],
+                ..Default::default()
+            }
+        } else {
+            PlatformSupport {
+                reason: Some(
+                    "/usr/bin/sandbox-exec not found; macOS install is incomplete".to_string(),
+                ),
+                ..Default::default()
+            }
+        }
+    }
+
+    #[cfg(target_os = "linux")]
+    {
+        if command_succeeds("bwrap", &["--version"]) {
+            PlatformSupport {
+                is_supported: true,
+                available_methods: vec!["bubblewrap".to_string()],
+                ..Default::default()
+            }
+        } else {
+            PlatformSupport {
+                reason: Some("Bubblewrap is not available on this system".to_string()),
+                ..Default::default()
+            }
+        }
+    }
+
+    #[cfg(target_os = "windows")]
+    {
+        PlatformSupport {
+            is_supported: true,
+            available_methods: vec!["processcontainer".to_string()],
+            ..Default::default()
+        }
+    }
+
+    #[cfg(not(any(target_os = "macos", target_os = "linux", target_os = "windows")))]
+    {
+        PlatformSupport {
+            reason: Some("MXC is not supported on this platform".to_string()),
+            ..Default::default()
+        }
+    }
+}
+
+/// Returns true when `program args...` can be spawned and exits successfully
+/// (stdio is nulled) — used to probe for the presence of `bwrap` on Linux.
+#[cfg(target_os = "linux")]
+fn command_succeeds(program: &str, args: &[&str]) -> bool {
+    use std::process::{Command, Stdio};
+    Command::new(program)
+        .args(args)
+        .stdin(Stdio::null())
+        .stdout(Stdio::null())
+        .stderr(Stdio::null())
+        .status()
+        .map(|s| s.success())
+        .unwrap_or(false) // spawn failure (e.g. binary not found) counts as "not available"
+}
diff --git a/src/core/mxc-sdk/src/policy.rs b/src/core/mxc-sdk/src/policy.rs
new file mode 100644
index 000000000..0b36a556c
--- /dev/null
+++ b/src/core/mxc-sdk/src/policy.rs
@@ -0,0 +1,1059 @@
+// Copyright (c) Microsoft Corporation.
+// Licensed under the MIT License.
+
+//! Policy discovery and config building — the Rust port of the SDK's
+//! `policy.ts` helpers and `createConfigFromPolicy`.
+//!
+//! - [`available_tools_policy`], [`user_profile_policy`], and
+//!   [`temporary_files_policy`] enumerate the host environment to discover
+//!   tool/SDK/profile/temp directories as filesystem-policy fragments.
+//! - [`SandboxPolicy`] mirrors the SDK's cross-platform policy type, and
+//!   [`build_request`] maps it to an [`ExecutionRequest`] for the backends the
+//!   crate supports (Seatbelt, Bubblewrap, ProcessContainer) — so callers no
+//!   longer need the TypeScript SDK to build a spawnable config.
+
+use std::borrow::Cow;
+use std::collections::HashSet;
+use std::path::{Path, PathBuf};
+
+use wxc_common::logger::{Logger, Mode};
+use wxc_common::models::ExecutionRequest;
+use wxc_common::mxc_error::MxcError;
+
+// ---------------------------------------------------------------------------
+// Filesystem policy discovery
+// ---------------------------------------------------------------------------
+
+/// A composable fragment of filesystem policy (empty by `Default`). Callers
+/// merge one or more into a [`SandboxPolicy`]'s filesystem section.
+#[derive(Debug, Clone, Default, PartialEq, Eq)]
+pub struct FilesystemPolicyResult {
+    /// Paths to grant read-only access inside the sandbox.
+    pub readonly_paths: Vec<String>,
+    /// Paths to grant read-write access inside the sandbox.
+    pub readwrite_paths: Vec<String>,
+}
+
+/// Well-known tool/SDK environment variables, mirroring the SDK's
+/// `KNOWN_ENV_VARS`. Each entry is `(name, is_path_list)`: `true` means the value
+/// is a path-list (split on the platform separator), `false` a single path.
+const KNOWN_ENV_VARS: &[(&str, bool)] = &[
+    ("PYTHONPATH", true),
+    ("PYTHONHOME", false),
+    ("VCINSTALLDIR", false),
+    ("VSINSTALLDIR", false),
+    ("PSModulePath", true),
+    ("VCPKG_ROOT", false),
+    ("GOPATH", false),
+    ("GOROOT", false),
+    ("CARGO_HOME", false),
+    ("RUSTUP_HOME", false),
+    ("JAVA_HOME", false),
+    ("NVM_HOME", false),
+    ("NVM_SYMLINK", false),
+    ("NODE_PATH", true),
+    ("DOTNET_ROOT", false),
+    ("CONDA_PREFIX", false),
+    ("LD_LIBRARY_PATH", true),
+    ("VIRTUAL_ENV", false),
+    ("PYENV_ROOT", false),
+];
+
+fn is_windows() -> bool {
+    cfg!(target_os = "windows") // compile-time constant for the build target
+}
+
+/// Split a path-list value on the platform separator (`;` on Windows, `:`
+/// elsewhere), dropping empty entries. Entries are not trimmed or unquoted.
+fn split_path_list(value: &str) -> Vec<String> {
+    let sep = if is_windows() { ';' } else { ':' };
+    value
+        .split(sep)
+        .filter(|p| !p.is_empty())
+        .map(str::to_string)
+        .collect()
+}
+
+fn single_path(value: &str) -> Vec<String> {
+    let trimmed = value.trim(); // whitespace-only values count as empty
+    if trimmed.is_empty() {
+        Vec::new()
+    } else {
+        vec![trimmed.to_string()] // zero-or-one element, same shape as `split_path_list`
+    }
+}
+
+fn directory_exists(dir: &str) -> bool {
+    std::fs::metadata(dir).map(|m| m.is_dir()).unwrap_or(false) // any stat error => false
+}
+
+/// Join `base` with successive path segments, returning an owned `String`.
+/// Every input is a `&str`, so the joined path is valid UTF-8 and the lossy
+/// conversion never actually substitutes characters.
+fn join_str(base: &str, segments: &[&str]) -> String {
+    let mut path = PathBuf::from(base);
+    for segment in segments {
+        path.push(segment);
+    }
+    path.to_string_lossy().into_owned()
+}
+
+/// Resolve a path to absolute, lexically-normalized form — the equivalent of
+/// the SDK's `path.resolve`. Purely lexical (no filesystem access, no symlink
+/// resolution): a relative path is joined with the cwd, then `.`/`..` segments
+/// are collapsed. Crucially it does *not* canonicalize, so on Windows it keeps
+/// the plain `C:\...` form (no `\\?\` verbatim prefix) — otherwise
+/// [`is_system_critical_path`]'s `C:\Windows` prefix check would never match.
+fn resolve_path(p: &str) -> String {
+    let path = Path::new(p);
+    let absolute = if path.is_absolute() {
+        path.to_path_buf()
+    } else {
+        match std::env::current_dir() {
+            Ok(cwd) => cwd.join(path),
+            Err(_) => path.to_path_buf(), // cwd unavailable: the result stays relative
+        }
+    };
+    normalize_lexically(&absolute)
+        .to_string_lossy()
+        .into_owned()
+}
+
+/// Collapse `.`/`..` segments without touching the filesystem, preserving the
+/// path prefix/root (the well-known lexical-normalize pattern).
+fn normalize_lexically(path: &Path) -> PathBuf {
+    use std::path::Component;
+    let mut components = path.components().peekable();
+    let mut out = if let Some(c @ Component::Prefix(..)) = components.peek().copied() {
+        components.next();
+        PathBuf::from(c.as_os_str())
+    } else {
+        PathBuf::new()
+    };
+    for component in components {
+        match component {
+            Component::Prefix(..) => unreachable!("prefix only appears first"),
+            Component::RootDir => out.push(component.as_os_str()),
+            Component::CurDir => {}
+            Component::ParentDir => match out.components().next_back() {
+                // Last component is a real directory name: `..` cancels it.
+                Some(Component::Normal(_)) => {
+                    out.pop();
+                }
+                // At a root/prefix: `..` can't go above it — ignore the segment
+                // (so `/a/../../b` resolves to `/b`, and `C:\..` stays `C:\`).
+                Some(Component::RootDir | Component::Prefix(..)) => {}
+                // Relative path (empty or already leading with `..`): preserve.
+                _ => out.push(component.as_os_str()),
+            },
+            Component::Normal(c) => out.push(c),
+        }
+    }
+    out
+}
+
+/// Resolve each path and drop later duplicates (order kept); case-insensitive on Windows.
+fn deduplicate_paths(paths: &[String]) -> Vec<String> {
+    let windows = is_windows();
+    let mut seen: HashSet<String> = HashSet::new();
+    let mut out = Vec::new();
+    for p in paths {
+        let resolved = resolve_path(p);
+        let key = if windows {
+            resolved.to_lowercase()
+        } else {
+            resolved.clone()
+        };
+        if seen.insert(key) { // `insert` returns true only for a key not seen before
+            out.push(resolved);
+        }
+    }
+    out
+}
+
+/// Whether `dir` is, or lies beneath, a system-critical location that must not be exposed.
+fn is_system_critical_path(dir: &str) -> bool {
+    let normalized = resolve_path(dir);
+    if is_windows() {
+        // A set-but-empty `WINDIR` must not disable the filter: treat empty as
+        // unset and fall back (the same `WINDIR` handling `powershell_policy`
+        // uses).
+        let win_dir = std::env::var("WINDIR")
+            .ok()
+            .or_else(|| std::env::var("windir").ok())
+            .filter(|s| !s.is_empty())
+            .unwrap_or_else(|| "C:\\Windows".to_string())
+            .to_lowercase();
+        // Strip a verbatim (`\\?\`, `\\?\UNC\`) prefix so a path supplied in
+        // that form still matches the plain `C:\Windows` comparison.
+        let n = normalized.to_lowercase();
+        let n = n
+            .strip_prefix(r"\\?\unc\")
+            .or_else(|| n.strip_prefix(r"\\?\"))
+            .unwrap_or(&n);
+        return n == win_dir || n.starts_with(&format!("{win_dir}\\"));
+    }
+    const CRITICAL: &[&str] = &[
+        "/bin",
+        "/sbin",
+        "/usr/bin",
+        "/usr/sbin",
+        "/boot",
+        "/proc",
+        "/sys",
+        "/dev",
+    ];
+    CRITICAL // exact match or a child path; `/binary` does not match `/bin`
+        .iter()
+        .any(|cp| normalized == *cp || normalized.starts_with(&format!("{cp}/")))
+}
+
+fn env_get<'a>(env: &'a [(String, String)], name: &str) -> Option<&'a str> {
+    // First entry whose name matches wins. Windows environment variable names
+    // are case-insensitive (matching the OS and Node's `process.env`, which the
+    // TS SDK relies on); Unix names are case-sensitive.
+    env.iter()
+        .find(|(k, _)| {
+            if cfg!(windows) {
+                k.eq_ignore_ascii_case(name)
+            } else {
+                k == name
+            }
+        })
+        .map(|(_, v)| v.as_str())
+}
+
+/// Borrow the caller-supplied env, or snapshot the process environment when
+/// `None`. Variables whose name or value is not valid Unicode are skipped.
+fn env_or_process(env: Option<&[(String, String)]>) -> Cow<'_, [(String, String)]> {
+    use std::ffi::OsString;
+    // `std::env::vars()` panics on a non-Unicode entry; `vars_os` lets us drop it instead.
+    let utf8 = |(k, v): (OsString, OsString)| k.into_string().ok().zip(v.into_string().ok());
+    env.map_or_else(|| Cow::Owned(std::env::vars_os().filter_map(utf8).collect()), Cow::Borrowed)
+}
+
+/// PowerShell-specific policy: when `pwsh.exe` is found on `path_dirs`
+/// (Windows only), grant the system-drive root (`C:\`) read-only — `pwsh.exe`
+/// enumerates the drive root on startup — plus the PSReadLine history directory
+/// read-write so the module can persist command history.
+///
+/// Mirrors the SDK's `getPowerShellPolicy`. The system drive is read from the
+/// process environment (`SystemDrive`, defaulting to `C:`); the user-scoped
+/// `USERPROFILE` comes from the passed-in `env`.
+///
+/// On non-Windows, or when `pwsh.exe` is not on `path_dirs`, returns an empty
+/// policy.
+fn powershell_policy(path_dirs: &[String], env: &[(String, String)]) -> FilesystemPolicyResult {
+    if !is_windows() {
+        return FilesystemPolicyResult::default();
+    }
+
+    let pwsh_found = path_dirs
+        .iter()
+        .any(|dir| Path::new(dir).join("pwsh.exe").exists());
+    if !pwsh_found {
+        return FilesystemPolicyResult::default();
+    }
+
+    let system_drive = std::env::var("SystemDrive")
+        .ok()
+        .filter(|s| !s.is_empty()) // set-but-empty is treated as unset
+        .unwrap_or_else(|| "C:".to_string());
+    let readonly_paths = vec![format!("{system_drive}\\")]; // drive root, e.g. `C:\`
+
+    let mut readwrite_paths: Vec<String> = Vec::new();
+    if let Some(user_profile) = env_get(env, "USERPROFILE") {
+        // PSReadLine command-history directory (read-write).
+        readwrite_paths.push(join_str(
+            user_profile,
+            &[
+                "AppData",
+                "Roaming",
+                "Microsoft",
+                "Windows",
+                "PowerShell",
+                "PSReadLine",
+            ],
+        ));
+    }
+
+    FilesystemPolicyResult {
+        readonly_paths,
+        readwrite_paths,
+    }
+}
+
+/// Discover tool and SDK directories from `env` (defaults to the process
+/// environment) as read-only policy paths.
+///
+/// Reads `PATH` plus a registry of well-known tool/SDK variables, then filters
+/// out non-existent and system-critical directories, and adds PowerShell paths
+/// when `pwsh.exe` is on `PATH`. The Rust port of `getAvailableToolsPolicy`.
+/// (The SDK's `processcontainer` AAP-ACL filter is Windows-runtime-specific and
+/// is applied server-side; it is not replicated here.)
+pub fn available_tools_policy(env: Option<&[(String, String)]>) -> FilesystemPolicyResult {
+    let env = env_or_process(env);
+    let env: &[(String, String)] = &env;
+
+    let mut collected = Vec::new();
+    let path_value = env_get(env, "PATH")
+        .or_else(|| env_get(env, "Path"))
+        .unwrap_or("");
+    let path_dirs = split_path_list(path_value);
+    collected.extend(path_dirs.iter().cloned());
+
+    for (name, is_list) in KNOWN_ENV_VARS {
+        if let Some(value) = env_get(env, name) {
+            let extracted = if *is_list {
+                split_path_list(value)
+            } else {
+                single_path(value)
+            };
+            collected.extend(extracted);
+        }
+    }
+
+    let filtered: Vec<String> = deduplicate_paths(&collected)
+        .into_iter()
+        .filter(|dir| directory_exists(dir) && !is_system_critical_path(dir))
+        .collect();
+
+    let pwsh = powershell_policy(&path_dirs, env); // probes the raw, unfiltered PATH entries
+
+    let mut readonly = filtered;
+    readonly.extend(pwsh.readonly_paths); // not subject to the existence/critical filter above
+
+    FilesystemPolicyResult {
+        readonly_paths: deduplicate_paths(&readonly),
+        readwrite_paths: deduplicate_paths(&pwsh.readwrite_paths),
+    }
+}
+
+/// Read-only policy for standard user-profile application data locations.
+///
+/// Windows: immediate subdirectories of `%LOCALAPPDATA%\Programs`. Other
+/// platforms: `~/.local/bin` and `~/.local/lib`. The Rust port of
+/// `getUserProfilePolicy`.
+pub fn user_profile_policy() -> FilesystemPolicyResult {
+    let readonly_paths: Vec<String> = if is_windows() {
+        // Immediate subdirectories of `%LOCALAPPDATA%\Programs`, if that can be read.
+        std::env::var("LOCALAPPDATA")
+            .ok()
+            .filter(|local_app_data| directory_exists(local_app_data))
+            .and_then(|root| std::fs::read_dir(Path::new(&root).join("Programs")).ok())
+            .into_iter()
+            .flatten()
+            .flatten()
+            .filter(|entry| entry.file_type().map(|kind| kind.is_dir()).unwrap_or(false))
+            .map(|entry| entry.path().to_string_lossy().into_owned())
+            .collect()
+    } else {
+        // `~/.local/bin` and `~/.local/lib`, each kept only when it exists.
+        std::env::var("HOME")
+            .ok()
+            .into_iter()
+            .flat_map(|home| {
+                [".local/bin", ".local/lib"]
+                    .map(|sub| Path::new(&home).join(sub).to_string_lossy().into_owned())
+            })
+            .filter(|dir| directory_exists(dir))
+            .collect()
+    };
+
+    FilesystemPolicyResult {
+        readonly_paths,
+        readwrite_paths: Vec::new(),
+    }
+}
+
+/// Read-write policy for the host temporary directory.
+///
+/// Windows: `TEMP` or `TMP`. Other platforms: `TMPDIR` or `/tmp`. Returns an
+/// empty fragment when the resolved directory does not exist. The Rust port of
+/// `getTemporaryFilesPolicy`.
+pub fn temporary_files_policy(env: Option<&[(String, String)]>) -> FilesystemPolicyResult {
+    let resolved = env_or_process(env);
+    let env: &[(String, String)] = &resolved;
+
+    // Only non-Windows hosts have a built-in fallback directory (`/tmp`).
+    let temp_root = if !is_windows() {
+        env_get(env, "TMPDIR").or(Some("/tmp"))
+    } else {
+        env_get(env, "TEMP").or_else(|| env_get(env, "TMP"))
+    };
+    let Some(root) = temp_root.filter(|&root| directory_exists(root)) else {
+        return FilesystemPolicyResult::default();
+    };
+    FilesystemPolicyResult {
+        readonly_paths: Vec::new(),
+        readwrite_paths: vec![root.to_string()],
+    }
+}
+
+// ---------------------------------------------------------------------------
+// SandboxPolicy -> ExecutionRequest
+// ---------------------------------------------------------------------------
+
+/// Clipboard access level granted to the sandbox, mirroring the SDK
+/// `ClipboardPolicy` union (`"none" | "read" | "write" | "all"`).
+#[derive(Debug, Clone, Copy, PartialEq, Eq, serde::Serialize, serde::Deserialize, Default)]
+#[serde(rename_all = "camelCase")]
+pub enum ClipboardPolicy {
+    /// No clipboard access (the `Default` value).
+    #[default]
+    None,
+    /// Read-only access to the clipboard.
+    Read,
+    /// Write-only access to the clipboard.
+    Write,
+    /// Both read and write access to the clipboard.
+    All,
+}
+
+impl ClipboardPolicy {
+    /// The lowercase wire-format string the config parser accepts for this level.
+    fn wire(self) -> &'static str {
+        match self {
+            Self::None => "none",
+            Self::Read => "read",
+            Self::Write => "write",
+            Self::All => "all",
+        }
+    }
+}
+
+/// Filesystem section of a [`SandboxPolicy`]; fields omitted on the wire take their defaults.
+#[derive(Debug, Clone, Default, serde::Deserialize)]
+#[serde(rename_all = "camelCase", default)]
+pub struct FilesystemSection {
+    pub readwrite_paths: Vec<String>,
+    pub readonly_paths: Vec<String>,
+    pub denied_paths: Vec<String>,
+    /// Whether to clear the filesystem policy when the shell exits (`None` is treated as `true`).
+    pub clear_policy_on_exit: Option<bool>,
+}
+
+/// Network proxy selection, mirroring the SDK union type
+/// `{ builtinTestServer: true } | { localhost: number } | { url: string }`.
+#[derive(Debug, Clone)]
+pub enum ProxySpec {
+    /// Route through the built-in test proxy server.
+    BuiltinTestServer,
+    /// Route through a proxy on `127.0.0.1` at the given port.
+    Localhost(u16),
+    /// Route through the proxy at this explicit URL.
+    Url(String),
+}
+
+// Custom `Deserialize` matching the SDK's object union
+// `{ builtinTestServer: true } | { localhost: number } | { url: string }`.
+// serde's default derive can't express it, and an untagged enum would silently
+// keep the first matching variant when several conflicting keys are present, so
+// we parse all recognised modes and require exactly one — rejecting conflicts
+// the way the shared wire-config parser does.
+impl<'de> serde::Deserialize<'de> for ProxySpec {
+    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
+    where
+        D: serde::Deserializer<'de>,
+    {
+        #[derive(serde::Deserialize)]
+        #[serde(rename_all = "camelCase", deny_unknown_fields)]
+        struct Wire {
+            #[serde(default)]
+            builtin_test_server: Option<bool>,
+            #[serde(default)]
+            localhost: Option<u16>,
+            #[serde(default)]
+            url: Option<String>,
+        }
+        const EXPLICIT_FALSE: &str =
+            "network.proxy.builtinTestServer must be true; omit the proxy to disable it";
+        const NOT_EXACTLY_ONE: &str =
+            "network.proxy must set exactly one of builtinTestServer, localhost, or url";
+
+        let wire = Wire::deserialize(deserializer)?;
+        match (wire.builtin_test_server, wire.localhost, wire.url) {
+            (Some(true), None, None) => Ok(ProxySpec::BuiltinTestServer),
+            (None, Some(port), None) => Ok(ProxySpec::Localhost(port)),
+            (None, None, Some(url)) => Ok(ProxySpec::Url(url)),
+            // The SDK type only admits `true`, so an explicit `false` is malformed;
+            // fail closed instead of selecting the permissive built-in proxy.
+            (Some(false), None, None) => Err(serde::de::Error::custom(EXPLICIT_FALSE)),
+            _ => Err(serde::de::Error::custom(NOT_EXACTLY_ONE)),
+        }
+    }
+}
+
+/// Network section of a [`SandboxPolicy`]; omitted flags deserialize to `false` (deny).
+#[derive(Debug, Clone, Default, serde::Deserialize)]
+#[serde(rename_all = "camelCase", default)]
+pub struct NetworkSection {
+    pub allow_outbound: bool,
+    pub allow_local_network: bool,
+    pub allowed_hosts: Vec<String>,
+    pub blocked_hosts: Vec<String>,
+    pub proxy: Option<ProxySpec>,
+}
+
+/// UI section of a [`SandboxPolicy`]; omitted fields deserialize to their denying defaults.
+#[derive(Debug, Clone, Default, serde::Deserialize)]
+#[serde(rename_all = "camelCase", default)]
+pub struct UiSection {
+    pub allow_windows: bool,
+    pub clipboard: ClipboardPolicy,
+    pub allow_input_injection: bool,
+}
+
+/// Cross-platform sandbox policy — the Rust counterpart of the SDK
+/// `SandboxPolicy`. It states *what* to restrict; any omitted field takes its
+/// most-restrictive (default-deny) meaning.
+#[derive(Debug, Clone, serde::Deserialize)]
+#[serde(rename_all = "camelCase")]
+pub struct SandboxPolicy {
+    /// Policy/schema version (e.g. `"0.7.0-alpha"`); the only field without a serde default.
+    pub version: String,
+    #[serde(default)]
+    pub filesystem: Option<FilesystemSection>,
+    #[serde(default)]
+    pub network: Option<NetworkSection>,
+    #[serde(default)]
+    pub ui: Option<UiSection>,
+    /// Execution timeout in milliseconds; `None` means no timeout.
+    #[serde(default)]
+    pub timeout_ms: Option<u32>,
+}
+
+/// A spawnable sandbox request, produced from a [`SandboxPolicy`] by
+/// [`build_request`]. Supply the command via
+/// [`set_script`](Self::set_script) — plus, optionally, a working
+/// directory or environment — and pass it to
+/// [`spawn_sandbox`](crate::spawn_sandbox).
+///
+/// This is the SDK's own request type; the internal execution model behind it
+/// is an implementation detail that callers do not depend on.
+#[derive(Debug, Clone)]
+pub struct SandboxRequest {
+    /// The wrapped internal execution model. It is `pub(crate)` so the SDK's own
+    /// modules and unit tests can map/inspect it without it entering the public API.
+    pub(crate) inner: ExecutionRequest,
+}
+
+impl SandboxRequest {
+    /// Set the command the sandbox runs: the `/bin/sh -c` body on Unix, the
+    /// command line on Windows.
+    ///
+    /// The raw string becomes the same `script_code` the executor binaries run,
+    /// so it is interpreted exactly as the SDK's `spawnSandbox(script)` /
+    /// `process.commandLine` is — identical behavior across the SDK and this crate.
+    pub fn set_script(&mut self, script: impl Into<String>) -> &mut Self {
+        let command: String = script.into();
+        self.inner.script_code = command;
+        self
+    }
+
+    /// Override the directory the sandboxed child starts in; when never called,
+    /// the policy's own resolution applies.
+    pub fn set_working_directory(&mut self, working_directory: impl Into<String>) -> &mut Self {
+        let directory: String = working_directory.into();
+        self.inner.working_directory = directory;
+        self
+    }
+
+    /// Replace the child's environment with the given `KEY=VALUE` entries.
+    pub fn set_env(&mut self, env: Vec<String>) -> &mut Self {
+        self.inner.env = env;
+        self
+    }
+
+    /// Extra Mach service names the Seatbelt (macOS) profile lets the child look
+    /// up. Empty when the request carries no Seatbelt config (i.e. a non-Seatbelt
+    /// backend). Read these — e.g. to union with your own — before calling
+    /// [`set_seatbelt_extra_mach_lookups`](Self::set_seatbelt_extra_mach_lookups).
+    pub fn seatbelt_extra_mach_lookups(&self) -> &[String] {
+        match self.inner.seatbelt.as_ref() {
+            Some(seatbelt) => seatbelt.extra_mach_lookups.as_slice(),
+            None => &[],
+        }
+    }
+
+    /// Set the Seatbelt (macOS) extra Mach service names the child may look up,
+    /// creating a default Seatbelt config first if the request carries none.
+    pub fn set_seatbelt_extra_mach_lookups(&mut self, lookups: Vec<String>) -> &mut Self {
+        let seatbelt = self.inner.seatbelt.get_or_insert_default();
+        seatbelt.extra_mach_lookups = lookups;
+        self
+    }
+
+    /// Allow (or deny) the Seatbelt-sandboxed (macOS) child access to the system
+    /// keychain, creating a default Seatbelt config first if there is none.
+    pub fn set_seatbelt_keychain_access(&mut self, allow: bool) -> &mut Self {
+        let seatbelt = self.inner.seatbelt.get_or_insert_default();
+        seatbelt.keychain_access = allow;
+        self
+    }
+}
+
+/// Build a [`SandboxRequest`] from a [`SandboxPolicy`], resolving the host's
+/// containment backend — the Rust port of the SDK's `createConfigFromPolicy`.
+///
+/// The returned request has an empty command line; set the command with
+/// [`SandboxRequest::set_script`] (and any working directory / env) before
+/// streaming it via [`crate::spawn_sandbox`].
+///
+/// Mirrors the SDK field mapping and validation (network proxy/host-filtering
+/// constraints) for the supported backends. Internally it builds the same
+/// wire-format `ContainerConfig` the SDK emits and runs it through the shared
+/// config parser, so validation and the wire→model mapping match production.
+pub fn build_request(
+    policy: &SandboxPolicy,
+    container_name: Option<&str>,
+) -> Result<SandboxRequest, crate::Error> {
+    // An empty schema version is tolerated by the shared parser (it reads as
+    // "unset") but required by the SDK, so it is rejected up front for parity.
+    if policy.version.is_empty() {
+        return Err(MxcError::malformed_request("Policy version is required").into());
+    }
+
+    // The wire config is mapped to a request directly, with no base64/file
+    // round-trip. Its command line is deliberately empty — the caller fills in
+    // `script_code` before running — so a missing command is tolerated here.
+    let wire_config = build_wire_config(policy, container_name)?;
+    let mut logger = Logger::new(Mode::Buffer);
+    wxc_common::config_parser::load_request_from_value(wire_config, &mut logger, true)
+        .map(|inner| SandboxRequest { inner })
+        .map_err(|e| MxcError::malformed_request(format!("failed to build request: {e}")).into())
+}
+
+/// Construct the wire-format `ContainerConfig` JSON value for the supported
+/// backends, mirroring `createConfigFromPolicy` + the per-backend builders.
+fn build_wire_config(
+    policy: &SandboxPolicy,
+    container_name: Option<&str>,
+) -> Result<serde_json::Value, MxcError> {
+    use serde_json::json;
+
+    // A caller-supplied name wins; otherwise a random token is minted.
+    let container_id = match container_name {
+        Some(name) => name.to_string(),
+        None => wxc_common::id::mint_random_token(),
+    };
+
+    // Omitted sections fall back to their `Default` values.
+    let fs = policy.filesystem.clone().unwrap_or_default();
+    let ui = policy.ui.clone().unwrap_or_default();
+    let preserve_policy = !fs.clear_policy_on_exit.unwrap_or(true);
+
+    let mut config = json!({
+        "version": policy.version,
+        "containerId": container_id,
+        "lifecycle": { "destroyOnExit": true, "preservePolicy": preserve_policy },
+        "process": { "commandLine": "", "timeout": policy.timeout_ms.unwrap_or(0) },
+        "filesystem": {
+            "readwritePaths": fs.readwrite_paths,
+            "readonlyPaths": fs.readonly_paths,
+            "deniedPaths": fs.denied_paths,
+        },
+        "ui": {
+            "disable": !ui.allow_windows,
+            "clipboard": ui.clipboard.wire(),
+            "injection": ui.allow_input_injection,
+        },
+    });
+
+    // Mirror the SDK's `resolvesToHostFilteringBackend` (sdk/src/sandbox.ts):
+    // Linux (Bubblewrap/LXC) and macOS (Seatbelt) count as host-filtering
+    // backends, so host lists are accepted without `allowOutbound`; only Windows
+    // ProcessContainer requires it. Seatbelt cannot actually enforce hostnames
+    // (`profile_builder` degrades a non-empty `allowedHosts` to allow-all
+    // outbound), but macOS accepts them anyway to stay reconciled with the SDK.
+    let targets_host_filtering_backend = cfg!(any(target_os = "linux", target_os = "macos"));
+
+    config["network"] = match &policy.network {
+        None => json!({ "defaultPolicy": "block" }),
+        Some(net) => {
+            if cfg!(target_os = "macos") && net.proxy.is_some() {
+                return Err(MxcError::malformed_request(
+                    "Proxy configuration is not supported on macOS",
+                ));
+            }
+            let filters_hosts = !(net.allowed_hosts.is_empty() && net.blocked_hosts.is_empty());
+            if filters_hosts && !net.allow_outbound && !targets_host_filtering_backend {
+                return Err(MxcError::malformed_request(
+                    "allowedHosts/blockedHosts require allowOutbound to be true",
+                ));
+            }
+
+            let mut network = json!({
+                "defaultPolicy": if net.allow_outbound { "allow" } else { "block" },
+                "allowLocalNetwork": net.allow_local_network,
+                "allowedHosts": net.allowed_hosts,
+                "blockedHosts": net.blocked_hosts,
+            });
+            if let Some(proxy) = &net.proxy {
+                network["proxy"] = proxy_to_wire(proxy);
+            }
+            network
+        }
+    };
+
+    apply_backend(&mut config, policy, &container_id);
+    Ok(config)
+}
+
+fn proxy_to_wire(proxy: &ProxySpec) -> serde_json::Value {
+    let (key, value) = match proxy {
+        ProxySpec::BuiltinTestServer => ("builtinTestServer", serde_json::json!(true)),
+        ProxySpec::Localhost(port) => ("localhost", serde_json::json!(port)),
+        ProxySpec::Url(url) => ("url", serde_json::json!(url)),
+    };
+    serde_json::json!({ key: value })
+}
+
+/// Apply backend-specific fields, resolving the abstract `Process` intent the
+/// same way the SDK does (Bubblewrap on Linux, Seatbelt on macOS,
+/// BaseContainer on Windows).
+fn apply_backend(config: &mut serde_json::Value, policy: &SandboxPolicy, container_id: &str) {
+    use serde_json::json;
+
+    // Default resolution of the abstract Process intent; the macOS branch overrides it.
+    config["containment"] = json!("process");
+
+    #[cfg(target_os = "linux")]
+    {
+        let _ = (policy, container_id);
+        apply_linux_network_policy(config);
+    }
+
+    #[cfg(target_os = "macos")]
+    {
+        let _ = (policy, container_id);
+        config["containment"] = json!("seatbelt");
+        if config.get("seatbelt").is_none() {
+            config["seatbelt"] = json!({});
+        }
+    }
+
+    #[cfg(target_os = "windows")]
+    {
+        // Network flags translate to container capabilities, in this fixed order.
+        let net = policy.network.as_ref();
+        let mut capabilities: Vec<&str> = Vec::new();
+        if net.is_some_and(|n| n.allow_outbound) {
+            capabilities.push("internetClient");
+        }
+        if net.is_some_and(|n| n.allow_local_network) {
+            capabilities.push("privateNetworkClientServer");
+        }
+        config["processContainer"] = json!({
+            "name": container_id,
+            "leastPrivilege": false,
+            "capabilities": capabilities,
+            "ui": {
+                "isolation": "container",
+                "desktopSystemControl": false,
+                "systemSettings": "none",
+                "ime": false,
+            },
+        });
+        // Host rules switch enforcement from capabilities-only to both mechanisms.
+        if let Some(network) = config.get_mut("network") {
+            let mode = match has_host_rules(network) {
+                true => "both",
+                false => "capabilities",
+            };
+            network["enforcementMode"] = json!(mode);
+        }
+    }
+
+    #[cfg(not(any(target_os = "linux", target_os = "macos", target_os = "windows")))]
+    {
+        let _ = (policy, container_id);
+    }
+}
+
+/// True when the network section carries any host allow/deny rules, deciding
+/// whether host-level enforcement is engaged. (Linux + Windows only.)
+#[cfg(any(target_os = "linux", target_os = "windows"))]
+fn has_host_rules(network: &serde_json::Value) -> bool {
+    // A key counts only when it holds a JSON array with at least one element.
+    ["allowedHosts", "blockedHosts"].iter().any(|key| {
+        network
+            .get(*key)
+            .and_then(|value| value.as_array())
+            .is_some_and(|hosts| !hosts.is_empty())
+    })
+}
+
+/// Promote network enforcement to `firewall` when host rules are present and
+/// no cooperative proxy is configured — the Linux counterpart of the SDK's
+/// `applyLinuxNetworkPolicy`.
+#[cfg(target_os = "linux")]
+fn apply_linux_network_policy(config: &mut serde_json::Value) {
+    use serde_json::json;
+    if let Some(network) = config.get_mut("network") {
+        // Host rules without a configured proxy are promoted to firewall enforcement.
+        let proxied = network.get("proxy").is_some();
+        if !proxied && has_host_rules(network) {
+            network["enforcementMode"] = json!("firewall");
+        }
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::ProxySpec;
+
+    #[test]
+    fn proxy_builtin_test_server_true_is_accepted() {
+        let parsed = serde_json::from_str::<ProxySpec>(r#"{ "builtinTestServer": true }"#);
+        let spec = parsed.expect("true is valid");
+        assert!(matches!(spec, ProxySpec::BuiltinTestServer));
+    }
+
+    #[test]
+    fn proxy_builtin_test_server_false_is_rejected() {
+        // `false` is malformed: it must neither parse nor silently select the
+        // (experimental, deliberately-permissive) built-in proxy.
+        let parsed = serde_json::from_str::<ProxySpec>(r#"{ "builtinTestServer": false }"#);
+        let err = parsed.expect_err("false must be rejected");
+        assert!(
+            err.to_string().contains("builtinTestServer must be true"),
+            "unexpected error: {err}"
+        );
+    }
+
+    #[test]
+    fn proxy_conflicting_modes_are_rejected() {
+        // Setting several modes at once is an error (cr-005); the parser must
+        // reject the input rather than quietly keep whichever mode happens to
+        // match first.
+        let conflicting = r#"{ "builtinTestServer": true, "localhost": 8080 }"#;
+        let parsed = serde_json::from_str::<ProxySpec>(conflicting);
+        let err = parsed.expect_err("conflicting proxy modes must be rejected");
+        assert!(
+            err.to_string().contains("exactly one"),
+            "unexpected error: {err}"
+        );
+    }
+
+    #[test]
+    fn proxy_localhost_and_url_still_parse() {
+        // The two single-key forms must each select their own variant.
+        let parse = |json: &str| serde_json::from_str::<ProxySpec>(json);
+
+        let localhost = parse(r#"{ "localhost": 8080 }"#).expect("localhost");
+        assert!(matches!(localhost, ProxySpec::Localhost(8080)));
+
+        let url = parse(r#"{ "url": "http://proxy" }"#).expect("url");
+        assert!(matches!(url, ProxySpec::Url(_)));
+    }
+
+    #[cfg(target_os = "windows")]
+    #[test]
+    fn powershell_policy_grants_system_drive_root() {
+        use super::powershell_policy;
+        use std::fs;
+        use std::path::PathBuf;
+
+        // Stand in for `$PSHOME` with a uniquely named temp dir holding a fake pwsh.exe.
+        let nanos = std::time::SystemTime::now()
+            .duration_since(std::time::UNIX_EPOCH)
+            .unwrap()
+            .as_nanos();
+        let dir_name = format!("mxc_pwsh_policy_test_{}_{}", std::process::id(), nanos);
+        let ps_home: PathBuf = std::env::temp_dir().join(dir_name);
+        fs::create_dir_all(&ps_home).expect("create temp $PSHOME");
+        fs::write(ps_home.join("pwsh.exe"), b"").expect("create fake pwsh.exe");
+
+        let path_dirs = [ps_home.to_string_lossy().into_owned()];
+        let env = vec![("USERPROFILE".to_string(), "C:\\Users\\example".to_string())];
+        let result = powershell_policy(&path_dirs, &env);
+
+        // Remove the temp dir before asserting so a failed assertion leaves nothing behind.
+        let _ = fs::remove_dir_all(&ps_home);
+
+        // The system-drive root (e.g. `C:\`) is granted read-only — pwsh
+        // enumerates the drive root on startup (mirrors `getPowerShellPolicy`).
+        // Stripped of trailing separators, a bare drive root is a 2-char `X:`.
+        let is_drive_root = |path: &String| {
+            let trimmed = path.trim_end_matches(['\\', '/']);
+            trimmed.len() == 2 && trimmed.ends_with(':')
+        };
+        assert!(
+            result.readonly_paths.iter().any(is_drive_root),
+            "expected system-drive root in readonly paths: {:?}",
+            result.readonly_paths
+        );
+
+        // PSReadLine command history stays read-write.
+        let has_history = result
+            .readwrite_paths
+            .iter()
+            .any(|path| path.contains("PSReadLine"));
+        assert!(
+            has_history,
+            "expected PSReadLine history in readwrite paths: {:?}",
+            result.readwrite_paths
+        );
+    }
+
+    use super::{build_request, NetworkSection, SandboxPolicy};
+
+    fn policy_with_network(network: NetworkSection) -> SandboxPolicy {
+        SandboxPolicy {
+            version: String::from("0.7.0-alpha"),
+            network: Some(network),
+            filesystem: None,
+            ui: None,
+            timeout_ms: None,
+        }
+    }
+
+    // macOS Seatbelt counts as a host-filtering backend, mirroring the SDK
+    // (`resolvesToHostFilteringBackend` in sdk/src/sandbox.ts), so `allowedHosts`
+    // is accepted with or without `allowOutbound` — staying consistent with the
+    // SDK wins over rejecting on macOS, although Seatbelt cannot filter by host.
+    #[cfg(target_os = "macos")]
+    #[test]
+    fn macos_allowed_hosts_without_outbound_is_accepted() {
+        // The `allowOutbound` guard applies only to Windows ProcessContainer.
+        let network = NetworkSection {
+            allowed_hosts: vec![String::from("example.com")],
+            allow_outbound: false,
+            ..NetworkSection::default()
+        };
+        let policy = policy_with_network(network);
+        assert!(
+            build_request(&policy, None).is_ok(),
+            "macOS must accept allowedHosts without allowOutbound, matching the SDK"
+        );
+    }
+
+    #[cfg(target_os = "macos")]
+    #[test]
+    fn macos_allowed_hosts_with_outbound_is_accepted() {
+        // Outbound is explicitly allowed, so this builds (Seatbelt cannot enforce the list).
+        let network = NetworkSection {
+            allowed_hosts: vec![String::from("example.com")],
+            allow_outbound: true,
+            ..NetworkSection::default()
+        };
+        let policy = policy_with_network(network);
+        assert!(
+            build_request(&policy, None).is_ok(),
+            "outbound-allowed host filter should build"
+        );
+    }
+
+    #[test]
+    fn build_request_maps_filesystem_and_timeout() {
+        // Only one read-write path and a timeout are set; the rest stays default.
+        let filesystem = super::FilesystemSection {
+            readwrite_paths: vec![String::from("/tmp")],
+            ..Default::default()
+        };
+
+        let policy = SandboxPolicy {
+            version: String::from("0.7.0-alpha"),
+            filesystem: Some(filesystem),
+            network: None,
+            ui: None,
+            timeout_ms: Some(5000),
+        };
+
+        let request =
+            build_request(&policy, Some("test-container")).expect("build_request should succeed");
+
+        // The assertions look at the internal model the SDK maps to — a unit-test
+        // concern; the public API only hands back the opaque `SandboxRequest`.
+        let model = &request.inner;
+        assert_eq!(model.script_timeout, 5000);
+        assert!(model.policy.readwrite_paths.contains(&"/tmp".to_string()));
+        // `build_request` leaves the command empty for the caller to fill in.
+        assert!(model.script_code.is_empty());
+    }
+
+    #[test]
+    fn build_request_preserves_clipboard_policy() {
+        use super::ClipboardPolicy as Sdk;
+        use wxc_common::models::ClipboardPolicy as Model;
+
+        for (input, expected) in [
+            (Sdk::None, Model::None),
+            (Sdk::Read, Model::Read),
+            (Sdk::Write, Model::Write),
+            (Sdk::All, Model::All),
+        ] {
+            let policy = SandboxPolicy {
+                version: String::from("0.7.0-alpha"),
+                ui: Some(super::UiSection {
+                    clipboard: input,
+                    allow_windows: true,
+                    allow_input_injection: false,
+                }),
+                filesystem: None,
+                network: None,
+                timeout_ms: None,
+            };
+            let request = build_request(&policy, None).expect("build_request should succeed");
+            assert_eq!(
+                request.inner.policy.ui.clipboard, expected,
+                "clipboard {input:?} should map to {expected:?}"
+            );
+        }
+    }
+
+    #[test]
+    fn build_request_maps_network_hosts() {
+        let network = NetworkSection {
+            allowed_hosts: vec![String::from("allowed.example")],
+            blocked_hosts: vec![String::from("blocked.example")],
+            allow_outbound: true,
+            allow_local_network: true,
+            ..NetworkSection::default()
+        };
+        let request = build_request(&policy_with_network(network), None)
+            .expect("build_request should accept host rules with allowOutbound");
+
+        // Both host lists and the local-network flag must survive into the
+        // internal model.
+        let model = &request.inner.policy;
+        assert!(model
+            .allowed_hosts
+            .contains(&"allowed.example".to_string()));
+        assert!(model
+            .blocked_hosts
+            .contains(&"blocked.example".to_string()));
+        assert!(model.allow_local_network);
+    }
+
+    #[cfg(target_os = "macos")]
+    #[test]
+    fn seatbelt_extra_mach_lookups_and_keychain_round_trip() {
+        let policy = SandboxPolicy {
+            version: String::from("0.7.0-alpha"),
+            filesystem: None,
+            network: None,
+            ui: None,
+            timeout_ms: None,
+        };
+        // On macOS `build_request` resolves to Seatbelt, so the config exists and
+        // a consumer can read its defaults before writing its own values back.
+        let mut request = build_request(&policy, None).expect("build_request");
+        let extra = String::from("com.example.service");
+        let mut union = request.seatbelt_extra_mach_lookups().to_vec();
+        union.push(extra.clone());
+        request
+            .set_seatbelt_extra_mach_lookups(union.clone())
+            .set_seatbelt_keychain_access(true);
+
+        assert_eq!(request.seatbelt_extra_mach_lookups(), union.as_slice());
+        let seatbelt = request
+            .inner
+            .seatbelt
+            .as_ref()
+            .expect("seatbelt config on macOS");
+        assert!(seatbelt.keychain_access);
+        assert!(seatbelt.extra_mach_lookups.contains(&extra));
+    }
+}
diff --git a/src/core/mxc-sdk/src/sandbox.rs b/src/core/mxc-sdk/src/sandbox.rs
new file mode 100644
index 000000000..5c47c834a
--- /dev/null
+++ b/src/core/mxc-sdk/src/sandbox.rs
@@ -0,0 +1,115 @@
+// Copyright (c) Microsoft Corporation.
+// Licensed under the MIT License.
+
+//! The SDK's sandbox handle — a crate-owned facade over the internal
+//! `wxc_common` streaming handle, so the public API never exposes the
+//! foundation crate's traits.
+
+use std::io::{Read, Write};
+
+use wxc_common::sandbox_process::{SandboxProcess, StreamCloser as InnerCloser};
+
+/// What [`Sandbox::wait`] observed once the wait itself succeeded.
+///
+/// A normal exit and a timeout are both reported through this type as `Ok`
+/// values; [`Sandbox::wait`] keeps its `Err` for an actual OS / wait
+/// failure.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum WaitOutcome {
+    /// The process exited with this code. On Unix a process terminated by a
+    /// signal (rather than exiting normally) surfaces as `Exited(-1)`.
+    Exited(i32),
+    /// The request's `scriptTimeout` elapsed before the process exited; the
+    /// process and its whole tree were killed.
+    TimedOut,
+}
+
+/// A running sandboxed process, as handed back by [`spawn_sandbox`](crate::spawn_sandbox).
+///
+/// Use the `take_*` accessors to stream the child's stdio, then wait for it or
+/// kill it (along with its whole tree). The streams are ordinary pipes; no pty
+/// is allocated. Whatever stdout/stderr the caller leaves untaken is drained
+/// and discarded by [`wait`](Self::wait).
+pub struct Sandbox {
+    inner: Box<dyn SandboxProcess>,
+}
+
+impl Sandbox {
+    pub(crate) fn new(inner: Box<dyn SandboxProcess>) -> Self {
+        Sandbox { inner }
+    }
+
+    /// Hand over the child's stdin pipe; every call after the first yields `None`.
+    pub fn take_stdin(&mut self) -> Option<Box<dyn Write + Send>> {
+        self.inner.take_stdin()
+    }
+
+    /// Hand over the child's stdout pipe; every call after the first yields `None`.
+    pub fn take_stdout(&mut self) -> Option<Box<dyn Read + Send>> {
+        self.inner.take_stdout()
+    }
+
+    /// Hand over the child's stderr pipe; every call after the first yields `None`.
+    pub fn take_stderr(&mut self) -> Option<Box<dyn Read + Send>> {
+        self.inner.take_stderr()
+    }
+
+    /// A [`StreamCloser`] for stdout: it releases a blocking read parked on the
+    /// stream without killing the child. `None` if stdout was not piped.
+    pub fn stdout_closer(&self) -> Option<StreamCloser> {
+        self.inner.stdout_closer().map(StreamCloser::new)
+    }
+
+    /// The stderr counterpart of [`stdout_closer`](Self::stdout_closer).
+    pub fn stderr_closer(&self) -> Option<StreamCloser> {
+        self.inner.stderr_closer().map(StreamCloser::new)
+    }
+
+    /// Poll for exit without blocking: `Some(code)` once the child has exited.
+    pub fn try_wait(&mut self) -> std::io::Result<Option<i32>> {
+        self.inner.try_wait()
+    }
+
+    /// The process id of the child.
+    pub fn id(&self) -> u32 {
+        self.inner.id()
+    }
+
+    /// Kill the child together with its process tree.
+    pub fn kill(&mut self) -> std::io::Result<()> {
+        self.inner.kill()
+    }
+
+    /// Block until the child exits. Any stdout/stderr that was never taken is
+    /// drained and discarded so the child can't stall on a full pipe.
+    ///
+    /// Yields [`WaitOutcome::Exited`] carrying the exit code, or
+    /// [`WaitOutcome::TimedOut`] when the request's `scriptTimeout` elapsed (the
+    /// process and its tree are killed first). `Err` is reserved for an actual
+    /// OS / wait failure.
+    pub fn wait(&mut self) -> std::io::Result<WaitOutcome> {
+        // An `ErrorKind::TimedOut` error from the inner wait becomes an outcome.
+        match self.inner.wait() {
+            Err(e) if e.kind() == std::io::ErrorKind::TimedOut => Ok(WaitOutcome::TimedOut),
+            other => other.map(WaitOutcome::Exited),
+        }
+    }
+}
+
+/// Handle that closes one stream of a [`Sandbox`], releasing a read parked on
+/// it without killing the process. Obtained from [`Sandbox::stdout_closer`] /
+/// [`Sandbox::stderr_closer`].
+pub struct StreamCloser {
+    inner: Box<dyn InnerCloser>,
+}
+
+impl StreamCloser {
+    fn new(inner: Box<dyn InnerCloser>) -> Self {
+        Self { inner }
+    }
+
+    /// Close the stream so that any read currently parked on it returns.
+    pub fn close(&self) {
+        self.inner.close();
+    }
+}
diff --git a/src/core/mxc-sdk/tests/sandbox.rs b/src/core/mxc-sdk/tests/sandbox.rs
new file mode 100644
index 000000000..90aca5781
--- /dev/null
+++ b/src/core/mxc-sdk/tests/sandbox.rs
@@ -0,0 +1,308 @@
+// Copyright (c) Microsoft Corporation.
+// Licensed under the MIT License.
+
+//! End-to-end tests for the `mxc-sdk` library against the host backend.
+//!
+//! Seatbelt-specific cases run only on macOS. The library exposes only the
+//! streaming API, so "run to completion" here means build a request via
+//! [`build_request`], `spawn_sandbox`, read the (untaken)
+//! stdout/stderr, then [`wait`](mxc_sdk::Sandbox::wait) for the exit code —
+//! the same path the consumer drives.
+
+use mxc_sdk::{build_request, ErrorCode, SandboxPolicy};
+#[cfg(any(target_os = "macos", target_os = "windows"))]
+use mxc_sdk::{spawn_sandbox, SandboxRequest, WaitOutcome};
+
+/// Build a Seatbelt request that exposes `/tmp` read-write and runs `command`.
+/// `timeout_ms` is in milliseconds; `0` == run until exit.
+#[cfg(target_os = "macos")]
+fn seatbelt_request(command: &str, timeout_ms: u32) -> SandboxRequest {
+    // The policy spells "no timeout" as an absent field, so `0` maps to `None`.
+    let timeout_ms = Some(timeout_ms).filter(|&ms| ms != 0);
+    let filesystem = mxc_sdk::policy::FilesystemSection {
+        readwrite_paths: vec!["/tmp".to_string()],
+        readonly_paths: vec![],
+        denied_paths: vec![],
+        clear_policy_on_exit: None,
+    };
+    let policy = SandboxPolicy {
+        version: "0.7.0-alpha".to_string(),
+        filesystem: Some(filesystem),
+        network: None,
+        ui: None,
+        timeout_ms,
+    };
+
+    let mut request = build_request(&policy, None).expect("build_request should succeed");
+    request.set_script(command);
+    request
+}
+
+/// Build a Windows ProcessContainer request exposing `C:\Windows\Temp`
+/// read-write. The policy `version` picks the tier (>= 0.5 implies BaseContainer).
+#[cfg(target_os = "windows")]
+fn process_container_request(version: &str, command: &str, timeout_ms: u32) -> SandboxRequest {
+    // A `timeout_ms` of `0` leaves the policy's timeout field unset.
+    let timeout_ms = Some(timeout_ms).filter(|&ms| ms != 0);
+    let filesystem = mxc_sdk::policy::FilesystemSection {
+        readwrite_paths: vec!["C:\\Windows\\Temp".to_string()],
+        readonly_paths: vec![],
+        denied_paths: vec![],
+        clear_policy_on_exit: None,
+    };
+    let policy = SandboxPolicy {
+        version: version.to_string(),
+        filesystem: Some(filesystem),
+        network: None,
+        ui: None,
+        timeout_ms,
+    };
+
+    let mut request = build_request(&policy, None).expect("build_request should succeed");
+    request.set_script(command);
+    request
+}
+
+/// What `spawn_and_wait` observed from one run: exit status plus captured stdio text.
+#[cfg(any(target_os = "macos", target_os = "windows"))]
+#[derive(Debug)]
+struct RunOutcome {
+    exit_code: i32,
+    timed_out: bool,
+    standard_out: String,
+    standard_err: String,
+}
+
+/// Run a request to completion with the streaming API: spawn it, read stdout
+/// and stderr on their own threads, then wait for the exit outcome.
+#[cfg(any(target_os = "macos", target_os = "windows"))]
+fn spawn_and_wait(request: SandboxRequest) -> Result<RunOutcome, mxc_sdk::Error> {
+    use std::io::Read;
+
+    fn read_thread(
+        reader: Option<Box<dyn Read + Send>>,
+    ) -> Option<std::thread::JoinHandle<String>> {
+        // Read errors are deliberately ignored; the thread returns `text` as is.
+        let mut pipe = reader?;
+        Some(std::thread::spawn(move || {
+            let mut text = String::new();
+            let _ = pipe.read_to_string(&mut text);
+            text
+        }))
+    }
+
+    let mut sandbox = spawn_sandbox(request)?;
+    let out_reader = read_thread(sandbox.take_stdout());
+    let err_reader = read_thread(sandbox.take_stderr());
+    let (exit_code, timed_out) = match sandbox.wait() {
+        Ok(WaitOutcome::Exited(code)) => (code, false),
+        // A timed-out run carries no exit code; -1 stands in for it.
+        Ok(WaitOutcome::TimedOut) => (-1, true),
+        Err(e) => panic!("wait failed: {e}"),
+    };
+
+    // Collect the captured text after the wait. A reader that is absent or
+    // whose thread panicked contributes an empty string.
+    let standard_out = out_reader.and_then(|t| t.join().ok()).unwrap_or_default();
+    let standard_err = err_reader.and_then(|t| t.join().ok()).unwrap_or_default();
+    Ok(RunOutcome {
+        exit_code,
+        timed_out,
+        standard_out,
+        standard_err,
+    })
+}
+
+#[test]
+fn version_older_than_supported_is_rejected() {
+    // A schema version under the supported floor (>=0.4) has to be refused by
+    // the parser, before any backend selection takes place.
+    let policy = SandboxPolicy {
+        version: "0.3.0-alpha".to_string(),
+        filesystem: None,
+        network: None,
+        ui: None,
+        timeout_ms: None,
+    };
+
+    let rejection =
+        build_request(&policy, None).expect_err("an out-of-range schema version must be rejected");
+    assert_eq!(rejection.code, ErrorCode::MalformedRequest);
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn seatbelt_does_not_leak_host_environment() {
+    // A host env var must not be visible to the sandboxed child (the request's
+    // env is the only source; the host environment is cleared).
+    std::env::set_var("MXC_HOST_SECRET", "leaked-value");
+    let outcome = spawn_and_wait(seatbelt_request("echo [$MXC_HOST_SECRET]", 10000));
+    // Unset the variable before unwrapping, so an `Err` run cannot leave it set.
+    std::env::remove_var("MXC_HOST_SECRET");
+    let result = outcome.expect("seatbelt run should succeed");
+
+    assert_eq!(result.exit_code, 0, "stderr: {}", result.standard_err);
+    assert!(
+        !result.standard_out.contains("leaked-value"),
+        "host env must not leak into the sandbox, got: {:?}",
+        result.standard_out
+    );
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn seatbelt_env_reaches_sandboxed_process() {
+    // Env entries placed on the request are expected to show up in the child.
+    let mut request = seatbelt_request("echo $MXC_TEST_VAR", 10000);
+    request.set_env(vec!["MXC_TEST_VAR=injected-value".to_string()]);
+
+    let outcome = spawn_and_wait(request).expect("seatbelt run should succeed");
+
+    assert_eq!(outcome.exit_code, 0, "stderr: {}", outcome.standard_err);
+    assert!(
+        outcome.standard_out.contains("injected-value"),
+        "env var should reach the sandboxed process, got: {:?}",
+        outcome.standard_out
+    );
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn seatbelt_finite_timeout_fires() {
+    // When scriptTimeout is finite and shorter than the command's runtime, it
+    // has to fire and terminate the process.
+    let began = std::time::Instant::now();
+    let run = spawn_and_wait(seatbelt_request("sleep 30", 1000))
+        .expect("seatbelt run should return a response");
+    assert!(run.timed_out, "a timed-out run must report a timeout");
+    assert!(
+        began.elapsed() < std::time::Duration::from_secs(20),
+        "timeout must fire well before the command's own 30s runtime"
+    );
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn seatbelt_captures_stderr_only() {
+    // A command that writes only to stderr must have that text captured on
+    // standard_err, while standard_out stays free of it.
+    let outcome = spawn_and_wait(seatbelt_request("echo only-stderr 1>&2", 10000))
+        .expect("seatbelt run should succeed");
+    assert_eq!(outcome.exit_code, 0, "stderr: {}", outcome.standard_err);
+    assert!(
+        outcome.standard_err.contains("only-stderr"),
+        "stderr should be captured, got: {:?}",
+        outcome.standard_err
+    );
+    assert!(
+        !outcome.standard_out.contains("only-stderr"),
+        "stdout should be empty, got: {:?}",
+        outcome.standard_out
+    );
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn seatbelt_reports_nonzero_exit_code() {
+    let outcome =
+        spawn_and_wait(seatbelt_request("exit 7", 10000)).expect("seatbelt run should succeed");
+
+    assert_eq!(outcome.exit_code, 7);
+    assert!(
+        !outcome.timed_out,
+        "a clean non-zero exit must not be reported as a timeout"
+    );
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn seatbelt_defaults_cwd_to_allowed_path_without_getcwd_leak() {
+    // With no `cwd` on the request, the child should start in a directory the
+    // sandbox allows (the first readwrite path) instead of inheriting a host
+    // cwd it may not reach, so getcwd() reports no permission error on stderr.
+    let outcome =
+        spawn_and_wait(seatbelt_request("/bin/pwd", 10000)).expect("seatbelt run should succeed");
+
+    assert_eq!(outcome.exit_code, 0, "stderr: {}", outcome.standard_err);
+    assert!(
+        outcome.standard_out.contains("tmp"),
+        "child cwd should default to the readwrite path, got: {:?}",
+        outcome.standard_out
+    );
+    assert!(
+        !outcome.standard_err.contains("getcwd")
+            && !outcome.standard_err.contains("Operation not permitted"),
+        "no getcwd leak expected, stderr: {:?}",
+        outcome.standard_err
+    );
+}
+
+// ---------------------------------------------------------------------------
+// Windows ProcessContainer (AppContainer + BaseContainer) — integration tests.
+//
+// These exercise the capture and timeout paths that regressed as review items
+// #1 (BaseContainer ran with an already-closed process handle) and #2
+// (AppContainer timeout killed only the direct child, so it never fired).
+// They run a real sandbox, so they require an elevated, host-prepped Windows
+// host (see docs/host-prep.md) and are therefore `#[ignore]`d — run them with
+// `cargo test -p mxc-sdk -- --ignored` on such a host.
+// ---------------------------------------------------------------------------
+
+#[cfg(target_os = "windows")]
+#[test]
+#[ignore = "requires an elevated, host-prepped Windows host (see docs/host-prep.md)"]
+fn base_container_captures_stdout() {
+    // Schema >= 0.5 implies the BaseContainer fallback. Guards against the #1
+    // regression: getting a valid exit code plus the captured stdout shows the
+    // process handle stayed open for the wait.
+    let outcome = spawn_and_wait(process_container_request(
+        "0.7.0-alpha",
+        "cmd /c echo hello-base-container",
+        30000,
+    ))
+    .expect("BaseContainer run should succeed");
+    assert_eq!(outcome.exit_code, 0, "stderr: {}", outcome.standard_err);
+    assert!(
+        outcome.standard_out.contains("hello-base-container"),
+        "stdout should be captured, got: {:?}",
+        outcome.standard_out
+    );
+}
+
+#[cfg(target_os = "windows")]
+#[test]
+#[ignore = "requires an elevated, host-prepped Windows host (see docs/host-prep.md)"]
+fn appcontainer_captures_stdout() {
+    // Schema 0.4 stays on the AppContainer fast path, without BaseContainer.
+    let outcome = spawn_and_wait(process_container_request(
+        "0.4.0-alpha",
+        "cmd /c echo hello-appcontainer",
+        30000,
+    ))
+    .expect("AppContainer run should succeed");
+    assert_eq!(outcome.exit_code, 0, "stderr: {}", outcome.standard_err);
+    assert!(
+        outcome.standard_out.contains("hello-appcontainer"),
+        "stdout should be captured, got: {:?}",
+        outcome.standard_out
+    );
+}
+
+#[cfg(target_os = "windows")]
+#[test]
+#[ignore = "requires an elevated, host-prepped Windows host (see docs/host-prep.md)"]
+fn appcontainer_finite_timeout_fires() {
+    // Regression guard for #2: a finite timeout must fire even when the command
+    // spawns a descendant that keeps the inherited stdout write-end open. Killing
+    // only the direct child would leave the capture reader blocked on that pipe.
+    let start = std::time::Instant::now();
+    let result = spawn_and_wait(process_container_request(
+        "0.4.0-alpha",
+        "cmd /c start /b ping -n 60 127.0.0.1 >nul & ping -n 60 127.0.0.1 >nul",
+        2000,
+    ))
+    .expect("AppContainer run should return a response");
+    assert!(result.timed_out, "a timed-out run must report a timeout");
+    // Also bound the wall clock: the pings would otherwise hold the run for about a minute.
+    assert!(start.elapsed() < std::time::Duration::from_secs(30));
+}
diff --git a/src/core/mxc-sdk/tests/sdk_helpers.rs b/src/core/mxc-sdk/tests/sdk_helpers.rs
new file mode 100644
index 000000000..69e115393
--- /dev/null
+++ b/src/core/mxc-sdk/tests/sdk_helpers.rs
@@ -0,0 +1,245 @@
+// Copyright (c) Microsoft Corporation.
+// Licensed under the MIT License.
+
+//! Tests for the ported SDK helpers: policy discovery, platform support, and
+//! the SandboxPolicy -> SandboxRequest builder.
+
+use mxc_sdk::{
+    available_tools_policy, build_request, platform_support, temporary_files_policy,
+    user_profile_policy, SandboxPolicy,
+};
+
+#[cfg(target_os = "macos")]
+use mxc_sdk::{spawn_sandbox, WaitOutcome};
+
+fn env_pairs(pairs: &[(&str, &str)]) -> Vec<(String, String)> {
+    pairs
+        .iter()
+        .map(|&(key, value)| (key.to_owned(), value.to_owned()))
+        .collect()
+}
+
+#[test]
+fn platform_support_reports_host() {
+    let report = platform_support();
+    // All platforms this test runs on (macOS/Linux/Windows in CI) are supported.
+    assert!(report.is_supported, "reason: {:?}", report.reason);
+    assert!(!report.available_methods.is_empty());
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn platform_support_macos_is_seatbelt() {
+    let report = platform_support();
+    assert_eq!(report.available_methods, vec!["seatbelt".to_string()]);
+}
+
+#[test]
+fn available_tools_policy_filters_nonexistent_and_dedups() {
+    // Inputs: the cwd (a real dir), a bogus dir, and the cwd a second time
+    // under a known variable.
+    let cwd = std::env::current_dir()
+        .unwrap()
+        .to_string_lossy()
+        .into_owned();
+    let sep = if cfg!(target_os = "windows") {
+        ";"
+    } else {
+        ":"
+    };
+    let path_val = format!("{cwd}{sep}/this/does/not/exist/xyzzy");
+    let env = env_pairs(&[("PATH", &path_val), ("CARGO_HOME", &cwd)]);
+
+    let tools = available_tools_policy(Some(&env));
+
+    assert!(
+        tools.readonly_paths.iter().any(|p| p.contains(&cwd)),
+        "the full resolved cwd should be discovered: cwd={cwd:?} paths={:?}",
+        tools.readonly_paths
+    );
+    assert!(
+        !tools.readonly_paths.iter().any(|p| p.contains("xyzzy")),
+        "non-existent dir should be filtered: {:?}",
+        tools.readonly_paths
+    );
+    // cwd was supplied twice (PATH + CARGO_HOME) but must be deduplicated.
+    // Entries are matched by the cwd's final path component, computed once
+    // here instead of once per entry.
+    let cwd_name = std::path::Path::new(&cwd)
+        .file_name()
+        .unwrap()
+        .to_str()
+        .unwrap();
+    let cwd_hits = tools
+        .readonly_paths
+        .iter()
+        .filter(|p| p.ends_with(cwd_name))
+        .count();
+    assert!(
+        cwd_hits <= 1,
+        "cwd should not be duplicated: {:?}",
+        tools.readonly_paths
+    );
+}
+
+#[test]
+fn temporary_files_policy_returns_existing_temp() {
+    let existing_dir = std::env::current_dir()
+        .unwrap()
+        .to_string_lossy()
+        .into_owned();
+    let temp_var = if cfg!(target_os = "windows") {
+        "TEMP"
+    } else {
+        "TMPDIR"
+    };
+    let env = env_pairs(&[(temp_var, &existing_dir)]);
+
+    let temp = temporary_files_policy(Some(&env));
+    assert_eq!(temp.readwrite_paths.len(), 1);
+    assert!(temp.readonly_paths.is_empty());
+}
+
+#[test]
+fn temporary_files_policy_empty_when_missing() {
+    // Both temp variables point at a path that is expected not to exist, so no
+    // read-write path may be reported.
+    let missing = "/no/such/temp/xyzzy";
+    let env = env_pairs(&[("TEMP", missing), ("TMPDIR", missing)]);
+    let temp = temporary_files_policy(Some(&env));
+    assert!(temp.readwrite_paths.is_empty());
+}
+
+#[test]
+fn user_profile_policy_does_not_panic() {
+    // The result depends on the host; only check that the call returns and that
+    // readwrite stays empty (the fragment is read-only).
+    let profile = user_profile_policy();
+    assert!(profile.readwrite_paths.is_empty());
+}
+
+#[test]
+fn build_request_rejects_empty_version() {
+    // Matches the SDK, which throws "Policy version is required".
+    let policy = SandboxPolicy {
+        version: "".to_string(),
+        filesystem: None,
+        network: None,
+        ui: None,
+        timeout_ms: None,
+    };
+
+    let err = build_request(&policy, None).expect_err("an empty policy version must be rejected");
+    assert_eq!(err.code, mxc_sdk::ErrorCode::MalformedRequest);
+}
+
+#[test]
+fn build_request_host_rules_require_outbound() {
+    let policy = SandboxPolicy {
+        version: "0.7.0-alpha".to_string(),
+        filesystem: None,
+        network: Some(mxc_sdk::policy::NetworkSection {
+            allow_outbound: false,
+            allow_local_network: false,
+            allowed_hosts: vec!["example.com".to_string()],
+            blocked_hosts: vec![],
+            proxy: None,
+        }),
+        ui: None,
+        timeout_ms: None,
+    };
+
+    // Follows the SDK's `resolvesToHostFilteringBackend`: host rules without
+    // `allowOutbound` are accepted on Linux (Bubblewrap/LXC) and macOS (Seatbelt);
+    // only the Windows ProcessContainer backend requires it. No case may panic.
+    let built = build_request(&policy, None);
+    if cfg!(any(target_os = "linux", target_os = "macos")) {
+        assert!(
+            built.is_ok(),
+            "Linux/macOS host-filtering backends accept host rules without allowOutbound (matching the SDK)"
+        );
+    } else {
+        assert!(
+            built.is_err(),
+            "Windows ProcessContainer requires allowOutbound for host rules"
+        );
+    }
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn build_request_then_run_seatbelt() {
+    let policy = SandboxPolicy {
+        version: "0.7.0-alpha".to_string(),
+        filesystem: Some(mxc_sdk::policy::FilesystemSection {
+            readwrite_paths: vec!["/tmp".to_string()],
+            readonly_paths: vec![],
+            denied_paths: vec![],
+            clear_policy_on_exit: None,
+        }),
+        network: None,
+        ui: None,
+        timeout_ms: Some(10000),
+    };
+
+    let mut request = build_request(&policy, None).expect("build_request should succeed");
+    request.set_script("echo built-from-policy");
+
+    let mut sandbox = spawn_sandbox(request).expect("spawn should succeed");
+    let mut out = String::new();
+    if let Some(mut pipe) = sandbox.take_stdout() {
+        let _ = std::io::Read::read_to_string(&mut pipe, &mut out);
+    }
+    let exit = sandbox.wait().expect("wait should succeed");
+    assert_eq!(exit, WaitOutcome::Exited(0));
+    assert!(out.contains("built-from-policy"), "got: {out:?}");
+}
+
+#[cfg(target_os = "linux")]
+#[test]
+fn platform_support_linux_methods_are_bubblewrap_only() {
+    let report = platform_support();
+    // On Linux the crate dispatches only Bubblewrap (LXC has no captured /
+    // streaming path), so no other method should ever be reported.
+    for method in &report.available_methods {
+        assert_eq!(method, "bubblewrap", "unexpected Linux method: {method}");
+    }
+}
+
+#[cfg(target_os = "windows")]
+#[test]
+fn platform_support_windows_is_processcontainer() {
+    let report = platform_support();
+    assert!(report.is_supported, "reason: {:?}", report.reason);
+    assert_eq!(
+        report.available_methods,
+        vec!["processcontainer".to_string()]
+    );
+}
+
+#[test]
+fn available_tools_policy_filters_system_critical() {
+    // An existing system-critical directory on PATH has to be dropped, so it
+    // never shows up in readonly_paths.
+    let system_dir = if cfg!(target_os = "windows") {
+        format!(
+            "{}\\System32",
+            std::env::var("WINDIR").unwrap_or_else(|_| "C:\\Windows".to_string())
+        )
+    } else {
+        "/usr/bin".to_string()
+    };
+    if !std::path::Path::new(&system_dir).is_dir() {
+        return; // nothing to check when this host lacks the critical dir
+    }
+    let env = env_pairs(&[("PATH", &system_dir)]);
+    let tools = available_tools_policy(Some(&env));
+    assert!(
+        !tools
+            .readonly_paths
+            .iter()
+            .any(|p| p.to_lowercase().contains("system32") || p == "/usr/bin"),
+        "system-critical dir must be filtered: {:?}",
+        tools.readonly_paths
+    );
+}
diff --git a/src/core/mxc-sdk/tests/streaming.rs b/src/core/mxc-sdk/tests/streaming.rs
new file mode 100644
index 000000000..da168739b
--- /dev/null
+++ b/src/core/mxc-sdk/tests/streaming.rs
@@ -0,0 +1,458 @@
+// Copyright (c) Microsoft Corporation.
+// Licensed under the MIT License.
+
+//! Streaming (handle-based) API tests: live stdio, kill, and wait.
+//! The crate-level `cfg` builds this file only on macOS, so its Windows case never compiles.
+//!
+//! These drive the real consumer path: build a [`SandboxRequest`] from a
+//! [`SandboxPolicy`] via `build_request`, fill in the command, then
+//! `spawn_sandbox`.
+
+#![cfg(target_os = "macos")]
+
+use mxc_sdk::{build_request, spawn_sandbox, SandboxPolicy, SandboxRequest, WaitOutcome};
+
+/// Build a Seatbelt streaming request (`/tmp` read-write) for `command`.
+/// `timeout_ms` is in ms; `0` == run until exit, required for interactive/long cases.
+#[cfg(target_os = "macos")]
+fn seatbelt_request(command: &str, timeout_ms: u32) -> SandboxRequest {
+    let timeout_ms = match timeout_ms {
+        0 => None,
+        ms => Some(ms),
+    };
+    let policy = SandboxPolicy {
+        version: "0.7.0-alpha".to_string(),
+        filesystem: Some(mxc_sdk::policy::FilesystemSection {
+            readwrite_paths: vec!["/tmp".to_string()],
+            readonly_paths: vec![],
+            denied_paths: vec![],
+            clear_policy_on_exit: None,
+        }),
+        network: None,
+        ui: None,
+        timeout_ms,
+    };
+    let mut request = build_request(&policy, None).expect("build_request should succeed");
+    request.set_script(command);
+    request
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn streaming_double_take_returns_none() {
+    let mut sbox = spawn_sandbox(seatbelt_request("cat", 0)).expect("spawn");
+
+    assert!(
+        sbox.take_stdin().is_some(),
+        "first take_stdin yields the pipe"
+    );
+    assert!(sbox.take_stdin().is_none(), "second take_stdin yields None");
+    assert!(
+        sbox.take_stdout().is_some(),
+        "first take_stdout yields the pipe"
+    );
+    assert!(
+        sbox.take_stdout().is_none(),
+        "second take_stdout yields None"
+    );
+    assert!(
+        sbox.take_stderr().is_some(),
+        "first take_stderr yields the pipe"
+    );
+    assert!(
+        sbox.take_stderr().is_none(),
+        "second take_stderr yields None"
+    );
+
+    sbox.kill().expect("kill");
+    let _ = sbox.wait();
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn streaming_try_wait_reports_exit_after_completion() {
+    let mut sbox = spawn_sandbox(seatbelt_request("true", 0)).expect("spawn");
+
+    // Poll try_wait (up to 100 times, 50ms apart) until it reports an exit.
+    let code = (0..100)
+        .find_map(|_| {
+            let polled = sbox.try_wait().expect("try_wait");
+            if polled.is_none() {
+                std::thread::sleep(std::time::Duration::from_millis(50));
+            }
+            polled
+        })
+        .expect("process should exit and try_wait report it");
+    assert_eq!(code, 0, "quick command should exit 0");
+}
+
+#[test]
+fn streaming_kill_after_reap_is_a_noop() {
+    // Regression: after the child has exited and been reaped (via `wait` here),
+    // `kill()` must not signal its pid/pgid again, because a recycled pid could
+    // belong to an unrelated process (group). A post-reap `kill()` is a no-op.
+    let mut sbox = spawn_sandbox(seatbelt_request("true", 0)).expect("spawn");
+    assert_eq!(
+        sbox.wait().expect("wait"),
+        WaitOutcome::Exited(0),
+        "quick command should exit 0"
+    );
+    sbox.kill().expect("kill after reap is a no-op Ok");
+    sbox.kill().expect("repeat kill after reap stays Ok");
+}
+
+#[test]
+fn streaming_kill_after_try_wait_reap_is_a_noop() {
+    // The exact race the review flagged: `try_wait()` reaps the exited child, so
+    // a later `kill()` must not signal the now-recycled pid/pgid. Poll try_wait
+    // to completion, after which `kill()` must remain a clean no-op.
+    let mut sbox = spawn_sandbox(seatbelt_request("true", 0)).expect("spawn");
+    // `any` stops at the first reported exit; each miss is followed by a 50ms sleep.
+    let reaped = (0..100).any(|_| {
+        let exited = sbox.try_wait().expect("try_wait").is_some();
+        if !exited {
+            std::thread::sleep(std::time::Duration::from_millis(50));
+        }
+        exited
+    });
+    assert!(
+        reaped,
+        "quick command should exit and try_wait should reap it"
+    );
+    sbox.kill().expect("kill after try_wait reap is a no-op Ok");
+    sbox.kill().expect("repeat kill stays Ok");
+}
+
+#[test]
+fn streaming_double_kill_before_wait_completes_promptly() {
+    // Two `kill()` calls ahead of `wait()` must both return Ok, and the
+    // `wait()` that follows must finish promptly instead of hanging.
+    let mut sbox = spawn_sandbox(seatbelt_request("sleep 30", 0)).expect("spawn");
+    sbox.kill().expect("first kill");
+    sbox.kill().expect("second kill stays Ok");
+    let began = std::time::Instant::now();
+    let _ = sbox.wait();
+    assert!(
+        began.elapsed() < std::time::Duration::from_secs(5),
+        "wait() after a double kill should complete promptly, took {:?}",
+        began.elapsed()
+    );
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn streaming_stdout_closer_unblocks_parked_read_without_killing() {
+    use std::io::Read;
+
+    // `sleep` writes nothing but keeps its stdout pipe write-end open, so a read
+    // parks indefinitely (like a backgrounded descendant holding a pipe open
+    // after the foreground command exits). The stdout closer has to EOF that
+    // read promptly *without* terminating the still-running child; a plain
+    // `kill()` would defeat the point.
+    let mut proc = spawn_sandbox(seatbelt_request("sleep 30", 0)).expect("spawn");
+
+    let mut stdout = proc.take_stdout().expect("stdout available");
+    // Taking stdout first does not stop the closer from being handed out.
+    let closer = proc.stdout_closer().expect("stdout closer available");
+    assert!(
+        proc.stderr_closer().is_some(),
+        "stderr closer should also be available in pipes mode"
+    );
+
+    // Park a blocking read on a worker thread and time it; with the writer
+    // held open the read cannot return on its own.
+    let reader = std::thread::spawn(move || {
+        let mut buf = [0u8; 64];
+        let start = std::time::Instant::now();
+        let n = stdout.read(&mut buf).expect("read returns");
+        (n, start.elapsed())
+    });
+
+    // Give the read 200ms to park, check the child is still alive, then close.
+    std::thread::sleep(std::time::Duration::from_millis(200));
+    assert!(
+        proc.try_wait().expect("try_wait").is_none(),
+        "child should still be running while the read is parked"
+    );
+    closer.close();
+
+    let (n, elapsed) = reader.join().expect("reader thread");
+    assert_eq!(n, 0, "closed stream reports EOF");
+    assert!(
+        elapsed < std::time::Duration::from_secs(10),
+        "read should return promptly after close (elapsed: {elapsed:?})"
+    );
+
+    // Closing the stream must have left the child running.
+    assert!(
+        proc.try_wait().expect("try_wait").is_none(),
+        "stdout_closer must not terminate the child"
+    );
+
+    // Closing a second time is expected to be a harmless no-op.
+    closer.close();
+
+    proc.kill().expect("kill");
+    let _ = proc.wait();
+}
+
+// ---------------------------------------------------------------------------
+// Windows ProcessContainer streaming — integration test. Requires an elevated,
+// host-prepped Windows host (see docs/host-prep.md), so it is `#[ignore]`d.
+// ---------------------------------------------------------------------------
+
+#[cfg(target_os = "windows")]
+#[test]
+#[ignore = "requires an elevated, host-prepped Windows host (see docs/host-prep.md)"]
+fn streaming_processcontainer_bidirectional_stdio() {
+    use std::io::{Read, Write};
+
+    let policy = SandboxPolicy {
+        version: "0.7.0-alpha".to_string(),
+        filesystem: Some(mxc_sdk::policy::FilesystemSection {
+            readwrite_paths: vec!["C:\\Windows\\Temp".to_string()],
+            readonly_paths: vec![],
+            denied_paths: vec![],
+            clear_policy_on_exit: None,
+        }),
+        network: None,
+        ui: None,
+        timeout_ms: None,
+    };
+    let mut request = build_request(&policy, None).expect("build_request");
+    // `cmd /c more` copies stdin to stdout until EOF and then exits.
+    request.set_script("cmd /c more");
+    let mut sbox = spawn_sandbox(request).expect("spawn");
+
+    let mut input = sbox.take_stdin().expect("stdin available");
+    let mut output = sbox.take_stdout().expect("stdout available");
+
+    input.write_all(b"ping-pong\r\n").expect("write stdin");
+    drop(input);
+
+    let mut out = String::new();
+    output.read_to_string(&mut out).expect("read stdout");
+    assert!(out.contains("ping-pong"), "got: {:?}", out);
+
+    assert_eq!(sbox.wait().expect("wait"), WaitOutcome::Exited(0));
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn streaming_wait_discards_untaken_streams() {
+    let mut proc =
+        spawn_sandbox(seatbelt_request("echo streamed-out", 0)).expect("spawn should succeed");
+    // Take nothing -> wait() drains and discards the output, returning only
+    // the exit code.
+    assert_eq!(
+        proc.wait().expect("wait should succeed"),
+        WaitOutcome::Exited(0)
+    );
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn streaming_bidirectional_stdio() {
+    use std::io::{Read, Write};
+
+    // `cat` echoes stdin to stdout until EOF, then exits.
+    let mut proc = spawn_sandbox(seatbelt_request("cat", 0)).expect("spawn");
+
+    let mut stdin = proc.take_stdin().expect("stdin available");
+    let mut stdout = proc.take_stdout().expect("stdout available");
+
+    stdin.write_all(b"ping-pong\n").expect("write stdin");
+    drop(stdin); // close -> cat sees EOF and exits
+
+    let mut out = String::new();
+    stdout.read_to_string(&mut out).expect("read stdout");
+    assert!(out.contains("ping-pong"), "got: {:?}", out);
+
+    assert_eq!(proc.wait().expect("wait"), WaitOutcome::Exited(0));
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn streaming_kill_terminates_process() {
+    let mut proc = spawn_sandbox(seatbelt_request("sleep 30", 0)).expect("spawn");
+
+    // Still running shortly after spawn.
+    assert!(proc.try_wait().expect("try_wait").is_none());
+
+    proc.kill().expect("kill should succeed");
+
+    // After kill, the process must be reapable and not report success.
+    assert_ne!(
+        proc.wait().expect("wait after kill"),
+        WaitOutcome::Exited(0),
+        "killed process should not exit 0"
+    );
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn streaming_kill_terminates_forked_descendant_quickly() {
+    // Regression for the early-kill race: when the shell *forks* the inner
+    // command (`echo` then `sleep`), an early `kill()` could SIGTERM the shell
+    // (which dies) before the just-forked `sleep` joined the group — leaving
+    // `sleep` alive and the follow-up `wait()` blocking for its full runtime.
+    // The whole tree must die promptly regardless.
+    let mut proc = spawn_sandbox(seatbelt_request("echo hi; sleep 30", 0)).expect("spawn");
+
+    proc.kill().expect("kill should succeed");
+
+    let start = std::time::Instant::now();
+    let _ = proc.wait();
+    assert!(
+        start.elapsed() < std::time::Duration::from_secs(10),
+        "wait() must return promptly after kill(), not wait out the child's \
+         30s runtime (elapsed: {:?})",
+        start.elapsed()
+    );
+}
+
+#[cfg(target_os = "macos")]
+fn pid_alive(pid: u32) -> bool {
+    // Signal 0 probes existence without delivering anything (no `ps`, no PID-reuse race).
+    // SAFETY: `kill` only takes plain integers and touches no memory we own.
+    let probe = unsafe { libc::kill(pid as libc::pid_t, 0) };
+    match probe {
+        0 => true,
+        // Only ESRCH proves the pid is gone; any other errno (e.g. EPERM: the
+        // pid exists but we may not signal it) still counts as alive.
+        _ => std::io::Error::last_os_error().raw_os_error() != Some(libc::ESRCH),
+    }
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn streaming_kill_terminates_process_tree() {
+    use std::io::{BufRead, BufReader};
+
+    // The sandboxed shell backgrounds a `sleep` (a descendant), prints its
+    // pid, then blocks. `kill()` must take the whole process group down,
+    // including that descendant.
+    let mut proc =
+        spawn_sandbox(seatbelt_request("sleep 300 & echo CHILD=$!; sleep 300", 0)).expect("spawn");
+
+    assert!(proc.id() > 0, "id() should expose the child pid");
+
+    let stdout = proc.take_stdout().expect("stdout");
+    let mut reader = BufReader::new(stdout);
+    let mut line = String::new();
+    reader.read_line(&mut line).expect("read descendant pid");
+    let descendant: u32 = line
+        .trim()
+        .strip_prefix("CHILD=")
+        .expect("CHILD= prefix")
+        .parse()
+        .expect("descendant pid");
+
+    assert!(
+        pid_alive(descendant),
+        "descendant {descendant} should be running before kill"
+    );
+
+    proc.kill().expect("kill");
+    let _ = proc.wait();
+
+    let mut gone = false;
+    for _ in 0..60 {
+        if !pid_alive(descendant) {
+            gone = true;
+            break;
+        }
+        std::thread::sleep(std::time::Duration::from_millis(50));
+    }
+    assert!(
+        gone,
+        "descendant {descendant} should be killed with the process tree"
+    );
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn streaming_timeout_kills_process_tree() {
+    use std::io::{BufRead, BufReader};
+
+    // 1s timeout; the shell backgrounds a long sleep (descendant), prints its
+    // pid, then blocks past the timeout. wait()'s timeout branch must group-
+    // kill, taking the descendant down too.
+    let mut proc = spawn_sandbox(seatbelt_request(
+        "sleep 300 & echo CHILD=$!; sleep 300",
+        1000,
+    ))
+    .expect("spawn");
+
+    let stdout = proc.take_stdout().expect("stdout");
+    let mut reader = BufReader::new(stdout);
+    let mut line = String::new();
+    reader.read_line(&mut line).expect("read descendant pid");
+    let descendant: u32 = line
+        .trim()
+        .strip_prefix("CHILD=")
+        .expect("CHILD= prefix")
+        .parse()
+        .expect("descendant pid");
+
+    assert_eq!(
+        proc.wait().expect("wait yields an outcome"),
+        WaitOutcome::TimedOut,
+        "timed-out process should report a timeout"
+    );
+
+    let mut gone = false;
+    for _ in 0..60 {
+        if !pid_alive(descendant) {
+            gone = true;
+            break;
+        }
+        std::thread::sleep(std::time::Duration::from_millis(50));
+    }
+    assert!(gone, "descendant {descendant} should be killed on timeout");
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn streaming_wait_returns_when_descendant_holds_not_taken_stream_open() {
+    // The foreground command exits immediately, but a backgrounded `sleep`
+    // inherits and holds stdout's write end open. We take NOTHING, so `wait()`
+    // drains stdout/stderr itself; with no timeout (wait-forever) it must still
+    // return promptly once the foreground child exits — the held-open descendant
+    // pipe must not wedge the discard drain (cr-002 regression).
+    let mut proc =
+        spawn_sandbox(seatbelt_request("sleep 30 & exit 0", 0)).expect("spawn should succeed");
+
+    let start = std::time::Instant::now();
+    assert_eq!(
+        proc.wait().expect("wait should return"),
+        WaitOutcome::Exited(0),
+        "foreground command exits 0"
+    );
+    assert!(
+        start.elapsed() < std::time::Duration::from_secs(10),
+        "wait() must return promptly, not block on the descendant's 30s pipe hold \
+         (elapsed: {:?})",
+        start.elapsed()
+    );
+}
+
+#[cfg(target_os = "macos")]
+#[test]
+fn streaming_honors_sub_500ms_timeout() {
+    // A sub-500ms timeout used to be rejected outright; it must now be accepted
+    // and enforced (cr-011), and fire with low latency (cr-016). `sleep 30`
+    // exceeds it, so wait() reports a timeout promptly.
+    let mut proc = spawn_sandbox(seatbelt_request("sleep 30", 200)).expect("spawn");
+    let start = std::time::Instant::now();
+    assert_eq!(
+        proc.wait().expect("wait yields an outcome"),
+        WaitOutcome::TimedOut,
+        "sub-500ms timeout should fire"
+    );
+    assert!(
+        start.elapsed() < std::time::Duration::from_secs(5),
+        "timeout should fire near 200ms, not wait out the 30s sleep (elapsed: {:?})",
+        start.elapsed()
+    );
+}
diff --git a/src/core/wxc_common/src/config_parser.rs b/src/core/wxc_common/src/config_parser.rs
index 546662588..61278bd77 100644
--- a/src/core/wxc_common/src/config_parser.rs
+++ b/src/core/wxc_common/src/config_parser.rs
@@ -427,8 +427,34 @@ pub fn load_request_with_options(
     convert_raw_config_inner(raw, logger, true, opts.allow_missing_command)
 }
 
+/// Build a request from an already-parsed wire-format config [`Value`], running
+/// the same validation and wire→model mapping as [`load_request_with_options`]
+/// but without a base64 (or file) round-trip. For in-process callers (e.g. the
+/// `mxc` crate) that already hold the config as JSON and would otherwise pay to
+/// serialise → base64 → decode → re-parse it.
+///
+/// # Errors
+///
+/// Returns [`WxcError::ConfigParse`] (after logging a line) when `config` does
+/// not deserialize into the wire-format config; otherwise propagates whatever
+/// the shared conversion step returns.
+///
+/// [`Value`]: serde_json::Value
+pub fn load_request_from_value(
+    config: serde_json::Value,
+    logger: &mut Logger,
+    allow_missing_command: bool,
+) -> Result<ExecutionRequest, WxcError> {
+    let raw: RawConfig = serde_json::from_value(config).map_err(|e| {
+        logger.log_line("Error parsing JSON");
+        WxcError::ConfigParse(format!("JSON parse error: {}", e))
+    })?;
+
+    convert_raw_config_inner(raw, logger, true, allow_missing_command)
+}
+
 /// Loads a request and routes to the one-shot or state-aware path based on
 /// presence of the wire-format `phase` field. Errors are categorised so the
 /// driver can pick the right output convention per path (envelope on stdout
 /// for state-aware, diagnostic on stderr for one-shot and pre-discrimination
 /// failures).

From a5073b687cbe636f3c5ecdce6b067812a403e824 Mon Sep 17 00:00:00 2001
From: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
Date: Wed, 24 Jun 2026 11:41:21 -0300
Subject: [PATCH 4/9] feat(mxc-sdk): add Sandbox::wait_with_output to drain
 both streams safely

Taking both take_stdout() and take_stderr() and reading them sequentially
can deadlock an output-heavy child (one pipe fills while the reader is
blocked on the other). Add wait_with_output(): it consumes the handle,
drains stdout and stderr concurrently on separate threads, and returns
Output { outcome, stdout, stderr } -- the safe, convenient default,
mirroring std::process::Child::wait_with_output. Review CR-24.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
Signed-off-by: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
---
 .github/copilot-instructions.md     |  2 +-
 src/core/mxc-sdk/README.md          |  4 +++
 src/core/mxc-sdk/src/lib.rs         |  2 +-
 src/core/mxc-sdk/src/sandbox.rs     | 45 +++++++++++++++++++++++++++++
 src/core/mxc-sdk/tests/streaming.rs | 23 +++++++++++++++
 5 files changed, 74 insertions(+), 2 deletions(-)

diff --git a/.github/copilot-instructions.md b/.github/copilot-instructions.md
index 0bdfb55d9..3e8b020fd 100644
--- a/.github/copilot-instructions.md
+++ b/.github/copilot-instructions.md
@@ -182,7 +182,7 @@ The workspace is organized into five top-level directories under `src/`:
 - `wxc_common` is the **cross-platform foundation**: config parsing, models, errors, logger, `ScriptRunner` / `StatefulSandboxBackend` traits, state-aware dispatch helpers, validators, ids, ui-policy, encoding. Plus a few thin Windows API helpers shared by host tools and backends (`process_util`, `string_util`, `filesystem_dacl`, `diagnostic`). It must not depend on any `backends/*` crate.
 - Each Windows containment backend lives in its own `backends/*/common` crate (e.g. `appcontainer_common`, `windows_sandbox_common`, `isolation_session_common`, `hyperlight_common`, `nanvix_runner`). Backend crates depend on `wxc_common`; there are no cross-edges between backend crates.
 - `wxc` and `lxc` are thin binary crates that wire up CLI args (`clap`) and dispatch to `wxc_common` and the per-backend crates
-- `mxc-sdk` is an **importable library** for starting sandboxes in-process without a pty: `spawn_sandbox` takes a `SandboxRequest` (from `build_request`), selects the host backend, and returns a `Sandbox` handle for persistent bidirectional stdio (`take_stdin`/`take_stdout`/`take_stderr`), `kill()`, and `wait()` (which drains and discards any untaken stdout/stderr and returns a `WaitOutcome` — `Exited(i32)` or `TimedOut` — as `io::Result`, reserving `Err` for an actual OS/wait failure). It additionally ports the SDK's config-building surface so callers don't need the TypeScript module: `mxc_sdk::policy` (`SandboxPolicy` + `build_request` → `SandboxRequest` (opaque wrapper mapping to the internal `ExecutionRequest`), the port of `createConfigFromPolicy`; plus `available_tools_policy`/`user_profile_policy`/`temporary_files_policy` discovery helpers) and `mxc_sdk::platform_support` (port of `getPlatformSupport`, using the in-process probe on Windows). It depends on the backend crates (cfg-split: appcontainer on Windows, bubblewrap on Linux, seatbelt on macOS) — so it can't live in `wxc_common`. The public surface is deliberately minimal (streaming only): the `dispatch` and `platform` modules are private and only their used items are re-exported at the crate root (`platform_support`, `PlatformSupport`); `policy` is the one public submodule (callers name `mxc_sdk::policy::{SandboxPolicy sections}`). The execution surface lives in `wxc_common::sandbox_process`: the `SandboxBackend` trait (`validate` + `spawn(request, logger, StdioMode) -> Box<dyn SandboxProcess>` + a `diagnose_exit` hook for enriching launch-failure exits) and the generic `Runner<B>` adapter that bridges any `SandboxBackend` to the run-to-completion `ScriptRunner` (by calling `spawn(StdioMode::Inherit)` then `wait()`). 
`StdioMode::Pipes` hands the caller live stdin/stdout/stderr (what `mxc-sdk` uses); `StdioMode::Inherit` lets the child inherit the host process's own stdio (what the executor binaries use, preserving the TTY under a pty). `SandboxBackend` is implemented for every library backend — Seatbelt (macOS), Bubblewrap (Linux), and Windows ProcessContainer (AppContainer + BaseContainer). The `wxc`/`lxc`/`mxc_darwin` executor binaries do **not** depend on `mxc-sdk`; they keep their own backend dispatch (sharing only the lower-level `appcontainer_common::dispatcher::dispatch_with_fallback`). The `mxc-sdk` in-crate backend dispatch (`dispatch.rs`) and host probing (`platform.rs`) are **provisional** — a follow-up will move them into a dedicated `mxc` engine crate that both `mxc-sdk` and the executor binaries call into.
+- `mxc-sdk` is an **importable library** for starting sandboxes in-process without a pty: `spawn_sandbox` takes a `SandboxRequest` (from `build_request`), selects the host backend, and returns a `Sandbox` handle for persistent bidirectional stdio (`take_stdin`/`take_stdout`/`take_stderr`), `kill()`, and `wait()` (which drains and discards any untaken stdout/stderr and returns a `WaitOutcome` — `Exited(i32)` or `TimedOut` — as `io::Result`, reserving `Err` for an actual OS/wait failure), or `wait_with_output()` (consumes the handle, drains both streams concurrently, returns an `Output` with the `WaitOutcome` + captured `stdout`/`stderr`). It additionally ports the SDK's config-building surface so callers don't need the TypeScript module: `mxc_sdk::policy` (`SandboxPolicy` + `build_request` → `SandboxRequest` (opaque wrapper mapping to the internal `ExecutionRequest`), the port of `createConfigFromPolicy`; plus `available_tools_policy`/`user_profile_policy`/`temporary_files_policy` discovery helpers) and `mxc_sdk::platform_support` (port of `getPlatformSupport`, using the in-process probe on Windows). It depends on the backend crates (cfg-split: appcontainer on Windows, bubblewrap on Linux, seatbelt on macOS) — so it can't live in `wxc_common`. The public surface is deliberately minimal (streaming only): the `dispatch` and `platform` modules are private and only their used items are re-exported at the crate root (`platform_support`, `PlatformSupport`); `policy` is the one public submodule (callers name `mxc_sdk::policy::{SandboxPolicy sections}`). The execution surface lives in `wxc_common::sandbox_process`: the `SandboxBackend` trait (`validate` + `spawn(request, logger, StdioMode) -> Box<dyn SandboxProcess>` + a `diagnose_exit` hook for enriching launch-failure exits) and the generic `Runner<B>` adapter that bridges any `SandboxBackend` to the run-to-completion `ScriptRunner` (by calling `spawn(StdioMode::Inherit)` then `wait()`). 
`StdioMode::Pipes` hands the caller live stdin/stdout/stderr (what `mxc-sdk` uses); `StdioMode::Inherit` lets the child inherit the host process's own stdio (what the executor binaries use, preserving the TTY under a pty). `SandboxBackend` is implemented for every library backend — Seatbelt (macOS), Bubblewrap (Linux), and Windows ProcessContainer (AppContainer + BaseContainer). The `wxc`/`lxc`/`mxc_darwin` executor binaries do **not** depend on `mxc-sdk`; they keep their own backend dispatch (sharing only the lower-level `appcontainer_common::dispatcher::dispatch_with_fallback`). The `mxc-sdk` in-crate backend dispatch (`dispatch.rs`) and host probing (`platform.rs`) are **provisional** — a follow-up will move them into a dedicated `mxc` engine crate that both `mxc-sdk` and the executor binaries call into.
 - `mxc_pty` is the shared pty bridge used by the LXC backend (`lxc_common::lxc_bindings::attach_run`) so the inner shell sees a real TTY and host stdio is streamed live. (Seatbelt and Bubblewrap no longer use it: they spawn directly and let the child inherit the host's stdio — a TTY when the executor binary runs under a pty — via `SandboxBackend::spawn(StdioMode::Inherit)`.)
 - `mxc_build_common` is a build-time helper crate — all Windows binary crates use it in their `build.rs` to embed VersionInfo (ProductName, FileDescription, copyright, version+commit). When adding a new Windows binary crate, add `mxc_build_common` as a build-dependency and call `mxc_build_common::embed_version_info()` from `build.rs`
 - `nanvix_build_common` is a **build-only** helper crate (never linked into the runtime): it stages NanVix binaries next to the executable and resolves the `NANVIX_BIN` prefetch directory. The `nanvix_binaries`, `wxc`, and `lxc` build scripts consume it as a `[build-dependencies]` entry. Runtime constants it needs (binary/snapshot filenames) stay in `nanvix_common`. Keep build-only file-staging logic here, not in `nanvix_common` (which is a runtime dependency of `nanvix_runner`).
diff --git a/src/core/mxc-sdk/README.md b/src/core/mxc-sdk/README.md
index b438956d9..6c20c0709 100644
--- a/src/core/mxc-sdk/README.md
+++ b/src/core/mxc-sdk/README.md
@@ -100,6 +100,10 @@ The handle is modelled on [`std::process::Child`]:
   can't block on a full pipe, and returns a `WaitOutcome` —
   `Exited(code)` or `TimedOut` if the timeout elapses (`Err` is reserved for an
   actual OS/wait failure).
+- `wait_with_output()` consumes the handle and returns an `Output` with the
+  `WaitOutcome` plus the captured `stdout`/`stderr` — it drains both streams
+  concurrently for you, the safe alternative to `take_stdout()` + `take_stderr()`
+  (reading one to EOF before the other can deadlock an output-heavy child).
 - `stdout_closer()` / `stderr_closer()` → `Option<StreamCloser>`: a
   closer that makes an in-flight or subsequent read on the taken stream return
   EOF promptly **without** killing the child — for abandoning a stream a
diff --git a/src/core/mxc-sdk/src/lib.rs b/src/core/mxc-sdk/src/lib.rs
index 5ba317ef5..50490f054 100644
--- a/src/core/mxc-sdk/src/lib.rs
+++ b/src/core/mxc-sdk/src/lib.rs
@@ -58,7 +58,7 @@ pub use policy::{
 };
 
 pub use error::{Error, ErrorCode};
-pub use sandbox::{Sandbox, StreamCloser, WaitOutcome};
+pub use sandbox::{Output, Sandbox, StreamCloser, WaitOutcome};
 
 use wxc_common::logger::{Logger, Mode};
 
diff --git a/src/core/mxc-sdk/src/sandbox.rs b/src/core/mxc-sdk/src/sandbox.rs
index 5c47c834a..35d78b32c 100644
--- a/src/core/mxc-sdk/src/sandbox.rs
+++ b/src/core/mxc-sdk/src/sandbox.rs
@@ -24,6 +24,18 @@ pub enum WaitOutcome {
     TimedOut,
 }
 
+/// The captured result of running a [`Sandbox`] to completion via
+/// [`wait_with_output`](Sandbox::wait_with_output).
+#[derive(Debug, Clone, PartialEq)]
+pub struct Output {
+    /// How the process finished.
+    pub outcome: WaitOutcome,
+    /// Everything the child wrote to stdout.
+    pub stdout: Vec<u8>,
+    /// Everything the child wrote to stderr.
+    pub stderr: Vec<u8>,
+}
+
 /// A live sandboxed process, returned by [`spawn_sandbox`](crate::spawn_sandbox).
 ///
 /// Stream the child's stdio with the `take_*` accessors, wait for it, or kill
@@ -94,6 +106,46 @@ impl Sandbox {
             Err(e) => Err(e),
         }
     }
+
+    /// Wait for the child to exit, capturing its stdout and stderr.
+    ///
+    /// The safe alternative to [`take_stdout`](Self::take_stdout) +
+    /// [`take_stderr`](Self::take_stderr): it drains both streams **concurrently**
+    /// on separate threads, so an output-heavy child can't deadlock the way it can
+    /// when one stream is read to EOF before the other. Consumes the handle.
+    ///
+    /// `Err` is reserved for an actual OS / wait failure; a timeout is reported
+    /// as [`Output`] with `outcome: WaitOutcome::TimedOut` and whatever each
+    /// stream produced before the tree was killed.
+    ///
+    /// NOTE(review): each capture thread reads to EOF and is joined only after
+    /// `wait` returns, so a descendant that keeps a pipe's write end open
+    /// presumably holds this call up until it exits — confirm whether that is
+    /// intended, given that `wait` itself does not wedge on untaken streams.
+    pub fn wait_with_output(mut self) -> std::io::Result<Output> {
+        fn capture(stream: Option<Box<dyn Read + Send>>) -> std::thread::JoinHandle<Vec<u8>> {
+            std::thread::spawn(move || {
+                let mut buf = Vec::new();
+                if let Some(mut stream) = stream {
+                    // Best-effort: a read error is ignored and `buf` keeps what arrived before it.
+                    let _ = stream.read_to_end(&mut buf);
+                }
+                buf
+            })
+        }
+
+        // Take both streams before waiting so `wait` won't discard them, and
+        // read each on its own thread so the child never blocks on a full pipe.
+        let stdout = capture(self.inner.take_stdout());
+        let stderr = capture(self.inner.take_stderr());
+        let outcome = self.wait()?;
+        Ok(Output {
+            outcome,
+            // A capture thread that panicked contributes an empty buffer instead of failing.
+            stdout: stdout.join().unwrap_or_default(),
+            stderr: stderr.join().unwrap_or_default(),
+        })
+    }
 }
 
 /// Closes one of a [`Sandbox`]'s streams, unblocking a read parked on it without
diff --git a/src/core/mxc-sdk/tests/streaming.rs b/src/core/mxc-sdk/tests/streaming.rs
index da168739b..742b49c11 100644
--- a/src/core/mxc-sdk/tests/streaming.rs
+++ b/src/core/mxc-sdk/tests/streaming.rs
@@ -250,6 +250,29 @@ fn streaming_wait_discards_untaken_streams() {
     );
 }
 
+#[cfg(target_os = "macos")]
+#[test]
+fn streaming_wait_with_output_captures_both_streams() {
+    // wait_with_output drains stdout and stderr concurrently, so a child that
+    // writes to both is captured without the take-both deadlock foot-gun.
+    let proc = spawn_sandbox(seatbelt_request("echo to-out; echo to-err 1>&2", 0))
+        .expect("spawn should succeed");
+    let output = proc
+        .wait_with_output()
+        .expect("wait_with_output should succeed");
+    assert_eq!(output.outcome, WaitOutcome::Exited(0));
+    assert!(
+        String::from_utf8_lossy(&output.stdout).contains("to-out"),
+        "stdout: {:?}",
+        String::from_utf8_lossy(&output.stdout)
+    );
+    assert!(
+        String::from_utf8_lossy(&output.stderr).contains("to-err"),
+        "stderr: {:?}",
+        String::from_utf8_lossy(&output.stderr)
+    );
+}
+
 #[cfg(target_os = "macos")]
 #[test]
 fn streaming_bidirectional_stdio() {

From 34c36e2a101c4ad188ec5c57b8cc07d1d4d68737 Mon Sep 17 00:00:00 2001
From: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
Date: Wed, 24 Jun 2026 11:59:46 -0300
Subject: [PATCH 5/9] test(mxc-sdk): cover dispatch guard branches for
 unsupported containment/host

The streaming dispatch in `dispatch.rs` only had direct tests for the
`dry_run` and macOS `guiAccess` rejection branches. Add two more so the
remaining guardrails are exercised in CI:

- `streaming_rejects_unsupported_containment`: drives the internal model
  with `containment = Lxc` and asserts `UnsupportedContainment` plus the
  backend name in the message.
- `host_support_ok_on_supported_platforms`: cfg-gated to Windows / Linux /
  macOS, guards against the `ensure_host_supported` cfg list dropping a
  supported platform.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
Signed-off-by: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
---
 src/core/mxc-sdk/src/dispatch.rs | 29 ++++++++++++++++++++++++++++-
 1 file changed, 28 insertions(+), 1 deletion(-)

diff --git a/src/core/mxc-sdk/src/dispatch.rs b/src/core/mxc-sdk/src/dispatch.rs
index 607ec5758..7cacb9e4b 100644
--- a/src/core/mxc-sdk/src/dispatch.rs
+++ b/src/core/mxc-sdk/src/dispatch.rs
@@ -194,9 +194,10 @@ fn spawn_process_container(
 
 #[cfg(test)]
 mod tests {
-    use super::spawn_runner;
+    use super::{ensure_host_supported, spawn_runner};
     use crate::policy::{build_request, SandboxPolicy};
     use wxc_common::logger::{Logger, Mode};
+    use wxc_common::models::ContainmentBackend;
     use wxc_common::mxc_error::MxcErrorCode;
 
     fn minimal_policy() -> SandboxPolicy {
@@ -224,6 +225,32 @@ mod tests {
         assert_eq!(err.code, MxcErrorCode::MalformedRequest);
     }
 
+    #[test]
+    fn streaming_rejects_unsupported_containment() {
+        // LXC has no streaming path in the library; selecting it must surface a
+        // clear `UnsupportedContainment` rather than spawning. The public
+        // `SandboxRequest` can't choose a backend, so drive dispatch with the
+        // internal model.
+        let mut request = build_request(&minimal_policy(), None).expect("build_request");
+        request.inner.containment = ContainmentBackend::Lxc;
+        let mut logger = Logger::new(Mode::Buffer);
+        let err = match spawn_runner(&request.inner, &mut logger) {
+            Ok(_) => panic!("LXC must be rejected"),
+            Err(e) => e,
+        };
+        assert_eq!(err.code, MxcErrorCode::UnsupportedContainment);
+        assert!(err.message.contains("lxc"), "got: {}", err.message);
+    }
+
+    #[cfg(any(target_os = "windows", target_os = "linux", target_os = "macos"))]
+    #[test]
+    fn host_support_ok_on_supported_platforms() {
+        // The three platforms the library supports must all pass the host gate
+        // `spawn_runner` checks before backend selection; this guards against a
+        // regression in the `cfg` list dropping one of them.
+        assert!(ensure_host_supported().is_ok());
+    }
+
     #[cfg(target_os = "macos")]
     #[test]
     fn streaming_rejects_gui_access() {

From 085751e39a105d8912f95e7a340a4f5224869796 Mon Sep 17 00:00:00 2001
From: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
Date: Wed, 24 Jun 2026 12:56:56 -0300
Subject: [PATCH 6/9] feat(mxc-sdk): take structured (key, value) pairs in
 SandboxRequest::set_env

set_env(Vec<String>) made the caller hand-format raw KEY=VALUE strings,
which diverged from the SDK's env channel -- injectEnvIntoConfig
(sdk/src/sandbox.ts) takes a structured { key: value } map and joins it to
the KEY=VALUE wire form internally.

Accept (key, value) pairs instead and do the formatting in the setter, so
the crate matches the SDK surface and callers can't forget the '='. The wire
representation (Vec<String> of KEY=VALUE) is unchanged, and iteration order
is preserved so a later duplicate key still wins downstream -- same as the
SDK. No eager validation is added: the SDK doesn't validate either, and
structured input already removes the malformed-entry foot-gun.

Adds a unit test asserting the pair-to-KEY=VALUE ordered mapping.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
Signed-off-by: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
---
 src/core/mxc-sdk/src/policy.rs    | 39 ++++++++++++++++++++++++++++---
 src/core/mxc-sdk/tests/sandbox.rs |  2 +-
 2 files changed, 37 insertions(+), 4 deletions(-)

diff --git a/src/core/mxc-sdk/src/policy.rs b/src/core/mxc-sdk/src/policy.rs
index 0b36a556c..f5d0b69a1 100644
--- a/src/core/mxc-sdk/src/policy.rs
+++ b/src/core/mxc-sdk/src/policy.rs
@@ -558,9 +558,25 @@ impl SandboxRequest {
         self
     }
 
-    /// Set the child's environment as `KEY=VALUE` entries.
-    pub fn set_env(&mut self, env: Vec<String>) -> &mut Self {
-        self.inner.env = env;
+    /// Replace the child's environment with the given `(key, value)` pairs.
+    ///
+    /// Every pair is rendered as one `KEY=VALUE` entry, which is the wire form
+    /// the SDK's env channel emits too (`injectEnvIntoConfig` joins its
+    /// `{ key: value }` map the same way), keeping this crate and the SDK in
+    /// step. Entries keep their iteration order, so when a key repeats the
+    /// later entry wins, matching the SDK.
+    pub fn set_env<K, V>(&mut self, env: impl IntoIterator<Item = (K, V)>) -> &mut Self
+    where
+        K: Into<String>,
+        V: Into<String>,
+    {
+        let entries = env.into_iter().map(|(key, value)| {
+            let key: String = key.into();
+            let value: String = value.into();
+            format!("{key}={value}")
+        });
+        // Collected in iteration order; the previous env list is replaced.
+        self.inner.env = entries.collect();
         self
     }
 
@@ -973,6 +989,23 @@ mod tests {
         assert!(request.inner.script_code.is_empty());
     }
 
+    #[test]
+    fn set_env_formats_pairs_as_key_value_in_order() {
+        // The structured `(key, value)` setter mirrors the SDK env channel
+        // (`injectEnvIntoConfig`): each pair becomes a `KEY=VALUE` wire entry, in
+        // iteration order so a later duplicate key wins downstream.
+        let policy = SandboxPolicy {
+            version: "0.7.0-alpha".to_string(),
+            filesystem: None,
+            network: None,
+            ui: None,
+            timeout_ms: None,
+        };
+        let mut request = build_request(&policy, None).expect("build_request should succeed");
+        request.set_env([("FIRST", "1"), ("SECOND", "2")]);
+        assert_eq!(request.inner.env, vec!["FIRST=1", "SECOND=2"]);
+    }
+
     #[test]
     fn build_request_preserves_clipboard_policy() {
         use super::ClipboardPolicy as P;
diff --git a/src/core/mxc-sdk/tests/sandbox.rs b/src/core/mxc-sdk/tests/sandbox.rs
index 90aca5781..01c0e97a3 100644
--- a/src/core/mxc-sdk/tests/sandbox.rs
+++ b/src/core/mxc-sdk/tests/sandbox.rs
@@ -154,7 +154,7 @@ fn seatbelt_does_not_leak_host_environment() {
 fn seatbelt_env_reaches_sandboxed_process() {
     // An env entry set on the request must reach the sandboxed child.
     let mut request = seatbelt_request("echo $MXC_TEST_VAR", 10000);
-    request.set_env(vec!["MXC_TEST_VAR=injected-value".to_string()]);
+    request.set_env([("MXC_TEST_VAR", "injected-value")]);
 
     let result = spawn_and_wait(request).expect("seatbelt run should succeed");
 

From 0c9779e89da7f8c3e3927302e9d0ca307f96b8d4 Mon Sep 17 00:00:00 2001
From: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
Date: Wed, 24 Jun 2026 13:27:59 -0300
Subject: [PATCH 7/9] fix(wxc_common): set FD_CLOEXEC on the
 interruptible-reader wake pipe

The self-pipe used to wake `InterruptibleReader`'s `poll` was created with
`libc::pipe`, which does not set close-on-exec. Both wake fds would then leak
into any child the process later forks+execs (e.g. another sandbox child) and
keep the wake pipe alive unexpectedly. Mark both ends `FD_CLOEXEC` after
`pipe()`, mirroring the fixup `mxc_pty` already does for PTY fds. The data pipe
is unaffected -- Rust already sets CLOEXEC on `Child` stdio.

Addresses a Copilot review comment on #555.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
Signed-off-by: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
---
 .../wxc_common/src/interruptible_reader.rs    | 20 +++++++++++++++++++
 1 file changed, 20 insertions(+)

diff --git a/src/core/wxc_common/src/interruptible_reader.rs b/src/core/wxc_common/src/interruptible_reader.rs
index 1cc01bb11..78d6e0137 100644
--- a/src/core/wxc_common/src/interruptible_reader.rs
+++ b/src/core/wxc_common/src/interruptible_reader.rs
@@ -101,6 +101,12 @@ impl InterruptibleReader {
         // SAFETY: `pipe` succeeded, so both fds are freshly owned by us.
         let wake_r = unsafe { OwnedFd::from_raw_fd(fds[0]) };
         let wake_w = unsafe { OwnedFd::from_raw_fd(fds[1]) };
+        // `pipe(2)` doesn't set close-on-exec, so mark both ends `FD_CLOEXEC` —
+        // otherwise they leak into any child this process later forks+execs
+        // (e.g. another sandbox child). The data pipe is already CLOEXEC: Rust
+        // sets it on `Child` stdio.
+        set_cloexec(wake_r.as_raw_fd())?;
+        set_cloexec(wake_w.as_raw_fd())?;
         set_nonblocking(wake_w.as_raw_fd())?;
 
         Ok(Self {
@@ -214,6 +220,20 @@ fn set_nonblocking(fd: RawFd) -> io::Result<()> {
     Ok(())
 }
 
+/// Mark `fd` close-on-exec by OR-ing `FD_CLOEXEC` into its descriptor flags.
+fn set_cloexec(fd: RawFd) -> io::Result<()> {
+    // SAFETY: `fd` is a valid open fd; `F_GETFD` / `F_SETFD` only read and write
+    // its descriptor flags.
+    let current = unsafe { libc::fcntl(fd, libc::F_GETFD) };
+    if current < 0 {
+        return Err(io::Error::last_os_error());
+    }
+    match unsafe { libc::fcntl(fd, libc::F_SETFD, current | libc::FD_CLOEXEC) } {
+        rc if rc < 0 => Err(io::Error::last_os_error()),
+        _ => Ok(()),
+    }
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;

From bd9f28312945bcb7d644439970d47d13afdcc3c8 Mon Sep 17 00:00:00 2001
From: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
Date: Wed, 24 Jun 2026 13:27:59 -0300
Subject: [PATCH 8/9] fix(wxc_common): propagate non-benign group_kill signal
 errors

`group_kill` discarded both `kill(2)` results and always returned `Ok(())`, so
`SandboxProcess::kill()` reported success even when it never signalled the
process group. Route both signals through a `send_sigkill` helper that returns
the error instead, treating only the "already gone" outcomes as success:
`ESRCH`, and `EPERM` -- which on macOS a redundant kill of an exited-but-unreaped
child's group reports in place of `ESRCH` (observed via the double-kill test).
The caller guards with `try_wait()` first, so the pid/pgid can't be recycled and
`EPERM` here can only be that benign race, never a real permission failure.

Addresses a Copilot review comment on #556.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
Signed-off-by: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
---
 src/core/wxc_common/src/sandbox_process.rs | 25 ++++++++++++++++++----
 1 file changed, 21 insertions(+), 4 deletions(-)

diff --git a/src/core/wxc_common/src/sandbox_process.rs b/src/core/wxc_common/src/sandbox_process.rs
index 957507456..8449eacc2 100644
--- a/src/core/wxc_common/src/sandbox_process.rs
+++ b/src/core/wxc_common/src/sandbox_process.rs
@@ -245,12 +245,29 @@ pub fn cancel_and_join_discard<C: StreamCloser>(
 pub fn group_kill(child: &mut std::process::Child) -> std::io::Result<()> {
     // The child is unreaped, so its pid (== pgid) can't have been recycled.
     let pid = child.id() as i32;
+    let leader = send_sigkill(pid); // leader first
+    let group = send_sigkill(-pid); // then its group, even if the leader signal failed
+    leader.and(group) // surface the first failure, if any
+}
+
+/// Send `SIGKILL` to `target` (a pid, or a negative pgid), treating the
+/// "already gone" outcomes as success. The caller only invokes this on its own
+/// still-unreaped child (so the pid/pgid can't have been recycled), which leaves
+/// two benign errno values: `ESRCH` (no such process/group — already exited) and
+/// `EPERM`, which macOS reports instead of `ESRCH` for a redundant kill of an
+/// exited-but-not-yet-reaped child's group. Any other error is returned, so a
+/// genuinely failed signal isn't misreported as a successful kill.
+#[cfg(unix)]
+fn send_sigkill(target: i32) -> std::io::Result<()> {
     // SAFETY: `kill(2)` with a plain pid / negative pgid — just integers.
-    unsafe {
-        libc::kill(pid, libc::SIGKILL); // leader first
-        libc::kill(-pid, libc::SIGKILL); // then its group
+    if unsafe { libc::kill(target, libc::SIGKILL) } == 0 {
+        return Ok(());
+    }
+    let err = std::io::Error::last_os_error();
+    match err.raw_os_error() {
+        Some(libc::ESRCH) | Some(libc::EPERM) => Ok(()),
+        _ => Err(err),
     }
-    Ok(())
 }
 
 /// Outcome of [`wait_with_timeout`]: the child exited, the deadline passed, or

From c718c98153d3a2988b01065e91f37d852e36da9e Mon Sep 17 00:00:00 2001
From: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
Date: Wed, 24 Jun 2026 13:28:00 -0300
Subject: [PATCH 9/9] test(mxc-sdk): move the Windows streaming test out of the
 macOS-gated file

`tests/streaming.rs` is `#![cfg(target_os = "macos")]`, so the
`#[cfg(target_os = "windows")]` ProcessContainer streaming test it contained
could never compile -- the intended Windows coverage was silently missing.
Move that test into its own `tests/streaming_processcontainer.rs`, gated
`#![cfg(target_os = "windows")]`, so it actually builds on Windows.

Addresses a Copilot review comment on #556.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
Signed-off-by: Carlos Alexandro Becker <caarlos0@users.noreply.github.com>
---
 src/core/mxc-sdk/tests/streaming.rs           | 41 ----------------
 .../tests/streaming_processcontainer.rs       | 47 +++++++++++++++++++
 2 files changed, 47 insertions(+), 41 deletions(-)
 create mode 100644 src/core/mxc-sdk/tests/streaming_processcontainer.rs

diff --git a/src/core/mxc-sdk/tests/streaming.rs b/src/core/mxc-sdk/tests/streaming.rs
index 742b49c11..60668fd1a 100644
--- a/src/core/mxc-sdk/tests/streaming.rs
+++ b/src/core/mxc-sdk/tests/streaming.rs
@@ -196,47 +196,6 @@ fn streaming_stdout_closer_unblocks_parked_read_without_killing() {
     let _ = proc.wait();
 }
 
-// ---------------------------------------------------------------------------
-// Windows ProcessContainer streaming — integration test. Requires an elevated,
-// host-prepped Windows host (see docs/host-prep.md), so it is `#[ignore]`d.
-// ---------------------------------------------------------------------------
-
-#[cfg(target_os = "windows")]
-#[test]
-#[ignore = "requires an elevated, host-prepped Windows host (see docs/host-prep.md)"]
-fn streaming_processcontainer_bidirectional_stdio() {
-    use std::io::{Read, Write};
-
-    let policy = SandboxPolicy {
-        version: "0.7.0-alpha".to_string(),
-        filesystem: Some(mxc_sdk::policy::FilesystemSection {
-            readwrite_paths: vec!["C:\\Windows\\Temp".to_string()],
-            readonly_paths: vec![],
-            denied_paths: vec![],
-            clear_policy_on_exit: None,
-        }),
-        network: None,
-        ui: None,
-        timeout_ms: None,
-    };
-    let mut request = build_request(&policy, None).expect("build_request");
-    // `cmd /c more` echoes stdin to stdout until EOF, then exits.
-    request.set_script("cmd /c more");
-    let mut proc = spawn_sandbox(request).expect("spawn");
-
-    let mut stdin = proc.take_stdin().expect("stdin available");
-    let mut stdout = proc.take_stdout().expect("stdout available");
-
-    stdin.write_all(b"ping-pong\r\n").expect("write stdin");
-    drop(stdin);
-
-    let mut out = String::new();
-    stdout.read_to_string(&mut out).expect("read stdout");
-    assert!(out.contains("ping-pong"), "got: {:?}", out);
-
-    assert_eq!(proc.wait().expect("wait"), WaitOutcome::Exited(0));
-}
-
 #[cfg(target_os = "macos")]
 #[test]
 fn streaming_wait_discards_untaken_streams() {
diff --git a/src/core/mxc-sdk/tests/streaming_processcontainer.rs b/src/core/mxc-sdk/tests/streaming_processcontainer.rs
new file mode 100644
index 000000000..d7941ce19
--- /dev/null
+++ b/src/core/mxc-sdk/tests/streaming_processcontainer.rs
@@ -0,0 +1,47 @@
+// Copyright (c) Microsoft Corporation.
+// Licensed under the MIT License.
+
+//! Windows ProcessContainer streaming integration test, in its own
+//! Windows-gated file. The sibling `streaming.rs` is gated
+//! `#![cfg(target_os = "macos")]`, so a Windows-only test placed there is never
+//! compiled. Requires an elevated, host-prepped Windows host (see
+//! docs/host-prep.md), so it is `#[ignore]`d.
+
+#![cfg(target_os = "windows")]
+
+use mxc_sdk::{build_request, spawn_sandbox, SandboxPolicy, WaitOutcome};
+
+#[test]
+#[ignore = "requires an elevated, host-prepped Windows host (see docs/host-prep.md)"]
+fn streaming_processcontainer_bidirectional_stdio() {
+    use std::io::{Read, Write};
+
+    // The policy lists a single path, `C:\Windows\Temp`, as read-write.
+    let filesystem = mxc_sdk::policy::FilesystemSection {
+        readwrite_paths: vec!["C:\\Windows\\Temp".to_string()],
+        readonly_paths: vec![],
+        denied_paths: vec![],
+        clear_policy_on_exit: None,
+    };
+    let policy = SandboxPolicy {
+        version: "0.7.0-alpha".to_string(),
+        filesystem: Some(filesystem),
+        network: None,
+        ui: None,
+        timeout_ms: None,
+    };
+    let mut request = build_request(&policy, None).expect("build_request");
+    // `cmd /c more` echoes stdin to stdout until EOF, then exits.
+    request.set_script("cmd /c more");
+    let mut sandbox = spawn_sandbox(request).expect("spawn");
+
+    let mut child_stdin = sandbox.take_stdin().expect("stdin available");
+    let mut child_stdout = sandbox.take_stdout().expect("stdout available");
+    child_stdin.write_all(b"ping-pong\r\n").expect("write stdin");
+    drop(child_stdin);
+
+    let mut echoed = String::new();
+    child_stdout.read_to_string(&mut echoed).expect("read stdout");
+    assert!(echoed.contains("ping-pong"), "got: {:?}", echoed);
+    assert_eq!(sandbox.wait().expect("wait"), WaitOutcome::Exited(0));
+}