feat(linux-sandbox): vendor bubblewrap and wire it with FFI (#10413)

## Summary Vendor Bubblewrap into the repo and add minimal build plumbing in `codex-linux-sandbox` to compile/link it. ## Why We want to move Linux sandboxing toward Bubblewrap, but in a safe two-step rollout: 1) vendoring/build setup (this PR), 2) runtime integration (follow-up PR). ## Included - Add `codex-rs/vendor/bubblewrap` sources. - Add build-time FFI path in `codex-rs/linux-sandbox`. - Update `build.rs` rerun tracking for vendored files. - Small vendored compile warning fix (`sockaddr_nl` full init). follow up in https://github.com/openai/codex/pull/9938
2026-04-29 19:03:02 +03:00 · 2026-02-02 23:33:46 -08:00
parent 53d8474061
commit f956cc2a02
57 changed files with 11261 additions and 6 deletions
--- a/codex-rs/linux-sandbox/src/bwrap.rs
+++ b/codex-rs/linux-sandbox/src/bwrap.rs
@@ -0,0 +1,291 @@
+//! Bubblewrap-based filesystem sandboxing for Linux.
+//!
+//! This module mirrors the semantics used by the macOS Seatbelt sandbox:
+//! - the filesystem is read-only by default,
+//! - explicit writable roots are layered on top, and
+//! - sensitive subpaths such as `.git` and `.codex` remain read-only even when
+//!   their parent root is writable.
+//!
+//! The overall Linux sandbox is composed of:
+//! - seccomp + `PR_SET_NO_NEW_PRIVS` applied in-process, and
+//! - bubblewrap used to construct the filesystem view before exec.
+use std::collections::BTreeSet;
+use std::path::Path;
+use std::path::PathBuf;
+
+use codex_core::error::CodexErr;
+use codex_core::error::Result;
+use codex_core::protocol::SandboxPolicy;
+use codex_core::protocol::WritableRoot;
+
+/// Options that control how bubblewrap is invoked.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub(crate) struct BwrapOptions {
+    /// Whether to mount a fresh `/proc` inside the PID namespace.
+    ///
+    /// This is the secure default, but some restrictive container environments
+    /// deny `--proc /proc` even when PID namespaces are available.
+    pub mount_proc: bool,
+}
+
+impl Default for BwrapOptions {
+    fn default() -> Self {
+        Self { mount_proc: true }
+    }
+}
+
+/// Wrap a command with bubblewrap so the filesystem is read-only by default,
+/// with explicit writable roots and read-only subpaths layered afterward.
+///
+/// When the policy grants full disk write access, this returns `command`
+/// unchanged so we avoid unnecessary sandboxing overhead.
+pub(crate) fn create_bwrap_command_args(
+    command: Vec<String>,
+    sandbox_policy: &SandboxPolicy,
+    cwd: &Path,
+    options: BwrapOptions,
+    bwrap_path: Option<&Path>,
+) -> Result<Vec<String>> {
+    if sandbox_policy.has_full_disk_write_access() {
+        return Ok(command);
+    }
+
+    let bwrap_path = match bwrap_path {
+        Some(path) => {
+            if path.exists() {
+                path.to_path_buf()
+            } else {
+                return Err(CodexErr::UnsupportedOperation(format!(
+                    "bubblewrap (bwrap) not found at configured path: {}",
+                    path.display()
+                )));
+            }
+        }
+        None => which::which("bwrap").map_err(|err| {
+            CodexErr::UnsupportedOperation(format!("bubblewrap (bwrap) not found on PATH: {err}"))
+        })?,
+    };
+
+    let mut args = Vec::new();
+    args.push(path_to_string(&bwrap_path));
+    args.extend(create_bwrap_flags(command, sandbox_policy, cwd, options)?);
+    Ok(args)
+}
+
+/// Doc-hidden helper that builds bubblewrap arguments without a program path.
+///
+/// This is intended for experiments where we call a build-time bubblewrap
+/// `main` symbol via FFI rather than exec'ing the `bwrap` binary. The caller
+/// is responsible for providing a suitable `argv[0]`.
+#[doc(hidden)]
+pub(crate) fn create_bwrap_command_args_vendored(
+    command: Vec<String>,
+    sandbox_policy: &SandboxPolicy,
+    cwd: &Path,
+    options: BwrapOptions,
+) -> Result<Vec<String>> {
+    if sandbox_policy.has_full_disk_write_access() {
+        return Ok(command);
+    }
+
+    create_bwrap_flags(command, sandbox_policy, cwd, options)
+}
+
+/// Build the bubblewrap flags (everything after `argv[0]`).
+fn create_bwrap_flags(
+    command: Vec<String>,
+    sandbox_policy: &SandboxPolicy,
+    cwd: &Path,
+    options: BwrapOptions,
+) -> Result<Vec<String>> {
+    let mut args = Vec::new();
+    args.push("--new-session".to_string());
+    args.push("--die-with-parent".to_string());
+    args.extend(create_filesystem_args(sandbox_policy, cwd)?);
+    // Isolate the PID namespace.
+    args.push("--unshare-pid".to_string());
+    // Mount a fresh /proc unless the caller explicitly disables it.
+    if options.mount_proc {
+        args.push("--proc".to_string());
+        args.push("/proc".to_string());
+    }
+    args.push("--".to_string());
+    args.extend(command);
+    Ok(args)
+}
+
+/// Build the bubblewrap filesystem mounts for a given sandbox policy.
+///
+/// The mount order is important:
+/// 1. `--ro-bind / /` makes the entire filesystem read-only.
+/// 2. `--bind <root> <root>` re-enables writes for allowed roots.
+/// 3. `--ro-bind <subpath> <subpath>` re-applies read-only protections under
+///    those writable roots so protected subpaths win.
+/// 4. `--dev-bind /dev/null /dev/null` preserves the common sink even under a
+///    read-only root.
+fn create_filesystem_args(sandbox_policy: &SandboxPolicy, cwd: &Path) -> Result<Vec<String>> {
+    let writable_roots = sandbox_policy.get_writable_roots_with_cwd(cwd);
+    ensure_mount_targets_exist(&writable_roots)?;
+
+    let mut args = Vec::new();
+
+    // Read-only root, then selectively re-enable writes.
+    args.push("--ro-bind".to_string());
+    args.push("/".to_string());
+    args.push("/".to_string());
+
+    for writable_root in &writable_roots {
+        let root = writable_root.root.as_path();
+        args.push("--bind".to_string());
+        args.push(path_to_string(root));
+        args.push(path_to_string(root));
+    }
+
+    // Re-apply read-only subpaths after the writable binds so they win.
+    let allowed_write_paths: Vec<PathBuf> = writable_roots
+        .iter()
+        .map(|writable_root| writable_root.root.as_path().to_path_buf())
+        .collect();
+
+    for subpath in collect_read_only_subpaths(&writable_roots) {
+        if let Some(symlink_path) = find_symlink_in_path(&subpath, &allowed_write_paths) {
+            args.push("--ro-bind".to_string());
+            args.push("/dev/null".to_string());
+            args.push(path_to_string(&symlink_path));
+            continue;
+        }
+
+        if !subpath.exists() {
+            if let Some(first_missing) = find_first_non_existent_component(&subpath)
+                && is_within_allowed_write_paths(&first_missing, &allowed_write_paths)
+            {
+                args.push("--ro-bind".to_string());
+                args.push("/dev/null".to_string());
+                args.push(path_to_string(&first_missing));
+            }
+            continue;
+        }
+
+        if is_within_allowed_write_paths(&subpath, &allowed_write_paths) {
+            args.push("--ro-bind".to_string());
+            args.push(path_to_string(&subpath));
+            args.push(path_to_string(&subpath));
+        }
+    }
+
+    // Ensure `/dev/null` remains usable regardless of the root bind.
+    args.push("--dev-bind".to_string());
+    args.push("/dev/null".to_string());
+    args.push("/dev/null".to_string());
+
+    Ok(args)
+}
+
+/// Collect unique read-only subpaths across all writable roots.
+fn collect_read_only_subpaths(writable_roots: &[WritableRoot]) -> Vec<PathBuf> {
+    let mut subpaths: BTreeSet<PathBuf> = BTreeSet::new();
+    for writable_root in writable_roots {
+        for subpath in &writable_root.read_only_subpaths {
+            subpaths.insert(subpath.as_path().to_path_buf());
+        }
+    }
+    subpaths.into_iter().collect()
+}
+
+/// Validate that writable roots exist before constructing mounts.
+///
+/// Bubblewrap requires bind mount targets to exist. We fail fast with a clear
+/// error so callers can present an actionable message.
+fn ensure_mount_targets_exist(writable_roots: &[WritableRoot]) -> Result<()> {
+    for writable_root in writable_roots {
+        let root = writable_root.root.as_path();
+        if !root.exists() {
+            return Err(CodexErr::UnsupportedOperation(format!(
+                "Sandbox expected writable root {root}, but it does not exist.",
+                root = root.display()
+            )));
+        }
+    }
+    Ok(())
+}
+
+fn path_to_string(path: &Path) -> String {
+    path.to_string_lossy().to_string()
+}
+
+/// Returns true when `path` is under any allowed writable root.
+fn is_within_allowed_write_paths(path: &Path, allowed_write_paths: &[PathBuf]) -> bool {
+    allowed_write_paths
+        .iter()
+        .any(|root| path.starts_with(root))
+}
+
+/// Find the first symlink along `target_path` that is also under a writable root.
+///
+/// This blocks symlink replacement attacks where a protected path is a symlink
+/// inside a writable root (e.g., `.codex -> ./decoy`). In that case we mount
+/// `/dev/null` on the symlink itself to prevent rewiring it.
+fn find_symlink_in_path(target_path: &Path, allowed_write_paths: &[PathBuf]) -> Option<PathBuf> {
+    let mut current = PathBuf::new();
+
+    for component in target_path.components() {
+        use std::path::Component;
+        match component {
+            Component::RootDir => {
+                current.push(Path::new("/"));
+                continue;
+            }
+            Component::CurDir => continue,
+            Component::ParentDir => {
+                current.pop();
+                continue;
+            }
+            Component::Normal(part) => current.push(part),
+            Component::Prefix(_) => continue,
+        }
+
+        let metadata = match std::fs::symlink_metadata(&current) {
+            Ok(metadata) => metadata,
+            Err(_) => break,
+        };
+
+        if metadata.file_type().is_symlink()
+            && is_within_allowed_write_paths(&current, allowed_write_paths)
+        {
+            return Some(current);
+        }
+    }
+
+    None
+}
+
+/// Find the first missing path component while walking `target_path`.
+///
+/// Mounting `/dev/null` on the first missing component prevents the sandboxed
+/// process from creating the protected path hierarchy.
+fn find_first_non_existent_component(target_path: &Path) -> Option<PathBuf> {
+    let mut current = PathBuf::new();
+
+    for component in target_path.components() {
+        use std::path::Component;
+        match component {
+            Component::RootDir => {
+                current.push(Path::new("/"));
+                continue;
+            }
+            Component::CurDir => continue,
+            Component::ParentDir => {
+                current.pop();
+                continue;
+            }
+            Component::Normal(part) => current.push(part),
+            Component::Prefix(_) => continue,
+        }
+
+        if !current.exists() {
+            return Some(current);
+        }
+    }
+
+    None
+}