Stabilize exec-server filesystem tests in CI (#17671)

## Summary
- add an exec-server package-local test helper binary that can run exec-server and fs-helper flows
- route exec-server filesystem tests through that helper instead of cross-crate codex helper binaries
- stop relying on Bazel-only extra binary wiring for these tests

## Testing
- not run (per repo guidance for codex changes)

---------

Co-authored-by: Codex <noreply@openai.com>
2026-04-27 08:05:51 +00:00 · 2026-04-13 16:53:42 -07:00
parent d4be06adea
commit 280a4a6d42
16 changed files with 674 additions and 111 deletions
--- a/codex-rs/core/tests/common/test_codex.rs
+++ b/codex-rs/core/tests/common/test_codex.rs
@@ -175,12 +175,18 @@ fn start_remote_exec_server(remote_env: &RemoteEnvConfig) -> Result<RemoteExecSe
    let container_name = remote_env.container_name.as_str();
    let instance_id = remote_exec_server_instance_id();
    let remote_exec_server_path = format!("/tmp/codex-{instance_id}");
+    let remote_linux_sandbox_path = format!("/tmp/codex-linux-sandbox-{instance_id}");
    let stdout_path = format!("/tmp/codex-exec-server-{instance_id}.stdout");
    let local_binary = codex_utils_cargo_bin::cargo_bin("codex").context("resolve codex binary")?;
+    let local_linux_sandbox = codex_utils_cargo_bin::cargo_bin("codex-linux-sandbox")
+        .context("resolve codex-linux-sandbox binary")?;
    let local_binary = local_binary.to_string_lossy().to_string();
+    let local_linux_sandbox = local_linux_sandbox.to_string_lossy().to_string();
    let remote_binary = format!("{container_name}:{remote_exec_server_path}");
+    let remote_linux_sandbox = format!("{container_name}:{remote_linux_sandbox_path}");

    docker_command_success(["cp", &local_binary, &remote_binary])?;
+    docker_command_success(["cp", &local_linux_sandbox, &remote_linux_sandbox])?;
    docker_command_success([
        "exec",
        container_name,
@@ -188,6 +194,14 @@ fn start_remote_exec_server(remote_env: &RemoteEnvConfig) -> Result<RemoteExecSe
        "+x",
        &remote_exec_server_path,
    ])?;
+    docker_command_success([
+        "exec",
+        container_name,
+        "chmod",
+        "+x",
+        &remote_linux_sandbox_path,
+    ])?;
+    probe_remote_linux_sandbox(container_name, &remote_linux_sandbox_path)?;

    let start_script = format!(
        "rm -f {stdout_path}; \
@@ -209,12 +223,32 @@ echo $!"
            pid,
            remote_exec_server_path,
            stdout_path,
-            cleanup_paths: Vec::new(),
+            cleanup_paths: vec![remote_linux_sandbox_path],
        },
        listen_url,
    })
 }

+/// Smoke-tests the linux sandbox binary located at `remote_linux_sandbox_path`
+/// inside the Docker container `container_name`.
+///
+/// The probe asks the sandbox binary to run `/bin/true` through
+/// `docker exec <container> sh -lc ...`, passing the JSON-serialized policy from
+/// `SandboxPolicy::new_read_only_policy()` and `/tmp` as the policy cwd.
+///
+/// # Errors
+///
+/// Returns an error if the policy cannot be serialized, if the `docker` command
+/// cannot be run, or if the probe exits unsuccessfully; in the last case the
+/// error message carries the trimmed stdout and stderr of the probe.
+fn probe_remote_linux_sandbox(container_name: &str, remote_linux_sandbox_path: &str) -> Result<()> {
+    let policy = serde_json::to_string(&SandboxPolicy::new_read_only_policy())
+        .context("serialize remote sandbox probe policy")?;
+    // The policy JSON is wrapped in single quotes so the shell inside the
+    // container hands it to the sandbox binary as one argument.
+    let command_line = format!(
+        "{remote_linux_sandbox_path} --sandbox-policy-cwd /tmp --sandbox-policy '{policy}' -- /bin/true"
+    );
+    let docker_args = ["exec", container_name, "sh", "-lc", command_line.as_str()];
+
+    let probe = Command::new("docker")
+        .args(docker_args)
+        .output()
+        .with_context(|| format!("probe remote linux sandbox in container `{container_name}`"))?;
+    if probe.status.success() {
+        return Ok(());
+    }
+
+    // Surface whatever the probe printed so a failing sandbox is diagnosable.
+    let stdout = String::from_utf8_lossy(&probe.stdout);
+    let stderr = String::from_utf8_lossy(&probe.stderr);
+    Err(anyhow!(
+        "remote linux sandbox probe failed in container `{container_name}`: stdout={} stderr={}",
+        stdout.trim(),
+        stderr.trim()
+    ))
+}
+
 fn remote_aware_cwd_path() -> AbsolutePathBuf {
    PathBuf::from(format!(
        "/tmp/codex-core-test-cwd-{}",