mirror of
https://github.com/openai/codex.git
synced 2026-05-01 09:56:37 +00:00
## What is flaky The Windows shell-driven integration tests in `codex-rs/core` were intermittently unstable, especially: - `apply_patch_cli_can_use_shell_command_output_as_patch_input` - `websocket_test_codex_shell_chain` - `websocket_v2_test_codex_shell_chain` ## Why it was flaky These tests were exercising real shell-tool flows through whichever shell Codex selected on Windows, and the `apply_patch` test also nested a PowerShell read inside `cmd /c`. There were multiple independent sources of nondeterminism in that setup: - The test harness depended on the model-selected Windows shell instead of pinning the shell it actually meant to exercise. - `cmd.exe /c powershell.exe -Command "..."` is quoting-sensitive; on CI that could leave the read command wrapped as a literal string instead of executing it. - Even after getting the quoting right, PowerShell could emit CLIXML progress records like module-initialization output onto stdout. - The `apply_patch` test was building a patch directly from shell stdout, so any quoting artifact or progress noise corrupted the patch input. So the failures were driven by shell startup and output-shape variance, not by the `apply_patch` or websocket logic themselves. ## How this PR fixes it - Add a test-only `user_shell_override` path so Windows integration tests can pin `cmd.exe` explicitly. - Use that override in the websocket shell-chain tests and in the `apply_patch` harness. - Change the nested Windows file read in `apply_patch_cli_can_use_shell_command_output_as_patch_input` to a UTF-8 PowerShell `-EncodedCommand` script. - Run that nested PowerShell process with `-NonInteractive`, set `$ProgressPreference = 'SilentlyContinue'`, and read the file with `[System.IO.File]::ReadAllText(...)`. ## Why this fix fixes the flakiness The outer harness now runs under a deterministic shell, and the inner PowerShell read no longer depends on fragile `cmd` quoting or on progress output staying quiet by accident. The shell tool returns only the file contents, so patch construction and websocket assertions depend on stable test inputs instead of on runner-specific shell behavior. --------- Co-authored-by: Ahmed Ibrahim <219906144+aibrahim-oai@users.noreply.github.com> Co-authored-by: Codex <noreply@openai.com>
641 lines
20 KiB
Rust
641 lines
20 KiB
Rust
use std::mem::swap;
|
|
use std::path::Path;
|
|
use std::path::PathBuf;
|
|
use std::sync::Arc;
|
|
|
|
use anyhow::Context;
|
|
use anyhow::Result;
|
|
use codex_core::CodexAuth;
|
|
use codex_core::CodexThread;
|
|
use codex_core::ModelProviderInfo;
|
|
use codex_core::ThreadManager;
|
|
use codex_core::built_in_model_providers;
|
|
use codex_core::config::Config;
|
|
use codex_core::features::Feature;
|
|
use codex_core::models_manager::collaboration_mode_presets::CollaborationModesConfig;
|
|
use codex_core::shell::Shell;
|
|
use codex_core::shell::get_shell_by_model_provided_path;
|
|
use codex_protocol::config_types::ServiceTier;
|
|
use codex_protocol::openai_models::ModelsResponse;
|
|
use codex_protocol::protocol::AskForApproval;
|
|
use codex_protocol::protocol::EventMsg;
|
|
use codex_protocol::protocol::Op;
|
|
use codex_protocol::protocol::SandboxPolicy;
|
|
use codex_protocol::protocol::SessionConfiguredEvent;
|
|
use codex_protocol::protocol::SessionSource;
|
|
use codex_protocol::user_input::UserInput;
|
|
use serde_json::Value;
|
|
use tempfile::TempDir;
|
|
use wiremock::MockServer;
|
|
|
|
use crate::load_default_config_for_test;
|
|
use crate::responses::WebSocketTestServer;
|
|
use crate::responses::output_value_to_text;
|
|
use crate::responses::start_mock_server;
|
|
use crate::streaming_sse::StreamingSseServer;
|
|
use crate::wait_for_event;
|
|
use crate::wait_for_event_match;
|
|
use wiremock::Match;
|
|
use wiremock::matchers::path_regex;
|
|
|
|
type ConfigMutator = dyn FnOnce(&mut Config) + Send;
|
|
type PreBuildHook = dyn FnOnce(&Path) + Send + 'static;
|
|
const TEST_MODEL_WITH_EXPERIMENTAL_TOOLS: &str = "test-gpt-5.1-codex";
|
|
|
|
/// A collection of different ways the model can output an apply_patch call
|
|
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash)]
|
|
pub enum ApplyPatchModelOutput {
|
|
Freeform,
|
|
Function,
|
|
Shell,
|
|
ShellViaHeredoc,
|
|
ShellCommandViaHeredoc,
|
|
}
|
|
|
|
/// A collection of different ways the model can output an apply_patch call
|
|
#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash)]
|
|
pub enum ShellModelOutput {
|
|
Shell,
|
|
ShellCommand,
|
|
LocalShell,
|
|
// UnifiedExec has its own set of tests
|
|
}
|
|
|
|
pub struct TestCodexBuilder {
|
|
config_mutators: Vec<Box<ConfigMutator>>,
|
|
auth: CodexAuth,
|
|
pre_build_hooks: Vec<Box<PreBuildHook>>,
|
|
home: Option<Arc<TempDir>>,
|
|
user_shell_override: Option<Shell>,
|
|
}
|
|
|
|
impl TestCodexBuilder {
|
|
pub fn with_config<T>(mut self, mutator: T) -> Self
|
|
where
|
|
T: FnOnce(&mut Config) + Send + 'static,
|
|
{
|
|
self.config_mutators.push(Box::new(mutator));
|
|
self
|
|
}
|
|
|
|
pub fn with_auth(mut self, auth: CodexAuth) -> Self {
|
|
self.auth = auth;
|
|
self
|
|
}
|
|
|
|
pub fn with_model(self, model: &str) -> Self {
|
|
let new_model = model.to_string();
|
|
self.with_config(move |config| {
|
|
config.model = Some(new_model.clone());
|
|
})
|
|
}
|
|
|
|
pub fn with_pre_build_hook<F>(mut self, hook: F) -> Self
|
|
where
|
|
F: FnOnce(&Path) + Send + 'static,
|
|
{
|
|
self.pre_build_hooks.push(Box::new(hook));
|
|
self
|
|
}
|
|
|
|
pub fn with_home(mut self, home: Arc<TempDir>) -> Self {
|
|
self.home = Some(home);
|
|
self
|
|
}
|
|
|
|
pub fn with_user_shell(mut self, user_shell: Shell) -> Self {
|
|
self.user_shell_override = Some(user_shell);
|
|
self
|
|
}
|
|
|
|
pub fn with_windows_cmd_shell(self) -> Self {
|
|
if cfg!(windows) {
|
|
self.with_user_shell(get_shell_by_model_provided_path(&PathBuf::from("cmd.exe")))
|
|
} else {
|
|
self
|
|
}
|
|
}
|
|
|
|
pub async fn build(&mut self, server: &wiremock::MockServer) -> anyhow::Result<TestCodex> {
|
|
let home = match self.home.clone() {
|
|
Some(home) => home,
|
|
None => Arc::new(TempDir::new()?),
|
|
};
|
|
Box::pin(self.build_with_home(server, home, /*resume_from*/ None)).await
|
|
}
|
|
|
|
pub async fn build_with_streaming_server(
|
|
&mut self,
|
|
server: &StreamingSseServer,
|
|
) -> anyhow::Result<TestCodex> {
|
|
let base_url = server.uri();
|
|
let home = match self.home.clone() {
|
|
Some(home) => home,
|
|
None => Arc::new(TempDir::new()?),
|
|
};
|
|
Box::pin(self.build_with_home_and_base_url(
|
|
format!("{base_url}/v1"),
|
|
home,
|
|
/*resume_from*/ None,
|
|
))
|
|
.await
|
|
}
|
|
|
|
pub async fn build_with_websocket_server(
|
|
&mut self,
|
|
server: &WebSocketTestServer,
|
|
) -> anyhow::Result<TestCodex> {
|
|
let base_url = format!("{}/v1", server.uri());
|
|
let home = match self.home.clone() {
|
|
Some(home) => home,
|
|
None => Arc::new(TempDir::new()?),
|
|
};
|
|
let base_url_clone = base_url.clone();
|
|
self.config_mutators.push(Box::new(move |config| {
|
|
config.model_provider.base_url = Some(base_url_clone);
|
|
config.experimental_realtime_ws_model = Some("realtime-test-model".to_string());
|
|
config
|
|
.features
|
|
.enable(Feature::ResponsesWebsockets)
|
|
.expect("test config should allow feature update");
|
|
}));
|
|
Box::pin(self.build_with_home_and_base_url(base_url, home, /*resume_from*/ None)).await
|
|
}
|
|
|
|
pub async fn resume(
|
|
&mut self,
|
|
server: &wiremock::MockServer,
|
|
home: Arc<TempDir>,
|
|
rollout_path: PathBuf,
|
|
) -> anyhow::Result<TestCodex> {
|
|
Box::pin(self.build_with_home(server, home, Some(rollout_path))).await
|
|
}
|
|
|
|
async fn build_with_home(
|
|
&mut self,
|
|
server: &wiremock::MockServer,
|
|
home: Arc<TempDir>,
|
|
resume_from: Option<PathBuf>,
|
|
) -> anyhow::Result<TestCodex> {
|
|
let base_url = format!("{}/v1", server.uri());
|
|
let (config, cwd) = self.prepare_config(base_url, &home).await?;
|
|
Box::pin(self.build_from_config(config, cwd, home, resume_from)).await
|
|
}
|
|
|
|
async fn build_with_home_and_base_url(
|
|
&mut self,
|
|
base_url: String,
|
|
home: Arc<TempDir>,
|
|
resume_from: Option<PathBuf>,
|
|
) -> anyhow::Result<TestCodex> {
|
|
let (config, cwd) = self.prepare_config(base_url, &home).await?;
|
|
Box::pin(self.build_from_config(config, cwd, home, resume_from)).await
|
|
}
|
|
|
|
async fn build_from_config(
|
|
&mut self,
|
|
config: Config,
|
|
cwd: Arc<TempDir>,
|
|
home: Arc<TempDir>,
|
|
resume_from: Option<PathBuf>,
|
|
) -> anyhow::Result<TestCodex> {
|
|
let auth = self.auth.clone();
|
|
let thread_manager = if config.model_catalog.is_some() {
|
|
ThreadManager::new(
|
|
&config,
|
|
codex_core::test_support::auth_manager_from_auth(auth.clone()),
|
|
SessionSource::Exec,
|
|
CollaborationModesConfig::default(),
|
|
)
|
|
} else {
|
|
codex_core::test_support::thread_manager_with_models_provider_and_home(
|
|
auth.clone(),
|
|
config.model_provider.clone(),
|
|
config.codex_home.clone(),
|
|
)
|
|
};
|
|
let thread_manager = Arc::new(thread_manager);
|
|
let user_shell_override = self.user_shell_override.clone();
|
|
|
|
let new_conversation = match (resume_from, user_shell_override) {
|
|
(Some(path), Some(user_shell_override)) => {
|
|
let auth_manager = codex_core::test_support::auth_manager_from_auth(auth);
|
|
Box::pin(
|
|
codex_core::test_support::resume_thread_from_rollout_with_user_shell_override(
|
|
thread_manager.as_ref(),
|
|
config.clone(),
|
|
path,
|
|
auth_manager,
|
|
user_shell_override,
|
|
),
|
|
)
|
|
.await?
|
|
}
|
|
(Some(path), None) => {
|
|
let auth_manager = codex_core::test_support::auth_manager_from_auth(auth);
|
|
Box::pin(thread_manager.resume_thread_from_rollout(
|
|
config.clone(),
|
|
path,
|
|
auth_manager,
|
|
/*parent_trace*/ None,
|
|
))
|
|
.await?
|
|
}
|
|
(None, Some(user_shell_override)) => {
|
|
Box::pin(
|
|
codex_core::test_support::start_thread_with_user_shell_override(
|
|
thread_manager.as_ref(),
|
|
config.clone(),
|
|
user_shell_override,
|
|
),
|
|
)
|
|
.await?
|
|
}
|
|
(None, None) => Box::pin(thread_manager.start_thread(config.clone())).await?,
|
|
};
|
|
|
|
Ok(TestCodex {
|
|
home,
|
|
cwd,
|
|
config,
|
|
codex: new_conversation.thread,
|
|
session_configured: new_conversation.session_configured,
|
|
thread_manager,
|
|
})
|
|
}
|
|
|
|
async fn prepare_config(
|
|
&mut self,
|
|
base_url: String,
|
|
home: &TempDir,
|
|
) -> anyhow::Result<(Config, Arc<TempDir>)> {
|
|
let model_provider = ModelProviderInfo {
|
|
base_url: Some(base_url),
|
|
..built_in_model_providers(/*openai_base_url*/ None)["openai"].clone()
|
|
};
|
|
let cwd = Arc::new(TempDir::new()?);
|
|
let mut config = load_default_config_for_test(home).await;
|
|
config.cwd = cwd.path().to_path_buf();
|
|
config.model_provider = model_provider;
|
|
for hook in self.pre_build_hooks.drain(..) {
|
|
hook(home.path());
|
|
}
|
|
if let Ok(path) = codex_utils_cargo_bin::cargo_bin("codex") {
|
|
config.codex_linux_sandbox_exe = Some(path);
|
|
} else if let Ok(exe) = std::env::current_exe()
|
|
&& let Some(path) = exe
|
|
.parent()
|
|
.and_then(|parent| parent.parent())
|
|
.map(|parent| parent.join("codex"))
|
|
&& path.is_file()
|
|
{
|
|
config.codex_linux_sandbox_exe = Some(path);
|
|
}
|
|
|
|
let mut mutators = vec![];
|
|
swap(&mut self.config_mutators, &mut mutators);
|
|
for mutator in mutators {
|
|
mutator(&mut config);
|
|
}
|
|
ensure_test_model_catalog(&mut config)?;
|
|
|
|
if config.include_apply_patch_tool {
|
|
config.features.enable(Feature::ApplyPatchFreeform)?;
|
|
} else {
|
|
config.features.disable(Feature::ApplyPatchFreeform)?;
|
|
}
|
|
|
|
Ok((config, cwd))
|
|
}
|
|
}
|
|
|
|
fn ensure_test_model_catalog(config: &mut Config) -> Result<()> {
|
|
if config.model.as_deref() != Some(TEST_MODEL_WITH_EXPERIMENTAL_TOOLS)
|
|
|| config.model_catalog.is_some()
|
|
{
|
|
return Ok(());
|
|
}
|
|
|
|
let bundled_models_path = codex_utils_cargo_bin::find_resource!("../../models.json")
|
|
.context("bundled models.json")?;
|
|
let bundled_models_contents =
|
|
std::fs::read_to_string(&bundled_models_path).with_context(|| {
|
|
format!(
|
|
"read bundled models.json from {}",
|
|
bundled_models_path.display()
|
|
)
|
|
})?;
|
|
let bundled_models: ModelsResponse =
|
|
serde_json::from_str(&bundled_models_contents).context("parse bundled models.json")?;
|
|
let mut model = bundled_models
|
|
.models
|
|
.iter()
|
|
.find(|candidate| candidate.slug == "gpt-5.1-codex")
|
|
.cloned()
|
|
.unwrap_or_else(|| panic!("missing bundled model gpt-5.1-codex"));
|
|
model.slug = TEST_MODEL_WITH_EXPERIMENTAL_TOOLS.to_string();
|
|
model.display_name = TEST_MODEL_WITH_EXPERIMENTAL_TOOLS.to_string();
|
|
model.experimental_supported_tools = vec![
|
|
"test_sync_tool".to_string(),
|
|
"read_file".to_string(),
|
|
"grep_files".to_string(),
|
|
"list_dir".to_string(),
|
|
];
|
|
config.model_catalog = Some(ModelsResponse {
|
|
models: vec![model],
|
|
});
|
|
Ok(())
|
|
}
|
|
|
|
pub struct TestCodex {
|
|
pub home: Arc<TempDir>,
|
|
pub cwd: Arc<TempDir>,
|
|
pub codex: Arc<CodexThread>,
|
|
pub session_configured: SessionConfiguredEvent,
|
|
pub config: Config,
|
|
pub thread_manager: Arc<ThreadManager>,
|
|
}
|
|
|
|
impl TestCodex {
|
|
pub fn cwd_path(&self) -> &Path {
|
|
self.cwd.path()
|
|
}
|
|
|
|
pub fn codex_home_path(&self) -> &Path {
|
|
self.config.codex_home.as_path()
|
|
}
|
|
|
|
pub fn workspace_path(&self, rel: impl AsRef<Path>) -> PathBuf {
|
|
self.cwd_path().join(rel)
|
|
}
|
|
|
|
pub async fn submit_turn(&self, prompt: &str) -> Result<()> {
|
|
self.submit_turn_with_policies(
|
|
prompt,
|
|
AskForApproval::Never,
|
|
SandboxPolicy::DangerFullAccess,
|
|
)
|
|
.await
|
|
}
|
|
|
|
pub async fn submit_turn_with_policy(
|
|
&self,
|
|
prompt: &str,
|
|
sandbox_policy: SandboxPolicy,
|
|
) -> Result<()> {
|
|
self.submit_turn_with_policies(prompt, AskForApproval::Never, sandbox_policy)
|
|
.await
|
|
}
|
|
|
|
pub async fn submit_turn_with_service_tier(
|
|
&self,
|
|
prompt: &str,
|
|
service_tier: Option<ServiceTier>,
|
|
) -> Result<()> {
|
|
self.submit_turn_with_context(
|
|
prompt,
|
|
AskForApproval::Never,
|
|
SandboxPolicy::DangerFullAccess,
|
|
Some(service_tier),
|
|
)
|
|
.await
|
|
}
|
|
|
|
pub async fn submit_turn_with_policies(
|
|
&self,
|
|
prompt: &str,
|
|
approval_policy: AskForApproval,
|
|
sandbox_policy: SandboxPolicy,
|
|
) -> Result<()> {
|
|
self.submit_turn_with_context(
|
|
prompt,
|
|
approval_policy,
|
|
sandbox_policy,
|
|
/*service_tier*/ None,
|
|
)
|
|
.await
|
|
}
|
|
|
|
async fn submit_turn_with_context(
|
|
&self,
|
|
prompt: &str,
|
|
approval_policy: AskForApproval,
|
|
sandbox_policy: SandboxPolicy,
|
|
service_tier: Option<Option<ServiceTier>>,
|
|
) -> Result<()> {
|
|
let session_model = self.session_configured.model.clone();
|
|
self.codex
|
|
.submit(Op::UserTurn {
|
|
items: vec![UserInput::Text {
|
|
text: prompt.into(),
|
|
text_elements: Vec::new(),
|
|
}],
|
|
final_output_json_schema: None,
|
|
cwd: self.cwd.path().to_path_buf(),
|
|
approval_policy,
|
|
sandbox_policy,
|
|
model: session_model,
|
|
effort: None,
|
|
summary: None,
|
|
service_tier,
|
|
collaboration_mode: None,
|
|
personality: None,
|
|
})
|
|
.await?;
|
|
|
|
let turn_id = wait_for_event_match(&self.codex, |event| match event {
|
|
EventMsg::TurnStarted(event) => Some(event.turn_id.clone()),
|
|
_ => None,
|
|
})
|
|
.await;
|
|
wait_for_event(&self.codex, |event| match event {
|
|
EventMsg::TurnComplete(event) => event.turn_id == turn_id,
|
|
_ => false,
|
|
})
|
|
.await;
|
|
Ok(())
|
|
}
|
|
}
|
|
|
|
pub struct TestCodexHarness {
|
|
server: MockServer,
|
|
test: TestCodex,
|
|
}
|
|
|
|
impl TestCodexHarness {
|
|
pub async fn new() -> Result<Self> {
|
|
Self::with_builder(test_codex()).await
|
|
}
|
|
|
|
pub async fn with_config(mutator: impl FnOnce(&mut Config) + Send + 'static) -> Result<Self> {
|
|
Self::with_builder(test_codex().with_config(mutator)).await
|
|
}
|
|
|
|
pub async fn with_builder(mut builder: TestCodexBuilder) -> Result<Self> {
|
|
let server = start_mock_server().await;
|
|
let test = builder.build(&server).await?;
|
|
Ok(Self { server, test })
|
|
}
|
|
|
|
pub fn server(&self) -> &MockServer {
|
|
&self.server
|
|
}
|
|
|
|
pub fn test(&self) -> &TestCodex {
|
|
&self.test
|
|
}
|
|
|
|
pub fn cwd(&self) -> &Path {
|
|
self.test.cwd_path()
|
|
}
|
|
|
|
pub fn path(&self, rel: impl AsRef<Path>) -> PathBuf {
|
|
self.test.workspace_path(rel)
|
|
}
|
|
|
|
pub async fn submit(&self, prompt: &str) -> Result<()> {
|
|
self.test.submit_turn(prompt).await
|
|
}
|
|
|
|
pub async fn submit_with_policy(
|
|
&self,
|
|
prompt: &str,
|
|
sandbox_policy: SandboxPolicy,
|
|
) -> Result<()> {
|
|
self.test
|
|
.submit_turn_with_policy(prompt, sandbox_policy)
|
|
.await
|
|
}
|
|
|
|
pub async fn request_bodies(&self) -> Vec<Value> {
|
|
let path_matcher = path_regex(".*/responses$");
|
|
self.server
|
|
.received_requests()
|
|
.await
|
|
.expect("mock server should not fail")
|
|
.into_iter()
|
|
.filter(|req| path_matcher.matches(req))
|
|
.map(|req| {
|
|
req.body_json::<Value>()
|
|
.expect("request body to be valid JSON")
|
|
})
|
|
.collect()
|
|
}
|
|
|
|
pub async fn function_call_output_value(&self, call_id: &str) -> Value {
|
|
let bodies = self.request_bodies().await;
|
|
function_call_output(&bodies, call_id).clone()
|
|
}
|
|
|
|
pub async fn function_call_stdout(&self, call_id: &str) -> String {
|
|
self.function_call_output_value(call_id)
|
|
.await
|
|
.get("output")
|
|
.and_then(Value::as_str)
|
|
.expect("output string")
|
|
.to_string()
|
|
}
|
|
|
|
pub async fn custom_tool_call_output(&self, call_id: &str) -> String {
|
|
let bodies = self.request_bodies().await;
|
|
custom_tool_call_output_text(&bodies, call_id)
|
|
}
|
|
|
|
pub async fn apply_patch_output(
|
|
&self,
|
|
call_id: &str,
|
|
output_type: ApplyPatchModelOutput,
|
|
) -> String {
|
|
match output_type {
|
|
ApplyPatchModelOutput::Freeform => self.custom_tool_call_output(call_id).await,
|
|
ApplyPatchModelOutput::Function
|
|
| ApplyPatchModelOutput::Shell
|
|
| ApplyPatchModelOutput::ShellViaHeredoc
|
|
| ApplyPatchModelOutput::ShellCommandViaHeredoc => {
|
|
self.function_call_stdout(call_id).await
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
fn custom_tool_call_output<'a>(bodies: &'a [Value], call_id: &str) -> &'a Value {
|
|
for body in bodies {
|
|
if let Some(items) = body.get("input").and_then(Value::as_array) {
|
|
for item in items {
|
|
if item.get("type").and_then(Value::as_str) == Some("custom_tool_call_output")
|
|
&& item.get("call_id").and_then(Value::as_str) == Some(call_id)
|
|
{
|
|
return item;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
panic!("custom_tool_call_output {call_id} not found");
|
|
}
|
|
|
|
fn custom_tool_call_output_text(bodies: &[Value], call_id: &str) -> String {
|
|
let output = custom_tool_call_output(bodies, call_id)
|
|
.get("output")
|
|
.unwrap_or_else(|| panic!("custom_tool_call_output {call_id} missing output"));
|
|
output_value_to_text(output)
|
|
.unwrap_or_else(|| panic!("custom_tool_call_output {call_id} missing text output"))
|
|
}
|
|
|
|
fn function_call_output<'a>(bodies: &'a [Value], call_id: &str) -> &'a Value {
|
|
for body in bodies {
|
|
if let Some(items) = body.get("input").and_then(Value::as_array) {
|
|
for item in items {
|
|
if item.get("type").and_then(Value::as_str) == Some("function_call_output")
|
|
&& item.get("call_id").and_then(Value::as_str) == Some(call_id)
|
|
{
|
|
return item;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
panic!("function_call_output {call_id} not found");
|
|
}
|
|
|
|
pub fn test_codex() -> TestCodexBuilder {
|
|
TestCodexBuilder {
|
|
config_mutators: vec![],
|
|
auth: CodexAuth::from_api_key("dummy"),
|
|
pre_build_hooks: vec![],
|
|
home: None,
|
|
user_shell_override: None,
|
|
}
|
|
}
|
|
|
|
#[cfg(test)]
|
|
mod tests {
|
|
use super::*;
|
|
use pretty_assertions::assert_eq;
|
|
use serde_json::json;
|
|
|
|
#[test]
|
|
fn custom_tool_call_output_text_returns_output_text() {
|
|
let bodies = vec![json!({
|
|
"input": [{
|
|
"type": "custom_tool_call_output",
|
|
"call_id": "call-1",
|
|
"output": "hello"
|
|
}]
|
|
})];
|
|
|
|
assert_eq!(custom_tool_call_output_text(&bodies, "call-1"), "hello");
|
|
}
|
|
|
|
#[test]
|
|
#[should_panic(expected = "custom_tool_call_output call-2 missing output")]
|
|
fn custom_tool_call_output_text_panics_when_output_is_missing() {
|
|
let bodies = vec![json!({
|
|
"input": [{
|
|
"type": "custom_tool_call_output",
|
|
"call_id": "call-2"
|
|
}]
|
|
})];
|
|
|
|
let _ = custom_tool_call_output_text(&bodies, "call-2");
|
|
}
|
|
}
|