Add model-controlled truncation for code mode results (#14258)

Summary
- Document that `@openai/code_mode` exposes `set_max_output_tokens_per_exec_call` and that `code_mode` truncates the final Rust-side output when the budget is exceeded.
- Enforce the configured budget in the Rust tool runner, reusing truncation helpers so text-only outputs follow the unified-exec wrapper and mixed outputs still fit within the limit.
- Ensure the new behavior is covered by a code-mode integration test and string spec update.

Testing
- Not run (not requested).
2026-04-26 23:55:25 +00:00 · 2026-03-10 15:57:14 -07:00
parent ee8f84153e
commit 3d41ff0b77
5 changed files with 284 additions and 38 deletions
--- a/codex-rs/core/tests/suite/code_mode.rs
+++ b/codex-rs/core/tests/suite/code_mode.rs
@@ -4,6 +4,7 @@ use anyhow::Result;
 use codex_core::config::types::McpServerConfig;
 use codex_core::config::types::McpServerTransportConfig;
 use codex_core::features::Feature;
+use core_test_support::assert_regex_match;
 use core_test_support::responses;
 use core_test_support::responses::ResponseMock;
 use core_test_support::responses::ResponsesRequest;
@@ -175,6 +176,51 @@ add_content(JSON.stringify(await exec_command({ cmd: "printf code_mode_exec_mark
    Ok(())
 }

+#[cfg_attr(windows, ignore = "no exec_command on Windows")]
+#[tokio::test(flavor = "multi_thread", worker_threads = 2)]
+async fn code_mode_can_truncate_final_result_with_configured_budget() -> Result<()> {
+    skip_if_no_network!(Ok(()));
+
+    let server = responses::start_mock_server().await;
+    let (_test, second_mock) = run_code_mode_turn(
+        &server,
+        "use code_mode to truncate the final result",
+        r#"
+import { exec_command } from "tools.js";
+import { set_max_output_tokens_per_exec_call } from "@openai/code_mode";
+
+set_max_output_tokens_per_exec_call(6);
+
+add_content(JSON.stringify(await exec_command({
+  cmd: "printf 'token one token two token three token four token five token six token seven'",
+  max_output_tokens: 100
+})));
+"#,
+        false,
+    )
+    .await?;
+
+    let req = second_mock.single_request();
+    let (output, success) = custom_tool_output_text_and_success(&req, "call-1");
+    assert_ne!(
+        success,
+        Some(false),
+        "code_mode call failed unexpectedly: {output}"
+    );
+    let expected_pattern = r#"(?sx)
+\A
+Original\ token\ count:\ \d+\n
+Output:\n
+Total\ output\ lines:\ 1\n
+\n
+\{"chunk_id".*…\d+\ tokens\ truncated….*
+\z
+"#;
+    assert_regex_match(expected_pattern, &output);
+
+    Ok(())
+}
+
 #[tokio::test(flavor = "multi_thread", worker_threads = 2)]
 async fn code_mode_can_apply_patch_via_nested_tool() -> Result<()> {
    skip_if_no_network!(Ok(()));