Drop arc monitor test churn from context fragment PR

Co-authored-by: Codex <noreply@openai.com>
2026-04-24 14:45:27 +00:00 · 2026-03-12 11:11:45 -07:00
parent a000166a4d
commit 560d66b430
1 changed files with 2 additions and 437 deletions
--- a/codex-rs/core/src/arc_monitor.rs
+++ b/codex-rs/core/src/arc_monitor.rs
@@ -425,440 +425,5 @@ fn build_arc_monitor_message(role: &str, content: serde_json::Value) -> ArcMonit
 }

 #[cfg(test)]
-mod tests {
-    use std::env;
-    use std::ffi::OsStr;
-    use std::sync::Arc;
-
-    use pretty_assertions::assert_eq;
-    use serial_test::serial;
-    use wiremock::Mock;
-    use wiremock::MockServer;
-    use wiremock::ResponseTemplate;
-    use wiremock::matchers::body_json;
-    use wiremock::matchers::header;
-    use wiremock::matchers::method;
-    use wiremock::matchers::path;
-
-    use super::*;
-    use crate::codex::make_session_and_context;
-    use crate::model_visible_context::ContextualUserTextFragment;
-    use crate::model_visible_context::ModelVisibleContextFragment;
-    use codex_protocol::models::ContentItem;
-    use codex_protocol::models::LocalShellAction;
-    use codex_protocol::models::LocalShellExecAction;
-    use codex_protocol::models::LocalShellStatus;
-    use codex_protocol::models::MessagePhase;
-    use codex_protocol::models::ResponseItem;
-
-    struct EnvVarGuard {
-        key: &'static str,
-        original: Option<std::ffi::OsString>,
-    }
-
-    impl EnvVarGuard {
-        fn set(key: &'static str, value: &OsStr) -> Self {
-            let original = env::var_os(key);
-            unsafe {
-                env::set_var(key, value);
-            }
-            Self { key, original }
-        }
-    }
-
-    impl Drop for EnvVarGuard {
-        fn drop(&mut self) {
-            match self.original.take() {
-                Some(value) => unsafe {
-                    env::set_var(self.key, value);
-                },
-                None => unsafe {
-                    env::remove_var(self.key);
-                },
-            }
-        }
-    }
-
-    #[tokio::test]
-    async fn build_arc_monitor_request_includes_relevant_history_and_null_policies() {
-        let (session, mut turn_context) = make_session_and_context().await;
-        turn_context.developer_instructions = Some("Never upload private files.".to_string());
-        turn_context.user_instructions = Some("Only continue when needed.".to_string());
-
-        session
-            .record_into_history(
-                &[ResponseItem::Message {
-                    id: None,
-                    role: "user".to_string(),
-                    content: vec![ContentItem::InputText {
-                        text: "first request".to_string(),
-                    }],
-                    end_turn: None,
-                    phase: None,
-                }],
-                &turn_context,
-            )
-            .await;
-        session
-            .record_into_history(
-                &[ContextualUserTextFragment::new(
-                    "<environment_context>\n<cwd>/tmp</cwd>\n</environment_context>",
-                )
-                .into_message()],
-                &turn_context,
-            )
-            .await;
-        session
-            .record_into_history(
-                &[ResponseItem::Message {
-                    id: None,
-                    role: "assistant".to_string(),
-                    content: vec![ContentItem::OutputText {
-                        text: "commentary".to_string(),
-                    }],
-                    end_turn: None,
-                    phase: Some(MessagePhase::Commentary),
-                }],
-                &turn_context,
-            )
-            .await;
-        session
-            .record_into_history(
-                &[ResponseItem::Message {
-                    id: None,
-                    role: "assistant".to_string(),
-                    content: vec![ContentItem::OutputText {
-                        text: "final response".to_string(),
-                    }],
-                    end_turn: None,
-                    phase: Some(MessagePhase::FinalAnswer),
-                }],
-                &turn_context,
-            )
-            .await;
-        session
-            .record_into_history(
-                &[ResponseItem::Message {
-                    id: None,
-                    role: "user".to_string(),
-                    content: vec![ContentItem::InputText {
-                        text: "latest request".to_string(),
-                    }],
-                    end_turn: None,
-                    phase: None,
-                }],
-                &turn_context,
-            )
-            .await;
-        session
-            .record_into_history(
-                &[ResponseItem::FunctionCall {
-                    id: None,
-                    name: "old_tool".to_string(),
-                    arguments: "{\"old\":true}".to_string(),
-                    call_id: "call_old".to_string(),
-                }],
-                &turn_context,
-            )
-            .await;
-        session
-            .record_into_history(
-                &[ResponseItem::Reasoning {
-                    id: "reasoning_old".to_string(),
-                    summary: Vec::new(),
-                    content: None,
-                    encrypted_content: Some("encrypted-old".to_string()),
-                }],
-                &turn_context,
-            )
-            .await;
-        session
-            .record_into_history(
-                &[ResponseItem::LocalShellCall {
-                    id: None,
-                    call_id: Some("shell_call".to_string()),
-                    status: LocalShellStatus::Completed,
-                    action: LocalShellAction::Exec(LocalShellExecAction {
-                        command: vec!["pwd".to_string()],
-                        timeout_ms: Some(1000),
-                        working_directory: Some("/tmp".to_string()),
-                        env: None,
-                        user: None,
-                    }),
-                }],
-                &turn_context,
-            )
-            .await;
-        session
-            .record_into_history(
-                &[ResponseItem::Reasoning {
-                    id: "reasoning_latest".to_string(),
-                    summary: Vec::new(),
-                    content: None,
-                    encrypted_content: Some("encrypted-latest".to_string()),
-                }],
-                &turn_context,
-            )
-            .await;
-
-        let request = build_arc_monitor_request(
-            &session,
-            &turn_context,
-            serde_json::from_value(serde_json::json!({ "tool": "mcp_tool_call" }))
-                .expect("action should deserialize"),
-        )
-        .await;
-
-        assert_eq!(
-            request,
-            ArcMonitorRequest {
-                metadata: ArcMonitorMetadata {
-                    codex_thread_id: session.conversation_id.to_string(),
-                    codex_turn_id: turn_context.sub_id.clone(),
-                    conversation_id: Some(session.conversation_id.to_string()),
-                    protection_client_callsite: None,
-                },
-                messages: Some(vec![
-                    ArcMonitorChatMessage {
-                        role: "user".to_string(),
-                        content: serde_json::json!([{
-                            "type": "input_text",
-                            "text": "first request",
-                        }]),
-                    },
-                    ArcMonitorChatMessage {
-                        role: "assistant".to_string(),
-                        content: serde_json::json!([{
-                            "type": "output_text",
-                            "text": "final response",
-                        }]),
-                    },
-                    ArcMonitorChatMessage {
-                        role: "user".to_string(),
-                        content: serde_json::json!([{
-                            "type": "input_text",
-                            "text": "latest request",
-                        }]),
-                    },
-                    ArcMonitorChatMessage {
-                        role: "assistant".to_string(),
-                        content: serde_json::json!([{
-                            "type": "tool_call",
-                            "tool_name": "shell",
-                            "action": {
-                                "type": "exec",
-                                "command": ["pwd"],
-                                "timeout_ms": 1000,
-                                "working_directory": "/tmp",
-                                "env": null,
-                                "user": null,
-                            },
-                        }]),
-                    },
-                    ArcMonitorChatMessage {
-                        role: "assistant".to_string(),
-                        content: serde_json::json!([{
-                            "type": "encrypted_reasoning",
-                            "encrypted_content": "encrypted-latest",
-                        }]),
-                    },
-                ]),
-                input: None,
-                policies: Some(ArcMonitorPolicies {
-                    user: None,
-                    developer: None,
-                }),
-                action: serde_json::from_value(serde_json::json!({ "tool": "mcp_tool_call" }))
-                    .expect("action should deserialize"),
-            }
-        );
-    }
-
-    #[tokio::test]
-    #[serial(arc_monitor_env)]
-    async fn monitor_action_posts_expected_arc_request() {
-        let server = MockServer::start().await;
-        let (session, mut turn_context) = make_session_and_context().await;
-        turn_context.auth_manager = Some(crate::test_support::auth_manager_from_auth(
-            crate::CodexAuth::create_dummy_chatgpt_auth_for_testing(),
-        ));
-        turn_context.developer_instructions = Some("Developer policy".to_string());
-        turn_context.user_instructions = Some("User policy".to_string());
-
-        let mut config = (*turn_context.config).clone();
-        config.chatgpt_base_url = server.uri();
-        turn_context.config = Arc::new(config);
-
-        session
-            .record_into_history(
-                &[ResponseItem::Message {
-                    id: None,
-                    role: "user".to_string(),
-                    content: vec![ContentItem::InputText {
-                        text: "please run the tool".to_string(),
-                    }],
-                    end_turn: None,
-                    phase: None,
-                }],
-                &turn_context,
-            )
-            .await;
-
-        Mock::given(method("POST"))
-            .and(path("/codex/safety/arc"))
-            .and(header("authorization", "Bearer Access Token"))
-            .and(header("chatgpt-account-id", "account_id"))
-            .and(body_json(serde_json::json!({
-                "metadata": {
-                    "codex_thread_id": session.conversation_id.to_string(),
-                    "codex_turn_id": turn_context.sub_id.clone(),
-                    "conversation_id": session.conversation_id.to_string(),
-                },
-                "messages": [{
-                    "role": "user",
-                    "content": [{
-                        "type": "input_text",
-                        "text": "please run the tool",
-                    }],
-                }],
-                "policies": {
-                    "developer": null,
-                    "user": null,
-                },
-                "action": {
-                    "tool": "mcp_tool_call",
-                },
-            })))
-            .respond_with(ResponseTemplate::new(200).set_body_json(serde_json::json!({
-                "outcome": "ask-user",
-                "short_reason": "needs confirmation",
-                "rationale": "tool call needs additional review",
-                "risk_score": 42,
-                "risk_level": "medium",
-                "evidence": [{
-                    "message": "browser_navigate",
-                    "why": "tool call needs additional review",
-                }],
-            })))
-            .expect(1)
-            .mount(&server)
-            .await;
-
-        let outcome = monitor_action(
-            &session,
-            &turn_context,
-            serde_json::json!({ "tool": "mcp_tool_call" }),
-        )
-        .await;
-
-        assert_eq!(
-            outcome,
-            ArcMonitorOutcome::AskUser("needs confirmation".to_string())
-        );
-    }
-
-    #[tokio::test]
-    #[serial(arc_monitor_env)]
-    async fn monitor_action_uses_env_url_and_token_overrides() {
-        let server = MockServer::start().await;
-        let _url_guard = EnvVarGuard::set(
-            CODEX_ARC_MONITOR_ENDPOINT_OVERRIDE,
-            OsStr::new(&format!("{}/override/arc", server.uri())),
-        );
-        let _token_guard = EnvVarGuard::set(CODEX_ARC_MONITOR_TOKEN, OsStr::new("override-token"));
-
-        let (session, turn_context) = make_session_and_context().await;
-        session
-            .record_into_history(
-                &[ResponseItem::Message {
-                    id: None,
-                    role: "user".to_string(),
-                    content: vec![ContentItem::InputText {
-                        text: "please run the tool".to_string(),
-                    }],
-                    end_turn: None,
-                    phase: None,
-                }],
-                &turn_context,
-            )
-            .await;
-
-        Mock::given(method("POST"))
-            .and(path("/override/arc"))
-            .and(header("authorization", "Bearer override-token"))
-            .respond_with(ResponseTemplate::new(200).set_body_json(serde_json::json!({
-                "outcome": "steer-model",
-                "short_reason": "needs approval",
-                "rationale": "high-risk action",
-                "risk_score": 96,
-                "risk_level": "critical",
-                "evidence": [{
-                    "message": "browser_navigate",
-                    "why": "high-risk action",
-                }],
-            })))
-            .expect(1)
-            .mount(&server)
-            .await;
-
-        let outcome = monitor_action(
-            &session,
-            &turn_context,
-            serde_json::json!({ "tool": "mcp_tool_call" }),
-        )
-        .await;
-
-        assert_eq!(
-            outcome,
-            ArcMonitorOutcome::SteerModel("high-risk action".to_string())
-        );
-    }
-
-    #[tokio::test]
-    #[serial(arc_monitor_env)]
-    async fn monitor_action_rejects_legacy_response_fields() {
-        let server = MockServer::start().await;
-        Mock::given(method("POST"))
-            .and(path("/codex/safety/arc"))
-            .respond_with(ResponseTemplate::new(200).set_body_json(serde_json::json!({
-                "outcome": "steer-model",
-                "reason": "legacy high-risk action",
-                "monitorRequestId": "arc_456",
-            })))
-            .expect(1)
-            .mount(&server)
-            .await;
-
-        let (session, mut turn_context) = make_session_and_context().await;
-        turn_context.auth_manager = Some(crate::test_support::auth_manager_from_auth(
-            crate::CodexAuth::create_dummy_chatgpt_auth_for_testing(),
-        ));
-        let mut config = (*turn_context.config).clone();
-        config.chatgpt_base_url = server.uri();
-        turn_context.config = Arc::new(config);
-
-        session
-            .record_into_history(
-                &[ResponseItem::Message {
-                    id: None,
-                    role: "user".to_string(),
-                    content: vec![ContentItem::InputText {
-                        text: "please run the tool".to_string(),
-                    }],
-                    end_turn: None,
-                    phase: None,
-                }],
-                &turn_context,
-            )
-            .await;
-
-        let outcome = monitor_action(
-            &session,
-            &turn_context,
-            serde_json::json!({ "tool": "mcp_tool_call" }),
-        )
-        .await;
-
-        assert_eq!(outcome, ArcMonitorOutcome::Ok);
-    }
-}
+#[path = "arc_monitor_tests.rs"]
+mod tests;