feat(app-server): API proposal for better thread loading performance

2026-05-04 03:16:31 +00:00 · 2026-04-30 16:59:12 -07:00
parent 6014b6679f
commit 0aec5b61ef
7 changed files with 292 additions and 12 deletions
--- a/codex-rs/app-server-protocol/src/protocol/common.rs
+++ b/codex-rs/app-server-protocol/src/protocol/common.rs
@@ -570,6 +570,18 @@ client_request_definitions! {
        serialization: None,
        response: v2::ThreadTurnsListResponse,
    },
+    ThreadItemsList => "thread/items/list" {
+        params: v2::ThreadItemsListParams,
+        // Explicitly concurrent: this primarily reads append-only rollout storage.
+        serialization: None,
+        response: v2::ThreadItemsListResponse,
+    },
+    ThreadItemContentRead => "thread/item/content/read" {
+        params: v2::ThreadItemContentReadParams,
+        // Explicitly concurrent: this reads deferred item content without mutating the thread.
+        serialization: None,
+        response: v2::ThreadItemContentReadResponse,
+    },
    /// Append raw Responses API items to the thread history without starting a user turn.
    ThreadInjectItems => "thread/inject_items" {
        params: v2::ThreadInjectItemsParams,
--- a/codex-rs/app-server-protocol/src/protocol/thread_history.rs
+++ b/codex-rs/app-server-protocol/src/protocol/thread_history.rs
@@ -10,6 +10,7 @@ use crate::protocol::v2::CollabAgentToolCallStatus;
 use crate::protocol::v2::CommandExecutionStatus;
 use crate::protocol::v2::DynamicToolCallOutputContentItem;
 use crate::protocol::v2::DynamicToolCallStatus;
+use crate::protocol::v2::ImageGenerationContent;
 use crate::protocol::v2::McpToolCallError;
 use crate::protocol::v2::McpToolCallResult;
 use crate::protocol::v2::McpToolCallStatus;
@@ -17,6 +18,7 @@ use crate::protocol::v2::ThreadItem;
 use crate::protocol::v2::Turn;
 use crate::protocol::v2::TurnError as V2TurnError;
 use crate::protocol::v2::TurnError;
+use crate::protocol::v2::TurnItemsView;
 use crate::protocol::v2::TurnStatus;
 use crate::protocol::v2::UserInput;
 use crate::protocol::v2::WebSearchAction;
@@ -580,6 +582,9 @@ impl ThreadHistoryBuilder {
            id: payload.call_id.clone(),
            status: String::new(),
            revised_prompt: None,
+            content: ImageGenerationContent::Unavailable {
+                reason: "image generation has not completed".to_string(),
+            },
            result: String::new(),
            saved_path: None,
        };
@@ -591,6 +596,11 @@ impl ThreadHistoryBuilder {
            id: payload.call_id.clone(),
            status: payload.status.clone(),
            revised_prompt: payload.revised_prompt.clone(),
+            content: ImageGenerationContent::Inline {
+                data_base64: payload.result.clone(),
+                mime_type: None,
+                byte_length: None,
+            },
            result: payload.result.clone(),
            saved_path: payload.saved_path.clone(),
        };
@@ -1160,6 +1170,7 @@ impl From<PendingTurn> for Turn {
    fn from(value: PendingTurn) -> Self {
        Self {
            id: value.id,
+            items_view: TurnItemsView::Full,
            items: value.items,
            error: value.error,
            status: value.status,
@@ -1174,6 +1185,7 @@ impl From<&PendingTurn> for Turn {
    fn from(value: &PendingTurn) -> Self {
        Self {
            id: value.id.clone(),
+            items_view: TurnItemsView::Full,
            items: value.items.clone(),
            error: value.error.clone(),
            status: value.status.clone(),
@@ -1442,6 +1454,7 @@ mod tests {
            turns[0],
            Turn {
                id: "turn-image".into(),
+                items_view: TurnItemsView::Full,
                status: TurnStatus::Completed,
                error: None,
                started_at: None,
@@ -1459,6 +1472,11 @@ mod tests {
                        id: "ig_123".into(),
                        status: "completed".into(),
                        revised_prompt: Some("final prompt".into()),
+                        content: ImageGenerationContent::Inline {
+                            data_base64: "Zm9v".into(),
+                            mime_type: None,
+                            byte_length: None,
+                        },
                        result: "Zm9v".into(),
                        saved_path: Some(test_path_buf("/tmp/ig_123.png").abs()),
                    },
@@ -2706,6 +2724,7 @@ mod tests {
            turns,
            vec![Turn {
                id: "turn-compact".into(),
+                items_view: TurnItemsView::Full,
                status: TurnStatus::Completed,
                error: None,
                started_at: None,
@@ -2961,6 +2980,7 @@ mod tests {
            turns[0],
            Turn {
                id: "turn-a".into(),
+                items_view: TurnItemsView::Full,
                status: TurnStatus::Completed,
                error: None,
                started_at: None,
--- a/codex-rs/app-server-protocol/src/protocol/v2.rs
+++ b/codex-rs/app-server-protocol/src/protocol/v2.rs
@@ -3735,9 +3735,19 @@ pub struct ThreadResumeParams {
    pub developer_instructions: Option<String>,
    #[ts(optional = nullable)]
    pub personality: Option<Personality>,
-    /// When true, return only thread metadata and live-resume state without
-    /// populating `thread.turns`. This is useful when the client plans to call
-    /// `thread/turns/list` immediately after resuming.
+    /// Controls whether large item payloads, such as generated image bytes, are embedded in
+    /// returned ThreadItems or replaced with deferred content references.
+    ///
+    /// Defaults to `inline` for compatibility. New clients that may load large histories should
+    /// prefer `deferred` and fetch bytes on demand with `thread/item/content/read`.
+    #[ts(optional = nullable)]
+    pub large_content: Option<LargeContentMode>,
+    /// When false, `thread/resume` returns the traditional fully hydrated thread history:
+    /// `thread.turns` is populated and each returned Turn has `itemsView: "full"`.
+    ///
+    /// When true, return only thread metadata and live-resume state without populating
+    /// `thread.turns`. Clients that choose this scalable mode should page history with
+    /// `thread/turns/list`, then hydrate individual summary turns with `thread/items/list`.
    #[serde(default, skip_serializing_if = "std::ops::Not::not")]
    pub exclude_turns: bool,
    /// If true, persist additional rollout EventMsg variants required to
@@ -3837,6 +3847,13 @@ pub struct ThreadForkParams {
    pub base_instructions: Option<String>,
    #[ts(optional = nullable)]
    pub developer_instructions: Option<String>,
+    /// Controls whether large item payloads, such as generated image bytes, are embedded in
+    /// returned ThreadItems or replaced with deferred content references.
+    ///
+    /// Defaults to `inline` for compatibility. New clients that may load large histories should
+    /// prefer `deferred` and fetch bytes on demand with `thread/item/content/read`.
+    #[ts(optional = nullable)]
+    pub large_content: Option<LargeContentMode>,
    #[serde(default, skip_serializing_if = "std::ops::Not::not")]
    pub ephemeral: bool,
    /// When true, return only thread metadata and live fork state without
@@ -4408,7 +4425,18 @@ pub enum ThreadActiveFlag {
 #[ts(export_to = "v2/")]
 pub struct ThreadReadParams {
    pub thread_id: String,
-    /// When true, include turns and their items from rollout history.
+    /// Controls whether large item payloads, such as generated image bytes, are embedded in
+    /// returned ThreadItems or replaced with deferred content references.
+    ///
+    /// Defaults to `inline` for compatibility. New clients that may load large histories should
+    /// prefer `deferred` and fetch bytes on demand with `thread/item/content/read`.
+    #[ts(optional = nullable)]
+    pub large_content: Option<LargeContentMode>,
+    /// When true, include the traditional fully hydrated thread history:
+    /// `thread.turns` is populated and each returned Turn has `itemsView: "full"`.
+    ///
+    /// When false, `thread/read` returns metadata only. Clients can page history separately
+    /// with `thread/turns/list`, then hydrate individual summary turns with `thread/items/list`.
    #[serde(default)]
    pub include_turns: bool,
 }
@@ -4425,6 +4453,12 @@ pub struct ThreadReadResponse {
 #[ts(export_to = "v2/")]
 pub struct ThreadTurnsListParams {
    pub thread_id: String,
+    /// Controls whether large item payloads in summary Turn items are embedded inline or returned
+    /// as deferred content references.
+    ///
+    /// Defaults to `inline` for compatibility. New clients should prefer `deferred`.
+    #[ts(optional = nullable)]
+    pub large_content: Option<LargeContentMode>,
    /// Opaque cursor to pass to the next call to continue after the last turn.
    #[ts(optional = nullable)]
    pub cursor: Option<String>,
@@ -4440,6 +4474,11 @@ pub struct ThreadTurnsListParams {
 #[serde(rename_all = "camelCase")]
 #[ts(export_to = "v2/")]
 pub struct ThreadTurnsListResponse {
+    /// Summary turns for paged history UIs.
+    ///
+    /// Each Turn returned by `thread/turns/list` has `itemsView: "summary"` and includes only
+    /// the first user message and final assistant message in `items` when those items are
+    /// available. Use `thread/items/list` to hydrate the complete item list for a turn.
    pub data: Vec<Turn>,
    /// Opaque cursor to pass to the next call to continue after the last turn.
    /// if None, there are no more turns to return.
@@ -4451,6 +4490,82 @@ pub struct ThreadTurnsListResponse {
    pub backwards_cursor: Option<String>,
 }

+#[derive(Serialize, Deserialize, Debug, Clone, PartialEq, JsonSchema, TS)]
+#[serde(rename_all = "camelCase")]
+#[ts(export_to = "v2/")]
+pub struct ThreadItemsListParams {
+    pub thread_id: String,
+    /// Turn to hydrate after receiving a summary Turn from `thread/turns/list`.
+    pub turn_id: String,
+    /// Controls whether large item payloads, such as generated image bytes, are embedded in
+    /// returned ThreadItems or replaced with deferred content references.
+    ///
+    /// Defaults to `inline` for compatibility. New clients should prefer `deferred`.
+    #[ts(optional = nullable)]
+    pub large_content: Option<LargeContentMode>,
+    /// Opaque cursor to pass to the next call to continue after the last item.
+    #[ts(optional = nullable)]
+    pub cursor: Option<String>,
+    /// Optional item page size.
+    #[ts(optional = nullable)]
+    pub limit: Option<u32>,
+    /// Optional item pagination direction; defaults to ascending.
+    #[ts(optional = nullable)]
+    pub sort_direction: Option<SortDirection>,
+}
+
+#[derive(Serialize, Deserialize, Debug, Clone, PartialEq, JsonSchema, TS)]
+#[serde(rename_all = "camelCase")]
+#[ts(export_to = "v2/")]
+pub struct ThreadItemsListResponse {
+    /// Full ThreadItems for the requested turn page. Accumulate pages until `nextCursor` is null
+    /// to hydrate the client-side Turn representation.
+    pub data: Vec<ThreadItem>,
+    /// Opaque cursor to pass to the next call to continue after the last item.
+    /// If None, there are no more items to return.
+    pub next_cursor: Option<String>,
+    /// Opaque cursor to pass as `cursor` when reversing `sortDirection`.
+    /// This is only populated when the page contains at least one item.
+    /// Use it with the opposite `sortDirection` to include the anchor item again
+    /// and catch updates to that item.
+    pub backwards_cursor: Option<String>,
+}
+
+#[derive(Serialize, Deserialize, Debug, Clone, PartialEq, JsonSchema, TS)]
+#[serde(rename_all = "camelCase")]
+#[ts(export_to = "v2/")]
+pub struct ThreadItemContentReadParams {
+    pub thread_id: String,
+    pub turn_id: String,
+    pub item_id: String,
+    /// Opaque content identifier returned from a deferred item content placeholder.
+    pub content_id: String,
+}
+
+#[derive(Serialize, Deserialize, Debug, Clone, PartialEq, JsonSchema, TS)]
+#[serde(rename_all = "camelCase")]
+#[ts(export_to = "v2/")]
+pub struct ThreadItemContentReadResponse {
+    /// Media type of the returned content when known.
+    pub mime_type: Option<String>,
+    /// Base64-encoded content bytes.
+    pub data_base64: String,
+    /// Decoded byte length when known.
+    #[ts(type = "number | null")]
+    pub byte_length: Option<i64>,
+}
+
+#[derive(Serialize, Deserialize, Debug, Clone, Copy, PartialEq, Eq, JsonSchema, TS)]
+#[serde(rename_all = "camelCase")]
+#[ts(rename_all = "camelCase", export_to = "v2/")]
+pub enum LargeContentMode {
+    /// Preserve legacy behavior and embed large payloads directly in returned ThreadItems.
+    Inline,
+    /// Return metadata placeholders for large payloads and fetch bytes through
+    /// `thread/item/content/read`.
+    Deferred,
+}
+
 #[derive(Serialize, Deserialize, Debug, Clone, PartialEq, JsonSchema, TS)]
 #[serde(rename_all = "camelCase")]
 #[ts(export_to = "v2/")]
@@ -5146,10 +5261,10 @@ impl From<CoreTokenUsage> for TokenUsageBreakdown {
 #[ts(export_to = "v2/")]
 pub struct Turn {
    pub id: String,
-    /// Only populated on a `thread/resume` or `thread/fork` response.
-    /// For all other responses and notifications returning a Turn,
-    /// the items field will be an empty list.
+    /// Turn items at the level of detail described by `itemsView`.
    pub items: Vec<ThreadItem>,
+    /// Indicates how much of this Turn's item history is present in `items`.
+    pub items_view: TurnItemsView,
    pub status: TurnStatus,
    /// Only populated when the Turn's status is failed.
    pub error: Option<TurnError>,
@@ -5164,6 +5279,22 @@ pub struct Turn {
    pub duration_ms: Option<i64>,
 }

+#[derive(Serialize, Deserialize, Debug, Clone, Copy, PartialEq, Eq, JsonSchema, TS)]
+#[serde(rename_all = "camelCase")]
+#[ts(rename_all = "camelCase", export_to = "v2/")]
+pub enum TurnItemsView {
+    /// `items` was not loaded for this Turn; the empty list does not mean the Turn has no items.
+    NotLoaded,
+    /// `items` contains only a display summary for this Turn.
+    ///
+    /// For `thread/turns/list`, this currently means the first user message and the final
+    /// assistant message when those items are available.
+    Summary,
+    /// `items` contains every ThreadItem available from persisted app-server history for this
+    /// Turn.
+    Full,
+}
+
 #[derive(Serialize, Deserialize, Debug, Clone, PartialEq, Eq, JsonSchema, TS)]
 #[serde(rename_all = "camelCase")]
 #[ts(export_to = "v2/")]
@@ -5948,6 +6079,14 @@ pub enum ThreadItem {
        id: String,
        status: String,
        revised_prompt: Option<String>,
+        /// Structured image content: inline bytes, a deferred reference, or an unavailable
+        /// marker. New clients should render from this field instead of the legacy `result`.
+        content: ImageGenerationContent,
+        /// Legacy base64-encoded image result.
+        ///
+        /// This is populated in `largeContent: "inline"` mode for compatibility. In
+        /// `largeContent: "deferred"` mode, clients should expect this to be empty and use
+        /// `content` plus `thread/item/content/read` instead.
        result: String,
        #[serde(default, skip_serializing_if = "Option::is_none")]
        #[ts(optional)]
@@ -5964,6 +6103,36 @@ pub enum ThreadItem {
    ContextCompaction { id: String },
 }

+#[derive(Serialize, Deserialize, Debug, Clone, PartialEq, Eq, JsonSchema, TS)]
+#[serde(tag = "type", rename_all = "camelCase")]
+#[ts(tag = "type", export_to = "v2/")]
+pub enum ImageGenerationContent {
+    /// Image bytes are embedded directly in the item.
+    #[serde(rename_all = "camelCase")]
+    #[ts(rename_all = "camelCase")]
+    Inline {
+        data_base64: String,
+        mime_type: Option<String>,
+        #[ts(type = "number | null")]
+        byte_length: Option<i64>,
+    },
+    /// Image bytes are available through `thread/item/content/read`.
+    #[serde(rename_all = "camelCase")]
+    #[ts(rename_all = "camelCase")]
+    Deferred {
+        content_id: String,
+        mime_type: Option<String>,
+        #[ts(type = "number | null")]
+        byte_length: Option<i64>,
+        width: Option<u32>,
+        height: Option<u32>,
+    },
+    /// Image content is not available yet, or is no longer available.
+    #[serde(rename_all = "camelCase")]
+    #[ts(rename_all = "camelCase")]
+    Unavailable { reason: String },
+}
+
 #[derive(Serialize, Deserialize, Debug, Clone, PartialEq, Eq, JsonSchema, TS)]
 #[serde(rename_all = "camelCase")]
 #[ts(rename_all = "camelCase", export_to = "v2/")]
@@ -6421,6 +6590,11 @@ impl From<CoreTurnItem> for ThreadItem {
                id: image.id,
                status: image.status,
                revised_prompt: image.revised_prompt,
+                content: ImageGenerationContent::Inline {
+                    data_base64: image.result.clone(),
+                    mime_type: None,
+                    byte_length: None,
+                },
                result: image.result,
                saved_path: image.saved_path,
            },