feat: proxy context left after compaction (#6597)

2026-04-30 03:12:20 +03:00 · 2025-11-13 15:54:03 +00:00
parent 8dcbd29edd
commit 2a417c47ac
5 changed files with 142 additions and 4 deletions
--- a/codex-rs/core/tests/suite/compact.rs
+++ b/codex-rs/core/tests/suite/compact.rs
@@ -14,6 +14,7 @@ use codex_protocol::user_input::UserInput;
 use core_test_support::load_default_config_for_test;
 use core_test_support::skip_if_no_network;
 use core_test_support::wait_for_event;
+use core_test_support::wait_for_event_match;
 use std::collections::VecDeque;
 use tempfile::TempDir;

@@ -366,6 +367,72 @@ async fn manual_compact_uses_custom_prompt() {
    assert!(!found_default_prompt, "default prompt should be replaced");
 }

+#[tokio::test(flavor = "multi_thread", worker_threads = 2)]
+async fn manual_compact_emits_estimated_token_usage_event() {
+    skip_if_no_network!();
+
+    let server = start_mock_server().await;
+
+    // Compact run where the API reports zero tokens in usage. Our local
+    // estimator should still compute a non-zero context size for the compacted
+    // history.
+    let sse_compact = sse(vec![
+        ev_assistant_message("m1", SUMMARY_TEXT),
+        ev_completed_with_tokens("r1", 0),
+    ]);
+    mount_sse_once(&server, sse_compact).await;
+
+    let model_provider = ModelProviderInfo {
+        base_url: Some(format!("{}/v1", server.uri())),
+        ..built_in_model_providers()["openai"].clone()
+    };
+    let home = TempDir::new().unwrap();
+    let mut config = load_default_config_for_test(&home);
+    config.model_provider = model_provider;
+    set_test_compact_prompt(&mut config);
+
+    let conversation_manager = ConversationManager::with_auth(CodexAuth::from_api_key("dummy"));
+    let NewConversation {
+        conversation: codex,
+        ..
+    } = conversation_manager.new_conversation(config).await.unwrap();
+
+    // Trigger manual compact and collect TokenCount events for the compact turn.
+    codex.submit(Op::Compact).await.unwrap();
+
+    // First TokenCount: from the compact API call (usage.total_tokens = 0).
+    let first = wait_for_event_match(&codex, |ev| match ev {
+        EventMsg::TokenCount(tc) => tc
+            .info
+            .as_ref()
+            .map(|info| info.last_token_usage.total_tokens),
+        _ => None,
+    })
+    .await;
+
+    // Second TokenCount: from the local post-compaction estimate.
+    let last = wait_for_event_match(&codex, |ev| match ev {
+        EventMsg::TokenCount(tc) => tc
+            .info
+            .as_ref()
+            .map(|info| info.last_token_usage.total_tokens),
+        _ => None,
+    })
+    .await;
+
+    // Ensure the compact task itself completes.
+    wait_for_event(&codex, |ev| matches!(ev, EventMsg::TaskComplete(_))).await;
+
+    assert_eq!(
+        first, 0,
+        "expected first TokenCount from compact API usage to be zero"
+    );
+    assert!(
+        last > 0,
+        "second TokenCount should reflect a non-zero estimated context size after compaction"
+    );
+}
+
 // Windows CI only: bump to 4 workers to prevent SSE/event starvation and test timeouts.
 #[cfg_attr(windows, tokio::test(flavor = "multi_thread", worker_threads = 4))]
 #[cfg_attr(not(windows), tokio::test(flavor = "multi_thread", worker_threads = 2))]