Act on reasoning-included per turn (#9402)

- Reset reasoning-included flag each turn and update compaction test
2026-05-02 20:32:04 +03:00 · 2026-01-19 11:23:25 -08:00
parent 57ec3a8277
commit b11e96fb04
12 changed files with 192 additions and 11 deletions
--- a/codex-rs/core/src/context_manager/history.rs
+++ b/codex-rs/core/src/context_manager/history.rs
@@ -235,12 +235,19 @@ impl ContextManager {
        token_estimate as usize
    }

-    pub(crate) fn get_total_token_usage(&self) -> i64 {
-        self.token_info
+    /// When true, the server already accounted for past reasoning tokens and
+    /// the client should not re-estimate them.
+    pub(crate) fn get_total_token_usage(&self, server_reasoning_included: bool) -> i64 {
+        let last_tokens = self
+            .token_info
            .as_ref()
            .map(|info| info.last_token_usage.total_tokens)
-            .unwrap_or(0)
-            .saturating_add(self.get_non_last_reasoning_items_tokens() as i64)
+            .unwrap_or(0);
+        if server_reasoning_included {
+            last_tokens
+        } else {
+            last_tokens.saturating_add(self.get_non_last_reasoning_items_tokens() as i64)
+        }
    }

    /// This function enforces a couple of invariants on the in-memory history: