Merge pull request #1609 from 0xbyt4/fix/context-counter-cache-tokens

fix: context counter shows cached token count in status bar
Teknium 2026-03-17 01:45:12 -07:00 committed by GitHub
commit 5ada0b95e9
2 changed files with 124 additions and 0 deletions


@@ -5258,6 +5258,15 @@ class AIAgent:
         if hasattr(response, 'usage') and response.usage:
             if self.api_mode in ("codex_responses", "anthropic_messages"):
                 prompt_tokens = getattr(response.usage, 'input_tokens', 0) or 0
+                if self.api_mode == "anthropic_messages":
+                    # Anthropic splits input into cache_read + cache_creation
+                    # + non-cached input_tokens. Without adding the cached
+                    # portions, the context bar shows only the tiny non-cached
+                    # portion (e.g. 3 tokens) instead of the real total (~18K).
+                    # Other providers (OpenAI/Codex) already include cached
+                    # tokens in their input_tokens/prompt_tokens field.
+                    prompt_tokens += getattr(response.usage, 'cache_read_input_tokens', 0) or 0
+                    prompt_tokens += getattr(response.usage, 'cache_creation_input_tokens', 0) or 0
                 completion_tokens = getattr(response.usage, 'output_tokens', 0) or 0
                 total_tokens = (
                     getattr(response.usage, 'total_tokens', None)
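
For reference, a minimal standalone sketch of the accounting this patch performs. It assumes the usage fields Anthropic's Messages API reports (input_tokens, cache_read_input_tokens, cache_creation_input_tokens, output_tokens); the Usage stand-in and the effective_input_tokens helper are hypothetical names for illustration, not part of this codebase.

from dataclasses import dataclass

@dataclass
class Usage:
    # Stand-in mirroring the Anthropic Messages API usage fields.
    input_tokens: int = 0                 # non-cached input only
    cache_read_input_tokens: int = 0      # input served from the prompt cache
    cache_creation_input_tokens: int = 0  # input written into the cache
    output_tokens: int = 0

def effective_input_tokens(usage) -> int:
    # Anthropic reports the cached portions separately from input_tokens,
    # so all three must be summed to get the same prompt-side total that
    # other providers fold into a single input/prompt token field.
    return (
        (getattr(usage, 'input_tokens', 0) or 0)
        + (getattr(usage, 'cache_read_input_tokens', 0) or 0)
        + (getattr(usage, 'cache_creation_input_tokens', 0) or 0)
    )

# With a mostly-cached ~18K-token prompt, input_tokens alone is misleading:
usage = Usage(input_tokens=3, cache_read_input_tokens=17_997, output_tokens=250)
assert effective_input_tokens(usage) == 18_000

The getattr(..., 0) or 0 pattern matches the patched code: it tolerates both missing attributes and explicit None values, which is why the fix is safe for responses that carry no cache fields at all.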