feat(agent): suppress non-forced output during post-response housekeeping

- Introduced a mechanism to mute output after the main response is delivered, ensuring that subsequent tool calls run without cluttering the CLI.
- Redirected stdout to devnull during the review agent's execution to prevent any print statements from interfering with the main CLI display.
- Added a new attribute `_mute_post_response` that tracks whether post-response output suppression is active.
This commit is contained in:
Teknium 2026-03-20 23:54:42 -07:00
parent 3585019831
commit 885f88fb60
No known key found for this signature in database

View file

@ -1119,7 +1119,13 @@ class AIAgent:
During tool execution (``_executing_tools`` is True), printing is During tool execution (``_executing_tools`` is True), printing is
allowed even with stream consumers registered because no tokens allowed even with stream consumers registered because no tokens
are being streamed at that point. are being streamed at that point.
After the main response has been delivered and the remaining tool
calls are post-response housekeeping (``_mute_post_response``),
all non-forced output is suppressed.
""" """
if not force and getattr(self, "_mute_post_response", False):
return
if not force and self._has_stream_consumers() and not self._executing_tools: if not force and self._has_stream_consumers() and not self._executing_tools:
return return
self._safe_print(*args, **kwargs) self._safe_print(*args, **kwargs)
@ -1366,29 +1372,30 @@ class AIAgent:
prompt = self._SKILL_REVIEW_PROMPT prompt = self._SKILL_REVIEW_PROMPT
def _run_review():
    """Run a forked review agent quietly in the background.

    Spawns a full agent clone (same model/tools/context, tighter
    iteration budget) with stdout redirected to the null device so
    spinners and print() output never reach the main CLI display.
    Failures are swallowed and logged at debug level — this is
    best-effort housekeeping, not user-facing work.
    """
    import contextlib
    import os as _os
    try:
        # Redirect stdout to devnull so spinners, cute messages,
        # and any other print() calls from the review agent don't
        # leak into the main CLI display.
        with open(_os.devnull, "w") as _devnull:
            with contextlib.redirect_stdout(_devnull):
                review_agent = AIAgent(
                    model=self.model,
                    max_iterations=8,
                    quiet_mode=True,
                    platform=self.platform,
                    provider=self.provider,
                )
                # Share the memory store so writes persist to disk.
                review_agent._memory_store = self._memory_store
                review_agent._memory_enabled = self._memory_enabled
                review_agent._user_profile_enabled = self._user_profile_enabled
                # Disable nudges in the review agent to prevent recursion.
                review_agent._memory_nudge_interval = 0
                review_agent._skill_nudge_interval = 0
                review_agent.run_conversation(
                    user_message=prompt,
                    conversation_history=messages_snapshot,
                )
    except Exception as e:
        logger.debug("Background memory/skill review failed: %s", e)
@ -5288,6 +5295,7 @@ class AIAgent:
self._incomplete_scratchpad_retries = 0 self._incomplete_scratchpad_retries = 0
self._codex_incomplete_retries = 0 self._codex_incomplete_retries = 0
self._last_content_with_tools = None self._last_content_with_tools = None
self._mute_post_response = False
# NOTE: _turns_since_memory and _iters_since_skill are NOT reset here. # NOTE: _turns_since_memory and _iters_since_skill are NOT reset here.
# They are initialized in __init__ and must persist across run_conversation # They are initialized in __init__ and must persist across run_conversation
# calls so that nudge logic accumulates correctly in CLI mode. # calls so that nudge logic accumulates correctly in CLI mode.
@ -6634,8 +6642,13 @@ class AIAgent:
turn_content = assistant_message.content or "" turn_content = assistant_message.content or ""
if turn_content and self._has_content_after_think_block(turn_content): if turn_content and self._has_content_after_think_block(turn_content):
self._last_content_with_tools = turn_content self._last_content_with_tools = turn_content
# Show intermediate commentary so the user can follow along # The response was already streamed to the user in the
if self.quiet_mode: # response box. The remaining tool calls (memory, skill,
# todo, etc.) are post-response housekeeping — mute all
# subsequent CLI output so they run invisibly.
if self._has_stream_consumers():
self._mute_post_response = True
elif self.quiet_mode:
clean = self._strip_think_blocks(turn_content).strip() clean = self._strip_think_blocks(turn_content).strip()
if clean: if clean:
self._vprint(f" ┊ 💬 {clean}") self._vprint(f" ┊ 💬 {clean}")