feat: enhance chat event streaming by tracking active tool depth to prevent inner-tool LLM token leakage

2026-04-25 00:36:31 +02:00 · 2026-02-19 13:11:18 +05:30 · 2026-02-19 13:11:18 +05:30 · f3ec48fb00
commit f3ec48fb00
parent ce110faa5a
1 changed files with 6 additions and 1 deletions
--- a/surfsense_backend/app/tasks/chat/stream_new_chat.py
+++ b/surfsense_backend/app/tasks/chat/stream_new_chat.py
@ -226,6 +226,7 @@ async def _stream_agent_events(
    last_active_step_title: str = initial_step_title
    last_active_step_items: list[str] = initial_step_items or []
    just_finished_tool: bool = False
+    active_tool_depth: int = 0  # Track nesting: >0 means we're inside a tool

    def next_thinking_step_id() -> str:
        nonlocal thinking_step_counter
@ -250,6 +251,8 @@ async def _stream_agent_events(
        event_type = event.get("event", "")

        if event_type == "on_chat_model_stream":
+            if active_tool_depth > 0:
+                continue  # Suppress inner-tool LLM tokens from leaking into chat
            chunk = event.get("data", {}).get("chunk")
            if chunk and hasattr(chunk, "content"):
                content = chunk.content
@ -269,6 +272,7 @@ async def _stream_agent_events(
                    accumulated_text += content

        elif event_type == "on_tool_start":
+            active_tool_depth += 1
            tool_name = event.get("name", "unknown_tool")
            run_id = event.get("run_id", "")
            tool_input = event.get("data", {}).get("input", {})
@ -428,6 +432,7 @@ async def _stream_agent_events(
            )

        elif event_type == "on_tool_end":
+            active_tool_depth = max(0, active_tool_depth - 1)
            run_id = event.get("run_id", "")
            tool_name = event.get("name", "unknown_tool")
            raw_output = event.get("data", {}).get("output", "")
@ -1309,4 +1314,4 @@ async def stream_resume_chat(
        yield streaming_service.format_done()

    finally:
-        await clear_ai_responding(session, chat_id)
+        await clear_ai_responding(session, chat_id)