feat: enhance document formatting and context management for LLM tools

- Introduced dynamic character budget calculation for document formatting based on model's context window. - Updated `format_documents_for_context` to respect character limits and improve output quality. - Added `max_input_tokens` parameter to various functions to facilitate context-aware processing. - Enhanced error handling for context overflow in LLM router service.
2026-07-18 23:11:12 +02:00 · 2026-02-26 20:47:19 -08:00 · 2026-02-26 20:47:19 -08:00 · 1e4b8d3e89
commit 1e4b8d3e89
parent a4dc84d1ab
4 changed files with 178 additions and 24 deletions
--- a/surfsense_backend/app/agents/new_chat/chat_deepagent.py
+++ b/surfsense_backend/app/agents/new_chat/chat_deepagent.py
@ -241,6 +241,15 @@ async def create_surfsense_deep_agent(

    # Build dependencies dict for the tools registry
    visibility = thread_visibility or ChatVisibility.PRIVATE
+
+    # Extract the model's context window so tools can size their output.
+    _model_profile = getattr(llm, "profile", None)
+    _max_input_tokens: int | None = (
+        _model_profile.get("max_input_tokens")
+        if isinstance(_model_profile, dict)
+        else None
+    )
+
    dependencies = {
        "search_space_id": search_space_id,
        "db_session": db_session,
@ -251,6 +260,7 @@ async def create_surfsense_deep_agent(
        "thread_visibility": visibility,
        "available_connectors": available_connectors,
        "available_document_types": available_document_types,
+        "max_input_tokens": _max_input_tokens,
    }

    # Disable Notion action tools if no Notion connector is configured