refactor: anonymous/free chat experience

- Enhanced lambda function formatting in `_after_commit` for better clarity. - Simplified generator expression in `_match_condition` for improved readability. - Streamlined function signature in `_eligible` for consistency. - Updated imports and refactored anonymous chat routes to use a new agent creation method. - Added a new function `_load_anon_document` to handle document loading from Redis. - Improved UI components by replacing legacy structures with modern alternatives, including alerts and separators. - Refactored quota-related components to utilize new alert structures for better user feedback. - Cleaned up unused variables and optimized component states for performance.
2026-06-02 19:55:18 +02:00 · 2026-05-31 15:58:21 -07:00 · 2026-05-31 15:58:21 -07:00 · 0f2e3c7655
commit 0f2e3c7655
parent 0cce9b7e64
17 changed files with 493 additions and 278 deletions
--- a/surfsense_backend/app/agents/new_chat/anonymous_agent.py
+++ b/surfsense_backend/app/agents/new_chat/anonymous_agent.py
@ -0,0 +1,168 @@
+"""Minimal anonymous / free-chat agent.
+
+The no-login chat experience must stay dead simple: the user asks a question
+and the model answers, optionally using ``web_search`` and an optionally
+uploaded **read-only** document. We deliberately bypass the full SurfSense deep
+agent stack (filesystem, file-intent, knowledge-base persistence, subagents,
+skills, memory) because those middlewares stage or persist "documents" that an
+anonymous session can never see again -- which produced phantom
+"I saved it to a file" answers for free users.
+
+For any other SurfSense capability the model is instructed (via the system
+prompt built here) to tell the user to create a free account instead of
+pretending to perform the action.
+"""
+
+from __future__ import annotations
+
+from datetime import UTC, datetime
+from typing import Any
+
+from deepagents.backends import StateBackend
+from langchain.agents import create_agent
+from langchain.agents.middleware import (
+    ModelCallLimitMiddleware,
+    ToolCallLimitMiddleware,
+)
+from langchain_core.language_models import BaseChatModel
+from langgraph.types import Checkpointer
+
+from app.agents.new_chat.context import SurfSenseContextSchema
+from app.agents.new_chat.middleware import (
+    RetryAfterMiddleware,
+    create_surfsense_compaction_middleware,
+)
+from app.agents.new_chat.tools.web_search import create_web_search_tool
+
+# Cap how much of an uploaded document we inline into the system prompt. The
+# upload endpoint allows files up to several MB, but the doc is re-sent on
+# every turn and counts against the anonymous token quota, so we bound it.
+_MAX_DOC_CHARS = 50_000
+
+
+def build_anonymous_system_prompt(anon_doc: dict[str, Any] | None = None) -> str:
+    """Build the system prompt for the minimal anonymous chat agent.
+
+    The prompt keeps the assistant focused on plain Q/A + web search, inlines
+    any uploaded document as read-only context, and redirects every other
+    SurfSense feature to account registration.
+    """
+    today = datetime.now(UTC).strftime("%A, %B %d, %Y")
+
+    doc_section = ""
+    if anon_doc:
+        title = str(anon_doc.get("title") or "uploaded_document")
+        content = str(anon_doc.get("content") or "")
+        truncated = content[:_MAX_DOC_CHARS]
+        truncation_note = ""
+        if len(content) > _MAX_DOC_CHARS:
+            truncation_note = (
+                "\n\n[Note: the document was truncated because it is large; "
+                "only the beginning is shown.]"
+            )
+        doc_section = (
+            "\n\n## Uploaded document (read-only)\n"
+            f'The user uploaded a document named "{title}". Its contents are '
+            "provided below for reference only. You may read it and answer "
+            "questions about it, but you cannot modify, save, or store it.\n\n"
+            f'<uploaded_document title="{title}">\n'
+            f"{truncated}{truncation_note}\n"
+            "</uploaded_document>"
+        )
+
+    return (
+        "You are SurfSense's free AI assistant, available to everyone without "
+        "login.\n\n"
+        f"Today's date is {today}.\n\n"
+        "## How to help\n"
+        "- Answer the user's questions directly and conversationally. You are "
+        "a straightforward question-and-answer assistant.\n"
+        "- When a question needs current, real-time, or factual information "
+        "from the internet (news, prices, weather, recent events, live data), "
+        "use the `web_search` tool. Otherwise, answer directly from your own "
+        "knowledge.\n"
+        "- Be concise, accurate, and helpful. Use Markdown formatting when it "
+        "improves readability."
+        f"{doc_section}\n\n"
+        "## What is not available here\n"
+        "This is the free, no-login experience. You CANNOT save files or "
+        "notes, generate reports, podcasts, resumes, presentations, or images, "
+        "search or build a knowledge base, connect to apps (Gmail, Google "
+        "Drive, Notion, Slack, Calendar, Discord, and similar), set up "
+        "automations, or remember anything across sessions.\n\n"
+        "If the user asks for any of these, do NOT pretend to do them and "
+        "never claim you saved, created, or stored anything. Instead, briefly "
+        "let them know the feature requires a free SurfSense account and "
+        "invite them to create one at https://www.surfsense.com. Then offer to "
+        "help with what you can do here (answering questions and searching the "
+        "web)."
+    )
+
+
+async def create_anonymous_chat_agent(
+    *,
+    llm: BaseChatModel,
+    checkpointer: Checkpointer,
+    anon_session_id: str | None = None,
+    anon_doc: dict[str, Any] | None = None,
+    enable_web_search: bool = True,
+):
+    """Create a minimal Q/A agent for anonymous / free chat.
+
+    Unlike :func:`create_surfsense_deep_agent`, this agent has no filesystem,
+    file-intent, knowledge-base persistence, subagent, skills, or memory
+    middleware. Its only tool is ``web_search`` (when ``enable_web_search`` is
+    True), and any uploaded document is injected into the system prompt as
+    read-only context.
+
+    Args:
+        llm: The chat model to use (already built by the caller).
+        checkpointer: LangGraph checkpointer for the ephemeral anon thread.
+        anon_session_id: Anonymous session id (used only for telemetry/metadata).
+        anon_doc: Optional ``{"title", "content"}`` for an uploaded document.
+        enable_web_search: When False, the agent runs as a pure LLM with no
+            tools (used when the user toggles web search off).
+    """
+    tools = (
+        [create_web_search_tool(search_space_id=None, available_connectors=None)]
+        if enable_web_search
+        else []
+    )
+
+    # Reliability-only middleware. Nothing here touches the database or
+    # filesystem: call limits guard against loops, compaction summarises long
+    # histories into in-graph state, and retry handles provider rate limits.
+    middleware: list[Any] = [
+        ModelCallLimitMiddleware(thread_limit=120, run_limit=80, exit_behavior="end"),
+    ]
+    if tools:
+        middleware.append(
+            ToolCallLimitMiddleware(
+                thread_limit=300, run_limit=80, exit_behavior="continue"
+            )
+        )
+    middleware.append(create_surfsense_compaction_middleware(llm, StateBackend))
+    middleware.append(RetryAfterMiddleware(max_retries=3))
+
+    system_prompt = build_anonymous_system_prompt(anon_doc)
+
+    agent = create_agent(
+        llm,
+        system_prompt=system_prompt,
+        tools=tools,
+        middleware=middleware,
+        context_schema=SurfSenseContextSchema,
+        checkpointer=checkpointer,
+    )
+    return agent.with_config(
+        {
+            "recursion_limit": 40,
+            "metadata": {
+                "ls_integration": "surfsense_anonymous_chat",
+                "anon_session_id": anon_session_id,
+            },
+        }
+    )
+
+
+__all__ = ["build_anonymous_system_prompt", "create_anonymous_chat_agent"]
--- a/surfsense_backend/app/automations/triggers/builtin/event/filter.py
+++ b/surfsense_backend/app/automations/triggers/builtin/event/filter.py
@ -65,8 +65,7 @@ def _match_condition(condition: Any, actual: Any) -> bool:
        return False
    if isinstance(condition, dict):
        return all(
-            _apply_operator(op, operand, actual)
-            for op, operand in condition.items()
+            _apply_operator(op, operand, actual) for op, operand in condition.items()
        )
    return actual == condition

--- a/surfsense_backend/app/automations/triggers/builtin/event/selector.py
+++ b/surfsense_backend/app/automations/triggers/builtin/event/selector.py
@ -41,9 +41,7 @@ async def _select_and_start(event_dict: dict[str, Any]) -> None:
            await _start_one(session, trigger=trigger, event=event)


-async def _eligible(
-    session: AsyncSession, *, event: Event
-) -> list[AutomationTrigger]:
+async def _eligible(session: AsyncSession, *, event: Event) -> list[AutomationTrigger]:
    """Enabled ``event`` triggers for this event type whose filter matches."""
    stmt = select(AutomationTrigger).where(
        AutomationTrigger.type == TriggerType.EVENT,
--- a/surfsense_backend/app/routes/anonymous_chat_routes.py
+++ b/surfsense_backend/app/routes/anonymous_chat_routes.py
@ -351,10 +351,9 @@ async def stream_anonymous_chat(
    async def _generate():
        from langchain_core.messages import AIMessage, HumanMessage

-        from app.agents.new_chat.chat_deepagent import create_surfsense_deep_agent
+        from app.agents.new_chat.anonymous_agent import create_anonymous_chat_agent
        from app.agents.new_chat.checkpointer import get_checkpointer
        from app.db import shielded_async_session
-        from app.services.connector_service import ConnectorService
        from app.services.new_streaming_service import VercelStreamingService
        from app.services.token_tracking_service import start_turn
        from app.tasks.chat.stream_new_chat import StreamResult, _stream_agent_events
@ -363,24 +362,23 @@ async def stream_anonymous_chat(
        streaming_service = VercelStreamingService()

        try:
-            async with shielded_async_session() as session:
-                connector_service = ConnectorService(session, search_space_id=None)
+            async with shielded_async_session():
                checkpointer = await get_checkpointer()

                anon_thread_id = f"anon-{session_id}-{request_id}"

-                agent = await create_surfsense_deep_agent(
+                # Load the optional uploaded document as read-only context.
+                anon_doc = await _load_anon_document(session_id)
+
+                # Minimal Q/A agent: web_search only (when enabled), no
+                # filesystem / persistence / subagents. The uploaded document
+                # is injected into the system prompt as read-only context.
+                agent = await create_anonymous_chat_agent(
                    llm=llm,
-                    search_space_id=0,
-                    db_session=session,
-                    connector_service=connector_service,
                    checkpointer=checkpointer,
-                    user_id=None,
-                    thread_id=None,
-                    agent_config=agent_config,
-                    enabled_tools=list(enabled_for_agent),
-                    disabled_tools=None,
                    anon_session_id=session_id,
+                    anon_doc=anon_doc,
+                    enable_web_search="web_search" in enabled_for_agent,
                )

                langchain_messages = []
@ -396,7 +394,6 @@ async def stream_anonymous_chat(

                input_state = {
                    "messages": langchain_messages,
-                    "search_space_id": 0,
                }

                langgraph_config = {
@ -500,6 +497,38 @@ ANON_ALLOWED_EXTENSIONS = PLAINTEXT_EXTENSIONS | DIRECT_CONVERT_EXTENSIONS
 ANON_DOC_REDIS_PREFIX = "anon:doc:"


+async def _load_anon_document(session_id: str) -> dict[str, Any] | None:
+    """Read the anonymous session's uploaded document from Redis.
+
+    Returns ``{"title", "content"}`` for read-only injection into the agent's
+    system prompt, or ``None`` when nothing was uploaded for this session.
+    """
+    import json as _json
+
+    import redis.asyncio as aioredis
+
+    redis_client = aioredis.from_url(config.REDIS_APP_URL, decode_responses=True)
+    redis_key = f"{ANON_DOC_REDIS_PREFIX}{session_id}"
+    try:
+        data = await redis_client.get(redis_key)
+        if not data:
+            return None
+        payload = _json.loads(data)
+    except Exception as exc:  # pragma: no cover - defensive
+        logger.warning("Failed to load anonymous document from Redis: %s", exc)
+        return None
+    finally:
+        await redis_client.aclose()
+
+    content = str(payload.get("content") or "")
+    if not content:
+        return None
+    return {
+        "title": str(payload.get("filename") or "uploaded_document"),
+        "content": content,
+    }
+
+
 class AnonDocResponse(BaseModel):
    filename: str
    size_bytes: int
--- a/surfsense_backend/app/session_events.py
+++ b/surfsense_backend/app/session_events.py
@ -79,9 +79,11 @@ def _after_commit(session: Session) -> None:
    ]
    for task in tasks:
        task.add_done_callback(
-            lambda t: logger.error("event publish failed: %s", t.exception())
-            if not t.cancelled() and t.exception()
-            else None
+            lambda t: (
+                logger.error("event publish failed: %s", t.exception())
+                if not t.cancelled() and t.exception()
+                else None
+            )
        )