fix: restore connector mentions, free-tier fallback, orphan-row guard in new chat flow

2026-07-22 23:31:12 +02:00 · 2026-06-04 10:25:06 +02:00 · 2026-06-04 10:25:06 +02:00 · 44abf56d6c
commit 44abf56d6c
parent 1165b3ad5c
5 changed files with 104 additions and 11 deletions
--- a/surfsense_backend/app/tasks/chat/streaming/flows/new_chat/auto_pin.py
+++ b/surfsense_backend/app/tasks/chat/streaming/flows/new_chat/auto_pin.py
@ -50,8 +50,14 @@ async def resolve_initial_auto_pin(
    selected_llm_config_id: int,
    requires_image_input: bool,
    requested_llm_config_id: int,
+    force_repin_free: bool = False,
 ) -> AutoPinResult:
-    """Run the resolver and classify any ``ValueError`` for the SSE error path."""
+    """Run the resolver and classify any ``ValueError`` for the SSE error path.
+
+    ``force_repin_free`` forces a fresh re-pin to a free-tier config (used on
+    the premium-quota-exhausted fallback so an out-of-quota user isn't repinned
+    onto another paid model).
+    """
    try:
        pinned = await resolve_or_get_pinned_llm_config_id(
            session,
@ -60,6 +66,7 @@ async def resolve_initial_auto_pin(
            user_id=user_id,
            selected_llm_config_id=selected_llm_config_id,
            requires_image_input=requires_image_input,
+            force_repin_free=force_repin_free,
        )
        ot.add_event(
            "model.pin.resolved",
--- a/surfsense_backend/app/tasks/chat/streaming/flows/new_chat/input_state.py
+++ b/surfsense_backend/app/tasks/chat/streaming/flows/new_chat/input_state.py
@ -9,9 +9,9 @@ Pipeline:
     can resolve ``report_id`` for versioning without spelunking history.
  3. **@-mention resolve** (cloud mode) — substitute ``@title`` tokens in the
     query with canonical ``\`/documents/...\``` paths the LLM expects.
-  4. **Context block render** — XML-wrap recent reports, prepend to the
-     rewritten query, optionally prefix with display name for SEARCH_SPACE
-     visibility.
+  4. **Context block render** — XML-wrap @-mentioned connectors and recent
+     reports, prepend to the rewritten query, optionally prefix with display
+     name for SEARCH_SPACE visibility.
  5. **HumanMessage** — multimodal content if images are attached.

 Returns the assembled ``input_state`` dict plus side-channel data the
@ -62,6 +62,7 @@ async def build_new_chat_input_state(
    user_image_data_urls: list[str] | None,
    mentioned_document_ids: list[int] | None,
    mentioned_folder_ids: list[int] | None,
+    mentioned_connectors: list[dict[str, Any]] | None,
    mentioned_documents: list[dict[str, Any]] | None,
    needs_history_bootstrap: bool,
    thread_visibility: ChatVisibility,
@ -111,6 +112,7 @@ async def build_new_chat_input_state(
    final_query = _render_query_with_context(
        agent_user_query=agent_user_query,
        recent_reports=recent_reports,
+        mentioned_connectors=mentioned_connectors,
    )

    if thread_visibility == ChatVisibility.SEARCH_SPACE and current_user_display_name:
@ -193,14 +195,56 @@ async def _resolve_mentions_for_query(
    return agent_user_query, accepted_folder_ids


+def _render_connector_block(mentioned_connectors: list[dict[str, Any]]) -> str | None:
+    """Render the ``<mentioned_connectors>`` block, or ``None`` when empty.
+
+    Malformed entries (non-dict, or missing id/type) are skipped.
+    """
+    connector_lines: list[str] = []
+    for connector in mentioned_connectors:
+        if not isinstance(connector, dict):
+            continue
+        connector_id = connector.get("id")
+        connector_type = connector.get("connector_type") or connector.get(
+            "document_type"
+        )
+        account_name = connector.get("account_name") or connector.get("title")
+        if connector_id is None or connector_type is None:
+            continue
+        connector_lines.append(
+            f'  - connector_id={connector_id}, connector_type="{connector_type}", '
+            f'account_name="{account_name or ""}"'
+        )
+    if not connector_lines:
+        return None
+    return (
+        "<mentioned_connectors>\n"
+        "The user selected these exact connector accounts with @. "
+        "These entries are selection metadata, not retrieved connector content. "
+        "When a connector-backed tool needs an account, use the matching "
+        "connector_id from this list if the tool supports connector_id:\n"
+        + "\n".join(connector_lines)
+        + "\n</mentioned_connectors>"
+    )
+
+
 def _render_query_with_context(
    *,
    agent_user_query: str,
    recent_reports: list[Report],
+    mentioned_connectors: list[dict[str, Any]] | None,
 ) -> str:
-    """Prepend recent-reports XML block to the user query."""
+    """Prepend the ``<mentioned_connectors>`` then ``<report_context>`` blocks.
+
+    Order is load-bearing for legacy parity.
+    """
    context_parts: list[str] = []

+    if mentioned_connectors:
+        connector_block = _render_connector_block(mentioned_connectors)
+        if connector_block:
+            context_parts.append(connector_block)
+
    if recent_reports:
        report_lines: list[str] = []
        for r in recent_reports:
--- a/surfsense_backend/app/tasks/chat/streaming/flows/new_chat/orchestrator.py
+++ b/surfsense_backend/app/tasks/chat/streaming/flows/new_chat/orchestrator.py
@ -124,6 +124,8 @@ async def stream_new_chat(
    llm_config_id: int = -1,
    mentioned_document_ids: list[int] | None = None,
    mentioned_folder_ids: list[int] | None = None,
+    mentioned_connector_ids: list[int] | None = None,
+    mentioned_connectors: list[dict[str, Any]] | None = None,
    mentioned_documents: list[dict[str, Any]] | None = None,
    checkpoint_id: str | None = None,
    needs_history_bootstrap: bool = False,
@ -272,6 +274,7 @@ async def stream_new_chat(
                        selected_llm_config_id=0,
                        requires_image_input=requires_image_input,
                        requested_llm_config_id=requested_llm_config_id,
+                        force_repin_free=True,
                    )
                    if pin_fallback.error is not None:
                        message, error_code, error_kind = pin_fallback.error
@ -367,12 +370,6 @@ async def stream_new_chat(
            mentioned_documents=mentioned_documents,
            background_tasks=_background_tasks,
        )
-        persist_asst_task = spawn_persist_assistant_shell_task(
-            chat_id=chat_id,
-            user_id=user_id,
-            turn_id=stream_result.turn_id,
-            background_tasks=_background_tasks,
-        )

        _t0 = time.perf_counter()
        connector_service, firecrawl_api_key = await setup_connector_and_firecrawl(
@ -435,6 +432,7 @@ async def stream_new_chat(
            user_image_data_urls=user_image_data_urls,
            mentioned_document_ids=mentioned_document_ids,
            mentioned_folder_ids=mentioned_folder_ids,
+            mentioned_connectors=mentioned_connectors,
            mentioned_documents=mentioned_documents,
            needs_history_bootstrap=needs_history_bootstrap,
            thread_visibility=visibility,
@ -523,6 +521,14 @@ async def stream_new_chat(
            {"message_id": user_message_id, "turn_id": stream_result.turn_id},
        )

+        # Spawned only after the user row is confirmed, so a user-persist
+        # failure can't orphan an assistant shell on the same turn.
+        persist_asst_task = spawn_persist_assistant_shell_task(
+            chat_id=chat_id,
+            user_id=user_id,
+            turn_id=stream_result.turn_id,
+            background_tasks=_background_tasks,
+        )
        assistant_message_id = await await_persist_task(
            persist_asst_task,
            chat_id=chat_id,
@ -588,6 +594,8 @@ async def stream_new_chat(
            mentioned_document_ids=mentioned_document_ids,
            accepted_folder_ids=accepted_folder_ids,
            mentioned_folder_ids=mentioned_folder_ids,
+            mentioned_connector_ids=mentioned_connector_ids,
+            mentioned_connectors=mentioned_connectors,
            request_id=request_id,
            turn_id=stream_result.turn_id,
        )
--- a/surfsense_backend/app/tasks/chat/streaming/flows/new_chat/runtime_context.py
+++ b/surfsense_backend/app/tasks/chat/streaming/flows/new_chat/runtime_context.py
@ -17,6 +17,8 @@ def build_new_chat_runtime_context(
    mentioned_document_ids: list[int] | None,
    accepted_folder_ids: list[int],
    mentioned_folder_ids: list[int] | None,
+    mentioned_connector_ids: list[int] | None,
+    mentioned_connectors: list[dict[str, object]] | None,
    request_id: str | None,
    turn_id: str,
 ) -> SurfSenseContextSchema:
@ -26,11 +28,16 @@ def build_new_chat_runtime_context(
    ``mentioned_folder_ids`` from the request: the resolver drops chips that
    pointed at deleted folders or folders the caller can't see, so middlewares
    only get authorized ids.
+
+    Connector mentions are set on the schema for legacy parity even though no
+    middleware reads them yet.
    """
    return SurfSenseContextSchema(
        search_space_id=search_space_id,
        mentioned_document_ids=list(mentioned_document_ids or []),
        mentioned_folder_ids=list(accepted_folder_ids or mentioned_folder_ids or []),
+        mentioned_connector_ids=list(mentioned_connector_ids or []),
+        mentioned_connectors=list(mentioned_connectors or []),
        request_id=request_id,
        turn_id=turn_id,
    )
--- a/surfsense_backend/tests/unit/tasks/chat/streaming/test_parallel_refactor_parity.py
+++ b/surfsense_backend/tests/unit/tasks/chat/streaming/test_parallel_refactor_parity.py
@ -241,11 +241,14 @@ def test_image_capability_blocks_known_text_only_models() -> None:


 def test_new_chat_runtime_context_prefers_accepted_folder_ids() -> None:
+    """Post-resolve accepted folder ids win over the raw requested ids."""
    ctx = build_new_chat_runtime_context(
        search_space_id=7,
        mentioned_document_ids=[1, 2],
        accepted_folder_ids=[10],
        mentioned_folder_ids=[20, 30],
+        mentioned_connector_ids=None,
+        mentioned_connectors=None,
        request_id="req",
        turn_id="t1",
    )
@ -258,17 +261,41 @@ def test_new_chat_runtime_context_prefers_accepted_folder_ids() -> None:


 def test_new_chat_runtime_context_falls_back_to_mentioned_folder_ids() -> None:
+    """With no accepted ids, the raw requested folder ids flow through."""
    ctx = build_new_chat_runtime_context(
        search_space_id=7,
        mentioned_document_ids=None,
        accepted_folder_ids=[],
        mentioned_folder_ids=[20, 30],
+        mentioned_connector_ids=None,
+        mentioned_connectors=None,
        request_id=None,
        turn_id="t2",
    )
    assert list(ctx.mentioned_folder_ids) == [20, 30]


+def test_new_chat_runtime_context_propagates_connector_mentions() -> None:
+    """@-selected connector ids/accounts ride onto the runtime context schema.
+
+    Parity with the legacy ``stream_new_chat`` runtime context, which set both
+    ``mentioned_connector_ids`` and ``mentioned_connectors`` on the schema.
+    """
+    connectors = [{"id": 5, "connector_type": "SLACK_CONNECTOR", "title": "acme"}]
+    ctx = build_new_chat_runtime_context(
+        search_space_id=7,
+        mentioned_document_ids=None,
+        accepted_folder_ids=[],
+        mentioned_folder_ids=None,
+        mentioned_connector_ids=[5],
+        mentioned_connectors=connectors,
+        request_id=None,
+        turn_id="t3",
+    )
+    assert list(ctx.mentioned_connector_ids) == [5]
+    assert list(ctx.mentioned_connectors) == connectors
+
+
 def test_resume_chat_runtime_context_empty_mention_lists() -> None:
    ctx = build_resume_chat_runtime_context(
        search_space_id=42, request_id="req-r", turn_id="t-r"