Merge upstream/dev

2026-07-22 23:31:12 +02:00 · 2026-06-05 19:18:12 +02:00 · 2026-06-05 19:18:12 +02:00 · 8bdfd00a15
commit 8bdfd00a15
parent 52ff304d64 c2b8b3ac5e
191 changed files with 3301 additions and 4079 deletions
--- a/surfsense_backend/tests/e2e/fakes/llm.py
+++ b/surfsense_backend/tests/e2e/fakes/llm.py
@ -7,13 +7,13 @@ The production indexing pipeline summarizes documents with:
    summary_content = summary_result.content

 The `llm` parameter is supplied per-document by
-`app.services.llm_service.get_user_long_context_llm`. We patch THAT
+`app.services.llm_service.get_agent_llm`. We patch THAT
 function to return a langchain-native FakeListChatModel so the rest of
 the chain works unchanged. No real LLM provider package is touched.

 Run-backend / run-celery use unittest.mock.patch.start() to install
 this at every binding site (the source module + every consumer that
-did `from app.services.llm_service import get_user_long_context_llm`
+did `from app.services.llm_service import get_agent_llm`
 at module load time).
 """

@ -42,7 +42,7 @@ def _make_fake_llm() -> FakeListChatModel:
    return fake


-async def fake_get_user_long_context_llm(*args: Any, **kwargs: Any) -> Any:
-    """Drop-in replacement for app.services.llm_service.get_user_long_context_llm."""
+async def fake_get_agent_llm(*args: Any, **kwargs: Any) -> Any:
+    """Drop-in replacement for app.services.llm_service.get_agent_llm.
+
+    Accepts and ignores any positional or keyword arguments, logs that the
+    fake is being served, and returns the result of ``_make_fake_llm()``.
+    """
    logger.info("[fake-llm] returning FakeListChatModel for E2E indexing")
    return _make_fake_llm()
--- a/surfsense_backend/tests/e2e/run_backend.py
+++ b/surfsense_backend/tests/e2e/run_backend.py
@ -206,23 +206,23 @@ def _patch_llm_bindings() -> None:
        fake_create_chat_litellm_from_agent_config,
        fake_create_chat_litellm_from_config,
    )
-    from tests.e2e.fakes.llm import fake_get_user_long_context_llm
+    from tests.e2e.fakes.llm import fake_get_agent_llm

    targets = [
-        "app.services.llm_service.get_user_long_context_llm",
-        "app.tasks.connector_indexers.confluence_indexer.get_user_long_context_llm",
-        "app.tasks.connector_indexers.google_drive_indexer.get_user_long_context_llm",
-        "app.tasks.connector_indexers.google_gmail_indexer.get_user_long_context_llm",
-        "app.tasks.connector_indexers.notion_indexer.get_user_long_context_llm",
-        "app.tasks.connector_indexers.onedrive_indexer.get_user_long_context_llm",
-        "app.tasks.connector_indexers.dropbox_indexer.get_user_long_context_llm",
-        "app.tasks.connector_indexers.local_folder_indexer.get_user_long_context_llm",
-        "app.tasks.document_processors._save.get_user_long_context_llm",
-        "app.tasks.document_processors.markdown_processor.get_user_long_context_llm",
+        "app.services.llm_service.get_agent_llm",
+        "app.tasks.connector_indexers.confluence_indexer.get_agent_llm",
+        "app.tasks.connector_indexers.google_drive_indexer.get_agent_llm",
+        "app.tasks.connector_indexers.google_gmail_indexer.get_agent_llm",
+        "app.tasks.connector_indexers.notion_indexer.get_agent_llm",
+        "app.tasks.connector_indexers.onedrive_indexer.get_agent_llm",
+        "app.tasks.connector_indexers.dropbox_indexer.get_agent_llm",
+        "app.tasks.connector_indexers.local_folder_indexer.get_agent_llm",
+        "app.tasks.document_processors._save.get_agent_llm",
+        "app.tasks.document_processors.markdown_processor.get_agent_llm",
    ]
    for target in targets:
        try:
-            p = patch(target, fake_get_user_long_context_llm)
+            p = patch(target, fake_get_agent_llm)
            p.start()
            _active_patches.append(p)
            logger.info("[fake-llm] patched %s", target)
--- a/surfsense_backend/tests/e2e/run_celery.py
+++ b/surfsense_backend/tests/e2e/run_celery.py
@ -183,23 +183,23 @@ def _patch_llm_bindings() -> None:
        fake_create_chat_litellm_from_agent_config,
        fake_create_chat_litellm_from_config,
    )
-    from tests.e2e.fakes.llm import fake_get_user_long_context_llm
+    from tests.e2e.fakes.llm import fake_get_agent_llm

    targets = [
-        "app.services.llm_service.get_user_long_context_llm",
-        "app.tasks.connector_indexers.confluence_indexer.get_user_long_context_llm",
-        "app.tasks.connector_indexers.google_drive_indexer.get_user_long_context_llm",
-        "app.tasks.connector_indexers.google_gmail_indexer.get_user_long_context_llm",
-        "app.tasks.connector_indexers.notion_indexer.get_user_long_context_llm",
-        "app.tasks.connector_indexers.onedrive_indexer.get_user_long_context_llm",
-        "app.tasks.connector_indexers.dropbox_indexer.get_user_long_context_llm",
-        "app.tasks.connector_indexers.local_folder_indexer.get_user_long_context_llm",
-        "app.tasks.document_processors._save.get_user_long_context_llm",
-        "app.tasks.document_processors.markdown_processor.get_user_long_context_llm",
+        "app.services.llm_service.get_agent_llm",
+        "app.tasks.connector_indexers.confluence_indexer.get_agent_llm",
+        "app.tasks.connector_indexers.google_drive_indexer.get_agent_llm",
+        "app.tasks.connector_indexers.google_gmail_indexer.get_agent_llm",
+        "app.tasks.connector_indexers.notion_indexer.get_agent_llm",
+        "app.tasks.connector_indexers.onedrive_indexer.get_agent_llm",
+        "app.tasks.connector_indexers.dropbox_indexer.get_agent_llm",
+        "app.tasks.connector_indexers.local_folder_indexer.get_agent_llm",
+        "app.tasks.document_processors._save.get_agent_llm",
+        "app.tasks.document_processors.markdown_processor.get_agent_llm",
    ]
    for target in targets:
        try:
-            p = patch(target, fake_get_user_long_context_llm)
+            p = patch(target, fake_get_agent_llm)
            p.start()
            _active_patches.append(p)
            logger.info("[fake-llm] patched %s in celery worker", target)
--- a/surfsense_backend/tests/integration/chat/test_thread_visibility.py
+++ b/surfsense_backend/tests/integration/chat/test_thread_visibility.py
@ -0,0 +1,279 @@
+"""Integration tests for new-chat thread visibility invariants.
+
+These tests exercise the route handlers directly with real DB-backed
+users, memberships, and permissions. The important contract is that a
+thread shared with a search space stays shared across normal metadata
+updates until the creator explicitly makes it private again.
+"""
+
+from __future__ import annotations
+
+import uuid
+
+import pytest
+import pytest_asyncio
+from fastapi import HTTPException
+from sqlalchemy import select
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from app.db import (
+    ChatVisibility,
+    SearchSpace,
+    SearchSpaceMembership,
+    SearchSpaceRole,
+    User,
+)
+from app.routes import new_chat_routes
+from app.schemas.new_chat import (
+    NewChatThreadCreate,
+    NewChatThreadUpdate,
+    NewChatThreadVisibilityUpdate,
+)
+
+pytestmark = pytest.mark.integration
+
+
+@pytest_asyncio.fixture
+async def db_member(db_session: AsyncSession, db_search_space: SearchSpace) -> User:
+    """Create a second, non-owner user who is a member of ``db_search_space``.
+
+    The user is added to the session and linked to the search space through
+    a ``SearchSpaceMembership`` that uses the space's "Editor" role with
+    ``is_owner=False``. Both inserts are flushed; this fixture itself does
+    not commit.
+    """
+    member = User(
+        id=uuid.uuid4(),
+        email="member@surfsense.net",
+        hashed_password="hashed",
+        is_active=True,
+        is_superuser=False,
+        is_verified=True,
+    )
+    db_session.add(member)
+    await db_session.flush()
+
+    # Look up the "Editor" role of this search space. `.one()` raises unless
+    # exactly one matching row exists; presumably the role is seeded when the
+    # search space is created -- confirm against the `db_search_space` fixture.
+    role = (
+        (
+            await db_session.execute(
+                select(SearchSpaceRole).where(
+                    SearchSpaceRole.search_space_id == db_search_space.id,
+                    SearchSpaceRole.name == "Editor",
+                )
+            )
+        )
+        .scalars()
+        .one()
+    )
+    db_session.add(
+        SearchSpaceMembership(
+            user_id=member.id,
+            search_space_id=db_search_space.id,
+            role_id=role.id,
+            is_owner=False,
+        )
+    )
+    await db_session.flush()
+    return member
+
+
+async def _create_thread(
+    db_session: AsyncSession,
+    db_user: User,
+    db_search_space: SearchSpace,
+    *,
+    title: str = "Visibility Invariant Chat",
+):
+    """Create a thread by calling the ``create_thread`` route handler directly.
+
+    The thread is created on behalf of ``db_user`` in ``db_search_space``,
+    always with ``archived=False`` and ``ChatVisibility.PRIVATE``; only the
+    title can be overridden. Returns whatever the route handler returns.
+    """
+    return await new_chat_routes.create_thread(
+        NewChatThreadCreate(
+            title=title,
+            archived=False,
+            search_space_id=db_search_space.id,
+            visibility=ChatVisibility.PRIVATE,
+        ),
+        session=db_session,
+        user=db_user,
+    )
+
+
+def _active_thread_ids(response) -> set[int]:
+    """Return the set of ids of the threads in ``response.threads``.
+
+    Used in this module on the value returned by ``list_threads``.
+    """
+    return {thread.id for thread in response.threads}
+
+
+def _search_thread_ids(response) -> set[int]:
+    """Return the set of ids of the threads yielded by iterating ``response``.
+
+    Used in this module on the value returned by ``search_threads``.
+    """
+    return {thread.id for thread in response}
+
+
+async def test_private_thread_is_hidden_from_other_search_space_member(
+    db_session: AsyncSession,
+    db_user: User,
+    db_member: User,
+    db_search_space: SearchSpace,
+):
+    """A private thread is invisible to another member of the search space.
+
+    The thread created by ``db_user`` must be absent from ``db_member``'s
+    ``list_threads`` and ``search_threads`` results, and ``get_thread_full``
+    must raise an ``HTTPException`` with status 403 for ``db_member``.
+    """
+    thread = await _create_thread(db_session, db_user, db_search_space)
+
+    member_threads = await new_chat_routes.list_threads(
+        search_space_id=db_search_space.id,
+        session=db_session,
+        user=db_member,
+    )
+    # "Visibility" is part of the default title used by `_create_thread`;
+    # presumably the search matches titles partially -- confirm in the route.
+    member_search = await new_chat_routes.search_threads(
+        search_space_id=db_search_space.id,
+        title="Visibility",
+        session=db_session,
+        user=db_member,
+    )
+
+    assert thread.id not in _active_thread_ids(member_threads)
+    assert thread.id not in _search_thread_ids(member_search)
+    with pytest.raises(HTTPException) as exc_info:
+        await new_chat_routes.get_thread_full(
+            thread_id=thread.id,
+            session=db_session,
+            user=db_member,
+        )
+    assert exc_info.value.status_code == 403
+
+
+async def test_creator_can_share_thread_and_member_can_list_search_read_it(
+    db_session: AsyncSession,
+    db_user: User,
+    db_member: User,
+    db_search_space: SearchSpace,
+):
+    """Sharing a thread with the search space exposes it to another member.
+
+    After the creator switches the thread to ``ChatVisibility.SEARCH_SPACE``,
+    ``db_member`` must find it via ``list_threads`` and ``search_threads``
+    and be able to load it with ``get_thread_full``.
+    """
+    thread = await _create_thread(db_session, db_user, db_search_space)
+
+    updated = await new_chat_routes.update_thread_visibility(
+        thread_id=thread.id,
+        visibility_update=NewChatThreadVisibilityUpdate(
+            visibility=ChatVisibility.SEARCH_SPACE,
+        ),
+        session=db_session,
+        user=db_user,
+    )
+
+    member_threads = await new_chat_routes.list_threads(
+        search_space_id=db_search_space.id,
+        session=db_session,
+        user=db_member,
+    )
+    member_search = await new_chat_routes.search_threads(
+        search_space_id=db_search_space.id,
+        title="Visibility",
+        session=db_session,
+        user=db_member,
+    )
+    full_thread = await new_chat_routes.get_thread_full(
+        thread_id=thread.id,
+        session=db_session,
+        user=db_member,
+    )
+
+    assert updated.visibility == ChatVisibility.SEARCH_SPACE
+    assert thread.id in _active_thread_ids(member_threads)
+    assert thread.id in _search_thread_ids(member_search)
+    # Unlike the other handlers used here, the `get_thread_full` result is
+    # read with key access rather than attribute access.
+    assert full_thread["id"] == thread.id
+    assert full_thread["visibility"] == ChatVisibility.SEARCH_SPACE
+
+
+async def test_rename_and_archive_do_not_reset_shared_visibility(
+    db_session: AsyncSession,
+    db_user: User,
+    db_search_space: SearchSpace,
+):
+    """Metadata updates must leave a shared thread's visibility untouched.
+
+    The thread is shared with the search space, then renamed and archived
+    through ``update_thread`` in two separate calls; both responses must
+    still report ``ChatVisibility.SEARCH_SPACE``.
+    """
+    thread = await _create_thread(db_session, db_user, db_search_space)
+    await new_chat_routes.update_thread_visibility(
+        thread_id=thread.id,
+        visibility_update=NewChatThreadVisibilityUpdate(
+            visibility=ChatVisibility.SEARCH_SPACE,
+        ),
+        session=db_session,
+        user=db_user,
+    )
+
+    # Each update sets only one field; visibility is not part of either payload.
+    renamed = await new_chat_routes.update_thread(
+        thread_id=thread.id,
+        thread_update=NewChatThreadUpdate(title="Renamed Shared Chat"),
+        session=db_session,
+        user=db_user,
+    )
+    archived = await new_chat_routes.update_thread(
+        thread_id=thread.id,
+        thread_update=NewChatThreadUpdate(archived=True),
+        session=db_session,
+        user=db_user,
+    )
+
+    assert renamed.visibility == ChatVisibility.SEARCH_SPACE
+    assert archived.visibility == ChatVisibility.SEARCH_SPACE
+    assert archived.archived is True
+
+
+async def test_non_creator_cannot_change_shared_thread_back_to_private(
+    db_session: AsyncSession,
+    db_user: User,
+    db_member: User,
+    db_search_space: SearchSpace,
+):
+    """Only the creator may make a shared thread private again.
+
+    After ``db_user`` shares the thread, an attempt by ``db_member`` to set
+    it back to ``ChatVisibility.PRIVATE`` must raise an ``HTTPException``
+    with status 403.
+    """
+    thread = await _create_thread(db_session, db_user, db_search_space)
+    await new_chat_routes.update_thread_visibility(
+        thread_id=thread.id,
+        visibility_update=NewChatThreadVisibilityUpdate(
+            visibility=ChatVisibility.SEARCH_SPACE,
+        ),
+        session=db_session,
+        user=db_user,
+    )
+
+    with pytest.raises(HTTPException) as exc_info:
+        await new_chat_routes.update_thread_visibility(
+            thread_id=thread.id,
+            visibility_update=NewChatThreadVisibilityUpdate(
+                visibility=ChatVisibility.PRIVATE,
+            ),
+            session=db_session,
+            user=db_member,
+        )
+
+    assert exc_info.value.status_code == 403
+
+
+async def test_creator_can_make_shared_thread_private_again(
+    db_session: AsyncSession,
+    db_user: User,
+    db_member: User,
+    db_search_space: SearchSpace,
+):
+    """The creator can revert a shared thread to private, hiding it again.
+
+    Once ``db_user`` switches the thread from ``SEARCH_SPACE`` back to
+    ``PRIVATE``, ``db_member`` must no longer see it in ``list_threads`` or
+    ``search_threads``, and ``get_thread_full`` must raise an
+    ``HTTPException`` with status 403.
+    """
+    thread = await _create_thread(db_session, db_user, db_search_space)
+    await new_chat_routes.update_thread_visibility(
+        thread_id=thread.id,
+        visibility_update=NewChatThreadVisibilityUpdate(
+            visibility=ChatVisibility.SEARCH_SPACE,
+        ),
+        session=db_session,
+        user=db_user,
+    )
+
+    private_again = await new_chat_routes.update_thread_visibility(
+        thread_id=thread.id,
+        visibility_update=NewChatThreadVisibilityUpdate(
+            visibility=ChatVisibility.PRIVATE,
+        ),
+        session=db_session,
+        user=db_user,
+    )
+    member_threads = await new_chat_routes.list_threads(
+        search_space_id=db_search_space.id,
+        session=db_session,
+        user=db_member,
+    )
+    member_search = await new_chat_routes.search_threads(
+        search_space_id=db_search_space.id,
+        title="Visibility",
+        session=db_session,
+        user=db_member,
+    )
+
+    assert private_again.visibility == ChatVisibility.PRIVATE
+    assert thread.id not in _active_thread_ids(member_threads)
+    assert thread.id not in _search_thread_ids(member_search)
+    with pytest.raises(HTTPException) as exc_info:
+        await new_chat_routes.get_thread_full(
+            thread_id=thread.id,
+            session=db_session,
+            user=db_member,
+        )
+    assert exc_info.value.status_code == 403
--- a/surfsense_backend/tests/integration/conftest.py
+++ b/surfsense_backend/tests/integration/conftest.py
@ -1,7 +1,7 @@
 import importlib
 import sys
 import uuid
-from unittest.mock import AsyncMock, MagicMock
+from unittest.mock import MagicMock

 import pytest
 import pytest_asyncio
@ -123,26 +123,6 @@ async def db_search_space(db_session: AsyncSession, db_user: User) -> SearchSpac
    return space


-@pytest.fixture
-def patched_summarize(monkeypatch) -> AsyncMock:
-    mock = AsyncMock(return_value="Mocked summary.")
-    monkeypatch.setattr(
-        "app.indexing_pipeline.indexing_pipeline_service.summarize_document",
-        mock,
-    )
-    return mock
-
-
-@pytest.fixture
-def patched_summarize_raises(monkeypatch) -> AsyncMock:
-    mock = AsyncMock(side_effect=RuntimeError("LLM unavailable"))
-    monkeypatch.setattr(
-        "app.indexing_pipeline.indexing_pipeline_service.summarize_document",
-        mock,
-    )
-    return mock
-
-
@pytest.fixture
 def patched_embed_texts(monkeypatch) -> MagicMock:
    mock = MagicMock(side_effect=lambda texts: [[0.1] * _EMBEDDING_DIM for _ in texts])
@ -153,6 +133,16 @@ def patched_embed_texts(monkeypatch) -> MagicMock:
    return mock


+@pytest.fixture
+def patched_embed_texts_raises(monkeypatch) -> MagicMock:
+    """Make ``embed_texts`` in the indexing pipeline service always fail.
+
+    Replaces ``app.indexing_pipeline.indexing_pipeline_service.embed_texts``
+    with a ``MagicMock`` that raises ``RuntimeError("Embedding unavailable")``
+    whenever it is called, and returns that mock.
+    """
+    mock = MagicMock(side_effect=RuntimeError("Embedding unavailable"))
+    monkeypatch.setattr(
+        "app.indexing_pipeline.indexing_pipeline_service.embed_texts",
+        mock,
+    )
+    return mock
+
+
@pytest.fixture
 def patched_chunk_text(monkeypatch) -> MagicMock:
    mock = MagicMock(return_value=["Test chunk content."])
--- a/surfsense_backend/tests/integration/document_upload/conftest.py
+++ b/surfsense_backend/tests/integration/document_upload/conftest.py
@ -68,7 +68,6 @@ class InlineTaskDispatcher:
        filename: str,
        search_space_id: int,
        user_id: str,
-        should_summarize: bool = False,
        use_vision_llm: bool = False,
        processing_mode: str = "basic",
    ) -> None:
@ -83,7 +82,6 @@ class InlineTaskDispatcher:
                filename,
                search_space_id,
                user_id,
-                should_summarize=should_summarize,
                use_vision_llm=use_vision_llm,
                processing_mode=processing_mode,
            )
@ -266,10 +264,6 @@ async def page_limits():
@pytest.fixture(autouse=True)
 def _mock_external_apis(monkeypatch):
    """Mock LLM, embedding, and chunking — these are external API boundaries."""
-    monkeypatch.setattr(
-        "app.indexing_pipeline.indexing_pipeline_service.summarize_document",
-        AsyncMock(return_value="Mocked summary."),
-    )
    monkeypatch.setattr(
        "app.indexing_pipeline.indexing_pipeline_service.embed_texts",
        MagicMock(side_effect=lambda texts: [[0.1] * _EMBEDDING_DIM for _ in texts]),
--- a/surfsense_backend/tests/integration/indexing_pipeline/adapters/test_file_upload_adapter.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/adapters/test_file_upload_adapter.py
@ -8,7 +8,7 @@ pytestmark = pytest.mark.integration


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+"patched_embed_texts", "patched_chunk_text"
 )
 async def test_sets_status_ready(db_session, db_search_space, db_user, mocker):
    """Document status is READY after successful indexing."""
@ -19,7 +19,6 @@ async def test_sets_status_ready(db_session, db_search_space, db_user, mocker):
        etl_service="UNSTRUCTURED",
        search_space_id=db_search_space.id,
        user_id=str(db_user.id),
-        llm=mocker.Mock(),
    )

    result = await db_session.execute(
@ -31,10 +30,10 @@ async def test_sets_status_ready(db_session, db_search_space, db_user, mocker):


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+"patched_embed_texts", "patched_chunk_text"
 )
-async def test_content_is_summary(db_session, db_search_space, db_user, mocker):
-    """Document content is set to the LLM-generated summary."""
+async def test_content_is_source_markdown(db_session, db_search_space, db_user, mocker):
+    """Document content is set to the extracted source markdown."""
    adapter = UploadDocumentAdapter(db_session)
    await adapter.index(
        markdown_content="## Hello\n\nSome content.",
@ -42,8 +41,6 @@ async def test_content_is_summary(db_session, db_search_space, db_user, mocker):
        etl_service="UNSTRUCTURED",
        search_space_id=db_search_space.id,
        user_id=str(db_user.id),
-        llm=mocker.Mock(),
-        should_summarize=True,
    )

    result = await db_session.execute(
@ -51,11 +48,11 @@ async def test_content_is_summary(db_session, db_search_space, db_user, mocker):
    )
    document = result.scalars().first()

-    assert document.content == "Mocked summary."
+    assert document.content == "## Hello\n\nSome content."


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+"patched_embed_texts", "patched_chunk_text"
 )
 async def test_chunks_written_to_db(db_session, db_search_space, db_user, mocker):
    """Chunks derived from the source markdown are persisted in the DB."""
@ -66,7 +63,6 @@ async def test_chunks_written_to_db(db_session, db_search_space, db_user, mocker
        etl_service="UNSTRUCTURED",
        search_space_id=db_search_space.id,
        user_id=str(db_user.id),
-        llm=mocker.Mock(),
    )

    result = await db_session.execute(
@ -83,9 +79,7 @@ async def test_chunks_written_to_db(db_session, db_search_space, db_user, mocker
    assert chunks[0].content == "Test chunk content."


-@pytest.mark.usefixtures(
-    "patched_summarize_raises", "patched_embed_texts", "patched_chunk_text"
-)
+@pytest.mark.usefixtures("patched_embed_texts_raises", "patched_chunk_text")
 async def test_raises_on_indexing_failure(db_session, db_search_space, db_user, mocker):
    """RuntimeError is raised when the indexing step fails so the caller can fire a failure notification."""
    adapter = UploadDocumentAdapter(db_session)
@ -96,8 +90,6 @@ async def test_raises_on_indexing_failure(db_session, db_search_space, db_user,
            etl_service="UNSTRUCTURED",
            search_space_id=db_search_space.id,
            user_id=str(db_user.id),
-            llm=mocker.Mock(),
-            should_summarize=True,
        )


@ -107,10 +99,10 @@ async def test_raises_on_indexing_failure(db_session, db_search_space, db_user,


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+"patched_embed_texts", "patched_chunk_text"
 )
 async def test_reindex_updates_content(db_session, db_search_space, db_user, mocker):
-    """Document content is updated to the new summary after reindexing."""
+    """Document content is updated to the new source markdown after reindexing."""
    adapter = UploadDocumentAdapter(db_session)
    await adapter.index(
        markdown_content="## Original\n\nOriginal content.",
@ -118,7 +110,6 @@ async def test_reindex_updates_content(db_session, db_search_space, db_user, moc
        etl_service="UNSTRUCTURED",
        search_space_id=db_search_space.id,
        user_id=str(db_user.id),
-        llm=mocker.Mock(),
    )

    result = await db_session.execute(
@ -129,14 +120,14 @@ async def test_reindex_updates_content(db_session, db_search_space, db_user, moc
    document.source_markdown = "## Edited\n\nNew content after user edit."
    await db_session.flush()

-    await adapter.reindex(document=document, llm=mocker.Mock())
+    await adapter.reindex(document=document)

    await db_session.refresh(document)
-    assert document.content == "Mocked summary."
+    assert document.content == "## Edited\n\nNew content after user edit."


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+"patched_embed_texts", "patched_chunk_text"
 )
 async def test_reindex_updates_content_hash(
    db_session, db_search_space, db_user, mocker
@ -149,7 +140,6 @@ async def test_reindex_updates_content_hash(
        etl_service="UNSTRUCTURED",
        search_space_id=db_search_space.id,
        user_id=str(db_user.id),
-        llm=mocker.Mock(),
    )

    result = await db_session.execute(
@ -161,14 +151,14 @@ async def test_reindex_updates_content_hash(
    document.source_markdown = "## Edited\n\nNew content after user edit."
    await db_session.flush()

-    await adapter.reindex(document=document, llm=mocker.Mock())
+    await adapter.reindex(document=document)

    await db_session.refresh(document)
    assert document.content_hash != original_hash


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+"patched_embed_texts", "patched_chunk_text"
 )
 async def test_reindex_sets_status_ready(db_session, db_search_space, db_user, mocker):
    """Document status is READY after successful reindexing."""
@ -179,7 +169,6 @@ async def test_reindex_sets_status_ready(db_session, db_search_space, db_user, m
        etl_service="UNSTRUCTURED",
        search_space_id=db_search_space.id,
        user_id=str(db_user.id),
-        llm=mocker.Mock(),
    )

    result = await db_session.execute(
@ -190,13 +179,13 @@ async def test_reindex_sets_status_ready(db_session, db_search_space, db_user, m
    document.source_markdown = "## Edited\n\nNew content after user edit."
    await db_session.flush()

-    await adapter.reindex(document=document, llm=mocker.Mock())
+    await adapter.reindex(document=document)

    await db_session.refresh(document)
    assert DocumentStatus.is_state(document.status, DocumentStatus.READY)


-@pytest.mark.usefixtures("patched_summarize", "patched_embed_texts")
+@pytest.mark.usefixtures("patched_embed_texts")
 async def test_reindex_replaces_chunks(db_session, db_search_space, db_user, mocker):
    """Reindexing replaces old chunks with new content rather than appending."""
    mocker.patch(
@ -211,7 +200,6 @@ async def test_reindex_replaces_chunks(db_session, db_search_space, db_user, moc
        etl_service="UNSTRUCTURED",
        search_space_id=db_search_space.id,
        user_id=str(db_user.id),
-        llm=mocker.Mock(),
    )

    result = await db_session.execute(
@ -223,7 +211,7 @@ async def test_reindex_replaces_chunks(db_session, db_search_space, db_user, moc
    document.source_markdown = "## Edited\n\nNew content after user edit."
    await db_session.flush()

-    await adapter.reindex(document=document, llm=mocker.Mock())
+    await adapter.reindex(document=document)

    chunks_result = await db_session.execute(
        select(Chunk).filter(Chunk.document_id == document_id)
@ -235,7 +223,7 @@ async def test_reindex_replaces_chunks(db_session, db_search_space, db_user, moc


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+"patched_embed_texts", "patched_chunk_text"
 )
 async def test_reindex_clears_reindexing_flag(
    db_session, db_search_space, db_user, mocker
@ -248,7 +236,6 @@ async def test_reindex_clears_reindexing_flag(
        etl_service="UNSTRUCTURED",
        search_space_id=db_search_space.id,
        user_id=str(db_user.id),
-        llm=mocker.Mock(),
    )

    result = await db_session.execute(
@ -260,19 +247,17 @@ async def test_reindex_clears_reindexing_flag(
    document.content_needs_reindexing = True
    await db_session.flush()

-    await adapter.reindex(document=document, llm=mocker.Mock())
+    await adapter.reindex(document=document)

    await db_session.refresh(document)
    assert document.content_needs_reindexing is False


@pytest.mark.usefixtures("patched_embed_texts", "patched_chunk_text")
-async def test_reindex_raises_on_failure(db_session, db_search_space, db_user, mocker):
+async def test_reindex_raises_on_failure(
+    db_session, db_search_space, db_user, patched_embed_texts, mocker
+):
    """RuntimeError is raised when reindexing fails so the caller can handle it."""
-    mocker.patch(
-        "app.indexing_pipeline.indexing_pipeline_service.summarize_document",
-        return_value="Mocked summary.",
-    )

    adapter = UploadDocumentAdapter(db_session)
    await adapter.index(
@ -281,7 +266,6 @@ async def test_reindex_raises_on_failure(db_session, db_search_space, db_user, m
        etl_service="UNSTRUCTURED",
        search_space_id=db_search_space.id,
        user_id=str(db_user.id),
-        llm=mocker.Mock(),
    )

    result = await db_session.execute(
@ -292,13 +276,10 @@ async def test_reindex_raises_on_failure(db_session, db_search_space, db_user, m
    document.source_markdown = "## Edited\n\nNew content after user edit."
    await db_session.flush()

-    mocker.patch(
-        "app.indexing_pipeline.indexing_pipeline_service.summarize_document",
-        side_effect=RuntimeError("LLM unavailable"),
-    )
+    patched_embed_texts.side_effect = RuntimeError("Embedding unavailable")

    with pytest.raises(RuntimeError, match=r"Embedding failed|Reindexing failed"):
-        await adapter.reindex(document=document, llm=mocker.Mock())
+        await adapter.reindex(document=document)


 async def test_reindex_raises_on_empty_source_markdown(
@ -323,4 +304,4 @@ async def test_reindex_raises_on_empty_source_markdown(
    adapter = UploadDocumentAdapter(db_session)

    with pytest.raises(RuntimeError, match="no source_markdown"):
-        await adapter.reindex(document=document, llm=mocker.Mock())
+        await adapter.reindex(document=document)
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_calendar_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_calendar_pipeline.py
@ -25,8 +25,6 @@ def _cal_doc(
        search_space_id=search_space_id,
        connector_id=connector_id,
        created_by_id=user_id,
-        should_summarize=True,
-        fallback_summary=f"Calendar: Event {unique_id}",
        metadata={
            "event_id": unique_id,
            "start_time": "2025-01-15T10:00:00",
@ -37,7 +35,7 @@ def _cal_doc(


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+"patched_embed_texts", "patched_chunk_text"
 )
 async def test_calendar_pipeline_creates_ready_document(
    db_session, db_search_space, db_connector, db_user, mocker
@ -55,7 +53,7 @@ async def test_calendar_pipeline_creates_ready_document(
    prepared = await service.prepare_for_indexing([doc])
    assert len(prepared) == 1

-    await service.index(prepared[0], doc, llm=mocker.Mock())
+    await service.index(prepared[0], doc)

    result = await db_session.execute(
        select(Document).filter(Document.search_space_id == space_id)
@ -68,7 +66,7 @@ async def test_calendar_pipeline_creates_ready_document(


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+"patched_embed_texts", "patched_chunk_text"
 )
 async def test_calendar_legacy_doc_migrated(
    db_session, db_search_space, db_connector, db_user, mocker
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_drive_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_drive_pipeline.py
@ -25,8 +25,6 @@ def _drive_doc(
        search_space_id=search_space_id,
        connector_id=connector_id,
        created_by_id=user_id,
-        should_summarize=True,
-        fallback_summary=f"File: {unique_id}.pdf",
        metadata={
            "google_drive_file_id": unique_id,
            "google_drive_file_name": f"{unique_id}.pdf",
@ -36,7 +34,7 @@ def _drive_doc(


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+"patched_embed_texts", "patched_chunk_text"
 )
 async def test_drive_pipeline_creates_ready_document(
    db_session, db_search_space, db_connector, db_user, mocker
@ -54,7 +52,7 @@ async def test_drive_pipeline_creates_ready_document(
    prepared = await service.prepare_for_indexing([doc])
    assert len(prepared) == 1

-    await service.index(prepared[0], doc, llm=mocker.Mock())
+    await service.index(prepared[0], doc)

    result = await db_session.execute(
        select(Document).filter(Document.search_space_id == space_id)
@ -67,7 +65,7 @@ async def test_drive_pipeline_creates_ready_document(


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+"patched_embed_texts", "patched_chunk_text"
 )
 async def test_drive_legacy_doc_migrated(
    db_session, db_search_space, db_connector, db_user, mocker
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_dropbox_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_dropbox_pipeline.py
@ -24,8 +24,6 @@ def _dropbox_doc(
        search_space_id=search_space_id,
        connector_id=connector_id,
        created_by_id=user_id,
-        should_summarize=True,
-        fallback_summary=f"File: {unique_id}.docx",
        metadata={
            "dropbox_file_id": unique_id,
            "dropbox_file_name": f"{unique_id}.docx",
@ -35,7 +33,7 @@ def _dropbox_doc(


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+"patched_embed_texts", "patched_chunk_text"
 )
 async def test_dropbox_pipeline_creates_ready_document(
    db_session, db_search_space, db_connector, db_user, mocker
@ -53,7 +51,7 @@ async def test_dropbox_pipeline_creates_ready_document(
    prepared = await service.prepare_for_indexing([doc])
    assert len(prepared) == 1

-    await service.index(prepared[0], doc, llm=mocker.Mock())
+    await service.index(prepared[0], doc)

    result = await db_session.execute(
        select(Document).filter(Document.search_space_id == space_id)
@ -66,7 +64,7 @@ async def test_dropbox_pipeline_creates_ready_document(


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+    "patched_embed_texts", "patched_chunk_text"
 )
 async def test_dropbox_duplicate_content_skipped(
    db_session, db_search_space, db_connector, db_user, mocker
@ -86,7 +84,7 @@ async def test_dropbox_duplicate_content_skipped(

    prepared = await service.prepare_for_indexing([doc])
    assert len(prepared) == 1
-    await service.index(prepared[0], doc, llm=mocker.Mock())
+    await service.index(prepared[0], doc)

    result = await db_session.execute(
        select(Document).filter(Document.search_space_id == space_id)
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_gmail_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_gmail_pipeline.py
@ -28,8 +28,6 @@ def _gmail_doc(
        search_space_id=search_space_id,
        connector_id=connector_id,
        created_by_id=user_id,
-        should_summarize=True,
-        fallback_summary=f"Gmail: Subject for {unique_id}",
        metadata={
            "message_id": unique_id,
            "from": "sender@example.com",
@ -39,7 +37,7 @@ def _gmail_doc(


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+    "patched_embed_texts", "patched_chunk_text"
 )
 async def test_gmail_pipeline_creates_ready_document(
    db_session, db_search_space, db_connector, db_user, mocker
@ -57,7 +55,7 @@ async def test_gmail_pipeline_creates_ready_document(
    prepared = await service.prepare_for_indexing([doc])
    assert len(prepared) == 1

-    await service.index(prepared[0], doc, llm=mocker.Mock())
+    await service.index(prepared[0], doc)

    result = await db_session.execute(
        select(Document).filter(Document.search_space_id == space_id)
@ -71,7 +69,7 @@ async def test_gmail_pipeline_creates_ready_document(


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+    "patched_embed_texts", "patched_chunk_text"
 )
 async def test_gmail_legacy_doc_migrated_then_reused(
    db_session, db_search_space, db_connector, db_user, mocker
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_index_batch.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_index_batch.py
@ -10,7 +10,7 @@ pytestmark = pytest.mark.integration


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+    "patched_embed_texts", "patched_chunk_text"
 )
 async def test_index_batch_creates_ready_documents(
    db_session, db_search_space, make_connector_document, mocker
@ -33,7 +33,7 @@ async def test_index_batch_creates_ready_documents(
    ]

    service = IndexingPipelineService(session=db_session)
-    results = await service.index_batch(docs, llm=mocker.Mock())
+    results = await service.index_batch(docs)

    assert len(results) == 2

@ -50,10 +50,10 @@ async def test_index_batch_creates_ready_documents(


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+    "patched_embed_texts", "patched_chunk_text"
 )
 async def test_index_batch_empty_returns_empty(db_session, mocker):
    """index_batch with empty input returns an empty list."""
    service = IndexingPipelineService(session=db_session)
-    results = await service.index_batch([], llm=mocker.Mock())
+    results = await service.index_batch([])
    assert results == []
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_index_document.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_index_document.py
@ -10,9 +10,7 @@ _EMBEDDING_DIM = app_config.embedding_model_instance.dimension
 pytestmark = pytest.mark.integration


-@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
-)
+@pytest.mark.usefixtures("patched_embed_texts", "patched_chunk_text")
 async def test_sets_status_ready(
    db_session,
    db_search_space,
@ -27,7 +25,7 @@ async def test_sets_status_ready(
    document = prepared[0]
    document_id = document.id

-    await service.index(document, connector_doc, llm=mocker.Mock())
+    await service.index(document, connector_doc)

    result = await db_session.execute(
        select(Document).filter(Document.id == document_id)
@ -37,16 +35,14 @@ async def test_sets_status_ready(
    assert DocumentStatus.is_state(reloaded.status, DocumentStatus.READY)


-@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
-)
-async def test_content_is_summary_when_should_summarize_true(
+@pytest.mark.usefixtures("patched_embed_texts", "patched_chunk_text")
+async def test_content_is_source_markdown_by_default(
    db_session,
    db_search_space,
    make_connector_document,
    mocker,
 ):
-    """Document content is set to the LLM-generated summary when should_summarize=True."""
+    """Document content is set to source_markdown by default."""
    connector_doc = make_connector_document(search_space_id=db_search_space.id)
    service = IndexingPipelineService(session=db_session)

@ -54,28 +50,25 @@ async def test_content_is_summary_when_should_summarize_true(
    document = prepared[0]
    document_id = document.id

-    await service.index(document, connector_doc, llm=mocker.Mock())
+    await service.index(document, connector_doc)

    result = await db_session.execute(
        select(Document).filter(Document.id == document_id)
    )
    reloaded = result.scalars().first()

-    assert reloaded.content == "Mocked summary."
+    assert reloaded.content == connector_doc.source_markdown


-@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
-)
-async def test_content_is_source_markdown_when_should_summarize_false(
+@pytest.mark.usefixtures("patched_embed_texts", "patched_chunk_text")
+async def test_content_is_source_markdown_when_custom_content(
    db_session,
    db_search_space,
    make_connector_document,
 ):
-    """Document content is set to source_markdown verbatim when should_summarize=False."""
+    """Document content is set to source_markdown verbatim."""
    connector_doc = make_connector_document(
        search_space_id=db_search_space.id,
-        should_summarize=False,
        source_markdown="## Raw content",
    )
    service = IndexingPipelineService(session=db_session)
@ -84,7 +77,7 @@ async def test_content_is_source_markdown_when_should_summarize_false(
    document = prepared[0]
    document_id = document.id

-    await service.index(document, connector_doc, llm=None)
+    await service.index(document, connector_doc)

    result = await db_session.execute(
        select(Document).filter(Document.id == document_id)
@ -94,9 +87,7 @@ async def test_content_is_source_markdown_when_should_summarize_false(
    assert reloaded.content == "## Raw content"


-@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
-)
+@pytest.mark.usefixtures("patched_embed_texts", "patched_chunk_text")
 async def test_chunks_written_to_db(
    db_session,
    db_search_space,
@ -111,7 +102,7 @@ async def test_chunks_written_to_db(
    document = prepared[0]
    document_id = document.id

-    await service.index(document, connector_doc, llm=mocker.Mock())
+    await service.index(document, connector_doc)

    result = await db_session.execute(
        select(Chunk).filter(Chunk.document_id == document_id)
@ -122,9 +113,7 @@ async def test_chunks_written_to_db(
    assert chunks[0].content == "Test chunk content."


-@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
-)
+@pytest.mark.usefixtures("patched_embed_texts", "patched_chunk_text")
 async def test_embedding_written_to_db(
    db_session,
    db_search_space,
@ -139,7 +128,7 @@ async def test_embedding_written_to_db(
    document = prepared[0]
    document_id = document.id

-    await service.index(document, connector_doc, llm=mocker.Mock())
+    await service.index(document, connector_doc)

    result = await db_session.execute(
        select(Document).filter(Document.id == document_id)
@ -150,9 +139,7 @@ async def test_embedding_written_to_db(
    assert len(reloaded.embedding) == _EMBEDDING_DIM


-@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
-)
+@pytest.mark.usefixtures("patched_embed_texts", "patched_chunk_text")
 async def test_updated_at_advances_after_indexing(
    db_session,
    db_search_space,
@ -172,7 +159,7 @@ async def test_updated_at_advances_after_indexing(
    )
    updated_at_pending = result.scalars().first().updated_at

-    await service.index(document, connector_doc, llm=mocker.Mock())
+    await service.index(document, connector_doc)

    result = await db_session.execute(
        select(Document).filter(Document.id == document_id)
@ -182,18 +169,15 @@ async def test_updated_at_advances_after_indexing(
    assert updated_at_ready > updated_at_pending


-@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
-)
+@pytest.mark.usefixtures("patched_embed_texts", "patched_chunk_text")
 async def test_no_llm_falls_back_to_source_markdown(
    db_session,
    db_search_space,
    make_connector_document,
 ):
-    """When llm=None and no fallback_summary, content falls back to source_markdown."""
+    """Content stays deterministic source markdown without an LLM."""
    connector_doc = make_connector_document(
        search_space_id=db_search_space.id,
-        should_summarize=True,
        source_markdown="## Fallback content",
    )
    service = IndexingPipelineService(session=db_session)
@ -202,7 +186,7 @@ async def test_no_llm_falls_back_to_source_markdown(
    document = prepared[0]
    document_id = document.id

-    await service.index(document, connector_doc, llm=None)
+    await service.index(document, connector_doc)

    result = await db_session.execute(
        select(Document).filter(Document.id == document_id)
@ -213,27 +197,23 @@ async def test_no_llm_falls_back_to_source_markdown(
    assert reloaded.content == "## Fallback content"


-@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
-)
-async def test_fallback_summary_used_when_llm_unavailable(
+@pytest.mark.usefixtures("patched_embed_texts", "patched_chunk_text")
+async def test_source_markdown_used_without_preview(
    db_session,
    db_search_space,
    make_connector_document,
 ):
-    """fallback_summary is used as content when llm=None and should_summarize=True."""
+    """Source markdown is used without fallback preview fields."""
    connector_doc = make_connector_document(
        search_space_id=db_search_space.id,
-        should_summarize=True,
        source_markdown="## Full raw content",
-        fallback_summary="Short pre-built summary.",
    )
    service = IndexingPipelineService(session=db_session)

    prepared = await service.prepare_for_indexing([connector_doc])
    document_id = prepared[0].id

-    await service.index(prepared[0], connector_doc, llm=None)
+    await service.index(prepared[0], connector_doc)

    result = await db_session.execute(
        select(Document).filter(Document.id == document_id)
@ -241,12 +221,10 @@ async def test_fallback_summary_used_when_llm_unavailable(
    reloaded = result.scalars().first()

    assert DocumentStatus.is_state(reloaded.status, DocumentStatus.READY)
-    assert reloaded.content == "Short pre-built summary."
+    assert reloaded.content == "## Full raw content"


-@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
-)
+@pytest.mark.usefixtures("patched_embed_texts", "patched_chunk_text")
 async def test_reindex_replaces_old_chunks(
    db_session,
    db_search_space,
@ -264,14 +242,14 @@ async def test_reindex_replaces_old_chunks(
    document = prepared[0]
    document_id = document.id

-    await service.index(document, connector_doc, llm=mocker.Mock())
+    await service.index(document, connector_doc)

    updated_doc = make_connector_document(
        search_space_id=db_search_space.id,
        source_markdown="## v2",
    )
    re_prepared = await service.prepare_for_indexing([updated_doc])
-    await service.index(re_prepared[0], updated_doc, llm=mocker.Mock())
+    await service.index(re_prepared[0], updated_doc)

    result = await db_session.execute(
        select(Chunk).filter(Chunk.document_id == document_id)
@ -281,16 +259,14 @@ async def test_reindex_replaces_old_chunks(
    assert len(chunks) == 1


-@pytest.mark.usefixtures(
-    "patched_summarize_raises", "patched_embed_texts", "patched_chunk_text"
-)
-async def test_llm_error_sets_status_failed(
+@pytest.mark.usefixtures("patched_embed_texts_raises", "patched_chunk_text")
+async def test_embedding_error_sets_status_failed(
    db_session,
    db_search_space,
    make_connector_document,
    mocker,
 ):
-    """Document status is FAILED when the LLM raises during indexing."""
+    """Document status is FAILED when embedding raises during indexing."""
    connector_doc = make_connector_document(search_space_id=db_search_space.id)
    service = IndexingPipelineService(session=db_session)

@ -298,7 +274,7 @@ async def test_llm_error_sets_status_failed(
    document = prepared[0]
    document_id = document.id

-    await service.index(document, connector_doc, llm=mocker.Mock())
+    await service.index(document, connector_doc)

    result = await db_session.execute(
        select(Document).filter(Document.id == document_id)
@ -308,10 +284,8 @@ async def test_llm_error_sets_status_failed(
    assert DocumentStatus.is_state(reloaded.status, DocumentStatus.FAILED)


-@pytest.mark.usefixtures(
-    "patched_summarize_raises", "patched_embed_texts", "patched_chunk_text"
-)
-async def test_llm_error_leaves_no_partial_data(
+@pytest.mark.usefixtures("patched_embed_texts_raises", "patched_chunk_text")
+async def test_embedding_error_leaves_no_partial_data(
    db_session,
    db_search_space,
    make_connector_document,
@ -325,7 +299,7 @@ async def test_llm_error_leaves_no_partial_data(
    document = prepared[0]
    document_id = document.id

-    await service.index(document, connector_doc, llm=mocker.Mock())
+    await service.index(document, connector_doc)

    result = await db_session.execute(
        select(Document).filter(Document.id == document_id)
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
@ -21,7 +21,6 @@ from app.db import (
 pytestmark = pytest.mark.integration

 UNIFIED_FIXTURES = (
-    "patched_summarize",
    "patched_embed_texts",
    "patched_chunk_text",
 )
@ -787,7 +786,7 @@ class TestPipelineIntegration:
        assert len(prepared) == 1

        db_doc = prepared[0]
-        result = await service.index(db_doc, doc, llm=mocker.Mock())
+        result = await service.index(db_doc, doc)
        assert result is not None

        docs = (
@ -1272,7 +1271,7 @@ class TestIndexingProgressFlag:
        original_index = IndexingPipelineService.index
        flag_observed = []

-        async def patched_index(self_pipe, document, connector_doc, llm):
+        async def patched_index(self_pipe, document, connector_doc):
            folder = (
                await db_session.execute(
                    select(Folder).where(
@ -1284,7 +1283,7 @@ class TestIndexingProgressFlag:
            if folder:
                meta = folder.folder_metadata or {}
                flag_observed.append(meta.get("indexing_in_progress", False))
-            return await original_index(self_pipe, document, connector_doc, llm)
+            return await original_index(self_pipe, document, connector_doc)

        IndexingPipelineService.index = patched_index
        try:
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_onedrive_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_onedrive_pipeline.py
@ -24,8 +24,6 @@ def _onedrive_doc(
        search_space_id=search_space_id,
        connector_id=connector_id,
        created_by_id=user_id,
-        should_summarize=True,
-        fallback_summary=f"File: {unique_id}.docx",
        metadata={
            "onedrive_file_id": unique_id,
            "onedrive_file_name": f"{unique_id}.docx",
@ -35,7 +33,7 @@ def _onedrive_doc(


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+    "patched_embed_texts", "patched_chunk_text"
 )
 async def test_onedrive_pipeline_creates_ready_document(
    db_session, db_search_space, db_connector, db_user, mocker
@ -53,7 +51,7 @@ async def test_onedrive_pipeline_creates_ready_document(
    prepared = await service.prepare_for_indexing([doc])
    assert len(prepared) == 1

-    await service.index(prepared[0], doc, llm=mocker.Mock())
+    await service.index(prepared[0], doc)

    result = await db_session.execute(
        select(Document).filter(Document.search_space_id == space_id)
@ -66,7 +64,7 @@ async def test_onedrive_pipeline_creates_ready_document(


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+    "patched_embed_texts", "patched_chunk_text"
 )
 async def test_onedrive_duplicate_content_skipped(
    db_session, db_search_space, db_connector, db_user, mocker
@ -86,7 +84,7 @@ async def test_onedrive_duplicate_content_skipped(

    prepared = await service.prepare_for_indexing([doc])
    assert len(prepared) == 1
-    await service.index(prepared[0], doc, llm=mocker.Mock())
+    await service.index(prepared[0], doc)

    result = await db_session.execute(
        select(Document).filter(Document.search_space_id == space_id)
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_prepare_for_indexing.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_prepare_for_indexing.py
@ -33,7 +33,7 @@ async def test_new_document_is_persisted_with_pending_status(


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+    "patched_embed_texts", "patched_chunk_text"
 )
 async def test_unchanged_ready_document_is_skipped(
    db_session,
@ -47,7 +47,7 @@ async def test_unchanged_ready_document_is_skipped(

    # Index fully so the document reaches ready state
    prepared = await service.prepare_for_indexing([doc])
-    await service.index(prepared[0], doc, llm=mocker.Mock())
+    await service.index(prepared[0], doc)

    # Same content on the next run — a ready document must be skipped
    results = await service.prepare_for_indexing([doc])
@ -56,7 +56,7 @@ async def test_unchanged_ready_document_is_skipped(


@pytest.mark.usefixtures(
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+    "patched_embed_texts", "patched_chunk_text"
 )
 async def test_title_only_change_updates_title_in_db(
    db_session,
@ -72,7 +72,7 @@ async def test_title_only_change_updates_title_in_db(

    prepared = await service.prepare_for_indexing([original])
    document_id = prepared[0].id
-    await service.index(prepared[0], original, llm=mocker.Mock())
+    await service.index(prepared[0], original)

    renamed = make_connector_document(
        search_space_id=db_search_space.id, title="Updated Title"
@ -338,9 +338,7 @@ async def test_same_content_from_different_source_is_skipped(
    assert len(result.scalars().all()) == 1


-@pytest.mark.usefixtures(
-    "patched_summarize_raises", "patched_embed_texts", "patched_chunk_text"
-)
+@pytest.mark.usefixtures("patched_embed_texts_raises", "patched_chunk_text")
 async def test_failed_document_with_unchanged_content_is_requeued(
    db_session,
    db_search_space,
@ -351,10 +349,10 @@ async def test_failed_document_with_unchanged_content_is_requeued(
    doc = make_connector_document(search_space_id=db_search_space.id)
    service = IndexingPipelineService(session=db_session)

-    # First run: document is created and indexing crashes → status = failed
+    # First run: document is created and indexing crashes, so status becomes failed.
    prepared = await service.prepare_for_indexing([doc])
    document_id = prepared[0].id
-    await service.index(prepared[0], doc, llm=mocker.Mock())
+    await service.index(prepared[0], doc)

    result = await db_session.execute(
        select(Document).filter(Document.id == document_id)
--- a/surfsense_backend/tests/unit/agents/new_chat/tools/test_resume_page_limits.py
+++ b/surfsense_backend/tests/unit/agents/new_chat/tools/test_resume_page_limits.py
@ -142,7 +142,7 @@ async def test_generate_resume_defaults_to_one_page_target(monkeypatch) -> None:
    llm = SimpleNamespace(ainvoke=AsyncMock(side_effect=_llm_invoke))
    monkeypatch.setattr(
        resume_tool,
-        "get_document_summary_llm",
+        "get_agent_llm",
        AsyncMock(return_value=llm),
    )
    monkeypatch.setattr(resume_tool, "_compile_typst", lambda _source: b"pdf")
@ -171,7 +171,7 @@ async def test_generate_resume_compresses_when_over_limit(monkeypatch) -> None:
    llm = SimpleNamespace(ainvoke=AsyncMock(side_effect=responses))
    monkeypatch.setattr(
        resume_tool,
-        "get_document_summary_llm",
+        "get_agent_llm",
        AsyncMock(return_value=llm),
    )
    monkeypatch.setattr(resume_tool, "_compile_typst", lambda _source: b"pdf")
@ -206,7 +206,7 @@ async def test_generate_resume_returns_ready_when_target_not_met(monkeypatch) ->
    llm = SimpleNamespace(ainvoke=AsyncMock(side_effect=responses))
    monkeypatch.setattr(
        resume_tool,
-        "get_document_summary_llm",
+        "get_agent_llm",
        AsyncMock(return_value=llm),
    )
    monkeypatch.setattr(resume_tool, "_compile_typst", lambda _source: b"pdf")
@ -239,7 +239,7 @@ async def test_generate_resume_fails_when_hard_limit_exceeded(monkeypatch) -> No
    llm = SimpleNamespace(ainvoke=AsyncMock(side_effect=responses))
    monkeypatch.setattr(
        resume_tool,
-        "get_document_summary_llm",
+        "get_agent_llm",
        AsyncMock(return_value=llm),
    )
    monkeypatch.setattr(resume_tool, "_compile_typst", lambda _source: b"pdf")
--- a/surfsense_backend/tests/unit/connector_indexers/test_confluence_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_confluence_parallel.py
@ -71,7 +71,6 @@ async def test_build_connector_doc_produces_correct_fields():
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert doc.title == "Engineering Handbook"
@ -81,7 +80,6 @@ async def test_build_connector_doc_produces_correct_fields():
    assert doc.search_space_id == _SEARCH_SPACE_ID
    assert doc.connector_id == _CONNECTOR_ID
    assert doc.created_by_id == _USER_ID
-    assert doc.should_summarize is True
    assert doc.metadata["page_id"] == "abc-123"
    assert doc.metadata["page_title"] == "Engineering Handbook"
    assert doc.metadata["space_id"] == "ENG"
@ -89,21 +87,6 @@ async def test_build_connector_doc_produces_correct_fields():
    assert doc.metadata["connector_id"] == _CONNECTOR_ID
    assert doc.metadata["document_type"] == "Confluence Page"
    assert doc.metadata["connector_type"] == "Confluence"
-    assert doc.fallback_summary is not None
-    assert "Engineering Handbook" in doc.fallback_summary
-    assert markdown in doc.fallback_summary
-
-
-async def test_build_connector_doc_summary_disabled():
-    doc = _build_connector_doc(
-        _make_page(),
-        _to_markdown(_make_page()),
-        connector_id=_CONNECTOR_ID,
-        search_space_id=_SEARCH_SPACE_ID,
-        user_id=_USER_ID,
-        enable_summary=False,
-    )
-    assert doc.should_summarize is False


 # ---------------------------------------------------------------------------
@ -111,10 +94,9 @@ async def test_build_connector_doc_summary_disabled():
 # ---------------------------------------------------------------------------


-def _mock_connector(enable_summary: bool = True):
+def _mock_connector():
    c = MagicMock()
    c.config = {"access_token": "tok"}
-    c.enable_summary = enable_summary
    c.last_indexed_at = None
    return c

--- a/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
@ -71,7 +71,6 @@ async def test_single_file_returns_one_connector_document(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert len(docs) == 1
@ -97,7 +96,6 @@ async def test_multiple_files_all_produce_documents(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert len(docs) == 3
@ -125,7 +123,6 @@ async def test_one_download_exception_does_not_block_others(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert len(docs) == 2
@ -152,7 +149,6 @@ async def test_etl_error_counts_as_download_failure(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert len(docs) == 1
@ -191,7 +187,6 @@ async def test_concurrency_bounded_by_semaphore(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
        max_concurrency=2,
    )

@ -231,7 +226,6 @@ async def test_heartbeat_fires_during_parallel_downloads(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
        on_heartbeat=_on_heartbeat,
    )

@ -324,7 +318,6 @@ async def _run_full_scan(mocks, monkeypatch, page_files, *, max_files=500):
        mocks["task_logger"],
        mocks["log_entry"],
        max_files,
-        enable_summary=True,
    )


@ -434,7 +427,6 @@ async def _run_selected(mocks, file_tuples):
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )


@ -569,7 +561,6 @@ async def test_delta_sync_deletions_call_remove_document(monkeypatch):
        mock_task_logger,
        MagicMock(),
        max_files=500,
-        enable_summary=True,
    )

    assert sorted(remove_calls) == ["id:del1", "id:del2"]
@ -608,7 +599,6 @@ async def test_delta_sync_upserts_filtered_and_downloaded(monkeypatch):
        mock_task_logger,
        MagicMock(),
        max_files=500,
-        enable_summary=True,
    )

    assert indexed == 2
@ -670,7 +660,6 @@ async def test_delta_sync_mix_deletions_and_upserts(monkeypatch):
        mock_task_logger,
        MagicMock(),
        max_files=500,
-        enable_summary=True,
    )

    assert sorted(remove_calls) == ["id:del1", "id:del2"]
@ -704,7 +693,6 @@ async def test_delta_sync_returns_new_cursor(monkeypatch):
        mock_task_logger,
        MagicMock(),
        max_files=500,
-        enable_summary=True,
    )

    assert cursor == "brand-new-cursor-xyz"
@ -725,7 +713,7 @@ def orchestrator_mocks(monkeypatch):
    mock_connector = MagicMock()
    mock_connector.config = {"_token_encrypted": False}
    mock_connector.last_indexed_at = None
-    mock_connector.enable_summary = True
+    mock_connector.enable_vision_llm = True

    monkeypatch.setattr(
        _mod,
--- a/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
@ -66,7 +66,6 @@ async def test_single_file_returns_one_connector_document(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert len(docs) == 1
@ -91,7 +90,6 @@ async def test_multiple_files_all_produce_documents(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert len(docs) == 3
@ -119,7 +117,6 @@ async def test_one_download_exception_does_not_block_others(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert len(docs) == 2
@ -146,7 +143,6 @@ async def test_etl_error_counts_as_download_failure(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert len(docs) == 1
@ -186,7 +182,6 @@ async def test_concurrency_bounded_by_semaphore(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
        max_concurrency=2,
    )

@ -226,7 +221,6 @@ async def test_heartbeat_fires_during_parallel_downloads(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
        on_heartbeat=_on_heartbeat,
    )

@ -300,12 +294,6 @@ def full_scan_mocks(mock_drive_client, monkeypatch):
        MagicMock(return_value=pipeline_mock),
    )

-    monkeypatch.setattr(
-        _mod,
-        "get_user_long_context_llm",
-        AsyncMock(return_value=MagicMock()),
-    )
-
    return {
        "drive_client": mock_drive_client,
        "session": mock_session,
@ -333,7 +321,6 @@ async def _run_full_scan(mocks, *, max_files=500, include_subfolders=False):
        mocks["log_entry"],
        max_files,
        include_subfolders=include_subfolders,
-        enable_summary=True,
    )


@ -487,12 +474,6 @@ async def test_delta_sync_removals_serial_rest_parallel(monkeypatch):
        "IndexingPipelineService",
        MagicMock(return_value=pipeline_mock),
    )
-    monkeypatch.setattr(
-        _mod,
-        "get_user_long_context_llm",
-        AsyncMock(return_value=MagicMock()),
-    )
-
    mock_session, _ = _make_page_limit_session()
    mock_task_logger = MagicMock()
    mock_task_logger.log_task_progress = AsyncMock()
@ -509,7 +490,6 @@ async def test_delta_sync_removals_serial_rest_parallel(monkeypatch):
        mock_task_logger,
        MagicMock(),
        max_files=500,
-        enable_summary=True,
    )

    assert sorted(remove_calls) == ["del1", "del2", "trash1"]
@ -577,7 +557,6 @@ async def _run_selected(mocks, file_ids):
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )


--- a/surfsense_backend/tests/unit/connector_indexers/test_linear_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_linear_parallel.py
@ -70,7 +70,6 @@ async def test_build_connector_doc_produces_correct_fields():
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert doc.title == "ENG-42: Fix login bug"
@ -80,7 +79,6 @@ async def test_build_connector_doc_produces_correct_fields():
    assert doc.search_space_id == _SEARCH_SPACE_ID
    assert doc.connector_id == _CONNECTOR_ID
    assert doc.created_by_id == _USER_ID
-    assert doc.should_summarize is True
    assert doc.metadata["issue_id"] == "abc-123"
    assert doc.metadata["issue_identifier"] == "ENG-42"
    assert doc.metadata["issue_title"] == "Fix login bug"
@ -90,24 +88,6 @@ async def test_build_connector_doc_produces_correct_fields():
    assert doc.metadata["connector_id"] == _CONNECTOR_ID
    assert doc.metadata["document_type"] == "Linear Issue"
    assert doc.metadata["connector_type"] == "Linear"
-    assert doc.fallback_summary is not None
-    assert "ENG-42" in doc.fallback_summary
-    assert markdown in doc.fallback_summary
-
-
-async def test_build_connector_doc_summary_disabled():
-    """When enable_summary is False, should_summarize is False."""
-    doc = _build_connector_doc(
-        _make_issue(),
-        _make_formatted_issue(),
-        "# content",
-        connector_id=_CONNECTOR_ID,
-        search_space_id=_SEARCH_SPACE_ID,
-        user_id=_USER_ID,
-        enable_summary=False,
-    )
-
-    assert doc.should_summarize is False


 # ---------------------------------------------------------------------------
@ -115,10 +95,9 @@ async def test_build_connector_doc_summary_disabled():
 # ---------------------------------------------------------------------------


-def _mock_connector(enable_summary: bool = True):
+def _mock_connector():
    c = MagicMock()
    c.config = {"access_token": "tok"}
-    c.enable_summary = enable_summary
    c.last_indexed_at = None
    return c

--- a/surfsense_backend/tests/unit/connector_indexers/test_notion_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_notion_parallel.py
@ -41,7 +41,6 @@ async def test_build_connector_doc_produces_correct_fields():
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert doc.title == "My Notion Page"
@ -51,29 +50,11 @@ async def test_build_connector_doc_produces_correct_fields():
    assert doc.search_space_id == _SEARCH_SPACE_ID
    assert doc.connector_id == _CONNECTOR_ID
    assert doc.created_by_id == _USER_ID
-    assert doc.should_summarize is True
    assert doc.metadata["page_title"] == "My Notion Page"
    assert doc.metadata["page_id"] == "abc-123"
    assert doc.metadata["connector_id"] == _CONNECTOR_ID
    assert doc.metadata["document_type"] == "Notion Page"
    assert doc.metadata["connector_type"] == "Notion"
-    assert doc.fallback_summary is not None
-    assert "My Notion Page" in doc.fallback_summary
-    assert markdown in doc.fallback_summary
-
-
-async def test_build_connector_doc_summary_disabled():
-    """When enable_summary is False, should_summarize is False."""
-    doc = _build_connector_doc(
-        _make_page(),
-        "# content",
-        connector_id=_CONNECTOR_ID,
-        search_space_id=_SEARCH_SPACE_ID,
-        user_id=_USER_ID,
-        enable_summary=False,
-    )
-
-    assert doc.should_summarize is False


 # ---------------------------------------------------------------------------
@ -81,10 +62,9 @@ async def test_build_connector_doc_summary_disabled():
 # ---------------------------------------------------------------------------


-def _mock_connector(enable_summary: bool = True):
+def _mock_connector():
    c = MagicMock()
    c.config = {"access_token": "tok"}
-    c.enable_summary = enable_summary
    c.last_indexed_at = None
    return c

--- a/surfsense_backend/tests/unit/connector_indexers/test_onedrive_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_onedrive_parallel.py
@ -65,7 +65,6 @@ async def test_single_file_returns_one_connector_document(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert len(docs) == 1
@ -91,7 +90,6 @@ async def test_multiple_files_all_produce_documents(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert len(docs) == 3
@ -119,7 +117,6 @@ async def test_one_download_exception_does_not_block_others(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert len(docs) == 2
@ -146,7 +143,6 @@ async def test_etl_error_counts_as_download_failure(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )

    assert len(docs) == 1
@ -185,7 +181,6 @@ async def test_concurrency_bounded_by_semaphore(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
        max_concurrency=2,
    )

@ -225,7 +220,6 @@ async def test_heartbeat_fires_during_parallel_downloads(
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
        on_heartbeat=_on_heartbeat,
    )

--- a/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
@ -180,7 +180,6 @@ async def _run_gdrive_selected(mocks, file_ids):
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )


@ -336,10 +335,6 @@ def gdrive_full_scan_mocks(monkeypatch):
    monkeypatch.setattr(
        _mod, "IndexingPipelineService", MagicMock(return_value=pipeline_mock)
    )
-    monkeypatch.setattr(
-        _mod, "get_user_long_context_llm", AsyncMock(return_value=MagicMock())
-    )
-
    return {
        "mod": _mod,
        "session": session,
@ -366,7 +361,6 @@ async def _run_gdrive_full_scan(mocks, max_files=500):
        MagicMock(),
        max_files,
        include_subfolders=False,
-        enable_summary=True,
    )


@ -454,10 +448,6 @@ async def test_gdrive_delta_sync_skips_over_quota(monkeypatch):
    monkeypatch.setattr(
        _mod, "IndexingPipelineService", MagicMock(return_value=pipeline_mock)
    )
-    monkeypatch.setattr(
-        _mod, "get_user_long_context_llm", AsyncMock(return_value=MagicMock())
-    )
-
    mock_task_logger = MagicMock()
    mock_task_logger.log_task_progress = AsyncMock()

@ -473,7 +463,6 @@ async def test_gdrive_delta_sync_skips_over_quota(monkeypatch):
        mock_task_logger,
        MagicMock(),
        max_files=500,
-        enable_summary=True,
    )

    call_files = download_mock.call_args[0][1]
@ -539,7 +528,6 @@ async def _run_onedrive_selected(mocks, file_ids):
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )


@ -641,7 +629,6 @@ async def _run_dropbox_selected(mocks, file_paths):
        connector_id=_CONNECTOR_ID,
        search_space_id=_SEARCH_SPACE_ID,
        user_id=_USER_ID,
-        enable_summary=True,
    )


--- a/surfsense_backend/tests/unit/gateway/test_webhook_routes.py
+++ b/surfsense_backend/tests/unit/gateway/test_webhook_routes.py
@ -92,6 +92,13 @@ def _signed_slack_request(payload: dict, *, secret: str = "signing-secret") -> R
    )


+def _enable_slack_gateway(monkeypatch):
+    monkeypatch.setattr(routes.config, "GATEWAY_SLACK_ENABLED", True)
+    monkeypatch.setattr(routes.config, "GATEWAY_SLACK_CLIENT_ID", "client-id")
+    monkeypatch.setattr(routes.config, "GATEWAY_SLACK_CLIENT_SECRET", "client-secret")
+    monkeypatch.setattr(routes.config, "GATEWAY_SLACK_SIGNING_SECRET", "signing-secret")
+
+
 async def _call_webhook(*, request: RequestStub, account_id: int, session):
    return await routes.telegram_webhook(
        request=request,
@ -230,7 +237,7 @@ def test_verify_slack_signature_accepts_valid_signature():

@pytest.mark.asyncio
 async def test_slack_webhook_url_verification(monkeypatch, mocker):
-    monkeypatch.setattr(routes.config, "GATEWAY_SLACK_SIGNING_SECRET", "signing-secret")
+    _enable_slack_gateway(monkeypatch)
    request = _signed_slack_request({"type": "url_verification", "challenge": "abc123"})

    response = await routes.slack_webhook(request=request, session=mocker.AsyncMock())
@ -241,7 +248,7 @@ async def test_slack_webhook_url_verification(monkeypatch, mocker):

@pytest.mark.asyncio
 async def test_slack_webhook_persists_event(monkeypatch, mocker):
-    monkeypatch.setattr(routes.config, "GATEWAY_SLACK_SIGNING_SECRET", "signing-secret")
+    _enable_slack_gateway(monkeypatch)
    session = mocker.AsyncMock()
    monkeypatch.setattr(routes, "get_slack_account_by_team", mocker.AsyncMock(return_value=_slack_account()))
    persist = mocker.AsyncMock(return_value=100)
@ -271,7 +278,7 @@ async def test_slack_webhook_persists_event(monkeypatch, mocker):

@pytest.mark.asyncio
 async def test_slack_webhook_ignores_self_event(monkeypatch, mocker):
-    monkeypatch.setattr(routes.config, "GATEWAY_SLACK_SIGNING_SECRET", "signing-secret")
+    _enable_slack_gateway(monkeypatch)
    session = mocker.AsyncMock()
    monkeypatch.setattr(routes, "get_slack_account_by_team", mocker.AsyncMock(return_value=_slack_account()))
    persist = mocker.AsyncMock(return_value=100)
--- a/surfsense_backend/tests/unit/indexing_pipeline/test_connector_document.py
+++ b/surfsense_backend/tests/unit/indexing_pipeline/test_connector_document.py
@ -18,7 +18,6 @@ def test_valid_document_created_with_required_fields():
        connector_id=42,
        created_by_id="00000000-0000-0000-0000-000000000001",
    )
-    assert doc.should_summarize is True
    assert doc.should_use_code_chunker is False
    assert doc.metadata == {}
    assert doc.connector_id == 42
--- a/surfsense_backend/tests/unit/indexing_pipeline/test_document_summarizer.py
+++ b/surfsense_backend/tests/unit/indexing_pipeline/test_document_summarizer.py
@ -1,41 +0,0 @@
-from unittest.mock import MagicMock
-
-import pytest
-
-from app.indexing_pipeline.document_summarizer import summarize_document
-
-pytestmark = pytest.mark.unit
-
-
-@pytest.mark.usefixtures("patched_summarizer_chain")
-async def test_without_metadata_returns_raw_summary():
-    """Summarizer returns the LLM output directly when no metadata is provided."""
-    result = await summarize_document("# Content", llm=MagicMock(model="gpt-4"))
-
-    assert result == "The summary."
-
-
-@pytest.mark.usefixtures("patched_summarizer_chain")
-async def test_with_metadata_includes_metadata_values_in_output():
-    """Non-empty metadata values are prepended to the summary output."""
-    result = await summarize_document(
-        "# Content",
-        llm=MagicMock(model="gpt-4"),
-        metadata={"author": "Alice", "source": "Notion"},
-    )
-
-    assert "Alice" in result
-    assert "Notion" in result
-
-
-@pytest.mark.usefixtures("patched_summarizer_chain")
-async def test_with_metadata_omits_empty_fields_from_output():
-    """Empty metadata fields are omitted from the summary output."""
-    result = await summarize_document(
-        "# Content",
-        llm=MagicMock(model="gpt-4"),
-        metadata={"author": "Alice", "description": ""},
-    )
-
-    assert "Alice" in result
-    assert "description" not in result.lower()
--- a/surfsense_backend/tests/unit/indexing_pipeline/test_index_batch.py
+++ b/surfsense_backend/tests/unit/indexing_pipeline/test_index_batch.py
@ -37,12 +37,10 @@ async def test_calls_prepare_then_index_per_document(pipeline, make_connector_do
    orm2 = MagicMock(spec=Document)
    orm2.unique_identifier_hash = compute_unique_identifier_hash(doc2)

-    mock_llm = MagicMock()
-
    pipeline.prepare_for_indexing = AsyncMock(return_value=[orm1, orm2])
-    pipeline.index = AsyncMock(side_effect=lambda doc, cdoc, llm: doc)
+    pipeline.index = AsyncMock(side_effect=lambda doc, cdoc: doc)

-    results = await pipeline.index_batch([doc1, doc2], mock_llm)
+    results = await pipeline.index_batch([doc1, doc2])

    pipeline.prepare_for_indexing.assert_awaited_once_with([doc1, doc2])
    assert pipeline.index.await_count == 2
@ -53,7 +51,7 @@ async def test_empty_input_returns_empty(pipeline):
    """Empty connector_docs list returns empty result."""
    pipeline.prepare_for_indexing = AsyncMock(return_value=[])

-    results = await pipeline.index_batch([], MagicMock())
+    results = await pipeline.index_batch([])

    assert results == []

@ -74,7 +72,7 @@ async def test_skips_document_without_matching_connector_doc(
    pipeline.prepare_for_indexing = AsyncMock(return_value=[orphan_orm])
    pipeline.index = AsyncMock()

-    results = await pipeline.index_batch([doc1], MagicMock())
+    results = await pipeline.index_batch([doc1])

    pipeline.index.assert_not_awaited()
    assert results == []
--- a/surfsense_backend/tests/unit/indexing_pipeline/test_index_batch_parallel.py
+++ b/surfsense_backend/tests/unit/indexing_pipeline/test_index_batch_parallel.py
@ -51,11 +51,6 @@ async def test_index_calls_embed_and_chunk_via_to_thread(
        return await original_to_thread(func, *args, **kwargs)

    monkeypatch.setattr(asyncio, "to_thread", tracking_to_thread)
-
-    monkeypatch.setattr(
-        "app.indexing_pipeline.indexing_pipeline_service.summarize_document",
-        AsyncMock(return_value="Summary."),
-    )
    mock_chunk_hybrid = MagicMock(return_value=["chunk1"])
    mock_chunk_hybrid.__name__ = "chunk_text_hybrid"
    monkeypatch.setattr(
@ -85,7 +80,7 @@ async def test_index_calls_embed_and_chunk_via_to_thread(
    document.id = 1
    document.status = DocumentStatus.pending()

-    await pipeline.index(document, connector_doc, llm=MagicMock())
+    await pipeline.index(document, connector_doc)

    # Either chunker entry point satisfies the "chunking runs off the event
    # loop" contract this test guards. Routing between the two is verified
@ -104,10 +99,6 @@ async def test_non_code_documents_use_hybrid_chunker(
    mid-row. Only documents flagged with ``should_use_code_chunker=True``
    should take the ``chunk_text`` path.
    """
-    monkeypatch.setattr(
-        "app.indexing_pipeline.indexing_pipeline_service.summarize_document",
-        AsyncMock(return_value="Summary."),
-    )
    mock_chunk_hybrid = MagicMock(return_value=["chunk1"])
    mock_chunk_hybrid.__name__ = "chunk_text_hybrid"
    monkeypatch.setattr(
@ -139,7 +130,7 @@ async def test_non_code_documents_use_hybrid_chunker(
    document.id = 1
    document.status = DocumentStatus.pending()

-    await pipeline.index(document, connector_doc, llm=MagicMock())
+    await pipeline.index(document, connector_doc)

    mock_chunk_hybrid.assert_called_once()
    mock_chunk_code.assert_not_called()
@ -192,19 +183,14 @@ async def test_batch_parallel_indexes_all_documents(

    index_calls = []

-    async def fake_index(self, document, connector_doc, llm):
+    async def fake_index(self, document, connector_doc):
        index_calls.append(document.id)
        document.status = DocumentStatus.ready()
        return document

    monkeypatch.setattr(IndexingPipelineService, "index", fake_index)

-    async def mock_get_llm(session):
-        return MagicMock()
-
-    _, indexed, failed = await pipeline.index_batch_parallel(
-        docs, mock_get_llm, max_concurrency=2
-    )
+    _, indexed, failed = await pipeline.index_batch_parallel(docs, max_concurrency=2)

    assert indexed == 3
    assert failed == 0
@ -233,20 +219,15 @@ async def test_batch_parallel_one_failure_does_not_affect_others(
        _mock_session_factory(orm_by_id),
    )

-    async def failing_index(self, document, connector_doc, llm):
+    async def failing_index(self, document, connector_doc):
        if document.id == 2:
-            raise RuntimeError("LLM exploded")
+            raise RuntimeError("Indexing exploded")
        document.status = DocumentStatus.ready()
        return document

    monkeypatch.setattr(IndexingPipelineService, "index", failing_index)

-    async def mock_get_llm(session):
-        return MagicMock()
-
-    _, indexed, failed = await pipeline.index_batch_parallel(
-        docs, mock_get_llm, max_concurrency=4
-    )
+    _, indexed, failed = await pipeline.index_batch_parallel(docs, max_concurrency=4)

    assert indexed == 2
    assert failed == 1