feat(db): Remove document summary LLM schema

2026-07-22 23:31:12 +02:00 · 2026-06-04 00:48:53 +05:30 · 2026-06-04 00:48:53 +05:30 · 290a9539ef
commit 290a9539ef
parent e68b3f9532
9 changed files with 137 additions and 67 deletions
--- a/surfsense_backend/app/db.py
+++ b/surfsense_backend/app/db.py
@ -1781,9 +1781,6 @@ class SearchSpace(BaseModel, TimestampMixin):
    agent_llm_id = Column(
        Integer, nullable=True, default=0
    )  # For agent/chat operations, defaults to Auto mode
-    document_summary_llm_id = Column(
-        Integer, nullable=True, default=0
-    )  # For document summarization, defaults to Auto mode
    image_generation_config_id = Column(
        Integer, nullable=True, default=0
    )  # For image generation, defaults to Auto mode
@ -1951,12 +1948,6 @@ class SearchSourceConnector(BaseModel, TimestampMixin):
    last_indexed_at = Column(TIMESTAMP(timezone=True), nullable=True)
    config = Column(JSON, nullable=False)

-    # Summary generation (LLM-based) - disabled by default to save resources.
-    # When enabled, improves hybrid search quality at the cost of LLM calls.
-    enable_summary = Column(
-        Boolean, nullable=False, default=False, server_default="false"
-    )
-
    # Vision LLM for image files - disabled by default to save cost/time.
    # When enabled, images are described via a vision language model instead
    # of falling back to the document parser.
--- a/surfsense_backend/app/routes/search_spaces_routes.py
+++ b/surfsense_backend/app/routes/search_spaces_routes.py
@ -617,9 +617,6 @@ async def get_llm_preferences(

        # Get full config objects for each role
        agent_llm = await _get_llm_config_by_id(session, search_space.agent_llm_id)
-        document_summary_llm = await _get_llm_config_by_id(
-            session, search_space.document_summary_llm_id
-        )
        image_generation_config = await _get_image_gen_config_by_id(
            session, search_space.image_generation_config_id
        )
@ -629,11 +626,9 @@ async def get_llm_preferences(

        return LLMPreferencesRead(
            agent_llm_id=search_space.agent_llm_id,
-            document_summary_llm_id=search_space.document_summary_llm_id,
            image_generation_config_id=search_space.image_generation_config_id,
            vision_llm_config_id=search_space.vision_llm_config_id,
            agent_llm=agent_llm,
-            document_summary_llm=document_summary_llm,
            image_generation_config=image_generation_config,
            vision_llm_config=vision_llm_config,
        )
@ -707,9 +702,6 @@ async def update_llm_preferences(

        # Get full config objects for response
        agent_llm = await _get_llm_config_by_id(session, search_space.agent_llm_id)
-        document_summary_llm = await _get_llm_config_by_id(
-            session, search_space.document_summary_llm_id
-        )
        image_generation_config = await _get_image_gen_config_by_id(
            session, search_space.image_generation_config_id
        )
@ -719,11 +711,9 @@ async def update_llm_preferences(

        return LLMPreferencesRead(
            agent_llm_id=search_space.agent_llm_id,
-            document_summary_llm_id=search_space.document_summary_llm_id,
            image_generation_config_id=search_space.image_generation_config_id,
            vision_llm_config_id=search_space.vision_llm_config_id,
            agent_llm=agent_llm,
-            document_summary_llm=document_summary_llm,
            image_generation_config=image_generation_config,
            vision_llm_config=vision_llm_config,
        )
--- a/surfsense_backend/app/schemas/new_llm_config.py
+++ b/surfsense_backend/app/schemas/new_llm_config.py
@ -221,9 +221,6 @@ class LLMPreferencesRead(BaseModel):
    agent_llm_id: int | None = Field(
        None, description="ID of the LLM config to use for agent/chat tasks"
    )
-    document_summary_llm_id: int | None = Field(
-        None, description="ID of the LLM config to use for document summarization"
-    )
    image_generation_config_id: int | None = Field(
        None, description="ID of the image generation config to use"
    )
@ -234,9 +231,6 @@ class LLMPreferencesRead(BaseModel):
    agent_llm: dict[str, Any] | None = Field(
        None, description="Full config for agent LLM"
    )
-    document_summary_llm: dict[str, Any] | None = Field(
-        None, description="Full config for document summary LLM"
-    )
    image_generation_config: dict[str, Any] | None = Field(
        None, description="Full config for image generation"
    )
@ -253,9 +247,6 @@ class LLMPreferencesUpdate(BaseModel):
    agent_llm_id: int | None = Field(
        None, description="ID of the LLM config to use for agent/chat tasks"
    )
-    document_summary_llm_id: int | None = Field(
-        None, description="ID of the LLM config to use for document summarization"
-    )
    image_generation_config_id: int | None = Field(
        None, description="ID of the image generation config to use"
    )
--- a/surfsense_backend/app/schemas/search_source_connector.py
+++ b/surfsense_backend/app/schemas/search_source_connector.py
@ -16,7 +16,6 @@ class SearchSourceConnectorBase(BaseModel):
    is_indexable: bool
    last_indexed_at: datetime | None = None
    config: dict[str, Any]
-    enable_summary: bool = False
    enable_vision_llm: bool = False
    periodic_indexing_enabled: bool = False
    indexing_frequency_minutes: int | None = None
@ -67,7 +66,6 @@ class SearchSourceConnectorUpdate(BaseModel):
    is_indexable: bool | None = None
    last_indexed_at: datetime | None = None
    config: dict[str, Any] | None = None
-    enable_summary: bool | None = None
    enable_vision_llm: bool | None = None
    periodic_indexing_enabled: bool | None = None
    indexing_frequency_minutes: int | None = None
--- a/surfsense_backend/app/services/llm_service.py
+++ b/surfsense_backend/app/services/llm_service.py
@ -68,7 +68,6 @@ def _is_interactive_auth_provider(

 class LLMRole:
    AGENT = "agent"  # For agent/chat operations
-    DOCUMENT_SUMMARY = "document_summary"  # For document summarization


 def get_global_llm_config(llm_config_id: int) -> dict | None:
@ -266,7 +265,7 @@ async def get_search_space_llm_instance(
    Args:
        session: Database session
        search_space_id: Search Space ID
-        role: LLM role ('agent' or 'document_summary')
+        role: LLM role ('agent')

    Returns:
        ChatLiteLLM or ChatLiteLLMRouter instance, or None if not found
@ -283,11 +282,8 @@ async def get_search_space_llm_instance(
            return None

        # Get the appropriate LLM config ID based on role
-        llm_config_id = None
        if role == LLMRole.AGENT:
            llm_config_id = search_space.agent_llm_id
-        elif role == LLMRole.DOCUMENT_SUMMARY:
-            llm_config_id = search_space.document_summary_llm_id
        else:
            logger.error(f"Invalid LLM role: {role}")
            return None
@ -470,20 +466,13 @@ async def get_search_space_llm_instance(


 async def get_agent_llm(
-    session: AsyncSession, search_space_id: int
-) -> ChatLiteLLM | ChatLiteLLMRouter | None:
-    """Get the search space's agent LLM instance for chat operations."""
-    return await get_search_space_llm_instance(session, search_space_id, LLMRole.AGENT)
-
-
-async def get_document_summary_llm(
    session: AsyncSession, search_space_id: int, disable_streaming: bool = False
 ) -> ChatLiteLLM | ChatLiteLLMRouter | None:
-    """Get the search space's document summary LLM instance."""
+    """Get the search space's agent LLM instance for chat operations."""
    return await get_search_space_llm_instance(
        session,
        search_space_id,
-        LLMRole.DOCUMENT_SUMMARY,
+        LLMRole.AGENT,
        disable_streaming=disable_streaming,
    )

@ -645,22 +634,6 @@ async def get_vision_llm(
        return None


-# Backward-compatible alias (LLM preferences are now per-search-space, not per-user)
-async def get_user_long_context_llm(
-    session: AsyncSession,
-    user_id: str,
-    search_space_id: int,
-    disable_streaming: bool = False,
-) -> ChatLiteLLM | ChatLiteLLMRouter | None:
-    """
-    Deprecated: Use get_document_summary_llm instead.
-    The user_id parameter is ignored as LLM preferences are now per-search-space.
-    """
-    return await get_document_summary_llm(
-        session, search_space_id, disable_streaming=disable_streaming
-    )
-
-
 def get_planner_llm() -> ChatLiteLLM | None:
    """Return a planner LLM instance from the first global config marked
    ``is_planner: true``, or ``None`` if no planner config is defined.