SurfSense/surfsense_backend/app/agents/researcher/qna_agent/nodes.py


from typing import Any

from langchain_core.messages import HumanMessage, SystemMessage
from langchain_core.runnables import RunnableConfig

from app.services.reranker_service import RerankerService

from ..utils import (
    calculate_token_count,
    format_documents_section,
    optimize_documents_for_token_limit,
)
from .configuration import Configuration
from .prompts import get_qna_citation_system_prompt, get_qna_no_documents_system_prompt
from .state import State


async def rerank_documents(state: State, config: RunnableConfig) -> dict[str, Any]:
    """
    Rerank the documents based on relevance to the user's question.

    This node takes the relevant documents provided in the configuration,
    reranks them using the reranker service based on the user's query,
    and updates the state with the reranked documents.

    Returns:
        Dict containing the reranked documents.
    """
    # Get the configuration and the relevant documents
    configuration = Configuration.from_runnable_config(config)
    documents = configuration.relevant_documents
    user_query = configuration.user_query
    reformulated_query = configuration.reformulated_query

    # If no documents were provided, return an empty list
    if not documents:
        return {"reranked_documents": []}

    # Get the reranker service from the app config
    reranker_service = RerankerService.get_reranker_instance()

    # Use the documents as-is if no reranker service is available
    reranked_docs = documents

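    # A hedged note on the expected input shape (an assumption inferred from
    # the .get() accesses below, not a schema enforced in this module): each
    # entry in `documents` is treated as roughly
    #     {
    #         "chunk_id": "chunk_0",
    #         "content": "...",
    #         "score": 0.42,
    #         "document": {"id": "...", "title": "...", "document_type": "...", "metadata": {}},
    #     }
    # The defaults passed to .get() keep the conversion safe when keys are missing.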
    if reranker_service:
        try:
            # Convert the documents to the format expected by the reranker
            reranker_input_docs = [
                {
                    "chunk_id": doc.get("chunk_id", f"chunk_{i}"),
                    "content": doc.get("content", ""),
                    "score": doc.get("score", 0.0),
                    "document": {
                        "id": doc.get("document", {}).get("id", ""),
                        "title": doc.get("document", {}).get("title", ""),
                        "document_type": doc.get("document", {}).get(
                            "document_type", ""
                        ),
                        "metadata": doc.get("document", {}).get("metadata", {}),
                    },
                }
                for i, doc in enumerate(documents)
            ]

            # Rerank against the original query plus its reformulation
            reranked_docs = reranker_service.rerank_documents(
                user_query + "\n" + reformulated_query, reranker_input_docs
            )

            # Sort by score in descending order
            reranked_docs.sort(key=lambda x: x.get("score", 0), reverse=True)
            print(
                f"Reranked {len(reranked_docs)} documents for Q&A query: {user_query}"
            )

        except Exception as e:
            # Fall back to the original documents if reranking fails
            print(f"Error during reranking: {e!s}")

    return {"reranked_documents": reranked_docs}


async def answer_question(state: State, config: RunnableConfig) -> dict[str, Any]:
    """
    Answer the user's question using the provided documents.

    This node takes the relevant documents provided in the configuration and
    uses an LLM to generate a comprehensive answer to the user's question with
    proper citations. Citations follow the [citation:source_id] format, where
    source_id comes from the documents. If no documents are provided, the node
    falls back to the chat history to generate an answer.

    Returns:
        Dict containing the final answer in the "final_answer" key.
    """
    from app.services.llm_service import get_user_fast_llm

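    # A minimal illustration of the citation contract described above (the
    # exact marker style is defined by get_qna_citation_system_prompt(); this
    # sample sentence is an assumption, not output from this code): the LLM is
    # expected to produce sentences like
    #     "The backend stores chunks in PostgreSQL [citation:12]."
    # where 12 is a source id taken from the formatted documents section.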
    # Get the configuration and the reranked documents from state
    configuration = Configuration.from_runnable_config(config)
    documents = state.reranked_documents
    user_query = configuration.user_query
    user_id = configuration.user_id

    # Get the user's fast LLM
    llm = await get_user_fast_llm(state.db_session, user_id)
    if not llm:
        error_message = f"No fast LLM configured for user {user_id}"
        print(error_message)
        raise RuntimeError(error_message)

    # Determine whether we have documents and optimize for token limits
    has_documents_initially = bool(documents)
    if has_documents_initially:
        # Create a base message template for token calculation (without documents)
        base_human_message_template = f"""
User's question:
<user_query>
{user_query}
</user_query>

Please provide a detailed, comprehensive answer to the user's question using the information from their personal knowledge sources. Make sure to cite all information appropriately and engage in a conversational manner.
"""
        # Use the initial system prompt for token calculation
        initial_system_prompt = get_qna_citation_system_prompt()
        base_messages = [
            *state.chat_history,
            SystemMessage(content=initial_system_prompt),
            HumanMessage(content=base_human_message_template),
        ]

        # Optimize the documents to fit within the model's token limit
        optimized_documents, has_optimized_documents = (
            optimize_documents_for_token_limit(documents, base_messages, llm.model)
        )

        # Update the local variables based on the optimization result
        documents = optimized_documents
        has_documents = has_optimized_documents
    else:
        has_documents = False

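    # A hedged reading of the branch above, inferred from the helper's name
    # and (documents, base_messages, model) signature rather than verified
    # here: optimize_documents_for_token_limit presumably trims the document
    # list until the rendered messages fit the model's context window, and
    # its boolean reports whether any documents survived. That is why
    # has_documents can end up False even when documents were initially
    # present, which flips the prompts below to the no-documents path.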
    # Choose the system prompt based on final document availability
    system_prompt = (
        get_qna_citation_system_prompt()
        if has_documents
        else get_qna_no_documents_system_prompt()
    )

    # Generate the documents section
    documents_text = (
        format_documents_section(
            documents, "Source material from your personal knowledge base"
        )
        if has_documents
        else ""
    )

    # Build the instruction for the final human message
    instruction_text = (
        "Please provide a detailed, comprehensive answer to the user's question using the information from their personal knowledge sources. Make sure to cite all information appropriately and engage in a conversational manner."
        if has_documents
        else "Please provide a helpful answer to the user's question based on our conversation history and your general knowledge. Engage in a conversational manner."
    )

    # Create the final human message content
    human_message_content = f"""
{documents_text}

User's question:
<user_query>
{user_query}
</user_query>
{instruction_text}

"""
    # Create the final messages for the LLM
    messages_with_chat_history = [
        *state.chat_history,
        SystemMessage(content=system_prompt),
        HumanMessage(content=human_message_content),
    ]

    # Log the final token count
    total_tokens = calculate_token_count(messages_with_chat_history, llm.model)
    print(f"Final token count: {total_tokens}")

    # Call the LLM and return the response
    response = await llm.ainvoke(messages_with_chat_history)
    final_answer = response.content

    return {"final_answer": final_answer}
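

# ---------------------------------------------------------------------------
# Hedged usage sketch (not part of the original module): both coroutines are
# written as LangGraph nodes, so a minimal graph wiring them together could
# look like the sketch below. The node names and entry point are illustrative
# assumptions; the actual graph is assembled elsewhere in SurfSense.
#
#     from langgraph.graph import StateGraph
#
#     workflow = StateGraph(State, config_schema=Configuration)
#     workflow.add_node("rerank_documents", rerank_documents)
#     workflow.add_node("answer_question", answer_question)
#     workflow.set_entry_point("rerank_documents")
#     workflow.add_edge("rerank_documents", "answer_question")
#     graph = workflow.compile()
#
#     # result = await graph.ainvoke({}, config={"configurable": {...}})
# ---------------------------------------------------------------------------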