Merge upstream/dev into feature/human-in-the-loop

2026-05-17 18:35:19 +02:00 · 2026-02-13 20:17:59 +02:00 · 2026-02-13 20:17:59 +02:00 · 66a6fb685e
commit 66a6fb685e
parent d8d62ab2c5 5714d2c290
47 changed files with 7257 additions and 4582 deletions
--- a/surfsense_backend/app/agents/new_chat/tools/registry.py
+++ b/surfsense_backend/app/agents/new_chat/tools/registry.py
@ -56,6 +56,7 @@ from .notion import (
    create_update_notion_page_tool,
 )
 from .podcast import create_generate_podcast_tool
+from .report import create_generate_report_tool
 from .scrape_webpage import create_scrape_webpage_tool
 from .search_surfsense_docs import create_search_surfsense_docs_tool
 from .shared_memory import (
@ -123,6 +124,17 @@ BUILTIN_TOOLS: list[ToolDefinition] = [
        ),
        requires=["search_space_id", "db_session", "thread_id"],
    ),
+    # Report generation tool (inline, no Celery)
+    ToolDefinition(
+        name="generate_report",
+        description="Generate a structured Markdown report from provided content",
+        factory=lambda deps: create_generate_report_tool(
+            search_space_id=deps["search_space_id"],
+            db_session=deps["db_session"],
+            thread_id=deps["thread_id"],
+        ),
+        requires=["search_space_id", "db_session", "thread_id"],
+    ),
    # Link preview tool - fetches Open Graph metadata for URLs
    ToolDefinition(
        name="link_preview",
--- a/surfsense_backend/app/agents/new_chat/tools/report.py
+++ b/surfsense_backend/app/agents/new_chat/tools/report.py
@ -0,0 +1,396 @@
+"""
+Report generation tool for the SurfSense agent.
+
+This module provides a factory function for creating the generate_report tool
+that generates a structured Markdown report inline (no Celery). The LLM is
+called within the tool, the result is saved to the database, and the tool
+returns immediately with a ready status.
+
+This follows the same inline pattern as generate_image and display_image,
+NOT the Celery-based podcast pattern.
+"""
+
+import logging
+import re
+from typing import Any
+
+from langchain_core.tools import tool
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from app.db import Report
+from app.services.llm_service import get_document_summary_llm
+
+logger = logging.getLogger(__name__)
+
+# Prompt template for report generation (new report from scratch)
+_REPORT_PROMPT = """You are an expert report writer. Generate a well-structured, comprehensive Markdown report based on the provided information.
+
+**Topic:** {topic}
+
+**Report Style:** {report_style}
+
+{user_instructions_section}
+
+{previous_version_section}
+
+**Source Content:**
+{source_content}
+
+---
+
+**Instructions:**
+1. Write the report in well-formatted Markdown.
+2. Include a clear title (as a level-1 heading), an executive summary, and logically organized sections.
+3. Use headings (##, ###), bullet points, numbered lists, bold/italic text, and tables where appropriate.
+4. Cite specific facts, figures, and findings from the source content.
+5. Be thorough and comprehensive — include all relevant information from the source content.
+6. End with a conclusion or key takeaways section.
+7. The report should be professional and ready to export.
+8. When including code examples, ALWAYS format them as proper fenced code blocks with the correct language identifier (e.g. ```java, ```python). Code inside code blocks MUST have proper line breaks and indentation — NEVER put multiple statements on a single line. Each statement, brace, and logical block must be on its own line with correct indentation.
+9. When including Mermaid diagrams, use ```mermaid fenced code blocks. Each Mermaid statement MUST be on its own line — NEVER use semicolons to join multiple statements on one line. For line breaks inside node labels, use <br> (NOT <br/>). Example:
+   ```mermaid
+   graph TD
+       A[Source Code] --> B[Compiler]
+       B --> C[Bytecode]
+   ```
+
+Write the report now:
+"""
+
+
+def _strip_wrapping_code_fences(text: str) -> str:
+    """Remove wrapping code fences that LLMs often add around Markdown output.
+
+    Handles patterns like:
+        ```markdown\\n...content...\\n```
+        ```md\\n...content...\\n```
+        ```\\n...content...\\n```
+    """
+    stripped = text.strip()
+    # Match opening fence with optional language tag (markdown, md, or bare)
+    m = re.match(r"^```(?:markdown|md)?\s*\n", stripped)
+    if m and stripped.endswith("```"):
+        stripped = stripped[m.end() :]  # remove opening fence
+        stripped = stripped[:-3].rstrip()  # remove closing fence
+    return stripped
+
+
+def _extract_metadata(content: str) -> dict[str, Any]:
+    """Extract metadata from generated Markdown content."""
+    # Count section headings
+    headings = re.findall(r"^(#{1,6})\s+(.+)$", content, re.MULTILINE)
+
+    # Word count
+    word_count = len(content.split())
+
+    # Character count
+    char_count = len(content)
+
+    return {
+        "status": "ready",
+        "word_count": word_count,
+        "char_count": char_count,
+        "section_count": len(headings),
+    }
+
+
+def create_generate_report_tool(
+    search_space_id: int,
+    db_session: AsyncSession,
+    thread_id: int | None = None,
+):
+    """
+    Factory function to create the generate_report tool with injected dependencies.
+
+    The tool generates a Markdown report inline using the search space's
+    document summary LLM, saves it to the database, and returns immediately.
+
+    Args:
+        search_space_id: The user's search space ID
+        db_session: Database session for creating the report record
+        thread_id: The chat thread ID for associating the report
+
+    Returns:
+        A configured tool function for generating reports
+    """
+
+    @tool
+    async def generate_report(
+        topic: str,
+        source_content: str,
+        report_style: str = "detailed",
+        user_instructions: str | None = None,
+        parent_report_id: int | None = None,
+    ) -> dict[str, Any]:
+        """
+        Generate a structured Markdown report from provided content.
+
+        Use this tool when the user asks to create, generate, write, produce, draft,
+        or summarize into a report-style deliverable.
+        HIGH-PRIORITY DECISION RULE:
+        - If the user asks for a report in any form,
+          call this tool rather than writing the full report directly in chat.
+        - Only skip this tool when the user explicitly requests chat-only output and
+          says they do not want a generated report card.
+        Trigger classes include:
+        - Direct trigger words: report, document, memo, letter, template
+        - Creation-intent phrases: "write a document/report/post/article"
+        - File-intent words: requests containing "save", "file", or "document" when
+          intent is to create a report-like deliverable
+        - Word-doc specific triggers: professional report-style deliverable,
+          professional document, Word doc, .docx
+        - Other report-like output intents: one-pager, blog post, article,
+          standalone written content, comprehensive guide
+        - General artifact-style intents: analysis / writing as substantial deliverables
+        Common triggers include phrases like:
+        - "Generate a report about this"
+        - "Write a report from this conversation"
+        - "Create a detailed report about..."
+        - "Make a research report on..."
+        - "Summarize this into a report"
+        - "Turn this into a report"
+        - "Write a report/document"
+        - "Draft a report"
+        - "Create an executive summary"
+        - "Make a briefing note"
+        - "Write a one-pager"
+        - "Write a blog post"
+        - "Write an article"
+        - "Create a comprehensive guide"
+        - "Prepare a report"
+        - "Create a small report"
+        - "Write a short report"
+        - "Make a quick report"
+        - "Brief report for class"
+
+        FORMAT/EXPORT RULE:
+        - Always generate the report content in Markdown.
+        - If the user requests DOCX/Word/PDF or another file format, export from
+          the generated Markdown report.
+        SOURCE-COLLECTION RULE:
+        - If enough source material is already present in the conversation (chat
+          history, pasted text, uploaded files, or a provided video/article summary),
+          generate directly from that source_content.
+        - Use knowledge-base search first only when extra context is needed beyond
+          what the user already provided.
+
+        VERSIONING — parent_report_id:
+        - Set parent_report_id when the user wants to MODIFY, REVISE, IMPROVE,
+          UPDATE, EXPAND, or ADD CONTENT TO an existing report that was already
+          generated in this conversation.
+        - This includes both explicit AND implicit modification requests. If the
+          user references the existing report using words like "it", "this",
+          "here", "the report", or clearly refers to a previously generated
+          report, treat it as a revision request.
+        - The value must be the report_id from a previous generate_report
+          result in this same conversation.
+        - Do NOT set parent_report_id when:
+          * The user asks for a report on a completely NEW/DIFFERENT topic
+          * The user says "generate another report" (new report, not a revision)
+          * There is no prior report to reference
+        - When parent_report_id is set, the previous report's content will be
+          used as a base. Your user_instructions should describe WHAT TO CHANGE.
+
+        Examples of when to SET parent_report_id:
+          User: "Make that report shorter" → parent_report_id = <previous report_id>
+          User: "Add a cost analysis section to the report" → parent_report_id = <previous report_id>
+          User: "Rewrite the report in a more formal tone" → parent_report_id = <previous report_id>
+          User: "I want more details about pricing in here" → parent_report_id = <previous report_id>
+          User: "Include more examples" → parent_report_id = <previous report_id>
+          User: "Can you also cover security in this?" → parent_report_id = <previous report_id>
+          User: "Make it more detailed" → parent_report_id = <previous report_id>
+          User: "I want more about X for in here" → parent_report_id = <previous report_id>
+
+        Examples of when to LEAVE parent_report_id as None:
+          User: "Generate a report on climate change" → parent_report_id = None (new topic)
+          User: "Write me a report about the budget" → parent_report_id = None (new topic)
+          User: "Create another report, this time about marketing" → parent_report_id = None
+
+        Args:
+            topic: A short, concise title for the report (maximum 8 words). Keep it brief and descriptive — e.g. "AI in Healthcare Analysis: A Comprehensive Report" instead of "Comprehensive Analysis of Artificial Intelligence Applications in Modern Healthcare Systems".
+            source_content: The text content to base the report on. This MUST be comprehensive and include:
+                * If discussing the current conversation: a detailed summary of the FULL chat history
+                * If based on knowledge base search: the key findings and insights from search results
+                * You can combine both: conversation context + search results for richer reports
+                * The more detailed the source_content, the better the report quality
+            report_style: Style of the report. Options: "detailed", "executive_summary", "deep_research", "brief". Default: "detailed"
+            user_instructions: Optional specific instructions for the report (e.g., "focus on financial impacts", "include recommendations"). When revising an existing report (parent_report_id is set), this should describe the changes to make.
+            parent_report_id: Optional ID of a previously generated report to revise. When set, the new report is created as a new version in the same version group. The previous report's content is included as context for the LLM to refine.
+
+        Returns:
+            A dictionary containing:
+            - status: "ready" or "failed"
+            - report_id: The report ID
+            - title: The report title
+            - word_count: Number of words in the report
+            - message: Status message (or "error" field if failed)
+        """
+        # Resolve the parent report and its group (if versioning)
+        parent_report: Report | None = None
+        report_group_id: int | None = None
+
+        if parent_report_id:
+            parent_report = await db_session.get(Report, parent_report_id)
+            if parent_report:
+                report_group_id = parent_report.report_group_id
+                logger.info(
+                    f"[generate_report] Creating new version from parent {parent_report_id} "
+                    f"(group {report_group_id})"
+                )
+            else:
+                logger.warning(
+                    f"[generate_report] parent_report_id={parent_report_id} not found, "
+                    "creating standalone report"
+                )
+
+        async def _save_failed_report(error_msg: str) -> int | None:
+            """Persist a failed report row so the error is visible later."""
+            try:
+                failed_report = Report(
+                    title=topic,
+                    content=None,
+                    report_metadata={
+                        "status": "failed",
+                        "error_message": error_msg,
+                    },
+                    report_style=report_style,
+                    search_space_id=search_space_id,
+                    thread_id=thread_id,
+                    report_group_id=report_group_id,
+                )
+                db_session.add(failed_report)
+                await db_session.commit()
+                await db_session.refresh(failed_report)
+                # If this is a new group (v1 failed), set group to self
+                if not failed_report.report_group_id:
+                    failed_report.report_group_id = failed_report.id
+                    await db_session.commit()
+                logger.info(
+                    f"[generate_report] Saved failed report {failed_report.id}: {error_msg}"
+                )
+                return failed_report.id
+            except Exception:
+                logger.exception(
+                    "[generate_report] Could not persist failed report row"
+                )
+                return None
+
+        try:
+            # Get the LLM instance for this search space
+            llm = await get_document_summary_llm(db_session, search_space_id)
+            if not llm:
+                error_msg = (
+                    "No LLM configured. Please configure a language model in Settings."
+                )
+                report_id = await _save_failed_report(error_msg)
+                return {
+                    "status": "failed",
+                    "error": error_msg,
+                    "report_id": report_id,
+                    "title": topic,
+                }
+
+            # Build the prompt
+            user_instructions_section = ""
+            if user_instructions:
+                user_instructions_section = (
+                    f"**Additional Instructions:** {user_instructions}"
+                )
+
+            # If revising, include previous version content
+            previous_version_section = ""
+            if parent_report and parent_report.content:
+                previous_version_section = (
+                    "**Previous Version of This Report (refine this based on the instructions above — "
+                    "preserve structure and quality, apply only the requested changes):**\n\n"
+                    f"{parent_report.content}"
+                )
+
+            prompt = _REPORT_PROMPT.format(
+                topic=topic,
+                report_style=report_style,
+                user_instructions_section=user_instructions_section,
+                previous_version_section=previous_version_section,
+                source_content=source_content[:100000],  # Cap source content
+            )
+
+            # Call the LLM inline
+            from langchain_core.messages import HumanMessage
+
+            response = await llm.ainvoke([HumanMessage(content=prompt)])
+            report_content = response.content
+
+            if not report_content or not isinstance(report_content, str):
+                error_msg = "LLM returned empty or invalid content"
+                report_id = await _save_failed_report(error_msg)
+                return {
+                    "status": "failed",
+                    "error": error_msg,
+                    "report_id": report_id,
+                    "title": topic,
+                }
+
+            # LLMs often wrap output in ```markdown ... ``` fences — strip them
+            # so the stored content is clean Markdown.
+            report_content = _strip_wrapping_code_fences(report_content)
+
+            if not report_content:
+                error_msg = "LLM returned empty or invalid content"
+                report_id = await _save_failed_report(error_msg)
+                return {
+                    "status": "failed",
+                    "error": error_msg,
+                    "report_id": report_id,
+                    "title": topic,
+                }
+
+            # Extract metadata (includes "status": "ready")
+            metadata = _extract_metadata(report_content)
+
+            # Save to database
+            report = Report(
+                title=topic,
+                content=report_content,
+                report_metadata=metadata,
+                report_style=report_style,
+                search_space_id=search_space_id,
+                thread_id=thread_id,
+                report_group_id=report_group_id,  # None for v1, inherited for v2+
+            )
+            db_session.add(report)
+            await db_session.commit()
+            await db_session.refresh(report)
+
+            # If this is a brand-new report (v1), set report_group_id = own id
+            if not report.report_group_id:
+                report.report_group_id = report.id
+                await db_session.commit()
+
+            logger.info(
+                f"[generate_report] Created report {report.id} "
+                f"(group={report.report_group_id}): "
+                f"{metadata.get('word_count', 0)} words, "
+                f"{metadata.get('section_count', 0)} sections"
+            )
+
+            return {
+                "status": "ready",
+                "report_id": report.id,
+                "title": topic,
+                "word_count": metadata.get("word_count", 0),
+                "message": f"Report generated successfully: {topic}",
+            }
+
+        except Exception as e:
+            error_message = str(e)
+            logger.exception(f"[generate_report] Error: {error_message}")
+            report_id = await _save_failed_report(error_message)
+
+            return {
+                "status": "failed",
+                "error": error_message,
+                "report_id": report_id,
+                "title": topic,
+            }
+
+    return generate_report