feat: implement team memory extraction and validation mechanisms, enhancing memory management by enforcing scope restrictions and improving memory persistence for shared threads

2026-04-29 19:06:24 +02:00 · 2026-04-10 01:54:00 +05:30 · 2026-04-10 01:54:00 +05:30 · a0883d2ab6
commit a0883d2ab6
parent 33626d4f91
8 changed files with 322 additions and 49 deletions
--- a/surfsense_backend/app/agents/new_chat/middleware/memory_injection.py
+++ b/surfsense_backend/app/agents/new_chat/middleware/memory_injection.py
@ -1,10 +1,8 @@
 """Memory injection middleware for the SurfSense agent.

-Loads the user's personal memory (User.memory_md) and, for shared threads,
-the team memory (SearchSpace.shared_memory_md) from the database and injects
-them into the system prompt as <user_memory> / <team_memory> XML blocks on
-every turn.  This ensures the LLM always has the full memory context without
-requiring a tool call.
+Injects memory markdown into the system prompt on every turn:
+- Private threads: only personal memory (<user_memory>)
+- Shared threads: only team memory (<team_memory>)
 """

 from __future__ import annotations
@ -58,7 +56,25 @@ class MemoryInjectionMiddleware(AgentMiddleware):  # type: ignore[type-arg]
        memory_blocks: list[str] = []

        async with shielded_async_session() as session:
-            if self.user_id is not None:
+            if self.visibility == ChatVisibility.SEARCH_SPACE:
+                team_memory = await self._load_team_memory(session)
+                if team_memory:
+                    chars = len(team_memory)
+                    memory_blocks.append(
+                        f'<team_memory chars="{chars}" limit="{MEMORY_HARD_LIMIT}">\n'
+                        f"{team_memory}\n"
+                        f"</team_memory>"
+                    )
+                    if chars > MEMORY_SOFT_LIMIT:
+                        memory_blocks.append(
+                            f"<memory_warning>Team memory is at "
+                            f"{chars:,}/{MEMORY_HARD_LIMIT:,} characters and approaching "
+                            f"the hard limit. On your next update_memory call, consolidate "
+                            f"by merging duplicates, removing outdated entries, and "
+                            f"shortening descriptions before adding anything new."
+                            f"</memory_warning>"
+                        )
+            elif self.user_id is not None:
                user_memory, display_name = await self._load_user_memory(session)
                if display_name:
                    first_name = display_name.split()[0]
@ -80,25 +96,6 @@ class MemoryInjectionMiddleware(AgentMiddleware):  # type: ignore[type-arg]
                            f"</memory_warning>"
                        )

-            if self.visibility == ChatVisibility.SEARCH_SPACE:
-                team_memory = await self._load_team_memory(session)
-                if team_memory:
-                    chars = len(team_memory)
-                    memory_blocks.append(
-                        f'<team_memory chars="{chars}" limit="{MEMORY_HARD_LIMIT}">\n'
-                        f"{team_memory}\n"
-                        f"</team_memory>"
-                    )
-                    if chars > MEMORY_SOFT_LIMIT:
-                        memory_blocks.append(
-                            f"<memory_warning>Team memory is at "
-                            f"{chars:,}/{MEMORY_HARD_LIMIT:,} characters and approaching "
-                            f"the hard limit. On your next update_memory call, consolidate "
-                            f"by merging duplicates, removing outdated entries, and "
-                            f"shortening descriptions before adding anything new."
-                            f"</memory_warning>"
-                        )
-
        if not memory_blocks:
            return None