From 8a8af948dba50c3ecbfcbe0ceae9a8adc0f9a5d9 Mon Sep 17 00:00:00 2001
From: JoeMakuta <makutajosue@gmail.com>
Date: Wed, 1 Apr 2026 13:07:27 +0200
Subject: [PATCH 001/202] feat: add experimental package import optimization
 configuration

---
 surfsense_web/next.config.ts | 10 ++++++++++
 1 file changed, 10 insertions(+)
diff --git a/surfsense_web/next.config.ts b/surfsense_web/next.config.ts
index 263b3e6f6..5414d548d 100644
--- a/surfsense_web/next.config.ts
+++ b/surfsense_web/next.config.ts
@@ -24,6 +24,16 @@ const nextConfig: NextConfig = {
 			},
 		],
 	},
+	experimental: {
+		optimizePackageImports: [
+			"lucide-react",
+			"@tabler/icons-react",
+			"date-fns",
+			"@assistant-ui/react",
+			"@assistant-ui/react-markdown",
+			"motion",
+		],
+	},
 	// Turbopack config (used during `next dev --turbopack`)
 	turbopack: {
 		rules: {

From 9d6d81871219906432e8b35260a8f5c3de6edbc6 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Wed, 1 Apr 2026 18:52:04 +0530
Subject: [PATCH 002/202] fix: add select-none class to TabBar

---
 surfsense_web/components/layout/ui/tabs/TabBar.tsx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/surfsense_web/components/layout/ui/tabs/TabBar.tsx b/surfsense_web/components/layout/ui/tabs/TabBar.tsx
index 18e1ba141..8d0d986d3 100644
--- a/surfsense_web/components/layout/ui/tabs/TabBar.tsx
+++ b/surfsense_web/components/layout/ui/tabs/TabBar.tsx
@@ -72,7 +72,7 @@ export function TabBar({ onTabSwitch, onNewChat, rightActions, className }: TabB
 	if (tabs.length <= 1) return null;
 
 	return (
-		<div className={cn("mb-2 flex h-9 items-center shrink-0 px-1 gap-0.5", className)}>
+		<div className={cn("mb-2 flex h-9 items-center shrink-0 px-1 gap-0.5 select-none", className)}>
 			<div
 				ref={scrollRef}
 				className="flex h-full items-center flex-1 gap-0.5 overflow-x-auto overflow-y-hidden scrollbar-hide [scrollbar-width:none] [-ms-overflow-style:none] [&::-webkit-scrollbar]:hidden py-1"

From fc4f9ba7c0563260e5a9e65a8e5df0ad33827c01 Mon Sep 17 00:00:00 2001
From: JoeMakuta <makutajosue@gmail.com>
Date: Wed, 1 Apr 2026 15:41:11 +0200
Subject: [PATCH 003/202] refactor: import Radix primitives from scoped packages
 for dropdown menu, separator, toggle group, toggle, tooltip, and checkbox

---
 surfsense_web/components/ui/checkbox.tsx      | 2 +-
 surfsense_web/components/ui/dropdown-menu.tsx | 2 +-
 surfsense_web/components/ui/separator.tsx     | 2 +-
 surfsense_web/components/ui/toggle-group.tsx  | 2 +-
 surfsense_web/components/ui/toggle.tsx        | 2 +-
 surfsense_web/components/ui/tooltip.tsx       | 2 +-
 6 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/surfsense_web/components/ui/checkbox.tsx b/surfsense_web/components/ui/checkbox.tsx
index 0936a383e..586e3e602 100644
--- a/surfsense_web/components/ui/checkbox.tsx
+++ b/surfsense_web/components/ui/checkbox.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { CheckIcon } from "lucide-react";
-import { Checkbox as CheckboxPrimitive } from "radix-ui";
+import * as CheckboxPrimitive from "@radix-ui/react-checkbox";
 import type * as React from "react";
 
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/components/ui/dropdown-menu.tsx b/surfsense_web/components/ui/dropdown-menu.tsx
index 24b99467e..2904b93dd 100644
--- a/surfsense_web/components/ui/dropdown-menu.tsx
+++ b/surfsense_web/components/ui/dropdown-menu.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { CheckIcon, ChevronRightIcon, CircleIcon } from "lucide-react";
-import { DropdownMenu as DropdownMenuPrimitive } from "radix-ui";
+import * as DropdownMenuPrimitive from "@radix-ui/react-dropdown-menu";
 import type * as React from "react";
 
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/components/ui/separator.tsx b/surfsense_web/components/ui/separator.tsx
index 63b8e6a69..d7cf2cd81 100644
--- a/surfsense_web/components/ui/separator.tsx
+++ b/surfsense_web/components/ui/separator.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { Separator as SeparatorPrimitive } from "radix-ui";
+import * as SeparatorPrimitive from "@radix-ui/react-separator";
 import type * as React from "react";
 
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/components/ui/toggle-group.tsx b/surfsense_web/components/ui/toggle-group.tsx
index eb212182a..33aa433b2 100644
--- a/surfsense_web/components/ui/toggle-group.tsx
+++ b/surfsense_web/components/ui/toggle-group.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import type { VariantProps } from "class-variance-authority";
-import { ToggleGroup as ToggleGroupPrimitive } from "radix-ui";
+import * as ToggleGroupPrimitive from "@radix-ui/react-toggle-group";
 import * as React from "react";
 import { toggleVariants } from "@/components/ui/toggle";
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/components/ui/toggle.tsx b/surfsense_web/components/ui/toggle.tsx
index 5841cdc35..f0e68cec9 100644
--- a/surfsense_web/components/ui/toggle.tsx
+++ b/surfsense_web/components/ui/toggle.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { cva, type VariantProps } from "class-variance-authority";
-import { Toggle as TogglePrimitive } from "radix-ui";
+import * as TogglePrimitive from "@radix-ui/react-toggle";
 import type * as React from "react";
 
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/components/ui/tooltip.tsx b/surfsense_web/components/ui/tooltip.tsx
index c19ce6f82..2fc85aae4 100644
--- a/surfsense_web/components/ui/tooltip.tsx
+++ b/surfsense_web/components/ui/tooltip.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { Tooltip as TooltipPrimitive } from "radix-ui";
+import * as TooltipPrimitive from "@radix-ui/react-tooltip";
 import type * as React from "react";
 
 import { cn } from "@/lib/utils";

From 0a65aa1a31cee5689f0f89ff00723deff5ac67f3 Mon Sep 17 00:00:00 2001
From: JoeMakuta <makutajosue@gmail.com>
Date: Wed, 1 Apr 2026 15:59:11 +0200
Subject: [PATCH 004/202] feat: dynamic import of PostHog

---
 surfsense_web/app/error.tsx                |  8 +++++--
 surfsense_web/lib/apis/base-api.service.ts | 26 ++++++++++++----------
 2 files changed, 20 insertions(+), 14 deletions(-)

diff --git a/surfsense_web/app/error.tsx b/surfsense_web/app/error.tsx
index 7bbd74e0e..3935f84d5 100644
--- a/surfsense_web/app/error.tsx
+++ b/surfsense_web/app/error.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import posthog from "posthog-js";
+
 import { useEffect } from "react";
 
 export default function ErrorPage({
@@ -11,7 +11,11 @@ export default function ErrorPage({
 	reset: () => void;
 }) {
 	useEffect(() => {
-		posthog.captureException(error);
+		import("posthog-js")
+			.then(({ default: posthog }) => {
+				posthog.captureException(error);
+			})
+			.catch(() => {});
 	}, [error]);
 
 	return (
diff --git a/surfsense_web/lib/apis/base-api.service.ts b/surfsense_web/lib/apis/base-api.service.ts
index 4c3371233..bc9e6c1d8 100644
--- a/surfsense_web/lib/apis/base-api.service.ts
+++ b/surfsense_web/lib/apis/base-api.service.ts
@@ -1,4 +1,3 @@
-import posthog from "posthog-js";
 import type { ZodType } from "zod";
 import { getBearerToken, handleUnauthorized, refreshAccessToken } from "../auth-utils";
 import { AppError, AuthenticationError, AuthorizationError, NotFoundError } from "../error";
@@ -234,18 +233,21 @@ class BaseApiService {
 		} catch (error) {
 			console.error("Request failed:", JSON.stringify(error));
 			if (!(error instanceof AuthenticationError)) {
-				try {
-					posthog.captureException(error, {
-						api_url: url,
-						api_method: options?.method ?? "GET",
-						...(error instanceof AppError && {
-							status_code: error.status,
-							status_text: error.statusText,
-						}),
+				import("posthog-js")
+					.then(({ default: posthog }) => {
+						posthog.captureException(error, {
+							api_url: url,
+							api_method: options?.method ?? "GET",
+							...(error instanceof AppError && {
+								status_code: error.status,
+								status_text: error.statusText,
+							}),
+						});
+					})
+					.catch(() => {
+						// PostHog is not available in the current environment
+						console.error("Failed to capture exception in PostHog");
 					});
-				} catch {
-					// PostHog capture failed — don't block the error flow
-				}
 			}
 			throw error;
 		}

From a42d4d219b1194a8aaab5019c6500042307f3d49 Mon Sep 17 00:00:00 2001
From: Jun Hyeok Lee <bluehyena123@naver.com>
Date: Wed, 1 Apr 2026 23:03:52 +0900
Subject: [PATCH 005/202] fix: avoid mutating shared arrays in changelog and
 comments sync

---
 surfsense_web/app/(home)/changelog/page.tsx | 2 +-
 surfsense_web/hooks/use-comments-sync.ts    | 5 +++--
 2 files changed, 4 insertions(+), 3 deletions(-)

diff --git a/surfsense_web/app/(home)/changelog/page.tsx b/surfsense_web/app/(home)/changelog/page.tsx
index 8d38cb687..c14218dab 100644
--- a/surfsense_web/app/(home)/changelog/page.tsx
+++ b/surfsense_web/app/(home)/changelog/page.tsx
@@ -29,7 +29,7 @@ interface ChangelogPageItem {
 
 export default async function ChangelogPage() {
 	const allPages = source.getPages() as ChangelogPageItem[];
-	const sortedChangelogs = allPages.sort((a, b) => {
+	const sortedChangelogs = allPages.toSorted((a, b) => {
 		const dateA = new Date(a.data.date).getTime();
 		const dateB = new Date(b.data.date).getTime();
 		return dateB - dateA;
diff --git a/surfsense_web/hooks/use-comments-sync.ts b/surfsense_web/hooks/use-comments-sync.ts
index b6a68364d..f8037c656 100644
--- a/surfsense_web/hooks/use-comments-sync.ts
+++ b/surfsense_web/hooks/use-comments-sync.ts
@@ -118,8 +118,9 @@ function transformComments(
 
 	for (const [messageId, group] of byMessage) {
 		const comments: Comment[] = group.topLevel.map((raw) => {
-			const replies = (group.replies.get(raw.id) || [])
-				.sort((a, b) => new Date(a.created_at).getTime() - new Date(b.created_at).getTime())
+			const replies = (group.replies.get(raw.id) ?? []).toSorted(
+				(a, b) => new Date(a.created_at).getTime() - new Date(b.created_at).getTime()
+			)
 				.map((r) => transformReply(r, memberMap, currentUserId, isOwner));
 
 			return {

From e6ec589e1251bcb4963bada86420daef9703dba6 Mon Sep 17 00:00:00 2001
From: JoeMakuta <makutajosue@gmail.com>
Date: Wed, 1 Apr 2026 16:10:27 +0200
Subject: [PATCH 006/202] feat: add dynamic import and dev-only render of
 ReactQueryDevtools in ReactQueryClientProvider

---
 surfsense_web/lib/query-client/query-client.provider.tsx | 9 +++++++--
 1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/surfsense_web/lib/query-client/query-client.provider.tsx b/surfsense_web/lib/query-client/query-client.provider.tsx
index 453b9f531..6dc2a4258 100644
--- a/surfsense_web/lib/query-client/query-client.provider.tsx
+++ b/surfsense_web/lib/query-client/query-client.provider.tsx
@@ -1,13 +1,18 @@
 "use client";
-import { ReactQueryDevtools } from "@tanstack/react-query-devtools";
+import dynamic from "next/dynamic";
 import { QueryClientAtomProvider } from "jotai-tanstack-query/react";
 import { queryClient } from "./client";
 
+const ReactQueryDevtools = dynamic(
+	() => import("@tanstack/react-query-devtools").then((m) => ({ default: m.ReactQueryDevtools })),
+	{ ssr: false }
+);
+
 export function ReactQueryClientProvider({ children }: { children: React.ReactNode }) {
 	return (
 		<QueryClientAtomProvider client={queryClient}>
 			{children}
-			<ReactQueryDevtools initialIsOpen={false} />
+			{process.env.NODE_ENV === "development" && <ReactQueryDevtools initialIsOpen={false} />}
 		</QueryClientAtomProvider>
 	);
 }

From 663096a074494b954c9f82a31652cf7dfc83426b Mon Sep 17 00:00:00 2001
From: Jun Hyeok Lee <bluehyena123@naver.com>
Date: Wed, 1 Apr 2026 23:23:36 +0900
Subject: [PATCH 007/202] chore: format issue 1046 frontend changes

---
 surfsense_web/hooks/use-comments-sync.ts | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/surfsense_web/hooks/use-comments-sync.ts b/surfsense_web/hooks/use-comments-sync.ts
index f8037c656..b5ea6cce7 100644
--- a/surfsense_web/hooks/use-comments-sync.ts
+++ b/surfsense_web/hooks/use-comments-sync.ts
@@ -118,9 +118,8 @@ function transformComments(
 
 	for (const [messageId, group] of byMessage) {
 		const comments: Comment[] = group.topLevel.map((raw) => {
-			const replies = (group.replies.get(raw.id) ?? []).toSorted(
-				(a, b) => new Date(a.created_at).getTime() - new Date(b.created_at).getTime()
-			)
+			const replies = (group.replies.get(raw.id) ?? [])
+				.toSorted((a, b) => new Date(a.created_at).getTime() - new Date(b.created_at).getTime())
 				.map((r) => transformReply(r, memberMap, currentUserId, isOwner));
 
 			return {

From d7dd6db1b9e4c9dc1c9b75c0f53ae3920b7453de Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Wed, 1 Apr 2026 20:31:45 +0530
Subject: [PATCH 008/202] fix: improve document loading error handling and UI
 feedback for processing state

---
 surfsense_backend/app/routes/editor_routes.py | 11 ++++--
 .../components/DocumentsTableShell.tsx        |  5 +++
 .../components/documents/DocumentNode.tsx     |  4 +--
 .../components/documents/FolderTreeView.tsx   |  7 ++--
 .../components/editor-panel/editor-panel.tsx  | 22 +++++++++---
 .../layout/ui/tabs/DocumentTabContent.tsx     | 34 +++++++++++++++----
 .../new-chat/source-detail-panel.tsx          | 10 +++---
 7 files changed, 69 insertions(+), 24 deletions(-)

diff --git a/surfsense_backend/app/routes/editor_routes.py b/surfsense_backend/app/routes/editor_routes.py
index f54f18def..0fcbc475d 100644
--- a/surfsense_backend/app/routes/editor_routes.py
+++ b/surfsense_backend/app/routes/editor_routes.py
@@ -127,9 +127,16 @@ async def get_editor_content(
     chunks = sorted(document.chunks, key=lambda c: c.id)
 
     if not chunks:
+        doc_status = document.status or {}
+        state = doc_status.get("state", "ready") if isinstance(doc_status, dict) else "ready"
+        if state in ("pending", "processing"):
+            raise HTTPException(
+                status_code=409,
+                detail="This document is still being processed. Please wait a moment and try again.",
+            )
         raise HTTPException(
             status_code=400,
-            detail="This document has no content and cannot be edited. Please re-upload to enable editing.",
+            detail="This document has no viewable content yet. It may still be syncing. Try again in a few seconds, or re-upload if the issue persists.",
         )
 
     markdown_content = "\n\n".join(chunk.content for chunk in chunks)
@@ -137,7 +144,7 @@ async def get_editor_content(
     if not markdown_content.strip():
         raise HTTPException(
             status_code=400,
-            detail="This document has empty content and cannot be edited.",
+            detail="This document appears to be empty. Try re-uploading or editing it to add content.",
         )
 
     # Persist the lazy migration
diff --git a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
index 92ced6e47..0758307f7 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
@@ -748,6 +748,7 @@ export function DocumentsTableShell({
 																	onClick={() =>
 																		onOpenInTab ? onOpenInTab(doc) : handleViewDocument(doc)
 																	}
+																	disabled={isBeingProcessed}
 																>
 																	<Eye className="h-4 w-4" />
 																	Open
@@ -1020,6 +1021,10 @@ export function DocumentsTableShell({
 						<Button
 							variant="secondary"
 							className="justify-start gap-2"
+							disabled={
+								mobileActionDoc?.status?.state === "pending" ||
+								mobileActionDoc?.status?.state === "processing"
+							}
 							onClick={() => {
 								if (mobileActionDoc) handleViewDocument(mobileActionDoc);
 								setMobileActionDoc(null);
diff --git a/surfsense_web/components/documents/DocumentNode.tsx b/surfsense_web/components/documents/DocumentNode.tsx
index dd7731f22..691a6eb0d 100644
--- a/surfsense_web/components/documents/DocumentNode.tsx
+++ b/surfsense_web/components/documents/DocumentNode.tsx
@@ -219,7 +219,7 @@ export const DocumentNode = React.memo(function DocumentNode({
 							</Button>
 						</DropdownMenuTrigger>
 						<DropdownMenuContent align="end" className="w-40" onClick={(e) => e.stopPropagation()}>
-							<DropdownMenuItem onClick={() => onPreview(doc)}>
+							<DropdownMenuItem onClick={() => onPreview(doc)} disabled={isProcessing}>
 								<Eye className="mr-2 h-4 w-4" />
 								Open
 							</DropdownMenuItem>
@@ -259,7 +259,7 @@ export const DocumentNode = React.memo(function DocumentNode({
 
 			{contextMenuOpen && (
 				<ContextMenuContent className="w-40" onClick={(e) => e.stopPropagation()}>
-					<ContextMenuItem onClick={() => onPreview(doc)}>
+					<ContextMenuItem onClick={() => onPreview(doc)} disabled={isProcessing}>
 						<Eye className="mr-2 h-4 w-4" />
 						Open
 					</ContextMenuItem>
diff --git a/surfsense_web/components/documents/FolderTreeView.tsx b/surfsense_web/components/documents/FolderTreeView.tsx
index f63d5da5c..7695923e3 100644
--- a/surfsense_web/components/documents/FolderTreeView.tsx
+++ b/surfsense_web/components/documents/FolderTreeView.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { useAtom } from "jotai";
-import { CirclePlus } from "lucide-react";
+import { Search } from "lucide-react";
 import { useCallback, useMemo, useState } from "react";
 import { DndProvider } from "react-dnd";
 import { HTML5Backend } from "react-dnd-html5-backend";
@@ -250,8 +250,9 @@ export function FolderTreeView({
 	if (treeNodes.length === 0 && (activeTypes.length > 0 || searchQuery)) {
 		return (
 			<div className="flex flex-1 flex-col items-center justify-center gap-3 px-4 py-12 text-muted-foreground">
-				<CirclePlus className="h-10 w-10 rotate-45" />
-				<p className="text-sm">No matching documents</p>
+				<Search className="h-10 w-10" />
+				<p className="text-sm text-muted-foreground">No matching documents</p>
+				<p className="text-xs text-muted-foreground/70 mt-1">Try a different search term</p>
 			</div>
 		);
 	}
diff --git a/surfsense_web/components/editor-panel/editor-panel.tsx b/surfsense_web/components/editor-panel/editor-panel.tsx
index 3ea36f800..7496e6aec 100644
--- a/surfsense_web/components/editor-panel/editor-panel.tsx
+++ b/surfsense_web/components/editor-panel/editor-panel.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { useAtomValue, useSetAtom } from "jotai";
-import { AlertCircle, XIcon } from "lucide-react";
+import { FileQuestionMark, RefreshCw, XIcon } from "lucide-react";
 import dynamic from "next/dynamic";
 import { useCallback, useEffect, useRef, useState } from "react";
 import { toast } from "sonner";
@@ -200,10 +200,22 @@ export function EditorPanelContent({
 					<EditorPanelSkeleton />
 				) : error || !editorDoc ? (
 					<div className="flex flex-1 flex-col items-center justify-center gap-3 p-6 text-center">
-						<AlertCircle className="size-8 text-destructive" />
-						<div>
-							<p className="font-medium text-foreground">Failed to load document</p>
-							<p className="text-sm text-red-500 mt-1">{error || "An unknown error occurred"}</p>
+						{error?.toLowerCase().includes("still being processed") ? (
+							<div className="rounded-full bg-muted/50 p-3">
+								<RefreshCw className="size-6 text-muted-foreground animate-spin" />
+							</div>
+						) : (
+							<div className="rounded-full bg-muted/50 p-3">
+								<FileQuestionMark className="size-6 text-muted-foreground" />
+							</div>
+						)}
+						<div className="space-y-1 max-w-xs">
+							<p className="font-medium text-foreground">
+								{error?.toLowerCase().includes("still being processed")
+									? "Document is processing"
+									: "Document unavailable"}
+							</p>
+							<p className="text-sm text-muted-foreground">{error || "An unknown error occurred"}</p>
 						</div>
 					</div>
 				) : isEditableType ? (
diff --git a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
index ac279cd4d..849bdbea5 100644
--- a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
+++ b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { AlertCircle, Pencil } from "lucide-react";
+import { FileQuestionMark, PenLine, RefreshCw } from "lucide-react";
 import { useCallback, useEffect, useRef, useState } from "react";
 import { toast } from "sonner";
 import { PlateEditor } from "@/components/editor/plate-editor";
@@ -160,15 +160,35 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 	if (isLoading) return <DocumentSkeleton />;
 
 	if (error || !doc) {
+		const isProcessing = error?.toLowerCase().includes("still being processed");
 		return (
-			<div className="flex flex-1 flex-col items-center justify-center gap-3 p-6 text-center">
-				<AlertCircle className="size-10 text-destructive" />
-				<div>
-					<p className="font-medium text-foreground text-lg">Failed to load document</p>
-					<p className="text-sm text-muted-foreground mt-1">
+			<div className="flex flex-1 flex-col items-center justify-center gap-4 p-8 text-center">
+				<div className="rounded-full bg-muted/50 p-4">
+					{isProcessing ? (
+						<RefreshCw className="size-8 text-muted-foreground animate-spin" />
+					) : (
+						<FileQuestionMark className="size-8 text-muted-foreground" />
+					)}
+				</div>
+				<div className="space-y-1.5 max-w-sm">
+					<p className="font-semibold text-foreground text-lg">
+						{isProcessing ? "Document is processing" : "Document unavailable"}
+					</p>
+					<p className="text-sm text-muted-foreground">
 						{error || "An unknown error occurred"}
 					</p>
 				</div>
+				{!isProcessing && (
+					<Button
+						variant="outline"
+						size="sm"
+						className="mt-1 gap-1.5"
+						onClick={() => window.location.reload()}
+					>
+						<RefreshCw className="size-3.5" />
+						Retry
+					</Button>
+				)}
 			</div>
 		);
 	}
@@ -229,7 +249,7 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 						onClick={() => setIsEditing(true)}
 						className="gap-1.5"
 					>
-						<Pencil className="size-3.5" />
+						<PenLine className="size-3.5" />
 						Edit
 					</Button>
 				)}
diff --git a/surfsense_web/components/new-chat/source-detail-panel.tsx b/surfsense_web/components/new-chat/source-detail-panel.tsx
index b02b2e217..9c1167efe 100644
--- a/surfsense_web/components/new-chat/source-detail-panel.tsx
+++ b/surfsense_web/components/new-chat/source-detail-panel.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { useQuery } from "@tanstack/react-query";
-import { BookOpen, ChevronDown, ExternalLink, FileText, Hash, Sparkles, X } from "lucide-react";
+import { BookOpen, ChevronDown, ExternalLink, FileQuestionMark, FileText, Hash, Sparkles, X } from "lucide-react";
 import { AnimatePresence, motion, useReducedMotion } from "motion/react";
 import { useTranslations } from "next-intl";
 import type React from "react";
@@ -392,12 +392,12 @@ export function SourceDetailPanel({
 									animate={{ opacity: 1, scale: 1 }}
 									className="flex flex-col items-center gap-4 text-center px-6"
 								>
-									<div className="w-20 h-20 rounded-full bg-destructive/10 flex items-center justify-center">
-										<X className="h-10 w-10 text-destructive" />
+									<div className="w-20 h-20 rounded-full bg-muted/50 flex items-center justify-center">
+										<FileQuestionMark className="h-10 w-10 text-muted-foreground" />
 									</div>
 									<div>
-										<p className="font-semibold text-destructive text-lg">
-											Failed to load document
+										<p className="font-semibold text-foreground text-lg">
+											Document unavailable
 										</p>
 										<p className="text-sm text-muted-foreground mt-2 max-w-md">
 											{documentByChunkFetchingError.message ||

From 5c11a15fb6534c55e3e50e49caac4e4ee3703cec Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Wed, 1 Apr 2026 20:51:55 +0530
Subject: [PATCH 009/202] refactor: update UI components by removing unused
 imports and adjusting loading states

---
 .../components/CommunityPromptsContent.tsx    |  2 +-
 .../components/PromptsContent.tsx             |  6 ++--
 .../components/editor-panel/editor-panel.tsx  | 29 +++++++++----------
 .../layout/ui/right-panel/RightPanel.tsx      |  2 +-
 .../settings/image-model-manager.tsx          |  3 +-
 .../settings/model-config-manager.tsx         |  2 --
 6 files changed, 20 insertions(+), 24 deletions(-)

diff --git a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/CommunityPromptsContent.tsx b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/CommunityPromptsContent.tsx
index 4bcdcba7e..239832b2d 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/CommunityPromptsContent.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/CommunityPromptsContent.tsx
@@ -60,7 +60,7 @@ export function CommunityPromptsContent() {
 
 			{list.length === 0 && (
 				<div className="rounded-lg border border-dashed border-border/60 p-8 text-center">
-					<Globe className="mx-auto size-8 text-muted-foreground/40" />
+					<Globe className="mx-auto size-8 text-muted-foreground" />
 					<p className="mt-2 text-sm text-muted-foreground">No community prompts yet</p>
 					<p className="text-xs text-muted-foreground/60">
 						Share your own prompts from the My Prompts tab
diff --git a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/PromptsContent.tsx b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/PromptsContent.tsx
index 522d71e59..39362d244 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/PromptsContent.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/PromptsContent.tsx
@@ -1,7 +1,8 @@
 "use client";
 
 import { useAtomValue } from "jotai";
-import { AlertTriangle, Globe, Lock, PenLine, Plus, Sparkles, Trash2 } from "lucide-react";
+import { AlertTriangle, Globe, Lock, PenLine, Sparkles, Trash2 } from "lucide-react";
+import { ShortcutKbd } from "@/components/ui/shortcut-kbd";
 import { useCallback, useState } from "react";
 import { toast } from "sonner";
 import {
@@ -145,7 +146,7 @@ export function PromptsContent() {
 			<div className="flex items-center justify-between">
 				<p className="text-sm text-muted-foreground">
 					Create prompt templates triggered with{" "}
-					<kbd className="rounded border bg-muted px-1.5 py-0.5 text-xs font-mono">/</kbd> in the
+					<ShortcutKbd keys={["/"]} className="ml-0" /> in the
 					chat composer.
 				</p>
 				{!showForm && (
@@ -158,7 +159,6 @@ export function PromptsContent() {
 						}}
 						className="shrink-0 gap-1.5"
 					>
-						<Plus className="size-3.5" />
 						New
 					</Button>
 				)}
diff --git a/surfsense_web/components/editor-panel/editor-panel.tsx b/surfsense_web/components/editor-panel/editor-panel.tsx
index 7496e6aec..802a5ffc3 100644
--- a/surfsense_web/components/editor-panel/editor-panel.tsx
+++ b/surfsense_web/components/editor-panel/editor-panel.tsx
@@ -9,24 +9,9 @@ import { closeEditorPanelAtom, editorPanelAtom } from "@/atoms/editor/editor-pan
 import { MarkdownViewer } from "@/components/markdown-viewer";
 import { Button } from "@/components/ui/button";
 import { Drawer, DrawerContent, DrawerHandle, DrawerTitle } from "@/components/ui/drawer";
-import { Skeleton } from "@/components/ui/skeleton";
 import { useMediaQuery } from "@/hooks/use-media-query";
 import { authenticatedFetch, getBearerToken, redirectToLogin } from "@/lib/auth-utils";
 
-const PlateEditor = dynamic(
-	() => import("@/components/editor/plate-editor").then((m) => ({ default: m.PlateEditor })),
-	{ ssr: false, loading: () => <Skeleton className="h-64 w-full" /> }
-);
-
-interface EditorContent {
-	document_id: number;
-	title: string;
-	document_type?: string;
-	source_markdown: string;
-}
-
-const EDITABLE_DOCUMENT_TYPES = new Set(["FILE", "NOTE"]);
-
 function EditorPanelSkeleton() {
 	return (
 		<div className="space-y-6 p-6">
@@ -47,6 +32,20 @@ function EditorPanelSkeleton() {
 	);
 }
 
+const PlateEditor = dynamic(
+	() => import("@/components/editor/plate-editor").then((m) => ({ default: m.PlateEditor })),
+	{ ssr: false, loading: () => null }
+);
+
+interface EditorContent {
+	document_id: number;
+	title: string;
+	document_type?: string;
+	source_markdown: string;
+}
+
+const EDITABLE_DOCUMENT_TYPES = new Set(["FILE", "NOTE"]);
+
 export function EditorPanelContent({
 	documentId,
 	searchSpaceId,
diff --git a/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx b/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx
index ac2f65065..717f5a459 100644
--- a/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx
+++ b/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx
@@ -19,7 +19,7 @@ const EditorPanelContent = dynamic(
 		import("@/components/editor-panel/editor-panel").then((m) => ({
 			default: m.EditorPanelContent,
 		})),
-	{ ssr: false, loading: () => <Skeleton className="h-96 w-full" /> }
+	{ ssr: false, loading: () => null }
 );
 
 const HitlEditPanelContent = dynamic(
diff --git a/surfsense_web/components/settings/image-model-manager.tsx b/surfsense_web/components/settings/image-model-manager.tsx
index 8f08b7db3..0c45af7d4 100644
--- a/surfsense_web/components/settings/image-model-manager.tsx
+++ b/surfsense_web/components/settings/image-model-manager.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { useAtomValue } from "jotai";
-import { AlertCircle, Edit3, Info, Plus, RefreshCw, Trash2, Wand2 } from "lucide-react";
+import { AlertCircle, Edit3, Info, RefreshCw, Trash2, Wand2 } from "lucide-react";
 import { useMemo, useState } from "react";
 import { deleteImageGenConfigMutationAtom } from "@/atoms/image-gen-config/image-gen-config-mutation.atoms";
 import {
@@ -257,7 +257,6 @@ export function ImageModelManager({ searchSpaceId }: ImageModelManagerProps) {
 										size="lg"
 										className="gap-2 text-xs md:text-sm h-9 md:h-10"
 									>
-										<Plus className="h-3 w-3 md:h-4 md:w-4" />
 										Add First Image Model
 									</Button>
 								)}
diff --git a/surfsense_web/components/settings/model-config-manager.tsx b/surfsense_web/components/settings/model-config-manager.tsx
index 046288a96..50d2ab5b7 100644
--- a/surfsense_web/components/settings/model-config-manager.tsx
+++ b/surfsense_web/components/settings/model-config-manager.tsx
@@ -7,7 +7,6 @@ import {
 	FileText,
 	Info,
 	MessageSquareQuote,
-	Plus,
 	RefreshCw,
 	Trash2,
 	Wand2,
@@ -270,7 +269,6 @@ export function ModelConfigManager({ searchSpaceId }: ModelConfigManagerProps) {
 											size="lg"
 											className="gap-2 text-xs md:text-sm h-9 md:h-10"
 										>
-											<Plus className="h-3 w-3 md:h-4 md:w-4" />
 											Create First Configuration
 										</Button>
 									)}

From 33e7aeef9d275a49ad0b7e74a46244b42d4ef547 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Wed, 1 Apr 2026 21:00:52 +0530
Subject: [PATCH 010/202] style: enhance input field focus styles and
 transition effects in login and registration forms

---
 .../app/(home)/login/LocalLoginForm.tsx       |  20 +--
 surfsense_web/app/(home)/register/page.tsx    | 142 +++++++++---------
 2 files changed, 81 insertions(+), 81 deletions(-)

diff --git a/surfsense_web/app/(home)/login/LocalLoginForm.tsx b/surfsense_web/app/(home)/login/LocalLoginForm.tsx
index ee3b47683..1ebbf46b6 100644
--- a/surfsense_web/app/(home)/login/LocalLoginForm.tsx
+++ b/surfsense_web/app/(home)/login/LocalLoginForm.tsx
@@ -160,11 +160,11 @@ export function LocalLoginForm() {
 						placeholder="you@example.com"
 						value={username}
 						onChange={(e) => setUsername(e.target.value)}
-						className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-2 focus:ring-offset-2 bg-background text-foreground transition-all ${
-							error.title
-								? "border-destructive focus:border-destructive focus:ring-destructive"
-								: "border-border focus:border-primary focus:ring-primary"
-						}`}
+					className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
+						error.title
+							? "border-destructive focus:border-destructive focus:ring-destructive/40"
+							: "border-border focus:border-primary focus:ring-primary/40"
+					}`}
 						disabled={isLoggingIn}
 					/>
 				</div>
@@ -181,11 +181,11 @@ export function LocalLoginForm() {
 							placeholder="Enter your password"
 							value={password}
 							onChange={(e) => setPassword(e.target.value)}
-							className={`mt-1 block w-full rounded-md border pr-10 px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-2 focus:ring-offset-2 bg-background text-foreground transition-all ${
-								error.title
-									? "border-destructive focus:border-destructive focus:ring-destructive"
-									: "border-border focus:border-primary focus:ring-primary"
-							}`}
+						className={`mt-1 block w-full rounded-md border pr-10 px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
+							error.title
+								? "border-destructive focus:border-destructive focus:ring-destructive/40"
+								: "border-border focus:border-primary focus:ring-primary/40"
+						}`}
 							disabled={isLoggingIn}
 						/>
 						<button
diff --git a/surfsense_web/app/(home)/register/page.tsx b/surfsense_web/app/(home)/register/page.tsx
index b9200c68f..3161da4a7 100644
--- a/surfsense_web/app/(home)/register/page.tsx
+++ b/surfsense_web/app/(home)/register/page.tsx
@@ -229,78 +229,78 @@ export default function RegisterPage() {
 						</AnimatePresence>
 
 						<div>
-							<label
-								htmlFor="email"
-								className="block text-sm font-medium text-gray-700 dark:text-gray-300"
-							>
-								{t("email")}
-							</label>
-							<input
-								id="email"
-								type="email"
-								required
-								placeholder="you@example.com"
-								value={email}
-								onChange={(e) => setEmail(e.target.value)}
-								className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-2 focus:ring-offset-2 dark:bg-gray-800 dark:text-white transition-all ${
-									error.title
-										? "border-red-300 focus:border-red-500 focus:ring-red-500 dark:border-red-700"
-										: "border-gray-300 focus:border-blue-500 focus:ring-blue-500 dark:border-gray-700"
-								}`}
-								disabled={isRegistering}
-							/>
-						</div>
+						<label
+							htmlFor="email"
+							className="block text-sm font-medium text-foreground"
+						>
+							{t("email")}
+						</label>
+						<input
+							id="email"
+							type="email"
+							required
+							placeholder="you@example.com"
+							value={email}
+							onChange={(e) => setEmail(e.target.value)}
+						className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
+							error.title
+								? "border-destructive focus:border-destructive focus:ring-destructive/40"
+								: "border-border focus:border-primary focus:ring-primary/40"
+						}`}
+						disabled={isRegistering}
+					/>
+					</div>
 
-						<div>
-							<label
-								htmlFor="password"
-								className="block text-sm font-medium text-gray-700 dark:text-gray-300"
-							>
-								{t("password")}
-							</label>
-							<input
-								id="password"
-								type="password"
-								required
-								placeholder="Enter your password"
-								value={password}
-								onChange={(e) => setPassword(e.target.value)}
-								className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-2 focus:ring-offset-2 dark:bg-gray-800 dark:text-white transition-all ${
-									error.title
-										? "border-red-300 focus:border-red-500 focus:ring-red-500 dark:border-red-700"
-										: "border-gray-300 focus:border-blue-500 focus:ring-blue-500 dark:border-gray-700"
-								}`}
-								disabled={isRegistering}
-							/>
-						</div>
+					<div>
+						<label
+							htmlFor="password"
+							className="block text-sm font-medium text-foreground"
+						>
+							{t("password")}
+						</label>
+						<input
+							id="password"
+							type="password"
+							required
+							placeholder="Enter your password"
+							value={password}
+							onChange={(e) => setPassword(e.target.value)}
+							className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
+								error.title
+									? "border-destructive focus:border-destructive focus:ring-destructive/40"
+									: "border-border focus:border-primary focus:ring-primary/40"
+							}`}
+							disabled={isRegistering}
+						/>
+					</div>
 
-						<div>
-							<label
-								htmlFor="confirmPassword"
-								className="block text-sm font-medium text-gray-700 dark:text-gray-300"
-							>
-								{t("confirm_password")}
-							</label>
-							<input
-								id="confirmPassword"
-								type="password"
-								required
-								placeholder="Confirm your password"
-								value={confirmPassword}
-								onChange={(e) => setConfirmPassword(e.target.value)}
-								className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-2 focus:ring-offset-2 dark:bg-gray-800 dark:text-white transition-all ${
-									error.title
-										? "border-red-300 focus:border-red-500 focus:ring-red-500 dark:border-red-700"
-										: "border-gray-300 focus:border-blue-500 focus:ring-blue-500 dark:border-gray-700"
-								}`}
-								disabled={isRegistering}
-							/>
+					<div>
+						<label
+							htmlFor="confirmPassword"
+							className="block text-sm font-medium text-foreground"
+						>
+							{t("confirm_password")}
+						</label>
+						<input
+							id="confirmPassword"
+							type="password"
+							required
+							placeholder="Confirm your password"
+							value={confirmPassword}
+							onChange={(e) => setConfirmPassword(e.target.value)}
+							className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
+								error.title
+									? "border-destructive focus:border-destructive focus:ring-destructive/40"
+									: "border-border focus:border-primary focus:ring-primary/40"
+							}`}
+							disabled={isRegistering}
+						/>
 						</div>
 
 						<button
 							type="submit"
 							disabled={isRegistering}
-							className="relative w-full rounded-md bg-blue-600 px-4 py-1.5 md:py-2 text-white shadow-sm hover:bg-blue-700 focus:outline-none focus:ring-2 focus:ring-blue-500 focus:ring-offset-2 disabled:cursor-not-allowed disabled:opacity-50 transition-all text-sm md:text-base flex items-center justify-center gap-2"
+							className="relative w-full rounded-md bg-primary px-4 py-1.5 md:py-2 text-primary-foreground shadow-sm hover:bg-primary/90 focus:outline-none focus:ring-1 focus:ring-primary/40 disabled:cursor-not-allowed disabled:opacity-50 transition-all text-sm md:text-base flex items-center justify-center gap-2"
 						>
 							<span className={isRegistering ? "invisible" : ""}>{t("register")}</span>
 							{isRegistering && (
@@ -312,12 +312,12 @@ export default function RegisterPage() {
 					</form>
 
 					<div className="mt-4 text-center text-sm">
-						<p className="text-gray-600 dark:text-gray-400">
-							{t("already_have_account")}{" "}
-							<Link
-								href="/login"
-								className="font-medium text-blue-600 hover:text-blue-500 dark:text-blue-400"
-							>
+					<p className="text-muted-foreground">
+						{t("already_have_account")}{" "}
+						<Link
+							href="/login"
+							className="font-medium text-primary hover:text-primary/90"
+						>
 								{t("sign_in")}
 							</Link>
 						</p>

From 03a24686fe6553101275491e8a89c56f8eb5ca82 Mon Sep 17 00:00:00 2001
From: JoeMakuta <makutajosue@gmail.com>
Date: Wed, 1 Apr 2026 18:47:57 +0200
Subject: [PATCH 011/202] feat: replace repeated Array.find lookups with Map lookups

---
 .../[search_space_id]/new-chat/[[...chat_id]]/page.tsx   | 9 +++++----
 surfsense_web/hooks/use-documents.ts                     | 4 +++-
 surfsense_web/hooks/use-inbox.ts                         | 4 +++-
 3 files changed, 11 insertions(+), 6 deletions(-)

diff --git a/surfsense_web/app/dashboard/[search_space_id]/new-chat/[[...chat_id]]/page.tsx b/surfsense_web/app/dashboard/[search_space_id]/new-chat/[[...chat_id]]/page.tsx
index a594b740d..f80b3a87f 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/new-chat/[[...chat_id]]/page.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/new-chat/[[...chat_id]]/page.tsx
@@ -228,13 +228,14 @@ export default function NewChatPage() {
 					return prev;
 				}
 
+				const memberById = new Map(membersData?.map((m) => [m.user_id, m]) ?? []);
+				const prevById = new Map(prev.map((m) => [m.id, m]));
+
 				return syncedMessages.map((msg) => {
-					const member = msg.author_id
-						? membersData?.find((m) => m.user_id === msg.author_id)
-						: null;
+					const member = msg.author_id ? memberById.get(msg.author_id) ?? null : null;
 
 					// Preserve existing author info if member lookup fails (e.g., cloned chats)
-					const existingMsg = prev.find((m) => m.id === `msg-${msg.id}`);
+					const existingMsg = prevById.get(`msg-${msg.id}`);
 					const existingAuthor = existingMsg?.metadata?.custom?.author as
 						| { displayName?: string | null; avatarUrl?: string | null }
 						| undefined;
diff --git a/surfsense_web/hooks/use-documents.ts b/surfsense_web/hooks/use-documents.ts
index df782ca83..b01adc10a 100644
--- a/surfsense_web/hooks/use-documents.ts
+++ b/surfsense_web/hooks/use-documents.ts
@@ -246,9 +246,11 @@ export function useDocuments(
 					status: (doc.status as unknown as DocumentStatusType) ?? { state: "ready" },
 				}));
 
+			const liveById = new Map(validItems.map((v) => [v.id, v]));
+
 			let updated = prev.map((existing) => {
 				if (liveIds.has(existing.id)) {
-					const liveItem = validItems.find((v) => v.id === existing.id);
+					const liveItem = liveById.get(existing.id);
 					if (liveItem) {
 						return {
 							...existing,
diff --git a/surfsense_web/hooks/use-inbox.ts b/surfsense_web/hooks/use-inbox.ts
index 4203c3506..e1070219a 100644
--- a/surfsense_web/hooks/use-inbox.ts
+++ b/surfsense_web/hooks/use-inbox.ts
@@ -157,8 +157,10 @@ export function useInbox(
 						}) as InboxItem
 				);
 
+			const liveById = new Map(recentItems.map((v) => [v.id, v]));
+
 			let updated = prev.map((existing) => {
-				const liveItem = recentItems.find((v) => v.id === existing.id);
+				const liveItem = liveById.get(existing.id);
 				if (liveItem) {
 					return {
 						...existing,

From 917ec444bb5b5b07b5dbffdb446eb35561984f1f Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Wed, 1 Apr 2026 23:00:45 +0530
Subject: [PATCH 012/202] style: add overscroll-none class to ComposerAction
 component

---
 surfsense_web/components/assistant-ui/thread.tsx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/surfsense_web/components/assistant-ui/thread.tsx b/surfsense_web/components/assistant-ui/thread.tsx
index 2cf0393da..53770ef83 100644
--- a/surfsense_web/components/assistant-ui/thread.tsx
+++ b/surfsense_web/components/assistant-ui/thread.tsx
@@ -1063,7 +1063,7 @@ const ComposerAction: FC<ComposerActionProps> = ({ isBlockedByOtherUser = false
 						>
 							<div className="sr-only">Manage Tools</div>
 							<div
-								className="max-h-48 sm:max-h-64 overflow-y-auto py-0.5 sm:py-1"
+								className="max-h-48 sm:max-h-64 overflow-y-auto overscroll-none py-0.5 sm:py-1"
 								onScroll={handleToolsScroll}
 								style={{
 									maskImage: `linear-gradient(to bottom, ${toolsScrollPos === "top" ? "black" : "transparent"}, black 16px, black calc(100% - 16px), ${toolsScrollPos === "bottom" ? "black" : "transparent"})`,

From 1f8f71b542e5bb8d96c8bea7b1122f41240e076e Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 00:22:10 +0530
Subject: [PATCH 013/202] chore: add chokidar dependency for file watching

---
 surfsense_desktop/package.json   |  1 +
 surfsense_desktop/pnpm-lock.yaml | 17 +++++++++++++++++
 2 files changed, 18 insertions(+)

diff --git a/surfsense_desktop/package.json b/surfsense_desktop/package.json
index bd0cc67ab..5bbd50514 100644
--- a/surfsense_desktop/package.json
+++ b/surfsense_desktop/package.json
@@ -27,6 +27,7 @@
     "wait-on": "^9.0.4"
   },
   "dependencies": {
+    "chokidar": "^5.0.0",
     "electron-updater": "^6.8.3",
     "get-port-please": "^3.2.0"
   }
diff --git a/surfsense_desktop/pnpm-lock.yaml b/surfsense_desktop/pnpm-lock.yaml
index ea65be0bb..1533803fb 100644
--- a/surfsense_desktop/pnpm-lock.yaml
+++ b/surfsense_desktop/pnpm-lock.yaml
@@ -8,6 +8,9 @@ importers:
 
   .:
     dependencies:
+      chokidar:
+        specifier: ^5.0.0
+        version: 5.0.0
       electron-updater:
         specifier: ^6.8.3
         version: 6.8.3
@@ -477,6 +480,10 @@ packages:
     resolution: {integrity: sha512-oKnbhFyRIXpUuez8iBMmyEa4nbj4IOQyuhc/wy9kY7/WVPcwIO9VA668Pu8RkO7+0G76SLROeyw9CpQ061i4mA==}
     engines: {node: '>=10'}
 
+  chokidar@5.0.0:
+    resolution: {integrity: sha512-TQMmc3w+5AxjpL8iIiwebF73dRDF4fBIieAqGn9RGCWaEVwQ6Fb2cGe31Yns0RRIzii5goJ1Y7xbMwo1TxMplw==}
+    engines: {node: '>= 20.19.0'}
+
   chownr@3.0.0:
     resolution: {integrity: sha512-+IxzY9BZOQd/XuYPRmrvEVjF/nqj5kgT4kEq7VofrDoM1MxoRjEWkrCC3EtLi59TVawxTAn+orJwFQcrqEN1+g==}
     engines: {node: '>=18'}
@@ -1222,6 +1229,10 @@ packages:
     resolution: {integrity: sha512-9u/sniCrY3D5WdsERHzHE4G2YCXqoG5FTHUiCC4SIbr6XcLZBY05ya9EKjYek9O5xOAwjGq+1JdGBAS7Q9ScoA==}
     engines: {node: '>= 6'}
 
+  readdirp@5.0.0:
+    resolution: {integrity: sha512-9u/XQ1pvrQtYyMpZe7DXKv2p5CNvyVwzUB6uhLAnQwHMSgKMBR62lc7AHljaeteeHXn11XTAaLLUVZYVZyuRBQ==}
+    engines: {node: '>= 20.19.0'}
+
   require-directory@2.1.1:
     resolution: {integrity: sha512-fGxEI7+wsG9xrvdjsrlmL22OMTTiHRwAMroiEeMgq8gzoLC/PQr7RsRDSTLUg/bZAZtF+TVIkHc6/4RIKrui+Q==}
     engines: {node: '>=0.10.0'}
@@ -2019,6 +2030,10 @@ snapshots:
       ansi-styles: 4.3.0
       supports-color: 7.2.0
 
+  chokidar@5.0.0:
+    dependencies:
+      readdirp: 5.0.0
+
   chownr@3.0.0: {}
 
   chromium-pickle-js@0.2.0: {}
@@ -2863,6 +2878,8 @@ snapshots:
       string_decoder: 1.3.0
       util-deprecate: 1.0.2
 
+  readdirp@5.0.0: {}
+
   require-directory@2.1.1: {}
 
   resedit@1.7.2:

From 5bfeda62f2c9ab96717521e99374bb25b0686bda Mon Sep 17 00:00:00 2001
From: SohamBhattacharjee2003
 <125297948+SohamBhattacharjee2003@users.noreply.github.com>
Date: Thu, 2 Apr 2026 01:45:18 +0530
Subject: [PATCH 014/202] perf: use useDeferredValue for search/filter
 transitions

- prompt-picker: defer externalSearch before filtering prompt list
- document-mention-picker: defer debouncedSearch for client-side single-char filtering
- InboxSidebar: defer activeSource.items and searchResponse.items before filteredItems memo

Keeps search inputs responsive under React 18 concurrent rendering by marking
expensive filtering computations as non-urgent updates (rule: rerender-transitions 5.11)
---
 .../layout/ui/sidebar/InboxSidebar.tsx        | 19 +++++++++----------
 .../new-chat/document-mention-picker.tsx      | 10 ++++++++--
 .../components/new-chat/prompt-picker.tsx     | 17 +++++++++++------
 3 files changed, 28 insertions(+), 18 deletions(-)

diff --git a/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
index 03f2bc982..61eda2a88 100644
--- a/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
@@ -20,7 +20,7 @@ import {
 } from "lucide-react";
 import { useParams, useRouter } from "next/navigation";
 import { useTranslations } from "next-intl";
-import { useCallback, useEffect, useMemo, useRef, useState } from "react";
+import { useCallback, useDeferredValue, useEffect, useMemo, useRef, useState } from "react";
 import { getDocumentTypeLabel } from "@/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentTypeIcon";
 import { setTargetCommentIdAtom } from "@/atoms/chat/current-thread.atom";
 import { convertRenderedToDisplay } from "@/components/chat-comments/comment-item/comment-item";
@@ -289,15 +289,14 @@ export function InboxSidebarContent({
 		[activeFilter]
 	);
 
+	// Defer non-urgent list updates so the search input stays responsive.
+	// The deferred snapshot intentionally lags behind the live value until React commits the background re-render.
+	const deferredTabItems = useDeferredValue(activeSource.items);
+	const deferredSearchItems = useDeferredValue(searchResponse?.items ?? []);
+
 	// Two data paths: search mode (API) or default (per-tab data source)
 	const filteredItems = useMemo(() => {
-		let tabItems: InboxItem[];
-
-		if (isSearchMode) {
-			tabItems = searchResponse?.items ?? [];
-		} else {
-			tabItems = activeSource.items;
-		}
+		const tabItems: InboxItem[] = isSearchMode ? deferredSearchItems : deferredTabItems;
 
 		let result = tabItems;
 		if (activeFilter !== "all") {
@@ -310,8 +309,8 @@ export function InboxSidebarContent({
 		return result;
 	}, [
 		isSearchMode,
-		searchResponse,
-		activeSource.items,
+		deferredSearchItems,
+		deferredTabItems,
 		activeTab,
 		activeFilter,
 		selectedSource,
diff --git a/surfsense_web/components/new-chat/document-mention-picker.tsx b/surfsense_web/components/new-chat/document-mention-picker.tsx
index ee053a9f5..9c6521f31 100644
--- a/surfsense_web/components/new-chat/document-mention-picker.tsx
+++ b/surfsense_web/components/new-chat/document-mention-picker.tsx
@@ -4,6 +4,7 @@ import { keepPreviousData, useQuery } from "@tanstack/react-query";
 import {
 	forwardRef,
 	useCallback,
+	useDeferredValue,
 	useEffect,
 	useImperativeHandle,
 	useMemo,
@@ -81,6 +82,9 @@ export const DocumentMentionPicker = forwardRef<
 	// Debounced search value to minimize API calls and prevent race conditions
 	const search = externalSearch;
 	const debouncedSearch = useDebounced(search, DEBOUNCE_MS);
+	// Deferred snapshot of debouncedSearch — client-side filtering uses this so it
+	// is treated as a non-urgent update, keeping the input responsive.
+	const deferredSearch = useDeferredValue(debouncedSearch);
 	const [highlightedIndex, setHighlightedIndex] = useState(0);
 	const itemRefs = useRef<Map<number, HTMLButtonElement>>(new Map());
 	const scrollContainerRef = useRef<HTMLDivElement>(null);
@@ -245,12 +249,14 @@ export const DocumentMentionPicker = forwardRef<
 	 * Client-side filtering for single character searches.
 	 * Filters cached documents locally for instant feedback without additional API calls.
 	 * Server-side search is reserved for 2+ character queries to leverage database indexing.
+	 * Uses deferredSearch (a deferred snapshot of debouncedSearch) so this memo is treated
+	 * as non-urgent — React can interrupt it to keep the input responsive.
 	 */
 	const clientFilteredDocs = useMemo(() => {
 		if (!isSingleCharSearch) return null;
-		const searchLower = debouncedSearch.trim().toLowerCase();
+		const searchLower = deferredSearch.trim().toLowerCase();
 		return accumulatedDocuments.filter((doc) => doc.title.toLowerCase().includes(searchLower));
-	}, [isSingleCharSearch, debouncedSearch, accumulatedDocuments]);
+	}, [isSingleCharSearch, deferredSearch, accumulatedDocuments]);
 
 	// Select data source based on search length: client-filtered for single char, server results for 2+
 	const actualDocuments = isSingleCharSearch ? (clientFilteredDocs ?? []) : accumulatedDocuments;
diff --git a/surfsense_web/components/new-chat/prompt-picker.tsx b/surfsense_web/components/new-chat/prompt-picker.tsx
index 9fc435111..3e6457b8c 100644
--- a/surfsense_web/components/new-chat/prompt-picker.tsx
+++ b/surfsense_web/components/new-chat/prompt-picker.tsx
@@ -5,6 +5,7 @@ import { Plus, Zap } from "lucide-react";
 import {
 	forwardRef,
 	useCallback,
+	useDeferredValue,
 	useEffect,
 	useImperativeHandle,
 	useMemo,
@@ -41,15 +42,19 @@ export const PromptPicker = forwardRef<PromptPickerRef, PromptPickerProps>(funct
 	const shouldScrollRef = useRef(false);
 	const itemRefs = useRef<Map<number, HTMLButtonElement>>(new Map());
 
+	// Defer the search value so filtering is non-urgent and the input stays responsive
+	const deferredSearch = useDeferredValue(externalSearch);
+
 	const filtered = useMemo(() => {
 		const list = prompts ?? [];
-		if (!externalSearch) return list;
-		return list.filter((a) => a.name.toLowerCase().includes(externalSearch.toLowerCase()));
-	}, [prompts, externalSearch]);
+		if (!deferredSearch) return list;
+		return list.filter((a) => a.name.toLowerCase().includes(deferredSearch.toLowerCase()));
+	}, [prompts, deferredSearch]);
 
-	const prevSearchRef = useRef(externalSearch);
-	if (prevSearchRef.current !== externalSearch) {
-		prevSearchRef.current = externalSearch;
+	// Reset highlight when the deferred (filtered) search changes
+	const prevSearchRef = useRef(deferredSearch);
+	if (prevSearchRef.current !== deferredSearch) {
+		prevSearchRef.current = deferredSearch;
 		if (highlightedIndex !== 0) {
 			setHighlightedIndex(0);
 		}

From ae3b69443ff4b7422e66686c746dbe92d700d7a2 Mon Sep 17 00:00:00 2001
From: SohamBhattacharjee2003
 <125297948+SohamBhattacharjee2003@users.noreply.github.com>
Date: Thu, 2 Apr 2026 02:26:55 +0530
Subject: [PATCH 015/202] perf: add content-visibility: auto to long list items

Apply content-visibility: auto to off-screen list and sidebar items
to skip browser layout and painting until they scroll into view.

Changes:
- globals.css: add .list-item-lazy (48px) and .sidebar-item-lazy (40px) utilities
- DocumentsTableShell: apply list-item-lazy to desktop <tr> rows and mobile card divs
- AllPrivateChatsSidebar: apply sidebar-item-lazy to thread items
- AllSharedChatsSidebar: apply sidebar-item-lazy to thread items
- InboxSidebar: apply content-visibility inline (80px intrinsic height) to inbox items

Implements Vercel React Best Practices Rule: rendering-content-visibility (6.2)
---
 .../(manage)/components/DocumentsTableShell.tsx       |  4 ++--
 surfsense_web/app/globals.css                         | 11 +++++++++++
 .../layout/ui/sidebar/AllPrivateChatsSidebar.tsx      |  2 +-
 .../layout/ui/sidebar/AllSharedChatsSidebar.tsx       |  2 +-
 .../components/layout/ui/sidebar/InboxSidebar.tsx     |  1 +
 5 files changed, 16 insertions(+), 4 deletions(-)

diff --git a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
index 92ced6e47..4e0c36267 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
@@ -630,7 +630,7 @@ export function DocumentsTableShell({
 									return (
 										<tr
 											key={doc.id}
-											className={`group border-b border-border/50 transition-colors ${
+											className={`list-item-lazy group border-b border-border/50 transition-colors ${
 												isMentioned ? "bg-primary/5 hover:bg-primary/8" : "hover:bg-muted/30"
 											} ${canInteract && hasChatMode ? "cursor-pointer" : ""}`}
 											onClick={handleRowClick}
@@ -871,7 +871,7 @@ export function DocumentsTableShell({
 						return (
 							<MobileCardWrapper key={doc.id} onLongPress={() => setMobileActionDoc(doc)}>
 								<div
-									className={`relative px-3 py-2 transition-colors ${
+									className={`list-item-lazy relative px-3 py-2 transition-colors ${
 										isMentioned ? "bg-primary/5" : "hover:bg-muted/20"
 									} ${canInteract && hasChatMode ? "cursor-pointer" : ""}`}
 								>
diff --git a/surfsense_web/app/globals.css b/surfsense_web/app/globals.css
index 087c5b676..a37ddb8f3 100644
--- a/surfsense_web/app/globals.css
+++ b/surfsense_web/app/globals.css
@@ -246,6 +246,17 @@ button {
 	}
 }
 
+/* content-visibility utilities — skip layout/paint for off-screen list items */
+.list-item-lazy {
+	content-visibility: auto;
+	contain-intrinsic-size: 0 48px;
+}
+
+.sidebar-item-lazy {
+	content-visibility: auto;
+	contain-intrinsic-size: 0 40px;
+}
+
 @source "../node_modules/@llamaindex/chat-ui/**/*.{ts,tsx}";
 @source "../node_modules/streamdown/dist/*.js";
 @source "../node_modules/@streamdown/code/dist/*.js";
diff --git a/surfsense_web/components/layout/ui/sidebar/AllPrivateChatsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/AllPrivateChatsSidebar.tsx
index 1bc773374..57c011f01 100644
--- a/surfsense_web/components/layout/ui/sidebar/AllPrivateChatsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/AllPrivateChatsSidebar.tsx
@@ -349,7 +349,7 @@ export function AllPrivateChatsSidebarContent({
 								<div
 									key={thread.id}
 									className={cn(
-										"group flex items-center gap-2 rounded-md px-2 py-1.5 text-sm",
+										"sidebar-item-lazy group flex items-center gap-2 rounded-md px-2 py-1.5 text-sm",
 										"hover:bg-accent hover:text-accent-foreground",
 										"transition-colors cursor-pointer",
 										isActive && "bg-accent text-accent-foreground",
diff --git a/surfsense_web/components/layout/ui/sidebar/AllSharedChatsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/AllSharedChatsSidebar.tsx
index b2ba86673..4a59df440 100644
--- a/surfsense_web/components/layout/ui/sidebar/AllSharedChatsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/AllSharedChatsSidebar.tsx
@@ -349,7 +349,7 @@ export function AllSharedChatsSidebarContent({
 								<div
 									key={thread.id}
 									className={cn(
-										"group flex items-center gap-2 rounded-md px-2 py-1.5 text-sm",
+										"sidebar-item-lazy group flex items-center gap-2 rounded-md px-2 py-1.5 text-sm",
 										"hover:bg-accent hover:text-accent-foreground",
 										"transition-colors cursor-pointer",
 										isActive && "bg-accent text-accent-foreground",
diff --git a/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
index 61eda2a88..72400a589 100644
--- a/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
@@ -919,6 +919,7 @@ export function InboxSidebarContent({
 										"transition-colors cursor-pointer",
 										isMarkingAsRead && "opacity-50 pointer-events-none"
 									)}
+									style={{ contentVisibility: "auto", containIntrinsicSize: "0 80px" }}
 								>
 									{isMobile ? (
 										<button

From 767c97682d4de5dde164c3eea35b4dd53760ff58 Mon Sep 17 00:00:00 2001
From: SohamBhattacharjee2003
 <125297948+SohamBhattacharjee2003@users.noreply.github.com>
Date: Thu, 2 Apr 2026 02:45:46 +0530
Subject: [PATCH 016/202] perf: replace useSearchParams() with
 window.location.search in effects

Components were calling useSearchParams() at the top level but only
reading the value inside useEffect or callbacks, never in JSX. This
subscribed the entire component tree to every URL query change.

Fix: read from window.location.search directly inside the effect so
no React subscription is created.

Changes:
- new-chat/page.tsx: read commentId inside effect + popstate listener
  for SPA back/forward support; removes subscription from 1500+ line tree
- dashboard/page.tsx: read window.location.search at redirect time;
  removes searchParams from dep array
- public-chat-footer.tsx: one-shot mount read for action=clone param
- TokenHandler.tsx: one-shot mount read for token + refresh_token params

Implements Vercel React Best Practices Rule: rerender-defer-reads (5.2)
---
 .../new-chat/[[...chat_id]]/page.tsx          | 36 ++++++++++++-------
 surfsense_web/app/dashboard/page.tsx          | 10 +++---
 surfsense_web/components/TokenHandler.tsx     | 15 ++++----
 .../public-chat/public-chat-footer.tsx        | 11 +++---
 4 files changed, 42 insertions(+), 30 deletions(-)

diff --git a/surfsense_web/app/dashboard/[search_space_id]/new-chat/[[...chat_id]]/page.tsx b/surfsense_web/app/dashboard/[search_space_id]/new-chat/[[...chat_id]]/page.tsx
index a594b740d..bc28ba6a0 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/new-chat/[[...chat_id]]/page.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/new-chat/[[...chat_id]]/page.tsx
@@ -8,7 +8,7 @@ import {
 } from "@assistant-ui/react";
 import { useQueryClient } from "@tanstack/react-query";
 import { useAtomValue, useSetAtom } from "jotai";
-import { useParams, useSearchParams } from "next/navigation";
+import { useParams } from "next/navigation";
 import { useCallback, useEffect, useMemo, useRef, useState } from "react";
 import { toast } from "sonner";
 import { z } from "zod";
@@ -388,22 +388,32 @@ export default function NewChatPage() {
 	}, [searchSpaceId, queryClient]);
 
 	// Handle scroll to comment from URL query params (e.g., from inbox item click)
-	const searchParams = useSearchParams();
-	const targetCommentIdParam = searchParams.get("commentId");
-
-	// Set target comment ID from URL param - the AssistantMessage and CommentItem
-	// components will handle scrolling and highlighting once comments are loaded
+	// Read from window.location.search inside the effect instead of subscribing via
+	// useSearchParams() — avoids re-rendering this heavy component tree on every
+	// unrelated query-string change. (Vercel Best Practice: rerender-defer-reads 5.2)
 	useEffect(() => {
-		if (targetCommentIdParam && !isInitializing) {
-			const commentId = Number.parseInt(targetCommentIdParam, 10);
-			if (!Number.isNaN(commentId)) {
-				setTargetCommentId(commentId);
+		const readAndApplyCommentId = () => {
+			const params = new URLSearchParams(window.location.search);
+			const raw = params.get("commentId");
+			if (raw && !isInitializing) {
+				const commentId = Number.parseInt(raw, 10);
+				if (!Number.isNaN(commentId)) {
+					setTargetCommentId(commentId);
+				}
 			}
-		}
+		};
+
+		readAndApplyCommentId();
+
+		// Also respond to browser back/forward navigations; popstate is not dispatched by history.pushState()/replaceState()
+		window.addEventListener("popstate", readAndApplyCommentId);
 
 		// Cleanup on unmount or when navigating away
-		return () => clearTargetCommentId();
-	}, [targetCommentIdParam, isInitializing, setTargetCommentId, clearTargetCommentId]);
+		return () => {
+			window.removeEventListener("popstate", readAndApplyCommentId);
+			clearTargetCommentId();
+		};
+	}, [isInitializing, setTargetCommentId, clearTargetCommentId]);
 
 	// Sync current thread state to atom
 	useEffect(() => {
diff --git a/surfsense_web/app/dashboard/page.tsx b/surfsense_web/app/dashboard/page.tsx
index 525060bed..09ace6542 100644
--- a/surfsense_web/app/dashboard/page.tsx
+++ b/surfsense_web/app/dashboard/page.tsx
@@ -3,7 +3,7 @@
 import { useAtomValue } from "jotai";
 import { AlertCircle, Plus, Search } from "lucide-react";
 import { motion } from "motion/react";
-import { useRouter, useSearchParams } from "next/navigation";
+import { useRouter } from "next/navigation";
 import { useTranslations } from "next-intl";
 import { useEffect, useState } from "react";
 import { searchSpacesAtom } from "@/atoms/search-spaces/search-space-query.atoms";
@@ -89,7 +89,6 @@ function EmptyState({ onCreateClick }: { onCreateClick: () => void }) {
 
 export default function DashboardPage() {
 	const router = useRouter();
-	const searchParams = useSearchParams();
 	const [showCreateDialog, setShowCreateDialog] = useState(false);
 
 	const t = useTranslations("dashboard");
@@ -99,11 +98,12 @@ export default function DashboardPage() {
 		if (isLoading) return;
 
 		if (searchSpaces.length > 0) {
-			const params = searchParams.toString();
-			const query = params ? `?${params}` : "";
+			// Read the query string at the time of redirect — no subscription needed.
+			// (Vercel Best Practice: rerender-defer-reads 5.2)
+			const query = window.location.search;
 			router.replace(`/dashboard/${searchSpaces[0].id}/new-chat${query}`);
 		}
-	}, [isLoading, searchSpaces, router, searchParams]);
+	}, [isLoading, searchSpaces, router]);
 
 	// Show loading while fetching or while we have spaces and are about to redirect
 	const shouldShowLoading = isLoading || searchSpaces.length > 0;
diff --git a/surfsense_web/components/TokenHandler.tsx b/surfsense_web/components/TokenHandler.tsx
index 230cda81a..02a7089d9 100644
--- a/surfsense_web/components/TokenHandler.tsx
+++ b/surfsense_web/components/TokenHandler.tsx
@@ -1,6 +1,5 @@
 "use client";
 
-import { useSearchParams } from "next/navigation";
 import { useEffect } from "react";
 import { useGlobalLoadingEffect } from "@/hooks/use-global-loading";
 import { getAndClearRedirectPath, setBearerToken, setRefreshToken } from "@/lib/auth-utils";
@@ -26,8 +25,6 @@ const TokenHandler = ({
 	tokenParamName = "token",
 	storageKey = "surfsense_bearer_token",
 }: TokenHandlerProps) => {
-	const searchParams = useSearchParams();
-
 	// Always show loading for this component - spinner animation won't reset
 	useGlobalLoadingEffect(true);
 
@@ -35,9 +32,13 @@ const TokenHandler = ({
 		// Only run on client-side
 		if (typeof window === "undefined") return;
 
-		// Get tokens from URL parameters
-		const token = searchParams.get(tokenParamName);
-		const refreshToken = searchParams.get("refresh_token");
+		// Read tokens from the URL when this effect runs — no subscription needed.
+		// TokenHandler is expected to render once after an auth redirect, so the query
+		// string should not change underneath it; useSearchParams() would only add a subscription.
+		// (Vercel Best Practice: rerender-defer-reads 5.2)
+		const params = new URLSearchParams(window.location.search);
+		const token = params.get(tokenParamName);
+		const refreshToken = params.get("refresh_token");
 
 		if (token) {
 			try {
@@ -74,7 +75,7 @@ const TokenHandler = ({
 				window.location.href = redirectPath;
 			}
 		}
-	}, [searchParams, tokenParamName, storageKey, redirectPath]);
+	}, [tokenParamName, storageKey, redirectPath]);
 
 	// Return null - the global provider handles the loading UI
 	return null;
diff --git a/surfsense_web/components/public-chat/public-chat-footer.tsx b/surfsense_web/components/public-chat/public-chat-footer.tsx
index 79b317ddf..e341a9a0c 100644
--- a/surfsense_web/components/public-chat/public-chat-footer.tsx
+++ b/surfsense_web/components/public-chat/public-chat-footer.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { Copy } from "lucide-react";
-import { useRouter, useSearchParams } from "next/navigation";
+import { useRouter } from "next/navigation";
 import { useCallback, useEffect, useRef, useState } from "react";
 import { toast } from "sonner";
 import { Button } from "@/components/ui/button";
@@ -15,7 +15,6 @@ interface PublicChatFooterProps {
 
 export function PublicChatFooter({ shareToken }: PublicChatFooterProps) {
 	const router = useRouter();
-	const searchParams = useSearchParams();
 	const [isCloning, setIsCloning] = useState(false);
 	const hasAutoCloned = useRef(false);
 
@@ -36,9 +35,11 @@ export function PublicChatFooter({ shareToken }: PublicChatFooterProps) {
 		}
 	}, [shareToken, router]);
 
-	// Auto-trigger clone if user just logged in with action=clone
+	// Auto-trigger clone if user just logged in with action=clone.
+	// Read from window.location.search on mount — no subscription needed since
+	// this is a one-time post-login check. (Vercel Best Practice: rerender-defer-reads 5.2)
 	useEffect(() => {
-		const action = searchParams.get("action");
+		const action = new URLSearchParams(window.location.search).get("action");
 		const token = getBearerToken();
 
 		// Only auto-clone once, if authenticated and action=clone is present
@@ -46,7 +47,7 @@ export function PublicChatFooter({ shareToken }: PublicChatFooterProps) {
 			hasAutoCloned.current = true;
 			triggerClone();
 		}
-	}, [searchParams, isCloning, triggerClone]);
+	}, [isCloning, triggerClone]);
 
 	const handleCopyAndContinue = async () => {
 		const token = getBearerToken();

From 6163503501944147321147506dec047806dcabbd Mon Sep 17 00:00:00 2001
From: Chisom Uma <chisomuma476@gmail.com>
Date: Wed, 1 Apr 2026 23:09:57 +0000
Subject: [PATCH 017/202] refactor: Converted disabledTools to Set for O(1)
 membership checks

---
 surfsense_web/components/assistant-ui/thread.tsx | 15 ++++++++-------
 1 file changed, 8 insertions(+), 7 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/thread.tsx b/surfsense_web/components/assistant-ui/thread.tsx
index 2cf0393da..0d0163d8a 100644
--- a/surfsense_web/components/assistant-ui/thread.tsx
+++ b/surfsense_web/components/assistant-ui/thread.tsx
@@ -834,6 +834,7 @@ const ComposerAction: FC<ComposerActionProps> = ({ isBlockedByOtherUser = false
 
 	const { data: agentTools } = useAtomValue(agentToolsAtom);
 	const disabledTools = useAtomValue(disabledToolsAtom);
+	const disabledToolsSet = useMemo(() => new Set(disabledTools), [disabledTools]);
 	const toggleTool = useSetAtom(toggleToolAtom);
 	const setDisabledTools = useSetAtom(disabledToolsAtom);
 	const hydrateDisabled = useSetAtom(hydrateDisabledToolsAtom);
@@ -846,18 +847,18 @@ const ComposerAction: FC<ComposerActionProps> = ({ isBlockedByOtherUser = false
 
 	const toggleToolGroup = useCallback(
 		(toolNames: string[]) => {
-			const allDisabled = toolNames.every((name) => disabledTools.includes(name));
+			const allDisabled = toolNames.every((name) => disabledToolsSet.has(name));
 			if (allDisabled) {
 				setDisabledTools((prev) => prev.filter((t) => !toolNames.includes(t)));
 			} else {
 				setDisabledTools((prev) => [...new Set([...prev, ...toolNames])]);
 			}
 		},
-		[disabledTools, setDisabledTools]
+		[disabledToolsSet, setDisabledTools]
 	);
 
 	const hasWebSearchTool = agentTools?.some((t) => t.name === "web_search") ?? false;
-	const isWebSearchEnabled = hasWebSearchTool && !disabledTools.includes("web_search");
+	const isWebSearchEnabled = hasWebSearchTool && !disabledToolsSet.has("web_search");
 	const filteredTools = useMemo(
 		() => agentTools?.filter((t) => t.name !== "web_search"),
 		[agentTools]
@@ -957,7 +958,7 @@ const ComposerAction: FC<ComposerActionProps> = ({ isBlockedByOtherUser = false
 													{group.label}
 												</div>
 												{group.tools.map((tool) => {
-													const isDisabled = disabledTools.includes(tool.name);
+													const isDisabled = disabledToolsSet.has(tool.name);
 													const ToolIcon = getToolIcon(tool.name);
 													return (
 														<div
@@ -989,7 +990,7 @@ const ComposerAction: FC<ComposerActionProps> = ({ isBlockedByOtherUser = false
 													const iconKey = group.connectorIcon ?? "";
 													const iconInfo = CONNECTOR_TOOL_ICON_PATHS[iconKey];
 													const toolNames = group.tools.map((t) => t.name);
-													const allDisabled = toolNames.every((n) => disabledTools.includes(n));
+													const allDisabled = toolNames.every((n) => disabledToolsSet.has(n));
 													return (
 														<div
 															key={group.label}
@@ -1078,7 +1079,7 @@ const ComposerAction: FC<ComposerActionProps> = ({ isBlockedByOtherUser = false
 												{group.label}
 											</div>
 											{group.tools.map((tool) => {
-												const isDisabled = disabledTools.includes(tool.name);
+												const isDisabled = disabledToolsSet.has(tool.name);
 												const ToolIcon = getToolIcon(tool.name);
 												const row = (
 													<div className="flex w-full items-center gap-2 sm:gap-3 px-2.5 sm:px-3 py-1 sm:py-1.5 hover:bg-muted-foreground/10 transition-colors">
@@ -1115,7 +1116,7 @@ const ComposerAction: FC<ComposerActionProps> = ({ isBlockedByOtherUser = false
 												const iconKey = group.connectorIcon ?? "";
 												const iconInfo = CONNECTOR_TOOL_ICON_PATHS[iconKey];
 												const toolNames = group.tools.map((t) => t.name);
-												const allDisabled = toolNames.every((n) => disabledTools.includes(n));
+												const allDisabled = toolNames.every((n) => disabledToolsSet.has(n));
 												const groupDef = TOOL_GROUPS.find((g) => g.label === group.label);
 												const row = (
 													<div className="flex w-full items-center gap-2 sm:gap-3 px-2.5 sm:px-3 py-1 sm:py-1.5 hover:bg-muted-foreground/10 transition-colors">

From 2df9708df9e5b3c9fafca48144a43b96ffe160b8 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 09:16:07 +0530
Subject: [PATCH 018/202] style: update alert components and empty state UI

---
 .../assistant-ui/connector-popup.tsx          |  6 ++--
 .../assistant-ui/document-upload-popup.tsx    |  6 ++--
 .../public-chat-snapshots-empty-state.tsx     |  7 ++---
 .../settings/image-model-manager.tsx          | 18 ++----------
 .../settings/model-config-manager.tsx         | 28 +++++--------------
 5 files changed, 18 insertions(+), 47 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/connector-popup.tsx b/surfsense_web/components/assistant-ui/connector-popup.tsx
index d1f6dd31f..b31b7cbd1 100644
--- a/surfsense_web/components/assistant-ui/connector-popup.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup.tsx
@@ -376,14 +376,14 @@ export const ConnectorIndicator = forwardRef<ConnectorIndicatorHandle, Connector
 									<div className="px-4 sm:px-12 py-4 sm:py-8 pb-12 sm:pb-16">
 										{/* LLM Configuration Warning */}
 										{!llmConfigLoading && !hasDocumentSummaryLLM && (
-											<Alert variant="destructive" className="mb-6">
+											<Alert variant="destructive" className="mb-6 bg-muted/50 rounded-xl border-destructive/30">
 												<AlertTriangle className="h-4 w-4" />
 												<AlertTitle>LLM Configuration Required</AlertTitle>
 												<AlertDescription className="mt-2">
 													<p className="mb-3">
 														{isAutoMode && !hasGlobalConfigs
-															? "Auto mode is selected but no global LLM configurations are available. Please configure a custom LLM in Settings to process and summarize documents from your connected sources."
-															: "You need to configure a Document Summary LLM before adding connectors. This LLM is used to process and summarize documents from your connected sources."}
+															? "Auto mode requires a global LLM configuration. Please add one in Settings"
+															: "A Document Summary LLM is required to process uploads, configure one in Settings"}
 													</p>
 													<Button
 														size="sm"
diff --git a/surfsense_web/components/assistant-ui/document-upload-popup.tsx b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
index c34890dff..06b0d38e7 100644
--- a/surfsense_web/components/assistant-ui/document-upload-popup.tsx
+++ b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
@@ -149,14 +149,14 @@ const DocumentUploadPopupContent: FC<{
 					{/* Content */}
 					<div className="px-4 sm:px-12 pb-4 sm:pb-16">
 						{!isLoading && !hasDocumentSummaryLLM ? (
-							<Alert variant="destructive" className="mb-4">
+							<Alert variant="destructive" className="mb-4 bg-muted/50 rounded-xl border-destructive/30">
 								<AlertTriangle className="h-4 w-4" />
 								<AlertTitle>LLM Configuration Required</AlertTitle>
 								<AlertDescription className="mt-2">
 									<p className="mb-3">
 										{isAutoMode && !hasGlobalConfigs
-											? "Auto mode is selected but no global LLM configurations are available. Please configure a custom LLM in Settings to process and summarize your uploaded documents."
-											: "You need to configure a Document Summary LLM before uploading files. This LLM is used to process and summarize your uploaded documents."}
+											? "Auto mode requires a global LLM configuration. Please add one in Settings"
+											: "A Document Summary LLM is required to process uploads, configure one in Settings"}
 									</p>
 									<Button
 										size="sm"
diff --git a/surfsense_web/components/public-chat-snapshots/public-chat-snapshots-empty-state.tsx b/surfsense_web/components/public-chat-snapshots/public-chat-snapshots-empty-state.tsx
index 4a4a57770..4e8ec5bb6 100644
--- a/surfsense_web/components/public-chat-snapshots/public-chat-snapshots-empty-state.tsx
+++ b/surfsense_web/components/public-chat-snapshots/public-chat-snapshots-empty-state.tsx
@@ -11,11 +11,8 @@ export function PublicChatSnapshotsEmptyState({
 }: PublicChatSnapshotsEmptyStateProps) {
 	return (
 		<div className="flex flex-col items-center justify-center py-12 text-center">
-			<div className="rounded-full bg-muted p-3 mb-4">
-				<Link2Off className="h-6 w-6 text-muted-foreground" />
-			</div>
-			<h3 className="text-sm font-medium text-foreground mb-1">{title}</h3>
-			<p className="text-xs text-muted-foreground max-w-sm">{description}</p>
+			<h3 className="text-sm md:text-base font-semibold mb-2">{title}</h3>
+			<p className="text-[11px] md:text-xs text-muted-foreground max-w-sm">{description}</p>
 		</div>
 	);
 }
diff --git a/surfsense_web/components/settings/image-model-manager.tsx b/surfsense_web/components/settings/image-model-manager.tsx
index 0c45af7d4..55128dc59 100644
--- a/surfsense_web/components/settings/image-model-manager.tsx
+++ b/surfsense_web/components/settings/image-model-manager.tsx
@@ -240,26 +240,14 @@ export function ImageModelManager({ searchSpaceId }: ImageModelManagerProps) {
 			{!isLoading && (
 				<div className="space-y-4 md:space-y-6">
 					{(userConfigs?.length ?? 0) === 0 ? (
-						<Card className="border-dashed border-2 border-muted-foreground/25">
+						<Card className="border-0 bg-transparent shadow-none">
 							<CardContent className="flex flex-col items-center justify-center py-10 md:py-16 text-center">
-								<div className="rounded-full bg-gradient-to-br from-teal-500/10 to-cyan-500/10 p-4 md:p-6 mb-4">
-									<Wand2 className="h-8 w-8 md:h-12 md:w-12 text-teal-600 dark:text-teal-400" />
-								</div>
-								<h3 className="text-lg font-semibold mb-2">No Image Models Yet</h3>
-								<p className="text-xs md:text-sm text-muted-foreground max-w-sm mb-4">
+								<h3 className="text-sm md:text-base font-semibold mb-2">No Image Models Yet</h3>
+								<p className="text-[11px] md:text-xs text-muted-foreground max-w-sm mb-4">
 									{canCreate
 										? "Add your own image generation model (DALL-E 3, GPT Image 1, etc.)"
 										: "No image models have been added to this space yet. Contact a space owner to add one."}
 								</p>
-								{canCreate && (
-									<Button
-										onClick={openNewDialog}
-										size="lg"
-										className="gap-2 text-xs md:text-sm h-9 md:h-10"
-									>
-										Add First Image Model
-									</Button>
-								)}
 							</CardContent>
 						</Card>
 					) : (
diff --git a/surfsense_web/components/settings/model-config-manager.tsx b/surfsense_web/components/settings/model-config-manager.tsx
index 50d2ab5b7..837060c70 100644
--- a/surfsense_web/components/settings/model-config-manager.tsx
+++ b/surfsense_web/components/settings/model-config-manager.tsx
@@ -250,28 +250,14 @@ export function ModelConfigManager({ searchSpaceId }: ModelConfigManagerProps) {
 				<div className="space-y-4">
 					{configs?.length === 0 ? (
 						<div>
-							<Card className="border-dashed border-2 border-muted-foreground/25">
+							<Card className="border-0 bg-transparent shadow-none">
 								<CardContent className="flex flex-col items-center justify-center py-10 md:py-16 text-center">
-									<div className="rounded-full bg-gradient-to-br from-violet-500/10 to-purple-500/10 p-4 md:p-6 mb-4 md:mb-6">
-										<Wand2 className="h-8 w-8 md:h-12 md:w-12 text-violet-600 dark:text-violet-400" />
-									</div>
-									<div className="space-y-2 mb-4 md:mb-6">
-										<h3 className="text-lg md:text-xl font-semibold">No Configurations Yet</h3>
-										<p className="text-xs md:text-sm text-muted-foreground max-w-sm">
-											{canCreate
-												? "Create your first AI configuration to customize how your agent responds"
-												: "No AI configurations have been added to this space yet. Contact a space owner to add one."}
-										</p>
-									</div>
-									{canCreate && (
-										<Button
-											onClick={openNewDialog}
-											size="lg"
-											className="gap-2 text-xs md:text-sm h-9 md:h-10"
-										>
-											Create First Configuration
-										</Button>
-									)}
+									<h3 className="text-sm md:text-base font-semibold mb-2">No LLM Models Yet</h3>
+									<p className="text-[11px] md:text-xs text-muted-foreground max-w-sm mb-4">
+										{canCreate
+											? "Add your first LLM model to power document summarization, chat, and other agent capabilities"
+											: "No LLM models have been added to this space yet. Contact a space owner to add one"}
+									</p>
 								</CardContent>
 							</Card>
 						</div>

From 407175ffae46a23d775bcba9c35fdfb465766ba0 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 09:26:16 +0530
Subject: [PATCH 019/202] style: replace loading indicators with Spinner
 component in alert dialogs

---
 .../layout/providers/LayoutDataProvider.tsx       | 15 +++++----------
 1 file changed, 5 insertions(+), 10 deletions(-)

diff --git a/surfsense_web/components/layout/providers/LayoutDataProvider.tsx b/surfsense_web/components/layout/providers/LayoutDataProvider.tsx
index fd6b45c52..6138b67fb 100644
--- a/surfsense_web/components/layout/providers/LayoutDataProvider.tsx
+++ b/surfsense_web/components/layout/providers/LayoutDataProvider.tsx
@@ -775,7 +775,8 @@ export function LayoutDataProvider({ searchSpaceId, children }: LayoutDataProvid
 					<AlertDialogHeader>
 						<AlertDialogTitle>{t("delete_chat")}</AlertDialogTitle>
 						<AlertDialogDescription>
-							{t("delete_chat_confirm")} <span className="font-medium">{chatToDelete?.name}</span>?{" "}
+							{t("delete_chat_confirm")}{" "}
+							<span className="font-medium break-all">{chatToDelete?.name}</span>?{" "}
 							{t("action_cannot_undone")}
 						</AlertDialogDescription>
 					</AlertDialogHeader>
@@ -835,9 +836,7 @@ export function LayoutDataProvider({ searchSpaceId, children }: LayoutDataProvid
 							<span className={isRenamingChat ? "opacity-0" : ""}>
 								{tSidebar("rename") || "Rename"}
 							</span>
-							{isRenamingChat && (
-								<span className="absolute h-4 w-4 animate-spin rounded-full border-2 border-current border-t-transparent" />
-							)}
+							{isRenamingChat && <Spinner size="sm" className="absolute" />}
 						</Button>
 					</DialogFooter>
 				</DialogContent>
@@ -865,9 +864,7 @@ export function LayoutDataProvider({ searchSpaceId, children }: LayoutDataProvid
 							className="relative bg-destructive text-destructive-foreground hover:bg-destructive/90"
 						>
 							<span className={isDeletingSearchSpace ? "opacity-0" : ""}>{tCommon("delete")}</span>
-							{isDeletingSearchSpace && (
-								<span className="absolute h-4 w-4 animate-spin rounded-full border-2 border-current border-t-transparent" />
-							)}
+							{isDeletingSearchSpace && <Spinner size="sm" className="absolute" />}
 						</AlertDialogAction>
 					</AlertDialogFooter>
 				</AlertDialogContent>
@@ -895,9 +892,7 @@ export function LayoutDataProvider({ searchSpaceId, children }: LayoutDataProvid
 							className="relative bg-destructive text-destructive-foreground hover:bg-destructive/90"
 						>
 							<span className={isLeavingSearchSpace ? "opacity-0" : ""}>{t("leave")}</span>
-							{isLeavingSearchSpace && (
-								<span className="absolute h-4 w-4 animate-spin rounded-full border-2 border-current border-t-transparent" />
-							)}
+							{isLeavingSearchSpace && <Spinner size="sm" className="absolute" />}
 						</AlertDialogAction>
 					</AlertDialogFooter>
 				</AlertDialogContent>

From d2cf3fb3b7eafce01c881e80049346239c84bc6f Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 09:58:14 +0530
Subject: [PATCH 020/202] refactor: update LLM role management logic and
 enhance UI feedback

---
 .../new-llm-config-mutation.atoms.ts          |   9 +-
 .../components/settings/llm-role-manager.tsx  | 165 +++++-------------
 2 files changed, 52 insertions(+), 122 deletions(-)

diff --git a/surfsense_web/atoms/new-llm-config/new-llm-config-mutation.atoms.ts b/surfsense_web/atoms/new-llm-config/new-llm-config-mutation.atoms.ts
index 861606f80..d6d3aa820 100644
--- a/surfsense_web/atoms/new-llm-config/new-llm-config-mutation.atoms.ts
+++ b/surfsense_web/atoms/new-llm-config/new-llm-config-mutation.atoms.ts
@@ -109,10 +109,11 @@ export const updateLLMPreferencesMutationAtom = atomWithMutation((get) => {
 		mutationFn: async (request: UpdateLLMPreferencesRequest) => {
 			return newLLMConfigApiService.updateLLMPreferences(request);
 		},
-		onSuccess: () => {
-			queryClient.invalidateQueries({
-				queryKey: cacheKeys.newLLMConfigs.preferences(Number(searchSpaceId)),
-			});
+		onSuccess: (_data, request: UpdateLLMPreferencesRequest) => {
+			queryClient.setQueryData(
+				cacheKeys.newLLMConfigs.preferences(Number(searchSpaceId)),
+				(old: Record<string, unknown> | undefined) => ({ ...old, ...request.data })
+			);
 		},
 		onError: (error: Error) => {
 			toast.error(error.message || "Failed to update LLM preferences");
diff --git a/surfsense_web/components/settings/llm-role-manager.tsx b/surfsense_web/components/settings/llm-role-manager.tsx
index 07ec492a3..22e17e431 100644
--- a/surfsense_web/components/settings/llm-role-manager.tsx
+++ b/surfsense_web/components/settings/llm-role-manager.tsx
@@ -4,16 +4,14 @@ import { useAtomValue } from "jotai";
 import {
 	AlertCircle,
 	Bot,
-	CheckCircle,
+	CircleCheck,
 	CircleDashed,
 	FileText,
 	ImageIcon,
 	RefreshCw,
-	RotateCcw,
-	Save,
 	Shuffle,
 } from "lucide-react";
-import { useEffect, useState } from "react";
+import { useCallback, useEffect, useRef, useState } from "react";
 import { toast } from "sonner";
 import {
 	globalImageGenConfigsAtom,
@@ -40,6 +38,7 @@ import {
 	SelectValue,
 } from "@/components/ui/select";
 import { Skeleton } from "@/components/ui/skeleton";
+import { Spinner } from "@/components/ui/spinner";
 import { getProviderIcon } from "@/lib/provider-icons";
 import { cn } from "@/lib/utils";
 
@@ -48,8 +47,8 @@ const ROLE_DESCRIPTIONS = {
 		icon: Bot,
 		title: "Agent LLM",
 		description: "Primary LLM for chat interactions and agent operations",
-		color: "text-blue-600 dark:text-blue-400",
-		bgColor: "bg-blue-500/10",
+		color: "text-muted-foreground",
+		bgColor: "bg-muted",
 		prefKey: "agent_llm_id" as const,
 		configType: "llm" as const,
 	},
@@ -57,8 +56,8 @@ const ROLE_DESCRIPTIONS = {
 		icon: FileText,
 		title: "Document Summary LLM",
 		description: "Handles document summarization and research synthesis",
-		color: "text-purple-600 dark:text-purple-400",
-		bgColor: "bg-purple-500/10",
+		color: "text-muted-foreground",
+		bgColor: "bg-muted",
 		prefKey: "document_summary_llm_id" as const,
 		configType: "llm" as const,
 	},
@@ -66,8 +65,8 @@ const ROLE_DESCRIPTIONS = {
 		icon: ImageIcon,
 		title: "Image Generation Model",
 		description: "Model used for AI image generation (DALL-E, GPT Image, etc.)",
-		color: "text-teal-600 dark:text-teal-400",
-		bgColor: "bg-teal-500/10",
+		color: "text-muted-foreground",
+		bgColor: "bg-muted",
 		prefKey: "image_generation_config_id" as const,
 		configType: "image" as const,
 	},
@@ -118,88 +117,41 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 		image_generation_config_id: preferences.image_generation_config_id ?? "",
 	}));
 
-	const [hasChanges, setHasChanges] = useState(false);
-	const [isSaving, setIsSaving] = useState(false);
+	const [savingRole, setSavingRole] = useState<string | null>(null);
+	const savingRef = useRef(false);
 
 	useEffect(() => {
-		const newAssignments = {
-			agent_llm_id: preferences.agent_llm_id ?? "",
-			document_summary_llm_id: preferences.document_summary_llm_id ?? "",
-			image_generation_config_id: preferences.image_generation_config_id ?? "",
-		};
-		setAssignments(newAssignments);
-		setHasChanges(false);
+		if (!savingRef.current) {
+			setAssignments({
+				agent_llm_id: preferences.agent_llm_id ?? "",
+				document_summary_llm_id: preferences.document_summary_llm_id ?? "",
+				image_generation_config_id: preferences.image_generation_config_id ?? "",
+			});
+		}
 	}, [
 		preferences?.agent_llm_id,
 		preferences?.document_summary_llm_id,
 		preferences?.image_generation_config_id,
 	]);
 
-	const handleRoleAssignment = (prefKey: string, configId: string) => {
-		const newAssignments = {
-			...assignments,
-			[prefKey]: configId === "unassigned" ? "" : parseInt(configId),
-		};
+	const handleRoleAssignment = useCallback(async (prefKey: string, configId: string) => {
+		const value = configId === "unassigned" ? "" : parseInt(configId);
 
-		setAssignments(newAssignments);
+		setAssignments((prev) => ({ ...prev, [prefKey]: value }));
+		setSavingRole(prefKey);
+		savingRef.current = true;
 
-		const currentPrefs = {
-			agent_llm_id: preferences.agent_llm_id ?? "",
-			document_summary_llm_id: preferences.document_summary_llm_id ?? "",
-			image_generation_config_id: preferences.image_generation_config_id ?? "",
-		};
-
-		const hasChangesNow = Object.keys(newAssignments).some(
-			(key) =>
-				newAssignments[key as keyof typeof newAssignments] !==
-				currentPrefs[key as keyof typeof currentPrefs]
-		);
-
-		setHasChanges(hasChangesNow);
-	};
-
-	const handleSave = async () => {
-		setIsSaving(true);
-
-		const toNumericOrUndefined = (val: string | number) =>
-			typeof val === "string" ? (val ? parseInt(val) : undefined) : val;
-
-		const numericAssignments = {
-			agent_llm_id: toNumericOrUndefined(assignments.agent_llm_id),
-			document_summary_llm_id: toNumericOrUndefined(assignments.document_summary_llm_id),
-			image_generation_config_id: toNumericOrUndefined(assignments.image_generation_config_id),
-		};
-
-		await updatePreferences({
-			search_space_id: searchSpaceId,
-			data: numericAssignments,
-		});
-
-		setHasChanges(false);
-		toast.success("Role assignments saved successfully!");
-
-		setIsSaving(false);
-	};
-
-	const handleReset = () => {
-		setAssignments({
-			agent_llm_id: preferences.agent_llm_id ?? "",
-			document_summary_llm_id: preferences.document_summary_llm_id ?? "",
-			image_generation_config_id: preferences.image_generation_config_id ?? "",
-		});
-		setHasChanges(false);
-	};
-
-	const isAssignmentComplete =
-		assignments.agent_llm_id !== "" &&
-		assignments.agent_llm_id !== null &&
-		assignments.agent_llm_id !== undefined &&
-		assignments.document_summary_llm_id !== "" &&
-		assignments.document_summary_llm_id !== null &&
-		assignments.document_summary_llm_id !== undefined &&
-		assignments.image_generation_config_id !== "" &&
-		assignments.image_generation_config_id !== null &&
-		assignments.image_generation_config_id !== undefined;
+		try {
+			await updatePreferences({
+				search_space_id: searchSpaceId,
+				data: { [prefKey]: value || undefined },
+			});
+			toast.success("Role assignment updated");
+		} finally {
+			setSavingRole(null);
+			savingRef.current = false;
+		}
+	}, [updatePreferences, searchSpaceId]);
 
 	// Combine global and custom LLM configs
 	const allLLMConfigs = [
@@ -213,6 +165,11 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 		...(userImageConfigs ?? []).filter((config) => config.id && config.id.toString().trim() !== ""),
 	];
 
+	const isAssignmentComplete =
+		allLLMConfigs.some((c) => c.id === assignments.agent_llm_id) &&
+		allLLMConfigs.some((c) => c.id === assignments.document_summary_llm_id) &&
+		allImageConfigs.some((c) => c.id === assignments.image_generation_config_id);
+
 	const isLoading =
 		configsLoading ||
 		preferencesLoading ||
@@ -244,9 +201,9 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 				{isAssignmentComplete && !isLoading && !hasError && (
 					<Badge
 						variant="outline"
-						className="text-xs gap-1.5 border-emerald-500/30 text-emerald-700 dark:text-emerald-300 bg-emerald-500/5"
+						className="text-xs gap-1.5 text-muted-foreground"
 					>
-						<CheckCircle className="h-3 w-3" />
+						<CircleCheck className="h-3 w-3" />
 						All roles assigned
 					</Badge>
 				)}
@@ -332,10 +289,7 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 						const roleAllConfigs = isImageRole ? allImageConfigs : allLLMConfigs;
 
 						const assignedConfig = roleAllConfigs.find((config) => config.id === currentAssignment);
-						const isAssigned =
-							currentAssignment !== "" &&
-							currentAssignment !== null &&
-							currentAssignment !== undefined;
+						const isAssigned = !!assignedConfig;
 						const isAutoMode =
 							assignedConfig && "is_auto_mode" in assignedConfig && assignedConfig.is_auto_mode;
 
@@ -361,8 +315,10 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 													</p>
 												</div>
 											</div>
-											{isAssigned ? (
-												<CheckCircle className="w-4 h-4 text-emerald-500 shrink-0 mt-0.5" />
+											{savingRole === role.prefKey ? (
+												<Spinner size="sm" className="shrink-0 mt-0.5 text-muted-foreground" />
+											) : isAssigned ? (
+												<CircleCheck className="w-4 h-4 text-muted-foreground/40 shrink-0 mt-0.5" />
 											) : (
 												<CircleDashed className="w-4 h-4 text-muted-foreground/40 shrink-0 mt-0.5" />
 											)}
@@ -374,7 +330,7 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 												Configuration
 											</Label>
 											<Select
-												value={currentAssignment?.toString() || "unassigned"}
+												value={isAssigned ? currentAssignment.toString() : "unassigned"}
 												onValueChange={(value) => handleRoleAssignment(role.prefKey, value)}
 											>
 												<SelectTrigger className="w-full h-9 md:h-10 text-xs md:text-sm">
@@ -534,33 +490,6 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 				</div>
 			)}
 
-			{/* Save / Reset Bar */}
-			{hasChanges && (
-				<div className="flex items-center justify-between gap-3 rounded-lg border border-border bg-muted/50 p-3 md:p-4">
-					<p className="text-xs md:text-sm text-muted-foreground">You have unsaved changes</p>
-					<div className="flex items-center gap-2">
-						<Button
-							variant="outline"
-							size="sm"
-							onClick={handleReset}
-							disabled={isSaving}
-							className="h-8 text-xs gap-1.5"
-						>
-							<RotateCcw className="w-3 h-3" />
-							Reset
-						</Button>
-						<Button
-							size="sm"
-							onClick={handleSave}
-							disabled={isSaving}
-							className="h-8 text-xs gap-1.5"
-						>
-							<Save className="w-3 h-3" />
-							{isSaving ? "Saving…" : "Save Changes"}
-						</Button>
-					</div>
-				</div>
-			)}
 		</div>
 	);
 }

From 000c2d9b5b670804c0c3cf09294a5af12322e7d6 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 10:11:35 +0530
Subject: [PATCH 021/202] style: simplify LLM model terminology in UI

---
 docs/chinese-llm-setup.md                              |  2 +-
 .../alembic/versions/51_add_new_llm_config_table.py    |  6 +++---
 .../app/config/global_llm_config.example.yaml          |  2 +-
 surfsense_backend/app/indexing_pipeline/exceptions.py  |  4 ++--
 surfsense_backend/app/routes/__init__.py               |  2 +-
 surfsense_backend/app/routes/model_list_routes.py      |  4 ++--
 surfsense_backend/app/routes/new_llm_config_routes.py  |  2 +-
 surfsense_backend/app/schemas/new_llm_config.py        | 10 +++++-----
 surfsense_backend/app/services/model_list_service.py   |  2 +-
 .../new-llm-config/new-llm-config-mutation.atoms.ts    |  2 +-
 .../atoms/new-llm-config/new-llm-config-query.atoms.ts |  2 +-
 surfsense_web/components/new-chat/model-selector.tsx   |  2 +-
 .../components/settings/model-config-manager.tsx       | 10 +++++-----
 surfsense_web/content/docs/testing.mdx                 |  2 +-
 surfsense_web/contracts/enums/llm-models.ts            |  2 +-
 surfsense_web/contracts/types/new-llm-config.types.ts  |  6 +++---
 surfsense_web/lib/apis/new-llm-config-api.service.ts   |  2 +-
 surfsense_web/messages/en.json                         |  2 +-
 18 files changed, 32 insertions(+), 32 deletions(-)

diff --git a/docs/chinese-llm-setup.md b/docs/chinese-llm-setup.md
index 1fb0ce2a1..6638dbba1 100644
--- a/docs/chinese-llm-setup.md
+++ b/docs/chinese-llm-setup.md
@@ -24,7 +24,7 @@ SurfSense 现已支持以下国产 LLM：
 
 1. 登录 SurfSense Dashboard
 2. 进入 **Settings** → **API Keys** (或 **LLM Configurations**)
-3. 点击 **Add LLM Model**
+3. 点击 **Add Model**
 4. 从 **Provider** 下拉菜单中选择你的国产 LLM 提供商
 5. 填写必填字段（见下方各提供商详细配置）
 6. 点击 **Save**
diff --git a/surfsense_backend/alembic/versions/51_add_new_llm_config_table.py b/surfsense_backend/alembic/versions/51_add_new_llm_config_table.py
index 89a5c1246..7d90f4b13 100644
--- a/surfsense_backend/alembic/versions/51_add_new_llm_config_table.py
+++ b/surfsense_backend/alembic/versions/51_add_new_llm_config_table.py
@@ -17,10 +17,10 @@ depends_on: str | Sequence[str] | None = None
 
 def upgrade() -> None:
     """
-    Add the new_llm_configs table that combines LLM model settings with prompt configuration.
+    Add the new_llm_configs table that combines model settings with prompt configuration.
 
     This table includes:
-    - LLM model configuration (provider, model_name, api_key, etc.)
+    - Model configuration (provider, model_name, api_key, etc.)
     - Configurable system instructions
     - Citation toggle
     """
@@ -41,7 +41,7 @@ def upgrade() -> None:
                     name VARCHAR(100) NOT NULL,
                     description VARCHAR(500),
                     
-                    -- LLM Model Configuration (same as llm_configs, excluding language)
+                    -- Model Configuration (same as llm_configs, excluding language)
                     provider litellmprovider NOT NULL,
                     custom_provider VARCHAR(100),
                     model_name VARCHAR(100) NOT NULL,
diff --git a/surfsense_backend/app/config/global_llm_config.example.yaml b/surfsense_backend/app/config/global_llm_config.example.yaml
index 6ca3e95e3..49a8d0295 100644
--- a/surfsense_backend/app/config/global_llm_config.example.yaml
+++ b/surfsense_backend/app/config/global_llm_config.example.yaml
@@ -17,7 +17,7 @@
 # - Configure router_settings below to customize the load balancing behavior
 #
 # Structure matches NewLLMConfig:
-# - LLM model configuration (provider, model_name, api_key, etc.)
+# - Model configuration (provider, model_name, api_key, etc.)
 # - Prompt configuration (system_instructions, citations_enabled)
 
 # Router Settings for Auto Mode
diff --git a/surfsense_backend/app/indexing_pipeline/exceptions.py b/surfsense_backend/app/indexing_pipeline/exceptions.py
index 9155e9baa..666fa4b9f 100644
--- a/surfsense_backend/app/indexing_pipeline/exceptions.py
+++ b/surfsense_backend/app/indexing_pipeline/exceptions.py
@@ -59,7 +59,7 @@ class PipelineMessages:
 
     LLM_AUTH = "LLM authentication failed. Check your API key."
     LLM_PERMISSION = "LLM request denied. Check your account permissions."
-    LLM_NOT_FOUND = "LLM model not found. Check your model configuration."
+    LLM_NOT_FOUND = "Model not found. Check your model configuration."
     LLM_BAD_REQUEST = "LLM rejected the request. Document content may be invalid."
     LLM_UNPROCESSABLE = (
         "Document exceeds the LLM context window even after optimization."
@@ -67,7 +67,7 @@ class PipelineMessages:
     LLM_RESPONSE = "LLM returned an invalid response."
     LLM_AUTH = "LLM authentication failed. Check your API key."
     LLM_PERMISSION = "LLM request denied. Check your account permissions."
-    LLM_NOT_FOUND = "LLM model not found. Check your model configuration."
+    LLM_NOT_FOUND = "Model not found. Check your model configuration."
     LLM_BAD_REQUEST = "LLM rejected the request. Document content may be invalid."
     LLM_UNPROCESSABLE = (
         "Document exceeds the LLM context window even after optimization."
diff --git a/surfsense_backend/app/routes/__init__.py b/surfsense_backend/app/routes/__init__.py
index 1937f11cb..efa0ff2f6 100644
--- a/surfsense_backend/app/routes/__init__.py
+++ b/surfsense_backend/app/routes/__init__.py
@@ -84,7 +84,7 @@ router.include_router(confluence_add_connector_router)
 router.include_router(clickup_add_connector_router)
 router.include_router(dropbox_add_connector_router)
 router.include_router(new_llm_config_router)  # LLM configs with prompt configuration
-router.include_router(model_list_router)  # Dynamic LLM model catalogue from OpenRouter
+router.include_router(model_list_router)  # Dynamic model catalogue from OpenRouter
 router.include_router(logs_router)
 router.include_router(circleback_webhook_router)  # Circleback meeting webhooks
 router.include_router(surfsense_docs_router)  # Surfsense documentation for citations
diff --git a/surfsense_backend/app/routes/model_list_routes.py b/surfsense_backend/app/routes/model_list_routes.py
index ef6e30514..79ae7221f 100644
--- a/surfsense_backend/app/routes/model_list_routes.py
+++ b/surfsense_backend/app/routes/model_list_routes.py
@@ -1,5 +1,5 @@
 """
-API route for fetching the available LLM models catalogue.
+API route for fetching the available models catalogue.
 
 Serves a dynamically-updated list sourced from the OpenRouter public API,
 with a local JSON fallback when the API is unreachable.
@@ -30,7 +30,7 @@ async def list_available_models(
     user: User = Depends(current_active_user),
 ):
     """
-    Return all available LLM models grouped by provider.
+    Return all available models grouped by provider.
 
     The list is sourced from the OpenRouter public API and cached for 1 hour.
     If the API is unreachable, a local fallback file is used instead.
diff --git a/surfsense_backend/app/routes/new_llm_config_routes.py b/surfsense_backend/app/routes/new_llm_config_routes.py
index f784bd273..78907c719 100644
--- a/surfsense_backend/app/routes/new_llm_config_routes.py
+++ b/surfsense_backend/app/routes/new_llm_config_routes.py
@@ -1,7 +1,7 @@
 """
 API routes for NewLLMConfig CRUD operations.
 
-NewLLMConfig combines LLM model settings with prompt configuration:
+NewLLMConfig combines model settings with prompt configuration:
 - LLM provider, model, API key, etc.
 - Configurable system instructions
 - Citation toggle
diff --git a/surfsense_backend/app/schemas/new_llm_config.py b/surfsense_backend/app/schemas/new_llm_config.py
index 9863665b6..15ed4ce67 100644
--- a/surfsense_backend/app/schemas/new_llm_config.py
+++ b/surfsense_backend/app/schemas/new_llm_config.py
@@ -1,7 +1,7 @@
 """
 Pydantic schemas for the NewLLMConfig API.
 
-NewLLMConfig combines LLM model settings with prompt configuration:
+NewLLMConfig combines model settings with prompt configuration:
 - LLM provider, model, API key, etc.
 - Configurable system instructions
 - Citation toggle
@@ -26,7 +26,7 @@ class NewLLMConfigBase(BaseModel):
         None, max_length=500, description="Optional description"
     )
 
-    # LLM Model Configuration
+    # Model Configuration
     provider: LiteLLMProvider = Field(..., description="LiteLLM provider type")
     custom_provider: str | None = Field(
         None, max_length=100, description="Custom provider name when provider is CUSTOM"
@@ -71,7 +71,7 @@ class NewLLMConfigUpdate(BaseModel):
     name: str | None = Field(None, max_length=100)
     description: str | None = Field(None, max_length=500)
 
-    # LLM Model Configuration
+    # Model Configuration
     provider: LiteLLMProvider | None = None
     custom_provider: str | None = Field(None, max_length=100)
     model_name: str | None = Field(None, max_length=100)
@@ -106,7 +106,7 @@ class NewLLMConfigPublic(BaseModel):
     name: str
     description: str | None = None
 
-    # LLM Model Configuration (no api_key)
+    # Model Configuration (no api_key)
     provider: LiteLLMProvider
     custom_provider: str | None = None
     model_name: str
@@ -149,7 +149,7 @@ class GlobalNewLLMConfigRead(BaseModel):
     name: str
     description: str | None = None
 
-    # LLM Model Configuration (no api_key)
+    # Model Configuration (no api_key)
     provider: str  # String because YAML doesn't enforce enum, "AUTO" for Auto mode
     custom_provider: str | None = None
     model_name: str
diff --git a/surfsense_backend/app/services/model_list_service.py b/surfsense_backend/app/services/model_list_service.py
index ebc0e0d7c..2a81c2d52 100644
--- a/surfsense_backend/app/services/model_list_service.py
+++ b/surfsense_backend/app/services/model_list_service.py
@@ -1,5 +1,5 @@
 """
-Service for fetching and caching the available LLM model list.
+Service for fetching and caching the available model list.
 
 Uses the OpenRouter public API as the primary source, with a local
 fallback JSON file when the API is unreachable.
diff --git a/surfsense_web/atoms/new-llm-config/new-llm-config-mutation.atoms.ts b/surfsense_web/atoms/new-llm-config/new-llm-config-mutation.atoms.ts
index d6d3aa820..2a048ca3e 100644
--- a/surfsense_web/atoms/new-llm-config/new-llm-config-mutation.atoms.ts
+++ b/surfsense_web/atoms/new-llm-config/new-llm-config-mutation.atoms.ts
@@ -34,7 +34,7 @@ export const createNewLLMConfigMutationAtom = atomWithMutation((get) => {
 			});
 		},
 		onError: (error: Error) => {
-			toast.error(error.message || "Failed to create LLM model");
+			toast.error(error.message || "Failed to create model");
 		},
 	};
 });
diff --git a/surfsense_web/atoms/new-llm-config/new-llm-config-query.atoms.ts b/surfsense_web/atoms/new-llm-config/new-llm-config-query.atoms.ts
index e4c8bcffc..32250d394 100644
--- a/surfsense_web/atoms/new-llm-config/new-llm-config-query.atoms.ts
+++ b/surfsense_web/atoms/new-llm-config/new-llm-config-query.atoms.ts
@@ -66,7 +66,7 @@ export const defaultSystemInstructionsAtom = atomWithQuery(() => {
 });
 
 /**
- * Query atom for the dynamic LLM model catalogue.
+ * Query atom for the dynamic model catalogue.
  * Fetched from the backend (which proxies OpenRouter's public API).
  * Falls back to the static hardcoded list on error.
  */
diff --git a/surfsense_web/components/new-chat/model-selector.tsx b/surfsense_web/components/new-chat/model-selector.tsx
index 7a2a471ba..b207d82b4 100644
--- a/surfsense_web/components/new-chat/model-selector.tsx
+++ b/surfsense_web/components/new-chat/model-selector.tsx
@@ -498,7 +498,7 @@ export function ModelSelector({
 										}}
 									>
 										<Plus className="size-4 text-primary" />
-										<span className="text-sm font-medium">Add LLM Model</span>
+										<span className="text-sm font-medium">Add Model</span>
 									</Button>
 								</div>
 							</CommandList>
diff --git a/surfsense_web/components/settings/model-config-manager.tsx b/surfsense_web/components/settings/model-config-manager.tsx
index 837060c70..79504451a 100644
--- a/surfsense_web/components/settings/model-config-manager.tsx
+++ b/surfsense_web/components/settings/model-config-manager.tsx
@@ -150,7 +150,7 @@ export function ModelConfigManager({ searchSpaceId }: ModelConfigManagerProps) {
 						onClick={openNewDialog}
 						className="gap-2 bg-white text-black hover:bg-neutral-100 dark:bg-white dark:text-black dark:hover:bg-neutral-200"
 					>
-						Add LLM Model
+						Add Model
 					</Button>
 				)}
 			</div>
@@ -252,11 +252,11 @@ export function ModelConfigManager({ searchSpaceId }: ModelConfigManagerProps) {
 						<div>
 							<Card className="border-0 bg-transparent shadow-none">
 								<CardContent className="flex flex-col items-center justify-center py-10 md:py-16 text-center">
-									<h3 className="text-sm md:text-base font-semibold mb-2">No LLM Models Yet</h3>
+									<h3 className="text-sm md:text-base font-semibold mb-2">No Models Yet</h3>
 									<p className="text-[11px] md:text-xs text-muted-foreground max-w-sm mb-4">
 										{canCreate
-											? "Add your first LLM model to power document summarization, chat, and other agent capabilities"
-											: "No LLM models have been added to this space yet. Contact a space owner to add one"}
+											? "Add your first model to power document summarization, chat, and other agent capabilities"
+											: "No models have been added to this space yet. Contact a space owner to add one"}
 									</p>
 								</CardContent>
 							</Card>
@@ -420,7 +420,7 @@ export function ModelConfigManager({ searchSpaceId }: ModelConfigManagerProps) {
 			>
 				<AlertDialogContent className="select-none">
 					<AlertDialogHeader>
-						<AlertDialogTitle>Delete LLM Model</AlertDialogTitle>
+						<AlertDialogTitle>Delete Model</AlertDialogTitle>
 						<AlertDialogDescription>
 							Are you sure you want to delete{" "}
 							<span className="font-semibold text-foreground">{configToDelete?.name}</span>? This
diff --git a/surfsense_web/content/docs/testing.mdx b/surfsense_web/content/docs/testing.mdx
index 9c4682b90..c6739de10 100644
--- a/surfsense_web/content/docs/testing.mdx
+++ b/surfsense_web/content/docs/testing.mdx
@@ -10,7 +10,7 @@ SurfSense uses [pytest](https://docs.pytest.org/) with two test layers: **unit**
 
 - **PostgreSQL + pgvector** running locally (database `surfsense_test` will be used)
 - **`REGISTRATION_ENABLED=TRUE`** in your `.env` (this is the default)
-- A working LLM model with a valid API key in `global_llm_config.yaml` (for integration tests)
+- A working model with a valid API key in `global_llm_config.yaml` (for integration tests)
 
 No Redis or Celery is required — integration tests use an inline task dispatcher.
 
diff --git a/surfsense_web/contracts/enums/llm-models.ts b/surfsense_web/contracts/enums/llm-models.ts
index 31097ca6e..74cc056f3 100644
--- a/surfsense_web/contracts/enums/llm-models.ts
+++ b/surfsense_web/contracts/enums/llm-models.ts
@@ -5,7 +5,7 @@ export interface LLMModel {
 	contextWindow?: string;
 }
 
-// Comprehensive LLM models database organized by provider
+// Comprehensive models database organized by provider
 export const LLM_MODELS: LLMModel[] = [
 	// OpenAI
 	{
diff --git a/surfsense_web/contracts/types/new-llm-config.types.ts b/surfsense_web/contracts/types/new-llm-config.types.ts
index 3bb43680a..4422857ab 100644
--- a/surfsense_web/contracts/types/new-llm-config.types.ts
+++ b/surfsense_web/contracts/types/new-llm-config.types.ts
@@ -41,14 +41,14 @@ export const liteLLMProviderEnum = z.enum([
 export type LiteLLMProvider = z.infer<typeof liteLLMProviderEnum>;
 
 /**
- * NewLLMConfig - combines LLM model settings with prompt configuration
+ * NewLLMConfig - combines model settings with prompt configuration
  */
 export const newLLMConfig = z.object({
 	id: z.number(),
 	name: z.string().max(100),
 	description: z.string().max(500).nullable().optional(),
 
-	// LLM Model Configuration
+	// Model Configuration
 	provider: liteLLMProviderEnum,
 	custom_provider: z.string().max(100).nullable().optional(),
 	model_name: z.string().max(100),
@@ -148,7 +148,7 @@ export const globalNewLLMConfig = z.object({
 	name: z.string(),
 	description: z.string().nullable().optional(),
 
-	// LLM Model Configuration (no api_key)
+	// Model Configuration (no api_key)
 	provider: z.string(), // String because YAML doesn't enforce enum, "AUTO" for Auto mode
 	custom_provider: z.string().nullable().optional(),
 	model_name: z.string(),
diff --git a/surfsense_web/lib/apis/new-llm-config-api.service.ts b/surfsense_web/lib/apis/new-llm-config-api.service.ts
index 71af1a8d9..a1040a9bc 100644
--- a/surfsense_web/lib/apis/new-llm-config-api.service.ts
+++ b/surfsense_web/lib/apis/new-llm-config-api.service.ts
@@ -147,7 +147,7 @@ class NewLLMConfigApiService {
 	};
 
 	/**
-	 * Get the dynamic LLM model catalogue (sourced from OpenRouter API)
+	 * Get the dynamic model catalogue (sourced from OpenRouter API)
 	 */
 	getModels = async () => {
 		return baseApiService.get(`/api/v1/models`, getModelListResponse);
diff --git a/surfsense_web/messages/en.json b/surfsense_web/messages/en.json
index 53f80ea5f..4310bc707 100644
--- a/surfsense_web/messages/en.json
+++ b/surfsense_web/messages/en.json
@@ -737,7 +737,7 @@
 		"nav_general": "General",
 		"nav_general_desc": "Name, description & basic info",
 		"nav_agent_configs": "Agent Configs",
-		"nav_agent_configs_desc": "LLM models with prompts & citations",
+		"nav_agent_configs_desc": "Models with prompts & citations",
 		"nav_role_assignments": "Role Assignments",
 		"nav_role_assignments_desc": "Assign configs to agent roles",
 		"nav_image_models": "Image Models",

From c9ae4fcaca3ce8178c26485ef6290010e0327c62 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 10:12:34 +0530
Subject: [PATCH 022/202] style: update badge component in LLM role manager for
 improved visual consistency

---
 surfsense_web/components/settings/llm-role-manager.tsx | 8 +-------
 1 file changed, 1 insertion(+), 7 deletions(-)

diff --git a/surfsense_web/components/settings/llm-role-manager.tsx b/surfsense_web/components/settings/llm-role-manager.tsx
index 22e17e431..d1651b7f0 100644
--- a/surfsense_web/components/settings/llm-role-manager.tsx
+++ b/surfsense_web/components/settings/llm-role-manager.tsx
@@ -360,13 +360,7 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 																	>
 																		<div className="flex items-center gap-1 md:gap-1.5 flex-wrap min-w-0">
 																			{isAuto ? (
-																				<Badge
-																					variant="outline"
-																					className="text-[9px] md:text-[10px] shrink-0 bg-violet-100 text-violet-700 dark:bg-violet-900/30 dark:text-violet-300 border-violet-200 dark:border-violet-700"
-																				>
-																					<Shuffle className="size-2 md:size-2.5 mr-0.5" />
-																					AUTO
-																				</Badge>
+																				<Shuffle className="size-3 md:size-3.5 shrink-0 text-muted-foreground" />
 																			) : (
 																				getProviderIcon(config.provider, {
 																					className: "size-3 md:size-3.5 shrink-0",

From 3b92e99d28087554bd23b6b9b95ccb8b32433a0c Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 10:35:32 +0530
Subject: [PATCH 023/202] feat: add local folder connector and document
 versioning functionality

---
 ...d_local_folder_connector_and_versioning.py | 135 ++++++++++++
 surfsense_backend/app/db.py                   |  22 ++
 .../app/routes/documents_routes.py            | 123 +++++++++++
 .../routes/search_source_connectors_routes.py | 195 ++++++++++++++++--
 4 files changed, 459 insertions(+), 16 deletions(-)
 create mode 100644 surfsense_backend/alembic/versions/117_add_local_folder_connector_and_versioning.py

diff --git a/surfsense_backend/alembic/versions/117_add_local_folder_connector_and_versioning.py b/surfsense_backend/alembic/versions/117_add_local_folder_connector_and_versioning.py
new file mode 100644
index 000000000..e97a4787c
--- /dev/null
+++ b/surfsense_backend/alembic/versions/117_add_local_folder_connector_and_versioning.py
@@ -0,0 +1,135 @@
+"""Add local folder connector enums and document_versions table
+
+Revision ID: 117
+Revises: 116
+"""
+
+from collections.abc import Sequence
+
+import sqlalchemy as sa
+
+from alembic import op
+
+revision: str = "117"
+down_revision: str | None = "116"
+branch_labels: str | Sequence[str] | None = None
+depends_on: str | Sequence[str] | None = None
+
+PUBLICATION_NAME = "zero_publication"
+
+
+def upgrade() -> None:
+    conn = op.get_bind()
+
+    # Add LOCAL_FOLDER_CONNECTOR to searchsourceconnectortype enum
+    op.execute(
+        """
+    DO $$
+    BEGIN
+        IF NOT EXISTS (
+            SELECT 1 FROM pg_type t
+            JOIN pg_enum e ON t.oid = e.enumtypid
+            WHERE t.typname = 'searchsourceconnectortype' AND e.enumlabel = 'LOCAL_FOLDER_CONNECTOR'
+        ) THEN
+            ALTER TYPE searchsourceconnectortype ADD VALUE 'LOCAL_FOLDER_CONNECTOR';
+        END IF;
+    END
+    $$;
+    """
+    )
+
+    # Add LOCAL_FOLDER_FILE to documenttype enum
+    op.execute(
+        """
+    DO $$
+    BEGIN
+        IF NOT EXISTS (
+            SELECT 1 FROM pg_type t
+            JOIN pg_enum e ON t.oid = e.enumtypid
+            WHERE t.typname = 'documenttype' AND e.enumlabel = 'LOCAL_FOLDER_FILE'
+        ) THEN
+            ALTER TYPE documenttype ADD VALUE 'LOCAL_FOLDER_FILE';
+        END IF;
+    END
+    $$;
+    """
+    )
+
+    # Create document_versions table
+    table_exists = conn.execute(
+        sa.text(
+            "SELECT 1 FROM information_schema.tables WHERE table_name = 'document_versions'"
+        )
+    ).fetchone()
+    if not table_exists:
+        op.create_table(
+            "document_versions",
+            sa.Column("id", sa.Integer(), nullable=False, autoincrement=True),
+            sa.Column("document_id", sa.Integer(), nullable=False),
+            sa.Column("version_number", sa.Integer(), nullable=False),
+            sa.Column("source_markdown", sa.Text(), nullable=True),
+            sa.Column("content_hash", sa.String(), nullable=False),
+            sa.Column("title", sa.String(), nullable=True),
+            sa.Column(
+                "created_at",
+                sa.TIMESTAMP(timezone=True),
+                server_default=sa.text("now()"),
+                nullable=False,
+            ),
+            sa.ForeignKeyConstraint(
+                ["document_id"],
+                ["documents.id"],
+                ondelete="CASCADE",
+            ),
+            sa.PrimaryKeyConstraint("id"),
+            sa.UniqueConstraint(
+                "document_id",
+                "version_number",
+                name="uq_document_version",
+            ),
+        )
+
+    op.execute(
+        "CREATE INDEX IF NOT EXISTS ix_document_versions_document_id "
+        "ON document_versions (document_id)"
+    )
+    op.execute(
+        "CREATE INDEX IF NOT EXISTS ix_document_versions_created_at "
+        "ON document_versions (created_at)"
+    )
+
+    # Add document_versions to Zero publication
+    pub_exists = conn.execute(
+        sa.text("SELECT 1 FROM pg_publication WHERE pubname = :name"),
+        {"name": PUBLICATION_NAME},
+    ).fetchone()
+    if pub_exists:
+        already_in_pub = conn.execute(
+            sa.text(
+                "SELECT 1 FROM pg_publication_tables "
+                "WHERE pubname = :name AND tablename = 'document_versions'"
+            ),
+            {"name": PUBLICATION_NAME},
+        ).fetchone()
+        if not already_in_pub:
+            op.execute(
+                f"ALTER PUBLICATION {PUBLICATION_NAME} ADD TABLE document_versions"
+            )
+
+
+def downgrade() -> None:
+    """Drop document_versions and its publication entry; enum values stay."""
+    conn = op.get_bind()
+    # ALTER PUBLICATION ... DROP TABLE accepts no IF EXISTS; check membership.
+    in_publication = conn.execute(
+        sa.text(
+            "SELECT 1 FROM pg_publication_tables "
+            "WHERE pubname = :name AND tablename = 'document_versions'"
+        ),
+        {"name": PUBLICATION_NAME},
+    ).fetchone()
+    if in_publication:
+        op.execute(f"ALTER PUBLICATION {PUBLICATION_NAME} DROP TABLE document_versions")
+    op.execute("DROP INDEX IF EXISTS ix_document_versions_created_at")
+    op.execute("DROP INDEX IF EXISTS ix_document_versions_document_id")
+    op.execute("DROP TABLE IF EXISTS document_versions")
diff --git a/surfsense_backend/app/db.py b/surfsense_backend/app/db.py
index 90630cc83..25045e84a 100644
--- a/surfsense_backend/app/db.py
+++ b/surfsense_backend/app/db.py
@@ -64,6 +64,7 @@ class DocumentType(StrEnum):
     COMPOSIO_GOOGLE_DRIVE_CONNECTOR = "COMPOSIO_GOOGLE_DRIVE_CONNECTOR"
     COMPOSIO_GMAIL_CONNECTOR = "COMPOSIO_GMAIL_CONNECTOR"
     COMPOSIO_GOOGLE_CALENDAR_CONNECTOR = "COMPOSIO_GOOGLE_CALENDAR_CONNECTOR"
+    LOCAL_FOLDER_FILE = "LOCAL_FOLDER_FILE"
 
 
 # Native Google document types → their legacy Composio equivalents.
@@ -109,6 +110,7 @@ class SearchSourceConnectorType(StrEnum):
     COMPOSIO_GOOGLE_DRIVE_CONNECTOR = "COMPOSIO_GOOGLE_DRIVE_CONNECTOR"
     COMPOSIO_GMAIL_CONNECTOR = "COMPOSIO_GMAIL_CONNECTOR"
     COMPOSIO_GOOGLE_CALENDAR_CONNECTOR = "COMPOSIO_GOOGLE_CALENDAR_CONNECTOR"
+    LOCAL_FOLDER_CONNECTOR = "LOCAL_FOLDER_CONNECTOR"
 
 
 class PodcastStatus(StrEnum):
@@ -1039,6 +1041,26 @@ class Document(BaseModel, TimestampMixin):
     )
 
 
+class DocumentVersion(BaseModel, TimestampMixin):
+    __tablename__ = "document_versions"
+    __table_args__ = (
+        UniqueConstraint("document_id", "version_number", name="uq_document_version"),
+    )
+
+    document_id = Column(
+        Integer,
+        ForeignKey("documents.id", ondelete="CASCADE"),
+        nullable=False,
+        index=True,
+    )
+    version_number = Column(Integer, nullable=False)
+    source_markdown = Column(Text, nullable=True)
+    content_hash = Column(String, nullable=False)
+    title = Column(String, nullable=True)
+
+    document = relationship("Document", backref="versions")
+
+
 class Chunk(BaseModel, TimestampMixin):
     __tablename__ = "chunks"
 
diff --git a/surfsense_backend/app/routes/documents_routes.py b/surfsense_backend/app/routes/documents_routes.py
index 6e69218f1..9271d4630 100644
--- a/surfsense_backend/app/routes/documents_routes.py
+++ b/surfsense_backend/app/routes/documents_routes.py
@@ -10,6 +10,7 @@ from app.db import (
     Chunk,
     Document,
     DocumentType,
+    DocumentVersion,
     Permission,
     SearchSpace,
     SearchSpaceMembership,
@@ -1135,3 +1136,125 @@ async def delete_document(
         raise HTTPException(
             status_code=500, detail=f"Failed to delete document: {e!s}"
         ) from e
+
+
+# ====================================================================
+# Version History Endpoints
+# ====================================================================
+
+
+@router.get("/documents/{document_id}/versions")
+async def list_document_versions(
+    document_id: int,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """List all versions for a document, ordered by version_number descending."""
+    document = (
+        await session.execute(select(Document).where(Document.id == document_id))
+    ).scalar_one_or_none()
+    if not document:
+        raise HTTPException(status_code=404, detail="Document not found")
+
+    await check_permission(session, user, document.search_space_id, Permission.READ)
+
+    versions = (
+        await session.execute(
+            select(DocumentVersion)
+            .where(DocumentVersion.document_id == document_id)
+            .order_by(DocumentVersion.version_number.desc())
+        )
+    ).scalars().all()
+
+    return [
+        {
+            "version_number": v.version_number,
+            "title": v.title,
+            "content_hash": v.content_hash,
+            "created_at": v.created_at.isoformat() if v.created_at else None,
+        }
+        for v in versions
+    ]
+
+
+@router.get("/documents/{document_id}/versions/{version_number}")
+async def get_document_version(
+    document_id: int,
+    version_number: int,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """Get full version content including source_markdown."""
+    document = (
+        await session.execute(select(Document).where(Document.id == document_id))
+    ).scalar_one_or_none()
+    if not document:
+        raise HTTPException(status_code=404, detail="Document not found")
+
+    await check_permission(session, user, document.search_space_id, Permission.READ)
+
+    version = (
+        await session.execute(
+            select(DocumentVersion).where(
+                DocumentVersion.document_id == document_id,
+                DocumentVersion.version_number == version_number,
+            )
+        )
+    ).scalar_one_or_none()
+    if not version:
+        raise HTTPException(status_code=404, detail="Version not found")
+
+    return {
+        "version_number": version.version_number,
+        "title": version.title,
+        "content_hash": version.content_hash,
+        "source_markdown": version.source_markdown,
+        "created_at": version.created_at.isoformat() if version.created_at else None,
+    }
+
+
+@router.post("/documents/{document_id}/versions/{version_number}/restore")
+async def restore_document_version(
+    document_id: int,
+    version_number: int,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """Restore a previous version: snapshot current state, then overwrite document content."""
+    document = (
+        await session.execute(
+            select(Document).where(Document.id == document_id)
+        )
+    ).scalar_one_or_none()
+    if not document:
+        raise HTTPException(status_code=404, detail="Document not found")
+
+    await check_permission(session, user, document.search_space_id, Permission.WRITE)
+
+    version = (
+        await session.execute(
+            select(DocumentVersion).where(
+                DocumentVersion.document_id == document_id,
+                DocumentVersion.version_number == version_number,
+            )
+        )
+    ).scalar_one_or_none()
+    if not version:
+        raise HTTPException(status_code=404, detail="Version not found")
+
+    # Snapshot current state before restoring
+    from app.utils.document_versioning import create_version_snapshot
+
+    await create_version_snapshot(session, document)
+
+    # Restore the version's content onto the document
+    document.source_markdown = version.source_markdown
+    document.title = version.title or document.title
+    document.content_needs_reindexing = True
+    await session.commit()
+
+    return {
+        "message": f"Restored version {version_number}",
+        "document_id": document_id,
+        "restored_version": version_number,
+    }
diff --git a/surfsense_backend/app/routes/search_source_connectors_routes.py b/surfsense_backend/app/routes/search_source_connectors_routes.py
index b73b8c789..439d83ac1 100644
--- a/surfsense_backend/app/routes/search_source_connectors_routes.py
+++ b/surfsense_backend/app/routes/search_source_connectors_routes.py
@@ -20,6 +20,7 @@ Non-OAuth connectors (BookStack, GitHub, etc.) are limited to one per search spa
 
 import asyncio
 import logging
+import os
 from contextlib import suppress
 from datetime import UTC, datetime, timedelta
 from typing import Any
@@ -55,23 +56,12 @@ from app.schemas import (
 )
 from app.services.composio_service import ComposioService, get_composio_service
 from app.services.notification_service import NotificationService
-from app.tasks.connector_indexers import (
-    index_airtable_records,
-    index_clickup_tasks,
-    index_confluence_pages,
-    index_crawled_urls,
-    index_discord_messages,
-    index_elasticsearch_documents,
-    index_github_repos,
-    index_google_calendar_events,
-    index_google_gmail_messages,
-    index_jira_issues,
-    index_linear_issues,
-    index_luma_events,
-    index_notion_pages,
-    index_slack_messages,
-)
 from app.users import current_active_user
+
+# NOTE: connector indexer functions are imported lazily inside each
+# ``run_*_indexing`` helper to break a circular import cycle:
+#   connector_indexers.__init__ → airtable_indexer → airtable_history
+#   → app.routes.__init__ → this file → connector_indexers (not ready yet)
 from app.utils.connector_naming import ensure_unique_connector_name
 from app.utils.indexing_locks import (
     acquire_connector_indexing_lock,
@@ -1180,6 +1170,24 @@ async def index_connector_content(
             )
             response_message = "Obsidian vault indexing started in the background."
 
+        elif connector.connector_type == SearchSourceConnectorType.LOCAL_FOLDER_CONNECTOR:
+            from app.config import config as app_config
+            from app.tasks.celery_tasks.connector_tasks import index_local_folder_task
+
+            if not app_config.is_self_hosted():
+                raise HTTPException(
+                    status_code=400,
+                    detail="Local folder connector is only available in self-hosted mode",
+                )
+
+            logger.info(
+                f"Triggering local folder indexing for connector {connector_id} into search space {search_space_id}"
+            )
+            index_local_folder_task.delay(
+                connector_id, search_space_id, str(user.id), indexing_from, indexing_to
+            )
+            response_message = "Local folder indexing started in the background."
+
         elif (
             connector.connector_type
             == SearchSourceConnectorType.COMPOSIO_GOOGLE_DRIVE_CONNECTOR
@@ -1312,6 +1320,76 @@ async def index_connector_content(
         ) from e
 
 
+class IndexFileRequest(BaseModel):  # request body accepted by index_single_file
+    file_path: str = Field(..., description="Absolute path to the file to index")
+
+
+@router.post(
+    "/search-source-connectors/{connector_id}/index-file",
+    response_model=dict[str, Any],
+)
+async def index_single_file(
+    connector_id: int,
+    body: IndexFileRequest,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """Queue indexing of one file for a local folder connector (chokidar real-time trigger); responds 400 outside self-hosted mode, 404 for an unknown connector and 403 when the path does not resolve inside the connector's folder."""
+    from app.config import config as app_config
+    from app.tasks.celery_tasks.connector_tasks import index_local_folder_task
+
+    if not app_config.is_self_hosted():
+        raise HTTPException(
+            status_code=400,
+            detail="Local folder connector is only available in self-hosted mode",
+        )
+
+    result = await session.execute(
+        select(SearchSourceConnector).filter(
+            SearchSourceConnector.id == connector_id,
+            SearchSourceConnector.connector_type
+            == SearchSourceConnectorType.LOCAL_FOLDER_CONNECTOR,
+        )
+    )
+    connector = result.scalars().first()
+    if not connector:
+        raise HTTPException(status_code=404, detail="Local folder connector not found")
+
+    await check_permission(session, user, connector.search_space_id, Permission.WRITE)
+
+    folder_path = (connector.config or {}).get("folder_path") or ""
+
+    # Security: resolve symlinks and verify the file is inside folder_path.
+    # A missing folder_path is refused: realpath("") would resolve to the CWD.
+    try:
+        resolved_file = os.path.realpath(body.file_path)
+        resolved_folder = os.path.realpath(folder_path)
+        # commonpath compares whole path components, unlike a string prefix test.
+        common = os.path.commonpath([resolved_folder, resolved_file])
+        if not folder_path or common != resolved_folder:
+            raise HTTPException(
+                status_code=403,
+                detail="File path is outside the configured folder",
+            )
+    except (OSError, ValueError) as exc:
+        raise HTTPException(status_code=403, detail="Invalid file path") from exc
+
+    index_local_folder_task.delay(
+        connector_id,
+        connector.search_space_id,
+        str(user.id),
+        None,
+        None,
+        target_file_path=resolved_file,
+    )
+
+    return {
+        "message": "Single file indexing started",
+        "connector_id": connector_id,
+        "file_path": body.file_path,
+    }
+
+
 async def _update_connector_timestamp_by_id(session: AsyncSession, connector_id: int):
     """
     Update the last_indexed_at timestamp for a connector by its ID.
@@ -1378,6 +1456,8 @@ async def run_slack_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_slack_messages
+
     await _run_indexing_with_notifications(
         session=session,
         connector_id=connector_id,
@@ -1824,6 +1904,8 @@ async def run_notion_indexing_with_new_session(
     Create a new session and run the Notion indexing task.
     This prevents session leaks by creating a dedicated session for the background task.
     """
+    from app.tasks.connector_indexers import index_notion_pages
+
     async with async_session_maker() as session:
         await _run_indexing_with_notifications(
             session=session,
@@ -1858,6 +1940,8 @@ async def run_notion_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_notion_pages
+
     await _run_indexing_with_notifications(
         session=session,
         connector_id=connector_id,
@@ -1910,6 +1994,8 @@ async def run_github_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_github_repos
+
     await _run_indexing_with_notifications(
         session=session,
         connector_id=connector_id,
@@ -1961,6 +2047,8 @@ async def run_linear_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_linear_issues
+
     await _run_indexing_with_notifications(
         session=session,
         connector_id=connector_id,
@@ -2011,6 +2099,8 @@ async def run_discord_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_discord_messages
+
     await _run_indexing_with_notifications(
         session=session,
         connector_id=connector_id,
@@ -2113,6 +2203,8 @@ async def run_jira_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_jira_issues
+
     await _run_indexing_with_notifications(
         session=session,
         connector_id=connector_id,
@@ -2166,6 +2258,8 @@ async def run_confluence_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_confluence_pages
+
     await _run_indexing_with_notifications(
         session=session,
         connector_id=connector_id,
@@ -2217,6 +2311,8 @@ async def run_clickup_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_clickup_tasks
+
     await _run_indexing_with_notifications(
         session=session,
         connector_id=connector_id,
@@ -2268,6 +2364,8 @@ async def run_airtable_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_airtable_records
+
     await _run_indexing_with_notifications(
         session=session,
         connector_id=connector_id,
@@ -2321,6 +2419,8 @@ async def run_google_calendar_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_google_calendar_events
+
     await _run_indexing_with_notifications(
         session=session,
         connector_id=connector_id,
@@ -2370,6 +2470,7 @@ async def run_google_gmail_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_google_gmail_messages
 
     # Create a wrapper function that calls index_google_gmail_messages with max_messages
     async def gmail_indexing_wrapper(
@@ -2836,6 +2937,8 @@ async def run_luma_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_luma_events
+
     await _run_indexing_with_notifications(
         session=session,
         connector_id=connector_id,
@@ -2888,6 +2991,8 @@ async def run_elasticsearch_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_elasticsearch_documents
+
     await _run_indexing_with_notifications(
         session=session,
         connector_id=connector_id,
@@ -2938,6 +3043,8 @@ async def run_web_page_indexing(
         start_date: Start date for indexing
         end_date: End date for indexing
     """
+    from app.tasks.connector_indexers import index_crawled_urls
+
     await _run_indexing_with_notifications(
         session=session,
         connector_id=connector_id,
@@ -3059,6 +3166,62 @@ async def run_obsidian_indexing(
     )
 
 
+async def run_local_folder_indexing_with_new_session(
+    connector_id: int,
+    search_space_id: int,
+    user_id: str,
+    start_date: str | None,
+    end_date: str | None,
+    target_file_path: str | None = None,
+):
+    """Open a dedicated database session and run local folder indexing in it; start_date/end_date may be None and target_file_path is forwarded unchanged."""
+    logger.info(
+        f"Background task started: Indexing local folder connector {connector_id} into space {search_space_id}"
+    )
+    async with async_session_maker() as session:
+        await run_local_folder_indexing(
+            session, connector_id, search_space_id, user_id, start_date, end_date,
+            target_file_path=target_file_path,
+        )
+    logger.info(f"Background task finished: Indexing local folder connector {connector_id}")
+
+
+async def run_local_folder_indexing(
+    session: AsyncSession,
+    connector_id: int,
+    search_space_id: int,
+    user_id: str,
+    start_date: str | None,
+    end_date: str | None,
+    target_file_path: str | None = None,
+):
+    """Run local folder indexing through _run_indexing_with_notifications; start_date/end_date may be None (callers pass None) and target_file_path is forwarded to index_local_folder."""
+    from app.tasks.connector_indexers import index_local_folder
+
+    await _run_indexing_with_notifications(
+        session=session,
+        connector_id=connector_id,
+        search_space_id=search_space_id,
+        user_id=user_id,
+        start_date=start_date,
+        end_date=end_date,
+        indexing_function=lambda session, connector_id, search_space_id, user_id,
+        start_date, end_date, update_last_indexed, on_heartbeat_callback: index_local_folder(
+            session=session,
+            connector_id=connector_id,
+            search_space_id=search_space_id,
+            user_id=user_id,
+            start_date=start_date,
+            end_date=end_date,
+            update_last_indexed=update_last_indexed,
+            on_heartbeat_callback=on_heartbeat_callback,
+            target_file_path=target_file_path,
+        ),
+        update_timestamp_func=_update_connector_timestamp_by_id,
+        supports_heartbeat_callback=True,
+    )
+
+
 async def run_composio_indexing_with_new_session(
     connector_id: int,
     search_space_id: int,

From fe6c2e9b525be5b29cd9b2ec53ea0b5ea463f95f Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 10:37:05 +0530
Subject: [PATCH 024/202] chore: add electron-store dependency for persistent
 data storage

---
 surfsense_desktop/package.json   |   1 +
 surfsense_desktop/pnpm-lock.yaml | 151 ++++++++++++++++++++++++++++++-
 2 files changed, 151 insertions(+), 1 deletion(-)

diff --git a/surfsense_desktop/package.json b/surfsense_desktop/package.json
index 5bbd50514..21e7f4bea 100644
--- a/surfsense_desktop/package.json
+++ b/surfsense_desktop/package.json
@@ -28,6 +28,7 @@
   },
   "dependencies": {
     "chokidar": "^5.0.0",
+    "electron-store": "^11.0.2",
     "electron-updater": "^6.8.3",
     "get-port-please": "^3.2.0"
   }
diff --git a/surfsense_desktop/pnpm-lock.yaml b/surfsense_desktop/pnpm-lock.yaml
index 1533803fb..528f81539 100644
--- a/surfsense_desktop/pnpm-lock.yaml
+++ b/surfsense_desktop/pnpm-lock.yaml
@@ -11,6 +11,9 @@ importers:
       chokidar:
         specifier: ^5.0.0
         version: 5.0.0
+      electron-store:
+        specifier: ^11.0.2
+        version: 11.0.2
       electron-updater:
         specifier: ^6.8.3
         version: 6.8.3
@@ -355,6 +358,14 @@ packages:
     resolution: {integrity: sha512-MnA+YT8fwfJPgBx3m60MNqakm30XOkyIoH1y6huTQvC0PwZG7ki8NacLBcrPbNoo8vEZy7Jpuk7+jMO+CUovTQ==}
     engines: {node: '>= 14'}
 
+  ajv-formats@3.0.1:
+    resolution: {integrity: sha512-8iUql50EUR+uUcdRQ3HDqa6EVyo3docL8g5WJ3FNcWmu62IbkGUue/pEyLBW8VGKKucTPgqeks4fIU1DA4yowQ==}
+    peerDependencies:
+      ajv: ^8.0.0
+    peerDependenciesMeta:
+      ajv:
+        optional: true
+
   ajv-keywords@3.5.2:
     resolution: {integrity: sha512-5p6WTN0DdTGVQk6VjcEju19IgaHudalcfabD7yhDGeA6bcQnmL+CpveLJq/3hvfwd1aof6L386Ougkx6RfyMIQ==}
     peerDependencies:
@@ -363,6 +374,9 @@ packages:
   ajv@6.14.0:
     resolution: {integrity: sha512-IWrosm/yrn43eiKqkfkHis7QioDleaXQHdDVPKg0FSwwd/DuvyX79TZnFOnYpB7dcsFAMmtFztZuXPDvSePkFw==}
 
+  ajv@8.18.0:
+    resolution: {integrity: sha512-PlXPeEWMXMZ7sPYOHqmDyCJzcfNrUr3fGNKtezX14ykXOEIvyK81d+qydx89KY5O71FKMPaQ2vBfBFI5NHR63A==}
+
   ansi-regex@5.0.1:
     resolution: {integrity: sha512-quJQXlTSUGL2LH9SUXo8VwsY4soanhgo6LNSm84E1LBcE8s3O0wpdiRzyR9z/ZZJMlMWv37qOOb9pdJlMUEKFQ==}
     engines: {node: '>=8'}
@@ -414,6 +428,9 @@ packages:
     resolution: {integrity: sha512-+q/t7Ekv1EDY2l6Gda6LLiX14rU9TV20Wa3ofeQmwPFZbOMo9DXrLbOjFaaclkXKWidIaopwAObQDqwWtGUjqg==}
     engines: {node: '>= 4.0.0'}
 
+  atomically@2.1.1:
+    resolution: {integrity: sha512-P4w9o2dqARji6P7MHprklbfiArZAWvo07yW7qs3pdljb3BWr12FIB7W+p0zJiuiVsUpRO0iZn1kFFcpPegg0tQ==}
+
   axios@1.13.6:
     resolution: {integrity: sha512-ChTCHMouEe2kn713WHbQGcuYrr6fXTBiu460OTwWrWob16g1bXn4vtz07Ope7ewMozJAnEquLk5lWQWtBig9DQ==}
 
@@ -553,6 +570,10 @@ packages:
     engines: {node: '>=18'}
     hasBin: true
 
+  conf@15.1.0:
+    resolution: {integrity: sha512-Uy5YN9KEu0WWDaZAVJ5FAmZoaJt9rdK6kH+utItPyGsCqCgaTKkrmZx3zoE0/3q6S3bcp3Ihkk+ZqPxWxFK5og==}
+    engines: {node: '>=20'}
+
   core-util-is@1.0.2:
     resolution: {integrity: sha512-3lqz5YjWTYnW6dlDa5TLaTCcShfar1e40rmcJVwCBJC6mWlFuj0eCHIElmG1g5kyuJ/GD+8Wn4FFCcz4gJPfaQ==}
 
@@ -566,6 +587,10 @@ packages:
     resolution: {integrity: sha512-uV2QOWP2nWzsy2aMp8aRibhi9dlzF5Hgh5SHaB9OiTGEyDTiJJyx0uy51QXdyWbtAHNua4XJzUKca3OzKUd3vA==}
     engines: {node: '>= 8'}
 
+  debounce-fn@6.0.0:
+    resolution: {integrity: sha512-rBMW+F2TXryBwB54Q0d8drNEI+TfoS9JpNTAoVpukbWEhjXQq4rySFYLaqXMFXwdv61Zb2OHtj5bviSoimqxRQ==}
+    engines: {node: '>=18'}
+
   debug@4.4.3:
     resolution: {integrity: sha512-RGwwWnwQvkVfavKVt22FGLw+xYSdzARwm0ru6DhTVA3umU5hZc28V3kO4stgYryrTlLpuvgI9GiijltAjNbcqA==}
     engines: {node: '>=6.0'}
@@ -617,6 +642,10 @@ packages:
     os: [darwin]
     hasBin: true
 
+  dot-prop@10.1.0:
+    resolution: {integrity: sha512-MVUtAugQMOff5RnBy2d9N31iG0lNwg1qAoAOn7pOK5wf94WIaE3My2p3uwTQuvS2AcqchkcR3bHByjaM0mmi7Q==}
+    engines: {node: '>=20'}
+
   dotenv-expand@11.0.7:
     resolution: {integrity: sha512-zIHwmZPRshsCdpMDyVsqGmgyP0yT8GAgXUnkdAoJisxvf33k7yO6OuoKmcTGuXPWSsm8Oh88nZicRLA9Y0rUeA==}
     engines: {node: '>=12'}
@@ -652,6 +681,10 @@ packages:
   electron-publish@26.8.1:
     resolution: {integrity: sha512-q+jrSTIh/Cv4eGZa7oVR+grEJo/FoLMYBAnSL5GCtqwUpr1T+VgKB/dn1pnzxIxqD8S/jP1yilT9VrwCqINR4w==}
 
+  electron-store@11.0.2:
+    resolution: {integrity: sha512-4VkNRdN+BImL2KcCi41WvAYbh6zLX5AUTi4so68yPqiItjbgTjqpEnGAqasgnG+lB6GuAyUltKwVopp6Uv+gwQ==}
+    engines: {node: '>=20'}
+
   electron-updater@6.8.3:
     resolution: {integrity: sha512-Z6sgw3jgbikWKXei1ENdqFOxBP0WlXg3TtKfz0rgw2vIZFJUyI4pD7ZN7jrkm7EoMK+tcm/qTnPUdqfZukBlBQ==}
 
@@ -680,6 +713,10 @@ packages:
     resolution: {integrity: sha512-+h1lkLKhZMTYjog1VEpJNG7NZJWcuc2DDk/qsqSTRRCOXiLjeQ1d1/udrUGhqMxUgAlwKNZ0cf2uqan5GLuS2A==}
     engines: {node: '>=6'}
 
+  env-paths@3.0.0:
+    resolution: {integrity: sha512-dtJUTepzMW3Lm/NPxRf3wP4642UWhjL2sQxc+ym2YMj1m/H2zDNQOlezafzkHwn6sMstjHTwG6iQQsctDW/b1A==}
+    engines: {node: ^12.20.0 || ^14.13.1 || >=16.0.0}
+
   err-code@2.0.3:
     resolution: {integrity: sha512-2bmlRpNKBxT/CRmPOlyISQpNj+qSeYvcym/uT0Jx2bMOlKLtSy1ZmLuVxSEKKyor/N5yhvp/ZiG1oE3DEYMSFA==}
 
@@ -733,6 +770,9 @@ packages:
   fast-json-stable-stringify@2.1.0:
     resolution: {integrity: sha512-lhd/wF+Lk98HZoTCtlVraHtfh5XYijIjalXck7saUtuanSDyLMxnHhSXEDJqHxD7msR8D0uCmqlkwjCV8xvwHw==}
 
+  fast-uri@3.1.0:
+    resolution: {integrity: sha512-iPeeDKJSWf4IEOasVVrknXpaBV0IApz/gp7S2bb7Z4Lljbl2MGJRqInZiUrQwV16cpzw/D3S5j5Julj/gT52AA==}
+
   fd-slicer@1.1.0:
     resolution: {integrity: sha512-cE1qsB/VwyQozZ+q1dGxR8LBYNZeofhEdUNGSMbQD3Gw2lAzX9Zb3uIU6Ebc/Fmyjo9AWWfnn0AUCHqtevs/8g==}
 
@@ -960,6 +1000,12 @@ packages:
   json-schema-traverse@0.4.1:
     resolution: {integrity: sha512-xbbCH5dCYU5T8LcEhhuh7HJ88HXuW3qsI3Y0zOZFKfZEHcpWiHU/Jxzk629Brsab/mMiHQti9wMP+845RPe3Vg==}
 
+  json-schema-traverse@1.0.0:
+    resolution: {integrity: sha512-NM8/P9n3XjXhIZn1lLhkFaACTOURQXjWhV4BA/RnOv8xvgqtqpAX9IO4mRQxSx1Rlo4tqzeqb0sOlruaOy3dug==}
+
+  json-schema-typed@8.0.2:
+    resolution: {integrity: sha512-fQhoXdcvc3V28x7C7BMs4P5+kNlgUURe2jmUT1T//oBRMDrqy1QPelJimwZGo7Hg9VPV3EQV5Bnq4hbFy2vetA==}
+
   json-stringify-safe@5.0.1:
     resolution: {integrity: sha512-ZClg6AaYvamvYEE82d3Iyd3vSSIjQ+odgjaTzRuO3s7toCdFKczob2i0zCh7JE8kWn17yvAWhUVxvqGwUalsRA==}
 
@@ -990,6 +1036,9 @@ packages:
   lodash@4.17.23:
     resolution: {integrity: sha512-LgVTMpQtIopCi79SJeDiP0TfWi5CNEc/L/aRdTh3yIvmZXTnheWpKjSZhnvMl8iXbC1tFg9gdHHDMLoV7CnG+w==}
 
+  lodash@4.18.1:
+    resolution: {integrity: sha512-dMInicTPVE8d1e5otfwmmjlxkZoUpiVLwyeTdUsi/Caj/gfzzblBcCE5sRHV/AsjuCmxWrte2TNGSYuCeCq+0Q==}
+
   log-symbols@4.1.0:
     resolution: {integrity: sha512-8XPvpAA8uyhfteu8pIvQxpJZ7SYYdpUivZpGy6sFsBuKRY/7rQGavedeB8aK+Zkyq6upMFVL/9AW6vOYzfRyLg==}
     engines: {node: '>=10'}
@@ -1034,6 +1083,10 @@ packages:
     resolution: {integrity: sha512-OqbOk5oEQeAZ8WXWydlu9HJjz9WVdEIvamMCcXmuqUYjTknH/sqsWvhQ3vgwKFRR1HpjvNBKQ37nbJgYzGqGcg==}
     engines: {node: '>=6'}
 
+  mimic-function@5.0.1:
+    resolution: {integrity: sha512-VP79XUPxV2CigYP3jWwAUFSku2aKqBH7uTAapFWCBqutsbmDo96KY5o8uh6U+/YSIn5OxJnXp73beVkpqMIGhA==}
+    engines: {node: '>=18'}
+
   mimic-response@1.0.1:
     resolution: {integrity: sha512-j5EctnkH7amfV/q5Hgmoal1g2QHFJRraOtmx0JpIqkxhBhI/lJSl1nMpQ45hVarwNETOoWEimndZ4QK0RHxuxQ==}
     engines: {node: '>=4'}
@@ -1237,6 +1290,10 @@ packages:
     resolution: {integrity: sha512-fGxEI7+wsG9xrvdjsrlmL22OMTTiHRwAMroiEeMgq8gzoLC/PQr7RsRDSTLUg/bZAZtF+TVIkHc6/4RIKrui+Q==}
     engines: {node: '>=0.10.0'}
 
+  require-from-string@2.0.2:
+    resolution: {integrity: sha512-Xf0nWe6RseziFMu+Ap9biiUbmplq6S9/p+7w7YXP/JBHhrUDDUhwa+vANyubuqfZWTveU//DYVGsDG7RKL/vEw==}
+    engines: {node: '>=0.10.0'}
+
   resedit@1.7.2:
     resolution: {integrity: sha512-vHjcY2MlAITJhC0eRD/Vv8Vlgmu9Sd3LX9zZvtGzU5ZImdTN3+d6e/4mnTyV8vEbyf1sgNIrWxhWlrys52OkEA==}
     engines: {node: '>=12', npm: '>=6'}
@@ -1376,6 +1433,12 @@ packages:
     resolution: {integrity: sha512-yDPMNjp4WyfYBkHnjIRLfca1i6KMyGCtsVgoKe/z1+6vukgaENdgGBZt+ZmKPc4gavvEZ5OgHfHdrazhgNyG7w==}
     engines: {node: '>=12'}
 
+  stubborn-fs@2.0.0:
+    resolution: {integrity: sha512-Y0AvSwDw8y+nlSNFXMm2g6L51rBGdAQT20J3YSOqxC53Lo3bjWRtr2BKcfYoAf352WYpsZSTURrA0tqhfgudPA==}
+
+  stubborn-utils@1.0.2:
+    resolution: {integrity: sha512-zOh9jPYI+xrNOyisSelgym4tolKTJCQd5GBhK0+0xJvcYDcwlOoxF/rnFKQ2KRZknXSG9jWAp66fwP6AxN9STg==}
+
   sumchecker@3.0.1:
     resolution: {integrity: sha512-MvjXzkz/BOfyVDkG0oFOtBxHX2u3gKbMHIF/dXblZsgD3BWOFLmHovIpZY7BykJdAjcqRCBi1WYBNdEC9yI7vg==}
     engines: {node: '>= 8.0'}
@@ -1388,6 +1451,10 @@ packages:
     resolution: {integrity: sha512-MpUEN2OodtUzxvKQl72cUF7RQ5EiHsGvSsVG0ia9c5RbWGL2CI4C7EpPS8UTBIplnlzZiNuV56w+FuNxy3ty2Q==}
     engines: {node: '>=10'}
 
+  tagged-tag@1.0.0:
+    resolution: {integrity: sha512-yEFYrVhod+hdNyx7g5Bnkkb0G6si8HJurOoOEgC8B/O0uXLHlaey/65KRv6cuWBNhBgHKAROVpc7QyYqE5gFng==}
+    engines: {node: '>=20'}
+
   tar@7.5.11:
     resolution: {integrity: sha512-ChjMH33/KetonMTAtpYdgUFr0tbz69Fp2v7zWxQfYZX4g5ZN2nOBXm1R2xyA+lMIKrLKIoKAwFj93jE/avX9cQ==}
     engines: {node: '>=18'}
@@ -1430,11 +1497,19 @@ packages:
     resolution: {integrity: sha512-34R7HTnG0XIJcBSn5XhDd7nNFPRcXYRZrBB2O2jdKqYODldSzBAqzsWoZYYvduky73toYS/ESqxPvkDf/F0XMg==}
     engines: {node: '>=10'}
 
+  type-fest@5.5.0:
+    resolution: {integrity: sha512-PlBfpQwiUvGViBNX84Yxwjsdhd1TUlXr6zjX7eoirtCPIr08NAmxwa+fcYBTeRQxHo9YC9wwF3m9i700sHma8g==}
+    engines: {node: '>=20'}
+
   typescript@5.9.3:
     resolution: {integrity: sha512-jl1vZzPDinLr9eUt3J/t7V6FgNEw9QjvBPdysz9KfQDD41fQrC2Y4vKQdiaUpFT4bXlb1RHhLpp8wtm6M5TgSw==}
     engines: {node: '>=14.17'}
     hasBin: true
 
+  uint8array-extras@1.5.0:
+    resolution: {integrity: sha512-rvKSBiC5zqCCiDZ9kAOszZcDvdAHwwIKJG33Ykj43OKcWsnmcBRL09YTU4nOeHZ8Y2a7l1MgTd08SBe9A8Qj6A==}
+    engines: {node: '>=18'}
+
   undici-types@7.16.0:
     resolution: {integrity: sha512-Zz+aZWSj8LE6zoxD+xrjh4VfkIG8Ya6LvYkZqtUQGJPZjYl53ypCaUwWqo7eI0x66KBGeRo+mlBEkMSeSZ38Nw==}
 
@@ -1478,6 +1553,9 @@ packages:
   wcwidth@1.0.1:
     resolution: {integrity: sha512-XHPEwS0q6TaxcvG85+8EYkbiCux2XtWG2mkc47Ng2A77BQu9+DqIOJldST4HgPkuea7dvKSj5VgX3P1d4rW8Tg==}
 
+  when-exit@2.1.5:
+    resolution: {integrity: sha512-VGkKJ564kzt6Ms1dbgPP/yuIoQCrsFAnRbptpC5wOEsDaNsbCB2bnfnaA8i/vRs5tjUSEOtIuvl9/MyVsvQZCg==}
+
   which@2.0.2:
     resolution: {integrity: sha512-BLI3Tl1TW3Pvl70l3yq3Y64i+awpwXqsGBYWkkqMtnbXgrMD+yj7rhW0kuEDxzJaYXGjEW5ogapKNMEKNMjibA==}
     engines: {node: '>= 8'}
@@ -1838,6 +1916,10 @@ snapshots:
 
   agent-base@7.1.4: {}
 
+  ajv-formats@3.0.1(ajv@8.18.0):
+    optionalDependencies:
+      ajv: 8.18.0
+
   ajv-keywords@3.5.2(ajv@6.14.0):
     dependencies:
       ajv: 6.14.0
@@ -1849,6 +1931,13 @@ snapshots:
       json-schema-traverse: 0.4.1
       uri-js: 4.4.1
 
+  ajv@8.18.0:
+    dependencies:
+      fast-deep-equal: 3.1.3
+      fast-uri: 3.1.0
+      json-schema-traverse: 1.0.0
+      require-from-string: 2.0.2
+
   ansi-regex@5.0.1: {}
 
   ansi-regex@6.2.2: {}
@@ -1920,6 +2009,11 @@ snapshots:
 
   at-least-node@1.0.0: {}
 
+  atomically@2.1.1:
+    dependencies:
+      stubborn-fs: 2.0.0
+      when-exit: 2.1.5
+
   axios@1.13.6:
     dependencies:
       follow-redirects: 1.15.11
@@ -2094,6 +2188,18 @@ snapshots:
       tree-kill: 1.2.2
       yargs: 17.7.2
 
+  conf@15.1.0:
+    dependencies:
+      ajv: 8.18.0
+      ajv-formats: 3.0.1(ajv@8.18.0)
+      atomically: 2.1.1
+      debounce-fn: 6.0.0
+      dot-prop: 10.1.0
+      env-paths: 3.0.0
+      json-schema-typed: 8.0.2
+      semver: 7.7.4
+      uint8array-extras: 1.5.0
+
   core-util-is@1.0.2:
     optional: true
 
@@ -2111,6 +2217,10 @@ snapshots:
       shebang-command: 2.0.0
       which: 2.0.2
 
+  debounce-fn@6.0.0:
+    dependencies:
+      mimic-function: 5.0.1
+
   debug@4.4.3:
     dependencies:
       ms: 2.1.3
@@ -2176,6 +2286,10 @@ snapshots:
       verror: 1.10.1
     optional: true
 
+  dot-prop@10.1.0:
+    dependencies:
+      type-fest: 5.5.0
+
   dotenv-expand@11.0.7:
     dependencies:
       dotenv: 16.6.1
@@ -2234,6 +2348,11 @@ snapshots:
     transitivePeerDependencies:
       - supports-color
 
+  electron-store@11.0.2:
+    dependencies:
+      conf: 15.1.0
+      type-fest: 5.5.0
+
   electron-updater@6.8.3:
     dependencies:
       builder-util-runtime: 9.5.1
@@ -2252,7 +2371,7 @@ snapshots:
       '@electron/asar': 3.4.1
       debug: 4.4.3
       fs-extra: 7.0.1
-      lodash: 4.17.23
+      lodash: 4.18.1
       temp: 0.9.4
     optionalDependencies:
       '@electron/windows-sign': 1.2.2
@@ -2282,6 +2401,8 @@ snapshots:
 
   env-paths@2.2.1: {}
 
+  env-paths@3.0.0: {}
+
   err-code@2.0.3: {}
 
   es-define-property@1.0.1: {}
@@ -2355,6 +2476,8 @@ snapshots:
 
   fast-json-stable-stringify@2.1.0: {}
 
+  fast-uri@3.1.0: {}
+
   fd-slicer@1.1.0:
     dependencies:
       pend: 1.2.0
@@ -2610,6 +2733,10 @@ snapshots:
 
   json-schema-traverse@0.4.1: {}
 
+  json-schema-traverse@1.0.0: {}
+
+  json-schema-typed@8.0.2: {}
+
   json-stringify-safe@5.0.1:
     optional: true
 
@@ -2637,6 +2764,8 @@ snapshots:
 
   lodash@4.17.23: {}
 
+  lodash@4.18.1: {}
+
   log-symbols@4.1.0:
     dependencies:
       chalk: 4.1.2
@@ -2683,6 +2812,8 @@ snapshots:
 
   mimic-fn@2.1.0: {}
 
+  mimic-function@5.0.1: {}
+
   mimic-response@1.0.1: {}
 
   mimic-response@3.1.0: {}
@@ -2882,6 +3013,8 @@ snapshots:
 
   require-directory@2.1.1: {}
 
+  require-from-string@2.0.2: {}
+
   resedit@1.7.2:
     dependencies:
       pe-library: 0.4.1
@@ -3019,6 +3152,12 @@ snapshots:
     dependencies:
       ansi-regex: 6.2.2
 
+  stubborn-fs@2.0.0:
+    dependencies:
+      stubborn-utils: 1.0.2
+
+  stubborn-utils@1.0.2: {}
+
   sumchecker@3.0.1:
     dependencies:
       debug: 4.4.3
@@ -3033,6 +3172,8 @@ snapshots:
     dependencies:
       has-flag: 4.0.0
 
+  tagged-tag@1.0.0: {}
+
   tar@7.5.11:
     dependencies:
       '@isaacs/fs-minipass': 4.0.1
@@ -3079,8 +3220,14 @@ snapshots:
   type-fest@0.13.1:
     optional: true
 
+  type-fest@5.5.0:
+    dependencies:
+      tagged-tag: 1.0.0
+
   typescript@5.9.3: {}
 
+  uint8array-extras@1.5.0: {}
+
   undici-types@7.16.0: {}
 
   undici-types@7.18.2: {}
@@ -3126,6 +3273,8 @@ snapshots:
     dependencies:
       defaults: 1.0.4
 
+  when-exit@2.1.5: {}
+
   which@2.0.2:
     dependencies:
       isexe: 2.0.0

From 96a58d0d30fa9ff169ace3e005757becfef16261 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 11:11:57 +0530
Subject: [PATCH 025/202] feat: implement local folder indexing and document
 versioning capabilities

---
 .../app/tasks/celery_tasks/connector_tasks.py |  46 +
 .../app/tasks/connector_indexers/__init__.py  |   4 +-
 .../local_folder_indexer.py                   | 971 ++++++++++++++++++
 .../app/utils/document_versioning.py          | 107 ++
 4 files changed, 1127 insertions(+), 1 deletion(-)
 create mode 100644 surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
 create mode 100644 surfsense_backend/app/utils/document_versioning.py

diff --git a/surfsense_backend/app/tasks/celery_tasks/connector_tasks.py b/surfsense_backend/app/tasks/celery_tasks/connector_tasks.py
index 57475c9fd..9ff578ad2 100644
--- a/surfsense_backend/app/tasks/celery_tasks/connector_tasks.py
+++ b/surfsense_backend/app/tasks/celery_tasks/connector_tasks.py
@@ -926,6 +926,52 @@ async def _index_obsidian_vault(
         )
 
 
+@celery_app.task(name="index_local_folder", bind=True)
+def index_local_folder_task(
+    self,
+    connector_id: int,
+    search_space_id: int,
+    user_id: str,
+    start_date: str | None = None,
+    end_date: str | None = None,
+    target_file_path: str | None = None,
+):
+    """Celery task to index a local folder; runs _index_local_folder to completion on a fresh event loop and forwards every argument unchanged."""
+    import asyncio
+
+    loop = asyncio.new_event_loop()  # dedicated loop for this task run, closed in the finally below
+    asyncio.set_event_loop(loop)
+
+    try:
+        loop.run_until_complete(
+            _index_local_folder(
+                connector_id, search_space_id, user_id, start_date, end_date, target_file_path
+            )
+        )
+    finally:
+        loop.close()
+
+
+async def _index_local_folder(
+    connector_id: int,
+    search_space_id: int,
+    user_id: str,
+    start_date: str | None = None,
+    end_date: str | None = None,
+    target_file_path: str | None = None,
+):
+    """Index local folder with new session; the runner is imported inside the function rather than at module import time."""
+    from app.routes.search_source_connectors_routes import (
+        run_local_folder_indexing,
+    )
+
+    async with get_celery_session_maker()() as session:
+        await run_local_folder_indexing(
+            session, connector_id, search_space_id, user_id, start_date, end_date,
+            target_file_path=target_file_path,
+        )
+
+
 @celery_app.task(name="index_composio_connector", bind=True)
 def index_composio_connector_task(
     self,
diff --git a/surfsense_backend/app/tasks/connector_indexers/__init__.py b/surfsense_backend/app/tasks/connector_indexers/__init__.py
index 9a1d17fd5..8e4ad69e5 100644
--- a/surfsense_backend/app/tasks/connector_indexers/__init__.py
+++ b/surfsense_backend/app/tasks/connector_indexers/__init__.py
@@ -42,9 +42,10 @@ from .jira_indexer import index_jira_issues
 
 # Issue tracking and project management
 from .linear_indexer import index_linear_issues
-from .luma_indexer import index_luma_events
 
 # Documentation and knowledge management
+from .local_folder_indexer import index_local_folder
+from .luma_indexer import index_luma_events
 from .notion_indexer import index_notion_pages
 from .obsidian_indexer import index_obsidian_vault
 from .slack_indexer import index_slack_messages
@@ -74,4 +75,5 @@ __all__ = [  # noqa: RUF022
     # Communication platforms
     "index_slack_messages",
     "index_google_gmail_messages",
+    "index_local_folder",
 ]
diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
new file mode 100644
index 000000000..fc7fdaf66
--- /dev/null
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -0,0 +1,971 @@
+"""
+Local folder connector indexer.
+
+Indexes files from a local folder on disk. Supports:
+- Full-scan mode (startup reconciliation / manual trigger)
+- Single-file mode (chokidar real-time trigger)
+- Filesystem folder structure mirroring into DB Folder rows
+- Document versioning via create_version_snapshot
+- ETL-based file parsing for binary formats (PDF, DOCX, images, audio, etc.)
+
+Electron-only: all change detection is driven by chokidar in the desktop app.
+"""
+
+import os
+import time
+from collections.abc import Awaitable, Callable
+from datetime import UTC, datetime
+from pathlib import Path
+
+from sqlalchemy import delete, select
+from sqlalchemy.exc import SQLAlchemyError
+from sqlalchemy.ext.asyncio import AsyncSession
+from sqlalchemy.orm.attributes import flag_modified
+
+from app.config import config
+from app.db import (
+    Document,
+    DocumentStatus,
+    DocumentType,
+    Folder,
+    SearchSourceConnectorType,
+)
+from app.services.llm_service import get_user_long_context_llm
+from app.services.task_logging_service import TaskLoggingService
+from app.utils.document_converters import (
+    create_document_chunks,
+    embed_text,
+    generate_content_hash,
+    generate_document_summary,
+    generate_unique_identifier_hash,
+)
+from app.utils.document_versioning import create_version_snapshot
+
+from .base import (
+    build_document_metadata_string,
+    check_document_by_unique_identifier,
+    check_duplicate_document_by_hash,
+    get_connector_by_id,
+    get_current_timestamp,
+    logger,
+    safe_set_chunks,
+    update_connector_last_indexed,
+)
+
+PLAINTEXT_EXTENSIONS = frozenset({  # suffixes that are read directly from disk as text
+    ".md", ".markdown", ".txt", ".text", ".csv", ".tsv",
+    ".json", ".jsonl", ".yaml", ".yml", ".toml", ".ini", ".cfg", ".conf",
+    ".xml", ".html", ".htm", ".css", ".scss", ".less", ".sass",
+    ".py", ".pyw", ".pyi", ".pyx",
+    ".js", ".jsx", ".ts", ".tsx", ".mjs", ".cjs",
+    ".java", ".kt", ".kts", ".scala", ".groovy",
+    ".c", ".h", ".cpp", ".cxx", ".cc", ".hpp", ".hxx",
+    ".cs", ".fs", ".fsx",
+    ".go", ".rs", ".rb", ".php", ".pl", ".pm", ".lua",
+    ".swift", ".m", ".mm",
+    ".r", ".R", ".jl",  # lookups lowercase the suffix first, so ".R" is covered by ".r"
+    ".sh", ".bash", ".zsh", ".fish", ".bat", ".cmd", ".ps1",
+    ".sql", ".graphql", ".gql",
+    ".env", ".gitignore", ".dockerignore", ".editorconfig",  # dotfile names; Path.suffix is "" for a bare dotfile
+    ".makefile", ".cmake",
+    ".log", ".rst", ".tex", ".bib", ".org", ".adoc", ".asciidoc",
+    ".vue", ".svelte", ".astro",
+    ".tf", ".hcl", ".proto",
+})
+
+AUDIO_EXTENSIONS = frozenset({  # suffixes treated as audio by _is_audio_file
+    ".mp3", ".mp4", ".mpeg", ".mpga", ".m4a", ".wav", ".webm",
+})
+
+
+def _is_plaintext_file(filename: str) -> bool:  # bare dotfiles (".env") have an empty suffix, so fall back to the name
+    return (Path(filename).suffix or Path(filename).name).lower() in PLAINTEXT_EXTENSIONS
+
+
+def _is_audio_file(filename: str) -> bool:
+    return Path(filename).suffix.lower() in AUDIO_EXTENSIONS  # case-insensitive suffix match
+
+
+def _needs_etl(filename: str) -> bool:
+    """True when the file is neither plaintext nor audio, so only the ETL service can parse it."""
+    return not (_is_plaintext_file(filename) or _is_audio_file(filename))
+
+HeartbeatCallbackType = Callable[[int], Awaitable[None]]  # async callback; receives the indexed-document count so far
+HEARTBEAT_INTERVAL_SECONDS = 30  # minimum gap between two heartbeat callbacks during a full scan
+
+DEFAULT_EXCLUDE_PATTERNS = [  # used when the connector config has no "exclude_patterns" key
+    ".git",
+    "node_modules",
+    "__pycache__",
+    ".DS_Store",
+    ".obsidian",
+    ".trash",
+]
+
+
+def scan_folder(
+    folder_path: str,
+    file_extensions: list[str] | None = None,
+    exclude_patterns: list[str] | None = None,
+) -> list[dict]:
+    """Walk a directory and return a list of file entries.
+
+    Args:
+        folder_path: Absolute path to the folder to scan.
+        file_extensions: If provided, only include files with these extensions
+            (e.g. [".md", ".txt"]). Matching is case-insensitive and a missing
+            leading dot is tolerated. ``None`` means include all files.
+        exclude_patterns: Directory/file names to exclude.  Any path component
+            matching one of these strings is skipped.
+
+    Returns:
+        List of dicts with keys: path, relative_path, name, modified_at, size.
+
+    Raises:
+        ValueError: If ``folder_path`` does not exist.
+    """
+    root = Path(folder_path)
+    if not root.exists():
+        raise ValueError(f"Folder path does not exist: {folder_path}")
+
+    excluded = frozenset(exclude_patterns or ())
+    # Normalise once so "MD", ".MD" and ".md" all match the lowercased suffix.
+    wanted: frozenset[str] | None = None
+    if file_extensions is not None:
+        wanted = frozenset(
+            e.lower() if e.startswith(".") or not e else f".{e.lower()}"
+            for e in file_extensions
+        )
+
+    files: list[dict] = []
+    for dirpath, dirnames, filenames in os.walk(root):
+        # Prune excluded directories in-place so os.walk never descends into them
+        dirnames[:] = [d for d in dirnames if d not in excluded]
+
+        for fname in filenames:
+            if fname in excluded:
+                continue
+
+            full = Path(dirpath) / fname
+            if wanted is not None and full.suffix.lower() not in wanted:
+                continue
+
+            try:
+                stat = full.stat()
+                rel_path = full.relative_to(root)
+                files.append(
+                    {
+                        "path": str(full),
+                        "relative_path": str(rel_path),
+                        "name": full.name,
+                        "modified_at": datetime.fromtimestamp(stat.st_mtime, tz=UTC),
+                        "size": stat.st_size,
+                    }
+                )
+            except OSError as e:
+                logger.warning(f"Could not stat file {full}: {e}")
+
+    return files
+
+
+def _read_plaintext_file(file_path: str) -> str:
+    """Return the file's text decoded as UTF-8 (undecodable bytes are replaced).
+
+    Raises ValueError when the decoded text contains a NUL character.
+    """
+    text = Path(file_path).read_text(encoding="utf-8", errors="replace")
+    if text.find("\x00") != -1:
+        raise ValueError(f"File contains null bytes — likely a binary file opened as text: {file_path}")
+    return text
+
+
+async def _read_file_content(file_path: str, filename: str) -> str:
+    """Return the textual content of a file, parsing non-text formats when needed.
+
+    Files with a plaintext extension are read straight from disk. Everything else
+    (audio, PDF, DOCX, ...) is handed to ``_parse_file_to_markdown`` from the
+    OneDrive content extractor once the required service setting is present.
+
+    Raises ValueError when an audio file is found but neither STT_SERVICE nor
+    ETL_SERVICE is set, or when another binary file is found and ETL_SERVICE is unset.
+    """
+    if _is_plaintext_file(filename):
+        return _read_plaintext_file(file_path)
+
+    # Missing config attributes are treated the same as unset values.
+    etl_setting = getattr(config, "ETL_SERVICE", None)
+
+    if _is_audio_file(filename):
+        stt_setting = getattr(config, "STT_SERVICE", None)
+        if not (stt_setting or etl_setting):
+            raise ValueError(
+                f"No STT_SERVICE configured — cannot transcribe audio file: {filename}"
+            )
+    elif not etl_setting:
+        # Neither plaintext nor audio: the file can only be parsed through ETL.
+        raise ValueError(
+            f"No ETL_SERVICE configured — cannot parse binary file: {filename}. "
+            f"Set ETL_SERVICE to UNSTRUCTURED, LLAMACLOUD, or DOCLING in your .env"
+        )
+
+    from app.connectors.onedrive.content_extractor import (
+        _parse_file_to_markdown,
+    )
+    return await _parse_file_to_markdown(file_path, filename)
+
+
+async def _compute_file_content_hash(
+    file_path: str, filename: str, search_space_id: int,
+) -> tuple[str, str]:
+    """Extract a file's text and hash it for the given search space.
+
+    The text comes from ``_read_file_content`` (direct read or ETL); the result
+    is the pair ``(content_text, content_hash)``.
+    """
+    text = await _read_file_content(file_path, filename)
+    return text, generate_content_hash(text, search_space_id)
+
+
+async def _mirror_folder_structure(
+    session: AsyncSession,
+    folder_path: str,
+    folder_name: str,
+    search_space_id: int,
+    user_id: str,
+    connector_config: dict,
+    connector,
+    exclude_patterns: list[str] | None = None,
+) -> dict[str, int]:
+    """Mirror the on-disk directory tree (minus excluded names) into DB Folder rows.
+
+    Reuses the root Folder from config["root_folder_id"] if it exists, else creates it.
+    Returns relative_dir_path -> folder_id; the empty string key ("") is the root folder.
+    """
+    root = Path(folder_path)
+    if exclude_patterns is None:
+        exclude_patterns = []
+
+    # Collect every non-excluded subdirectory path, relative to root
+    subdirs: list[str] = []
+    for dirpath, dirnames, _ in os.walk(root):
+        dirnames[:] = [d for d in dirnames if d not in exclude_patterns]  # prune in place so os.walk skips them
+        rel = Path(dirpath).relative_to(root)
+        if any(part in exclude_patterns for part in rel.parts):
+            continue
+        rel_str = str(rel) if str(rel) != "." else ""
+        if rel_str:
+            subdirs.append(rel_str)
+
+    # Sort by depth so parents are created before children
+    subdirs.sort(key=lambda p: p.count(os.sep))
+
+    mapping: dict[str, int] = {}
+
+    # Get or create root folder
+    root_folder_id = connector_config.get("root_folder_id")
+    if root_folder_id:
+        existing = (
+            await session.execute(
+                select(Folder).where(Folder.id == root_folder_id)
+            )
+        ).scalar_one_or_none()
+        if existing:
+            mapping[""] = existing.id
+        else:
+            root_folder_id = None  # stored id no longer resolves; fall through and recreate the root
+
+    if not root_folder_id:
+        root_folder = Folder(
+            name=folder_name,
+            search_space_id=search_space_id,
+            created_by_id=user_id,
+            position="a0",
+        )
+        session.add(root_folder)
+        await session.flush()  # flush so root_folder.id is available below
+        mapping[""] = root_folder.id
+        # Persist root_folder_id into connector config (reassign + flag so the change is tracked)
+        connector_config["root_folder_id"] = root_folder.id
+        connector.config = {**connector.config, "root_folder_id": root_folder.id}
+        flag_modified(connector, "config")
+
+    # Create/reuse subdirectory Folder rows, matched by (name, parent, search space)
+    for rel_dir in subdirs:
+        dir_parts = Path(rel_dir).parts
+        dir_name = dir_parts[-1]
+        parent_rel = str(Path(*dir_parts[:-1])) if len(dir_parts) > 1 else ""
+
+        parent_id = mapping.get(parent_rel, mapping[""])  # an unmapped parent falls back to the root folder
+
+        existing_folder = (
+            await session.execute(
+                select(Folder).where(
+                    Folder.name == dir_name,
+                    Folder.parent_id == parent_id,
+                    Folder.search_space_id == search_space_id,
+                )
+            )
+        ).scalar_one_or_none()
+
+        if existing_folder:
+            mapping[rel_dir] = existing_folder.id
+        else:
+            new_folder = Folder(
+                name=dir_name,
+                parent_id=parent_id,
+                search_space_id=search_space_id,
+                created_by_id=user_id,
+                position="a0",
+            )
+            session.add(new_folder)
+            await session.flush()  # flush so new_folder.id can parent deeper directories
+            mapping[rel_dir] = new_folder.id
+
+    await session.flush()
+    return mapping
+
+
+async def _cleanup_empty_folders(
+    session: AsyncSession,
+    root_folder_id: int,
+    search_space_id: int,
+    existing_dirs_on_disk: set[str],
+    folder_mapping: dict[str, int],
+) -> None:
+    """Delete empty Folder rows under the connector root that are no longer on disk.
+
+    Only descendants of ``root_folder_id`` are considered, so empty folders that
+    belong to the user or to other connectors in the same search space are kept.
+    Stale folders from earlier syncs are still found through their parent links.
+    """
+    # Reverse mapping folder_id -> rel_dir for directories seen in this sync
+    id_to_rel: dict[int, str] = {fid: rel for rel, fid in folder_mapping.items() if rel}
+
+    all_folders = (
+        await session.execute(
+            select(Folder).where(
+                Folder.search_space_id == search_space_id,
+                Folder.id != root_folder_id,
+            )
+        )
+    ).scalars().all()
+    parent_of = {folder.id: folder.parent_id for folder in all_folders}
+
+    def _is_under_root(folder_id: int) -> bool:
+        seen: set[int] = set()  # guards against cyclic parent links
+        current = parent_of.get(folder_id)
+        while current is not None and current not in seen:
+            if current == root_folder_id:
+                return True
+            seen.add(current)
+            current = parent_of.get(current)
+        return False
+
+    # Candidates: folders below the root whose directory is gone from disk
+    candidates: list[Folder] = [
+        folder
+        for folder in all_folders
+        if _is_under_root(folder.id)
+        and id_to_rel.get(folder.id) not in existing_dirs_on_disk
+    ]
+
+    # Repeat until a pass deletes nothing so parents emptied by a deletion go too
+    changed = True
+    while changed:
+        changed = False
+        remaining: list[Folder] = []
+        for folder in candidates:
+            in_use = (await session.execute(
+                select(Document.id).where(Document.folder_id == folder.id).limit(1)
+            )).scalar_one_or_none() is not None
+            in_use = in_use or (await session.execute(
+                select(Folder.id).where(Folder.parent_id == folder.id).limit(1)
+            )).scalar_one_or_none() is not None
+            if in_use:
+                remaining.append(folder)
+                continue
+            await session.execute(delete(Folder).where(Folder.id == folder.id))
+            changed = True
+        candidates = remaining
+
+
+async def index_local_folder(
+    session: AsyncSession,
+    connector_id: int,
+    search_space_id: int,
+    user_id: str,
+    start_date: str | None = None,
+    end_date: str | None = None,
+    update_last_indexed: bool = True,
+    on_heartbeat_callback: HeartbeatCallbackType | None = None,
+    target_file_path: str | None = None,
+) -> tuple[int, int, str | None]:
+    """Index files from a local folder.
+
+    Full scan (target_file_path=None) walks the folder and handles new, changed and
+    deleted files; single-file mode (target_file_path set) processes only that file.
+    start_date / end_date are accepted but not used by this indexer.
+
+    Returns (indexed_count, skipped_count, error_or_warning_message).
+    """
+    task_logger = TaskLoggingService(session, search_space_id)
+
+    log_entry = await task_logger.log_task_start(
+        task_name="local_folder_indexing",
+        source="connector_indexing_task",
+        message=f"Starting local folder indexing for connector {connector_id}",
+        metadata={
+            "connector_id": connector_id,
+            "user_id": str(user_id),
+            "target_file_path": target_file_path,
+        },
+    )
+
+    try:
+        connector = await get_connector_by_id(
+            session, connector_id, SearchSourceConnectorType.LOCAL_FOLDER_CONNECTOR
+        )
+        if not connector:
+            await task_logger.log_task_failure(
+                log_entry,
+                f"Connector {connector_id} not found",
+                "Connector not found",
+                {},
+            )
+            return 0, 0, f"Connector {connector_id} not found"
+
+        folder_path = connector.config.get("folder_path")
+        if not folder_path or not os.path.exists(folder_path):
+            await task_logger.log_task_failure(
+                log_entry,
+                f"Folder path missing or does not exist: {folder_path}",
+                "Folder not found",
+                {},
+            )
+            return 0, 0, f"Folder path missing or does not exist: {folder_path}"
+
+        folder_name = connector.config.get("folder_name") or os.path.basename(folder_path)
+        exclude_patterns = connector.config.get("exclude_patterns", DEFAULT_EXCLUDE_PATTERNS)
+        file_extensions = connector.config.get("file_extensions")  # None = all
+
+        # ====================================================================
+        # SINGLE-FILE MODE
+        # ====================================================================
+        if target_file_path:
+            return await _index_single_file(
+                session=session,
+                connector=connector,
+                connector_id=connector_id,
+                search_space_id=search_space_id,
+                user_id=user_id,
+                folder_path=folder_path,
+                folder_name=folder_name,
+                target_file_path=target_file_path,
+                task_logger=task_logger,
+                log_entry=log_entry,
+                update_last_indexed=update_last_indexed,
+            )
+
+        # ====================================================================
+        # FULL-SCAN MODE
+        # ====================================================================
+
+        # Phase 0: Mirror folder structure
+        await task_logger.log_task_progress(
+            log_entry, "Mirroring folder structure", {"stage": "folder_mirror"}
+        )
+
+        folder_mapping = await _mirror_folder_structure(
+            session=session,
+            folder_path=folder_path,
+            folder_name=folder_name,
+            search_space_id=search_space_id,
+            user_id=user_id,
+            connector_config=connector.config,
+            connector=connector,
+            exclude_patterns=exclude_patterns,
+        )
+        await session.flush()
+
+        # Scan files on disk
+        try:
+            files = scan_folder(folder_path, file_extensions, exclude_patterns)
+        except Exception as e:
+            await task_logger.log_task_failure(
+                log_entry, f"Failed to scan folder: {e}", "Scan error", {}
+            )
+            return 0, 0, f"Failed to scan folder: {e}"
+
+        logger.info(f"Found {len(files)} files in folder")
+
+        indexed_count = 0
+        skipped_count = 0
+        failed_count = 0
+        duplicate_count = 0
+
+        last_heartbeat_time = time.time()
+
+        # ================================================================
+        # PHASE 1: Analyze all files, create pending documents
+        # ================================================================
+        files_to_process: list[dict] = []
+        new_documents_created = False
+        seen_unique_hashes: set[str] = set()
+
+        for file_info in files:
+            try:
+                relative_path = file_info["relative_path"]
+                file_path_abs = file_info["path"]
+
+                unique_identifier = f"{folder_name}:{relative_path}"
+                unique_identifier_hash = generate_unique_identifier_hash(
+                    DocumentType.LOCAL_FOLDER_FILE,
+                    unique_identifier,
+                    search_space_id,
+                )
+                seen_unique_hashes.add(unique_identifier_hash)
+
+                existing_document = await check_document_by_unique_identifier(
+                    session, unique_identifier_hash
+                )
+
+                if existing_document:
+                    # Check mtime first (cheap)
+                    stored_mtime = (existing_document.document_metadata or {}).get("mtime")
+                    current_mtime = file_info["modified_at"].timestamp()
+
+                    # Trust the mtime shortcut only for READY docs; others are re-checked
+                    is_ready = DocumentStatus.is_state(
+                        existing_document.status, DocumentStatus.READY
+                    )
+                    if is_ready and stored_mtime and abs(current_mtime - stored_mtime) < 1.0:
+                        skipped_count += 1
+                        continue
+
+                    # mtime differs — read file and check content hash
+                    try:
+                        content, content_hash = await _compute_file_content_hash(
+                            file_path_abs, file_info["relative_path"], search_space_id
+                        )
+                    except Exception as read_err:
+                        logger.warning(f"Could not read {file_path_abs}: {read_err}")
+                        skipped_count += 1
+                        continue
+
+                    if existing_document.content_hash == content_hash:
+                        # Content same, just update mtime in metadata
+                        meta = dict(existing_document.document_metadata or {})
+                        meta["mtime"] = current_mtime
+                        existing_document.document_metadata = meta
+                        if not DocumentStatus.is_state(
+                            existing_document.status, DocumentStatus.READY
+                        ):
+                            existing_document.status = DocumentStatus.ready()
+                        skipped_count += 1
+                        continue
+
+                    # Content actually changed — snapshot version, queue for re-index
+                    await create_version_snapshot(session, existing_document)
+
+                    files_to_process.append(
+                        {
+                            "document": existing_document,
+                            "is_new": False,
+                            "file_info": file_info,
+                            "content": content,
+                            "content_hash": content_hash,
+                            "unique_identifier_hash": unique_identifier_hash,
+                            "relative_path": relative_path,
+                            "title": file_info["name"],
+                        }
+                    )
+                    continue
+
+                # New document — read content
+                try:
+                    content, content_hash = await _compute_file_content_hash(
+                        file_path_abs, file_info["relative_path"], search_space_id
+                    )
+                except Exception as read_err:
+                    logger.warning(f"Could not read {file_path_abs}: {read_err}")
+                    skipped_count += 1
+                    continue
+
+                if not content.strip():
+                    skipped_count += 1
+                    continue
+
+                # Check for duplicate content from another connector
+                with session.no_autoflush:
+                    dup = await check_duplicate_document_by_hash(session, content_hash)
+                if dup:
+                    duplicate_count += 1
+                    skipped_count += 1
+                    continue
+
+                # Determine folder_id for this file
+                parent_dir = str(Path(relative_path).parent)
+                if parent_dir == ".":
+                    parent_dir = ""
+                folder_id = folder_mapping.get(parent_dir, folder_mapping.get(""))
+
+                document = Document(
+                    search_space_id=search_space_id,
+                    title=file_info["name"],
+                    document_type=DocumentType.LOCAL_FOLDER_FILE,
+                    document_metadata={
+                        "folder_name": folder_name,
+                        "file_path": relative_path,
+                        "connector_id": connector_id,
+                        "mtime": file_info["modified_at"].timestamp(),
+                    },
+                    content="Pending...",
+                    content_hash=unique_identifier_hash,  # Temp unique — updated in phase 2
+                    unique_identifier_hash=unique_identifier_hash,
+                    embedding=None,
+                    status=DocumentStatus.pending(),
+                    updated_at=get_current_timestamp(),
+                    created_by_id=user_id,
+                    connector_id=connector_id,
+                    folder_id=folder_id,
+                )
+                session.add(document)
+                new_documents_created = True
+
+                files_to_process.append(
+                    {
+                        "document": document,
+                        "is_new": True,
+                        "file_info": file_info,
+                        "content": content,
+                        "content_hash": content_hash,
+                        "unique_identifier_hash": unique_identifier_hash,
+                        "relative_path": relative_path,
+                        "title": file_info["name"],
+                    }
+                )
+
+            except Exception as e:
+                logger.exception(f"Phase 1 error for {file_info.get('path')}: {e}")
+                failed_count += 1
+
+        if new_documents_created:
+            await session.commit()
+
+        # ================================================================
+        # PHASE 1.5: Delete documents no longer on disk
+        # ================================================================
+        all_connector_docs = (
+            await session.execute(
+                select(Document).where(
+                    Document.connector_id == connector_id,
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                )
+            )
+        ).scalars().all()
+
+        for doc in all_connector_docs:
+            if doc.unique_identifier_hash not in seen_unique_hashes:
+                await session.delete(doc)
+
+        await session.flush()
+
+        # ================================================================
+        # PHASE 2: Process each document
+        # ================================================================
+        long_context_llm = await get_user_long_context_llm(
+            session, user_id, search_space_id
+        )
+
+        for item in files_to_process:
+            if on_heartbeat_callback:
+                current_time = time.time()
+                if current_time - last_heartbeat_time >= HEARTBEAT_INTERVAL_SECONDS:
+                    await on_heartbeat_callback(indexed_count)
+                    last_heartbeat_time = current_time
+
+            document = item["document"]
+            try:
+                document.status = DocumentStatus.processing()
+                await session.commit()
+
+                title = item["title"]
+                relative_path = item["relative_path"]
+                content = item["content"]
+                content_hash = item["content_hash"]
+                file_info = item["file_info"]
+
+                metadata_sections = [
+                    (
+                        "METADATA",
+                        [
+                            f"Title: {title}",
+                            f"Folder: {folder_name}",
+                            f"Path: {relative_path}",
+                        ],
+                    ),
+                    ("CONTENT", [content]),
+                ]
+                document_string = build_document_metadata_string(metadata_sections)
+
+                summary_content = ""
+                if long_context_llm and connector.enable_summary:
+                    doc_meta = {
+                        "folder_name": folder_name,
+                        "file_path": relative_path,
+                    }
+                    summary_content, _ = await generate_document_summary(
+                        document_string, long_context_llm, doc_meta
+                    )
+
+                embedding = embed_text(document_string)
+                chunks = await create_document_chunks(document_string)
+
+                # Determine folder_id
+                parent_dir = str(Path(relative_path).parent)
+                if parent_dir == ".":
+                    parent_dir = ""
+                folder_id = folder_mapping.get(parent_dir, folder_mapping.get(""))
+
+                document.title = title
+                document.content = document_string
+                document.content_hash = content_hash
+                document.source_markdown = content
+                document.embedding = embedding
+                document.document_metadata = {
+                    "folder_name": folder_name,
+                    "file_path": relative_path,
+                    "connector_id": connector_id,
+                    "summary": summary_content,
+                    "mtime": file_info["modified_at"].timestamp(),
+                }
+                document.folder_id = folder_id
+                await safe_set_chunks(session, document, chunks)
+                document.updated_at = get_current_timestamp()
+                document.status = DocumentStatus.ready()
+
+                indexed_count += 1
+
+                # Commit per document so a later failure's rollback cannot discard this one
+                await session.commit()
+
+            except Exception as e:
+                logger.exception(f"Phase 2 error for {item.get('relative_path')}: {e}")
+                try:
+                    await session.rollback()
+                except Exception:
+                    pass
+                try:
+                    document.status = DocumentStatus.failed(str(e)[:500])
+                    document.updated_at = get_current_timestamp()
+                    await session.commit()
+                except Exception:
+                    try:
+                        await session.rollback()
+                    except Exception:
+                        pass
+                failed_count += 1
+
+        # Cleanup empty folders
+        existing_dirs = set()
+        for dirpath, dirnames, _ in os.walk(folder_path):
+            dirnames[:] = [d for d in dirnames if d not in exclude_patterns]
+            rel = str(Path(dirpath).relative_to(folder_path))
+            if rel == ".":
+                rel = ""
+            if rel and not any(part in exclude_patterns for part in Path(rel).parts):
+                existing_dirs.add(rel)
+
+        root_fid = folder_mapping.get("")
+        if root_fid:
+            await _cleanup_empty_folders(
+                session, root_fid, search_space_id, existing_dirs, folder_mapping
+            )
+
+        await update_connector_last_indexed(session, connector, update_last_indexed)
+
+        try:
+            await session.commit()
+        except Exception as e:
+            if "duplicate key value violates unique constraint" in str(e).lower():
+                logger.warning(f"Duplicate key during commit: {e}")
+                await session.rollback()
+            else:
+                raise
+
+        warning_parts = []
+        if duplicate_count > 0:
+            warning_parts.append(f"{duplicate_count} duplicate")
+        if failed_count > 0:
+            warning_parts.append(f"{failed_count} failed")
+        warning_message = ", ".join(warning_parts) if warning_parts else None
+
+        await task_logger.log_task_success(
+            log_entry,
+            f"Completed local folder indexing for connector {connector_id}",
+            {
+                "indexed": indexed_count,
+                "skipped": skipped_count,
+                "failed": failed_count,
+                "duplicates": duplicate_count,
+            },
+        )
+
+        return indexed_count, skipped_count, warning_message
+
+    except SQLAlchemyError as e:
+        logger.exception(f"Database error during local folder indexing: {e}")
+        await session.rollback()
+        await task_logger.log_task_failure(
+            log_entry, f"DB error: {e}", "Database error", {}
+        )
+        return 0, 0, f"Database error: {e}"
+
+    except Exception as e:
+        logger.exception(f"Error during local folder indexing: {e}")
+        await task_logger.log_task_failure(
+            log_entry, f"Error: {e}", "Unexpected error", {}
+        )
+        return 0, 0, str(e)
+
+
+async def _index_single_file(
+    session: AsyncSession,
+    connector,
+    connector_id: int,
+    search_space_id: int,
+    user_id: str,
+    folder_path: str,
+    folder_name: str,
+    target_file_path: str,
+    task_logger,
+    log_entry,
+    update_last_indexed: bool = True,
+) -> tuple[int, int, str | None]:
+    """Index, refresh, or remove a single file (chokidar real-time trigger).
+
+    Missing file: its document is deleted. Unchanged content hash: only the stored
+    mtime is refreshed. Changed content: snapshot, then re-index. Returns
+    ``(indexed, skipped, message)``; errors are rolled back, logged and returned.
+    """
+    try:
+        full_path = Path(target_file_path)
+        # The identifier depends only on the relative path: build it once for both branches.
+        rel_path = str(full_path.relative_to(folder_path))
+        unique_id = f"{folder_name}:{rel_path}"
+        uid_hash = generate_unique_identifier_hash(
+            DocumentType.LOCAL_FOLDER_FILE, unique_id, search_space_id
+        )
+
+        if not full_path.exists():
+            # File was deleted — find and remove the document
+            existing = await check_document_by_unique_identifier(session, uid_hash)
+            if existing:
+                await session.delete(existing)
+                await session.commit()
+            return 0, 0, None
+
+        try:
+            content, content_hash = await _compute_file_content_hash(
+                str(full_path), full_path.name, search_space_id
+            )
+        except Exception as e:
+            return 0, 1, f"Could not read file: {e}"
+
+        if not content.strip():
+            return 0, 1, None
+
+        existing = await check_document_by_unique_identifier(session, uid_hash)
+        mtime = full_path.stat().st_mtime
+
+        if existing:
+            if existing.content_hash == content_hash:
+                # Unchanged content: refresh only the stored mtime
+                meta = dict(existing.document_metadata or {})
+                meta["mtime"] = mtime
+                existing.document_metadata = meta
+                await session.commit()
+                return 0, 1, None
+
+            # Content changed — snapshot + re-index
+            await create_version_snapshot(session, existing)
+
+        long_context_llm = await get_user_long_context_llm(
+            session, user_id, search_space_id
+        )
+
+        # NOTE(review): test I5 expects title "b" for b.md — confirm name vs stem.
+        title = full_path.name
+
+        metadata_sections = [
+            ("METADATA", [f"Title: {title}", f"Folder: {folder_name}", f"Path: {rel_path}"]),
+            ("CONTENT", [content]),
+        ]
+        document_string = build_document_metadata_string(metadata_sections)
+
+        summary_content = ""
+        if long_context_llm and connector.enable_summary:
+            summary_content, _ = await generate_document_summary(
+                document_string, long_context_llm, {"folder_name": folder_name, "file_path": rel_path}
+            )
+
+        embedding = embed_text(document_string)
+        chunks = await create_document_chunks(document_string)
+
+        doc_metadata = {
+            "folder_name": folder_name,
+            "file_path": rel_path,
+            "connector_id": connector_id,
+            "summary": summary_content,
+            "mtime": mtime,
+        }
+
+        if existing:
+            existing.title = title
+            existing.content = document_string
+            existing.content_hash = content_hash
+            existing.source_markdown = content
+            existing.embedding = embedding
+            existing.document_metadata = doc_metadata
+            await safe_set_chunks(session, existing, chunks)
+            existing.updated_at = get_current_timestamp()
+            existing.status = DocumentStatus.ready()
+        else:
+            document = Document(
+                search_space_id=search_space_id,
+                title=title,
+                document_type=DocumentType.LOCAL_FOLDER_FILE,
+                document_metadata=doc_metadata,
+                content=document_string,
+                content_hash=content_hash,
+                unique_identifier_hash=uid_hash,
+                source_markdown=content,
+                embedding=embedding,
+                status=DocumentStatus.ready(),
+                updated_at=get_current_timestamp(),
+                created_by_id=user_id,
+                connector_id=connector_id,
+            )
+            session.add(document)
+            # Flush so document.id is populated before the chunks reference it
+            await session.flush()
+            for chunk in chunks:
+                chunk.document_id = document.id
+            session.add_all(chunks)
+
+        await update_connector_last_indexed(session, connector, update_last_indexed)
+        await session.commit()
+
+        await task_logger.log_task_success(
+            log_entry,
+            f"Single file indexed: {rel_path}",
+            {"file": rel_path},
+        )
+        return 1, 0, None
+
+    except Exception as e:
+        logger.exception(f"Error indexing single file {target_file_path}: {e}")
+        await session.rollback()
+        # Close the task log entry on failure, as the folder-level handler does.
+        await task_logger.log_task_failure(log_entry, f"Error: {e}", "Unexpected error", {})
+        return 0, 0, str(e)
diff --git a/surfsense_backend/app/utils/document_versioning.py b/surfsense_backend/app/utils/document_versioning.py
new file mode 100644
index 000000000..889bc4a3a
--- /dev/null
+++ b/surfsense_backend/app/utils/document_versioning.py
@@ -0,0 +1,107 @@
+"""Document versioning: snapshot creation and cleanup.
+
+Rules:
+- 30-minute debounce window: if the latest version was created < 30 min ago,
+  overwrite it instead of creating a new row.
+- Maximum 20 versions per document.
+- Versions older than 90 days are cleaned up.
+"""
+
+from datetime import UTC, datetime, timedelta
+
+from sqlalchemy import delete, func, select
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from app.db import Document, DocumentVersion
+
+MAX_VERSIONS_PER_DOCUMENT = 20
+DEBOUNCE_MINUTES = 30
+RETENTION_DAYS = 90
+
+
+def _now() -> datetime:
+    return datetime.now(tz=UTC)  # timezone-aware current time in UTC
+
+
+async def create_version_snapshot(
+    session: AsyncSession,
+    document: Document,
+) -> DocumentVersion | None:
+    """Snapshot the document's current state into a DocumentVersion row.
+
+    The newest version is overwritten in place when it is younger than
+    DEBOUNCE_MINUTES; otherwise a new row is inserted and versions past
+    RETENTION_DAYS or beyond MAX_VERSIONS_PER_DOCUMENT are deleted.
+    Returns the created or overwritten row; changes are flushed, not committed.
+    """
+    now = _now()
+
+    latest = (
+        await session.execute(
+            select(DocumentVersion)
+            .where(DocumentVersion.document_id == document.id)
+            .order_by(DocumentVersion.version_number.desc())
+            .limit(1)
+        )
+    ).scalar_one_or_none()
+
+    if latest is not None:
+        created_at = latest.created_at
+        # Label only naive timestamps as UTC; an aware value keeps its own offset.
+        if created_at.tzinfo is None:
+            created_at = created_at.replace(tzinfo=UTC)
+        if now - created_at < timedelta(minutes=DEBOUNCE_MINUTES):
+            latest.source_markdown = document.source_markdown
+            latest.content_hash = document.content_hash
+            latest.title = document.title
+            latest.created_at = now
+            await session.flush()
+            return latest
+
+    # `latest` is the highest-numbered row, so no separate MAX() query is needed.
+    next_number = (latest.version_number if latest is not None else 0) + 1
+    version = DocumentVersion(
+        document_id=document.id,
+        version_number=next_number,
+        source_markdown=document.source_markdown,
+        content_hash=document.content_hash,
+        title=document.title,
+        created_at=now,
+    )
+    session.add(version)
+    await session.flush()
+
+    # Cleanup: remove versions older than RETENTION_DAYS
+    cutoff = now - timedelta(days=RETENTION_DAYS)
+    await session.execute(
+        delete(DocumentVersion).where(
+            DocumentVersion.document_id == document.id,
+            DocumentVersion.created_at < cutoff,
+        )
+    )
+
+    # Cleanup: cap at MAX_VERSIONS_PER_DOCUMENT
+    count = (
+        await session.execute(
+            select(func.count()).select_from(DocumentVersion).where(
+                DocumentVersion.document_id == document.id
+            )
+        )
+    ).scalar_one()
+
+    if count > MAX_VERSIONS_PER_DOCUMENT:
+        excess = count - MAX_VERSIONS_PER_DOCUMENT
+        oldest_ids_result = await session.execute(
+            select(DocumentVersion.id)
+            .where(DocumentVersion.document_id == document.id)
+            .order_by(DocumentVersion.version_number.asc())
+            .limit(excess)
+        )
+        oldest_ids = [row[0] for row in oldest_ids_result.all()]
+        if oldest_ids:
+            await session.execute(
+                delete(DocumentVersion).where(DocumentVersion.id.in_(oldest_ids))
+            )
+
+    await session.flush()
+    return version

From 775dea7894f5737de3ab79bd5230b595f2dcc956 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 11:12:16 +0530
Subject: [PATCH 026/202] feat: add integration and unit tests for local folder
 indexing and document versioning

---
 .../tests/integration/conftest.py             |  21 +
 .../test_local_folder_pipeline.py             | 609 ++++++++++++++++++
 .../integration/test_document_versioning.py   | 184 ++++++
 .../test_local_folder_scan.py                 |  80 +++
 4 files changed, 894 insertions(+)
 create mode 100644 surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
 create mode 100644 surfsense_backend/tests/integration/test_document_versioning.py
 create mode 100644 surfsense_backend/tests/unit/connector_indexers/test_local_folder_scan.py

diff --git a/surfsense_backend/tests/integration/conftest.py b/surfsense_backend/tests/integration/conftest.py
index d9d7cacae..840246e2f 100644
--- a/surfsense_backend/tests/integration/conftest.py
+++ b/surfsense_backend/tests/integration/conftest.py
@@ -166,3 +166,24 @@ def make_connector_document(db_connector, db_user):
         return ConnectorDocument(**defaults)
 
     return _make
+
+
+@pytest_asyncio.fixture
+async def db_local_folder_connector(
+    db_session: AsyncSession, db_user: User, db_search_space: SearchSpace, tmp_path
+) -> SearchSourceConnector:
+    connector = SearchSourceConnector(
+        name="Test Local Folder",
+        connector_type=SearchSourceConnectorType.LOCAL_FOLDER_CONNECTOR,
+        config={
+            "folder_path": str(tmp_path),  # pytest's per-test temporary directory
+            "folder_name": "test-folder",
+            "exclude_patterns": [],
+            "file_extensions": None,  # NOTE(review): presumably means "no extension filter" — confirm
+        },
+        search_space_id=db_search_space.id,
+        user_id=db_user.id,
+    )
+    db_session.add(connector)
+    await db_session.flush()  # flushed, not committed, before the test receives it
+    return connector
diff --git a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
new file mode 100644
index 000000000..988905f8f
--- /dev/null
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
@@ -0,0 +1,609 @@
+"""Integration tests for local folder indexer — Tier 3 (I1-I5), Tier 4 (F1-F5), Tier 5 (P1)."""
+
+import os
+from pathlib import Path
+from unittest.mock import AsyncMock, MagicMock
+
+import pytest
+from sqlalchemy import func, select
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from app.db import (
+    Document,
+    DocumentStatus,
+    DocumentType,
+    DocumentVersion,
+    Folder,
+    SearchSourceConnector,
+    SearchSpace,
+    User,
+)
+
+import app.tasks.connector_indexers.local_folder_indexer as _lfi_mod
+
+pytestmark = pytest.mark.integration
+
+
+@pytest.fixture
+def patched_self_hosted(monkeypatch):
+    _cfg = type("_Cfg", (), {"is_self_hosted": staticmethod(lambda: True)})()  # stub: is_self_hosted() -> True
+    monkeypatch.setattr(_lfi_mod, "config", _cfg)  # replaces the indexer module's `config` attribute
+
+
+@pytest.fixture
+def patched_embed_for_indexer(monkeypatch):
+    """Replace the indexer's ``embed_text`` with a mock returning a constant vector."""
+    from app.config import config as cfg
+    stub = MagicMock(return_value=[0.1] * cfg.embedding_model_instance.dimension)
+    monkeypatch.setattr(_lfi_mod, "embed_text", stub)
+    return stub
+
+
+@pytest.fixture
+def patched_chunks_for_indexer(monkeypatch):
+    """Make the indexer's ``create_document_chunks`` return one fixed Chunk per call."""
+    from app.db import Chunk
+    from app.config import config as cfg
+    vector_size = cfg.embedding_model_instance.dimension
+
+    async def _single_chunk(text):
+        return [Chunk(content="chunk", embedding=[0.1] * vector_size)]
+    monkeypatch.setattr(_lfi_mod, "create_document_chunks", _single_chunk)
+
+
+@pytest.fixture
+def patched_summary_for_indexer(monkeypatch):
+    monkeypatch.setattr(_lfi_mod, "get_user_long_context_llm", AsyncMock(return_value=None))  # LLM lookup resolves to None
+
+
+# ====================================================================
+# Tier 3: Full Indexer Integration (I1-I5)
+# ====================================================================
+
+
+class TestFullIndexer:
+    """Tier 3: runs index_local_folder on tmp_path files with config, embedding, chunking and LLM lookup patched."""
+    @pytest.mark.usefixtures(
+        "patched_self_hosted",
+        "patched_embed_for_indexer",
+        "patched_chunks_for_indexer",
+        "patched_summary_for_indexer",
+    )
+    async def test_i1_new_file_indexed(
+        self,
+        db_session: AsyncSession,
+        db_local_folder_connector: SearchSourceConnector,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """I1: Single new .md file is indexed with status READY."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        (tmp_path / "note.md").write_text("# Hello World\n\nContent here.")
+
+        count, skipped, err = await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+
+        assert err is None
+        assert count == 1
+
+        docs = (
+            await db_session.execute(
+                select(Document).where(
+                    Document.connector_id == db_local_folder_connector.id
+                )
+            )
+        ).scalars().all()
+        assert len(docs) == 1
+        assert docs[0].document_type == DocumentType.LOCAL_FOLDER_FILE
+        assert DocumentStatus.is_state(docs[0].status, DocumentStatus.READY)
+
+    @pytest.mark.usefixtures(
+        "patched_self_hosted",
+        "patched_embed_for_indexer",
+        "patched_chunks_for_indexer",
+        "patched_summary_for_indexer",
+    )
+    async def test_i2_unchanged_skipped(
+        self,
+        db_session: AsyncSession,
+        db_local_folder_connector: SearchSourceConnector,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """I2: Second run on unchanged directory creates no new documents."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        (tmp_path / "note.md").write_text("# Hello\n\nSame content.")
+
+        count1, _, _ = await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+        assert count1 == 1
+
+        # Second run — unchanged
+        count2, _, _ = await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+        assert count2 == 0
+
+        total = (
+            await db_session.execute(
+                select(func.count()).select_from(Document).where(
+                    Document.connector_id == db_local_folder_connector.id
+                )
+            )
+        ).scalar_one()
+        assert total == 1
+
+    @pytest.mark.usefixtures(
+        "patched_self_hosted",
+        "patched_embed_for_indexer",
+        "patched_chunks_for_indexer",
+        "patched_summary_for_indexer",
+    )
+    async def test_i3_changed_reindexed(
+        self,
+        db_session: AsyncSession,
+        db_local_folder_connector: SearchSourceConnector,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """I3: Modified file content triggers re-index and creates a version."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        f = tmp_path / "note.md"
+        f.write_text("# Version 1\n\nOriginal.")
+
+        await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+
+        # Modify
+        f.write_text("# Version 2\n\nUpdated.")
+        # Shift atime and mtime 10 s ahead so the timestamp differs as well as the content
+        os.utime(f, (f.stat().st_atime + 10, f.stat().st_mtime + 10))
+
+        count, _, _ = await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+        assert count == 1
+
+        # Should have a version snapshot
+        versions = (
+            await db_session.execute(
+                select(DocumentVersion).join(Document).where(
+                    Document.connector_id == db_local_folder_connector.id
+                )
+            )
+        ).scalars().all()
+        assert len(versions) >= 1
+
+    @pytest.mark.usefixtures(
+        "patched_self_hosted",
+        "patched_embed_for_indexer",
+        "patched_chunks_for_indexer",
+        "patched_summary_for_indexer",
+    )
+    async def test_i4_deleted_removed(
+        self,
+        db_session: AsyncSession,
+        db_local_folder_connector: SearchSourceConnector,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """I4: Deleted file is removed from DB on re-sync."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        f = tmp_path / "to_delete.md"
+        f.write_text("# Delete me")
+
+        await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+
+        docs_before = (
+            await db_session.execute(
+                select(func.count()).select_from(Document).where(
+                    Document.connector_id == db_local_folder_connector.id
+                )
+            )
+        ).scalar_one()
+        assert docs_before == 1
+
+        f.unlink()
+
+        await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+
+        docs_after = (
+            await db_session.execute(
+                select(func.count()).select_from(Document).where(
+                    Document.connector_id == db_local_folder_connector.id
+                )
+            )
+        ).scalar_one()
+        assert docs_after == 0
+
+    @pytest.mark.usefixtures(
+        "patched_self_hosted",
+        "patched_embed_for_indexer",
+        "patched_chunks_for_indexer",
+        "patched_summary_for_indexer",
+    )
+    async def test_i5_single_file_mode(
+        self,
+        db_session: AsyncSession,
+        db_local_folder_connector: SearchSourceConnector,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """I5: Single-file mode only processes the specified file."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        (tmp_path / "a.md").write_text("File A")
+        (tmp_path / "b.md").write_text("File B")
+        (tmp_path / "c.md").write_text("File C")
+
+        count, _, _ = await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            target_file_path=str(tmp_path / "b.md"),
+        )
+        assert count == 1
+
+        docs = (
+            await db_session.execute(
+                select(Document).where(
+                    Document.connector_id == db_local_folder_connector.id
+                )
+            )
+        ).scalars().all()
+        assert len(docs) == 1
+        assert docs[0].title == "b"
+
+
+# ====================================================================
+# Tier 4: Folder Mirroring (F1-F5)
+# ====================================================================
+
+
+class TestFolderMirroring:
+    """Tier 4: checks the Folder rows and Document.folder_id values present after index_local_folder runs."""
+    @pytest.mark.usefixtures(
+        "patched_self_hosted",
+        "patched_embed_for_indexer",
+        "patched_chunks_for_indexer",
+        "patched_summary_for_indexer",
+    )
+    async def test_f1_root_folder_created(
+        self,
+        db_session: AsyncSession,
+        db_local_folder_connector: SearchSourceConnector,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """F1: First sync creates a root Folder and stores root_folder_id."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        (tmp_path / "root.md").write_text("Root file")
+
+        await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+
+        # Reload the connector so config changes made during indexing are read back
+        await db_session.refresh(db_local_folder_connector)
+        root_id = db_local_folder_connector.config.get("root_folder_id")
+        assert root_id is not None
+
+        root_folder = (
+            await db_session.execute(select(Folder).where(Folder.id == root_id))
+        ).scalar_one()
+        assert root_folder.name == "test-folder"
+
+    @pytest.mark.usefixtures(
+        "patched_self_hosted",
+        "patched_embed_for_indexer",
+        "patched_chunks_for_indexer",
+        "patched_summary_for_indexer",
+    )
+    async def test_f2_nested_folder_rows(
+        self,
+        db_session: AsyncSession,
+        db_local_folder_connector: SearchSourceConnector,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """F2: Nested dirs create Folder rows with correct parent_id chain."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        daily = tmp_path / "notes" / "daily"
+        daily.mkdir(parents=True)
+        weekly = tmp_path / "notes" / "weekly"
+        weekly.mkdir(parents=True)
+        (daily / "today.md").write_text("today")
+        (weekly / "review.md").write_text("review")
+
+        await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+
+        folders = (
+            await db_session.execute(
+                select(Folder).where(Folder.search_space_id == db_search_space.id)
+            )
+        ).scalars().all()
+
+        folder_names = {f.name for f in folders}
+        assert "notes" in folder_names
+        assert "daily" in folder_names
+        assert "weekly" in folder_names
+
+        notes_folder = next(f for f in folders if f.name == "notes")
+        daily_folder = next(f for f in folders if f.name == "daily")
+        weekly_folder = next(f for f in folders if f.name == "weekly")
+
+        assert daily_folder.parent_id == notes_folder.id
+        assert weekly_folder.parent_id == notes_folder.id
+
+    @pytest.mark.usefixtures(
+        "patched_self_hosted",
+        "patched_embed_for_indexer",
+        "patched_chunks_for_indexer",
+        "patched_summary_for_indexer",
+    )
+    async def test_f3_resync_reuses_folders(
+        self,
+        db_session: AsyncSession,
+        db_local_folder_connector: SearchSourceConnector,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """F3: Re-sync reuses existing Folder rows, no duplicates."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        sub = tmp_path / "docs"
+        sub.mkdir()
+        (sub / "file.md").write_text("content")
+
+        await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+
+        folders_before = (
+            await db_session.execute(
+                select(Folder).where(Folder.search_space_id == db_search_space.id)
+            )
+        ).scalars().all()
+        ids_before = {f.id for f in folders_before}
+
+        # Re-sync
+        await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+
+        folders_after = (
+            await db_session.execute(
+                select(Folder).where(Folder.search_space_id == db_search_space.id)
+            )
+        ).scalars().all()
+        ids_after = {f.id for f in folders_after}
+
+        assert ids_before == ids_after
+
+    @pytest.mark.usefixtures(
+        "patched_self_hosted",
+        "patched_embed_for_indexer",
+        "patched_chunks_for_indexer",
+        "patched_summary_for_indexer",
+    )
+    async def test_f4_folder_id_assigned(
+        self,
+        db_session: AsyncSession,
+        db_local_folder_connector: SearchSourceConnector,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """F4: Documents get correct folder_id based on their directory."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        daily = tmp_path / "notes" / "daily"
+        daily.mkdir(parents=True)
+        (daily / "today.md").write_text("today note")
+        (tmp_path / "root.md").write_text("root note")
+
+        await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+
+        docs = (
+            await db_session.execute(
+                select(Document).where(
+                    Document.connector_id == db_local_folder_connector.id
+                )
+            )
+        ).scalars().all()
+
+        today_doc = next(d for d in docs if d.title == "today")
+        root_doc = next(d for d in docs if d.title == "root")
+
+        daily_folder = (
+            await db_session.execute(
+                select(Folder).where(Folder.name == "daily")
+            )
+        ).scalar_one()
+
+        assert today_doc.folder_id == daily_folder.id
+
+        # Root doc should be in the root folder
+        await db_session.refresh(db_local_folder_connector)
+        root_fid = db_local_folder_connector.config.get("root_folder_id")
+        assert root_doc.folder_id == root_fid
+
+    @pytest.mark.usefixtures(
+        "patched_self_hosted",
+        "patched_embed_for_indexer",
+        "patched_chunks_for_indexer",
+        "patched_summary_for_indexer",
+    )
+    async def test_f5_empty_folder_cleanup(
+        self,
+        db_session: AsyncSession,
+        db_local_folder_connector: SearchSourceConnector,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """F5: Deleted dir's empty Folder row is cleaned up on re-sync."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+        import shutil
+
+        daily = tmp_path / "notes" / "daily"
+        daily.mkdir(parents=True)
+        weekly = tmp_path / "notes" / "weekly"
+        weekly.mkdir(parents=True)
+        (daily / "today.md").write_text("today")
+        (weekly / "review.md").write_text("review")
+
+        await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+
+        # Verify weekly folder exists
+        weekly_folder = (
+            await db_session.execute(
+                select(Folder).where(Folder.name == "weekly")
+            )
+        ).scalar_one_or_none()
+        assert weekly_folder is not None
+
+        # Delete weekly directory + its file
+        shutil.rmtree(weekly)
+
+        await index_local_folder(
+            session=db_session,
+            connector_id=db_local_folder_connector.id,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+        )
+
+        # weekly Folder should be gone (empty, dir removed)
+        weekly_after = (
+            await db_session.execute(
+                select(Folder).where(Folder.name == "weekly")
+            )
+        ).scalar_one_or_none()
+        assert weekly_after is None
+
+        # daily should still exist
+        daily_after = (
+            await db_session.execute(
+                select(Folder).where(Folder.name == "daily")
+            )
+        ).scalar_one_or_none()
+        assert daily_after is not None
+
+
+# ====================================================================
+# Tier 5: Pipeline Integration (P1)
+# ====================================================================
+
+
+class TestPipelineIntegration:
+    """Tier 5: sends a LOCAL_FOLDER_FILE ConnectorDocument through IndexingPipelineService prepare + index."""
+    @pytest.mark.usefixtures(
+        "patched_summarize", "patched_embed_texts", "patched_chunk_text"
+    )
+    async def test_p1_local_folder_file_through_pipeline(
+        self,
+        db_session: AsyncSession,
+        db_local_folder_connector: SearchSourceConnector,
+        db_user: User,
+        db_search_space: SearchSpace,
+        mocker,
+    ):
+        """P1: LOCAL_FOLDER_FILE ConnectorDocument through prepare+index to READY."""
+        from app.indexing_pipeline.connector_document import ConnectorDocument
+        from app.indexing_pipeline.indexing_pipeline_service import IndexingPipelineService
+
+        doc = ConnectorDocument(
+            title="Test Local File",
+            source_markdown="## Local file\n\nContent from disk.",
+            unique_id="test-folder:test.md",
+            document_type=DocumentType.LOCAL_FOLDER_FILE,
+            search_space_id=db_search_space.id,
+            connector_id=db_local_folder_connector.id,
+            created_by_id=str(db_user.id),
+        )
+
+        service = IndexingPipelineService(session=db_session)
+        prepared = await service.prepare_for_indexing([doc])
+        assert len(prepared) == 1
+
+        db_doc = prepared[0]
+        result = await service.index(db_doc, doc, llm=mocker.Mock())
+        assert result is not None
+
+        docs = (
+            await db_session.execute(
+                select(Document).where(
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
+                )
+            )
+        ).scalars().all()
+        assert len(docs) == 1
+        assert DocumentStatus.is_state(docs[0].status, DocumentStatus.READY)
diff --git a/surfsense_backend/tests/integration/test_document_versioning.py b/surfsense_backend/tests/integration/test_document_versioning.py
new file mode 100644
index 000000000..87e3c490c
--- /dev/null
+++ b/surfsense_backend/tests/integration/test_document_versioning.py
@@ -0,0 +1,184 @@
+"""Integration tests for document versioning snapshot + cleanup."""
+
+from datetime import UTC, datetime, timedelta
+
+import pytest
+import pytest_asyncio
+from sqlalchemy import func, select
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from app.db import Document, DocumentType, DocumentVersion, SearchSpace, User
+
+pytestmark = pytest.mark.integration
+
+
+@pytest_asyncio.fixture
+async def db_document(
+    db_session: AsyncSession, db_user: User, db_search_space: SearchSpace
+) -> Document:
+    doc = Document(
+        title="Test Doc",
+        document_type=DocumentType.LOCAL_FOLDER_FILE,
+        document_metadata={},
+        content="Summary of test doc.",
+        content_hash="abc123",
+        unique_identifier_hash="local_folder:test-folder:test.md",
+        source_markdown="# Test\n\nOriginal content.",
+        search_space_id=db_search_space.id,
+        created_by_id=db_user.id,
+    )
+    db_session.add(doc)
+    await db_session.flush()
+    return doc
+
+
+async def _version_count(session: AsyncSession, document_id: int) -> int:
+    result = await session.execute(
+        select(func.count()).select_from(DocumentVersion).where(
+            DocumentVersion.document_id == document_id
+        )
+    )
+    return result.scalar_one()
+
+
+async def _get_versions(session: AsyncSession, document_id: int) -> list[DocumentVersion]:
+    result = await session.execute(
+        select(DocumentVersion)
+        .where(DocumentVersion.document_id == document_id)
+        .order_by(DocumentVersion.version_number)
+    )
+    return list(result.scalars().all())
+
+
+class TestCreateVersionSnapshot:
+    """V1-V5: TDD slices for create_version_snapshot."""
+
+    async def test_v1_creates_first_version(self, db_session, db_document):
+        """V1: First snapshot creates version 1 with the document's current state."""
+        from app.utils.document_versioning import create_version_snapshot
+
+        await create_version_snapshot(db_session, db_document)
+
+        versions = await _get_versions(db_session, db_document.id)
+        assert len(versions) == 1
+        assert versions[0].version_number == 1
+        assert versions[0].source_markdown == "# Test\n\nOriginal content."
+        assert versions[0].content_hash == "abc123"
+        assert versions[0].title == "Test Doc"
+        assert versions[0].document_id == db_document.id
+
+    async def test_v2_creates_version_2_after_30_min(
+        self, db_session, db_document, monkeypatch
+    ):
+        """V2: After 30+ minutes, a new version is created (not overwritten)."""
+        from app.utils.document_versioning import create_version_snapshot
+
+        t0 = datetime(2025, 1, 1, 12, 0, 0, tzinfo=UTC)
+        monkeypatch.setattr(
+            "app.utils.document_versioning._now", lambda: t0
+        )
+        await create_version_snapshot(db_session, db_document)
+
+        # Simulate content change and time passing
+        db_document.source_markdown = "# Test\n\nUpdated content."
+        db_document.content_hash = "def456"
+        t1 = t0 + timedelta(minutes=31)
+        monkeypatch.setattr(
+            "app.utils.document_versioning._now", lambda: t1
+        )
+        await create_version_snapshot(db_session, db_document)
+
+        versions = await _get_versions(db_session, db_document.id)
+        assert len(versions) == 2
+        assert versions[0].version_number == 1
+        assert versions[1].version_number == 2
+        assert versions[1].source_markdown == "# Test\n\nUpdated content."
+
+    async def test_v3_overwrites_within_30_min(
+        self, db_session, db_document, monkeypatch
+    ):
+        """V3: Within 30 minutes, the latest version is overwritten."""
+        from app.utils.document_versioning import create_version_snapshot
+
+        t0 = datetime(2025, 1, 1, 12, 0, 0, tzinfo=UTC)
+        monkeypatch.setattr(
+            "app.utils.document_versioning._now", lambda: t0
+        )
+        await create_version_snapshot(db_session, db_document)
+        count_after_first = await _version_count(db_session, db_document.id)
+        assert count_after_first == 1
+
+        # Simulate quick edit within 30 minutes
+        db_document.source_markdown = "# Test\n\nQuick edit."
+        db_document.content_hash = "quick123"
+        t1 = t0 + timedelta(minutes=10)
+        monkeypatch.setattr(
+            "app.utils.document_versioning._now", lambda: t1
+        )
+        await create_version_snapshot(db_session, db_document)
+
+        count_after_second = await _version_count(db_session, db_document.id)
+        assert count_after_second == 1  # still 1, not 2
+
+        versions = await _get_versions(db_session, db_document.id)
+        assert versions[0].source_markdown == "# Test\n\nQuick edit."
+        assert versions[0].content_hash == "quick123"
+
+    async def test_v4_cleanup_90_day_old_versions(
+        self, db_session, db_document, monkeypatch
+    ):
+        """V4: Versions older than 90 days are cleaned up."""
+        from app.utils.document_versioning import create_version_snapshot
+
+        base = datetime(2025, 1, 1, 12, 0, 0, tzinfo=UTC)
+
+        # Create 5 snapshots: three on days 0-2 and two on days 103-104 after `base`
+        for i in range(5):
+            db_document.source_markdown = f"Content v{i+1}"
+            db_document.content_hash = f"hash_{i+1}"
+            if i < 3:
+                t = base + timedelta(days=i)  # days 0, 1, 2
+            else:
+                t = base + timedelta(days=100 + i)  # days 103, 104 (97 and 96 days before the final `now`)
+            monkeypatch.setattr(
+                "app.utils.document_versioning._now", lambda _t=t: _t
+            )
+            await create_version_snapshot(db_session, db_document)
+
+        # Snapshot once more at day 200; by then all five earlier snapshots are more than 90 days old
+        now = base + timedelta(days=200)
+        monkeypatch.setattr(
+            "app.utils.document_versioning._now", lambda: now
+        )
+        db_document.source_markdown = "Content v6"
+        db_document.content_hash = "hash_6"
+        await create_version_snapshot(db_session, db_document)
+
+        versions = await _get_versions(db_session, db_document.id)
+        # Every version still stored must be at most 90 days old relative to `now` (no count is asserted)
+        for v in versions:
+            age = now - v.created_at.replace(tzinfo=UTC)
+            assert age <= timedelta(days=90), f"Version {v.version_number} is too old"
+
+    async def test_v5_cap_at_20_versions(
+        self, db_session, db_document, monkeypatch
+    ):
+        """V5: More than 20 versions triggers cap — oldest gets deleted."""
+        from app.utils.document_versioning import create_version_snapshot
+
+        base = datetime(2025, 6, 1, 12, 0, 0, tzinfo=UTC)
+
+        # Create 21 versions (all within 90 days, each 31 min apart)
+        for i in range(21):
+            db_document.source_markdown = f"Content v{i+1}"
+            db_document.content_hash = f"hash_{i+1}"
+            t = base + timedelta(minutes=31 * i)
+            monkeypatch.setattr(
+                "app.utils.document_versioning._now", lambda _t=t: _t
+            )
+            await create_version_snapshot(db_session, db_document)
+
+        versions = await _get_versions(db_session, db_document.id)
+        assert len(versions) == 20
+        # The lowest version_number should be 2 (version 1 was the oldest and got capped)
+        assert versions[0].version_number == 2
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_local_folder_scan.py b/surfsense_backend/tests/unit/connector_indexers/test_local_folder_scan.py
new file mode 100644
index 000000000..9b4c73f25
--- /dev/null
+++ b/surfsense_backend/tests/unit/connector_indexers/test_local_folder_scan.py
@@ -0,0 +1,80 @@
+"""Unit tests for scan_folder() pure logic — Tier 2 TDD slices (S1-S4)."""
+
+from pathlib import Path
+
+import pytest
+
+pytestmark = pytest.mark.unit
+
+
+class TestScanFolder:
+    """S1-S4: scan_folder() with real tmp_path filesystem."""
+
+    def test_s1_single_md_file(self, tmp_path: Path):
+        """S1: scan_folder on a dir with one .md file returns correct entry."""
+        from app.tasks.connector_indexers.local_folder_indexer import scan_folder
+
+        md = tmp_path / "note.md"
+        md.write_text("# Hello")
+
+        results = scan_folder(str(tmp_path))
+
+        assert len(results) == 1
+        entry = results[0]
+        assert entry["relative_path"] == "note.md"
+        assert entry["size"] > 0
+        assert "modified_at" in entry
+        assert entry["path"] == str(md)
+
+    def test_s2_extension_filter(self, tmp_path: Path):
+        """S2: file_extensions filter returns only matching files."""
+        from app.tasks.connector_indexers.local_folder_indexer import scan_folder
+
+        (tmp_path / "a.md").write_text("md")
+        (tmp_path / "b.txt").write_text("txt")
+        (tmp_path / "c.pdf").write_bytes(b"%PDF")
+
+        results = scan_folder(str(tmp_path), file_extensions=[".md"])
+        names = {r["relative_path"] for r in results}
+
+        assert names == {"a.md"}
+
+    def test_s3_exclude_patterns(self, tmp_path: Path):
+        """S3: exclude_patterns skips files inside excluded directories."""
+        from app.tasks.connector_indexers.local_folder_indexer import scan_folder
+
+        (tmp_path / "good.md").write_text("good")
+        nm = tmp_path / "node_modules"
+        nm.mkdir()
+        (nm / "dep.js").write_text("module")
+        git = tmp_path / ".git"
+        git.mkdir()
+        (git / "config").write_text("gitconfig")
+
+        results = scan_folder(
+            str(tmp_path), exclude_patterns=["node_modules", ".git"]
+        )
+        names = {r["relative_path"] for r in results}
+
+        assert "good.md" in names
+        assert not any("node_modules" in n for n in names)
+        assert not any(".git" in n for n in names)
+
+    def test_s4_nested_dirs(self, tmp_path: Path):
+        """S4: nested subdirectories produce correct relative paths."""
+        from app.tasks.connector_indexers.local_folder_indexer import scan_folder
+
+        daily = tmp_path / "notes" / "daily"
+        daily.mkdir(parents=True)
+        weekly = tmp_path / "notes" / "weekly"
+        weekly.mkdir(parents=True)
+        (daily / "today.md").write_text("today")
+        (weekly / "review.md").write_text("review")
+        (tmp_path / "root.txt").write_text("root")
+
+        results = scan_folder(str(tmp_path))
+        paths = {r["relative_path"] for r in results}
+
+        assert "notes/daily/today.md" in paths or "notes\\daily\\today.md" in paths
+        assert "notes/weekly/review.md" in paths or "notes\\weekly\\review.md" in paths
+        assert "root.txt" in paths

From 28f556224af78b618992cc40241e4834f5cc528c Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 11:17:49 +0530
Subject: [PATCH 027/202] feat: implement folder watching functionality with
 IPC integration

---
 surfsense_desktop/src/ipc/channels.ts         |  10 +
 surfsense_desktop/src/ipc/handlers.ts         |  28 +++
 surfsense_desktop/src/main.ts                 |   3 +
 .../src/modules/folder-watcher.ts             | 216 ++++++++++++++++++
 surfsense_desktop/src/preload.ts              |  23 ++
 5 files changed, 280 insertions(+)
 create mode 100644 surfsense_desktop/src/modules/folder-watcher.ts

diff --git a/surfsense_desktop/src/ipc/channels.ts b/surfsense_desktop/src/ipc/channels.ts
index 25ec1bc0e..362d3362d 100644
--- a/surfsense_desktop/src/ipc/channels.ts
+++ b/surfsense_desktop/src/ipc/channels.ts
@@ -6,4 +6,14 @@ export const IPC_CHANNELS = {
   SET_QUICK_ASK_MODE: 'set-quick-ask-mode',
   GET_QUICK_ASK_MODE: 'get-quick-ask-mode',
   REPLACE_TEXT: 'replace-text',
+  // Folder sync channels
+  FOLDER_SYNC_SELECT_FOLDER: 'folder-sync:select-folder',
+  FOLDER_SYNC_ADD_FOLDER: 'folder-sync:add-folder',
+  FOLDER_SYNC_REMOVE_FOLDER: 'folder-sync:remove-folder',
+  FOLDER_SYNC_GET_FOLDERS: 'folder-sync:get-folders',
+  FOLDER_SYNC_GET_STATUS: 'folder-sync:get-status',
+  FOLDER_SYNC_FILE_CHANGED: 'folder-sync:file-changed',
+  FOLDER_SYNC_WATCHER_READY: 'folder-sync:watcher-ready',
+  FOLDER_SYNC_PAUSE: 'folder-sync:pause',
+  FOLDER_SYNC_RESUME: 'folder-sync:resume',
 } as const;
diff --git a/surfsense_desktop/src/ipc/handlers.ts b/surfsense_desktop/src/ipc/handlers.ts
index 18e343719..2baf957b0 100644
--- a/surfsense_desktop/src/ipc/handlers.ts
+++ b/surfsense_desktop/src/ipc/handlers.ts
@@ -1,5 +1,14 @@
 import { app, ipcMain, shell } from 'electron';
 import { IPC_CHANNELS } from './channels';
+import {
+  selectFolder,
+  addWatchedFolder,
+  removeWatchedFolder,
+  getWatchedFolders,
+  getWatcherStatus,
+  pauseWatcher,
+  resumeWatcher,
+} from '../modules/folder-watcher';
 
 export function registerIpcHandlers(): void {
   ipcMain.on(IPC_CHANNELS.OPEN_EXTERNAL, (_event, url: string) => {
@@ -16,4 +25,23 @@ export function registerIpcHandlers(): void {
   ipcMain.handle(IPC_CHANNELS.GET_APP_VERSION, () => {
     return app.getVersion();
   });
+
+  // Folder sync handlers
+  ipcMain.handle(IPC_CHANNELS.FOLDER_SYNC_SELECT_FOLDER, () => selectFolder());
+
+  ipcMain.handle(IPC_CHANNELS.FOLDER_SYNC_ADD_FOLDER, (_event, config) =>
+    addWatchedFolder(config)
+  );
+
+  ipcMain.handle(IPC_CHANNELS.FOLDER_SYNC_REMOVE_FOLDER, (_event, folderPath: string) =>
+    removeWatchedFolder(folderPath)
+  );
+
+  ipcMain.handle(IPC_CHANNELS.FOLDER_SYNC_GET_FOLDERS, () => getWatchedFolders());
+
+  ipcMain.handle(IPC_CHANNELS.FOLDER_SYNC_GET_STATUS, () => getWatcherStatus());
+
+  ipcMain.handle(IPC_CHANNELS.FOLDER_SYNC_PAUSE, () => pauseWatcher());
+
+  ipcMain.handle(IPC_CHANNELS.FOLDER_SYNC_RESUME, () => resumeWatcher());
 }
diff --git a/surfsense_desktop/src/main.ts b/surfsense_desktop/src/main.ts
index 3ab41073b..f745d9b5e 100644
--- a/surfsense_desktop/src/main.ts
+++ b/surfsense_desktop/src/main.ts
@@ -6,6 +6,7 @@ import { setupDeepLinks, handlePendingDeepLink } from './modules/deep-links';
 import { setupAutoUpdater } from './modules/auto-updater';
 import { setupMenu } from './modules/menu';
 import { registerQuickAsk, unregisterQuickAsk } from './modules/quick-ask';
+import { registerFolderWatcher, unregisterFolderWatcher } from './modules/folder-watcher';
 import { registerIpcHandlers } from './ipc/handlers';
 
 registerGlobalErrorHandlers();
@@ -28,6 +29,7 @@ app.whenReady().then(async () => {
   }
   createMainWindow();
   registerQuickAsk();
+  registerFolderWatcher();
   setupAutoUpdater();
 
   handlePendingDeepLink();
@@ -47,4 +49,5 @@ app.on('window-all-closed', () => {
 
 app.on('will-quit', () => {
   unregisterQuickAsk();
+  unregisterFolderWatcher();
 });
diff --git a/surfsense_desktop/src/modules/folder-watcher.ts b/surfsense_desktop/src/modules/folder-watcher.ts
new file mode 100644
index 000000000..bfd2136c9
--- /dev/null
+++ b/surfsense_desktop/src/modules/folder-watcher.ts
@@ -0,0 +1,216 @@
+import { BrowserWindow, dialog } from 'electron';
+import chokidar from 'chokidar';
+import * as path from 'path';
+import * as fs from 'fs';
+import { IPC_CHANNELS } from '../ipc/channels';
+
+export interface WatchedFolderConfig {
+  path: string; // folder to watch; also the key used in `watchers` and for store upserts
+  name: string;
+  excludePatterns: string[]; // each entry becomes a `**/<pattern>/**` ignore glob
+  fileExtensions: string[] | null; // null or [] disables filtering; compared with the lower-cased path.extname()
+  connectorId: number; // echoed back in renderer events
+  searchSpaceId: number; // echoed back in file-changed events
+  active: boolean; // only active folders get a watcher
+}
+
+interface WatcherEntry {
+  config: WatchedFolderConfig;
+  watcher: chokidar.FSWatcher | null;
+}
+
+const STORE_KEY = 'watchedFolders';
+let store: any = null;
+let watchers: Map<string, WatcherEntry> = new Map();
+
+/**
+ * Returns the persistent settings store, creating it on first use.
+ * `electron-store` is loaded through a dynamic import and the instance is cached in `store`.
+ */
+async function getStore() {
+  if (store) return store;
+  const { default: Store } = await import('electron-store');
+  // A missing key reads back as an empty folder list.
+  const defaults = { [STORE_KEY]: [] as WatchedFolderConfig[] };
+  store = new Store({ name: 'folder-watcher', defaults });
+  return store;
+}
+
+// First window Electron reports, or null if none. NOTE(review): assumes that window is the main one.
+function getMainWindow(): BrowserWindow | null {
+  return BrowserWindow.getAllWindows()[0] ?? null;
+}
+
+// Pushes `data` to the renderer on `channel`; silently dropped when no live window exists.
+function sendToRenderer(channel: string, data: any) {
+  const target = getMainWindow();
+  if (!target || target.isDestroyed()) return;
+  target.webContents.send(channel, data);
+}
+
+function startWatcher(config: WatchedFolderConfig) { // no-op when config.path is already registered
+  if (watchers.has(config.path)) {
+    return;
+  }
+  // Ignore list: the dotfile regex plus one `**/<pattern>/**` glob per exclude pattern.
+  const ignored = [
+    /(^|[/\\])\../, // dotfiles by default
+    ...config.excludePatterns.map((p) => `**/${p}/**`),
+  ];
+
+  const watcher = chokidar.watch(config.path, {
+    persistent: true,
+    ignoreInitial: false,
+    awaitWriteFinish: {
+      stabilityThreshold: 500,
+      pollInterval: 100,
+    },
+    ignored,
+  });
+  // File events are forwarded only after 'ready' has fired; earlier ones are dropped in handleFileEvent.
+  let ready = false;
+
+  watcher.on('ready', () => {
+    ready = true;
+    sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_WATCHER_READY, {
+      connectorId: config.connectorId,
+      folderPath: config.path,
+    });
+  });
+
+  const handleFileEvent = (filePath: string, action: string) => {
+    if (!ready) return;
+
+    const relativePath = path.relative(config.path, filePath);
+    // Optional allow-list: the file's lower-cased extension must appear verbatim in fileExtensions.
+    if (
+      config.fileExtensions &&
+      config.fileExtensions.length > 0
+    ) {
+      const ext = path.extname(filePath).toLowerCase();
+      if (!config.fileExtensions.includes(ext)) return;
+    }
+
+    sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, {
+      connectorId: config.connectorId,
+      searchSpaceId: config.searchSpaceId,
+      folderPath: config.path,
+      relativePath,
+      fullPath: filePath,
+      action,
+      timestamp: Date.now(),
+    });
+  };
+  // add / change / unlink share one handler and are distinguished by the action string.
+  watcher.on('add', (fp) => handleFileEvent(fp, 'add'));
+  watcher.on('change', (fp) => handleFileEvent(fp, 'change'));
+  watcher.on('unlink', (fp) => handleFileEvent(fp, 'unlink'));
+  // Registered under the folder path, which is what the has() guard at the top checks.
+  watchers.set(config.path, { config, watcher });
+}
+
+// Closes the watcher registered for `folderPath`, if one is open, and forgets the entry.
+// close() is fired without awaiting it.
+function stopWatcher(folderPath: string) {
+  const current = watchers.get(folderPath)?.watcher;
+  if (current) current.close();
+  watchers.delete(folderPath);
+}
+
+// Opens the native directory picker and resolves to the chosen path,
+// or to null when the dialog is cancelled or yields no path.
+export async function selectFolder(): Promise<string | null> {
+  const { canceled, filePaths } = await dialog.showOpenDialog({
+    title: 'Select a folder to watch',
+    properties: ['openDirectory'],
+  });
+  if (canceled || filePaths.length === 0) return null;
+  return filePaths[0];
+}
+
+// Persists `config` (upsert by path), restarts its watcher when active, and resolves to the full folder list.
+export async function addWatchedFolder(
+  config: WatchedFolderConfig
+): Promise<WatchedFolderConfig[]> {
+  const s = await getStore();
+  const folders: WatchedFolderConfig[] = s.get(STORE_KEY, []);
+  // Re-adding a known folder replaces its stored config instead of duplicating it.
+  const existing = folders.findIndex((f: WatchedFolderConfig) => f.path === config.path);
+  if (existing >= 0) {
+    folders[existing] = config;
+  } else {
+    folders.push(config);
+  }
+  s.set(STORE_KEY, folders);
+  // Stop any watcher still running with the previous config: startWatcher() returns early
+  // for a path that is already registered, and an inactive folder must not keep watching.
+  stopWatcher(config.path);
+  if (config.active) startWatcher(config);
+
+  return folders;
+}
+
+// Deletes `folderPath` from the persisted list, stops its watcher,
+// and resolves to the folders that remain.
+export async function removeWatchedFolder(
+  folderPath: string
+): Promise<WatchedFolderConfig[]> {
+  const settings = await getStore();
+  const persisted: WatchedFolderConfig[] = settings.get(STORE_KEY, []);
+  const remaining = persisted.filter((folder) => folder.path !== folderPath);
+  settings.set(STORE_KEY, remaining);
+  stopWatcher(folderPath);
+  return remaining;
+}
+
+// Resolves to the persisted folder configs (an empty list when none are stored).
+export async function getWatchedFolders(): Promise<WatchedFolderConfig[]> {
+  return (await getStore()).get(STORE_KEY, []);
+}
+
+// One status row per persisted folder. `watching` reports whether the folder has an entry
+// in `watchers`, which stays true for entries that pauseWatcher() has closed.
+export async function getWatcherStatus(): Promise<
+  { path: string; active: boolean; watching: boolean }[]
+> {
+  const settings = await getStore();
+  const persisted: WatchedFolderConfig[] = settings.get(STORE_KEY, []);
+  return persisted.map(({ path: folderPath, active }) => {
+    return { path: folderPath, active, watching: watchers.has(folderPath) };
+  });
+}
+
+// Closes every open watcher in turn; entries stay in `watchers` with watcher set to null.
+export async function pauseWatcher(): Promise<void> {
+  for (const entry of watchers.values()) {
+    if (!entry.watcher) continue;
+    await entry.watcher.close();
+    entry.watcher = null;
+  }
+}
+
+export async function resumeWatcher(): Promise<void> { // restarts the watchers closed by pauseWatcher()
+  for (const [folderPath, entry] of [...watchers]) { // snapshot: the map is mutated below
+    if (entry.watcher || !entry.config.active) continue;
+    watchers.delete(folderPath); // drop the paused placeholder, else startWatcher()'s has() guard returns early
+    startWatcher(entry.config);
+  }
+}
+
+// Starts a watcher for each persisted folder that is marked active
+// and still exists on disk.
+export async function registerFolderWatcher(): Promise<void> {
+  const settings = await getStore();
+  const persisted: WatchedFolderConfig[] = settings.get(STORE_KEY, []);
+  for (const folder of persisted) {
+    if (!folder.active || !fs.existsSync(folder.path)) continue;
+    startWatcher(folder);
+  }
+}
+
+// Stops every registered watcher and empties the registry.
+export async function unregisterFolderWatcher(): Promise<void> {
+  // stopWatcher() also deletes the entry it is given.
+  for (const watchedPath of watchers.keys()) stopWatcher(watchedPath);
+  watchers.clear();
+}
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 264ec25b3..8f65aa633 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -21,4 +21,27 @@ contextBridge.exposeInMainWorld('electronAPI', {
   setQuickAskMode: (mode: string) => ipcRenderer.invoke(IPC_CHANNELS.SET_QUICK_ASK_MODE, mode),
   getQuickAskMode: () => ipcRenderer.invoke(IPC_CHANNELS.GET_QUICK_ASK_MODE),
   replaceText: (text: string) => ipcRenderer.invoke(IPC_CHANNELS.REPLACE_TEXT, text),
+
+  // Folder sync
+  selectFolder: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_SELECT_FOLDER),
+  addWatchedFolder: (config: any) => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_ADD_FOLDER, config),
+  removeWatchedFolder: (folderPath: string) => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_REMOVE_FOLDER, folderPath),
+  getWatchedFolders: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_GET_FOLDERS),
+  getWatcherStatus: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_GET_STATUS),
+  onFileChanged: (callback: (data: any) => void) => {
+    const listener = (_event: unknown, data: any) => callback(data);
+    ipcRenderer.on(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, listener);
+    return () => {
+      ipcRenderer.removeListener(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, listener);
+    };
+  },
+  onWatcherReady: (callback: (data: any) => void) => {
+    const listener = (_event: unknown, data: any) => callback(data);
+    ipcRenderer.on(IPC_CHANNELS.FOLDER_SYNC_WATCHER_READY, listener);
+    return () => {
+      ipcRenderer.removeListener(IPC_CHANNELS.FOLDER_SYNC_WATCHER_READY, listener);
+    };
+  },
+  pauseWatcher: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_PAUSE),
+  resumeWatcher: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_RESUME),
 });

From e2f946b7c03c71496515ec722254d53de2155146 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 11:38:40 +0530
Subject: [PATCH 028/202] feat: add support for Local Folder connector in UI
 components and configuration

---
 .../[search_space_id]/client-layout.tsx       |  4 ++
 .../views/connector-connect-view.tsx          |  1 +
 .../views/connector-edit-view.tsx             | 69 ++++++++++---------
 .../views/indexing-configuration-view.tsx     | 12 ++--
 .../constants/connector-constants.ts          |  8 +++
 .../tabs/all-connectors-tab.tsx               | 25 +++----
 surfsense_web/contracts/enums/connector.ts    |  1 +
 .../contracts/enums/connectorIcons.tsx        |  3 +
 .../contracts/types/connector.types.ts        |  1 +
 9 files changed, 72 insertions(+), 52 deletions(-)

diff --git a/surfsense_web/app/dashboard/[search_space_id]/client-layout.tsx b/surfsense_web/app/dashboard/[search_space_id]/client-layout.tsx
index 1715e525f..60b8aef12 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/client-layout.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/client-layout.tsx
@@ -17,6 +17,7 @@ import { DocumentUploadDialogProvider } from "@/components/assistant-ui/document
 import { LayoutDataProvider } from "@/components/layout";
 import { OnboardingTour } from "@/components/onboarding-tour";
 import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
+import { useFolderSync } from "@/hooks/use-folder-sync";
 import { useGlobalLoadingEffect } from "@/hooks/use-global-loading";
 
 export function DashboardClientLayout({
@@ -159,6 +160,9 @@ export function DashboardClientLayout({
 	// Use global loading screen - spinner animation won't reset
 	useGlobalLoadingEffect(shouldShowLoading);
 
+	// Wire desktop app file watcher -> single-file re-index API
+	useFolderSync();
+
 	if (shouldShowLoading) {
 		return null;
 	}
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-connect-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-connect-view.tsx
index 596b98e93..0b6d0917a 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-connect-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-connect-view.tsx
@@ -20,6 +20,7 @@ const FORM_ID_MAP: Record<string, string> = {
 	CIRCLEBACK_CONNECTOR: "circleback-connect-form",
 	MCP_CONNECTOR: "mcp-connect-form",
 	OBSIDIAN_CONNECTOR: "obsidian-connect-form",
+	LOCAL_FOLDER_CONNECTOR: "local-folder-connect-form",
 };
 
 interface ConnectorConnectViewProps {
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
index 20d4a8e53..dcedb4743 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
@@ -272,13 +272,14 @@ export const ConnectorEditView: FC<ConnectorEditViewProps> = ({
 								{/* AI Summary toggle */}
 								<SummaryConfig enabled={enableSummary} onEnabledChange={onEnableSummaryChange} />
 
-								{/* Date range selector - not shown for file-based connectors (Drive, Dropbox, OneDrive), Webcrawler, or GitHub (indexes full repo snapshots) */}
+								{/* Date range selector - not shown for file-based connectors (Drive, Dropbox, OneDrive), Webcrawler, GitHub, or Local Folder */}
 								{connector.connector_type !== "GOOGLE_DRIVE_CONNECTOR" &&
 									connector.connector_type !== "COMPOSIO_GOOGLE_DRIVE_CONNECTOR" &&
 									connector.connector_type !== "DROPBOX_CONNECTOR" &&
 									connector.connector_type !== "ONEDRIVE_CONNECTOR" &&
 									connector.connector_type !== "WEBCRAWLER_CONNECTOR" &&
-									connector.connector_type !== "GITHUB_CONNECTOR" && (
+									connector.connector_type !== "GITHUB_CONNECTOR" &&
+									connector.connector_type !== "LOCAL_FOLDER_CONNECTOR" && (
 										<DateRangeSelector
 											startDate={startDate}
 											endDate={endDate}
@@ -293,39 +294,39 @@ export const ConnectorEditView: FC<ConnectorEditViewProps> = ({
 										/>
 									)}
 
-								{/* Periodic sync - shown for all indexable connectors */}
-								{(() => {
-									// Check if Google Drive (regular or Composio) has folders/files selected
-									const isGoogleDrive = connector.connector_type === "GOOGLE_DRIVE_CONNECTOR";
-									const isComposioGoogleDrive =
-										connector.connector_type === "COMPOSIO_GOOGLE_DRIVE_CONNECTOR";
-									const requiresFolderSelection = isGoogleDrive || isComposioGoogleDrive;
-									const selectedFolders =
-										(connector.config?.selected_folders as
-											| Array<{ id: string; name: string }>
-											| undefined) || [];
-									const selectedFiles =
-										(connector.config?.selected_files as
-											| Array<{ id: string; name: string }>
-											| undefined) || [];
-									const hasItemsSelected = selectedFolders.length > 0 || selectedFiles.length > 0;
-									const isDisabled = requiresFolderSelection && !hasItemsSelected;
+								{/* Periodic sync - shown for all indexable connectors except Local Folder */}
+								{connector.connector_type !== "LOCAL_FOLDER_CONNECTOR" &&
+									(() => {
+										const isGoogleDrive = connector.connector_type === "GOOGLE_DRIVE_CONNECTOR";
+										const isComposioGoogleDrive =
+											connector.connector_type === "COMPOSIO_GOOGLE_DRIVE_CONNECTOR";
+										const requiresFolderSelection = isGoogleDrive || isComposioGoogleDrive;
+										const selectedFolders =
+											(connector.config?.selected_folders as
+												| Array<{ id: string; name: string }>
+												| undefined) || [];
+										const selectedFiles =
+											(connector.config?.selected_files as
+												| Array<{ id: string; name: string }>
+												| undefined) || [];
+										const hasItemsSelected = selectedFolders.length > 0 || selectedFiles.length > 0;
+										const isDisabled = requiresFolderSelection && !hasItemsSelected;
 
-									return (
-										<PeriodicSyncConfig
-											enabled={periodicEnabled}
-											frequencyMinutes={frequencyMinutes}
-											onEnabledChange={onPeriodicEnabledChange}
-											onFrequencyChange={onFrequencyChange}
-											disabled={isDisabled}
-											disabledMessage={
-												isDisabled
-													? "Select at least one folder or file above to enable periodic sync"
-													: undefined
-											}
-										/>
-									);
-								})()}
+										return (
+											<PeriodicSyncConfig
+												enabled={periodicEnabled}
+												frequencyMinutes={frequencyMinutes}
+												onEnabledChange={onPeriodicEnabledChange}
+												onFrequencyChange={onFrequencyChange}
+												disabled={isDisabled}
+												disabledMessage={
+													isDisabled
+														? "Select at least one folder or file above to enable periodic sync"
+														: undefined
+												}
+											/>
+										);
+									})()}
 							</>
 						)}
 
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/indexing-configuration-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/indexing-configuration-view.tsx
index 564cb87ee..436ce7843 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/indexing-configuration-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/indexing-configuration-view.tsx
@@ -158,13 +158,14 @@ export const IndexingConfigurationView: FC<IndexingConfigurationViewProps> = ({
 								{/* AI Summary toggle */}
 								<SummaryConfig enabled={enableSummary} onEnabledChange={onEnableSummaryChange} />
 
-								{/* Date range selector - not shown for file-based connectors (Drive, Dropbox, OneDrive), Webcrawler, or GitHub (indexes full repo snapshots) */}
+								{/* Date range selector - not shown for file-based connectors (Drive, Dropbox, OneDrive), Webcrawler, GitHub, or Local Folder */}
 								{config.connectorType !== "GOOGLE_DRIVE_CONNECTOR" &&
 									config.connectorType !== "COMPOSIO_GOOGLE_DRIVE_CONNECTOR" &&
 									config.connectorType !== "DROPBOX_CONNECTOR" &&
 									config.connectorType !== "ONEDRIVE_CONNECTOR" &&
 									config.connectorType !== "WEBCRAWLER_CONNECTOR" &&
-									config.connectorType !== "GITHUB_CONNECTOR" && (
+									config.connectorType !== "GITHUB_CONNECTOR" &&
+									config.connectorType !== "LOCAL_FOLDER_CONNECTOR" && (
 										<DateRangeSelector
 											startDate={startDate}
 											endDate={endDate}
@@ -179,9 +180,12 @@ export const IndexingConfigurationView: FC<IndexingConfigurationViewProps> = ({
 										/>
 									)}
 
-								{/* Periodic sync - not shown for Google Drive (regular and Composio) */}
+								{/* Periodic sync - not shown for file-based connectors (Drive, Dropbox, OneDrive) or Local Folder in initial setup; configured in edit view instead */}
 								{config.connectorType !== "GOOGLE_DRIVE_CONNECTOR" &&
-									config.connectorType !== "COMPOSIO_GOOGLE_DRIVE_CONNECTOR" && (
+									config.connectorType !== "COMPOSIO_GOOGLE_DRIVE_CONNECTOR" &&
+									config.connectorType !== "DROPBOX_CONNECTOR" &&
+									config.connectorType !== "ONEDRIVE_CONNECTOR" &&
+									config.connectorType !== "LOCAL_FOLDER_CONNECTOR" && (
 										<PeriodicSyncConfig
 											enabled={periodicEnabled}
 											frequencyMinutes={frequencyMinutes}
diff --git a/surfsense_web/components/assistant-ui/connector-popup/constants/connector-constants.ts b/surfsense_web/components/assistant-ui/connector-popup/constants/connector-constants.ts
index 2e92f637b..3f7d90cd8 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/constants/connector-constants.ts
+++ b/surfsense_web/components/assistant-ui/connector-popup/constants/connector-constants.ts
@@ -184,6 +184,14 @@ export const OTHER_CONNECTORS = [
 		connectorType: EnumConnectorName.OBSIDIAN_CONNECTOR,
 		selfHostedOnly: true,
 	},
+	{
+		id: "local-folder-connector",
+		title: "Local Folder",
+		description: "Watch and sync local folders (desktop only)",
+		connectorType: EnumConnectorName.LOCAL_FOLDER_CONNECTOR,
+		selfHostedOnly: true,
+		desktopOnly: true,
+	},
 ] as const;
 
 // Composio Connectors - Individual entries for each supported toolkit
diff --git a/surfsense_web/components/assistant-ui/connector-popup/tabs/all-connectors-tab.tsx b/surfsense_web/components/assistant-ui/connector-popup/tabs/all-connectors-tab.tsx
index ad2418865..3e8aad620 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/tabs/all-connectors-tab.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/tabs/all-connectors-tab.tsx
@@ -76,29 +76,26 @@ export const AllConnectorsTab: FC<AllConnectorsTabProps> = ({
 }) => {
 	// Check if self-hosted mode (for showing self-hosted only connectors)
 	const selfHosted = isSelfHosted();
+	const isDesktop = typeof window !== "undefined" && !!window.electronAPI;
+
+	const matchesSearch = (title: string, description: string) =>
+		title.toLowerCase().includes(searchQuery.toLowerCase()) ||
+		description.toLowerCase().includes(searchQuery.toLowerCase());
+
+	const passesDeploymentFilter = (c: { selfHostedOnly?: boolean; desktopOnly?: boolean }) =>
+		(!c.selfHostedOnly || selfHosted) && (!c.desktopOnly || isDesktop);
 
 	// Filter connectors based on search and deployment mode
 	const filteredOAuth = OAUTH_CONNECTORS.filter(
-		(c) =>
-			// Filter by search query
-			(c.title.toLowerCase().includes(searchQuery.toLowerCase()) ||
-				c.description.toLowerCase().includes(searchQuery.toLowerCase())) &&
-			// Filter self-hosted only connectors in cloud mode
-			(!("selfHostedOnly" in c) || !c.selfHostedOnly || selfHosted)
+		(c) => matchesSearch(c.title, c.description) && passesDeploymentFilter(c)
 	);
 
 	const filteredCrawlers = CRAWLERS.filter(
-		(c) =>
-			(c.title.toLowerCase().includes(searchQuery.toLowerCase()) ||
-				c.description.toLowerCase().includes(searchQuery.toLowerCase())) &&
-			(!("selfHostedOnly" in c) || !c.selfHostedOnly || selfHosted)
+		(c) => matchesSearch(c.title, c.description) && passesDeploymentFilter(c)
 	);
 
 	const filteredOther = OTHER_CONNECTORS.filter(
-		(c) =>
-			(c.title.toLowerCase().includes(searchQuery.toLowerCase()) ||
-				c.description.toLowerCase().includes(searchQuery.toLowerCase())) &&
-			(!("selfHostedOnly" in c) || !c.selfHostedOnly || selfHosted)
+		(c) => matchesSearch(c.title, c.description) && passesDeploymentFilter(c)
 	);
 
 	// Filter Composio connectors
diff --git a/surfsense_web/contracts/enums/connector.ts b/surfsense_web/contracts/enums/connector.ts
index 501f5d9a3..ecf96d88e 100644
--- a/surfsense_web/contracts/enums/connector.ts
+++ b/surfsense_web/contracts/enums/connector.ts
@@ -25,6 +25,7 @@ export enum EnumConnectorName {
 	YOUTUBE_CONNECTOR = "YOUTUBE_CONNECTOR",
 	CIRCLEBACK_CONNECTOR = "CIRCLEBACK_CONNECTOR",
 	OBSIDIAN_CONNECTOR = "OBSIDIAN_CONNECTOR",
+	LOCAL_FOLDER_CONNECTOR = "LOCAL_FOLDER_CONNECTOR",
 	DROPBOX_CONNECTOR = "DROPBOX_CONNECTOR",
 	MCP_CONNECTOR = "MCP_CONNECTOR",
 	COMPOSIO_GOOGLE_DRIVE_CONNECTOR = "COMPOSIO_GOOGLE_DRIVE_CONNECTOR",
diff --git a/surfsense_web/contracts/enums/connectorIcons.tsx b/surfsense_web/contracts/enums/connectorIcons.tsx
index 2e609b060..f7378b74b 100644
--- a/surfsense_web/contracts/enums/connectorIcons.tsx
+++ b/surfsense_web/contracts/enums/connectorIcons.tsx
@@ -3,6 +3,7 @@ import {
 	BookOpen,
 	File,
 	FileText,
+	FolderSync,
 	Globe,
 	Microscope,
 	Search,
@@ -75,6 +76,8 @@ export const getConnectorIcon = (connectorType: EnumConnectorName | string, clas
 			return <Image src="/connectors/circleback.svg" alt="Circleback" {...imgProps} />;
 		case EnumConnectorName.MCP_CONNECTOR:
 			return <Image src="/connectors/modelcontextprotocol.svg" alt="MCP" {...imgProps} />;
+		case EnumConnectorName.LOCAL_FOLDER_CONNECTOR:
+			return <FolderSync {...iconProps} />;
 		case EnumConnectorName.OBSIDIAN_CONNECTOR:
 			return <Image src="/connectors/obsidian.svg" alt="Obsidian" {...imgProps} />;
 		case EnumConnectorName.COMPOSIO_GOOGLE_DRIVE_CONNECTOR:
diff --git a/surfsense_web/contracts/types/connector.types.ts b/surfsense_web/contracts/types/connector.types.ts
index b83e05dcc..269941375 100644
--- a/surfsense_web/contracts/types/connector.types.ts
+++ b/surfsense_web/contracts/types/connector.types.ts
@@ -30,6 +30,7 @@ export const searchSourceConnectorTypeEnum = z.enum([
 	"DROPBOX_CONNECTOR",
 	"MCP_CONNECTOR",
 	"OBSIDIAN_CONNECTOR",
+	"LOCAL_FOLDER_CONNECTOR",
 	"COMPOSIO_GOOGLE_DRIVE_CONNECTOR",
 	"COMPOSIO_GMAIL_CONNECTOR",
 	"COMPOSIO_GOOGLE_CALENDAR_CONNECTOR",

From 5eeee99bb1be4f118e8417f31c3fe0322d558fb4 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 11:40:04 +0530
Subject: [PATCH 029/202] feat: enhance Local Folder connector with version
 history and folder sync capabilities

---
 .../(manage)/components/DocumentTypeIcon.tsx  |   1 +
 .../components/local-folder-connect-form.tsx  | 272 ++++++++++++++++++
 .../connect-forms/connector-benefits.ts       |   8 +
 .../connector-popup/connect-forms/index.tsx   |   4 +-
 .../components/local-folder-config.tsx        | 163 +++++++++++
 .../connector-configs/index.tsx               |   3 +
 .../utils/connector-document-mapping.ts       |   1 +
 .../components/documents/version-history.tsx  | 185 ++++++++++++
 .../contracts/types/document.types.ts         |   1 +
 surfsense_web/hooks/use-folder-sync.ts        |  41 +++
 .../lib/apis/connectors-api.service.ts        |  12 +
 .../lib/apis/documents-api.service.ts         |  16 ++
 surfsense_web/lib/connectors/utils.ts         |   1 +
 surfsense_web/types/window.d.ts               |  35 +++
 14 files changed, 742 insertions(+), 1 deletion(-)
 create mode 100644 surfsense_web/components/assistant-ui/connector-popup/connect-forms/components/local-folder-connect-form.tsx
 create mode 100644 surfsense_web/components/assistant-ui/connector-popup/connector-configs/components/local-folder-config.tsx
 create mode 100644 surfsense_web/components/documents/version-history.tsx
 create mode 100644 surfsense_web/hooks/use-folder-sync.ts

diff --git a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentTypeIcon.tsx b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentTypeIcon.tsx
index 43108c745..5c03d96fa 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentTypeIcon.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentTypeIcon.tsx
@@ -35,6 +35,7 @@ export function getDocumentTypeLabel(type: string): string {
 		BOOKSTACK_CONNECTOR: "BookStack",
 		CIRCLEBACK: "Circleback",
 		OBSIDIAN_CONNECTOR: "Obsidian",
+		LOCAL_FOLDER_FILE: "Local Folder",
 		SURFSENSE_DOCS: "SurfSense Docs",
 		NOTE: "Note",
 		COMPOSIO_GOOGLE_DRIVE_CONNECTOR: "Composio Google Drive",
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connect-forms/components/local-folder-connect-form.tsx b/surfsense_web/components/assistant-ui/connector-popup/connect-forms/components/local-folder-connect-form.tsx
new file mode 100644
index 000000000..2e893c1c0
--- /dev/null
+++ b/surfsense_web/components/assistant-ui/connector-popup/connect-forms/components/local-folder-connect-form.tsx
@@ -0,0 +1,272 @@
+"use client";
+
+import { zodResolver } from "@hookform/resolvers/zod";
+import { FolderSync, Info } from "lucide-react";
+import type { FC } from "react";
+import { useRef } from "react";
+import { useForm } from "react-hook-form";
+import * as z from "zod";
+import { Alert, AlertDescription, AlertTitle } from "@/components/ui/alert";
+import { Button } from "@/components/ui/button";
+import {
+	Form,
+	FormControl,
+	FormDescription,
+	FormField,
+	FormItem,
+	FormLabel,
+	FormMessage,
+} from "@/components/ui/form";
+import { Input } from "@/components/ui/input";
+import { EnumConnectorName } from "@/contracts/enums/connector";
+import { getConnectorBenefits } from "../connector-benefits";
+import type { ConnectFormProps } from "../index";
+
+const localFolderFormSchema = z.object({
+	name: z.string().min(3, {
+		message: "Connector name must be at least 3 characters.",
+	}),
+	folder_path: z.string().min(1, {
+		message: "Folder path is required.",
+	}),
+	folder_name: z.string().min(1, {
+		message: "Folder name is required.",
+	}),
+	exclude_patterns: z.string().optional(),
+	file_extensions: z.string().optional(),
+});
+
+type LocalFolderFormValues = z.infer<typeof localFolderFormSchema>;
+
+export const LocalFolderConnectForm: FC<ConnectFormProps> = ({ onSubmit, isSubmitting }) => {
+	const isSubmittingRef = useRef(false);
+	const isElectron = typeof window !== "undefined" && !!window.electronAPI;
+
+	const form = useForm<LocalFolderFormValues>({
+		resolver: zodResolver(localFolderFormSchema),
+		defaultValues: {
+			name: "Local Folder",
+			folder_path: "",
+			folder_name: "",
+			exclude_patterns: "node_modules,.git,.DS_Store",
+			file_extensions: "",
+		},
+	});
+
+	const handleBrowse = async () => {
+		const selected = await window.electronAPI?.selectFolder();
+		if (!selected) return;
+		// setValue skips validation by default; revalidate so stale field errors clear.
+		const opts = { shouldValidate: true, shouldDirty: true };
+		form.setValue("folder_path", selected, opts);
+		const folderName = selected.split(/[\\/]/).pop() || "folder";
+		if (!form.getValues("folder_name")) {
+			form.setValue("folder_name", folderName, opts);
+		}
+		if (form.getValues("name") === "Local Folder") {
+			form.setValue("name", folderName, opts);
+		}
+	};
+
+	// Normalizes the comma-separated inputs and forwards the connector payload to
+	// onSubmit; isSubmittingRef blocks re-entrant submits while one is in flight.
+	const handleSubmit = async (values: LocalFolderFormValues) => {
+		if (isSubmittingRef.current || isSubmitting) return;
+		isSubmittingRef.current = true;
+
+		try {
+			const excludePatterns = (values.exclude_patterns ?? "")
+				.split(",")
+				.map((p) => p.trim())
+				.filter(Boolean);
+
+			// Trim and drop blank entries BEFORE adding the dot; the previous order
+			// turned "" into "." so ".md,,.txt" produced a bogus "." extension.
+			const normalizedExtensions = (values.file_extensions ?? "")
+				.split(",")
+				.map((e) => e.trim())
+				.filter(Boolean)
+				.map((ext) => (ext.startsWith(".") ? ext : `.${ext}`));
+			// An empty field already sent null; blank-only input now does the same.
+			const fileExtensions = normalizedExtensions.length > 0 ? normalizedExtensions : null;
+
+			await onSubmit({
+				name: values.name,
+				connector_type: EnumConnectorName.LOCAL_FOLDER_CONNECTOR,
+				config: {
+					folder_path: values.folder_path,
+					folder_name: values.folder_name,
+					exclude_patterns: excludePatterns,
+					file_extensions: fileExtensions,
+				},
+				is_indexable: true,
+				is_active: true,
+				last_indexed_at: null,
+				periodic_indexing_enabled: false,
+				indexing_frequency_minutes: null,
+				next_scheduled_at: null,
+			});
+		} finally {
+			isSubmittingRef.current = false;
+		}
+	};
+
+	return (
+		<div className="space-y-6 pb-6">
+			<Alert className="bg-blue-500/10 dark:bg-blue-500/10 border-blue-500/30 p-2 sm:p-3">
+				<Info className="size-4 shrink-0 text-blue-500" />
+				<AlertTitle className="text-xs sm:text-sm">Desktop App Required</AlertTitle>
+				<AlertDescription className="text-[10px] sm:text-xs">
+					Real-time file watching is powered by the SurfSense desktop app. Files are
+					automatically synced whenever changes are detected.
+				</AlertDescription>
+			</Alert>
+
+			<div className="rounded-xl border border-border bg-slate-400/5 dark:bg-white/5 p-3 sm:p-6 space-y-3 sm:space-y-4">
+				<Form {...form}>
+					<form
+						id="local-folder-connect-form"
+						onSubmit={form.handleSubmit(handleSubmit)}
+						className="space-y-4 sm:space-y-6"
+					>
+						<FormField
+							control={form.control}
+							name="name"
+							render={({ field }) => (
+								<FormItem>
+									<FormLabel className="text-xs sm:text-sm">Connector Name</FormLabel>
+									<FormControl>
+										<Input
+											placeholder="My Documents"
+											className="h-8 sm:h-10 px-2 sm:px-3 text-xs sm:text-sm border-slate-400/20 focus-visible:border-slate-400/40"
+											disabled={isSubmitting}
+											{...field}
+										/>
+									</FormControl>
+									<FormMessage />
+								</FormItem>
+							)}
+						/>
+
+						<FormField
+							control={form.control}
+							name="folder_path"
+							render={({ field }) => (
+								<FormItem>
+									<FormLabel className="text-xs sm:text-sm">Folder Path</FormLabel>
+									<div className="flex gap-2">
+										<FormControl>
+											<Input
+												placeholder="/path/to/your/folder"
+												className="h-8 sm:h-10 px-2 sm:px-3 text-xs sm:text-sm border-slate-400/20 focus-visible:border-slate-400/40 font-mono flex-1"
+												disabled={isSubmitting}
+												{...field}
+											/>
+										</FormControl>
+										{isElectron && (
+											<Button
+												type="button"
+												variant="outline"
+												size="sm"
+												onClick={handleBrowse}
+												disabled={isSubmitting}
+												className="shrink-0"
+											>
+												<FolderSync className="h-4 w-4 mr-1" />
+												Browse
+											</Button>
+										)}
+									</div>
+									<FormDescription className="text-[10px] sm:text-xs">
+										The absolute path to the folder to watch and sync.
+									</FormDescription>
+									<FormMessage />
+								</FormItem>
+							)}
+						/>
+
+						<FormField
+							control={form.control}
+							name="folder_name"
+							render={({ field }) => (
+								<FormItem>
+									<FormLabel className="text-xs sm:text-sm">Display Name</FormLabel>
+									<FormControl>
+										<Input
+											placeholder="My Notes"
+											className="h-8 sm:h-10 px-2 sm:px-3 text-xs sm:text-sm border-slate-400/20 focus-visible:border-slate-400/40"
+											disabled={isSubmitting}
+											{...field}
+										/>
+									</FormControl>
+									<FormDescription className="text-[10px] sm:text-xs">
+										A friendly name shown in the documents sidebar.
+									</FormDescription>
+									<FormMessage />
+								</FormItem>
+							)}
+						/>
+
+						<FormField
+							control={form.control}
+							name="exclude_patterns"
+							render={({ field }) => (
+								<FormItem>
+									<FormLabel className="text-xs sm:text-sm">Exclude Patterns</FormLabel>
+									<FormControl>
+										<Input
+											placeholder="node_modules,.git,.DS_Store"
+											className="h-8 sm:h-10 px-2 sm:px-3 text-xs sm:text-sm border-slate-400/20 focus-visible:border-slate-400/40 font-mono"
+											disabled={isSubmitting}
+											{...field}
+										/>
+									</FormControl>
+									<FormDescription className="text-[10px] sm:text-xs">
+										Comma-separated patterns of directories/files to exclude.
+									</FormDescription>
+									<FormMessage />
+								</FormItem>
+							)}
+						/>
+
+						<FormField
+							control={form.control}
+							name="file_extensions"
+							render={({ field }) => (
+								<FormItem>
+									<FormLabel className="text-xs sm:text-sm">File Extensions (optional)</FormLabel>
+									<FormControl>
+										<Input
+											placeholder=".md,.txt,.rst"
+											className="h-8 sm:h-10 px-2 sm:px-3 text-xs sm:text-sm border-slate-400/20 focus-visible:border-slate-400/40 font-mono"
+											disabled={isSubmitting}
+											{...field}
+										/>
+									</FormControl>
+									<FormDescription className="text-[10px] sm:text-xs">
+										Leave empty to index all supported files, or specify comma-separated extensions.
+									</FormDescription>
+									<FormMessage />
+								</FormItem>
+							)}
+						/>
+
+					</form>
+				</Form>
+			</div>
+
+			{getConnectorBenefits(EnumConnectorName.LOCAL_FOLDER_CONNECTOR) && (
+				<div className="rounded-xl border border-border bg-slate-400/5 dark:bg-white/5 px-3 sm:px-6 py-4 space-y-2">
+					<h4 className="text-xs sm:text-sm font-medium">
+						What you get with Local Folder sync:
+					</h4>
+					<ul className="list-disc pl-5 text-[10px] sm:text-xs text-muted-foreground space-y-1">
+						{getConnectorBenefits(EnumConnectorName.LOCAL_FOLDER_CONNECTOR)?.map(
+							(benefit) => <li key={benefit}>{benefit}</li>
+						)}
+					</ul>
+				</div>
+			)}
+		</div>
+	);
+};
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connect-forms/connector-benefits.ts b/surfsense_web/components/assistant-ui/connector-popup/connect-forms/connector-benefits.ts
index 0dc093100..40c6a7fdd 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connect-forms/connector-benefits.ts
+++ b/surfsense_web/components/assistant-ui/connector-popup/connect-forms/connector-benefits.ts
@@ -111,6 +111,14 @@ export function getConnectorBenefits(connectorType: string): string[] | null {
 			"Incremental sync - only changed files are re-indexed",
 			"Full support for your vault's folder structure",
 		],
+		LOCAL_FOLDER_CONNECTOR: [
+			"Watch local folders for real-time changes via the desktop app",
+			"Automatic change detection — only modified files are re-indexed",
+			"Version history with up to 20 snapshots per document",
+			"Mirrors your folder structure in the SurfSense sidebar",
+			"Supports any text-based file format",
+			"Works as a periodic sync fallback when the desktop app is not running",
+		],
 	};
 
 	return benefits[connectorType] || null;
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connect-forms/index.tsx b/surfsense_web/components/assistant-ui/connector-popup/connect-forms/index.tsx
index 37d4ad5d8..116893399 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connect-forms/index.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connect-forms/index.tsx
@@ -7,6 +7,7 @@ import { GithubConnectForm } from "./components/github-connect-form";
 import { LinkupApiConnectForm } from "./components/linkup-api-connect-form";
 import { LumaConnectForm } from "./components/luma-connect-form";
 import { MCPConnectForm } from "./components/mcp-connect-form";
+import { LocalFolderConnectForm } from "./components/local-folder-connect-form";
 import { ObsidianConnectForm } from "./components/obsidian-connect-form";
 import { TavilyApiConnectForm } from "./components/tavily-api-connect-form";
 
@@ -58,7 +59,8 @@ export function getConnectFormComponent(connectorType: string): ConnectFormCompo
 			return MCPConnectForm;
 		case "OBSIDIAN_CONNECTOR":
 			return ObsidianConnectForm;
-		// Add other connector types here as needed
+		case "LOCAL_FOLDER_CONNECTOR":
+			return LocalFolderConnectForm;
 		default:
 			return null;
 	}
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/components/local-folder-config.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/components/local-folder-config.tsx
new file mode 100644
index 000000000..cb4295079
--- /dev/null
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/components/local-folder-config.tsx
@@ -0,0 +1,163 @@
+"use client";
+
+import type { FC } from "react";
+import { useState } from "react";
+import { FolderSync } from "lucide-react";
+import { Button } from "@/components/ui/button";
+import { Input } from "@/components/ui/input";
+import { Label } from "@/components/ui/label";
+import type { ConnectorConfigProps } from "../index";
+
+export const LocalFolderConfig: FC<ConnectorConfigProps> = ({
+	connector,
+	onConfigChange,
+	onNameChange,
+}) => {
+	const isElectron = typeof window !== "undefined" && !!window.electronAPI;
+
+	const [folderPath, setFolderPath] = useState<string>(
+		(connector.config?.folder_path as string) || ""
+	);
+	const [folderName, setFolderName] = useState<string>(
+		(connector.config?.folder_name as string) || ""
+	);
+	const [excludePatterns, setExcludePatterns] = useState<string>(() => {
+		const patterns = connector.config?.exclude_patterns;
+		if (Array.isArray(patterns)) {
+			return patterns.join(", ");
+		}
+		return (patterns as string) || "node_modules, .git, .DS_Store";
+	});
+	const [fileExtensions, setFileExtensions] = useState<string>(() => {
+		const exts = connector.config?.file_extensions;
+		if (Array.isArray(exts)) {
+			return exts.join(", ");
+		}
+		return (exts as string) || "";
+	});
+	const [name, setName] = useState<string>(connector.name || "");
+
+	const handleFolderPathChange = (value: string) => {
+		setFolderPath(value);
+		onConfigChange?.({ ...connector.config, folder_path: value });
+	};
+
+	const handleFolderNameChange = (value: string) => {
+		setFolderName(value);
+		onConfigChange?.({ ...connector.config, folder_name: value });
+	};
+
+	const handleExcludePatternsChange = (value: string) => {
+		setExcludePatterns(value);
+		const arr = value
+			.split(",")
+			.map((p) => p.trim())
+			.filter(Boolean);
+		onConfigChange?.({ ...connector.config, exclude_patterns: arr });
+	};
+
+	// Stores the raw text and reports the parsed extension list (or null) upward.
+	const handleFileExtensionsChange = (value: string) => {
+		setFileExtensions(value);
+		// Trim and drop blanks before adding the dot: while typing ".md, " the old
+		// order emitted a bogus "." entry for the empty segment.
+		const parsed = value
+			.split(",")
+			.map((e) => e.trim())
+			.filter(Boolean)
+			.map((ext) => (ext.startsWith(".") ? ext : `.${ext}`));
+		const arr = parsed.length > 0 ? parsed : null;
+		onConfigChange?.({ ...connector.config, file_extensions: arr });
+	};
+
+	const handleNameChange = (value: string) => {
+		setName(value);
+		onNameChange?.(value);
+	};
+
+	const handleBrowse = async () => {
+		const selected = await window.electronAPI?.selectFolder();
+		if (!selected) return;
+		const autoName = folderName || selected.split(/[\\/]/).pop() || "folder";
+		setFolderPath(selected);
+		setFolderName(autoName);
+		// Send one merged update: chained handlers would each spread the same stale connector.config.
+		onConfigChange?.({ ...connector.config, folder_path: selected, folder_name: autoName });
+	};
+
+	return (
+		<div className="space-y-6">
+			<div className="rounded-xl border border-border bg-slate-400/5 dark:bg-white/5 p-3 sm:p-6 space-y-3 sm:space-y-4">
+				<div className="space-y-2">
+					<Label className="text-xs sm:text-sm">Connector Name</Label>
+					<Input
+						value={name}
+						onChange={(e) => handleNameChange(e.target.value)}
+						placeholder="Local Folder"
+						className="border-slate-400/20 focus-visible:border-slate-400/40"
+					/>
+				</div>
+			</div>
+
+			<div className="rounded-xl border border-border bg-slate-400/5 dark:bg-white/5 p-3 sm:p-6 space-y-3 sm:space-y-4">
+				<h3 className="font-medium text-sm sm:text-base">Folder Configuration</h3>
+
+				<div className="space-y-4">
+					<div className="space-y-2">
+						<Label className="text-xs sm:text-sm">Folder Path</Label>
+						<div className="flex gap-2">
+							<Input
+								value={folderPath}
+								onChange={(e) => handleFolderPathChange(e.target.value)}
+								placeholder="/path/to/your/folder"
+								className="border-slate-400/20 focus-visible:border-slate-400/40 font-mono flex-1"
+							/>
+							{isElectron && (
+								<Button type="button" variant="outline" size="sm" onClick={handleBrowse} className="shrink-0">
+									<FolderSync className="h-4 w-4 mr-1" />
+									Browse
+								</Button>
+							)}
+						</div>
+					</div>
+
+					<div className="space-y-2">
+						<Label className="text-xs sm:text-sm">Display Name</Label>
+						<Input
+							value={folderName}
+							onChange={(e) => handleFolderNameChange(e.target.value)}
+							placeholder="My Notes"
+							className="border-slate-400/20 focus-visible:border-slate-400/40"
+						/>
+					</div>
+
+					<div className="space-y-2">
+						<Label className="text-xs sm:text-sm">Exclude Patterns</Label>
+						<Input
+							value={excludePatterns}
+							onChange={(e) => handleExcludePatternsChange(e.target.value)}
+							placeholder="node_modules, .git, .DS_Store"
+							className="border-slate-400/20 focus-visible:border-slate-400/40 font-mono"
+						/>
+						<p className="text-[10px] sm:text-xs text-muted-foreground">
+							Comma-separated patterns of directories/files to exclude.
+						</p>
+					</div>
+
+					<div className="space-y-2">
+						<Label className="text-xs sm:text-sm">File Extensions (optional)</Label>
+						<Input
+							value={fileExtensions}
+							onChange={(e) => handleFileExtensionsChange(e.target.value)}
+							placeholder=".md, .txt, .rst"
+							className="border-slate-400/20 focus-visible:border-slate-400/40 font-mono"
+						/>
+						<p className="text-[10px] sm:text-xs text-muted-foreground">
+							Leave empty to index all supported files.
+						</p>
+					</div>
+				</div>
+			</div>
+		</div>
+	);
+};
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/index.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/index.tsx
index a63435260..3dc1891c8 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/index.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/index.tsx
@@ -19,6 +19,7 @@ import { JiraConfig } from "./components/jira-config";
 import { LinkupApiConfig } from "./components/linkup-api-config";
 import { LumaConfig } from "./components/luma-config";
 import { MCPConfig } from "./components/mcp-config";
+import { LocalFolderConfig } from "./components/local-folder-config";
 import { ObsidianConfig } from "./components/obsidian-config";
 import { OneDriveConfig } from "./components/onedrive-config";
 import { SlackConfig } from "./components/slack-config";
@@ -82,6 +83,8 @@ export function getConnectorConfigComponent(
 			return MCPConfig;
 		case "OBSIDIAN_CONNECTOR":
 			return ObsidianConfig;
+		case "LOCAL_FOLDER_CONNECTOR":
+			return LocalFolderConfig;
 		case "COMPOSIO_GOOGLE_DRIVE_CONNECTOR":
 			return ComposioDriveConfig;
 		case "COMPOSIO_GMAIL_CONNECTOR":
diff --git a/surfsense_web/components/assistant-ui/connector-popup/utils/connector-document-mapping.ts b/surfsense_web/components/assistant-ui/connector-popup/utils/connector-document-mapping.ts
index f924bb15f..dd5978002 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/utils/connector-document-mapping.ts
+++ b/surfsense_web/components/assistant-ui/connector-popup/utils/connector-document-mapping.ts
@@ -29,6 +29,7 @@ export const CONNECTOR_TO_DOCUMENT_TYPE: Record<string, string> = {
 	BOOKSTACK_CONNECTOR: "BOOKSTACK_CONNECTOR",
 	CIRCLEBACK_CONNECTOR: "CIRCLEBACK",
 	OBSIDIAN_CONNECTOR: "OBSIDIAN_CONNECTOR",
+	LOCAL_FOLDER_CONNECTOR: "LOCAL_FOLDER_FILE",
 
 	// Special mappings (connector type differs from document type)
 	GOOGLE_DRIVE_CONNECTOR: "GOOGLE_DRIVE_FILE",
diff --git a/surfsense_web/components/documents/version-history.tsx b/surfsense_web/components/documents/version-history.tsx
new file mode 100644
index 000000000..29740e079
--- /dev/null
+++ b/surfsense_web/components/documents/version-history.tsx
@@ -0,0 +1,185 @@
+"use client";
+
+import { useCallback, useEffect, useState } from "react";
+import { Clock, RotateCcw } from "lucide-react";
+import { Button } from "@/components/ui/button";
+import {
+	Sheet,
+	SheetContent,
+	SheetHeader,
+	SheetTitle,
+	SheetTrigger,
+} from "@/components/ui/sheet";
+import { Spinner } from "@/components/ui/spinner";
+import { documentsApiService } from "@/lib/apis/documents-api.service";
+import { toast } from "sonner";
+
+interface DocumentVersionSummary {
+	version_number: number;
+	title: string;
+	content_hash: string;
+	created_at: string | null;
+}
+
+interface VersionHistoryProps {
+	documentId: number;
+	documentType: string;
+}
+
+export function VersionHistoryButton({ documentId, documentType }: VersionHistoryProps) {
+	const showVersionHistory = documentType === "LOCAL_FOLDER_FILE" || documentType === "OBSIDIAN_CONNECTOR";
+	if (!showVersionHistory) return null;
+
+	return (
+		<Sheet>
+			<SheetTrigger asChild>
+				<Button variant="ghost" size="sm" className="gap-1.5 text-xs">
+					<Clock className="h-3.5 w-3.5" />
+					Versions
+				</Button>
+			</SheetTrigger>
+			<SheetContent className="w-[400px] sm:w-[540px]">
+				<SheetHeader>
+					<SheetTitle>Version History</SheetTitle>
+				</SheetHeader>
+				<VersionHistoryPanel documentId={documentId} />
+			</SheetContent>
+		</Sheet>
+	);
+}
+
+function VersionHistoryPanel({ documentId }: { documentId: number }) {
+	const [versions, setVersions] = useState<DocumentVersionSummary[]>([]);
+	const [loading, setLoading] = useState(true);
+	const [selectedVersion, setSelectedVersion] = useState<number | null>(null);
+	const [versionContent, setVersionContent] = useState<string>("");
+	const [contentLoading, setContentLoading] = useState(false);
+	const [restoring, setRestoring] = useState(false);
+
+	const loadVersions = useCallback(async () => {
+		setLoading(true);
+		try {
+			const data = await documentsApiService.listDocumentVersions(documentId);
+			setVersions(data as DocumentVersionSummary[]);
+		} catch {
+			toast.error("Failed to load version history");
+		} finally {
+			setLoading(false);
+		}
+	}, [documentId]);
+
+	useEffect(() => {
+		loadVersions();
+	}, [loadVersions]);
+
+	const handleSelectVersion = async (versionNumber: number) => {
+		setSelectedVersion(versionNumber);
+		// Clear first so a failed fetch cannot show the previous version's text under this heading.
+		setVersionContent("");
+		setContentLoading(true);
+		try {
+			const request = documentsApiService.getDocumentVersion(documentId, versionNumber);
+			const data = (await request) as { source_markdown: string };
+			setVersionContent(data.source_markdown || "");
+		} catch {
+			toast.error("Failed to load version content");
+		} finally {
+			setContentLoading(false);
+		}
+	};
+
+	const handleRestore = async (versionNumber: number) => {
+		setRestoring(true);
+		try {
+			await documentsApiService.restoreDocumentVersion(documentId, versionNumber);
+			toast.success(`Restored version ${versionNumber}`);
+			await loadVersions();
+		} catch {
+			toast.error("Failed to restore version");
+		} finally {
+			setRestoring(false);
+		}
+	};
+
+	if (loading) {
+		return (
+			<div className="flex items-center justify-center py-12">
+				<Spinner size="lg" className="text-muted-foreground" />
+			</div>
+		);
+	}
+
+	if (versions.length === 0) {
+		return (
+			<div className="flex flex-col items-center justify-center py-12 text-muted-foreground">
+				<Clock className="h-8 w-8 mb-2 opacity-50" />
+				<p className="text-sm">No version history available yet.</p>
+				<p className="text-xs mt-1">Versions are created when file content changes.</p>
+			</div>
+		);
+	}
+
+	return (
+		<div className="flex flex-col gap-4 pt-4 h-full">
+			<div className="flex-1 overflow-y-auto space-y-2">
+				{versions.map((v) => (
+					<div
+						key={v.version_number}
+						className={`rounded-lg border p-3 cursor-pointer transition-colors ${
+							selectedVersion === v.version_number
+								? "border-primary bg-primary/5"
+								: "border-border hover:border-primary/50"
+						}`}
+						onClick={() => handleSelectVersion(v.version_number)}
+					>
+						<div className="flex items-center justify-between">
+							<div className="space-y-1">
+								<p className="text-sm font-medium">Version {v.version_number}</p>
+								{v.created_at && (
+									<p className="text-xs text-muted-foreground">
+										{new Date(v.created_at).toLocaleString()}
+									</p>
+								)}
+								{v.title && (
+									<p className="text-xs text-muted-foreground truncate max-w-[200px]">
+										{v.title}
+									</p>
+								)}
+							</div>
+							<Button
+								variant="outline"
+								size="sm"
+								className="shrink-0 gap-1"
+								disabled={restoring}
+								onClick={(e) => {
+									e.stopPropagation();
+									handleRestore(v.version_number);
+								}}
+							>
+								<RotateCcw className="h-3 w-3" />
+								Restore
+							</Button>
+						</div>
+					</div>
+				))}
+			</div>
+
+			{selectedVersion !== null && (
+				<div className="border-t pt-4 max-h-[40vh] overflow-y-auto">
+					<h4 className="text-sm font-medium mb-2">
+						Preview — Version {selectedVersion}
+					</h4>
+					{contentLoading ? (
+						<div className="flex items-center justify-center py-6">
+							<Spinner size="sm" />
+						</div>
+					) : (
+						<pre className="text-xs whitespace-pre-wrap font-mono bg-muted/50 rounded-lg p-3 max-h-[30vh] overflow-y-auto">
+							{versionContent || "(empty)"}
+						</pre>
+					)}
+				</div>
+			)}
+		</div>
+	);
+}
diff --git a/surfsense_web/contracts/types/document.types.ts b/surfsense_web/contracts/types/document.types.ts
index 1a3326bae..c663d6115 100644
--- a/surfsense_web/contracts/types/document.types.ts
+++ b/surfsense_web/contracts/types/document.types.ts
@@ -26,6 +26,7 @@ export const documentTypeEnum = z.enum([
 	"BOOKSTACK_CONNECTOR",
 	"CIRCLEBACK",
 	"OBSIDIAN_CONNECTOR",
+	"LOCAL_FOLDER_FILE",
 	"SURFSENSE_DOCS",
 	"NOTE",
 	"COMPOSIO_GOOGLE_DRIVE_CONNECTOR",
diff --git a/surfsense_web/hooks/use-folder-sync.ts b/surfsense_web/hooks/use-folder-sync.ts
new file mode 100644
index 000000000..a35faf98f
--- /dev/null
+++ b/surfsense_web/hooks/use-folder-sync.ts
@@ -0,0 +1,41 @@
+"use client";
+
+import { useEffect, useRef } from "react";
+import { connectorsApiService } from "@/lib/apis/connectors-api.service";
+
+const DEBOUNCE_MS = 2000;
+
+/** Asks the backend to index files reported by the Electron folder watcher, debounced per connector/file pair. */
+export function useFolderSync() {
+	// One pending timer per "connectorId:fullPath"; a newer event for the same file replaces the older timer.
+	const pendingRef = useRef<Map<string, ReturnType<typeof setTimeout>>>(new Map());
+
+	useEffect(() => {
+		const electron = typeof window !== "undefined" ? window.electronAPI : null;
+		if (!electron?.onFileChanged) return;
+		const timers = pendingRef.current;
+
+		const unsubscribe = electron.onFileChanged((change) => {
+			const timerKey = `${change.connectorId}:${change.fullPath}`;
+			const previous = timers.get(timerKey);
+			if (previous) clearTimeout(previous);
+
+			const handle = setTimeout(async () => {
+				timers.delete(timerKey);
+				try {
+					await connectorsApiService.indexFile(change.connectorId, change.fullPath);
+				} catch (err) {
+					console.error("[FolderSync] Failed to trigger re-index:", err);
+				}
+			}, DEBOUNCE_MS);
+			timers.set(timerKey, handle);
+		});
+
+		// On unmount: stop listening and cancel every timer that has not fired yet.
+		return () => {
+			unsubscribe();
+			timers.forEach((pending) => clearTimeout(pending));
+			timers.clear();
+		};
+	}, []);
+}
diff --git a/surfsense_web/lib/apis/connectors-api.service.ts b/surfsense_web/lib/apis/connectors-api.service.ts
index abd16c7a7..f2722df70 100644
--- a/surfsense_web/lib/apis/connectors-api.service.ts
+++ b/surfsense_web/lib/apis/connectors-api.service.ts
@@ -404,6 +404,18 @@ class ConnectorsApiService {
 			listDiscordChannelsResponse
 		);
 	};
+
+	// =============================================================================
+	// Local Folder Connector Methods
+	// =============================================================================
+
+	/** POSTs `{ file_path }` to the connector's `index-file` endpoint. */
+	indexFile = async (connectorId: number, filePath: string) => {
+		const endpoint = `/api/v1/search-source-connectors/${connectorId}/index-file`;
+		return baseApiService.post(endpoint, undefined, {
+			body: { file_path: filePath },
+		});
+	};
 }
 
 export type { SlackChannel, DiscordChannel };
diff --git a/surfsense_web/lib/apis/documents-api.service.ts b/surfsense_web/lib/apis/documents-api.service.ts
index 14a247032..d4a80f8a0 100644
--- a/surfsense_web/lib/apis/documents-api.service.ts
+++ b/surfsense_web/lib/apis/documents-api.service.ts
@@ -379,6 +379,22 @@ class DocumentsApiService {
 		});
 	};
 
+	/** GETs the `versions` collection of the given document. */
+	listDocumentVersions = async (documentId: number) =>
+		baseApiService.get(`/api/v1/documents/${documentId}/versions`);
+
+	/** GETs a single version of a document, addressed by its version number. */
+	getDocumentVersion = async (documentId: number, versionNumber: number) => {
+		const endpoint = `/api/v1/documents/${documentId}/versions/${versionNumber}`;
+		return baseApiService.get(endpoint);
+	};
+
+	/** POSTs to the `restore` endpoint of the given document version; no request body is passed. */
+	restoreDocumentVersion = async (documentId: number, versionNumber: number) => {
+		const endpoint = `/api/v1/documents/${documentId}/versions/${versionNumber}/restore`;
+		return baseApiService.post(endpoint);
+	};
+
 	/**
 	 * Delete a document
 	 */
diff --git a/surfsense_web/lib/connectors/utils.ts b/surfsense_web/lib/connectors/utils.ts
index 90f7f5d21..6ce78be67 100644
--- a/surfsense_web/lib/connectors/utils.ts
+++ b/surfsense_web/lib/connectors/utils.ts
@@ -30,6 +30,7 @@ export const getConnectorTypeDisplay = (type: string): string => {
 		YOUTUBE_CONNECTOR: "YouTube",
 		CIRCLEBACK_CONNECTOR: "Circleback",
 		OBSIDIAN_CONNECTOR: "Obsidian",
+		LOCAL_FOLDER_CONNECTOR: "Local Folder",
 		DROPBOX_CONNECTOR: "Dropbox",
 		MCP_CONNECTOR: "MCP Server",
 	};
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 9cf1aa596..921449b41 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -1,5 +1,30 @@
 import type { PostHog } from "posthog-js";
 
+interface WatchedFolderConfig { // One watched folder, as passed to / returned by the folder-sync methods of ElectronAPI
+	path: string; // folder being watched
+	name: string;
+	excludePatterns: string[];
+	fileExtensions: string[] | null; // NOTE(review): null/empty appears to mean "no extension filter" — confirm
+	connectorId: number;
+	searchSpaceId: number;
+	active: boolean; // NOTE(review): presumably only active folders get a running watcher — confirm
+}
+
+interface FolderSyncFileChangedEvent { // Payload handed to `onFileChanged` callbacks
+	connectorId: number;
+	searchSpaceId: number;
+	folderPath: string; // root of the watched folder
+	relativePath: string; // file path relative to folderPath
+	fullPath: string; // folderPath joined with relativePath
+	action: "add" | "change" | "unlink"; // "unlink" = the file was removed
+	timestamp: number; // NOTE(review): looks like Date.now() milliseconds — confirm against the emitter
+}
+
+interface FolderSyncWatcherReadyEvent { // Payload handed to `onWatcherReady` callbacks
+	connectorId: number;
+	folderPath: string; // root of the watched folder whose watcher became ready
+}
+
 interface ElectronAPI {
 	versions: {
 		electron: string;
@@ -14,6 +39,16 @@ interface ElectronAPI {
 	setQuickAskMode: (mode: string) => Promise<void>;
 	getQuickAskMode: () => Promise<string>;
 	replaceText: (text: string) => Promise<void>;
+	// Folder sync
+	selectFolder: () => Promise<string | null>;
+	addWatchedFolder: (config: WatchedFolderConfig) => Promise<WatchedFolderConfig[]>;
+	removeWatchedFolder: (folderPath: string) => Promise<WatchedFolderConfig[]>;
+	getWatchedFolders: () => Promise<WatchedFolderConfig[]>;
+	getWatcherStatus: () => Promise<{ path: string; active: boolean; watching: boolean }[]>;
+	onFileChanged: (callback: (data: FolderSyncFileChangedEvent) => void) => () => void;
+	onWatcherReady: (callback: (data: FolderSyncWatcherReadyEvent) => void) => () => void;
+	pauseWatcher: () => Promise<void>;
+	resumeWatcher: () => Promise<void>;
 }
 
 declare global {

From b93da843dc6125434d712ad8881bf248906782d1 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 11:55:29 +0530
Subject: [PATCH 030/202] feat: implement mtime tracking and synchronization
 for folder watcher

---
 .../src/modules/folder-watcher.ts             | 172 +++++++++++++++++-
 1 file changed, 164 insertions(+), 8 deletions(-)

diff --git a/surfsense_desktop/src/modules/folder-watcher.ts b/surfsense_desktop/src/modules/folder-watcher.ts
index bfd2136c9..072ae7b3f 100644
--- a/surfsense_desktop/src/modules/folder-watcher.ts
+++ b/surfsense_desktop/src/modules/folder-watcher.ts
@@ -1,5 +1,5 @@
 import { BrowserWindow, dialog } from 'electron';
-import chokidar from 'chokidar';
+import chokidar, { type FSWatcher } from 'chokidar';
 import * as path from 'path';
 import * as fs from 'fs';
 import { IPC_CHANNELS } from '../ipc/channels';
@@ -16,13 +16,24 @@ export interface WatchedFolderConfig {
 
 interface WatcherEntry {
   config: WatchedFolderConfig;
-  watcher: chokidar.FSWatcher | null;
+  watcher: FSWatcher | null;
 }
 
+type MtimeMap = Record<string, number>;
+
 const STORE_KEY = 'watchedFolders';
+const MTIME_TOLERANCE_S = 1.0;
+
 let store: any = null;
+let mtimeStore: any = null;
 let watchers: Map<string, WatcherEntry> = new Map();
 
+/**
+ * In-memory cache of mtime maps, keyed by folder path.
+ * Persisted to electron-store on mutation.
+ */
+const mtimeMaps: Map<string, MtimeMap> = new Map();
+
 async function getStore() {
   if (!store) {
     const { default: Store } = await import('electron-store');
@@ -36,6 +47,73 @@ async function getStore() {
   return store;
 }
 
+/** Lazily opens `folder-mtime-maps`. Keys are folder paths, so dot-notation is off: "/a.b" stays one flat key. */
+async function getMtimeStore() {
+  if (mtimeStore) return mtimeStore;
+  const { default: Store } = await import('electron-store');
+  const defaults = {} as Record<string, MtimeMap>;
+  mtimeStore = new Store({ name: 'folder-mtime-maps', defaults, accessPropertiesByDotNotation: false });
+  return mtimeStore;
+}
+
+/** Returns the mtime map cached in memory for `folderPath`, or a new empty map when none is cached. */
+function loadMtimeMap(folderPath: string): MtimeMap {
+  return mtimeMaps.get(folderPath) ?? {};
+}
+
+/** Fire-and-forget write of the cached map to the store; a failed write is logged instead of left unhandled. */
+function persistMtimeMap(folderPath: string) {
+  const map = mtimeMaps.get(folderPath) ?? {}; // captured now, before any later cache mutation
+  getMtimeStore().then((s) => s.set(folderPath, map)).catch((e) => console.error('[FolderWatcher] persist failed:', e));
+}
+
+/**
+ * Recursively collects the `mtimeMs` of every file under `config.path`.
+ *
+ * Entries whose name starts with "." or appears in `config.excludePatterns` are skipped
+ * (directories together with their whole subtree). When `config.fileExtensions` is a
+ * non-empty list, only files whose lower-cased extension is in that list are kept.
+ * Returns a map keyed by the path relative to `config.path`; unreadable entries are skipped.
+ */
+function walkFolderMtimes(config: WatchedFolderConfig): MtimeMap {
+  const mtimes: MtimeMap = {};
+  const skippedNames = new Set(config.excludePatterns);
+  const allowedExts = config.fileExtensions ?? []; // empty list = accept every extension
+
+  const visit = (dir: string): void => {
+    let children: fs.Dirent[];
+    try {
+      children = fs.readdirSync(dir, { withFileTypes: true });
+    } catch {
+      return; // unreadable directory: skip the whole subtree
+    }
+
+    for (const child of children) {
+      // Dotfiles/dotdirs and excluded names are never recorded
+      if (child.name.startsWith('.') || skippedNames.has(child.name)) continue;
+      const childPath = path.join(dir, child.name);
+
+      if (child.isDirectory()) {
+        visit(childPath);
+        continue;
+      }
+      if (!child.isFile()) continue;
+
+      const ext = path.extname(child.name).toLowerCase();
+      if (allowedExts.length > 0 && !allowedExts.includes(ext)) continue;
+
+      try {
+        mtimes[path.relative(config.path, childPath)] = fs.statSync(childPath).mtimeMs;
+      } catch {
+        // File may have been removed between readdir and stat
+      }
+    }
+  };
+
+  visit(config.path);
+  return mtimes;
+}
+
 function getMainWindow(): BrowserWindow | null {
   const windows = BrowserWindow.getAllWindows();
   return windows.length > 0 ? windows[0] : null;
@@ -48,11 +126,16 @@ function sendToRenderer(channel: string, data: any) {
   }
 }
 
-function startWatcher(config: WatchedFolderConfig) {
+async function startWatcher(config: WatchedFolderConfig) {
   if (watchers.has(config.path)) {
     return;
   }
 
+  // Load persisted mtime map into memory before starting the watcher
+  const ms = await getMtimeStore();
+  const storedMap: MtimeMap = ms.get(config.path) ?? {};
+  mtimeMaps.set(config.path, { ...storedMap });
+
   const ignored = [
     /(^|[/\\])\../, // dotfiles by default
     ...config.excludePatterns.map((p) => `**/${p}/**`),
@@ -60,7 +143,7 @@ function startWatcher(config: WatchedFolderConfig) {
 
   const watcher = chokidar.watch(config.path, {
     persistent: true,
-    ignoreInitial: false,
+    ignoreInitial: true,
     awaitWriteFinish: {
       stabilityThreshold: 500,
       pollInterval: 100,
@@ -72,6 +155,58 @@ function startWatcher(config: WatchedFolderConfig) {
 
   watcher.on('ready', () => {
     ready = true;
+
+    // Detect offline changes by diffing current filesystem against stored mtime map
+    const currentMap = walkFolderMtimes(config);
+    const storedSnapshot = loadMtimeMap(config.path);
+    const now = Date.now();
+
+    for (const [rel, currentMtime] of Object.entries(currentMap)) {
+      const storedMtime = storedSnapshot[rel];
+      if (storedMtime === undefined) {
+        // New file added while app was closed
+        sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, {
+          connectorId: config.connectorId,
+          searchSpaceId: config.searchSpaceId,
+          folderPath: config.path,
+          relativePath: rel,
+          fullPath: path.join(config.path, rel),
+          action: 'add',
+          timestamp: now,
+        });
+      } else if (Math.abs(currentMtime - storedMtime) >= MTIME_TOLERANCE_S * 1000) {
+        // File modified while app was closed
+        sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, {
+          connectorId: config.connectorId,
+          searchSpaceId: config.searchSpaceId,
+          folderPath: config.path,
+          relativePath: rel,
+          fullPath: path.join(config.path, rel),
+          action: 'change',
+          timestamp: now,
+        });
+      }
+    }
+
+    for (const rel of Object.keys(storedSnapshot)) {
+      if (!(rel in currentMap)) {
+        // File deleted while app was closed
+        sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, {
+          connectorId: config.connectorId,
+          searchSpaceId: config.searchSpaceId,
+          folderPath: config.path,
+          relativePath: rel,
+          fullPath: path.join(config.path, rel),
+          action: 'unlink',
+          timestamp: now,
+        });
+      }
+    }
+
+    // Replace stored map with current filesystem state
+    mtimeMaps.set(config.path, currentMap);
+    persistMtimeMap(config.path);
+
     sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_WATCHER_READY, {
       connectorId: config.connectorId,
       folderPath: config.path,
@@ -91,6 +226,21 @@ function startWatcher(config: WatchedFolderConfig) {
       if (!config.fileExtensions.includes(ext)) return;
     }
 
+    // Keep mtime map in sync with live changes
+    const map = mtimeMaps.get(config.path);
+    if (map) {
+      if (action === 'unlink') {
+        delete map[relativePath];
+      } else {
+        try {
+          map[relativePath] = fs.statSync(filePath).mtimeMs;
+        } catch {
+          // File may have been removed between event and stat
+        }
+      }
+      persistMtimeMap(config.path);
+    }
+
     sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, {
       connectorId: config.connectorId,
       searchSpaceId: config.searchSpaceId,
@@ -110,6 +260,7 @@ function startWatcher(config: WatchedFolderConfig) {
 }
 
 function stopWatcher(folderPath: string) {
+  persistMtimeMap(folderPath);
   const entry = watchers.get(folderPath);
   if (entry?.watcher) {
     entry.watcher.close();
@@ -144,7 +295,7 @@ export async function addWatchedFolder(
   s.set(STORE_KEY, folders);
 
   if (config.active) {
-    startWatcher(config);
+    await startWatcher(config);
   }
 
   return folders;
@@ -160,6 +311,11 @@ export async function removeWatchedFolder(
 
   stopWatcher(folderPath);
 
+  // Clean up persisted mtime map for this folder
+  mtimeMaps.delete(folderPath);
+  const ms = await getMtimeStore();
+  ms.delete(folderPath);
+
   return updated;
 }
 
@@ -190,9 +346,9 @@ export async function pauseWatcher(): Promise<void> {
 }
 
 export async function resumeWatcher(): Promise<void> {
-  for (const [folderPath, entry] of watchers) {
+  for (const [, entry] of watchers) {
     if (!entry.watcher && entry.config.active) {
-      startWatcher(entry.config);
+      await startWatcher(entry.config);
     }
   }
 }
@@ -203,7 +359,7 @@ export async function registerFolderWatcher(): Promise<void> {
 
   for (const config of folders) {
     if (config.active && fs.existsSync(config.path)) {
-      startWatcher(config);
+      await startWatcher(config);
     }
   }
 }

From 543b8b9376eb4fd89698deffdfde0f6d9e69a2e8 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 12:08:18 +0530
Subject: [PATCH 031/202] feat: add real-time folder watcher registration and
 unregistration for Local Folder connector

---
 .../hooks/use-connector-dialog.ts             | 28 +++++++++++++++++++
 1 file changed, 28 insertions(+)

diff --git a/surfsense_web/components/assistant-ui/connector-popup/hooks/use-connector-dialog.ts b/surfsense_web/components/assistant-ui/connector-popup/hooks/use-connector-dialog.ts
index 6543bbd72..2404b8eb5 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/hooks/use-connector-dialog.ts
+++ b/surfsense_web/components/assistant-ui/connector-popup/hooks/use-connector-dialog.ts
@@ -586,6 +586,23 @@ export const useConnectorDialog = () => {
 									},
 								});
 
+								// Register folder watcher in Electron for real-time sync
+								if (
+									currentConnectorType === EnumConnectorName.LOCAL_FOLDER_CONNECTOR &&
+									window.electronAPI?.addWatchedFolder
+								) {
+									const cfg = connector.config || {};
+									await window.electronAPI.addWatchedFolder({
+										path: cfg.folder_path as string,
+										name: cfg.folder_name as string,
+										excludePatterns: (cfg.exclude_patterns as string[]) || [],
+										fileExtensions: (cfg.file_extensions as string[] | null) ?? null,
+										connectorId: connector.id,
+										searchSpaceId: Number(searchSpaceId),
+										active: true,
+									});
+								}
+
 								const successMessage =
 									currentConnectorType === "MCP_CONNECTOR"
 										? `${connector.name} added successfully`
@@ -1190,6 +1207,17 @@ export const useConnectorDialog = () => {
 					id: editingConnector.id,
 				});
 
+				// Unregister folder watcher in Electron when removing a Local Folder connector
+				if (
+					editingConnector.connector_type === EnumConnectorName.LOCAL_FOLDER_CONNECTOR &&
+					window.electronAPI?.removeWatchedFolder &&
+					editingConnector.config?.folder_path
+				) {
+					await window.electronAPI.removeWatchedFolder(
+						editingConnector.config.folder_path as string
+					);
+				}
+
 				// Track connector deleted event
 				trackConnectorDeleted(
 					Number(searchSpaceId),

From 8e58094a861a1517e6587a8e8f55182c3cffed7b Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 12:13:14 +0530
Subject: [PATCH 032/202] refactor: update permission checks in document and
 connector routes to use specific permission values

---
 surfsense_backend/app/routes/documents_routes.py            | 6 +++---
 .../app/routes/search_source_connectors_routes.py           | 2 +-
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/surfsense_backend/app/routes/documents_routes.py b/surfsense_backend/app/routes/documents_routes.py
index 9271d4630..2d999eae3 100644
--- a/surfsense_backend/app/routes/documents_routes.py
+++ b/surfsense_backend/app/routes/documents_routes.py
@@ -1156,7 +1156,7 @@ async def list_document_versions(
     if not document:
         raise HTTPException(status_code=404, detail="Document not found")
 
-    await check_permission(session, user, document.search_space_id, Permission.READ)
+    await check_permission(session, user, document.search_space_id, Permission.DOCUMENTS_READ.value)
 
     versions = (
         await session.execute(
@@ -1191,7 +1191,7 @@ async def get_document_version(
     if not document:
         raise HTTPException(status_code=404, detail="Document not found")
 
-    await check_permission(session, user, document.search_space_id, Permission.READ)
+    await check_permission(session, user, document.search_space_id, Permission.DOCUMENTS_READ.value)
 
     version = (
         await session.execute(
@@ -1229,7 +1229,7 @@ async def restore_document_version(
     if not document:
         raise HTTPException(status_code=404, detail="Document not found")
 
-    await check_permission(session, user, document.search_space_id, Permission.WRITE)
+    await check_permission(session, user, document.search_space_id, Permission.DOCUMENTS_UPDATE.value)
 
     version = (
         await session.execute(
diff --git a/surfsense_backend/app/routes/search_source_connectors_routes.py b/surfsense_backend/app/routes/search_source_connectors_routes.py
index 439d83ac1..5ea88c418 100644
--- a/surfsense_backend/app/routes/search_source_connectors_routes.py
+++ b/surfsense_backend/app/routes/search_source_connectors_routes.py
@@ -1355,7 +1355,7 @@ async def index_single_file(
     if not connector:
         raise HTTPException(status_code=404, detail="Local folder connector not found")
 
-    await check_permission(session, user, connector.search_space_id, Permission.WRITE)
+    await check_permission(session, user, connector.search_space_id, Permission.CONNECTORS_UPDATE.value)
 
     folder_path = connector.config.get("folder_path", "")
 

From ccd0e3b807a1f0a9f27decb3c2be00600baa9ddb Mon Sep 17 00:00:00 2001
From: SohamBhattacharjee2003
 <125297948+SohamBhattacharjee2003@users.noreply.github.com>
Date: Thu, 2 Apr 2026 13:16:55 +0530
Subject: [PATCH 033/202] fix(connector-popup): remove unused currentUserAtom
 import

---
 surfsense_web/components/assistant-ui/connector-popup.tsx | 2 --
 1 file changed, 2 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/connector-popup.tsx b/surfsense_web/components/assistant-ui/connector-popup.tsx
index d1f6dd31f..791775cd3 100644
--- a/surfsense_web/components/assistant-ui/connector-popup.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup.tsx
@@ -11,7 +11,6 @@ import {
 } from "@/atoms/new-llm-config/new-llm-config-query.atoms";
 import { activeSearchSpaceIdAtom } from "@/atoms/search-spaces/search-space-query.atoms";
 import { searchSpaceSettingsDialogAtom } from "@/atoms/settings/settings-dialog.atoms";
-import { currentUserAtom } from "@/atoms/user/user-query.atoms";
 import { Alert, AlertDescription, AlertTitle } from "@/components/ui/alert";
 import { Button } from "@/components/ui/button";
 import { Dialog, DialogContent, DialogTitle } from "@/components/ui/dialog";
@@ -47,7 +46,6 @@ export const ConnectorIndicator = forwardRef<ConnectorIndicatorHandle, Connector
 	(_props, ref) => {
 		const searchSpaceId = useAtomValue(activeSearchSpaceIdAtom);
 		const setSearchSpaceSettingsDialog = useSetAtom(searchSpaceSettingsDialogAtom);
-		useAtomValue(currentUserAtom);
 		const { data: preferences = {}, isFetching: preferencesLoading } =
 			useAtomValue(llmPreferencesAtom);
 		const { data: globalConfigs = [], isFetching: globalConfigsLoading } =

From f1be2652a0543cf3ebda60b653106de4e278675e Mon Sep 17 00:00:00 2001
From: SohamBhattacharjee2003
 <125297948+SohamBhattacharjee2003@users.noreply.github.com>
Date: Thu, 2 Apr 2026 13:31:48 +0530
Subject: [PATCH 034/202] fix(comment-composer): hoist RegExp out of loop to
 satisfy js-hoist-regexp rule

---
 .../comment-composer/comment-composer.tsx          | 14 +++++++++-----
 1 file changed, 9 insertions(+), 5 deletions(-)

diff --git a/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx b/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx
index 3e9b4504f..bee3f2da6 100644
--- a/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx
+++ b/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx
@@ -15,13 +15,17 @@ function convertDisplayToData(displayContent: string, mentions: InsertedMention[
 
 	const sortedMentions = [...mentions].sort((a, b) => b.displayName.length - a.displayName.length);
 
-	for (const mention of sortedMentions) {
-		const displayPattern = new RegExp(
+	const mentionPatterns = sortedMentions.map((mention) => ({
+		pattern: new RegExp(
 			`@${escapeRegExp(mention.displayName)}(?=\\s|$|[.,!?;:])`,
 			"g"
-		);
-		const dataFormat = `@[${mention.id}]`;
-		result = result.replace(displayPattern, dataFormat);
+		),
+		dataFormat: `@[${mention.id}]`,
+	}));
+
+	for (const { pattern, dataFormat } of mentionPatterns) {
+		pattern.lastIndex = 0; // reset global regex state
+		result = result.replace(pattern, dataFormat);
 	}
 
 	return result;

From 0cd2b8164da696daee5c2118782ed0a695185762 Mon Sep 17 00:00:00 2001
From: SohamBhattacharjee2003
 <125297948+SohamBhattacharjee2003@users.noreply.github.com>
Date: Thu, 2 Apr 2026 13:41:51 +0530
Subject: [PATCH 035/202] fix(ui): use scoped radix-ui imports to optimize
 bundle

---
 surfsense_web/components/ui/checkbox.tsx      | 2 +-
 surfsense_web/components/ui/dropdown-menu.tsx | 2 +-
 surfsense_web/components/ui/separator.tsx     | 2 +-
 surfsense_web/components/ui/toggle-group.tsx  | 2 +-
 surfsense_web/components/ui/toggle.tsx        | 2 +-
 surfsense_web/components/ui/tooltip.tsx       | 2 +-
 6 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/surfsense_web/components/ui/checkbox.tsx b/surfsense_web/components/ui/checkbox.tsx
index 0936a383e..586e3e602 100644
--- a/surfsense_web/components/ui/checkbox.tsx
+++ b/surfsense_web/components/ui/checkbox.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { CheckIcon } from "lucide-react";
-import { Checkbox as CheckboxPrimitive } from "radix-ui";
+import * as CheckboxPrimitive from "@radix-ui/react-checkbox";
 import type * as React from "react";
 
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/components/ui/dropdown-menu.tsx b/surfsense_web/components/ui/dropdown-menu.tsx
index 24b99467e..2904b93dd 100644
--- a/surfsense_web/components/ui/dropdown-menu.tsx
+++ b/surfsense_web/components/ui/dropdown-menu.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { CheckIcon, ChevronRightIcon, CircleIcon } from "lucide-react";
-import { DropdownMenu as DropdownMenuPrimitive } from "radix-ui";
+import * as DropdownMenuPrimitive from "@radix-ui/react-dropdown-menu";
 import type * as React from "react";
 
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/components/ui/separator.tsx b/surfsense_web/components/ui/separator.tsx
index 63b8e6a69..d7cf2cd81 100644
--- a/surfsense_web/components/ui/separator.tsx
+++ b/surfsense_web/components/ui/separator.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { Separator as SeparatorPrimitive } from "radix-ui";
+import * as SeparatorPrimitive from "@radix-ui/react-separator";
 import type * as React from "react";
 
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/components/ui/toggle-group.tsx b/surfsense_web/components/ui/toggle-group.tsx
index eb212182a..33aa433b2 100644
--- a/surfsense_web/components/ui/toggle-group.tsx
+++ b/surfsense_web/components/ui/toggle-group.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import type { VariantProps } from "class-variance-authority";
-import { ToggleGroup as ToggleGroupPrimitive } from "radix-ui";
+import * as ToggleGroupPrimitive from "@radix-ui/react-toggle-group";
 import * as React from "react";
 import { toggleVariants } from "@/components/ui/toggle";
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/components/ui/toggle.tsx b/surfsense_web/components/ui/toggle.tsx
index 5841cdc35..f0e68cec9 100644
--- a/surfsense_web/components/ui/toggle.tsx
+++ b/surfsense_web/components/ui/toggle.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { cva, type VariantProps } from "class-variance-authority";
-import { Toggle as TogglePrimitive } from "radix-ui";
+import * as TogglePrimitive from "@radix-ui/react-toggle";
 import type * as React from "react";
 
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/components/ui/tooltip.tsx b/surfsense_web/components/ui/tooltip.tsx
index c19ce6f82..2fc85aae4 100644
--- a/surfsense_web/components/ui/tooltip.tsx
+++ b/surfsense_web/components/ui/tooltip.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { Tooltip as TooltipPrimitive } from "radix-ui";
+import * as TooltipPrimitive from "@radix-ui/react-tooltip";
 import type * as React from "react";
 
 import { cn } from "@/lib/utils";

From f4d197f7022b0ceec560925f38fe6c125a77b0fc Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Thu, 2 Apr 2026 13:18:20 +0200
Subject: [PATCH 036/202] feat: add native module support for desktop
 autocomplete

---
 surfsense_desktop/.npmrc                     |  1 +
 surfsense_desktop/electron-builder.yml       | 13 +++++
 surfsense_desktop/package.json               |  8 +++-
 surfsense_desktop/pnpm-lock.yaml             | 50 ++++++++++++++++++++
 surfsense_desktop/scripts/build-electron.mjs |  2 +-
 5 files changed, 71 insertions(+), 3 deletions(-)
 create mode 100644 surfsense_desktop/.npmrc

diff --git a/surfsense_desktop/.npmrc b/surfsense_desktop/.npmrc
new file mode 100644
index 000000000..d67f37488
--- /dev/null
+++ b/surfsense_desktop/.npmrc
@@ -0,0 +1 @@
+node-linker=hoisted
diff --git a/surfsense_desktop/electron-builder.yml b/surfsense_desktop/electron-builder.yml
index eaca0f19b..74c69d223 100644
--- a/surfsense_desktop/electron-builder.yml
+++ b/surfsense_desktop/electron-builder.yml
@@ -9,6 +9,16 @@ directories:
 files:
   - dist/**/*
   - "!node_modules"
+  - node_modules/uiohook-napi/**/*
+  - "!node_modules/uiohook-napi/build"
+  - "!node_modules/uiohook-napi/src"
+  - "!node_modules/uiohook-napi/libuiohook"
+  - "!node_modules/uiohook-napi/binding.gyp"
+  - node_modules/node-gyp-build/**/*
+  - node_modules/node-mac-permissions/**/*
+  - "!node_modules/node-mac-permissions/build"
+  - "!node_modules/node-mac-permissions/src"
+  - "!node_modules/node-mac-permissions/binding.gyp"
   - "!src"
   - "!scripts"
   - "!release"
@@ -29,6 +39,9 @@ extraResources:
     filter: ["**/*"]
 asarUnpack:
   - "**/*.node"
+  - "node_modules/uiohook-napi/**/*"
+  - "node_modules/node-gyp-build/**/*"
+  - "node_modules/node-mac-permissions/**/*"
 mac:
   icon: assets/icon.icns
   category: public.app-category.productivity
diff --git a/surfsense_desktop/package.json b/surfsense_desktop/package.json
index bd0cc67ab..a2e452b7c 100644
--- a/surfsense_desktop/package.json
+++ b/surfsense_desktop/package.json
@@ -11,12 +11,14 @@
     "dist:mac": "pnpm build && electron-builder --mac --config electron-builder.yml",
     "dist:win": "pnpm build && electron-builder --win --config electron-builder.yml",
     "dist:linux": "pnpm build && electron-builder --linux --config electron-builder.yml",
-    "typecheck": "tsc --noEmit"
+    "typecheck": "tsc --noEmit",
+    "postinstall": "electron-rebuild"
   },
   "author": "MODSetter",
   "license": "MIT",
   "packageManager": "pnpm@10.24.0",
   "devDependencies": {
+    "@electron/rebuild": "^4.0.3",
     "@types/node": "^25.5.0",
     "concurrently": "^9.2.1",
     "dotenv": "^17.3.1",
@@ -28,6 +30,8 @@
   },
   "dependencies": {
     "electron-updater": "^6.8.3",
-    "get-port-please": "^3.2.0"
+    "get-port-please": "^3.2.0",
+    "node-mac-permissions": "^2.5.0",
+    "uiohook-napi": "^1.5.5"
   }
 }
diff --git a/surfsense_desktop/pnpm-lock.yaml b/surfsense_desktop/pnpm-lock.yaml
index ea65be0bb..82bad9456 100644
--- a/surfsense_desktop/pnpm-lock.yaml
+++ b/surfsense_desktop/pnpm-lock.yaml
@@ -14,7 +14,16 @@ importers:
       get-port-please:
         specifier: ^3.2.0
         version: 3.2.0
+      node-mac-permissions:
+        specifier: ^2.5.0
+        version: 2.5.0
+      uiohook-napi:
+        specifier: ^1.5.5
+        version: 1.5.5
     devDependencies:
+      '@electron/rebuild':
+        specifier: ^4.0.3
+        version: 4.0.3
       '@types/node':
         specifier: ^25.5.0
         version: 25.5.0
@@ -343,6 +352,7 @@ packages:
   '@xmldom/xmldom@0.8.11':
     resolution: {integrity: sha512-cQzWCtO6C8TQiYl1ruKNn2U6Ao4o4WBBcbL61yJl84x+j5sOWWFU9X7DpND8XZG3daDppSsigMdfAIl2upQBRw==}
     engines: {node: '>=10.0.0'}
+    deprecated: this version has critical issues, please update to the latest version
 
   abbrev@3.0.1:
     resolution: {integrity: sha512-AO2ac6pjRB3SJmGJo+v5/aK6Omggp6fsLrs6wN9bd35ulu4cCwaAU9+7ZhXjeqHVkaHThLuzH0nZr0YpCDhygg==}
@@ -424,6 +434,9 @@ packages:
   base64-js@1.5.1:
     resolution: {integrity: sha512-AKpaYlHn8t4SVbOHCy+b5+KKgvR4vrsD8vbvrbiQJps7fKDTkjkDry6ji0rUJjC0kzbNePLwzxq8iypo41qeWA==}
 
+  bindings@1.5.0:
+    resolution: {integrity: sha512-p2q/t/mhvuOj/UeLlV6566GD/guowlr0hHxClI0W9m7MWYkL1F0hLo+0Aexs9HSPCtR1SXQ0TD3MMKrXZajbiQ==}
+
   bl@4.1.0:
     resolution: {integrity: sha512-1W07cM9gS6DcLperZfFSj+bWLtaPGSOHWhPiGzXmvVJbRLdG82sH/Kn8EtW1VqWVA54AKf2h5k5BbnIbwF3h6w==}
 
@@ -738,6 +751,9 @@ packages:
       picomatch:
         optional: true
 
+  file-uri-to-path@1.0.0:
+    resolution: {integrity: sha512-0Zt+s3L7Vf1biwWZ29aARiVYLx7iMGnEUl9x33fbB/j3jR81u/O2LbqK+Bm1CDSNDKVtJ/YjwY7TUd5SkeLQLw==}
+
   filelist@1.0.6:
     resolution: {integrity: sha512-5giy2PkLYY1cP39p17Ech+2xlpTRL9HLspOfEgm0L6CwBXBTgsK5ou0JtzYuepxkaQ/tvhCFIJ5uXo0OrM2DxA==}
 
@@ -1103,14 +1119,25 @@ packages:
   node-addon-api@1.7.2:
     resolution: {integrity: sha512-ibPK3iA+vaY1eEjESkQkM0BbCqFOaZMiXRTtdB0u7b4djtY6JnsjvPdUHVMg6xQt3B8fpTTWHI9A+ADjM9frzg==}
 
+  node-addon-api@7.1.1:
+    resolution: {integrity: sha512-5m3bsyrjFWE1xf7nz7YXdN4udnVtXK6/Yfgn5qnahL6bCkf2yKt4k3nuTKAtT4r3IG8JNR2ncsIMdZuAzJjHQQ==}
+
   node-api-version@0.2.1:
     resolution: {integrity: sha512-2xP/IGGMmmSQpI1+O/k72jF/ykvZ89JeuKX3TLJAYPDVLUalrshrLHkeVcCCZqG/eEa635cr8IBYzgnDvM2O8Q==}
 
+  node-gyp-build@4.8.4:
+    resolution: {integrity: sha512-LA4ZjwlnUblHVgq0oBF3Jl/6h/Nvs5fzBLwdEF4nuxnFdsfajde4WfxtJr3CaiH+F6ewcIB/q4jQ4UzPyid+CQ==}
+    hasBin: true
+
   node-gyp@11.5.0:
     resolution: {integrity: sha512-ra7Kvlhxn5V9Slyus0ygMa2h+UqExPqUIkfk7Pc8QTLT956JLSy51uWFwHtIYy0vI8cB4BDhc/S03+880My/LQ==}
     engines: {node: ^18.17.0 || >=20.5.0}
     hasBin: true
 
+  node-mac-permissions@2.5.0:
+    resolution: {integrity: sha512-zR8SVCaN3WqV1xwWd04XVAdzm3UTdjbxciLrZtB0Cc7F2Kd34AJfhPD4hm1HU0YH3oGUZO4X9OBLY5ijSTHsGw==}
+    os: [darwin]
+
   nopt@8.1.0:
     resolution: {integrity: sha512-ieGu42u/Qsa4TFktmaKEwM6MQH0pOWnaB3htzh0JRtx84+Mebc0cbZYN5bC+6WTZ4+77xrL9Pn5m7CV6VIkV7A==}
     engines: {node: ^18.17.0 || >=20.5.0}
@@ -1424,6 +1451,10 @@ packages:
     engines: {node: '>=14.17'}
     hasBin: true
 
+  uiohook-napi@1.5.5:
+    resolution: {integrity: sha512-oSlTdnECw2GBfsJPTbBQBeE4v/EXP0EZmX6BJq5nzH/JgFaBE8JpFwEA/kLhiEP7HxQw28FViWiYgdIZzWuuJQ==}
+    engines: {node: '>= 16'}
+
   undici-types@7.16.0:
     resolution: {integrity: sha512-Zz+aZWSj8LE6zoxD+xrjh4VfkIG8Ya6LvYkZqtUQGJPZjYl53ypCaUwWqo7eI0x66KBGeRo+mlBEkMSeSZ38Nw==}
 
@@ -1923,6 +1954,10 @@ snapshots:
 
   base64-js@1.5.1: {}
 
+  bindings@1.5.0:
+    dependencies:
+      file-uri-to-path: 1.0.0
+
   bl@4.1.0:
     dependencies:
       buffer: 5.7.1
@@ -2348,6 +2383,8 @@ snapshots:
     optionalDependencies:
       picomatch: 4.0.3
 
+  file-uri-to-path@1.0.0: {}
+
   filelist@1.0.6:
     dependencies:
       minimatch: 5.1.9
@@ -2739,10 +2776,14 @@ snapshots:
   node-addon-api@1.7.2:
     optional: true
 
+  node-addon-api@7.1.1: {}
+
   node-api-version@0.2.1:
     dependencies:
       semver: 7.7.4
 
+  node-gyp-build@4.8.4: {}
+
   node-gyp@11.5.0:
     dependencies:
       env-paths: 2.2.1
@@ -2758,6 +2799,11 @@ snapshots:
     transitivePeerDependencies:
       - supports-color
 
+  node-mac-permissions@2.5.0:
+    dependencies:
+      bindings: 1.5.0
+      node-addon-api: 7.1.1
+
   nopt@8.1.0:
     dependencies:
       abbrev: 3.0.1
@@ -3064,6 +3110,10 @@ snapshots:
 
   typescript@5.9.3: {}
 
+  uiohook-napi@1.5.5:
+    dependencies:
+      node-gyp-build: 4.8.4
+
   undici-types@7.16.0: {}
 
   undici-types@7.18.2: {}
diff --git a/surfsense_desktop/scripts/build-electron.mjs b/surfsense_desktop/scripts/build-electron.mjs
index 923830296..83d941dd2 100644
--- a/surfsense_desktop/scripts/build-electron.mjs
+++ b/surfsense_desktop/scripts/build-electron.mjs
@@ -104,7 +104,7 @@ async function buildElectron() {
     bundle: true,
     platform: 'node',
     target: 'node18',
-    external: ['electron'],
+    external: ['electron', 'uiohook-napi', 'node-mac-permissions'],
     sourcemap: true,
     minify: false,
     define: {

From fbd033d0a4ed756a789879b1bba69c08bc71506d Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Thu, 2 Apr 2026 13:19:21 +0200
Subject: [PATCH 037/202] feat: add autocomplete streaming endpoint with KB
 context

---
 surfsense_backend/app/routes/__init__.py      |   2 +
 .../app/routes/autocomplete_routes.py         | 136 ++++++++++++++++++
 2 files changed, 138 insertions(+)
 create mode 100644 surfsense_backend/app/routes/autocomplete_routes.py

diff --git a/surfsense_backend/app/routes/__init__.py b/surfsense_backend/app/routes/__init__.py
index 1937f11cb..a063b5976 100644
--- a/surfsense_backend/app/routes/__init__.py
+++ b/surfsense_backend/app/routes/__init__.py
@@ -3,6 +3,7 @@ from fastapi import APIRouter
 from .airtable_add_connector_route import (
     router as airtable_add_connector_router,
 )
+from .autocomplete_routes import router as autocomplete_router
 from .chat_comments_routes import router as chat_comments_router
 from .circleback_webhook_route import router as circleback_webhook_router
 from .clickup_add_connector_route import router as clickup_add_connector_router
@@ -95,3 +96,4 @@ router.include_router(incentive_tasks_router)  # Incentive tasks for earning fre
 router.include_router(stripe_router)  # Stripe checkout for additional page packs
 router.include_router(youtube_router)  # YouTube playlist resolution
 router.include_router(prompts_router)
+router.include_router(autocomplete_router)  # Lightweight autocomplete with KB context
diff --git a/surfsense_backend/app/routes/autocomplete_routes.py b/surfsense_backend/app/routes/autocomplete_routes.py
new file mode 100644
index 000000000..9a285a723
--- /dev/null
+++ b/surfsense_backend/app/routes/autocomplete_routes.py
@@ -0,0 +1,136 @@
+import logging
+from typing import AsyncGenerator
+
+from fastapi import APIRouter, Depends, Query
+from fastapi.responses import StreamingResponse
+from langchain_core.messages import HumanMessage, SystemMessage
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from app.db import User, get_async_session
+from app.retriever.chunks_hybrid_search import ChucksHybridSearchRetriever
+from app.services.llm_service import get_agent_llm
+from app.services.new_streaming_service import VercelStreamingService
+from app.users import current_active_user
+
+logger = logging.getLogger(__name__)
+
+router = APIRouter(prefix="/autocomplete", tags=["autocomplete"])
+
+AUTOCOMPLETE_SYSTEM_PROMPT = """You are an inline text autocomplete engine. Your job is to complete the user's text naturally.
+
+Rules:
+- Output ONLY the continuation text. Do NOT repeat what the user already typed.
+- Keep completions concise: 1-3 sentences maximum.
+- Match the user's tone, style, and language.
+- If knowledge base context is provided, use it to make the completion factually accurate and personalized.
+- Do NOT add quotes, explanations, or meta-commentary.
+- Do NOT start with a space unless grammatically required.
+- If you cannot produce a useful completion, output nothing."""
+
+KB_CONTEXT_TEMPLATE = """
+Relevant knowledge base context (use this to personalize the completion):
+---
+{kb_context}
+---
+"""
+
+
+async def _stream_autocomplete(
+    text: str,
+    cursor_position: int,
+    search_space_id: int,
+    session: AsyncSession,
+) -> AsyncGenerator[str, None]:
+    """Yield stream frames completing the text before the cursor, with KB snippets as context."""
+    streaming_service = VercelStreamingService()
+
+    try:
+        # Only the text before the cursor is completed; a negative position means the whole text.
+        text_before_cursor = text[:cursor_position] if cursor_position >= 0 else text
+
+        if not text_before_cursor.strip():
+            yield streaming_service.format_message_start()
+            yield streaming_service.format_finish()
+            yield streaming_service.format_done()
+            return
+
+        # Fast KB lookup: vector-only search, top 3 chunks, no planner LLM
+        kb_context = ""
+        try:
+            retriever = ChucksHybridSearchRetriever(session)
+            chunks = await retriever.vector_search(
+                query_text=text_before_cursor[-200:],  # last 200 chars for relevance
+                top_k=3,
+                search_space_id=search_space_id,
+            )
+            kb_snippets = []
+            for chunk in chunks or []:
+                content = getattr(chunk, "content", None) or getattr(chunk, "chunk_text", "")
+                if content:
+                    kb_snippets.append(content[:300])  # cap each snippet at 300 chars
+            if kb_snippets:
+                kb_context = KB_CONTEXT_TEMPLATE.format(kb_context="\n\n".join(kb_snippets))
+        except Exception as e:
+            logger.warning("KB search failed for autocomplete, proceeding without context: %s", e)
+
+        # Get the search space's configured LLM
+        llm = await get_agent_llm(session, search_space_id)
+        if not llm:
+            yield streaming_service.format_message_start()
+            yield streaming_service.format_error("No LLM configured for this search space")
+            yield streaming_service.format_done()
+            return
+
+        messages = [
+            SystemMessage(content=AUTOCOMPLETE_SYSTEM_PROMPT + kb_context),
+            HumanMessage(content=f"Complete this text:\n{text_before_cursor}"),
+        ]
+
+        # Stream the response
+        yield streaming_service.format_message_start()
+        text_id = streaming_service.generate_text_id()
+        yield streaming_service.format_text_start(text_id)
+
+        async for chunk in llm.astream(messages):
+            token = chunk.content if hasattr(chunk, "content") else str(chunk)
+            if isinstance(token, list):
+                # Message content may be a list of blocks; forward only the textual parts.
+                token = "".join(
+                    part if isinstance(part, str) else str(part.get("text", ""))
+                    for part in token
+                    if isinstance(part, (str, dict))
+                )
+            if token:
+                yield streaming_service.format_text_delta(text_id, token)
+
+        yield streaming_service.format_text_end(text_id)
+        yield streaming_service.format_finish()
+        yield streaming_service.format_done()
+
+    except Exception as e:
+        # logger.exception records the traceback along with the message.
+        logger.exception("Autocomplete streaming error: %s", e)
+        yield streaming_service.format_error(str(e))
+        yield streaming_service.format_done()
+
+
+@router.post("/stream")
+async def autocomplete_stream(
+    text: str = Query(..., description="Current text in the input field"),
+    cursor_position: int = Query(-1, description="Cursor position in the text (-1 for end)"),
+    search_space_id: int = Query(..., description="Search space ID for KB context and LLM config"),
+    user: User = Depends(current_active_user),
+    session: AsyncSession = Depends(get_async_session),
+):
+    """Return an event-stream response carrying a completion for the text before the cursor."""
+    # NOTE(review): `user` is resolved but never checked against `search_space_id` here — confirm.
+    effective_cursor = len(text) if cursor_position < 0 else cursor_position
+    response_headers = {
+        **VercelStreamingService.get_response_headers(),
+        "X-Accel-Buffering": "no",
+    }
+    return StreamingResponse(
+        _stream_autocomplete(text, effective_cursor, search_space_id, session),
+        media_type="text/event-stream",
+        headers=response_headers,
+    )

From bcc227a4ddc34fbd6af3fb1115e01af0997bac85 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Thu, 2 Apr 2026 13:19:59 +0200
Subject: [PATCH 038/202] feat: add suggestion tooltip UI and autocomplete API
 types

---
 surfsense_web/app/suggestion/layout.tsx     |  13 ++
 surfsense_web/app/suggestion/page.tsx       | 160 ++++++++++++++++++++
 surfsense_web/app/suggestion/suggestion.css |  96 ++++++++++++
 surfsense_web/types/window.d.ts             |   6 +
 4 files changed, 275 insertions(+)
 create mode 100644 surfsense_web/app/suggestion/layout.tsx
 create mode 100644 surfsense_web/app/suggestion/page.tsx
 create mode 100644 surfsense_web/app/suggestion/suggestion.css

diff --git a/surfsense_web/app/suggestion/layout.tsx b/surfsense_web/app/suggestion/layout.tsx
new file mode 100644
index 000000000..36b7e037b
--- /dev/null
+++ b/surfsense_web/app/suggestion/layout.tsx
@@ -0,0 +1,13 @@
+import "./suggestion.css";
+
+export const metadata = {
+	title: "SurfSense Suggestion",
+};
+
+/** Route layout: renders its children inside the `suggestion-body` wrapper div. */
+export default function SuggestionLayout(props: { children: React.ReactNode }) {
+	const { children } = props;
+	return (
+		<div className="suggestion-body">{children}</div>
+	);
+}
diff --git a/surfsense_web/app/suggestion/page.tsx b/surfsense_web/app/suggestion/page.tsx
new file mode 100644
index 000000000..14dfab3af
--- /dev/null
+++ b/surfsense_web/app/suggestion/page.tsx
@@ -0,0 +1,160 @@
+"use client";
+
+import { useCallback, useEffect, useRef, useState } from "react";
+import { getBearerToken } from "@/lib/auth-utils";
+
+type SSEEvent =
+	| { type: "text-delta"; id: string; delta: string }
+	| { type: "text-start"; id: string }
+	| { type: "text-end"; id: string }
+	| { type: "start"; messageId: string }
+	| { type: "finish" }
+	| { type: "error"; errorText: string };
+
+/** Tooltip page: streams a completion for each autocomplete context pushed by Electron. */
+export default function SuggestionPage() {
+	const [suggestion, setSuggestion] = useState("");
+	const [isLoading, setIsLoading] = useState(true);
+	const [error, setError] = useState<string | null>(null);
+	const abortRef = useRef<AbortController | null>(null);
+
+	const fetchSuggestion = useCallback(
+		async (text: string, cursorPosition: number, searchSpaceId: string) => {
+			// Only one request may be in flight: cancel whatever is still streaming.
+			abortRef.current?.abort();
+			const controller = new AbortController();
+			abortRef.current = controller;
+
+			setIsLoading(true);
+			setSuggestion("");
+			setError(null);
+
+			const token = getBearerToken();
+			if (!token) {
+				setError("Not authenticated");
+				setIsLoading(false);
+				return;
+			}
+
+			const backendUrl =
+				process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL || "http://localhost:8000";
+
+			const params = new URLSearchParams({
+				text,
+				cursor_position: String(cursorPosition),
+				search_space_id: searchSpaceId,
+			});
+
+			try {
+				const response = await fetch(`${backendUrl}/api/v1/autocomplete/stream?${params}`, {
+					method: "POST",
+					headers: {
+						Authorization: `Bearer ${token}`,
+						"Content-Type": "application/json",
+					},
+					signal: controller.signal,
+				});
+
+				if (!response.ok) {
+					setError(`Error: ${response.status}`);
+					return;
+				}
+
+				if (!response.body) {
+					setError("No response body");
+					return;
+				}
+
+				const reader = response.body.getReader();
+				const decoder = new TextDecoder();
+				let buffer = "";
+				// Accumulate locally so the state update stays free of side effects.
+				let accumulated = "";
+
+				while (true) {
+					const { done, value } = await reader.read();
+					if (done) break;
+
+					buffer += decoder.decode(value, { stream: true });
+					const events = buffer.split(/\r?\n\r?\n/);
+					buffer = events.pop() || "";
+
+					for (const event of events) {
+						const lines = event.split(/\r?\n/);
+						for (const line of lines) {
+							if (!line.startsWith("data: ")) continue;
+							const data = line.slice(6).trim();
+							if (!data || data === "[DONE]") continue;
+
+							try {
+								const parsed: SSEEvent = JSON.parse(data);
+								if (parsed.type === "text-delta") {
+									accumulated += parsed.delta;
+									setSuggestion(accumulated);
+									window.electronAPI?.updateSuggestionText?.(accumulated);
+								} else if (parsed.type === "error") {
+									setError(parsed.errorText);
+								}
+							} catch {
+								// Skip payloads that are not valid JSON.
+							}
+						}
+					}
+				}
+			} catch (err) {
+				if (err instanceof DOMException && err.name === "AbortError") return;
+				setError("Failed to get suggestion");
+			} finally {
+				// A superseded request must not hide the loading state of its successor.
+				if (abortRef.current === controller) setIsLoading(false);
+			}
+		},
+		[],
+	);
+
+	useEffect(() => {
+		if (!window.electronAPI?.onAutocompleteContext) return;
+
+		const cleanup = window.electronAPI.onAutocompleteContext((data) => {
+			const searchSpaceId = data.searchSpaceId || "1";
+			fetchSuggestion(data.text, data.cursorPosition, searchSpaceId);
+		});
+		return () => {
+			cleanup();
+			abortRef.current?.abort();
+		};
+	}, [fetchSuggestion]);
+
+	if (error) {
+		return (
+			<div className="suggestion-tooltip suggestion-error">
+				<span className="suggestion-error-text">{error}</span>
+			</div>
+		);
+	}
+
+	if (isLoading && !suggestion) {
+		return (
+			<div className="suggestion-tooltip">
+				<div className="suggestion-loading">
+					<span className="suggestion-dot" />
+					<span className="suggestion-dot" />
+					<span className="suggestion-dot" />
+				</div>
+			</div>
+		);
+	}
+
+	if (!suggestion) return null;
+
+	return (
+		<div className="suggestion-tooltip">
+			<p className="suggestion-text">{suggestion}</p>
+			<div className="suggestion-hint">
+				<span className="suggestion-key">Tab</span> accept
+				<span className="suggestion-separator">·</span>
+				<span className="suggestion-key">Esc</span> dismiss
+			</div>
+		</div>
+	);
+}
diff --git a/surfsense_web/app/suggestion/suggestion.css b/surfsense_web/app/suggestion/suggestion.css
new file mode 100644
index 000000000..e9471e7f8
--- /dev/null
+++ b/surfsense_web/app/suggestion/suggestion.css
@@ -0,0 +1,96 @@
+.suggestion-body {
+  margin: 0;
+  padding: 0;
+  background: transparent;
+  overflow: hidden;
+  font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
+  -webkit-font-smoothing: antialiased;
+  user-select: none;
+  -webkit-app-region: no-drag;
+}
+
+.suggestion-tooltip {
+  background: rgba(30, 30, 30, 0.95);
+  backdrop-filter: blur(12px);
+  -webkit-backdrop-filter: blur(12px);
+  border: 1px solid rgba(255, 255, 255, 0.1);
+  border-radius: 10px;
+  padding: 10px 14px;
+  margin: 4px;
+  max-width: 400px;
+  box-shadow: 0 8px 32px rgba(0, 0, 0, 0.4),
+              0 2px 8px rgba(0, 0, 0, 0.2);
+}
+
+.suggestion-text {
+  color: rgba(255, 255, 255, 0.9);
+  font-size: 13px;
+  line-height: 1.5;
+  margin: 0 0 8px 0;
+  word-wrap: break-word;
+  white-space: pre-wrap;
+}
+
+.suggestion-hint {
+  color: rgba(255, 255, 255, 0.4);
+  font-size: 11px;
+  display: flex;
+  align-items: center;
+  gap: 4px;
+}
+
+.suggestion-key {
+  background: rgba(255, 255, 255, 0.1);
+  border: 1px solid rgba(255, 255, 255, 0.15);
+  border-radius: 3px;
+  padding: 1px 5px;
+  font-size: 10px;
+  font-weight: 500;
+  color: rgba(255, 255, 255, 0.6);
+}
+
+.suggestion-separator {
+  margin: 0 2px;
+}
+
+.suggestion-error {
+  border-color: rgba(255, 80, 80, 0.3);
+}
+
+.suggestion-error-text {
+  color: rgba(255, 120, 120, 0.9);
+  font-size: 12px;
+}
+
+.suggestion-loading {
+  display: flex;
+  gap: 4px;
+  padding: 4px 0;
+}
+
+.suggestion-dot {
+  width: 5px;
+  height: 5px;
+  border-radius: 50%;
+  background: rgba(255, 255, 255, 0.4);
+  animation: suggestion-pulse 1.2s infinite ease-in-out;
+}
+
+.suggestion-dot:nth-child(2) {
+  animation-delay: 0.15s;
+}
+
+.suggestion-dot:nth-child(3) {
+  animation-delay: 0.3s;
+}
+
+@keyframes suggestion-pulse {
+  0%, 80%, 100% {
+    opacity: 0.3;
+    transform: scale(0.8);
+  }
+  40% {
+    opacity: 1;
+    transform: scale(1);
+  }
+}
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 9cf1aa596..a30358527 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -14,6 +14,12 @@ interface ElectronAPI {
 	setQuickAskMode: (mode: string) => Promise<void>;
 	getQuickAskMode: () => Promise<string>;
 	replaceText: (text: string) => Promise<void>;
+	onAutocompleteContext: (callback: (data: { text: string; cursorPosition: number; searchSpaceId?: string }) => void) => () => void;
+	acceptSuggestion: (text: string) => Promise<void>;
+	dismissSuggestion: () => Promise<void>;
+	updateSuggestionText: (text: string) => Promise<void>;
+	setAutocompleteEnabled: (enabled: boolean) => Promise<void>;
+	getAutocompleteEnabled: () => Promise<boolean>;
 }
 
 declare global {

From ec2b7851b6393147b09a9f24273fe84d4314371f Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Thu, 2 Apr 2026 13:26:32 +0200
Subject: [PATCH 039/202] feat: add macOS permission infrastructure for
 autocomplete

---
 surfsense_desktop/src/ipc/channels.ts        |  5 ++
 surfsense_desktop/src/ipc/handlers.ts        | 22 +++++++++
 surfsense_desktop/src/modules/permissions.ts | 50 ++++++++++++++++++++
 surfsense_desktop/src/preload.ts             |  5 ++
 surfsense_web/types/window.d.ts              |  9 ++++
 5 files changed, 91 insertions(+)
 create mode 100644 surfsense_desktop/src/modules/permissions.ts

diff --git a/surfsense_desktop/src/ipc/channels.ts b/surfsense_desktop/src/ipc/channels.ts
index 25ec1bc0e..a5209dcf3 100644
--- a/surfsense_desktop/src/ipc/channels.ts
+++ b/surfsense_desktop/src/ipc/channels.ts
@@ -6,4 +6,9 @@ export const IPC_CHANNELS = {
   SET_QUICK_ASK_MODE: 'set-quick-ask-mode',
   GET_QUICK_ASK_MODE: 'get-quick-ask-mode',
   REPLACE_TEXT: 'replace-text',
+  // Permissions
+  GET_PERMISSIONS_STATUS: 'get-permissions-status',
+  REQUEST_ACCESSIBILITY: 'request-accessibility',
+  REQUEST_INPUT_MONITORING: 'request-input-monitoring',
+  RESTART_APP: 'restart-app',
 } as const;
diff --git a/surfsense_desktop/src/ipc/handlers.ts b/surfsense_desktop/src/ipc/handlers.ts
index 18e343719..fc31329f1 100644
--- a/surfsense_desktop/src/ipc/handlers.ts
+++ b/surfsense_desktop/src/ipc/handlers.ts
@@ -1,5 +1,11 @@
 import { app, ipcMain, shell } from 'electron';
 import { IPC_CHANNELS } from './channels';
+import {
+  getPermissionsStatus,
+  requestAccessibility,
+  requestInputMonitoring,
+  restartApp,
+} from '../modules/permissions';
 
 export function registerIpcHandlers(): void {
   ipcMain.on(IPC_CHANNELS.OPEN_EXTERNAL, (_event, url: string) => {
@@ -16,4 +22,20 @@ export function registerIpcHandlers(): void {
   ipcMain.handle(IPC_CHANNELS.GET_APP_VERSION, () => {
     return app.getVersion();
   });
+
+  ipcMain.handle(IPC_CHANNELS.GET_PERMISSIONS_STATUS, () => {
+    return getPermissionsStatus();
+  });
+
+  ipcMain.handle(IPC_CHANNELS.REQUEST_ACCESSIBILITY, () => {
+    requestAccessibility();
+  });
+
+  ipcMain.handle(IPC_CHANNELS.REQUEST_INPUT_MONITORING, () => {
+    requestInputMonitoring();
+  });
+
+  ipcMain.handle(IPC_CHANNELS.RESTART_APP, () => {
+    restartApp();
+  });
 }
diff --git a/surfsense_desktop/src/modules/permissions.ts b/surfsense_desktop/src/modules/permissions.ts
new file mode 100644
index 000000000..9a6159c9a
--- /dev/null
+++ b/surfsense_desktop/src/modules/permissions.ts
@@ -0,0 +1,50 @@
+import { app } from 'electron';
+
+type PermissionStatus = 'authorized' | 'denied' | 'not determined' | 'restricted' | 'limited';
+
+export interface PermissionsStatus {
+  accessibility: PermissionStatus;
+  inputMonitoring: PermissionStatus;
+}
+
+/** True when the current process is running on macOS (`darwin`). */
+const isMac = (): boolean =>
+  process.platform === 'darwin';
+
+/** Resolves `node-mac-permissions` at call time rather than at module load. */
+const getNodeMacPermissions = () =>
+  require('node-mac-permissions');
+
+/** Reads both permission states; platforms other than macOS report 'authorized'. */
+export function getPermissionsStatus(): PermissionsStatus {
+  if (isMac()) {
+    const macPermissions = getNodeMacPermissions();
+    const accessibility = macPermissions.getAuthStatus('accessibility');
+    const inputMonitoring = macPermissions.getAuthStatus('input-monitoring');
+    return { accessibility, inputMonitoring };
+  }
+
+  return { accessibility: 'authorized', inputMonitoring: 'authorized' };
+}
+
+export function allPermissionsGranted(): boolean {
+  const { accessibility, inputMonitoring } = getPermissionsStatus(); // both must be 'authorized'
+  return [accessibility, inputMonitoring].every((state) => state === 'authorized');
+}
+
+/** Calls `askForAccessibilityAccess()` on macOS; does nothing on other platforms. */
+export function requestAccessibility(): void {
+  if (!isMac()) return;
+  getNodeMacPermissions().askForAccessibilityAccess();
+}
+
+/** Resolves with `askForInputMonitoringAccess('listen')` on macOS, 'authorized' elsewhere. */
+export async function requestInputMonitoring(): Promise<string> {
+  if (!isMac()) return 'authorized';
+  return getNodeMacPermissions().askForInputMonitoringAccess('listen');
+}
+
+export function restartApp(): void {
+  app.relaunch(); // request a relaunch first...
+  app.exit(0); // ...then end this process with exit code 0
+}
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 264ec25b3..069276489 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -21,4 +21,9 @@ contextBridge.exposeInMainWorld('electronAPI', {
   setQuickAskMode: (mode: string) => ipcRenderer.invoke(IPC_CHANNELS.SET_QUICK_ASK_MODE, mode),
   getQuickAskMode: () => ipcRenderer.invoke(IPC_CHANNELS.GET_QUICK_ASK_MODE),
   replaceText: (text: string) => ipcRenderer.invoke(IPC_CHANNELS.REPLACE_TEXT, text),
+  // Permissions
+  getPermissionsStatus: () => ipcRenderer.invoke(IPC_CHANNELS.GET_PERMISSIONS_STATUS),
+  requestAccessibility: () => ipcRenderer.invoke(IPC_CHANNELS.REQUEST_ACCESSIBILITY),
+  requestInputMonitoring: () => ipcRenderer.invoke(IPC_CHANNELS.REQUEST_INPUT_MONITORING),
+  restartApp: () => ipcRenderer.invoke(IPC_CHANNELS.RESTART_APP),
 });
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index a30358527..8cf331b42 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -14,6 +14,15 @@ interface ElectronAPI {
 	setQuickAskMode: (mode: string) => Promise<void>;
 	getQuickAskMode: () => Promise<string>;
 	replaceText: (text: string) => Promise<void>;
+	// Permissions
+	getPermissionsStatus: () => Promise<{
+		accessibility: 'authorized' | 'denied' | 'not determined' | 'restricted' | 'limited';
+		inputMonitoring: 'authorized' | 'denied' | 'not determined' | 'restricted' | 'limited';
+	}>;
+	requestAccessibility: () => Promise<void>;
+	requestInputMonitoring: () => Promise<void>;
+	restartApp: () => Promise<void>;
+	// Autocomplete
 	onAutocompleteContext: (callback: (data: { text: string; cursorPosition: number; searchSpaceId?: string }) => void) => () => void;
 	acceptSuggestion: (text: string) => Promise<void>;
 	dismissSuggestion: () => Promise<void>;

From eaabad38fcd2bfc8d6bef87f8ea60ea4d8192d78 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Thu, 2 Apr 2026 13:44:57 +0200
Subject: [PATCH 040/202] feat: add permission onboarding page and startup
 routing for macOS

---
 surfsense_desktop/src/ipc/handlers.ts         |   4 +-
 surfsense_desktop/src/main.ts                 |  15 +-
 surfsense_desktop/src/modules/window.ts       |   4 +-
 .../app/desktop/permissions/page.tsx          | 212 ++++++++++++++++++
 .../app/{ => desktop}/suggestion/layout.tsx   |   0
 .../app/{ => desktop}/suggestion/page.tsx     |   0
 .../{ => desktop}/suggestion/suggestion.css   |   0
 7 files changed, 228 insertions(+), 7 deletions(-)
 create mode 100644 surfsense_web/app/desktop/permissions/page.tsx
 rename surfsense_web/app/{ => desktop}/suggestion/layout.tsx (100%)
 rename surfsense_web/app/{ => desktop}/suggestion/page.tsx (100%)
 rename surfsense_web/app/{ => desktop}/suggestion/suggestion.css (100%)

diff --git a/surfsense_desktop/src/ipc/handlers.ts b/surfsense_desktop/src/ipc/handlers.ts
index fc31329f1..a6d82be4b 100644
--- a/surfsense_desktop/src/ipc/handlers.ts
+++ b/surfsense_desktop/src/ipc/handlers.ts
@@ -31,8 +31,8 @@ export function registerIpcHandlers(): void {
     requestAccessibility();
   });
 
-  ipcMain.handle(IPC_CHANNELS.REQUEST_INPUT_MONITORING, () => {
-    requestInputMonitoring();
+  ipcMain.handle(IPC_CHANNELS.REQUEST_INPUT_MONITORING, async () => {
+    return await requestInputMonitoring();
   });
 
   ipcMain.handle(IPC_CHANNELS.RESTART_APP, () => {
diff --git a/surfsense_desktop/src/main.ts b/surfsense_desktop/src/main.ts
index 3ab41073b..bc164758b 100644
--- a/surfsense_desktop/src/main.ts
+++ b/surfsense_desktop/src/main.ts
@@ -7,6 +7,7 @@ import { setupAutoUpdater } from './modules/auto-updater';
 import { setupMenu } from './modules/menu';
 import { registerQuickAsk, unregisterQuickAsk } from './modules/quick-ask';
 import { registerIpcHandlers } from './ipc/handlers';
+import { allPermissionsGranted } from './modules/permissions';
 
 registerGlobalErrorHandlers();
 
@@ -16,7 +17,13 @@ if (!setupDeepLinks()) {
 
 registerIpcHandlers();
 
-// App lifecycle
+// Picks the first route to load: permission onboarding on macOS until everything is granted.
+function getInitialPath(): string {
+  const needsOnboarding =
+    process.platform === 'darwin' && !allPermissionsGranted();
+  return needsOnboarding ? '/desktop/permissions' : '/dashboard';
+}
+
 app.whenReady().then(async () => {
   setupMenu();
   try {
@@ -26,7 +33,9 @@ app.whenReady().then(async () => {
     setTimeout(() => app.quit(), 0);
     return;
   }
-  createMainWindow();
+
+  const initialPath = getInitialPath();
+  createMainWindow(initialPath);
   registerQuickAsk();
   setupAutoUpdater();
 
@@ -34,7 +43,7 @@ app.whenReady().then(async () => {
 
   app.on('activate', () => {
     if (BrowserWindow.getAllWindows().length === 0) {
-      createMainWindow();
+      createMainWindow(getInitialPath());
     }
   });
 });
diff --git a/surfsense_desktop/src/modules/window.ts b/surfsense_desktop/src/modules/window.ts
index 245814cad..7a77773d8 100644
--- a/surfsense_desktop/src/modules/window.ts
+++ b/surfsense_desktop/src/modules/window.ts
@@ -12,7 +12,7 @@ export function getMainWindow(): BrowserWindow | null {
   return mainWindow;
 }
 
-export function createMainWindow(): BrowserWindow {
+export function createMainWindow(initialPath = '/dashboard'): BrowserWindow {
   mainWindow = new BrowserWindow({
     width: 1280,
     height: 800,
@@ -33,7 +33,7 @@ export function createMainWindow(): BrowserWindow {
     mainWindow?.show();
   });
 
-  mainWindow.loadURL(`http://localhost:${getServerPort()}/dashboard`);
+  mainWindow.loadURL(`http://localhost:${getServerPort()}${initialPath}`);
 
   mainWindow.webContents.setWindowOpenHandler(({ url }) => {
     if (url.startsWith('http://localhost')) {
diff --git a/surfsense_web/app/desktop/permissions/page.tsx b/surfsense_web/app/desktop/permissions/page.tsx
new file mode 100644
index 000000000..2bcdc42df
--- /dev/null
+++ b/surfsense_web/app/desktop/permissions/page.tsx
@@ -0,0 +1,212 @@
+"use client";
+
+import { useEffect, useState } from "react";
+import { useRouter } from "next/navigation";
+import { Logo } from "@/components/Logo";
+import { Button } from "@/components/ui/button";
+import { Spinner } from "@/components/ui/spinner";
+
+type PermissionStatus = "authorized" | "denied" | "not determined" | "restricted" | "limited";
+
+interface PermissionsStatus {
+	accessibility: PermissionStatus;
+	inputMonitoring: PermissionStatus;
+}
+
+const STEPS = [
+	{
+		id: "input-monitoring",
+		title: "Input Monitoring",
+		description: "Helps you write faster by enriching your text with suggestions from your knowledge base.",
+		action: "requestInputMonitoring",
+		field: "inputMonitoring" as const,
+	},
+	{
+		id: "accessibility",
+		title: "Accessibility",
+		description: "Lets you accept suggestions seamlessly, right where you're typing.",
+		action: "requestAccessibility",
+		field: "accessibility" as const,
+	},
+];
+
+/** Dot-and-label badge: "Granted" for authorized, "Denied" for denied, otherwise "Pending". */
+function StatusBadge({ status }: { status: PermissionStatus }) {
+	// Defaults cover every status other than "authorized" and "denied".
+	let label = "Pending";
+	let textClass = "text-muted-foreground";
+	let dotClass = "bg-muted-foreground/40";
+
+	if (status === "authorized") {
+		label = "Granted";
+		textClass = "text-green-700 dark:text-green-400";
+		dotClass = "bg-green-500";
+	} else if (status === "denied") {
+		label = "Denied";
+		textClass = "text-amber-700 dark:text-amber-400";
+		dotClass = "bg-amber-500";
+	}
+
+	return (
+		<span className={`inline-flex items-center gap-1.5 text-xs font-medium ${textClass}`}>
+			<span className={`h-2 w-2 rounded-full ${dotClass}`} />
+			{label}
+		</span>
+	);
+}
+
+export default function DesktopPermissionsPage() {
+	const router = useRouter();
+	const [permissions, setPermissions] = useState<PermissionsStatus | null>(null);
+	const [isElectron, setIsElectron] = useState(false);
+
+	useEffect(() => {
+		if (!window.electronAPI) return;
+		setIsElectron(true);
+
+		let interval: ReturnType<typeof setInterval> | null = null;
+
+		const isResolved = (s: string) => s === "authorized" || s === "restricted";
+
+		const poll = async () => {
+			const status = await window.electronAPI!.getPermissionsStatus();
+			setPermissions(status);
+
+			if (isResolved(status.accessibility) && isResolved(status.inputMonitoring)) {
+				if (interval) clearInterval(interval);
+			}
+		};
+
+		poll();
+		interval = setInterval(poll, 2000);
+		return () => { if (interval) clearInterval(interval); };
+	}, []);
+
+	if (!isElectron) {
+		return (
+			<div className="h-screen flex items-center justify-center bg-background">
+				<p className="text-muted-foreground">This page is only available in the desktop app.</p>
+			</div>
+		);
+	}
+
+	if (!permissions) {
+		return (
+			<div className="h-screen flex items-center justify-center bg-background">
+				<Spinner size="lg" />
+			</div>
+		);
+	}
+
+	const allGranted = permissions.accessibility === "authorized" && permissions.inputMonitoring === "authorized";
+
+	const handleRequest = async (action: string) => {
+		if (action === "requestInputMonitoring") {
+			await window.electronAPI!.requestInputMonitoring();
+		} else if (action === "requestAccessibility") {
+			await window.electronAPI!.requestAccessibility();
+		}
+	};
+
+	const handleContinue = () => {
+		if (allGranted) {
+			window.electronAPI!.restartApp();
+		}
+	};
+
+	const handleSkip = () => {
+		router.push("/dashboard");
+	};
+
+	return (
+		<div className="h-screen flex flex-col items-center p-4 bg-background dark:bg-neutral-900 select-none overflow-hidden">
+			<div className="w-full max-w-lg flex flex-col min-h-0 h-full gap-6 py-8">
+				{/* Header */}
+				<div className="text-center space-y-3 shrink-0">
+					<Logo className="w-12 h-12 mx-auto" />
+					<div className="space-y-1">
+						<h1 className="text-2xl font-semibold tracking-tight">System Permissions</h1>
+						<p className="text-sm text-muted-foreground">
+							SurfSense needs two macOS permissions to provide system-wide autocomplete.
+						</p>
+					</div>
+				</div>
+
+				{/* Steps */}
+				<div className="rounded-xl border bg-background dark:bg-neutral-900 flex-1 min-h-0 overflow-y-auto px-6 py-6 space-y-6">
+					{STEPS.map((step, index) => {
+						const status = permissions[step.field];
+						const isGranted = status === "authorized";
+
+						return (
+							<div
+								key={step.id}
+								className={`rounded-lg border p-4 transition-colors ${
+									isGranted
+										? "border-green-200 bg-green-50/50 dark:border-green-900 dark:bg-green-950/20"
+										: "border-border"
+								}`}
+							>
+								<div className="flex items-start justify-between gap-3">
+									<div className="flex items-start gap-3">
+										<span className="flex h-7 w-7 shrink-0 items-center justify-center rounded-full bg-primary/10 text-sm font-medium text-primary">
+											{isGranted ? "✓" : index + 1}
+										</span>
+										<div className="space-y-1">
+											<h3 className="text-sm font-medium">{step.title}</h3>
+											<p className="text-xs text-muted-foreground">{step.description}</p>
+										</div>
+									</div>
+									<StatusBadge status={status} />
+								</div>
+								{!isGranted && (
+									<div className="mt-3 pl-10 space-y-2">
+										<Button
+											size="sm"
+											variant="outline"
+											onClick={() => handleRequest(step.action)}
+											className="text-xs"
+										>
+											Open System Settings
+										</Button>
+										{status === "denied" && (
+											<p className="text-xs text-amber-700 dark:text-amber-400">
+												Toggle SurfSense on in System Settings to continue.
+											</p>
+										)}
+									</div>
+								)}
+							</div>
+						);
+					})}
+				</div>
+
+				{/* Footer */}
+				<div className="text-center space-y-3 shrink-0">
+					{allGranted ? (
+						<>
+							<Button onClick={handleContinue} className="text-sm h-9 min-w-[180px]">
+								Restart &amp; Get Started
+							</Button>
+							<p className="text-xs text-muted-foreground">
+								A restart is needed for permissions to take effect.
+							</p>
+						</>
+					) : (
+						<>
+							<Button disabled className="text-sm h-9 min-w-[180px]">
+								Grant permissions to continue
+							</Button>
+							<button
+								onClick={handleSkip}
+								className="block mx-auto text-xs text-muted-foreground hover:text-foreground transition-colors"
+							>
+								Skip for now
+							</button>
+						</>
+					)}
+				</div>
+			</div>
+		</div>
+	);
+}
diff --git a/surfsense_web/app/suggestion/layout.tsx b/surfsense_web/app/desktop/suggestion/layout.tsx
similarity index 100%
rename from surfsense_web/app/suggestion/layout.tsx
rename to surfsense_web/app/desktop/suggestion/layout.tsx
diff --git a/surfsense_web/app/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
similarity index 100%
rename from surfsense_web/app/suggestion/page.tsx
rename to surfsense_web/app/desktop/suggestion/page.tsx
diff --git a/surfsense_web/app/suggestion/suggestion.css b/surfsense_web/app/desktop/suggestion/suggestion.css
similarity index 100%
rename from surfsense_web/app/suggestion/suggestion.css
rename to surfsense_web/app/desktop/suggestion/suggestion.css

From b2706b00a1bf793e8d1aa63235a0c53d5cc6766c Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Thu, 2 Apr 2026 14:29:12 +0200
Subject: [PATCH 041/202] feat: add autocomplete module with keystroke
 monitoring and IPC wiring

---
 surfsense_desktop/src/ipc/channels.ts         |   7 +
 surfsense_desktop/src/main.ts                 |   3 +
 surfsense_desktop/src/modules/autocomplete.ts | 267 ++++++++++++++++++
 surfsense_desktop/src/modules/platform.ts     |  40 +++
 surfsense_desktop/src/preload.ts              |  13 +
 5 files changed, 330 insertions(+)
 create mode 100644 surfsense_desktop/src/modules/autocomplete.ts

diff --git a/surfsense_desktop/src/ipc/channels.ts b/surfsense_desktop/src/ipc/channels.ts
index a5209dcf3..2965f516f 100644
--- a/surfsense_desktop/src/ipc/channels.ts
+++ b/surfsense_desktop/src/ipc/channels.ts
@@ -11,4 +11,11 @@ export const IPC_CHANNELS = {
   REQUEST_ACCESSIBILITY: 'request-accessibility',
   REQUEST_INPUT_MONITORING: 'request-input-monitoring',
   RESTART_APP: 'restart-app',
+  // Autocomplete
+  AUTOCOMPLETE_CONTEXT: 'autocomplete-context',
+  ACCEPT_SUGGESTION: 'accept-suggestion',
+  DISMISS_SUGGESTION: 'dismiss-suggestion',
+  UPDATE_SUGGESTION_TEXT: 'update-suggestion-text',
+  SET_AUTOCOMPLETE_ENABLED: 'set-autocomplete-enabled',
+  GET_AUTOCOMPLETE_ENABLED: 'get-autocomplete-enabled',
 } as const;
diff --git a/surfsense_desktop/src/main.ts b/surfsense_desktop/src/main.ts
index bc164758b..9623be82e 100644
--- a/surfsense_desktop/src/main.ts
+++ b/surfsense_desktop/src/main.ts
@@ -6,6 +6,7 @@ import { setupDeepLinks, handlePendingDeepLink } from './modules/deep-links';
 import { setupAutoUpdater } from './modules/auto-updater';
 import { setupMenu } from './modules/menu';
 import { registerQuickAsk, unregisterQuickAsk } from './modules/quick-ask';
+import { registerAutocomplete, unregisterAutocomplete } from './modules/autocomplete';
 import { registerIpcHandlers } from './ipc/handlers';
 import { allPermissionsGranted } from './modules/permissions';
 
@@ -37,6 +38,7 @@ app.whenReady().then(async () => {
   const initialPath = getInitialPath();
   createMainWindow(initialPath);
   registerQuickAsk();
+  registerAutocomplete();
   setupAutoUpdater();
 
   handlePendingDeepLink();
@@ -56,4 +58,5 @@ app.on('window-all-closed', () => {
 
 app.on('will-quit', () => {
   unregisterQuickAsk();
+  unregisterAutocomplete();
 });
diff --git a/surfsense_desktop/src/modules/autocomplete.ts b/surfsense_desktop/src/modules/autocomplete.ts
new file mode 100644
index 000000000..2b877723f
--- /dev/null
+++ b/surfsense_desktop/src/modules/autocomplete.ts
@@ -0,0 +1,267 @@
+import { BrowserWindow, clipboard, ipcMain, screen, shell } from 'electron';
+import path from 'path';
+import { IPC_CHANNELS } from '../ipc/channels';
+import { allPermissionsGranted } from './permissions';
+import { getFieldContent, getFrontmostApp, hasAccessibilityPermission, simulatePaste } from './platform';
+import { getServerPort } from './server';
+import { getMainWindow } from './window';
+
+const DEBOUNCE_MS = 600; // delay after the last typing keystroke before a suggestion is requested
+const TOOLTIP_WIDTH = 420; // size of the suggestion window
+const TOOLTIP_HEIGHT = 140;
+
+let uIOhook: any = null; // hook object exported by uiohook-napi; assigned by loadUiohook()
+let UiohookKey: any = {}; // keycode table exported by uiohook-napi
+let IGNORED_KEYCODES: Set<number> = new Set(); // keycodes that never schedule an autocomplete
+
+let suggestionWindow: BrowserWindow | null = null; // tooltip window currently open, if any
+let debounceTimer: ReturnType<typeof setTimeout> | null = null; // pending triggerAutocomplete() timer
+let hookStarted = false; // set to true after uIOhook.start() succeeds
+let autocompleteEnabled = true; // on/off switch, changed over SET_AUTOCOMPLETE_ENABLED
+let savedClipboard = ''; // clipboard text captured when a suggestion is requested
+let sourceApp = ''; // frontmost app name captured when a suggestion is requested
+let pendingSuggestionText = ''; // latest text received over UPDATE_SUGGESTION_TEXT
+
+// Lazily requires the native `uiohook-napi` module and caches its exports in module
+// state. Returns true when the hook is available, false (after logging) when the
+// module cannot be loaded.
+function loadUiohook(): boolean {
+  if (uIOhook) return true;
+
+  // Non-character keys: modifiers, locks, function keys, editing and navigation keys.
+  const ignoredKeyNames = [
+    'Shift', 'ShiftRight', 'Ctrl', 'CtrlRight',
+    'Alt', 'AltRight', 'Meta', 'MetaRight',
+    'CapsLock', 'NumLock', 'ScrollLock',
+    'F1', 'F2', 'F3', 'F4', 'F5', 'F6',
+    'F7', 'F8', 'F9', 'F10', 'F11', 'F12',
+    'PrintScreen', 'Insert', 'Delete', 'Home', 'End', 'PageUp', 'PageDown',
+    'ArrowUp', 'ArrowDown', 'ArrowLeft', 'ArrowRight',
+  ];
+
+  try {
+    const mod = require('uiohook-napi');
+    uIOhook = mod.uIOhook;
+    UiohookKey = mod.UiohookKey;
+    IGNORED_KEYCODES = new Set(ignoredKeyNames.map((name) => UiohookKey[name]));
+    console.log('[autocomplete] uiohook-napi loaded');
+    return true;
+  } catch (err) {
+    console.error('[autocomplete] Failed to load uiohook-napi:', err);
+    return false;
+  }
+}
+
+// Closes the tooltip (if open) and forgets its text so a later Tab cannot paste a stale suggestion.
+function destroySuggestion(): void {
+  if (suggestionWindow && !suggestionWindow.isDestroyed()) suggestionWindow.close();
+  suggestionWindow = null;
+  pendingSuggestionText = '';
+}
+
+// Clamps the top-left corner of a w-by-h rectangle to the work area of the display nearest
+// (x, y); a rectangle larger than the work area is pinned to the work area's origin.
+function clampToScreen(x: number, y: number, w: number, h: number): { x: number; y: number } {
+  const area = screen.getDisplayNearestPoint({ x, y }).workArea;
+  const clampedX = Math.max(area.x, Math.min(x, area.x + area.width - w));
+  const clampedY = Math.max(area.y, Math.min(y, area.y + area.height - h));
+  return { x: clampedX, y: clampedY };
+}
+
+// Opens a fresh, non-focusable tooltip window 20px below (x, y), clamped to the display,
+// replacing any previous tooltip. The window is shown once its page is ready.
+function createSuggestionWindow(x: number, y: number): BrowserWindow {
+  destroySuggestion();
+  const pos = clampToScreen(x, y + 20, TOOLTIP_WIDTH, TOOLTIP_HEIGHT);
+  const win = new BrowserWindow({
+    width: TOOLTIP_WIDTH,
+    height: TOOLTIP_HEIGHT,
+    x: pos.x,
+    y: pos.y,
+    frame: false,
+    transparent: true,
+    focusable: false,
+    alwaysOnTop: true,
+    skipTaskbar: true,
+    resizable: false,
+    hasShadow: true,
+    type: 'panel',
+    webPreferences: {
+      preload: path.join(__dirname, 'preload.js'),
+      contextIsolation: true,
+      nodeIntegration: false,
+      sandbox: true,
+    },
+    show: false,
+  });
+  suggestionWindow = win;
+
+  win.loadURL(`http://localhost:${getServerPort()}/desktop/suggestion?t=${Date.now()}`);
+  win.once('ready-to-show', () => win.showInactive());
+
+  // Match the host exactly: a bare prefix test would also accept "http://localhost.evil.com".
+  win.webContents.setWindowOpenHandler(({ url }) => {
+    if (/^http:\/\/localhost(:\d+)?([/?#]|$)/.test(url)) {
+      return { action: 'allow' };
+    }
+    shell.openExternal(url);
+    return { action: 'deny' };
+  });
+
+  // If this window has already been replaced by a newer tooltip, its late 'closed'
+  // event must not clear the reference to the newer one.
+  win.on('closed', () => {
+    if (suggestionWindow === win) suggestionWindow = null;
+  });
+  return win;
+}
+
+// Cancels the pending debounced autocomplete trigger, if one is scheduled.
+function clearDebounce(): void {
+  if (!debounceTimer) return;
+  clearTimeout(debounceTimer);
+  debounceTimer = null;
+}
+
+// True when the frontmost application's name is one of the names treated as SurfSense itself.
+function isSurfSenseWindow(): boolean {
+  return ['Electron', 'SurfSense', 'surfsense-desktop'].includes(getFrontmostApp());
+}
+
+// Global keydown handler: Tab accepts the visible suggestion, Escape dismisses it, and any
+// other typing key hides the tooltip and restarts the debounce before the next request.
+function onKeyDown(event: { keycode: number; ctrlKey?: boolean; metaKey?: boolean; altKey?: boolean }): void {
+  if (!autocompleteEnabled) return;
+
+  const hasModifier = Boolean(event.ctrlKey || event.metaKey || event.altKey);
+  const tooltipOpen = suggestionWindow !== null && !suggestionWindow.isDestroyed();
+
+  // Only a bare Tab accepts: Cmd+Tab / Alt+Tab are app-switch shortcuts and must not paste.
+  if (event.keycode === UiohookKey.Tab && tooltipOpen && !hasModifier) {
+    if (pendingSuggestionText) {
+      void acceptAndInject(pendingSuggestionText);
+    }
+    return;
+  }
+
+  if (event.keycode === UiohookKey.Escape) {
+    if (tooltipOpen) {
+      destroySuggestion();
+      pendingSuggestionText = '';
+    }
+    clearDebounce();
+    return;
+  }
+
+  if (IGNORED_KEYCODES.has(event.keycode) || hasModifier) return;
+  if (isSurfSenseWindow()) return;
+
+  if (tooltipOpen) destroySuggestion();
+  clearDebounce();
+  debounceTimer = setTimeout(triggerAutocomplete, DEBOUNCE_MS);
+}
+
+// Runs when typing pauses: reads the focused field and, if it holds at least five
+// characters after trimming, opens the tooltip at the mouse pointer and passes the page
+// the text, caret position and search space to complete against.
+async function triggerAutocomplete(): Promise<void> {
+  if (!hasAccessibilityPermission()) return;
+  if (isSurfSenseWindow()) return;
+
+  const fieldContent = getFieldContent();
+  // Nothing readable, or too little text to complete.
+  if (!fieldContent || fieldContent.text.trim().length < 5) return;
+
+  // Remember where the text came from; acceptAndInject() refuses to paste without it.
+  sourceApp = getFrontmostApp();
+  savedClipboard = clipboard.readText();
+
+  // Use the search space open in the main window's dashboard URL; fall back to "1".
+  const mainWin = getMainWindow();
+  const mainUrl = mainWin && !mainWin.isDestroyed() ? mainWin.webContents.getURL() : '';
+  const searchSpaceId = mainUrl.match(/\/dashboard\/(\d+)/)?.[1] ?? '1';
+
+  const cursor = screen.getCursorScreenPoint();
+  const win = createSuggestionWindow(cursor.x, cursor.y);
+
+  // Deliver the context to the window created for THIS request. Going through the
+  // shared `suggestionWindow` could hand stale text to a newer tooltip that replaced it.
+  win.webContents.once('did-finish-load', () => {
+    if (win.isDestroyed()) return;
+    win.webContents.send(IPC_CHANNELS.AUTOCOMPLETE_CONTEXT, {
+      text: fieldContent.text,
+      cursorPosition: fieldContent.cursorPosition,
+      searchSpaceId,
+    });
+  });
+}
+
+// Pastes `text` via the clipboard and simulatePaste(), then restores the clipboard text.
+async function acceptAndInject(text: string): Promise<void> {
+  if (!sourceApp || !hasAccessibilityPermission()) return;
+  // Snapshot at accept time so text copied while the tooltip was showing is not lost.
+  const previousClipboard = clipboard.readText();
+  clipboard.writeText(text);
+  destroySuggestion();
+  pendingSuggestionText = '';
+  try {
+    await new Promise((r) => setTimeout(r, 50));
+    simulatePaste();
+    await new Promise((r) => setTimeout(r, 100));
+  } catch (err) {
+    console.error('[autocomplete] Failed to paste suggestion:', err);
+  }
+  clipboard.writeText(previousClipboard);
+}
+
+// Wires the IPC channels for accepting, dismissing and updating a suggestion, and for
+// reading or changing the autocomplete on/off switch.
+function registerIpcHandlers(): void {
+  ipcMain.handle(IPC_CHANNELS.ACCEPT_SUGGESTION, (_event, text: string) => acceptAndInject(text));
+  ipcMain.handle(IPC_CHANNELS.DISMISS_SUGGESTION, () => {
+    destroySuggestion();
+    pendingSuggestionText = '';
+  });
+  ipcMain.handle(IPC_CHANNELS.UPDATE_SUGGESTION_TEXT, (_event, text: string) => {
+    pendingSuggestionText = text;
+  });
+  ipcMain.handle(IPC_CHANNELS.SET_AUTOCOMPLETE_ENABLED, (_event, enabled: boolean) => {
+    autocompleteEnabled = enabled;
+    if (enabled) return;
+    // Turning the feature off also cancels anything already in flight.
+    clearDebounce();
+    destroySuggestion();
+  });
+  ipcMain.handle(IPC_CHANNELS.GET_AUTOCOMPLETE_ENABLED, () => autocompleteEnabled);
+}
+
+// Always registers the IPC handlers; the global key hook is only started when every
+// required permission is granted and uiohook-napi loads. `hookStarted` is set only
+// after start() succeeds.
+export function registerAutocomplete(): void {
+  registerIpcHandlers();
+
+  if (!allPermissionsGranted()) {
+    console.log('[autocomplete] Permissions not granted — hook not started');
+  } else if (!loadUiohook()) {
+    console.error('[autocomplete] Cannot start: uiohook-napi failed to load');
+  } else {
+    // Attach the listener before starting the hook.
+    uIOhook.on('keydown', onKeyDown);
+    try {
+      uIOhook.start();
+      hookStarted = true;
+      console.log('[autocomplete] uIOhook started');
+    } catch (startError) {
+      console.error('[autocomplete] uIOhook.start() failed:', startError);
+    }
+  }
+}
+
+// Tears down autocomplete: pending timer, tooltip, keydown listener and (if running) the hook.
+export function unregisterAutocomplete(): void {
+  clearDebounce();
+  destroySuggestion();
+  uIOhook?.off('keydown', onKeyDown);
+  if (hookStarted) try { uIOhook.stop(); } catch { /* already stopped */ } finally { hookStarted = false; }
+}
diff --git a/surfsense_desktop/src/modules/platform.ts b/surfsense_desktop/src/modules/platform.ts
index 37e126799..262866d07 100644
--- a/surfsense_desktop/src/modules/platform.ts
+++ b/surfsense_desktop/src/modules/platform.ts
@@ -53,3 +53,43 @@ export function checkAccessibilityPermission(): boolean {
   if (process.platform !== 'darwin') return true;
   return systemPreferences.isTrustedAccessibilityClient(true);
 }
+
+// Accessibility trust check with the prompt argument set to false; always true off macOS.
+export function hasAccessibilityPermission(): boolean {
+  return process.platform !== 'darwin' || systemPreferences.isTrustedAccessibilityClient(false);
+}
+
+export interface FieldContent {
+  text: string; // AXValue of the focused UI element
+  cursorPosition: number; // location parsed from AXSelectedTextRange, else text.length
+}
+
+// Reads the focused UI element's text (AXValue) and caret location (AXSelectedTextRange)
+// through System Events; macOS only. Returns null when the value cannot be read.
+export function getFieldContent(): FieldContent | null {
+  if (process.platform !== 'darwin') return null;
+  try {
+    // osascript terminates its output with one newline: drop only that. Trimming all
+    // whitespace would shift the caret offset and lose spaces the user actually typed.
+    const text = execSync(
+      'osascript -e \'tell application "System Events" to get value of attribute "AXValue" of focused UI element of first application process whose frontmost is true\'',
+      { timeout: 500 }
+    ).toString().replace(/\r?\n$/, '');
+
+    let cursorPosition = text.length;
+    try {
+      const rangeStr = execSync(
+        'osascript -e \'tell application "System Events" to get value of attribute "AXSelectedTextRange" of focused UI element of first application process whose frontmost is true\'',
+        { timeout: 500 }
+      ).toString().trim();
+      const locationMatch = rangeStr.match(/location[:\s]*(\d+)/i);
+      // Clamp so an out-of-range location can never point past the end of the text.
+      if (locationMatch) cursorPosition = Math.min(parseInt(locationMatch[1], 10), text.length);
+    } catch {
+      // Fall back to end of text
+    }
+    return { text, cursorPosition };
+  } catch {
+    return null;
+  }
+}
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 069276489..956afcc46 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -26,4 +26,17 @@ contextBridge.exposeInMainWorld('electronAPI', {
   requestAccessibility: () => ipcRenderer.invoke(IPC_CHANNELS.REQUEST_ACCESSIBILITY),
   requestInputMonitoring: () => ipcRenderer.invoke(IPC_CHANNELS.REQUEST_INPUT_MONITORING),
   restartApp: () => ipcRenderer.invoke(IPC_CHANNELS.RESTART_APP),
+  // Autocomplete
+  onAutocompleteContext: (callback: (data: { text: string; cursorPosition: number; searchSpaceId?: string }) => void) => {
+    const listener = (_event: unknown, data: { text: string; cursorPosition: number; searchSpaceId?: string }) => callback(data);
+    ipcRenderer.on(IPC_CHANNELS.AUTOCOMPLETE_CONTEXT, listener);
+    return () => {
+      ipcRenderer.removeListener(IPC_CHANNELS.AUTOCOMPLETE_CONTEXT, listener);
+    };
+  },
+  acceptSuggestion: (text: string) => ipcRenderer.invoke(IPC_CHANNELS.ACCEPT_SUGGESTION, text),
+  dismissSuggestion: () => ipcRenderer.invoke(IPC_CHANNELS.DISMISS_SUGGESTION),
+  updateSuggestionText: (text: string) => ipcRenderer.invoke(IPC_CHANNELS.UPDATE_SUGGESTION_TEXT, text),
+  setAutocompleteEnabled: (enabled: boolean) => ipcRenderer.invoke(IPC_CHANNELS.SET_AUTOCOMPLETE_ENABLED, enabled),
+  getAutocompleteEnabled: () => ipcRenderer.invoke(IPC_CHANNELS.GET_AUTOCOMPLETE_ENABLED),
 });

From 6899134a20605b619e372564666a25eba5bb76fa Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Thu, 2 Apr 2026 14:37:26 +0200
Subject: [PATCH 042/202] feat: add autocomplete toggle in desktop settings

---
 .../components/DesktopContent.tsx             | 79 +++++++++++++++++++
 .../settings/user-settings-dialog.tsx         |  7 +-
 2 files changed, 85 insertions(+), 1 deletion(-)
 create mode 100644 surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx

diff --git a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
new file mode 100644
index 000000000..1522e153f
--- /dev/null
+++ b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
@@ -0,0 +1,79 @@
+"use client";
+
+import { useEffect, useState } from "react";
+import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
+import { Label } from "@/components/ui/label";
+import { Switch } from "@/components/ui/switch";
+import { Spinner } from "@/components/ui/spinner";
+
+/** Desktop-only settings pane: toggles system-wide autocomplete via the Electron bridge. */
+export function DesktopContent() {
+	const [isElectron, setIsElectron] = useState(false);
+	const [loading, setLoading] = useState(true);
+	const [enabled, setEnabled] = useState(true);
+
+	useEffect(() => {
+		if (!window.electronAPI) {
+			setLoading(false);
+			return;
+		}
+		setIsElectron(true);
+
+		// Always clear the spinner, even when the IPC call rejects; otherwise a failed
+		// read would leave this pane loading forever.
+		window.electronAPI
+			.getAutocompleteEnabled()
+			.then(setEnabled, (err) => console.error("Failed to load autocomplete setting:", err))
+			.finally(() => setLoading(false));
+	}, []);
+
+	if (!isElectron) {
+		return (
+			<div className="flex flex-col items-center justify-center py-12 text-center">
+				<p className="text-sm text-muted-foreground">
+					Desktop settings are only available in the SurfSense desktop app.
+				</p>
+			</div>
+		);
+	}
+
+	if (loading) {
+		return (
+			<div className="flex items-center justify-center py-12">
+				<Spinner size="md" className="text-muted-foreground" />
+			</div>
+		);
+	}
+
+	const handleToggle = (checked: boolean) => {
+		// Optimistic update; flip the switch back if the main process rejects the change.
+		setEnabled(checked);
+		window.electronAPI?.setAutocompleteEnabled(checked).catch(() => setEnabled(!checked));
+	};
+
+	return (
+		<div className="space-y-4 md:space-y-6">
+			<Card>
+				<CardHeader className="px-3 md:px-6 pt-3 md:pt-6 pb-2 md:pb-3">
+					<CardTitle className="text-base md:text-lg">Autocomplete</CardTitle>
+					<CardDescription className="text-xs md:text-sm">
+						Get inline writing suggestions powered by your knowledge base as you type in any app.
+					</CardDescription>
+				</CardHeader>
+				<CardContent className="px-3 md:px-6 pb-3 md:pb-6">
+					<div className="flex items-center justify-between rounded-lg border p-4">
+						<div className="space-y-0.5">
+							<Label htmlFor="autocomplete-toggle" className="text-sm font-medium cursor-pointer">
+								Enable autocomplete
+							</Label>
+							<p className="text-xs text-muted-foreground">
+								Show suggestions while typing in other applications.
+							</p>
+						</div>
+						<Switch id="autocomplete-toggle" checked={enabled} onCheckedChange={handleToggle} />
+					</div>
+				</CardContent>
+			</Card>
+		</div>
+	);
+}
diff --git a/surfsense_web/components/settings/user-settings-dialog.tsx b/surfsense_web/components/settings/user-settings-dialog.tsx
index 389ebc5fd..b74ff973b 100644
--- a/surfsense_web/components/settings/user-settings-dialog.tsx
+++ b/surfsense_web/components/settings/user-settings-dialog.tsx
@@ -1,13 +1,14 @@
 "use client";
 
 import { useAtom } from "jotai";
-import { Globe, KeyRound, Receipt, Sparkles, User } from "lucide-react";
+import { Globe, KeyRound, Monitor, Receipt, Sparkles, User } from "lucide-react";
 import { useTranslations } from "next-intl";
 import { ApiKeyContent } from "@/app/dashboard/[search_space_id]/user-settings/components/ApiKeyContent";
 import { CommunityPromptsContent } from "@/app/dashboard/[search_space_id]/user-settings/components/CommunityPromptsContent";
 import { ProfileContent } from "@/app/dashboard/[search_space_id]/user-settings/components/ProfileContent";
 import { PromptsContent } from "@/app/dashboard/[search_space_id]/user-settings/components/PromptsContent";
 import { PurchaseHistoryContent } from "@/app/dashboard/[search_space_id]/user-settings/components/PurchaseHistoryContent";
+import { DesktopContent } from "@/app/dashboard/[search_space_id]/user-settings/components/DesktopContent";
 import { userSettingsDialogAtom } from "@/atoms/settings/settings-dialog.atoms";
 import { SettingsDialog } from "@/components/settings/settings-dialog";
 
@@ -37,6 +38,9 @@ export function UserSettingsDialog() {
 			label: "Purchase History",
 			icon: <Receipt className="h-4 w-4" />,
 		},
+		...(typeof window !== "undefined" && window.electronAPI
+			? [{ value: "desktop", label: "Desktop", icon: <Monitor className="h-4 w-4" /> }]
+			: []),
 	];
 
 	return (
@@ -54,6 +58,7 @@ export function UserSettingsDialog() {
 				{state.initialTab === "prompts" && <PromptsContent />}
 				{state.initialTab === "community-prompts" && <CommunityPromptsContent />}
 				{state.initialTab === "purchases" && <PurchaseHistoryContent />}
+				{state.initialTab === "desktop" && <DesktopContent />}
 			</div>
 		</SettingsDialog>
 	);

From 40ade4889e23b18ed43eaaa39a0489483fa5bbdc Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 21:01:31 +0530
Subject: [PATCH 043/202] feat: add LOCAL_FOLDER_FILE document type and update
 document_versions table management

---
 ...d_local_folder_connector_and_versioning.py | 33 +++++++------------
 1 file changed, 12 insertions(+), 21 deletions(-)

diff --git a/surfsense_backend/alembic/versions/117_add_local_folder_connector_and_versioning.py b/surfsense_backend/alembic/versions/117_add_local_folder_connector_and_versioning.py
index e97a4787c..a9da3beb4 100644
--- a/surfsense_backend/alembic/versions/117_add_local_folder_connector_and_versioning.py
+++ b/surfsense_backend/alembic/versions/117_add_local_folder_connector_and_versioning.py
@@ -1,4 +1,4 @@
-"""Add local folder connector enums and document_versions table
+"""Add LOCAL_FOLDER_FILE document type and document_versions table
 
 Revision ID: 117
 Revises: 116
@@ -21,23 +21,6 @@ PUBLICATION_NAME = "zero_publication"
 def upgrade() -> None:
     conn = op.get_bind()
 
-    # Add LOCAL_FOLDER_CONNECTOR to searchsourceconnectortype enum
-    op.execute(
-        """
-    DO $$
-    BEGIN
-        IF NOT EXISTS (
-            SELECT 1 FROM pg_type t
-            JOIN pg_enum e ON t.oid = e.enumtypid
-            WHERE t.typname = 'searchsourceconnectortype' AND e.enumlabel = 'LOCAL_FOLDER_CONNECTOR'
-        ) THEN
-            ALTER TYPE searchsourceconnectortype ADD VALUE 'LOCAL_FOLDER_CONNECTOR';
-        END IF;
-    END
-    $$;
-    """
-    )
-
     # Add LOCAL_FOLDER_FILE to documenttype enum
     op.execute(
         """
@@ -126,9 +109,17 @@ def downgrade() -> None:
         {"name": PUBLICATION_NAME},
     ).fetchone()
     if pub_exists:
-        op.execute(
-            f"ALTER PUBLICATION {PUBLICATION_NAME} DROP TABLE IF EXISTS document_versions"
-        )
+        already_in_pub = conn.execute(
+            sa.text(
+                "SELECT 1 FROM pg_publication_tables "
+                "WHERE pubname = :name AND tablename = 'document_versions'"
+            ),
+            {"name": PUBLICATION_NAME},
+        ).fetchone()
+        if already_in_pub:
+            op.execute(
+                f"ALTER PUBLICATION {PUBLICATION_NAME} DROP TABLE document_versions"
+            )
 
     op.execute("DROP INDEX IF EXISTS ix_document_versions_created_at")
     op.execute("DROP INDEX IF EXISTS ix_document_versions_document_id")

From 1ef0d913e7471c7df6b03b94647064bae76abb39 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 22:19:55 +0530
Subject: [PATCH 044/202] refactor: remove Local Folder connector components
 and related configurations from the UI

---
 .../(manage)/components/DocumentsFilters.tsx  |  43 ++-
 .../components/local-folder-connect-form.tsx  | 272 ------------------
 .../connect-forms/connector-benefits.ts       |   8 -
 .../connector-popup/connect-forms/index.tsx   |   3 -
 .../components/local-folder-config.tsx        | 163 -----------
 .../connector-configs/index.tsx               |   3 -
 .../views/connector-connect-view.tsx          |   1 -
 .../views/connector-edit-view.tsx             |   7 +-
 .../views/indexing-configuration-view.tsx     |   7 +-
 9 files changed, 35 insertions(+), 472 deletions(-)
 delete mode 100644 surfsense_web/components/assistant-ui/connector-popup/connect-forms/components/local-folder-connect-form.tsx
 delete mode 100644 surfsense_web/components/assistant-ui/connector-popup/connector-configs/components/local-folder-config.tsx

diff --git a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
index b85af13b7..fcd3a39da 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { FolderPlus, ListFilter, Search, Upload, X } from "lucide-react";
+import { Eye, FolderPlus, ListFilter, Search, Upload, X } from "lucide-react";
 import { useTranslations } from "next-intl";
 import React, { useCallback, useMemo, useRef, useState } from "react";
 import { useDocumentUploadDialog } from "@/components/assistant-ui/document-upload-popup";
@@ -19,6 +19,7 @@ export function DocumentsFilters({
 	onToggleType,
 	activeTypes,
 	onCreateFolder,
+	onWatchFolder,
 }: {
 	typeCounts: Partial<Record<DocumentTypeEnum, number>>;
 	onSearch: (v: string) => void;
@@ -26,6 +27,7 @@ export function DocumentsFilters({
 	onToggleType: (type: DocumentTypeEnum, checked: boolean) => void;
 	activeTypes: DocumentTypeEnum[];
 	onCreateFolder?: () => void;
+	onWatchFolder?: () => void;
 }) {
 	const t = useTranslations("documents");
 	const id = React.useId();
@@ -214,17 +216,34 @@ export function DocumentsFilters({
 					</Tooltip>
 				)}
 
-				{/* Upload Button */}
-				<Button
-					data-joyride="upload-button"
-					onClick={openUploadDialog}
-					variant="outline"
-					size="sm"
-					className="h-9 shrink-0 gap-1.5 bg-white text-gray-700 border-white hover:bg-gray-50 dark:bg-white dark:text-gray-800 dark:hover:bg-gray-100"
-				>
-					<Upload size={14} />
-					<span>Upload</span>
-				</Button>
+			{/* Watch Folder Button (desktop only) */}
+			{onWatchFolder && (
+				<Tooltip>
+					<TooltipTrigger asChild>
+						<Button
+							variant="outline"
+							size="icon"
+							className="h-9 w-9 shrink-0 border-dashed border-sidebar-border text-sidebar-foreground/60 hover:text-sidebar-foreground hover:border-sidebar-border bg-sidebar"
+							onClick={onWatchFolder}
+						>
+							<Eye size={14} />
+						</Button>
+					</TooltipTrigger>
+					<TooltipContent>Watch folder</TooltipContent>
+				</Tooltip>
+			)}
+
+			{/* Upload Button */}
+			<Button
+				data-joyride="upload-button"
+				onClick={openUploadDialog}
+				variant="outline"
+				size="sm"
+				className="h-9 shrink-0 gap-1.5 bg-white text-gray-700 border-white hover:bg-gray-50 dark:bg-white dark:text-gray-800 dark:hover:bg-gray-100"
+			>
+				<Upload size={14} />
+				<span>Upload</span>
+			</Button>
 			</div>
 		</div>
 	);
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connect-forms/components/local-folder-connect-form.tsx b/surfsense_web/components/assistant-ui/connector-popup/connect-forms/components/local-folder-connect-form.tsx
deleted file mode 100644
index 2e893c1c0..000000000
--- a/surfsense_web/components/assistant-ui/connector-popup/connect-forms/components/local-folder-connect-form.tsx
+++ /dev/null
@@ -1,272 +0,0 @@
-"use client";
-
-import { zodResolver } from "@hookform/resolvers/zod";
-import { FolderSync, Info } from "lucide-react";
-import type { FC } from "react";
-import { useRef } from "react";
-import { useForm } from "react-hook-form";
-import * as z from "zod";
-import { Alert, AlertDescription, AlertTitle } from "@/components/ui/alert";
-import { Button } from "@/components/ui/button";
-import {
-	Form,
-	FormControl,
-	FormDescription,
-	FormField,
-	FormItem,
-	FormLabel,
-	FormMessage,
-} from "@/components/ui/form";
-import { Input } from "@/components/ui/input";
-import { EnumConnectorName } from "@/contracts/enums/connector";
-import { getConnectorBenefits } from "../connector-benefits";
-import type { ConnectFormProps } from "../index";
-
-const localFolderFormSchema = z.object({
-	name: z.string().min(3, {
-		message: "Connector name must be at least 3 characters.",
-	}),
-	folder_path: z.string().min(1, {
-		message: "Folder path is required.",
-	}),
-	folder_name: z.string().min(1, {
-		message: "Folder name is required.",
-	}),
-	exclude_patterns: z.string().optional(),
-	file_extensions: z.string().optional(),
-});
-
-type LocalFolderFormValues = z.infer<typeof localFolderFormSchema>;
-
-export const LocalFolderConnectForm: FC<ConnectFormProps> = ({ onSubmit, isSubmitting }) => {
-	const isSubmittingRef = useRef(false);
-	const isElectron = typeof window !== "undefined" && !!window.electronAPI;
-
-	const form = useForm<LocalFolderFormValues>({
-		resolver: zodResolver(localFolderFormSchema),
-		defaultValues: {
-			name: "Local Folder",
-			folder_path: "",
-			folder_name: "",
-			exclude_patterns: "node_modules,.git,.DS_Store",
-			file_extensions: "",
-		},
-	});
-
-	const handleBrowse = async () => {
-		if (!isElectron) return;
-		const selected = await window.electronAPI!.selectFolder();
-		if (selected) {
-			form.setValue("folder_path", selected);
-			const folderName = selected.split(/[\\/]/).pop() || "folder";
-			if (!form.getValues("folder_name")) {
-				form.setValue("folder_name", folderName);
-			}
-			if (form.getValues("name") === "Local Folder") {
-				form.setValue("name", folderName);
-			}
-		}
-	};
-
-	const handleSubmit = async (values: LocalFolderFormValues) => {
-		if (isSubmittingRef.current || isSubmitting) return;
-		isSubmittingRef.current = true;
-
-		try {
-			const excludePatterns = values.exclude_patterns
-				? values.exclude_patterns
-						.split(",")
-						.map((p) => p.trim())
-						.filter(Boolean)
-				: [];
-
-			const fileExtensions = values.file_extensions
-				? values.file_extensions
-						.split(",")
-						.map((e) => {
-							const ext = e.trim();
-							return ext.startsWith(".") ? ext : `.${ext}`;
-						})
-						.filter(Boolean)
-				: null;
-
-			await onSubmit({
-				name: values.name,
-				connector_type: EnumConnectorName.LOCAL_FOLDER_CONNECTOR,
-				config: {
-					folder_path: values.folder_path,
-					folder_name: values.folder_name,
-					exclude_patterns: excludePatterns,
-					file_extensions: fileExtensions,
-				},
-				is_indexable: true,
-				is_active: true,
-				last_indexed_at: null,
-				periodic_indexing_enabled: false,
-				indexing_frequency_minutes: null,
-				next_scheduled_at: null,
-			});
-		} finally {
-			isSubmittingRef.current = false;
-		}
-	};
-
-	return (
-		<div className="space-y-6 pb-6">
-			<Alert className="bg-blue-500/10 dark:bg-blue-500/10 border-blue-500/30 p-2 sm:p-3">
-				<Info className="size-4 shrink-0 text-blue-500" />
-				<AlertTitle className="text-xs sm:text-sm">Desktop App Required</AlertTitle>
-				<AlertDescription className="text-[10px] sm:text-xs">
-					Real-time file watching is powered by the SurfSense desktop app. Files are
-					automatically synced whenever changes are detected.
-				</AlertDescription>
-			</Alert>
-
-			<div className="rounded-xl border border-border bg-slate-400/5 dark:bg-white/5 p-3 sm:p-6 space-y-3 sm:space-y-4">
-				<Form {...form}>
-					<form
-						id="local-folder-connect-form"
-						onSubmit={form.handleSubmit(handleSubmit)}
-						className="space-y-4 sm:space-y-6"
-					>
-						<FormField
-							control={form.control}
-							name="name"
-							render={({ field }) => (
-								<FormItem>
-									<FormLabel className="text-xs sm:text-sm">Connector Name</FormLabel>
-									<FormControl>
-										<Input
-											placeholder="My Documents"
-											className="h-8 sm:h-10 px-2 sm:px-3 text-xs sm:text-sm border-slate-400/20 focus-visible:border-slate-400/40"
-											disabled={isSubmitting}
-											{...field}
-										/>
-									</FormControl>
-									<FormMessage />
-								</FormItem>
-							)}
-						/>
-
-						<FormField
-							control={form.control}
-							name="folder_path"
-							render={({ field }) => (
-								<FormItem>
-									<FormLabel className="text-xs sm:text-sm">Folder Path</FormLabel>
-									<div className="flex gap-2">
-										<FormControl>
-											<Input
-												placeholder="/path/to/your/folder"
-												className="h-8 sm:h-10 px-2 sm:px-3 text-xs sm:text-sm border-slate-400/20 focus-visible:border-slate-400/40 font-mono flex-1"
-												disabled={isSubmitting}
-												{...field}
-											/>
-										</FormControl>
-										{isElectron && (
-											<Button
-												type="button"
-												variant="outline"
-												size="sm"
-												onClick={handleBrowse}
-												disabled={isSubmitting}
-												className="shrink-0"
-											>
-												<FolderSync className="h-4 w-4 mr-1" />
-												Browse
-											</Button>
-										)}
-									</div>
-									<FormDescription className="text-[10px] sm:text-xs">
-										The absolute path to the folder to watch and sync.
-									</FormDescription>
-									<FormMessage />
-								</FormItem>
-							)}
-						/>
-
-						<FormField
-							control={form.control}
-							name="folder_name"
-							render={({ field }) => (
-								<FormItem>
-									<FormLabel className="text-xs sm:text-sm">Display Name</FormLabel>
-									<FormControl>
-										<Input
-											placeholder="My Notes"
-											className="h-8 sm:h-10 px-2 sm:px-3 text-xs sm:text-sm border-slate-400/20 focus-visible:border-slate-400/40"
-											disabled={isSubmitting}
-											{...field}
-										/>
-									</FormControl>
-									<FormDescription className="text-[10px] sm:text-xs">
-										A friendly name shown in the documents sidebar.
-									</FormDescription>
-									<FormMessage />
-								</FormItem>
-							)}
-						/>
-
-						<FormField
-							control={form.control}
-							name="exclude_patterns"
-							render={({ field }) => (
-								<FormItem>
-									<FormLabel className="text-xs sm:text-sm">Exclude Patterns</FormLabel>
-									<FormControl>
-										<Input
-											placeholder="node_modules,.git,.DS_Store"
-											className="h-8 sm:h-10 px-2 sm:px-3 text-xs sm:text-sm border-slate-400/20 focus-visible:border-slate-400/40 font-mono"
-											disabled={isSubmitting}
-											{...field}
-										/>
-									</FormControl>
-									<FormDescription className="text-[10px] sm:text-xs">
-										Comma-separated patterns of directories/files to exclude.
-									</FormDescription>
-									<FormMessage />
-								</FormItem>
-							)}
-						/>
-
-						<FormField
-							control={form.control}
-							name="file_extensions"
-							render={({ field }) => (
-								<FormItem>
-									<FormLabel className="text-xs sm:text-sm">File Extensions (optional)</FormLabel>
-									<FormControl>
-										<Input
-											placeholder=".md,.txt,.rst"
-											className="h-8 sm:h-10 px-2 sm:px-3 text-xs sm:text-sm border-slate-400/20 focus-visible:border-slate-400/40 font-mono"
-											disabled={isSubmitting}
-											{...field}
-										/>
-									</FormControl>
-									<FormDescription className="text-[10px] sm:text-xs">
-										Leave empty to index all supported files, or specify comma-separated extensions.
-									</FormDescription>
-									<FormMessage />
-								</FormItem>
-							)}
-						/>
-
-					</form>
-				</Form>
-			</div>
-
-			{getConnectorBenefits(EnumConnectorName.LOCAL_FOLDER_CONNECTOR) && (
-				<div className="rounded-xl border border-border bg-slate-400/5 dark:bg-white/5 px-3 sm:px-6 py-4 space-y-2">
-					<h4 className="text-xs sm:text-sm font-medium">
-						What you get with Local Folder sync:
-					</h4>
-					<ul className="list-disc pl-5 text-[10px] sm:text-xs text-muted-foreground space-y-1">
-						{getConnectorBenefits(EnumConnectorName.LOCAL_FOLDER_CONNECTOR)?.map(
-							(benefit) => <li key={benefit}>{benefit}</li>
-						)}
-					</ul>
-				</div>
-			)}
-		</div>
-	);
-};
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connect-forms/connector-benefits.ts b/surfsense_web/components/assistant-ui/connector-popup/connect-forms/connector-benefits.ts
index 40c6a7fdd..0dc093100 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connect-forms/connector-benefits.ts
+++ b/surfsense_web/components/assistant-ui/connector-popup/connect-forms/connector-benefits.ts
@@ -111,14 +111,6 @@ export function getConnectorBenefits(connectorType: string): string[] | null {
 			"Incremental sync - only changed files are re-indexed",
 			"Full support for your vault's folder structure",
 		],
-		LOCAL_FOLDER_CONNECTOR: [
-			"Watch local folders for real-time changes via the desktop app",
-			"Automatic change detection — only modified files are re-indexed",
-			"Version history with up to 20 snapshots per document",
-			"Mirrors your folder structure in the SurfSense sidebar",
-			"Supports any text-based file format",
-			"Works as a periodic sync fallback when the desktop app is not running",
-		],
 	};
 
 	return benefits[connectorType] || null;
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connect-forms/index.tsx b/surfsense_web/components/assistant-ui/connector-popup/connect-forms/index.tsx
index 116893399..b6d813748 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connect-forms/index.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connect-forms/index.tsx
@@ -7,7 +7,6 @@ import { GithubConnectForm } from "./components/github-connect-form";
 import { LinkupApiConnectForm } from "./components/linkup-api-connect-form";
 import { LumaConnectForm } from "./components/luma-connect-form";
 import { MCPConnectForm } from "./components/mcp-connect-form";
-import { LocalFolderConnectForm } from "./components/local-folder-connect-form";
 import { ObsidianConnectForm } from "./components/obsidian-connect-form";
 import { TavilyApiConnectForm } from "./components/tavily-api-connect-form";
 
@@ -59,8 +58,6 @@ export function getConnectFormComponent(connectorType: string): ConnectFormCompo
 			return MCPConnectForm;
 		case "OBSIDIAN_CONNECTOR":
 			return ObsidianConnectForm;
-		case "LOCAL_FOLDER_CONNECTOR":
-			return LocalFolderConnectForm;
 		default:
 			return null;
 	}
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/components/local-folder-config.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/components/local-folder-config.tsx
deleted file mode 100644
index cb4295079..000000000
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/components/local-folder-config.tsx
+++ /dev/null
@@ -1,163 +0,0 @@
-"use client";
-
-import type { FC } from "react";
-import { useState } from "react";
-import { FolderSync } from "lucide-react";
-import { Button } from "@/components/ui/button";
-import { Input } from "@/components/ui/input";
-import { Label } from "@/components/ui/label";
-import type { ConnectorConfigProps } from "../index";
-
-export const LocalFolderConfig: FC<ConnectorConfigProps> = ({
-	connector,
-	onConfigChange,
-	onNameChange,
-}) => {
-	const isElectron = typeof window !== "undefined" && !!window.electronAPI;
-
-	const [folderPath, setFolderPath] = useState<string>(
-		(connector.config?.folder_path as string) || ""
-	);
-	const [folderName, setFolderName] = useState<string>(
-		(connector.config?.folder_name as string) || ""
-	);
-	const [excludePatterns, setExcludePatterns] = useState<string>(() => {
-		const patterns = connector.config?.exclude_patterns;
-		if (Array.isArray(patterns)) {
-			return patterns.join(", ");
-		}
-		return (patterns as string) || "node_modules, .git, .DS_Store";
-	});
-	const [fileExtensions, setFileExtensions] = useState<string>(() => {
-		const exts = connector.config?.file_extensions;
-		if (Array.isArray(exts)) {
-			return exts.join(", ");
-		}
-		return (exts as string) || "";
-	});
-	const [name, setName] = useState<string>(connector.name || "");
-
-	const handleFolderPathChange = (value: string) => {
-		setFolderPath(value);
-		onConfigChange?.({ ...connector.config, folder_path: value });
-	};
-
-	const handleFolderNameChange = (value: string) => {
-		setFolderName(value);
-		onConfigChange?.({ ...connector.config, folder_name: value });
-	};
-
-	const handleExcludePatternsChange = (value: string) => {
-		setExcludePatterns(value);
-		const arr = value
-			.split(",")
-			.map((p) => p.trim())
-			.filter(Boolean);
-		onConfigChange?.({ ...connector.config, exclude_patterns: arr });
-	};
-
-	const handleFileExtensionsChange = (value: string) => {
-		setFileExtensions(value);
-		const arr = value
-			? value
-					.split(",")
-					.map((e) => {
-						const ext = e.trim();
-						return ext.startsWith(".") ? ext : `.${ext}`;
-					})
-					.filter(Boolean)
-			: null;
-		onConfigChange?.({ ...connector.config, file_extensions: arr });
-	};
-
-	const handleNameChange = (value: string) => {
-		setName(value);
-		onNameChange?.(value);
-	};
-
-	const handleBrowse = async () => {
-		if (!isElectron) return;
-		const selected = await window.electronAPI!.selectFolder();
-		if (selected) {
-			handleFolderPathChange(selected);
-			const autoName = selected.split(/[\\/]/).pop() || "folder";
-			if (!folderName) handleFolderNameChange(autoName);
-		}
-	};
-
-	return (
-		<div className="space-y-6">
-			<div className="rounded-xl border border-border bg-slate-400/5 dark:bg-white/5 p-3 sm:p-6 space-y-3 sm:space-y-4">
-				<div className="space-y-2">
-					<Label className="text-xs sm:text-sm">Connector Name</Label>
-					<Input
-						value={name}
-						onChange={(e) => handleNameChange(e.target.value)}
-						placeholder="Local Folder"
-						className="border-slate-400/20 focus-visible:border-slate-400/40"
-					/>
-				</div>
-			</div>
-
-			<div className="rounded-xl border border-border bg-slate-400/5 dark:bg-white/5 p-3 sm:p-6 space-y-3 sm:space-y-4">
-				<h3 className="font-medium text-sm sm:text-base">Folder Configuration</h3>
-
-				<div className="space-y-4">
-					<div className="space-y-2">
-						<Label className="text-xs sm:text-sm">Folder Path</Label>
-						<div className="flex gap-2">
-							<Input
-								value={folderPath}
-								onChange={(e) => handleFolderPathChange(e.target.value)}
-								placeholder="/path/to/your/folder"
-								className="border-slate-400/20 focus-visible:border-slate-400/40 font-mono flex-1"
-							/>
-							{isElectron && (
-								<Button type="button" variant="outline" size="sm" onClick={handleBrowse} className="shrink-0">
-									<FolderSync className="h-4 w-4 mr-1" />
-									Browse
-								</Button>
-							)}
-						</div>
-					</div>
-
-					<div className="space-y-2">
-						<Label className="text-xs sm:text-sm">Display Name</Label>
-						<Input
-							value={folderName}
-							onChange={(e) => handleFolderNameChange(e.target.value)}
-							placeholder="My Notes"
-							className="border-slate-400/20 focus-visible:border-slate-400/40"
-						/>
-					</div>
-
-					<div className="space-y-2">
-						<Label className="text-xs sm:text-sm">Exclude Patterns</Label>
-						<Input
-							value={excludePatterns}
-							onChange={(e) => handleExcludePatternsChange(e.target.value)}
-							placeholder="node_modules, .git, .DS_Store"
-							className="border-slate-400/20 focus-visible:border-slate-400/40 font-mono"
-						/>
-						<p className="text-[10px] sm:text-xs text-muted-foreground">
-							Comma-separated patterns of directories/files to exclude.
-						</p>
-					</div>
-
-					<div className="space-y-2">
-						<Label className="text-xs sm:text-sm">File Extensions (optional)</Label>
-						<Input
-							value={fileExtensions}
-							onChange={(e) => handleFileExtensionsChange(e.target.value)}
-							placeholder=".md, .txt, .rst"
-							className="border-slate-400/20 focus-visible:border-slate-400/40 font-mono"
-						/>
-						<p className="text-[10px] sm:text-xs text-muted-foreground">
-							Leave empty to index all supported files.
-						</p>
-					</div>
-				</div>
-			</div>
-		</div>
-	);
-};
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/index.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/index.tsx
index 3dc1891c8..a63435260 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/index.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/index.tsx
@@ -19,7 +19,6 @@ import { JiraConfig } from "./components/jira-config";
 import { LinkupApiConfig } from "./components/linkup-api-config";
 import { LumaConfig } from "./components/luma-config";
 import { MCPConfig } from "./components/mcp-config";
-import { LocalFolderConfig } from "./components/local-folder-config";
 import { ObsidianConfig } from "./components/obsidian-config";
 import { OneDriveConfig } from "./components/onedrive-config";
 import { SlackConfig } from "./components/slack-config";
@@ -83,8 +82,6 @@ export function getConnectorConfigComponent(
 			return MCPConfig;
 		case "OBSIDIAN_CONNECTOR":
 			return ObsidianConfig;
-		case "LOCAL_FOLDER_CONNECTOR":
-			return LocalFolderConfig;
 		case "COMPOSIO_GOOGLE_DRIVE_CONNECTOR":
 			return ComposioDriveConfig;
 		case "COMPOSIO_GMAIL_CONNECTOR":
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-connect-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-connect-view.tsx
index 0b6d0917a..596b98e93 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-connect-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-connect-view.tsx
@@ -20,7 +20,6 @@ const FORM_ID_MAP: Record<string, string> = {
 	CIRCLEBACK_CONNECTOR: "circleback-connect-form",
 	MCP_CONNECTOR: "mcp-connect-form",
 	OBSIDIAN_CONNECTOR: "obsidian-connect-form",
-	LOCAL_FOLDER_CONNECTOR: "local-folder-connect-form",
 };
 
 interface ConnectorConnectViewProps {
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
index dcedb4743..05d42adcb 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
@@ -278,8 +278,7 @@ export const ConnectorEditView: FC<ConnectorEditViewProps> = ({
 									connector.connector_type !== "DROPBOX_CONNECTOR" &&
 									connector.connector_type !== "ONEDRIVE_CONNECTOR" &&
 									connector.connector_type !== "WEBCRAWLER_CONNECTOR" &&
-									connector.connector_type !== "GITHUB_CONNECTOR" &&
-									connector.connector_type !== "LOCAL_FOLDER_CONNECTOR" && (
+									connector.connector_type !== "GITHUB_CONNECTOR" && (
 										<DateRangeSelector
 											startDate={startDate}
 											endDate={endDate}
@@ -294,9 +293,7 @@ export const ConnectorEditView: FC<ConnectorEditViewProps> = ({
 										/>
 									)}
 
-								{/* Periodic sync - shown for all indexable connectors except Local Folder */}
-								{connector.connector_type !== "LOCAL_FOLDER_CONNECTOR" &&
-									(() => {
+								{(() => {
 										const isGoogleDrive = connector.connector_type === "GOOGLE_DRIVE_CONNECTOR";
 										const isComposioGoogleDrive =
 											connector.connector_type === "COMPOSIO_GOOGLE_DRIVE_CONNECTOR";
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/indexing-configuration-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/indexing-configuration-view.tsx
index 436ce7843..e583cbe17 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/indexing-configuration-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/indexing-configuration-view.tsx
@@ -164,8 +164,7 @@ export const IndexingConfigurationView: FC<IndexingConfigurationViewProps> = ({
 									config.connectorType !== "DROPBOX_CONNECTOR" &&
 									config.connectorType !== "ONEDRIVE_CONNECTOR" &&
 									config.connectorType !== "WEBCRAWLER_CONNECTOR" &&
-									config.connectorType !== "GITHUB_CONNECTOR" &&
-									config.connectorType !== "LOCAL_FOLDER_CONNECTOR" && (
+									config.connectorType !== "GITHUB_CONNECTOR" && (
 										<DateRangeSelector
 											startDate={startDate}
 											endDate={endDate}
@@ -180,12 +179,10 @@ export const IndexingConfigurationView: FC<IndexingConfigurationViewProps> = ({
 										/>
 									)}
 
-								{/* Periodic sync - not shown for file-based connectors (Drive, Dropbox, OneDrive) or Local Folder in initial setup; configured in edit view instead */}
 								{config.connectorType !== "GOOGLE_DRIVE_CONNECTOR" &&
 									config.connectorType !== "COMPOSIO_GOOGLE_DRIVE_CONNECTOR" &&
 									config.connectorType !== "DROPBOX_CONNECTOR" &&
-									config.connectorType !== "ONEDRIVE_CONNECTOR" &&
-									config.connectorType !== "LOCAL_FOLDER_CONNECTOR" && (
+									config.connectorType !== "ONEDRIVE_CONNECTOR" && (
 										<PeriodicSyncConfig
 											enabled={periodicEnabled}
 											frequencyMinutes={frequencyMinutes}

From 5d6e3ffb7b353ee8766fa212d2271a35e7d63455 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 22:20:11 +0530
Subject: [PATCH 045/202] feat: add renderer readiness signaling and update IPC
 channels for folder sync

---
 surfsense_desktop/src/ipc/channels.ts         |  1 +
 surfsense_desktop/src/ipc/handlers.ts         |  5 ++
 .../src/modules/folder-watcher.ts             | 61 +++++++++++++------
 surfsense_desktop/src/preload.ts              |  1 +
 4 files changed, 48 insertions(+), 20 deletions(-)

diff --git a/surfsense_desktop/src/ipc/channels.ts b/surfsense_desktop/src/ipc/channels.ts
index 362d3362d..66788d90e 100644
--- a/surfsense_desktop/src/ipc/channels.ts
+++ b/surfsense_desktop/src/ipc/channels.ts
@@ -16,4 +16,5 @@ export const IPC_CHANNELS = {
   FOLDER_SYNC_WATCHER_READY: 'folder-sync:watcher-ready',
   FOLDER_SYNC_PAUSE: 'folder-sync:pause',
   FOLDER_SYNC_RESUME: 'folder-sync:resume',
+  FOLDER_SYNC_RENDERER_READY: 'folder-sync:renderer-ready',
 } as const;
diff --git a/surfsense_desktop/src/ipc/handlers.ts b/surfsense_desktop/src/ipc/handlers.ts
index 2baf957b0..19051e871 100644
--- a/surfsense_desktop/src/ipc/handlers.ts
+++ b/surfsense_desktop/src/ipc/handlers.ts
@@ -8,6 +8,7 @@ import {
   getWatcherStatus,
   pauseWatcher,
   resumeWatcher,
+  markRendererReady,
 } from '../modules/folder-watcher';
 
 export function registerIpcHandlers(): void {
@@ -44,4 +45,8 @@ export function registerIpcHandlers(): void {
   ipcMain.handle(IPC_CHANNELS.FOLDER_SYNC_PAUSE, () => pauseWatcher());
 
   ipcMain.handle(IPC_CHANNELS.FOLDER_SYNC_RESUME, () => resumeWatcher());
+
+  ipcMain.handle(IPC_CHANNELS.FOLDER_SYNC_RENDERER_READY, () => {
+    markRendererReady();
+  });
 }
diff --git a/surfsense_desktop/src/modules/folder-watcher.ts b/surfsense_desktop/src/modules/folder-watcher.ts
index 072ae7b3f..81a835c22 100644
--- a/surfsense_desktop/src/modules/folder-watcher.ts
+++ b/surfsense_desktop/src/modules/folder-watcher.ts
@@ -9,7 +9,7 @@ export interface WatchedFolderConfig {
   name: string;
   excludePatterns: string[];
   fileExtensions: string[] | null;
-  connectorId: number;
+  rootFolderId: number | null;
   searchSpaceId: number;
   active: boolean;
 }
@@ -34,6 +34,25 @@ let watchers: Map<string, WatcherEntry> = new Map();
  */
 const mtimeMaps: Map<string, MtimeMap> = new Map();
 
+let rendererReady = false; // flipped to true by markRendererReady()
+const pendingEvents: any[] = []; // file-changed payloads queued while rendererReady is false
+// Marks the renderer as ready and flushes queued payloads, in arrival order, on FOLDER_SYNC_FILE_CHANGED.
+export function markRendererReady() {
+  rendererReady = true;
+  for (const event of pendingEvents) {
+    sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, event);
+  }
+  pendingEvents.length = 0; // empty the queue in place (the binding is const)
+}
+// Sends a file-changed payload right away when the renderer is ready; otherwise queues it for the flush above.
+function sendFileChangedEvent(data: any) {
+  if (rendererReady) {
+    sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, data);
+  } else {
+    pendingEvents.push(data); // NOTE(review): the queue has no size cap — confirm the renderer always signals ready
+  }
+}
+
 async function getStore() {
   if (!store) {
     const { default: Store } = await import('electron-store');
@@ -83,7 +102,6 @@ function walkFolderMtimes(config: WatchedFolderConfig): MtimeMap {
     for (const entry of entries) {
       const name = entry.name;
 
-      // Skip dotfiles/dotdirs and excluded names
       if (name.startsWith('.') || excludes.has(name)) continue;
 
       const full = path.join(dir, name);
@@ -131,7 +149,6 @@ async function startWatcher(config: WatchedFolderConfig) {
     return;
   }
 
-  // Load persisted mtime map into memory before starting the watcher
   const ms = await getMtimeStore();
   const storedMap: MtimeMap = ms.get(config.path) ?? {};
   mtimeMaps.set(config.path, { ...storedMap });
@@ -156,45 +173,49 @@ async function startWatcher(config: WatchedFolderConfig) {
   watcher.on('ready', () => {
     ready = true;
 
-    // Detect offline changes by diffing current filesystem against stored mtime map
     const currentMap = walkFolderMtimes(config);
     const storedSnapshot = loadMtimeMap(config.path);
     const now = Date.now();
 
+    // Track which files are unchanged so we can selectively update the mtime map
+    const unchangedMap: MtimeMap = {};
+
     for (const [rel, currentMtime] of Object.entries(currentMap)) {
       const storedMtime = storedSnapshot[rel];
       if (storedMtime === undefined) {
-        // New file added while app was closed
-        sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, {
-          connectorId: config.connectorId,
+        sendFileChangedEvent({
+          rootFolderId: config.rootFolderId,
           searchSpaceId: config.searchSpaceId,
           folderPath: config.path,
+          folderName: config.name,
           relativePath: rel,
           fullPath: path.join(config.path, rel),
           action: 'add',
           timestamp: now,
         });
       } else if (Math.abs(currentMtime - storedMtime) >= MTIME_TOLERANCE_S * 1000) {
-        // File modified while app was closed
-        sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, {
-          connectorId: config.connectorId,
+        sendFileChangedEvent({
+          rootFolderId: config.rootFolderId,
           searchSpaceId: config.searchSpaceId,
           folderPath: config.path,
+          folderName: config.name,
           relativePath: rel,
           fullPath: path.join(config.path, rel),
           action: 'change',
           timestamp: now,
         });
+      } else {
+        unchangedMap[rel] = currentMtime;
       }
     }
 
     for (const rel of Object.keys(storedSnapshot)) {
       if (!(rel in currentMap)) {
-        // File deleted while app was closed
-        sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, {
-          connectorId: config.connectorId,
+        sendFileChangedEvent({
+          rootFolderId: config.rootFolderId,
           searchSpaceId: config.searchSpaceId,
           folderPath: config.path,
+          folderName: config.name,
           relativePath: rel,
           fullPath: path.join(config.path, rel),
           action: 'unlink',
@@ -203,12 +224,13 @@ async function startWatcher(config: WatchedFolderConfig) {
       }
     }
 
-    // Replace stored map with current filesystem state
-    mtimeMaps.set(config.path, currentMap);
+    // Persist only unchanged entries: added/changed files are left out, so a later start
+    // reports them again as 'add'. NOTE(review): deleted paths are dropped too — unlink is not replayed.
+    mtimeMaps.set(config.path, unchangedMap);
     persistMtimeMap(config.path);
 
     sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_WATCHER_READY, {
-      connectorId: config.connectorId,
+      rootFolderId: config.rootFolderId,
       folderPath: config.path,
     });
   });
@@ -226,7 +248,6 @@ async function startWatcher(config: WatchedFolderConfig) {
       if (!config.fileExtensions.includes(ext)) return;
     }
 
-    // Keep mtime map in sync with live changes
     const map = mtimeMaps.get(config.path);
     if (map) {
       if (action === 'unlink') {
@@ -241,10 +262,11 @@ async function startWatcher(config: WatchedFolderConfig) {
       persistMtimeMap(config.path);
     }
 
-    sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, {
-      connectorId: config.connectorId,
+    sendFileChangedEvent({
+      rootFolderId: config.rootFolderId,
       searchSpaceId: config.searchSpaceId,
       folderPath: config.path,
+      folderName: config.name,
       relativePath,
       fullPath: filePath,
       action,
@@ -311,7 +333,6 @@ export async function removeWatchedFolder(
 
   stopWatcher(folderPath);
 
-  // Clean up persisted mtime map for this folder
   mtimeMaps.delete(folderPath);
   const ms = await getMtimeStore();
   ms.delete(folderPath);
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 8f65aa633..7c190db10 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -44,4 +44,5 @@ contextBridge.exposeInMainWorld('electronAPI', {
   },
   pauseWatcher: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_PAUSE),
   resumeWatcher: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_RESUME),
+  signalRendererReady: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_RENDERER_READY),
 });

From 493d720b891cf6ef478223d2645ba9e4b9504ab6 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 22:21:01 +0530
Subject: [PATCH 046/202] refactor: remove Local Folder connector references
 and enhance folder management features

---
 .../constants/connector-constants.ts          |   8 -
 .../hooks/use-connector-dialog.ts             |  28 ---
 .../utils/connector-document-mapping.ts       |   1 -
 .../components/documents/FolderNode.tsx       | 139 ++++++++-----
 .../components/documents/FolderTreeView.tsx   |   9 +
 .../components/editor-panel/editor-panel.tsx  |  18 +-
 .../layout/ui/sidebar/DocumentsSidebar.tsx    | 186 ++++++++++++++----
 7 files changed, 257 insertions(+), 132 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/connector-popup/constants/connector-constants.ts b/surfsense_web/components/assistant-ui/connector-popup/constants/connector-constants.ts
index 3f7d90cd8..2e92f637b 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/constants/connector-constants.ts
+++ b/surfsense_web/components/assistant-ui/connector-popup/constants/connector-constants.ts
@@ -184,14 +184,6 @@ export const OTHER_CONNECTORS = [
 		connectorType: EnumConnectorName.OBSIDIAN_CONNECTOR,
 		selfHostedOnly: true,
 	},
-	{
-		id: "local-folder-connector",
-		title: "Local Folder",
-		description: "Watch and sync local folders (desktop only)",
-		connectorType: EnumConnectorName.LOCAL_FOLDER_CONNECTOR,
-		selfHostedOnly: true,
-		desktopOnly: true,
-	},
 ] as const;
 
 // Composio Connectors - Individual entries for each supported toolkit
diff --git a/surfsense_web/components/assistant-ui/connector-popup/hooks/use-connector-dialog.ts b/surfsense_web/components/assistant-ui/connector-popup/hooks/use-connector-dialog.ts
index 2404b8eb5..6543bbd72 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/hooks/use-connector-dialog.ts
+++ b/surfsense_web/components/assistant-ui/connector-popup/hooks/use-connector-dialog.ts
@@ -586,23 +586,6 @@ export const useConnectorDialog = () => {
 									},
 								});
 
-								// Register folder watcher in Electron for real-time sync
-								if (
-									currentConnectorType === EnumConnectorName.LOCAL_FOLDER_CONNECTOR &&
-									window.electronAPI?.addWatchedFolder
-								) {
-									const cfg = connector.config || {};
-									await window.electronAPI.addWatchedFolder({
-										path: cfg.folder_path as string,
-										name: cfg.folder_name as string,
-										excludePatterns: (cfg.exclude_patterns as string[]) || [],
-										fileExtensions: (cfg.file_extensions as string[] | null) ?? null,
-										connectorId: connector.id,
-										searchSpaceId: Number(searchSpaceId),
-										active: true,
-									});
-								}
-
 								const successMessage =
 									currentConnectorType === "MCP_CONNECTOR"
 										? `${connector.name} added successfully`
@@ -1207,17 +1190,6 @@ export const useConnectorDialog = () => {
 					id: editingConnector.id,
 				});
 
-				// Unregister folder watcher in Electron when removing a Local Folder connector
-				if (
-					editingConnector.connector_type === EnumConnectorName.LOCAL_FOLDER_CONNECTOR &&
-					window.electronAPI?.removeWatchedFolder &&
-					editingConnector.config?.folder_path
-				) {
-					await window.electronAPI.removeWatchedFolder(
-						editingConnector.config.folder_path as string
-					);
-				}
-
 				// Track connector deleted event
 				trackConnectorDeleted(
 					Number(searchSpaceId),
diff --git a/surfsense_web/components/assistant-ui/connector-popup/utils/connector-document-mapping.ts b/surfsense_web/components/assistant-ui/connector-popup/utils/connector-document-mapping.ts
index dd5978002..f924bb15f 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/utils/connector-document-mapping.ts
+++ b/surfsense_web/components/assistant-ui/connector-popup/utils/connector-document-mapping.ts
@@ -29,7 +29,6 @@ export const CONNECTOR_TO_DOCUMENT_TYPE: Record<string, string> = {
 	BOOKSTACK_CONNECTOR: "BOOKSTACK_CONNECTOR",
 	CIRCLEBACK_CONNECTOR: "CIRCLEBACK",
 	OBSIDIAN_CONNECTOR: "OBSIDIAN_CONNECTOR",
-	LOCAL_FOLDER_CONNECTOR: "LOCAL_FOLDER_FILE",
 
 	// Special mappings (connector type differs from document type)
 	GOOGLE_DRIVE_CONNECTOR: "GOOGLE_DRIVE_FILE",
diff --git a/surfsense_web/components/documents/FolderNode.tsx b/surfsense_web/components/documents/FolderNode.tsx
index 6a36f724f..1521c06fe 100644
--- a/surfsense_web/components/documents/FolderNode.tsx
+++ b/surfsense_web/components/documents/FolderNode.tsx
@@ -3,12 +3,15 @@
 import {
 	ChevronDown,
 	ChevronRight,
+	Eye,
+	EyeOff,
 	Folder,
 	FolderOpen,
 	FolderPlus,
 	MoreHorizontal,
 	Move,
 	PenLine,
+	RefreshCw,
 	Trash2,
 } from "lucide-react";
 import React, { useCallback, useEffect, useRef, useState } from "react";
@@ -70,6 +73,9 @@ interface FolderNodeProps {
 	disabledDropIds?: Set<number>;
 	contextMenuOpen?: boolean;
 	onContextMenuOpenChange?: (open: boolean) => void;
+	isWatched?: boolean;
+	onRescan?: (folder: FolderDisplay) => void;
+	onStopWatching?: (folder: FolderDisplay) => void;
 }
 
 function getDropZone(
@@ -107,6 +113,9 @@ export const FolderNode = React.memo(function FolderNode({
 	disabledDropIds,
 	contextMenuOpen,
 	onContextMenuOpenChange,
+	isWatched,
+	onRescan,
+	onStopWatching,
 }: FolderNodeProps) {
 	const [renameValue, setRenameValue] = useState(folder.name);
 	const inputRef = useRef<HTMLInputElement>(null);
@@ -307,73 +316,107 @@ export const FolderNode = React.memo(function FolderNode({
 									<MoreHorizontal className="h-3.5 w-3.5" />
 								</Button>
 							</DropdownMenuTrigger>
-							<DropdownMenuContent align="end" className="w-40">
+						<DropdownMenuContent align="end" className="w-40">
+							{isWatched && onRescan && (
 								<DropdownMenuItem
 									onClick={(e) => {
 										e.stopPropagation();
-										onCreateSubfolder(folder.id);
+										onRescan(folder);
 									}}
 								>
-									<FolderPlus className="mr-2 h-4 w-4" />
-									New subfolder
+									<RefreshCw className="mr-2 h-4 w-4" />
+									Re-scan
 								</DropdownMenuItem>
+							)}
+							{isWatched && onStopWatching && (
 								<DropdownMenuItem
 									onClick={(e) => {
 										e.stopPropagation();
-										startRename();
+										onStopWatching(folder);
 									}}
 								>
-									<PenLine className="mr-2 h-4 w-4" />
-									Rename
+									<EyeOff className="mr-2 h-4 w-4" />
+									Stop watching
 								</DropdownMenuItem>
-								<DropdownMenuItem
-									onClick={(e) => {
-										e.stopPropagation();
-										onMove(folder);
-									}}
-								>
-									<Move className="mr-2 h-4 w-4" />
-									Move to...
-								</DropdownMenuItem>
-								<DropdownMenuItem
-									className="text-destructive focus:text-destructive"
-									onClick={(e) => {
-										e.stopPropagation();
-										onDelete(folder);
-									}}
-								>
-									<Trash2 className="mr-2 h-4 w-4" />
-									Delete
-								</DropdownMenuItem>
-							</DropdownMenuContent>
+							)}
+							<DropdownMenuItem
+								onClick={(e) => {
+									e.stopPropagation();
+									onCreateSubfolder(folder.id);
+								}}
+							>
+								<FolderPlus className="mr-2 h-4 w-4" />
+								New subfolder
+							</DropdownMenuItem>
+							<DropdownMenuItem
+								onClick={(e) => {
+									e.stopPropagation();
+									startRename();
+								}}
+							>
+								<PenLine className="mr-2 h-4 w-4" />
+								Rename
+							</DropdownMenuItem>
+							<DropdownMenuItem
+								onClick={(e) => {
+									e.stopPropagation();
+									onMove(folder);
+								}}
+							>
+								<Move className="mr-2 h-4 w-4" />
+								Move to...
+							</DropdownMenuItem>
+							<DropdownMenuItem
+								className="text-destructive focus:text-destructive"
+								onClick={(e) => {
+									e.stopPropagation();
+									onDelete(folder);
+								}}
+							>
+								<Trash2 className="mr-2 h-4 w-4" />
+								Delete
+							</DropdownMenuItem>
+						</DropdownMenuContent>
 						</DropdownMenu>
 					)}
 				</div>
 			</ContextMenuTrigger>
 
-			{!isRenaming && contextMenuOpen && (
-				<ContextMenuContent className="w-40">
-					<ContextMenuItem onClick={() => onCreateSubfolder(folder.id)}>
-						<FolderPlus className="mr-2 h-4 w-4" />
-						New subfolder
+		{!isRenaming && contextMenuOpen && (
+			<ContextMenuContent className="w-40">
+				{isWatched && onRescan && (
+					<ContextMenuItem onClick={() => onRescan(folder)}>
+						<RefreshCw className="mr-2 h-4 w-4" />
+						Re-scan
 					</ContextMenuItem>
-					<ContextMenuItem onClick={() => startRename()}>
-						<PenLine className="mr-2 h-4 w-4" />
-						Rename
+				)}
+				{isWatched && onStopWatching && (
+					<ContextMenuItem onClick={() => onStopWatching(folder)}>
+						<EyeOff className="mr-2 h-4 w-4" />
+						Stop watching
 					</ContextMenuItem>
-					<ContextMenuItem onClick={() => onMove(folder)}>
-						<Move className="mr-2 h-4 w-4" />
-						Move to...
-					</ContextMenuItem>
-					<ContextMenuItem
-						className="text-destructive focus:text-destructive"
-						onClick={() => onDelete(folder)}
-					>
-						<Trash2 className="mr-2 h-4 w-4" />
-						Delete
-					</ContextMenuItem>
-				</ContextMenuContent>
-			)}
+				)}
+				<ContextMenuItem onClick={() => onCreateSubfolder(folder.id)}>
+					<FolderPlus className="mr-2 h-4 w-4" />
+					New subfolder
+				</ContextMenuItem>
+				<ContextMenuItem onClick={() => startRename()}>
+					<PenLine className="mr-2 h-4 w-4" />
+					Rename
+				</ContextMenuItem>
+				<ContextMenuItem onClick={() => onMove(folder)}>
+					<Move className="mr-2 h-4 w-4" />
+					Move to...
+				</ContextMenuItem>
+				<ContextMenuItem
+					className="text-destructive focus:text-destructive"
+					onClick={() => onDelete(folder)}
+				>
+					<Trash2 className="mr-2 h-4 w-4" />
+					Delete
+				</ContextMenuItem>
+			</ContextMenuContent>
+		)}
 		</ContextMenu>
 	);
 });
diff --git a/surfsense_web/components/documents/FolderTreeView.tsx b/surfsense_web/components/documents/FolderTreeView.tsx
index 7695923e3..5945edccb 100644
--- a/surfsense_web/components/documents/FolderTreeView.tsx
+++ b/surfsense_web/components/documents/FolderTreeView.tsx
@@ -40,6 +40,9 @@ interface FolderTreeViewProps {
 		targetFolderId: number | null
 	) => void;
 	onReorderFolder?: (folderId: number, beforePos: string | null, afterPos: string | null) => void;
+	watchedFolderIds?: Set<number>;
+	onRescanFolder?: (folder: FolderDisplay) => void;
+	onStopWatchingFolder?: (folder: FolderDisplay) => void;
 }
 
 function groupBy<T>(items: T[], keyFn: (item: T) => string | number): Record<string | number, T[]> {
@@ -73,6 +76,9 @@ export function FolderTreeView({
 	searchQuery,
 	onDropIntoFolder,
 	onReorderFolder,
+	watchedFolderIds,
+	onRescanFolder,
+	onStopWatchingFolder,
 }: FolderTreeViewProps) {
 	const foldersByParent = useMemo(() => groupBy(folders, (f) => f.parentId ?? "root"), [folders]);
 
@@ -204,6 +210,9 @@ export function FolderTreeView({
 					siblingPositions={siblingPositions}
 					contextMenuOpen={openContextMenuId === `folder-${f.id}`}
 					onContextMenuOpenChange={(open) => setOpenContextMenuId(open ? `folder-${f.id}` : null)}
+					isWatched={watchedFolderIds?.has(f.id)}
+					onRescan={onRescanFolder}
+					onStopWatching={onStopWatchingFolder}
 				/>
 			);
 
diff --git a/surfsense_web/components/editor-panel/editor-panel.tsx b/surfsense_web/components/editor-panel/editor-panel.tsx
index 802a5ffc3..a1195ef33 100644
--- a/surfsense_web/components/editor-panel/editor-panel.tsx
+++ b/surfsense_web/components/editor-panel/editor-panel.tsx
@@ -6,6 +6,7 @@ import dynamic from "next/dynamic";
 import { useCallback, useEffect, useRef, useState } from "react";
 import { toast } from "sonner";
 import { closeEditorPanelAtom, editorPanelAtom } from "@/atoms/editor/editor-panel.atom";
+import { VersionHistoryButton } from "@/components/documents/version-history";
 import { MarkdownViewer } from "@/components/markdown-viewer";
 import { Button } from "@/components/ui/button";
 import { Drawer, DrawerContent, DrawerHandle, DrawerTitle } from "@/components/ui/drawer";
@@ -180,12 +181,16 @@ export function EditorPanelContent({
 	return (
 		<>
 			<div className="flex items-center justify-between px-4 py-2 shrink-0 border-b">
-				<div className="flex-1 min-w-0">
-					<h2 className="text-sm font-semibold truncate">{displayTitle}</h2>
-					{isEditableType && editedMarkdown !== null && (
-						<p className="text-[10px] text-muted-foreground">Unsaved changes</p>
-					)}
-				</div>
+			<div className="flex-1 min-w-0">
+				<h2 className="text-sm font-semibold truncate">{displayTitle}</h2>
+				{isEditableType && editedMarkdown !== null && (
+					<p className="text-[10px] text-muted-foreground">Unsaved changes</p>
+				)}
+			</div>
+			<div className="flex items-center gap-1 shrink-0">
+				{editorDoc?.document_type && (
+					<VersionHistoryButton documentId={documentId} documentType={editorDoc.document_type} />
+				)}
 				{onClose && (
 					<Button variant="ghost" size="icon" onClick={onClose} className="size-7 shrink-0">
 						<XIcon className="size-4" />
@@ -193,6 +198,7 @@ export function EditorPanelContent({
 					</Button>
 				)}
 			</div>
+		</div>
 
 			<div className="flex-1 overflow-hidden">
 				{isLoading ? (
diff --git a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
index d880524bd..202d170d9 100644
--- a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
@@ -40,6 +40,7 @@ import { getConnectorIcon } from "@/contracts/enums/connectorIcons";
 import type { DocumentTypeEnum } from "@/contracts/types/document.types";
 import { useDebouncedValue } from "@/hooks/use-debounced-value";
 import { useMediaQuery } from "@/hooks/use-media-query";
+import { documentsApiService } from "@/lib/apis/documents-api.service";
 import { foldersApiService } from "@/lib/apis/folders-api.service";
 import { authenticatedFetch } from "@/lib/auth-utils";
 import { queries } from "@/zero/queries/index";
@@ -92,6 +93,24 @@ export function DocumentsSidebar({
 	const [search, setSearch] = useState("");
 	const debouncedSearch = useDebouncedValue(search, 250);
 	const [activeTypes, setActiveTypes] = useState<DocumentTypeEnum[]>([]);
+	const [watchedFolderIds, setWatchedFolderIds] = useState<Set<number>>(new Set());
+
+	useEffect(() => {
+		const api = typeof window !== "undefined" ? window.electronAPI : null;
+		if (!api?.getWatchedFolders) return;
+
+		// Seed watchedFolderIds once on mount; entries without a rootFolderId are skipped.
+		const loadWatchedIds = async (bridge: NonNullable<typeof api>) => {
+			const folders = await bridge.getWatchedFolders();
+			const ids = folders.flatMap((f) => (f.rootFolderId != null ? [f.rootFolderId] : []));
+			setWatchedFolderIds(new Set(ids));
+		};
+
+		// Fire-and-forget: log failures instead of leaving an unhandled promise rejection.
+		loadWatchedIds(api).catch((err: unknown) => {
+			console.error("[DocumentsSidebar] Failed to load watched folders:", err);
+		});
+	}, []);
 	const { mutateAsync: deleteDocumentMutation } = useAtomValue(deleteDocumentMutationAtom);
 
 	const [sidebarDocs, setSidebarDocs] = useAtom(sidebarSelectedDocumentsAtom);
@@ -223,6 +242,87 @@ export function DocumentsSidebar({
 		[createFolderParentId, searchSpaceId, setExpandedFolderMap]
 	);
 
+	const isElectron = typeof window !== "undefined" && !!window.electronAPI;
+
+	const handleWatchFolder = useCallback(async () => {
+		const api = window.electronAPI;
+		if (!api) return;
+
+		const folderPath = await api.selectFolder();
+		if (!folderPath) return;
+		// Last non-empty segment; splits on "/" and "\" so Windows paths and trailing separators work.
+		const folderName = folderPath.split(/[\\/]/).filter(Boolean).pop() ?? folderPath;
+
+		try {
+			const result = await documentsApiService.folderIndex(searchSpaceId, {
+				folder_path: folderPath,
+				folder_name: folderName,
+				search_space_id: searchSpaceId,
+			});
+
+			const rootFolderId = (result as { root_folder_id?: number })?.root_folder_id ?? null;
+
+			await api.addWatchedFolder({
+				path: folderPath,
+				name: folderName,
+				excludePatterns: [".git", "node_modules", "__pycache__", ".DS_Store", ".obsidian", ".trash"],
+				fileExtensions: null,
+				rootFolderId,
+				searchSpaceId,
+				active: true,
+			});
+			if (rootFolderId !== null) setWatchedFolderIds((prev) => new Set(prev).add(rootFolderId)); // show watch actions immediately
+			toast.success(`Watching folder: ${folderName}`);
+		} catch (err) {
+			toast.error((err as Error)?.message || "Failed to watch folder");
+		}
+	}, [searchSpaceId]);
+
+	const handleRescanFolder = useCallback(
+		async (folder: FolderDisplay) => {
+			const api = window.electronAPI;
+			if (!api) return;
+
+			// The bridge lookup lives inside the try so a failure there also ends in an error toast.
+			try {
+				const watchedFolders = await api.getWatchedFolders();
+				const matched = watchedFolders.find((wf) => wf.rootFolderId === folder.id);
+				if (!matched) {
+					toast.error("This folder is not being watched");
+					return;
+				}
+				await documentsApiService.folderIndex(searchSpaceId, {
+					folder_path: matched.path,
+					folder_name: matched.name,
+					search_space_id: searchSpaceId,
+					root_folder_id: folder.id,
+				});
+				toast.success(`Re-scanning folder: ${matched.name}`);
+			} catch (err) {
+				toast.error((err as Error)?.message || "Failed to re-scan folder");
+			}
+		},
+		[searchSpaceId]
+	);
+
+	const handleStopWatching = useCallback(
+		async (folder: FolderDisplay) => {
+			const api = window.electronAPI;
+			if (!api) return;
+			const watchedFolders = await api.getWatchedFolders();
+			const matched = watchedFolders.find((wf) => wf.rootFolderId === folder.id);
+			if (!matched) {
+				toast.error("This folder is not being watched");
+				return;
+			}
+			await api.removeWatchedFolder(matched.path);
+			// Drop the id from local state so the Re-scan / Stop watching entries disappear right away.
+			setWatchedFolderIds((prev) => new Set(Array.from(prev).filter((id) => id !== folder.id)));
+			toast.success(`Stopped watching: ${matched.name}`);
+		},
+		[]
+	);
+
 	const handleRenameFolder = useCallback(async (folder: FolderDisplay, newName: string) => {
 		try {
 			await foldersApiService.updateFolder(folder.id, { name: newName });
@@ -641,14 +741,15 @@ export function DocumentsSidebar({
 
 			<div className="flex-1 min-h-0 overflow-x-hidden pt-0 flex flex-col">
 				<div className="px-4 pb-2">
-					<DocumentsFilters
-						typeCounts={typeCounts}
-						onSearch={setSearch}
-						searchValue={search}
-						onToggleType={onToggleType}
-						activeTypes={activeTypes}
-						onCreateFolder={() => handleCreateFolder(null)}
-					/>
+				<DocumentsFilters
+					typeCounts={typeCounts}
+					onSearch={setSearch}
+					searchValue={search}
+					onToggleType={onToggleType}
+					activeTypes={activeTypes}
+					onCreateFolder={() => handleCreateFolder(null)}
+					onWatchFolder={isElectron ? handleWatchFolder : undefined}
+				/>
 				</div>
 
 				{deletableSelectedIds.length > 0 && (
@@ -666,39 +767,42 @@ export function DocumentsSidebar({
 				)}
 
 				<FolderTreeView
-					folders={treeFolders}
-					documents={searchFilteredDocuments}
-					expandedIds={expandedIds}
-					onToggleExpand={toggleFolderExpand}
-					mentionedDocIds={mentionedDocIds}
-					onToggleChatMention={handleToggleChatMention}
-					onToggleFolderSelect={handleToggleFolderSelect}
-					onRenameFolder={handleRenameFolder}
-					onDeleteFolder={handleDeleteFolder}
-					onMoveFolder={handleMoveFolder}
-					onCreateFolder={handleCreateFolder}
-					searchQuery={debouncedSearch.trim() || undefined}
-					onPreviewDocument={(doc) => {
-						openEditorPanel({
-							documentId: doc.id,
-							searchSpaceId,
-							title: doc.title,
-						});
-					}}
-					onEditDocument={(doc) => {
-						openEditorPanel({
-							documentId: doc.id,
-							searchSpaceId,
-							title: doc.title,
-						});
-					}}
-					onDeleteDocument={(doc) => handleDeleteDocument(doc.id)}
-					onMoveDocument={handleMoveDocument}
-					onExportDocument={handleExportDocument}
-					activeTypes={activeTypes}
-					onDropIntoFolder={handleDropIntoFolder}
-					onReorderFolder={handleReorderFolder}
-				/>
+				folders={treeFolders}
+				documents={searchFilteredDocuments}
+				expandedIds={expandedIds}
+				onToggleExpand={toggleFolderExpand}
+				mentionedDocIds={mentionedDocIds}
+				onToggleChatMention={handleToggleChatMention}
+				onToggleFolderSelect={handleToggleFolderSelect}
+				onRenameFolder={handleRenameFolder}
+				onDeleteFolder={handleDeleteFolder}
+				onMoveFolder={handleMoveFolder}
+				onCreateFolder={handleCreateFolder}
+				searchQuery={debouncedSearch.trim() || undefined}
+				onPreviewDocument={(doc) => {
+					openEditorPanel({
+						documentId: doc.id,
+						searchSpaceId,
+						title: doc.title,
+					});
+				}}
+				onEditDocument={(doc) => {
+					openEditorPanel({
+						documentId: doc.id,
+						searchSpaceId,
+						title: doc.title,
+					});
+				}}
+				onDeleteDocument={(doc) => handleDeleteDocument(doc.id)}
+				onMoveDocument={handleMoveDocument}
+				onExportDocument={handleExportDocument}
+				activeTypes={activeTypes}
+				onDropIntoFolder={handleDropIntoFolder}
+				onReorderFolder={handleReorderFolder}
+				watchedFolderIds={watchedFolderIds}
+				onRescanFolder={handleRescanFolder}
+				onStopWatchingFolder={handleStopWatching}
+			/>
 			</div>
 
 			<FolderPickerDialog

From 149ccb97ddce4a56b15f1cdfce315833edf7a6c5 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 22:21:16 +0530
Subject: [PATCH 047/202] refactor: completely remove Local Folder connector
 references and update folder sync logic

---
 surfsense_web/contracts/enums/connector.ts    |  1 -
 .../contracts/enums/connectorIcons.tsx        |  3 -
 .../contracts/types/connector.types.ts        |  1 -
 surfsense_web/hooks/use-folder-sync.ts        | 62 ++++++++++++++-----
 .../lib/apis/connectors-api.service.ts        | 11 ----
 .../lib/apis/documents-api.service.ts         |  8 +++
 surfsense_web/lib/connectors/utils.ts         |  1 -
 surfsense_web/types/window.d.ts               |  8 ++-
 8 files changed, 60 insertions(+), 35 deletions(-)

diff --git a/surfsense_web/contracts/enums/connector.ts b/surfsense_web/contracts/enums/connector.ts
index ecf96d88e..501f5d9a3 100644
--- a/surfsense_web/contracts/enums/connector.ts
+++ b/surfsense_web/contracts/enums/connector.ts
@@ -25,7 +25,6 @@ export enum EnumConnectorName {
 	YOUTUBE_CONNECTOR = "YOUTUBE_CONNECTOR",
 	CIRCLEBACK_CONNECTOR = "CIRCLEBACK_CONNECTOR",
 	OBSIDIAN_CONNECTOR = "OBSIDIAN_CONNECTOR",
-	LOCAL_FOLDER_CONNECTOR = "LOCAL_FOLDER_CONNECTOR",
 	DROPBOX_CONNECTOR = "DROPBOX_CONNECTOR",
 	MCP_CONNECTOR = "MCP_CONNECTOR",
 	COMPOSIO_GOOGLE_DRIVE_CONNECTOR = "COMPOSIO_GOOGLE_DRIVE_CONNECTOR",
diff --git a/surfsense_web/contracts/enums/connectorIcons.tsx b/surfsense_web/contracts/enums/connectorIcons.tsx
index f7378b74b..2e609b060 100644
--- a/surfsense_web/contracts/enums/connectorIcons.tsx
+++ b/surfsense_web/contracts/enums/connectorIcons.tsx
@@ -3,7 +3,6 @@ import {
 	BookOpen,
 	File,
 	FileText,
-	FolderSync,
 	Globe,
 	Microscope,
 	Search,
@@ -76,8 +75,6 @@ export const getConnectorIcon = (connectorType: EnumConnectorName | string, clas
 			return <Image src="/connectors/circleback.svg" alt="Circleback" {...imgProps} />;
 		case EnumConnectorName.MCP_CONNECTOR:
 			return <Image src="/connectors/modelcontextprotocol.svg" alt="MCP" {...imgProps} />;
-		case EnumConnectorName.LOCAL_FOLDER_CONNECTOR:
-			return <FolderSync {...iconProps} />;
 		case EnumConnectorName.OBSIDIAN_CONNECTOR:
 			return <Image src="/connectors/obsidian.svg" alt="Obsidian" {...imgProps} />;
 		case EnumConnectorName.COMPOSIO_GOOGLE_DRIVE_CONNECTOR:
diff --git a/surfsense_web/contracts/types/connector.types.ts b/surfsense_web/contracts/types/connector.types.ts
index 269941375..b83e05dcc 100644
--- a/surfsense_web/contracts/types/connector.types.ts
+++ b/surfsense_web/contracts/types/connector.types.ts
@@ -30,7 +30,6 @@ export const searchSourceConnectorTypeEnum = z.enum([
 	"DROPBOX_CONNECTOR",
 	"MCP_CONNECTOR",
 	"OBSIDIAN_CONNECTOR",
-	"LOCAL_FOLDER_CONNECTOR",
 	"COMPOSIO_GOOGLE_DRIVE_CONNECTOR",
 	"COMPOSIO_GMAIL_CONNECTOR",
 	"COMPOSIO_GOOGLE_CALENDAR_CONNECTOR",
diff --git a/surfsense_web/hooks/use-folder-sync.ts b/surfsense_web/hooks/use-folder-sync.ts
index a35faf98f..fcfb2814e 100644
--- a/surfsense_web/hooks/use-folder-sync.ts
+++ b/surfsense_web/hooks/use-folder-sync.ts
@@ -1,41 +1,73 @@
 "use client";
 
 import { useEffect, useRef } from "react";
-import { connectorsApiService } from "@/lib/apis/connectors-api.service";
+import { documentsApiService } from "@/lib/apis/documents-api.service";
+
+interface FileChangedEvent {
+	rootFolderId: number | null;
+	searchSpaceId: number;
+	folderPath: string;
+	folderName: string;
+	relativePath: string;
+	fullPath: string;
+	action: string;
+	timestamp: number;
+}
 
 const DEBOUNCE_MS = 2000;
 
 export function useFolderSync() {
-	const pendingRef = useRef<Map<string, ReturnType<typeof setTimeout>>>(new Map());
+	const queueRef = useRef<FileChangedEvent[]>([]);
+	const processingRef = useRef(false);
+	const debounceTimers = useRef<Map<string, ReturnType<typeof setTimeout>>>(new Map());
+
+	async function processQueue() {
+		if (processingRef.current) return;
+		processingRef.current = true;
+		while (queueRef.current.length > 0) {
+			const event = queueRef.current.shift()!;
+			try {
+				await documentsApiService.folderIndexFile(event.searchSpaceId, {
+					folder_path: event.folderPath,
+					folder_name: event.folderName,
+					search_space_id: event.searchSpaceId,
+					target_file_path: event.fullPath,
+				});
+			} catch (err) {
+				console.error("[FolderSync] Failed to trigger re-index:", err);
+			}
+		}
+		processingRef.current = false;
+	}
 
 	useEffect(() => {
 		const api = typeof window !== "undefined" ? window.electronAPI : null;
 		if (!api?.onFileChanged) return;
 
-		const cleanup = api.onFileChanged((event) => {
-			const key = `${event.connectorId}:${event.fullPath}`;
+		// Signal to main process that the renderer is ready to receive events
+		api.signalRendererReady?.();
 
-			const existing = pendingRef.current.get(key);
+		const cleanup = api.onFileChanged((event: FileChangedEvent) => {
+			const key = `${event.folderPath}:${event.fullPath}`;
+
+			const existing = debounceTimers.current.get(key);
 			if (existing) clearTimeout(existing);
 
-			const timeout = setTimeout(async () => {
-				pendingRef.current.delete(key);
-				try {
-					await connectorsApiService.indexFile(event.connectorId, event.fullPath);
-				} catch (err) {
-					console.error("[FolderSync] Failed to trigger re-index:", err);
-				}
+			const timeout = setTimeout(() => {
+				debounceTimers.current.delete(key);
+				queueRef.current.push(event);
+				processQueue();
 			}, DEBOUNCE_MS);
 
-			pendingRef.current.set(key, timeout);
+			debounceTimers.current.set(key, timeout);
 		});
 
 		return () => {
 			cleanup();
-			for (const timeout of pendingRef.current.values()) {
+			for (const timeout of debounceTimers.current.values()) {
 				clearTimeout(timeout);
 			}
-			pendingRef.current.clear();
+			debounceTimers.current.clear();
 		};
 	}, []);
 }
diff --git a/surfsense_web/lib/apis/connectors-api.service.ts b/surfsense_web/lib/apis/connectors-api.service.ts
index f2722df70..7b94b3746 100644
--- a/surfsense_web/lib/apis/connectors-api.service.ts
+++ b/surfsense_web/lib/apis/connectors-api.service.ts
@@ -405,17 +405,6 @@ class ConnectorsApiService {
 		);
 	};
 
-	// =============================================================================
-	// Local Folder Connector Methods
-	// =============================================================================
-
-	indexFile = async (connectorId: number, filePath: string) => {
-		return baseApiService.post(
-			`/api/v1/search-source-connectors/${connectorId}/index-file`,
-			undefined,
-			{ body: { file_path: filePath } }
-		);
-	};
 }
 
 export type { SlackChannel, DiscordChannel };
diff --git a/surfsense_web/lib/apis/documents-api.service.ts b/surfsense_web/lib/apis/documents-api.service.ts
index d4a80f8a0..c77cd6848 100644
--- a/surfsense_web/lib/apis/documents-api.service.ts
+++ b/surfsense_web/lib/apis/documents-api.service.ts
@@ -395,6 +395,14 @@ class DocumentsApiService {
 		);
 	};
 
+	folderIndex = async (searchSpaceId: number, body: { folder_path: string; folder_name: string; search_space_id: number; exclude_patterns?: string[]; file_extensions?: string[]; root_folder_id?: number; enable_summary?: boolean }) => {
+		return baseApiService.post(`/api/v1/documents/folder-index`, undefined, { body });
+	};
+
+	folderIndexFile = async (searchSpaceId: number, body: { folder_path: string; folder_name: string; search_space_id: number; target_file_path: string; enable_summary?: boolean }) => {
+		return baseApiService.post(`/api/v1/documents/folder-index-file`, undefined, { body });
+	};
+
 	/**
 	 * Delete a document
 	 */
diff --git a/surfsense_web/lib/connectors/utils.ts b/surfsense_web/lib/connectors/utils.ts
index 6ce78be67..90f7f5d21 100644
--- a/surfsense_web/lib/connectors/utils.ts
+++ b/surfsense_web/lib/connectors/utils.ts
@@ -30,7 +30,6 @@ export const getConnectorTypeDisplay = (type: string): string => {
 		YOUTUBE_CONNECTOR: "YouTube",
 		CIRCLEBACK_CONNECTOR: "Circleback",
 		OBSIDIAN_CONNECTOR: "Obsidian",
-		LOCAL_FOLDER_CONNECTOR: "Local Folder",
 		DROPBOX_CONNECTOR: "Dropbox",
 		MCP_CONNECTOR: "MCP Server",
 	};
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 921449b41..b399664d6 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -5,15 +5,16 @@ interface WatchedFolderConfig {
 	name: string;
 	excludePatterns: string[];
 	fileExtensions: string[] | null;
-	connectorId: number;
+	rootFolderId: number | null;
 	searchSpaceId: number;
 	active: boolean;
 }
 
 interface FolderSyncFileChangedEvent {
-	connectorId: number;
+	rootFolderId: number | null;
 	searchSpaceId: number;
 	folderPath: string;
+	folderName: string;
 	relativePath: string;
 	fullPath: string;
 	action: "add" | "change" | "unlink";
@@ -21,7 +22,7 @@ interface FolderSyncFileChangedEvent {
 }
 
 interface FolderSyncWatcherReadyEvent {
-	connectorId: number;
+	rootFolderId: number | null;
 	folderPath: string;
 }
 
@@ -49,6 +50,7 @@ interface ElectronAPI {
 	onWatcherReady: (callback: (data: FolderSyncWatcherReadyEvent) => void) => () => void;
 	pauseWatcher: () => Promise<void>;
 	resumeWatcher: () => Promise<void>;
+	signalRendererReady: () => Promise<void>;
 }
 
 declare global {

From 22ee5c99cc9a656a3c5f0afae9c100874144e1b6 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 22:21:31 +0530
Subject: [PATCH 048/202] refactor: remove Local Folder connector and related
 tasks, implement new folder indexing endpoints

---
 surfsense_backend/app/db.py                   |   1 -
 .../app/routes/documents_routes.py            | 143 ++++++++++++++++
 .../routes/search_source_connectors_routes.py | 144 ----------------
 .../app/tasks/celery_tasks/connector_tasks.py |  46 ------
 .../app/tasks/celery_tasks/document_tasks.py  |  66 ++++++++
 .../app/tasks/connector_indexers/__init__.py  |   2 -
 .../local_folder_indexer.py                   | 155 ++++++------------
 .../tests/integration/conftest.py             |  19 ---
 .../test_local_folder_pipeline.py             | 126 +++++++-------
 9 files changed, 326 insertions(+), 376 deletions(-)

diff --git a/surfsense_backend/app/db.py b/surfsense_backend/app/db.py
index 25045e84a..1a4d3ea06 100644
--- a/surfsense_backend/app/db.py
+++ b/surfsense_backend/app/db.py
@@ -110,7 +110,6 @@ class SearchSourceConnectorType(StrEnum):
     COMPOSIO_GOOGLE_DRIVE_CONNECTOR = "COMPOSIO_GOOGLE_DRIVE_CONNECTOR"
     COMPOSIO_GMAIL_CONNECTOR = "COMPOSIO_GMAIL_CONNECTOR"
     COMPOSIO_GOOGLE_CALENDAR_CONNECTOR = "COMPOSIO_GOOGLE_CALENDAR_CONNECTOR"
-    LOCAL_FOLDER_CONNECTOR = "LOCAL_FOLDER_CONNECTOR"
 
 
 class PodcastStatus(StrEnum):
diff --git a/surfsense_backend/app/routes/documents_routes.py b/surfsense_backend/app/routes/documents_routes.py
index 2d999eae3..d7974f9ff 100644
--- a/surfsense_backend/app/routes/documents_routes.py
+++ b/surfsense_backend/app/routes/documents_routes.py
@@ -2,6 +2,7 @@
 import asyncio
 
 from fastapi import APIRouter, Depends, Form, HTTPException, UploadFile
+from pydantic import BaseModel as PydanticBaseModel
 from sqlalchemy.ext.asyncio import AsyncSession
 from sqlalchemy.future import select
 from sqlalchemy.orm import selectinload
@@ -11,6 +12,7 @@ from app.db import (
     Document,
     DocumentType,
     DocumentVersion,
+    Folder,
     Permission,
     SearchSpace,
     SearchSpaceMembership,
@@ -1258,3 +1260,144 @@ async def restore_document_version(
         "document_id": document_id,
         "restored_version": version_number,
     }
+
+
+# ===== Local folder indexing endpoints =====
+
+
+class FolderIndexRequest(PydanticBaseModel):  # body of POST /documents/folder-index
+    folder_path: str  # folder to scan; the indexer aborts if it does not exist
+    folder_name: str  # name given to the root Folder row when one is created
+    search_space_id: int  # space the caller must hold DOCUMENTS_CREATE on
+    exclude_patterns: list[str] | None = None  # None -> indexer's DEFAULT_EXCLUDE_PATTERNS
+    file_extensions: list[str] | None = None  # passed to scan_folder; presumably None = all
+    root_folder_id: int | None = None  # existing root Folder to reuse, if any
+    enable_summary: bool = False  # allows LLM summaries when an LLM is available
+
+
+class FolderIndexFileRequest(PydanticBaseModel):  # body of POST /documents/folder-index-file
+    folder_path: str  # watched folder that must contain target_file_path
+    folder_name: str  # forwarded to the indexing task unchanged
+    search_space_id: int  # space the caller must hold DOCUMENTS_CREATE on
+    target_file_path: str  # the single file to index
+    enable_summary: bool = False  # forwarded to the indexing task unchanged
+
+
+@router.post("/documents/folder-index")
+async def folder_index(
+    request: FolderIndexRequest,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """Start a full-scan index of a local folder (self-hosted mode only).
+    Reuses root_folder_id only when that Folder is in the requested search space;
+    otherwise creates one. Indexing runs in Celery; returns the root_folder_id.
+    """
+    from app.config import config as app_config
+
+    if not app_config.is_self_hosted():
+        raise HTTPException(
+            status_code=400,
+            detail="Local folder indexing is only available in self-hosted mode",
+        )
+
+    await check_permission(
+        session,
+        user,
+        request.search_space_id,
+        Permission.DOCUMENTS_CREATE.value,
+        "You don't have permission to create documents in this search space",
+    )
+
+    root_folder_id = request.root_folder_id
+    if root_folder_id:
+        # Only reuse a root folder owned by the requested search space; the
+        # permission check above covers that space and no other.
+        owned_root = select(Folder.id).where(
+            Folder.id == root_folder_id,
+            Folder.search_space_id == request.search_space_id,
+        )
+        root_folder_id = (await session.execute(owned_root)).scalar_one_or_none()
+
+    if not root_folder_id:
+        root_folder = Folder(
+            name=request.folder_name,
+            search_space_id=request.search_space_id,
+            created_by_id=str(user.id),
+            position="a0",
+        )
+        session.add(root_folder)
+        await session.flush()  # assigns root_folder.id before the commit
+        root_folder_id = root_folder.id
+        await session.commit()  # the Celery task reads the row from its own session
+
+    from app.tasks.celery_tasks.document_tasks import index_local_folder_task
+
+    index_local_folder_task.delay(
+        search_space_id=request.search_space_id,
+        user_id=str(user.id),
+        folder_path=request.folder_path,
+        folder_name=request.folder_name,
+        exclude_patterns=request.exclude_patterns,
+        file_extensions=request.file_extensions,
+        root_folder_id=root_folder_id,
+        enable_summary=request.enable_summary,
+    )
+
+    return {
+        "message": "Folder indexing started",
+        "status": "processing",
+        "root_folder_id": root_folder_id,
+    }
+
+
+@router.post("/documents/folder-index-file")
+async def folder_index_file(
+    request: FolderIndexFileRequest,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """Queue indexing of one file inside a watched folder (chokidar trigger).
+    Rejects with 400 unless the resolved target_file_path is under folder_path.
+    """
+    from app.config import config as app_config
+
+    if not app_config.is_self_hosted():
+        raise HTTPException(
+            status_code=400,
+            detail="Local folder indexing is only available in self-hosted mode",
+        )
+
+    await check_permission(
+        session,
+        user,
+        request.search_space_id,
+        Permission.DOCUMENTS_CREATE.value,
+        "You don't have permission to create documents in this search space",
+    )
+
+    from pathlib import Path
+
+    # Compare resolved paths: a lexical relative_to() accepts "<folder>/../x".
+    folder_root = Path(request.folder_path).resolve()
+    if not Path(request.target_file_path).resolve().is_relative_to(folder_root):
+        raise HTTPException(
+            status_code=400,
+            detail="target_file_path must be inside folder_path",
+        )
+
+    from app.tasks.celery_tasks.document_tasks import index_local_folder_task
+
+    index_local_folder_task.delay(
+        search_space_id=request.search_space_id,
+        user_id=str(user.id),
+        folder_path=request.folder_path,
+        folder_name=request.folder_name,
+        target_file_path=request.target_file_path,
+        enable_summary=request.enable_summary,
+    )
+
+    return {
+        "message": "File indexing started",
+        "status": "processing",
+    }
diff --git a/surfsense_backend/app/routes/search_source_connectors_routes.py b/surfsense_backend/app/routes/search_source_connectors_routes.py
index 5ea88c418..f49ba2d5d 100644
--- a/surfsense_backend/app/routes/search_source_connectors_routes.py
+++ b/surfsense_backend/app/routes/search_source_connectors_routes.py
@@ -1170,24 +1170,6 @@ async def index_connector_content(
             )
             response_message = "Obsidian vault indexing started in the background."
 
-        elif connector.connector_type == SearchSourceConnectorType.LOCAL_FOLDER_CONNECTOR:
-            from app.config import config as app_config
-            from app.tasks.celery_tasks.connector_tasks import index_local_folder_task
-
-            if not app_config.is_self_hosted():
-                raise HTTPException(
-                    status_code=400,
-                    detail="Local folder connector is only available in self-hosted mode",
-                )
-
-            logger.info(
-                f"Triggering local folder indexing for connector {connector_id} into search space {search_space_id}"
-            )
-            index_local_folder_task.delay(
-                connector_id, search_space_id, str(user.id), indexing_from, indexing_to
-            )
-            response_message = "Local folder indexing started in the background."
-
         elif (
             connector.connector_type
             == SearchSourceConnectorType.COMPOSIO_GOOGLE_DRIVE_CONNECTOR
@@ -1320,76 +1302,6 @@ async def index_connector_content(
         ) from e
 
 
-class IndexFileRequest(BaseModel):
-    file_path: str = Field(..., description="Absolute path to the file to index")
-
-
-@router.post(
-    "/search-source-connectors/{connector_id}/index-file",
-    response_model=dict[str, Any],
-)
-async def index_single_file(
-    connector_id: int,
-    body: IndexFileRequest,
-    session: AsyncSession = Depends(get_async_session),
-    user: User = Depends(current_active_user),
-):
-    """Index a single file from a local folder connector (chokidar real-time trigger)."""
-    from app.config import config as app_config
-    from app.tasks.celery_tasks.connector_tasks import index_local_folder_task
-
-    if not app_config.is_self_hosted():
-        raise HTTPException(
-            status_code=400,
-            detail="Local folder connector is only available in self-hosted mode",
-        )
-
-    result = await session.execute(
-        select(SearchSourceConnector).filter(
-            SearchSourceConnector.id == connector_id,
-            SearchSourceConnector.connector_type
-            == SearchSourceConnectorType.LOCAL_FOLDER_CONNECTOR,
-        )
-    )
-    connector = result.scalars().first()
-    if not connector:
-        raise HTTPException(status_code=404, detail="Local folder connector not found")
-
-    await check_permission(session, user, connector.search_space_id, Permission.CONNECTORS_UPDATE.value)
-
-    folder_path = connector.config.get("folder_path", "")
-
-    # Security: resolve symlinks and verify the file is inside folder_path
-    try:
-        resolved_file = os.path.realpath(body.file_path)
-        resolved_folder = os.path.realpath(folder_path)
-        if not resolved_file.startswith(resolved_folder + os.sep) and resolved_file != resolved_folder:
-            raise HTTPException(
-                status_code=403,
-                detail="File path is outside the configured folder",
-            )
-    except (OSError, ValueError):
-        raise HTTPException(
-            status_code=403,
-            detail="Invalid file path",
-        )
-
-    index_local_folder_task.delay(
-        connector_id,
-        connector.search_space_id,
-        str(user.id),
-        None,
-        None,
-        target_file_path=resolved_file,
-    )
-
-    return {
-        "message": "Single file indexing started",
-        "connector_id": connector_id,
-        "file_path": body.file_path,
-    }
-
-
 async def _update_connector_timestamp_by_id(session: AsyncSession, connector_id: int):
     """
     Update the last_indexed_at timestamp for a connector by its ID.
@@ -3166,62 +3078,6 @@ async def run_obsidian_indexing(
     )
 
 
-async def run_local_folder_indexing_with_new_session(
-    connector_id: int,
-    search_space_id: int,
-    user_id: str,
-    start_date: str,
-    end_date: str,
-    target_file_path: str | None = None,
-):
-    """Wrapper to run local folder indexing with its own database session."""
-    logger.info(
-        f"Background task started: Indexing local folder connector {connector_id} into space {search_space_id}"
-    )
-    async with async_session_maker() as session:
-        await run_local_folder_indexing(
-            session, connector_id, search_space_id, user_id, start_date, end_date,
-            target_file_path=target_file_path,
-        )
-    logger.info(f"Background task finished: Indexing local folder connector {connector_id}")
-
-
-async def run_local_folder_indexing(
-    session: AsyncSession,
-    connector_id: int,
-    search_space_id: int,
-    user_id: str,
-    start_date: str,
-    end_date: str,
-    target_file_path: str | None = None,
-):
-    """Background task to run local folder indexing."""
-    from app.tasks.connector_indexers import index_local_folder
-
-    await _run_indexing_with_notifications(
-        session=session,
-        connector_id=connector_id,
-        search_space_id=search_space_id,
-        user_id=user_id,
-        start_date=start_date,
-        end_date=end_date,
-        indexing_function=lambda session, connector_id, search_space_id, user_id,
-        start_date, end_date, update_last_indexed, on_heartbeat_callback: index_local_folder(
-            session=session,
-            connector_id=connector_id,
-            search_space_id=search_space_id,
-            user_id=user_id,
-            start_date=start_date,
-            end_date=end_date,
-            update_last_indexed=update_last_indexed,
-            on_heartbeat_callback=on_heartbeat_callback,
-            target_file_path=target_file_path,
-        ),
-        update_timestamp_func=_update_connector_timestamp_by_id,
-        supports_heartbeat_callback=True,
-    )
-
-
 async def run_composio_indexing_with_new_session(
     connector_id: int,
     search_space_id: int,
diff --git a/surfsense_backend/app/tasks/celery_tasks/connector_tasks.py b/surfsense_backend/app/tasks/celery_tasks/connector_tasks.py
index 9ff578ad2..57475c9fd 100644
--- a/surfsense_backend/app/tasks/celery_tasks/connector_tasks.py
+++ b/surfsense_backend/app/tasks/celery_tasks/connector_tasks.py
@@ -926,52 +926,6 @@ async def _index_obsidian_vault(
         )
 
 
-@celery_app.task(name="index_local_folder", bind=True)
-def index_local_folder_task(
-    self,
-    connector_id: int,
-    search_space_id: int,
-    user_id: str,
-    start_date: str = None,
-    end_date: str = None,
-    target_file_path: str = None,
-):
-    """Celery task to index a local folder."""
-    import asyncio
-
-    loop = asyncio.new_event_loop()
-    asyncio.set_event_loop(loop)
-
-    try:
-        loop.run_until_complete(
-            _index_local_folder(
-                connector_id, search_space_id, user_id, start_date, end_date, target_file_path
-            )
-        )
-    finally:
-        loop.close()
-
-
-async def _index_local_folder(
-    connector_id: int,
-    search_space_id: int,
-    user_id: str,
-    start_date: str = None,
-    end_date: str = None,
-    target_file_path: str = None,
-):
-    """Index local folder with new session."""
-    from app.routes.search_source_connectors_routes import (
-        run_local_folder_indexing,
-    )
-
-    async with get_celery_session_maker()() as session:
-        await run_local_folder_indexing(
-            session, connector_id, search_space_id, user_id, start_date, end_date,
-            target_file_path=target_file_path,
-        )
-
-
 @celery_app.task(name="index_composio_connector", bind=True)
 def index_composio_connector_task(
     self,
diff --git a/surfsense_backend/app/tasks/celery_tasks/document_tasks.py b/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
index 662b41f2a..110f3deee 100644
--- a/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
+++ b/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
@@ -10,6 +10,7 @@ from app.config import config
 from app.services.notification_service import NotificationService
 from app.services.task_logging_service import TaskLoggingService
 from app.tasks.celery_tasks import get_celery_session_maker
+from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
 from app.tasks.document_processors import (
     add_extension_received_document,
     add_youtube_video_document,
@@ -1243,3 +1244,68 @@ async def _process_circleback_meeting(
                 heartbeat_task.cancel()
             if notification:
                 _stop_heartbeat(notification.id)
+
+
+# ===== Local folder indexing task =====
+
+
+@celery_app.task(name="index_local_folder", bind=True)
+def index_local_folder_task(
+    self,
+    search_space_id: int,
+    user_id: str,
+    folder_path: str,
+    folder_name: str,
+    exclude_patterns: list[str] | None = None,
+    file_extensions: list[str] | None = None,
+    root_folder_id: int | None = None,
+    enable_summary: bool = False,
+    target_file_path: str | None = None,  # set -> single-file mode, None -> full scan
+):
+    """Celery task: index a local folder from explicit arguments (no connector row)."""
+    loop = asyncio.new_event_loop()  # this sync task drives the coroutine on its own loop
+    asyncio.set_event_loop(loop)
+
+    try:
+        loop.run_until_complete(
+            _index_local_folder_async(
+                search_space_id=search_space_id,
+                user_id=user_id,
+                folder_path=folder_path,
+                folder_name=folder_name,
+                exclude_patterns=exclude_patterns,
+                file_extensions=file_extensions,
+                root_folder_id=root_folder_id,
+                enable_summary=enable_summary,
+                target_file_path=target_file_path,
+            )
+        )
+    finally:
+        loop.close()  # always release the loop, even when indexing raised
+
+
+async def _index_local_folder_async(
+    search_space_id: int,
+    user_id: str,
+    folder_path: str,
+    folder_name: str,
+    exclude_patterns: list[str] | None = None,
+    file_extensions: list[str] | None = None,
+    root_folder_id: int | None = None,
+    enable_summary: bool = False,
+    target_file_path: str | None = None,
+):
+    """Open a session from get_celery_session_maker() and run index_local_folder in it."""
+    async with get_celery_session_maker()() as session:
+        await index_local_folder(  # the returned result tuple is not propagated
+            session=session,
+            search_space_id=search_space_id,
+            user_id=user_id,
+            folder_path=folder_path,
+            folder_name=folder_name,
+            exclude_patterns=exclude_patterns,
+            file_extensions=file_extensions,
+            root_folder_id=root_folder_id,
+            enable_summary=enable_summary,
+            target_file_path=target_file_path,
+        )
diff --git a/surfsense_backend/app/tasks/connector_indexers/__init__.py b/surfsense_backend/app/tasks/connector_indexers/__init__.py
index 8e4ad69e5..1b032d54a 100644
--- a/surfsense_backend/app/tasks/connector_indexers/__init__.py
+++ b/surfsense_backend/app/tasks/connector_indexers/__init__.py
@@ -44,7 +44,6 @@ from .jira_indexer import index_jira_issues
 from .linear_indexer import index_linear_issues
 
 # Documentation and knowledge management
-from .local_folder_indexer import index_local_folder
 from .luma_indexer import index_luma_events
 from .notion_indexer import index_notion_pages
 from .obsidian_indexer import index_obsidian_vault
@@ -75,5 +74,4 @@ __all__ = [  # noqa: RUF022
     # Communication platforms
     "index_slack_messages",
     "index_google_gmail_messages",
-    "index_local_folder",
 ]
diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
index fc7fdaf66..591914625 100644
--- a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -1,5 +1,5 @@
 """
-Local folder connector indexer.
+Local folder indexer.
 
 Indexes files from a local folder on disk. Supports:
 - Full-scan mode (startup reconciliation / manual trigger)
@@ -8,7 +8,9 @@ Indexes files from a local folder on disk. Supports:
 - Document versioning via create_version_snapshot
 - ETL-based file parsing for binary formats (PDF, DOCX, images, audio, etc.)
 
-Electron-only: all change detection is driven by chokidar in the desktop app.
+Desktop-only: all change detection is driven by chokidar in the desktop app.
+Config (folder_path, exclude_patterns, etc.) is passed in from the caller —
+no connector row is read.
 """
 
 import os
@@ -17,10 +19,9 @@ from collections.abc import Awaitable, Callable
 from datetime import UTC, datetime
 from pathlib import Path
 
-from sqlalchemy import delete, select
+from sqlalchemy import select
 from sqlalchemy.exc import SQLAlchemyError
 from sqlalchemy.ext.asyncio import AsyncSession
-from sqlalchemy.orm.attributes import flag_modified
 
 from app.config import config
 from app.db import (
@@ -28,7 +29,6 @@ from app.db import (
     DocumentStatus,
     DocumentType,
     Folder,
-    SearchSourceConnectorType,
 )
 from app.services.llm_service import get_user_long_context_llm
 from app.services.task_logging_service import TaskLoggingService
@@ -45,11 +45,9 @@ from .base import (
     build_document_metadata_string,
     check_document_by_unique_identifier,
     check_duplicate_document_by_hash,
-    get_connector_by_id,
     get_current_timestamp,
     logger,
     safe_set_chunks,
-    update_connector_last_indexed,
 )
 
 PLAINTEXT_EXTENSIONS = frozenset({
@@ -131,12 +129,10 @@ def scan_folder(
     for dirpath, dirnames, filenames in os.walk(root):
         rel_dir = Path(dirpath).relative_to(root)
 
-        # Prune excluded directories in-place so os.walk skips them
         dirnames[:] = [
             d for d in dirnames if d not in exclude_patterns
         ]
 
-        # Check if the current directory itself is excluded
         if any(part in exclude_patterns for part in rel_dir.parts):
             continue
 
@@ -232,20 +228,18 @@ async def _mirror_folder_structure(
     folder_name: str,
     search_space_id: int,
     user_id: str,
-    connector_config: dict,
-    connector,
+    root_folder_id: int | None = None,
     exclude_patterns: list[str] | None = None,
-) -> dict[str, int]:
+) -> tuple[dict[str, int], int]:
     """Mirror the local filesystem directory structure into DB Folder rows.
 
-    Returns a mapping of relative_dir_path -> folder_id.
-    The empty string key ("") maps to the root folder.
+    Returns (mapping, root_folder_id) where mapping is
+    relative_dir_path -> folder_id. The empty string key maps to the root folder.
     """
     root = Path(folder_path)
     if exclude_patterns is None:
         exclude_patterns = []
 
-    # Collect all subdirectory paths relative to root
     subdirs: list[str] = []
     for dirpath, dirnames, _ in os.walk(root):
         dirnames[:] = [d for d in dirnames if d not in exclude_patterns]
@@ -256,13 +250,10 @@ async def _mirror_folder_structure(
         if rel_str:
             subdirs.append(rel_str)
 
-    # Sort by depth so parents are created before children
     subdirs.sort(key=lambda p: p.count(os.sep))
 
     mapping: dict[str, int] = {}
 
-    # Get or create root folder
-    root_folder_id = connector_config.get("root_folder_id")
     if root_folder_id:
         existing = (
             await session.execute(
@@ -284,12 +275,8 @@ async def _mirror_folder_structure(
         session.add(root_folder)
         await session.flush()
         mapping[""] = root_folder.id
-        # Persist root_folder_id into connector config
-        connector_config["root_folder_id"] = root_folder.id
-        connector.config = {**connector.config, "root_folder_id": root_folder.id}
-        flag_modified(connector, "config")
+        root_folder_id = root_folder.id
 
-    # Create/reuse subdirectory Folder rows
     for rel_dir in subdirs:
         dir_parts = Path(rel_dir).parts
         dir_name = dir_parts[-1]
@@ -322,7 +309,7 @@ async def _mirror_folder_structure(
             mapping[rel_dir] = new_folder.id
 
     await session.flush()
-    return mapping
+    return mapping, root_folder_id
 
 
 async def _cleanup_empty_folders(
@@ -332,16 +319,11 @@ async def _cleanup_empty_folders(
     existing_dirs_on_disk: set[str],
     folder_mapping: dict[str, int],
 ) -> None:
-    """Delete Folder rows that are empty (no docs, no children) and no longer on disk.
+    """Delete Folder rows that are empty (no docs, no children) and no longer on disk."""
+    from sqlalchemy import delete as sa_delete
 
-    Queries ALL folders under this search space (not just the current mapping)
-    so that stale folders from previous syncs are also cleaned up.
-    """
-    # Build a reverse mapping from folder_id → rel_dir for known dirs
     id_to_rel: dict[int, str] = {fid: rel for rel, fid in folder_mapping.items() if rel}
 
-    # Also find any folders in the DB that are children of the root but NOT
-    # in the current mapping (stale from a previous sync).
     all_folders = (
         await session.execute(
             select(Folder).where(
@@ -351,7 +333,6 @@ async def _cleanup_empty_folders(
         )
     ).scalars().all()
 
-    # Build candidates: folders not on disk that we might delete
     candidates: list[Folder] = []
     for folder in all_folders:
         rel = id_to_rel.get(folder.id)
@@ -359,8 +340,6 @@ async def _cleanup_empty_folders(
             continue
         candidates.append(folder)
 
-    # Sort deepest first (by name depth heuristic — folders with no children first)
-    # Repeat until no more deletions happen (cascading empty parents)
     changed = True
     while changed:
         changed = False
@@ -384,57 +363,46 @@ async def _cleanup_empty_folders(
                 remaining.append(folder)
                 continue
 
-            await session.execute(delete(Folder).where(Folder.id == folder.id))
+            await session.execute(sa_delete(Folder).where(Folder.id == folder.id))
             changed = True
         candidates = remaining
 
 
 async def index_local_folder(
     session: AsyncSession,
-    connector_id: int,
     search_space_id: int,
     user_id: str,
-    start_date: str | None = None,
-    end_date: str | None = None,
-    update_last_indexed: bool = True,
-    on_heartbeat_callback: HeartbeatCallbackType | None = None,
+    folder_path: str,
+    folder_name: str,
+    exclude_patterns: list[str] | None = None,
+    file_extensions: list[str] | None = None,
+    root_folder_id: int | None = None,
+    enable_summary: bool = False,
     target_file_path: str | None = None,
-) -> tuple[int, int, str | None]:
+    on_heartbeat_callback: HeartbeatCallbackType | None = None,
+) -> tuple[int, int, int | None, str | None]:
     """Index files from a local folder.
 
     Supports two modes:
     - Full scan (target_file_path=None): walks entire folder, handles new/changed/deleted files.
     - Single-file (target_file_path set): processes only that file.
 
-    Returns (indexed_count, skipped_count, error_or_warning_message).
+    Returns (indexed_count, skipped_count, root_folder_id, error_or_warning_message).
     """
     task_logger = TaskLoggingService(session, search_space_id)
 
     log_entry = await task_logger.log_task_start(
         task_name="local_folder_indexing",
-        source="connector_indexing_task",
-        message=f"Starting local folder indexing for connector {connector_id}",
+        source="local_folder_indexing_task",
+        message=f"Starting local folder indexing for {folder_name}",
         metadata={
-            "connector_id": connector_id,
+            "folder_path": folder_path,
             "user_id": str(user_id),
             "target_file_path": target_file_path,
         },
     )
 
     try:
-        connector = await get_connector_by_id(
-            session, connector_id, SearchSourceConnectorType.LOCAL_FOLDER_CONNECTOR
-        )
-        if not connector:
-            await task_logger.log_task_failure(
-                log_entry,
-                f"Connector {connector_id} not found",
-                "Connector not found",
-                {},
-            )
-            return 0, 0, f"Connector {connector_id} not found"
-
-        folder_path = connector.config.get("folder_path")
         if not folder_path or not os.path.exists(folder_path):
             await task_logger.log_task_failure(
                 log_entry,
@@ -442,59 +410,54 @@ async def index_local_folder(
                 "Folder not found",
                 {},
             )
-            return 0, 0, f"Folder path missing or does not exist: {folder_path}"
+            return 0, 0, root_folder_id, f"Folder path missing or does not exist: {folder_path}"
 
-        folder_name = connector.config.get("folder_name") or os.path.basename(folder_path)
-        exclude_patterns = connector.config.get("exclude_patterns", DEFAULT_EXCLUDE_PATTERNS)
-        file_extensions = connector.config.get("file_extensions")  # None = all
+        if exclude_patterns is None:
+            exclude_patterns = DEFAULT_EXCLUDE_PATTERNS
 
         # ====================================================================
         # SINGLE-FILE MODE
         # ====================================================================
         if target_file_path:
-            return await _index_single_file(
+            indexed, skipped, err = await _index_single_file(
                 session=session,
-                connector=connector,
-                connector_id=connector_id,
                 search_space_id=search_space_id,
                 user_id=user_id,
                 folder_path=folder_path,
                 folder_name=folder_name,
                 target_file_path=target_file_path,
+                enable_summary=enable_summary,
                 task_logger=task_logger,
                 log_entry=log_entry,
-                update_last_indexed=update_last_indexed,
             )
+            return indexed, skipped, root_folder_id, err
 
         # ====================================================================
         # FULL-SCAN MODE
         # ====================================================================
 
-        # Phase 0: Mirror folder structure
         await task_logger.log_task_progress(
             log_entry, "Mirroring folder structure", {"stage": "folder_mirror"}
         )
 
-        folder_mapping = await _mirror_folder_structure(
+        folder_mapping, root_folder_id = await _mirror_folder_structure(
             session=session,
             folder_path=folder_path,
             folder_name=folder_name,
             search_space_id=search_space_id,
             user_id=user_id,
-            connector_config=connector.config,
-            connector=connector,
+            root_folder_id=root_folder_id,
             exclude_patterns=exclude_patterns,
         )
         await session.flush()
 
-        # Scan files on disk
         try:
             files = scan_folder(folder_path, file_extensions, exclude_patterns)
         except Exception as e:
             await task_logger.log_task_failure(
                 log_entry, f"Failed to scan folder: {e}", "Scan error", {}
             )
-            return 0, 0, f"Failed to scan folder: {e}"
+            return 0, 0, root_folder_id, f"Failed to scan folder: {e}"
 
         logger.info(f"Found {len(files)} files in folder")
 
@@ -530,7 +493,6 @@ async def index_local_folder(
                 )
 
                 if existing_document:
-                    # Check mtime first (cheap)
                     stored_mtime = (existing_document.document_metadata or {}).get("mtime")
                     current_mtime = file_info["modified_at"].timestamp()
 
@@ -542,7 +504,6 @@ async def index_local_folder(
                         skipped_count += 1
                         continue
 
-                    # mtime differs — read file and check content hash
                     try:
                         content, content_hash = await _compute_file_content_hash(
                             file_path_abs, file_info["relative_path"], search_space_id
@@ -553,7 +514,6 @@ async def index_local_folder(
                         continue
 
                     if existing_document.content_hash == content_hash:
-                        # Content same, just update mtime in metadata
                         meta = dict(existing_document.document_metadata or {})
                         meta["mtime"] = current_mtime
                         existing_document.document_metadata = meta
@@ -564,7 +524,6 @@ async def index_local_folder(
                         skipped_count += 1
                         continue
 
-                    # Content actually changed — snapshot version, queue for re-index
                     await create_version_snapshot(session, existing_document)
 
                     files_to_process.append(
@@ -581,7 +540,6 @@ async def index_local_folder(
                     )
                     continue
 
-                # New document — read content
                 try:
                     content, content_hash = await _compute_file_content_hash(
                         file_path_abs, file_info["relative_path"], search_space_id
@@ -595,7 +553,6 @@ async def index_local_folder(
                     skipped_count += 1
                     continue
 
-                # Check for duplicate content from another connector
                 with session.no_autoflush:
                     dup = await check_duplicate_document_by_hash(session, content_hash)
                 if dup:
@@ -603,7 +560,6 @@ async def index_local_folder(
                     skipped_count += 1
                     continue
 
-                # Determine folder_id for this file
                 parent_dir = str(Path(relative_path).parent)
                 if parent_dir == ".":
                     parent_dir = ""
@@ -616,17 +572,16 @@ async def index_local_folder(
                     document_metadata={
                         "folder_name": folder_name,
                         "file_path": relative_path,
-                        "connector_id": connector_id,
                         "mtime": file_info["modified_at"].timestamp(),
                     },
                     content="Pending...",
-                    content_hash=unique_identifier_hash,  # Temp unique — updated in phase 2
+                    content_hash=unique_identifier_hash,
                     unique_identifier_hash=unique_identifier_hash,
                     embedding=None,
                     status=DocumentStatus.pending(),
                     updated_at=get_current_timestamp(),
                     created_by_id=user_id,
-                    connector_id=connector_id,
+                    connector_id=None,
                     folder_id=folder_id,
                 )
                 session.add(document)
@@ -655,16 +610,17 @@ async def index_local_folder(
         # ================================================================
         # PHASE 1.5: Delete documents no longer on disk
         # ================================================================
-        all_connector_docs = (
+        all_folder_docs = (
             await session.execute(
                 select(Document).where(
-                    Document.connector_id == connector_id,
                     Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == search_space_id,
+                    Document.folder_id.in_(list(folder_mapping.values())),
                 )
             )
         ).scalars().all()
 
-        for doc in all_connector_docs:
+        for doc in all_folder_docs:
             if doc.unique_identifier_hash not in seen_unique_hashes:
                 await session.delete(doc)
 
@@ -709,7 +665,7 @@ async def index_local_folder(
                 document_string = build_document_metadata_string(metadata_sections)
 
                 summary_content = ""
-                if long_context_llm and connector.enable_summary:
+                if long_context_llm and enable_summary:
                     doc_meta = {
                         "folder_name": folder_name,
                         "file_path": relative_path,
@@ -721,7 +677,6 @@ async def index_local_folder(
                 embedding = embed_text(document_string)
                 chunks = await create_document_chunks(document_string)
 
-                # Determine folder_id
                 parent_dir = str(Path(relative_path).parent)
                 if parent_dir == ".":
                     parent_dir = ""
@@ -735,7 +690,6 @@ async def index_local_folder(
                 document.document_metadata = {
                     "folder_name": folder_name,
                     "file_path": relative_path,
-                    "connector_id": connector_id,
                     "summary": summary_content,
                     "mtime": file_info["modified_at"].timestamp(),
                 }
@@ -782,8 +736,6 @@ async def index_local_folder(
                 session, root_fid, search_space_id, existing_dirs, folder_mapping
             )
 
-        await update_connector_last_indexed(session, connector, update_last_indexed)
-
         try:
             await session.commit()
         except Exception as e:
@@ -802,7 +754,7 @@ async def index_local_folder(
 
         await task_logger.log_task_success(
             log_entry,
-            f"Completed local folder indexing for connector {connector_id}",
+            f"Completed local folder indexing for {folder_name}",
             {
                 "indexed": indexed_count,
                 "skipped": skipped_count,
@@ -811,7 +763,7 @@ async def index_local_folder(
             },
         )
 
-        return indexed_count, skipped_count, warning_message
+        return indexed_count, skipped_count, root_folder_id, warning_message
 
     except SQLAlchemyError as e:
         logger.exception(f"Database error during local folder indexing: {e}")
@@ -819,34 +771,31 @@ async def index_local_folder(
         await task_logger.log_task_failure(
             log_entry, f"DB error: {e}", "Database error", {}
         )
-        return 0, 0, f"Database error: {e}"
+        return 0, 0, root_folder_id, f"Database error: {e}"
 
     except Exception as e:
         logger.exception(f"Error during local folder indexing: {e}")
         await task_logger.log_task_failure(
             log_entry, f"Error: {e}", "Unexpected error", {}
         )
-        return 0, 0, str(e)
+        return 0, 0, root_folder_id, str(e)
 
 
 async def _index_single_file(
     session: AsyncSession,
-    connector,
-    connector_id: int,
     search_space_id: int,
     user_id: str,
     folder_path: str,
     folder_name: str,
     target_file_path: str,
+    enable_summary: bool,
     task_logger,
     log_entry,
-    update_last_indexed: bool = True,
 ) -> tuple[int, int, str | None]:
     """Process a single file (chokidar real-time trigger)."""
     try:
         full_path = Path(target_file_path)
         if not full_path.exists():
-            # File was deleted — find and remove the document
             rel = str(full_path.relative_to(folder_path))
             unique_id = f"{folder_name}:{rel}"
             uid_hash = generate_unique_identifier_hash(
@@ -880,7 +829,6 @@ async def _index_single_file(
 
         if existing:
             if existing.content_hash == content_hash:
-                # Update mtime
                 mtime = full_path.stat().st_mtime
                 meta = dict(existing.document_metadata or {})
                 meta["mtime"] = mtime
@@ -888,10 +836,8 @@ async def _index_single_file(
                 await session.commit()
                 return 0, 1, None
 
-            # Content changed — snapshot + re-index
             await create_version_snapshot(session, existing)
 
-        # Get LLM
         long_context_llm = await get_user_long_context_llm(
             session, user_id, search_space_id
         )
@@ -906,7 +852,7 @@ async def _index_single_file(
         document_string = build_document_metadata_string(metadata_sections)
 
         summary_content = ""
-        if long_context_llm and connector.enable_summary:
+        if long_context_llm and enable_summary:
             summary_content, _ = await generate_document_summary(
                 document_string, long_context_llm, {"folder_name": folder_name, "file_path": rel_path}
             )
@@ -917,7 +863,6 @@ async def _index_single_file(
         doc_metadata = {
             "folder_name": folder_name,
             "file_path": rel_path,
-            "connector_id": connector_id,
             "summary": summary_content,
             "mtime": mtime,
         }
@@ -946,16 +891,14 @@ async def _index_single_file(
                 status=DocumentStatus.ready(),
                 updated_at=get_current_timestamp(),
                 created_by_id=user_id,
-                connector_id=connector_id,
+                connector_id=None,
             )
             session.add(document)
-            # Set chunks
             await session.flush()
             for chunk in chunks:
                 chunk.document_id = document.id
             session.add_all(chunks)
 
-        await update_connector_last_indexed(session, connector, update_last_indexed)
         await session.commit()
 
         await task_logger.log_task_success(
diff --git a/surfsense_backend/tests/integration/conftest.py b/surfsense_backend/tests/integration/conftest.py
index 840246e2f..9c91011ae 100644
--- a/surfsense_backend/tests/integration/conftest.py
+++ b/surfsense_backend/tests/integration/conftest.py
@@ -168,22 +168,3 @@ def make_connector_document(db_connector, db_user):
     return _make
 
 
-@pytest_asyncio.fixture
-async def db_local_folder_connector(
-    db_session: AsyncSession, db_user: User, db_search_space: SearchSpace, tmp_path
-) -> SearchSourceConnector:
-    connector = SearchSourceConnector(
-        name="Test Local Folder",
-        connector_type=SearchSourceConnectorType.LOCAL_FOLDER_CONNECTOR,
-        config={
-            "folder_path": str(tmp_path),
-            "folder_name": "test-folder",
-            "exclude_patterns": [],
-            "file_extensions": None,
-        },
-        search_space_id=db_search_space.id,
-        user_id=db_user.id,
-    )
-    db_session.add(connector)
-    await db_session.flush()
-    return connector
diff --git a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
index 988905f8f..e46d59a67 100644
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
@@ -14,7 +14,6 @@ from app.db import (
     DocumentType,
     DocumentVersion,
     Folder,
-    SearchSourceConnector,
     SearchSpace,
     User,
 )
@@ -72,7 +71,6 @@ class TestFullIndexer:
     async def test_i1_new_file_indexed(
         self,
         db_session: AsyncSession,
-        db_local_folder_connector: SearchSourceConnector,
         db_user: User,
         db_search_space: SearchSpace,
         tmp_path: Path,
@@ -82,11 +80,12 @@ class TestFullIndexer:
 
         (tmp_path / "note.md").write_text("# Hello World\n\nContent here.")
 
-        count, skipped, err = await index_local_folder(
+        count, skipped, root_folder_id, err = await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
         )
 
         assert err is None
@@ -95,7 +94,8 @@ class TestFullIndexer:
         docs = (
             await db_session.execute(
                 select(Document).where(
-                    Document.connector_id == db_local_folder_connector.id
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
                 )
             )
         ).scalars().all()
@@ -112,7 +112,6 @@ class TestFullIndexer:
     async def test_i2_unchanged_skipped(
         self,
         db_session: AsyncSession,
-        db_local_folder_connector: SearchSourceConnector,
         db_user: User,
         db_search_space: SearchSpace,
         tmp_path: Path,
@@ -122,27 +121,31 @@ class TestFullIndexer:
 
         (tmp_path / "note.md").write_text("# Hello\n\nSame content.")
 
-        count1, _, _ = await index_local_folder(
+        count1, _, root_folder_id, _ = await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
         )
         assert count1 == 1
 
-        # Second run — unchanged
-        count2, _, _ = await index_local_folder(
+        # Second run — unchanged, pass root_folder_id from first run
+        count2, _, _, _ = await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            root_folder_id=root_folder_id,
         )
         assert count2 == 0
 
         total = (
             await db_session.execute(
                 select(func.count()).select_from(Document).where(
-                    Document.connector_id == db_local_folder_connector.id
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
                 )
             )
         ).scalar_one()
@@ -157,7 +160,6 @@ class TestFullIndexer:
     async def test_i3_changed_reindexed(
         self,
         db_session: AsyncSession,
-        db_local_folder_connector: SearchSourceConnector,
         db_user: User,
         db_search_space: SearchSpace,
         tmp_path: Path,
@@ -168,11 +170,12 @@ class TestFullIndexer:
         f = tmp_path / "note.md"
         f.write_text("# Version 1\n\nOriginal.")
 
-        await index_local_folder(
+        _, _, root_folder_id, _ = await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
         )
 
         # Modify
@@ -180,11 +183,13 @@ class TestFullIndexer:
         # Touch mtime to ensure it's detected as different
         os.utime(f, (f.stat().st_atime + 10, f.stat().st_mtime + 10))
 
-        count, _, _ = await index_local_folder(
+        count, _, _, _ = await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            root_folder_id=root_folder_id,
         )
         assert count == 1
 
@@ -192,7 +197,8 @@ class TestFullIndexer:
         versions = (
             await db_session.execute(
                 select(DocumentVersion).join(Document).where(
-                    Document.connector_id == db_local_folder_connector.id
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
                 )
             )
         ).scalars().all()
@@ -207,7 +213,6 @@ class TestFullIndexer:
     async def test_i4_deleted_removed(
         self,
         db_session: AsyncSession,
-        db_local_folder_connector: SearchSourceConnector,
         db_user: User,
         db_search_space: SearchSpace,
         tmp_path: Path,
@@ -218,17 +223,19 @@ class TestFullIndexer:
         f = tmp_path / "to_delete.md"
         f.write_text("# Delete me")
 
-        await index_local_folder(
+        _, _, root_folder_id, _ = await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
         )
 
         docs_before = (
             await db_session.execute(
                 select(func.count()).select_from(Document).where(
-                    Document.connector_id == db_local_folder_connector.id
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
                 )
             )
         ).scalar_one()
@@ -238,15 +245,18 @@ class TestFullIndexer:
 
         await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            root_folder_id=root_folder_id,
         )
 
         docs_after = (
             await db_session.execute(
                 select(func.count()).select_from(Document).where(
-                    Document.connector_id == db_local_folder_connector.id
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
                 )
             )
         ).scalar_one()
@@ -261,7 +271,6 @@ class TestFullIndexer:
     async def test_i5_single_file_mode(
         self,
         db_session: AsyncSession,
-        db_local_folder_connector: SearchSourceConnector,
         db_user: User,
         db_search_space: SearchSpace,
         tmp_path: Path,
@@ -273,11 +282,12 @@ class TestFullIndexer:
         (tmp_path / "b.md").write_text("File B")
         (tmp_path / "c.md").write_text("File C")
 
-        count, _, _ = await index_local_folder(
+        count, _, _, _ = await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
             target_file_path=str(tmp_path / "b.md"),
         )
         assert count == 1
@@ -285,12 +295,13 @@ class TestFullIndexer:
         docs = (
             await db_session.execute(
                 select(Document).where(
-                    Document.connector_id == db_local_folder_connector.id
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
                 )
             )
         ).scalars().all()
         assert len(docs) == 1
-        assert docs[0].title == "b"
+        assert docs[0].title == "b.md"
 
 
 # ====================================================================
@@ -309,30 +320,27 @@ class TestFolderMirroring:
     async def test_f1_root_folder_created(
         self,
         db_session: AsyncSession,
-        db_local_folder_connector: SearchSourceConnector,
         db_user: User,
         db_search_space: SearchSpace,
         tmp_path: Path,
     ):
-        """F1: First sync creates a root Folder and stores root_folder_id."""
+        """F1: First sync creates a root Folder and returns root_folder_id."""
         from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
 
         (tmp_path / "root.md").write_text("Root file")
 
-        await index_local_folder(
+        _, _, root_folder_id, _ = await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
         )
 
-        # Refresh connector
-        await db_session.refresh(db_local_folder_connector)
-        root_id = db_local_folder_connector.config.get("root_folder_id")
-        assert root_id is not None
+        assert root_folder_id is not None
 
         root_folder = (
-            await db_session.execute(select(Folder).where(Folder.id == root_id))
+            await db_session.execute(select(Folder).where(Folder.id == root_folder_id))
         ).scalar_one()
         assert root_folder.name == "test-folder"
 
@@ -345,7 +353,6 @@ class TestFolderMirroring:
     async def test_f2_nested_folder_rows(
         self,
         db_session: AsyncSession,
-        db_local_folder_connector: SearchSourceConnector,
         db_user: User,
         db_search_space: SearchSpace,
         tmp_path: Path,
@@ -362,9 +369,10 @@ class TestFolderMirroring:
 
         await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
         )
 
         folders = (
@@ -394,7 +402,6 @@ class TestFolderMirroring:
     async def test_f3_resync_reuses_folders(
         self,
         db_session: AsyncSession,
-        db_local_folder_connector: SearchSourceConnector,
         db_user: User,
         db_search_space: SearchSpace,
         tmp_path: Path,
@@ -406,11 +413,12 @@ class TestFolderMirroring:
         sub.mkdir()
         (sub / "file.md").write_text("content")
 
-        await index_local_folder(
+        _, _, root_folder_id, _ = await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
         )
 
         folders_before = (
@@ -420,12 +428,14 @@ class TestFolderMirroring:
         ).scalars().all()
         ids_before = {f.id for f in folders_before}
 
-        # Re-sync
+        # Re-sync with root_folder_id from first run
         await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            root_folder_id=root_folder_id,
         )
 
         folders_after = (
@@ -446,7 +456,6 @@ class TestFolderMirroring:
     async def test_f4_folder_id_assigned(
         self,
         db_session: AsyncSession,
-        db_local_folder_connector: SearchSourceConnector,
         db_user: User,
         db_search_space: SearchSpace,
         tmp_path: Path,
@@ -459,17 +468,19 @@ class TestFolderMirroring:
         (daily / "today.md").write_text("today note")
         (tmp_path / "root.md").write_text("root note")
 
-        await index_local_folder(
+        _, _, root_folder_id, _ = await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
         )
 
         docs = (
             await db_session.execute(
                 select(Document).where(
-                    Document.connector_id == db_local_folder_connector.id
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
                 )
             )
         ).scalars().all()
@@ -486,9 +497,7 @@ class TestFolderMirroring:
         assert today_doc.folder_id == daily_folder.id
 
         # Root doc should be in the root folder
-        await db_session.refresh(db_local_folder_connector)
-        root_fid = db_local_folder_connector.config.get("root_folder_id")
-        assert root_doc.folder_id == root_fid
+        assert root_doc.folder_id == root_folder_id
 
     @pytest.mark.usefixtures(
         "patched_self_hosted",
@@ -499,7 +508,6 @@ class TestFolderMirroring:
     async def test_f5_empty_folder_cleanup(
         self,
         db_session: AsyncSession,
-        db_local_folder_connector: SearchSourceConnector,
         db_user: User,
         db_search_space: SearchSpace,
         tmp_path: Path,
@@ -515,11 +523,12 @@ class TestFolderMirroring:
         (daily / "today.md").write_text("today")
         (weekly / "review.md").write_text("review")
 
-        await index_local_folder(
+        _, _, root_folder_id, _ = await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
         )
 
         # Verify weekly folder exists
@@ -535,9 +544,11 @@ class TestFolderMirroring:
 
         await index_local_folder(
             session=db_session,
-            connector_id=db_local_folder_connector.id,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            root_folder_id=root_folder_id,
         )
 
         # weekly Folder should be gone (empty, dir removed)
@@ -570,7 +581,6 @@ class TestPipelineIntegration:
     async def test_p1_local_folder_file_through_pipeline(
         self,
         db_session: AsyncSession,
-        db_local_folder_connector: SearchSourceConnector,
         db_user: User,
         db_search_space: SearchSpace,
         mocker,
@@ -585,7 +595,7 @@ class TestPipelineIntegration:
             unique_id="test-folder:test.md",
             document_type=DocumentType.LOCAL_FOLDER_FILE,
             search_space_id=db_search_space.id,
-            connector_id=db_local_folder_connector.id,
+            connector_id=None,
             created_by_id=str(db_user.id),
         )
 

From caf2525ab5d32ffbb6db0c96a5e4109996a24030 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 22:29:07 +0530
Subject: [PATCH 049/202] fix: update folder ID collection logic to include
 deleted directories and adjust test cases for document titles

---
 .../connector_indexers/local_folder_indexer.py    | 15 ++++++++++++++-
 .../test_local_folder_pipeline.py                 |  4 ++--
 2 files changed, 16 insertions(+), 3 deletions(-)

diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
index 591914625..93c6649a2 100644
--- a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -610,12 +610,25 @@ async def index_local_folder(
         # ================================================================
         # PHASE 1.5: Delete documents no longer on disk
         # ================================================================
+        # Also collect folder IDs whose directories no longer exist on disk but
+        # still have rows in the DB. NOTE(review): the query below filters only
+        # on search_space_id, so it spans every folder in the space, not just this root.
+        all_root_folder_ids = set(folder_mapping.values())
+        all_db_folders = (
+            await session.execute(
+                select(Folder.id).where(
+                    Folder.search_space_id == search_space_id,
+                )
+            )
+        ).scalars().all()
+        all_root_folder_ids.update(all_db_folders)
+
         all_folder_docs = (
             await session.execute(
                 select(Document).where(
                     Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
                     Document.search_space_id == search_space_id,
-                    Document.folder_id.in_(list(folder_mapping.values())),
+                    Document.folder_id.in_(list(all_root_folder_ids)),
                 )
             )
         ).scalars().all()
diff --git a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
index e46d59a67..34efad789 100644
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
@@ -485,8 +485,8 @@ class TestFolderMirroring:
             )
         ).scalars().all()
 
-        today_doc = next(d for d in docs if d.title == "today")
-        root_doc = next(d for d in docs if d.title == "root")
+        today_doc = next(d for d in docs if d.title == "today.md")
+        root_doc = next(d for d in docs if d.title == "root.md")
 
         daily_folder = (
             await db_session.execute(

From c27d24a117633aac32de889b12f153239b58a832 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 22:41:45 +0530
Subject: [PATCH 050/202] feat: enhance folder indexing by adding root folder
 ID support and implement folder creation and cleanup logic

---
 .../app/routes/documents_routes.py            |   2 +
 .../local_folder_indexer.py                   | 102 ++++++++++++++
 .../test_local_folder_pipeline.py             | 130 ++++++++++++++++++
 surfsense_web/hooks/use-folder-sync.ts        |   1 +
 .../lib/apis/documents-api.service.ts         |   2 +-
 5 files changed, 236 insertions(+), 1 deletion(-)

diff --git a/surfsense_backend/app/routes/documents_routes.py b/surfsense_backend/app/routes/documents_routes.py
index d7974f9ff..05221b192 100644
--- a/surfsense_backend/app/routes/documents_routes.py
+++ b/surfsense_backend/app/routes/documents_routes.py
@@ -1280,6 +1280,7 @@ class FolderIndexFileRequest(PydanticBaseModel):
     folder_name: str
     search_space_id: int
     target_file_path: str
+    root_folder_id: int | None = None
     enable_summary: bool = False
 
 
@@ -1394,6 +1395,7 @@ async def folder_index_file(
         folder_path=request.folder_path,
         folder_name=request.folder_name,
         target_file_path=request.target_file_path,
+        root_folder_id=request.root_folder_id,
         enable_summary=request.enable_summary,
     )
 
diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
index 93c6649a2..3d4ddc19e 100644
--- a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -312,6 +312,92 @@ async def _mirror_folder_structure(
     return mapping, root_folder_id
 
 
+async def _resolve_folder_for_file(
+    session: AsyncSession,
+    rel_path: str,
+    root_folder_id: int,
+    search_space_id: int,
+    user_id: str,
+) -> int:
+    """Given a file's relative path, ensure all parent Folder rows exist and
+    return the folder_id for the file's immediate parent directory.
+
+    For a file at "notes/daily/today.md", this ensures Folder rows exist for
+    "notes" and "notes/daily", and returns the id of "notes/daily".
+    For a file at "readme.md" (root level), returns root_folder_id.
+    """
+    parent_dir = str(Path(rel_path).parent)
+    if parent_dir == ".":
+        return root_folder_id
+
+    parts = Path(parent_dir).parts
+    current_parent_id = root_folder_id
+
+    for part in parts:
+        existing = (
+            await session.execute(
+                select(Folder).where(
+                    Folder.name == part,
+                    Folder.parent_id == current_parent_id,
+                    Folder.search_space_id == search_space_id,
+                )
+            )
+        ).scalar_one_or_none()
+
+        if existing:
+            current_parent_id = existing.id
+        else:
+            new_folder = Folder(
+                name=part,
+                parent_id=current_parent_id,
+                search_space_id=search_space_id,
+                created_by_id=user_id,
+                position="a0",
+            )
+            session.add(new_folder)
+            await session.flush()
+            current_parent_id = new_folder.id
+
+    return current_parent_id
+
+
+async def _cleanup_empty_folder_chain(
+    session: AsyncSession,
+    folder_id: int,
+    root_folder_id: int,
+) -> None:
+    """Walk up from folder_id toward root, deleting empty folders (no docs, no
+    children). Stops at root_folder_id which is never deleted."""
+    current_id = folder_id
+    while current_id and current_id != root_folder_id:
+        has_doc = (
+            await session.execute(
+                select(Document.id).where(Document.folder_id == current_id).limit(1)
+            )
+        ).scalar_one_or_none()
+        if has_doc is not None:
+            break
+
+        has_child = (
+            await session.execute(
+                select(Folder.id).where(Folder.parent_id == current_id).limit(1)
+            )
+        ).scalar_one_or_none()
+        if has_child is not None:
+            break
+
+        folder = (
+            await session.execute(select(Folder).where(Folder.id == current_id))
+        ).scalar_one_or_none()
+        if not folder:
+            break
+
+        parent_id = folder.parent_id
+        await session.delete(folder)
+        await session.flush()
+        current_id = parent_id
+
+
 async def _cleanup_empty_folders(
     session: AsyncSession,
     root_folder_id: int,
@@ -427,6 +513,7 @@ async def index_local_folder(
                 folder_name=folder_name,
                 target_file_path=target_file_path,
                 enable_summary=enable_summary,
+                root_folder_id=root_folder_id,
                 task_logger=task_logger,
                 log_entry=log_entry,
             )
@@ -802,6 +889,7 @@ async def _index_single_file(
     folder_name: str,
     target_file_path: str,
     enable_summary: bool,
+    root_folder_id: int | None,
     task_logger,
     log_entry,
 ) -> tuple[int, int, str | None]:
@@ -816,7 +904,13 @@ async def _index_single_file(
             )
             existing = await check_document_by_unique_identifier(session, uid_hash)
             if existing:
+                deleted_folder_id = existing.folder_id
                 await session.delete(existing)
+                await session.flush()
+                if deleted_folder_id and root_folder_id:
+                    await _cleanup_empty_folder_chain(
+                        session, deleted_folder_id, root_folder_id
+                    )
                 await session.commit()
                 return 0, 0, None
             return 0, 0, None
@@ -880,6 +974,12 @@ async def _index_single_file(
             "mtime": mtime,
         }
 
+        folder_id = None
+        if root_folder_id:
+            folder_id = await _resolve_folder_for_file(
+                session, rel_path, root_folder_id, search_space_id, user_id
+            )
+
         if existing:
             existing.title = title
             existing.content = document_string
@@ -887,6 +987,7 @@ async def _index_single_file(
             existing.source_markdown = content
             existing.embedding = embedding
             existing.document_metadata = doc_metadata
+            existing.folder_id = folder_id
             await safe_set_chunks(session, existing, chunks)
             existing.updated_at = get_current_timestamp()
             existing.status = DocumentStatus.ready()
@@ -905,6 +1006,7 @@ async def _index_single_file(
                 updated_at=get_current_timestamp(),
                 created_by_id=user_id,
                 connector_id=None,
+                folder_id=folder_id,
             )
             session.add(document)
             await session.flush()
diff --git a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
index 34efad789..110aa6caf 100644
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
@@ -567,6 +567,136 @@ class TestFolderMirroring:
         ).scalar_one_or_none()
         assert daily_after is not None
 
+    @pytest.mark.usefixtures(
+        "patched_self_hosted",
+        "patched_embed_for_indexer",
+        "patched_chunks_for_indexer",
+        "patched_summary_for_indexer",
+    )
+    async def test_f6_single_file_creates_subfolder(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """F6: Single-file mode creates missing Folder rows and assigns correct folder_id."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        (tmp_path / "root.md").write_text("root")
+
+        _, _, root_folder_id, _ = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+        )
+
+        sub = tmp_path / "notes" / "daily"
+        sub.mkdir(parents=True)
+        (sub / "new.md").write_text("new note in subfolder")
+
+        count, _, _, _ = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            target_file_path=str(sub / "new.md"),
+            root_folder_id=root_folder_id,
+        )
+        assert count == 1
+
+        doc = (
+            await db_session.execute(
+                select(Document).where(
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.title == "new.md",
+                )
+            )
+        ).scalar_one()
+
+        daily_folder = (
+            await db_session.execute(
+                select(Folder).where(Folder.name == "daily")
+            )
+        ).scalar_one()
+
+        assert doc.folder_id == daily_folder.id
+        assert daily_folder.parent_id is not None
+
+        notes_folder = (
+            await db_session.execute(
+                select(Folder).where(Folder.name == "notes")
+            )
+        ).scalar_one()
+        assert daily_folder.parent_id == notes_folder.id
+        assert notes_folder.parent_id == root_folder_id
+
+    @pytest.mark.usefixtures(
+        "patched_self_hosted",
+        "patched_embed_for_indexer",
+        "patched_chunks_for_indexer",
+        "patched_summary_for_indexer",
+    )
+    async def test_f7_single_file_delete_cleans_empty_folders(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """F7: Deleting the only file in a subfolder via single-file mode removes empty Folder rows."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        sub = tmp_path / "notes" / "ephemeral"
+        sub.mkdir(parents=True)
+        (sub / "temp.md").write_text("temporary")
+        (tmp_path / "keep.md").write_text("keep this")
+
+        _, _, root_folder_id, _ = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+        )
+
+        eph_folder = (
+            await db_session.execute(
+                select(Folder).where(Folder.name == "ephemeral")
+            )
+        ).scalar_one_or_none()
+        assert eph_folder is not None
+
+        target = sub / "temp.md"
+        target.unlink()
+
+        await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            target_file_path=str(target),
+            root_folder_id=root_folder_id,
+        )
+
+        eph_after = (
+            await db_session.execute(
+                select(Folder).where(Folder.name == "ephemeral")
+            )
+        ).scalar_one_or_none()
+        assert eph_after is None
+
+        notes_after = (
+            await db_session.execute(
+                select(Folder).where(Folder.name == "notes")
+            )
+        ).scalar_one_or_none()
+        assert notes_after is None
+
 
 # ====================================================================
 # Tier 5: Pipeline Integration (P1)
diff --git a/surfsense_web/hooks/use-folder-sync.ts b/surfsense_web/hooks/use-folder-sync.ts
index fcfb2814e..f051b7df6 100644
--- a/surfsense_web/hooks/use-folder-sync.ts
+++ b/surfsense_web/hooks/use-folder-sync.ts
@@ -32,6 +32,7 @@ export function useFolderSync() {
 					folder_name: event.folderName,
 					search_space_id: event.searchSpaceId,
 					target_file_path: event.fullPath,
+					root_folder_id: event.rootFolderId,
 				});
 			} catch (err) {
 				console.error("[FolderSync] Failed to trigger re-index:", err);
diff --git a/surfsense_web/lib/apis/documents-api.service.ts b/surfsense_web/lib/apis/documents-api.service.ts
index c77cd6848..a8e3831d4 100644
--- a/surfsense_web/lib/apis/documents-api.service.ts
+++ b/surfsense_web/lib/apis/documents-api.service.ts
@@ -399,7 +399,7 @@ class DocumentsApiService {
 		return baseApiService.post(`/api/v1/documents/folder-index`, undefined, { body });
 	};
 
-	folderIndexFile = async (searchSpaceId: number, body: { folder_path: string; folder_name: string; search_space_id: number; target_file_path: string; enable_summary?: boolean }) => {
+	folderIndexFile = async (searchSpaceId: number, body: { folder_path: string; folder_name: string; search_space_id: number; target_file_path: string; root_folder_id?: number | null; enable_summary?: boolean }) => {
 		return baseApiService.post(`/api/v1/documents/folder-index-file`, undefined, { body });
 	};
 

From 53df393cf7ca300e9eb79f14429bb94857bde492 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 23:28:23 +0530
Subject: [PATCH 051/202] refactor: streamline local folder indexing logic by
 removing unused imports, enhancing content hashing, and improving document
 creation process

---
 .../local_folder_indexer.py                   | 415 +++++++-----------
 .../test_local_folder_pipeline.py             | 139 +-----
 2 files changed, 174 insertions(+), 380 deletions(-)

diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
index 3d4ddc19e..a3281eaea 100644
--- a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -14,7 +14,6 @@ no connector row is read.
 """
 
 import os
-import time
 from collections.abc import Awaitable, Callable
 from datetime import UTC, datetime
 from pathlib import Path
@@ -30,24 +29,16 @@ from app.db import (
     DocumentType,
     Folder,
 )
+from app.indexing_pipeline.connector_document import ConnectorDocument
+from app.indexing_pipeline.document_hashing import compute_identifier_hash
+from app.indexing_pipeline.indexing_pipeline_service import IndexingPipelineService
 from app.services.llm_service import get_user_long_context_llm
 from app.services.task_logging_service import TaskLoggingService
-from app.utils.document_converters import (
-    create_document_chunks,
-    embed_text,
-    generate_content_hash,
-    generate_document_summary,
-    generate_unique_identifier_hash,
-)
 from app.utils.document_versioning import create_version_snapshot
 
 from .base import (
-    build_document_metadata_string,
     check_document_by_unique_identifier,
-    check_duplicate_document_by_hash,
-    get_current_timestamp,
     logger,
-    safe_set_chunks,
 )
 
 PLAINTEXT_EXTENSIONS = frozenset({
@@ -89,7 +80,6 @@ def _needs_etl(filename: str) -> bool:
     return not _is_plaintext_file(filename) and not _is_audio_file(filename)
 
 HeartbeatCallbackType = Callable[[int], Awaitable[None]]
-HEARTBEAT_INTERVAL_SECONDS = 30
 
 DEFAULT_EXCLUDE_PATTERNS = [
     ".git",
@@ -210,6 +200,16 @@ async def _read_file_content(file_path: str, filename: str) -> str:
     return await _parse_file_to_markdown(file_path, filename)
 
 
+def _content_hash(content: str, search_space_id: int) -> str:
+    """SHA-256 hash of content scoped to a search space.
+
+    Matches the format used by ``compute_content_hash`` in the unified
+    pipeline so that dedup checks are consistent.
+    """
+    import hashlib
+    return hashlib.sha256(f"{search_space_id}:{content}".encode("utf-8")).hexdigest()
+
+
 async def _compute_file_content_hash(
     file_path: str, filename: str, search_space_id: int,
 ) -> tuple[str, str]:
@@ -218,8 +218,7 @@ async def _compute_file_content_hash(
     Returns (content_text, content_hash).
     """
     content = await _read_file_content(file_path, filename)
-    content_hash = generate_content_hash(content, search_space_id)
-    return content, content_hash
+    return content, _content_hash(content, search_space_id)
 
 
 async def _mirror_folder_structure(
@@ -454,6 +453,40 @@ async def _cleanup_empty_folders(
         candidates = remaining
 
 
+def _build_connector_doc(
+    title: str,
+    content: str,
+    relative_path: str,
+    folder_name: str,
+    *,
+    search_space_id: int,
+    user_id: str,
+    enable_summary: bool,
+) -> ConnectorDocument:
+    """Build a ConnectorDocument from a local file's extracted content."""
+    unique_id = f"{folder_name}:{relative_path}"
+    metadata = {
+        "folder_name": folder_name,
+        "file_path": relative_path,
+        "document_type": "Local Folder File",
+        "connector_type": "Local Folder",
+    }
+    fallback_summary = f"File: {title}\n\n{content[:4000]}"
+
+    return ConnectorDocument(
+        title=title,
+        source_markdown=content,
+        unique_id=unique_id,
+        document_type=DocumentType.LOCAL_FOLDER_FILE,
+        search_space_id=search_space_id,
+        connector_id=None,
+        created_by_id=user_id,
+        should_summarize=enable_summary,
+        fallback_summary=fallback_summary,
+        metadata=metadata,
+    )
+
+
 async def index_local_folder(
     session: AsyncSession,
     search_space_id: int,
@@ -551,15 +584,13 @@ async def index_local_folder(
         indexed_count = 0
         skipped_count = 0
         failed_count = 0
-        duplicate_count = 0
-
-        last_heartbeat_time = time.time()
 
         # ================================================================
-        # PHASE 1: Analyze all files, create pending documents
+        # PHASE 1: Pre-filter files (mtime / content-hash), snapshot changed docs
         # ================================================================
-        files_to_process: list[dict] = []
-        new_documents_created = False
+        connector_docs: list[ConnectorDocument] = []
+        # Maps unique_id -> {"relative_path", "mtime"} for post-pipeline folder_id / mtime assignment
+        file_meta_map: dict[str, dict] = {}
         seen_unique_hashes: set[str] = set()
 
         for file_info in files:
@@ -568,8 +599,8 @@ async def index_local_folder(
                 file_path_abs = file_info["path"]
 
                 unique_identifier = f"{folder_name}:{relative_path}"
-                unique_identifier_hash = generate_unique_identifier_hash(
-                    DocumentType.LOCAL_FOLDER_FILE,
+                unique_identifier_hash = compute_identifier_hash(
+                    DocumentType.LOCAL_FOLDER_FILE.value,
                     unique_identifier,
                     search_space_id,
                 )
@@ -612,94 +643,42 @@ async def index_local_folder(
                         continue
 
                     await create_version_snapshot(session, existing_document)
+                else:
+                    try:
+                        content, content_hash = await _compute_file_content_hash(
+                            file_path_abs, file_info["relative_path"], search_space_id
+                        )
+                    except Exception as read_err:
+                        logger.warning(f"Could not read {file_path_abs}: {read_err}")
+                        skipped_count += 1
+                        continue
 
-                    files_to_process.append(
-                        {
-                            "document": existing_document,
-                            "is_new": False,
-                            "file_info": file_info,
-                            "content": content,
-                            "content_hash": content_hash,
-                            "unique_identifier_hash": unique_identifier_hash,
-                            "relative_path": relative_path,
-                            "title": file_info["name"],
-                        }
-                    )
-                    continue
+                    if not content.strip():
+                        skipped_count += 1
+                        continue
 
-                try:
-                    content, content_hash = await _compute_file_content_hash(
-                        file_path_abs, file_info["relative_path"], search_space_id
-                    )
-                except Exception as read_err:
-                    logger.warning(f"Could not read {file_path_abs}: {read_err}")
-                    skipped_count += 1
-                    continue
-
-                if not content.strip():
-                    skipped_count += 1
-                    continue
-
-                with session.no_autoflush:
-                    dup = await check_duplicate_document_by_hash(session, content_hash)
-                if dup:
-                    duplicate_count += 1
-                    skipped_count += 1
-                    continue
-
-                parent_dir = str(Path(relative_path).parent)
-                if parent_dir == ".":
-                    parent_dir = ""
-                folder_id = folder_mapping.get(parent_dir, folder_mapping.get(""))
-
-                document = Document(
-                    search_space_id=search_space_id,
+                doc = _build_connector_doc(
                     title=file_info["name"],
-                    document_type=DocumentType.LOCAL_FOLDER_FILE,
-                    document_metadata={
-                        "folder_name": folder_name,
-                        "file_path": relative_path,
-                        "mtime": file_info["modified_at"].timestamp(),
-                    },
-                    content="Pending...",
-                    content_hash=unique_identifier_hash,
-                    unique_identifier_hash=unique_identifier_hash,
-                    embedding=None,
-                    status=DocumentStatus.pending(),
-                    updated_at=get_current_timestamp(),
-                    created_by_id=user_id,
-                    connector_id=None,
-                    folder_id=folder_id,
-                )
-                session.add(document)
-                new_documents_created = True
-
-                files_to_process.append(
-                    {
-                        "document": document,
-                        "is_new": True,
-                        "file_info": file_info,
-                        "content": content,
-                        "content_hash": content_hash,
-                        "unique_identifier_hash": unique_identifier_hash,
-                        "relative_path": relative_path,
-                        "title": file_info["name"],
-                    }
+                    content=content,
+                    relative_path=relative_path,
+                    folder_name=folder_name,
+                    search_space_id=search_space_id,
+                    user_id=user_id,
+                    enable_summary=enable_summary,
                 )
+                connector_docs.append(doc)
+                file_meta_map[unique_identifier] = {
+                    "relative_path": relative_path,
+                    "mtime": file_info["modified_at"].timestamp(),
+                }
 
             except Exception as e:
                 logger.exception(f"Phase 1 error for {file_info.get('path')}: {e}")
                 failed_count += 1
 
-        if new_documents_created:
-            await session.commit()
-
         # ================================================================
         # PHASE 1.5: Delete documents no longer on disk
         # ================================================================
-        # Collect ALL folder IDs under this root (including folders that no
-        # longer exist on disk but still have rows in the DB) so we catch
-        # documents in deleted directories too.
         all_root_folder_ids = set(folder_mapping.values())
         all_db_folders = (
             await session.execute(
@@ -727,98 +706,51 @@ async def index_local_folder(
         await session.flush()
 
         # ================================================================
-        # PHASE 2: Process each document
+        # PHASE 2: Index via unified pipeline
         # ================================================================
-        long_context_llm = await get_user_long_context_llm(
-            session, user_id, search_space_id
-        )
+        if connector_docs:
+            from app.indexing_pipeline.document_hashing import (
+                compute_unique_identifier_hash,
+            )
 
-        for item in files_to_process:
-            if on_heartbeat_callback:
-                current_time = time.time()
-                if current_time - last_heartbeat_time >= HEARTBEAT_INTERVAL_SECONDS:
+            pipeline = IndexingPipelineService(session)
+            doc_map = {
+                compute_unique_identifier_hash(cd): cd for cd in connector_docs
+            }
+            documents = await pipeline.prepare_for_indexing(connector_docs)
+
+            llm = await get_user_long_context_llm(session, user_id, search_space_id)
+
+            for document in documents:
+                connector_doc = doc_map.get(document.unique_identifier_hash)
+                if connector_doc is None:
+                    failed_count += 1
+                    continue
+
+                result = await pipeline.index(document, connector_doc, llm)
+
+                if DocumentStatus.is_state(result.status, DocumentStatus.READY):
+                    indexed_count += 1
+
+                    # Assign folder_id and mtime post-pipeline
+                    rel_path = (connector_doc.metadata or {}).get("file_path", "")
+                    parent_dir = str(Path(rel_path).parent) if rel_path else ""
+                    if parent_dir == ".":
+                        parent_dir = ""
+                    fid = folder_mapping.get(parent_dir, folder_mapping.get(""))
+
+                    unique_id = connector_doc.unique_id
+                    mtime_info = file_meta_map.get(unique_id, {})
+
+                    result.folder_id = fid
+                    doc_meta = dict(result.document_metadata or {})
+                    doc_meta["mtime"] = mtime_info.get("mtime")
+                    result.document_metadata = doc_meta
+                else:
+                    failed_count += 1
+
+                if on_heartbeat_callback and indexed_count % 5 == 0:
                     await on_heartbeat_callback(indexed_count)
-                    last_heartbeat_time = current_time
-
-            document = item["document"]
-            try:
-                document.status = DocumentStatus.processing()
-                await session.commit()
-
-                title = item["title"]
-                relative_path = item["relative_path"]
-                content = item["content"]
-                content_hash = item["content_hash"]
-                file_info = item["file_info"]
-
-                metadata_sections = [
-                    (
-                        "METADATA",
-                        [
-                            f"Title: {title}",
-                            f"Folder: {folder_name}",
-                            f"Path: {relative_path}",
-                        ],
-                    ),
-                    ("CONTENT", [content]),
-                ]
-                document_string = build_document_metadata_string(metadata_sections)
-
-                summary_content = ""
-                if long_context_llm and enable_summary:
-                    doc_meta = {
-                        "folder_name": folder_name,
-                        "file_path": relative_path,
-                    }
-                    summary_content, _ = await generate_document_summary(
-                        document_string, long_context_llm, doc_meta
-                    )
-
-                embedding = embed_text(document_string)
-                chunks = await create_document_chunks(document_string)
-
-                parent_dir = str(Path(relative_path).parent)
-                if parent_dir == ".":
-                    parent_dir = ""
-                folder_id = folder_mapping.get(parent_dir, folder_mapping.get(""))
-
-                document.title = title
-                document.content = document_string
-                document.content_hash = content_hash
-                document.source_markdown = content
-                document.embedding = embedding
-                document.document_metadata = {
-                    "folder_name": folder_name,
-                    "file_path": relative_path,
-                    "summary": summary_content,
-                    "mtime": file_info["modified_at"].timestamp(),
-                }
-                document.folder_id = folder_id
-                await safe_set_chunks(session, document, chunks)
-                document.updated_at = get_current_timestamp()
-                document.status = DocumentStatus.ready()
-
-                indexed_count += 1
-
-                if indexed_count % 10 == 0:
-                    await session.commit()
-
-            except Exception as e:
-                logger.exception(f"Phase 2 error for {item.get('relative_path')}: {e}")
-                try:
-                    await session.rollback()
-                except Exception:
-                    pass
-                try:
-                    document.status = DocumentStatus.failed(str(e)[:500])
-                    document.updated_at = get_current_timestamp()
-                    await session.commit()
-                except Exception:
-                    try:
-                        await session.rollback()
-                    except Exception:
-                        pass
-                failed_count += 1
 
         # Cleanup empty folders
         existing_dirs = set()
@@ -846,8 +778,6 @@ async def index_local_folder(
                 raise
 
         warning_parts = []
-        if duplicate_count > 0:
-            warning_parts.append(f"{duplicate_count} duplicate")
         if failed_count > 0:
             warning_parts.append(f"{failed_count} failed")
         warning_message = ", ".join(warning_parts) if warning_parts else None
@@ -859,7 +789,6 @@ async def index_local_folder(
                 "indexed": indexed_count,
                 "skipped": skipped_count,
                 "failed": failed_count,
-                "duplicates": duplicate_count,
             },
         )
 
@@ -899,8 +828,8 @@ async def _index_single_file(
         if not full_path.exists():
             rel = str(full_path.relative_to(folder_path))
             unique_id = f"{folder_name}:{rel}"
-            uid_hash = generate_unique_identifier_hash(
-                DocumentType.LOCAL_FOLDER_FILE, unique_id, search_space_id
+            uid_hash = compute_identifier_hash(
+                DocumentType.LOCAL_FOLDER_FILE.value, unique_id, search_space_id
             )
             existing = await check_document_by_unique_identifier(session, uid_hash)
             if existing:
@@ -918,8 +847,8 @@ async def _index_single_file(
         rel_path = str(full_path.relative_to(folder_path))
 
         unique_id = f"{folder_name}:{rel_path}"
-        uid_hash = generate_unique_identifier_hash(
-            DocumentType.LOCAL_FOLDER_FILE, unique_id, search_space_id
+        uid_hash = compute_identifier_hash(
+            DocumentType.LOCAL_FOLDER_FILE.value, unique_id, search_space_id
         )
 
         try:
@@ -945,83 +874,51 @@ async def _index_single_file(
 
             await create_version_snapshot(session, existing)
 
-        long_context_llm = await get_user_long_context_llm(
-            session, user_id, search_space_id
-        )
-
-        title = full_path.name
         mtime = full_path.stat().st_mtime
 
-        metadata_sections = [
-            ("METADATA", [f"Title: {title}", f"Folder: {folder_name}", f"Path: {rel_path}"]),
-            ("CONTENT", [content]),
-        ]
-        document_string = build_document_metadata_string(metadata_sections)
+        connector_doc = _build_connector_doc(
+            title=full_path.name,
+            content=content,
+            relative_path=rel_path,
+            folder_name=folder_name,
+            search_space_id=search_space_id,
+            user_id=user_id,
+            enable_summary=enable_summary,
+        )
 
-        summary_content = ""
-        if long_context_llm and enable_summary:
-            summary_content, _ = await generate_document_summary(
-                document_string, long_context_llm, {"folder_name": folder_name, "file_path": rel_path}
-            )
+        pipeline = IndexingPipelineService(session)
+        llm = await get_user_long_context_llm(session, user_id, search_space_id)
+        documents = await pipeline.prepare_for_indexing([connector_doc])
 
-        embedding = embed_text(document_string)
-        chunks = await create_document_chunks(document_string)
+        if not documents:
+            return 0, 1, None
 
-        doc_metadata = {
-            "folder_name": folder_name,
-            "file_path": rel_path,
-            "summary": summary_content,
-            "mtime": mtime,
-        }
+        db_doc = documents[0]
+        await pipeline.index(db_doc, connector_doc, llm)
 
+        # Post-pipeline: assign folder_id and mtime
+        await session.refresh(db_doc)
         folder_id = None
         if root_folder_id:
             folder_id = await _resolve_folder_for_file(
                 session, rel_path, root_folder_id, search_space_id, user_id
             )
-
-        if existing:
-            existing.title = title
-            existing.content = document_string
-            existing.content_hash = content_hash
-            existing.source_markdown = content
-            existing.embedding = embedding
-            existing.document_metadata = doc_metadata
-            existing.folder_id = folder_id
-            await safe_set_chunks(session, existing, chunks)
-            existing.updated_at = get_current_timestamp()
-            existing.status = DocumentStatus.ready()
-        else:
-            document = Document(
-                search_space_id=search_space_id,
-                title=title,
-                document_type=DocumentType.LOCAL_FOLDER_FILE,
-                document_metadata=doc_metadata,
-                content=document_string,
-                content_hash=content_hash,
-                unique_identifier_hash=uid_hash,
-                source_markdown=content,
-                embedding=embedding,
-                status=DocumentStatus.ready(),
-                updated_at=get_current_timestamp(),
-                created_by_id=user_id,
-                connector_id=None,
-                folder_id=folder_id,
-            )
-            session.add(document)
-            await session.flush()
-            for chunk in chunks:
-                chunk.document_id = document.id
-            session.add_all(chunks)
-
+        db_doc.folder_id = folder_id
+        doc_meta = dict(db_doc.document_metadata or {})
+        doc_meta["mtime"] = mtime
+        db_doc.document_metadata = doc_meta
         await session.commit()
 
-        await task_logger.log_task_success(
-            log_entry,
-            f"Single file indexed: {rel_path}",
-            {"file": rel_path},
-        )
-        return 1, 0, None
+        indexed = 1 if DocumentStatus.is_state(db_doc.status, DocumentStatus.READY) else 0
+        failed_msg = None if indexed else "Indexing failed"
+
+        if indexed:
+            await task_logger.log_task_success(
+                log_entry,
+                f"Single file indexed: {rel_path}",
+                {"file": rel_path},
+            )
+        return indexed, 0 if indexed else 1, failed_msg
 
     except Exception as e:
         logger.exception(f"Error indexing single file {target_file_path}: {e}")
diff --git a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
index 110aa6caf..154cc6e0e 100644
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
@@ -1,8 +1,7 @@
-"""Integration tests for local folder indexer — Tier 3 (I1-I5), Tier 4 (F1-F5), Tier 5 (P1)."""
+"""Integration tests for local folder indexer — Tier 3 (I1-I5), Tier 4 (F1-F7), Tier 5 (P1)."""
 
 import os
 from pathlib import Path
-from unittest.mock import AsyncMock, MagicMock
 
 import pytest
 from sqlalchemy import func, select
@@ -18,41 +17,11 @@ from app.db import (
     User,
 )
 
-import app.tasks.connector_indexers.local_folder_indexer as _lfi_mod
-
 pytestmark = pytest.mark.integration
 
-
-@pytest.fixture
-def patched_self_hosted(monkeypatch):
-    _cfg = type("_Cfg", (), {"is_self_hosted": staticmethod(lambda: True)})()
-    monkeypatch.setattr(_lfi_mod, "config", _cfg)
-
-
-@pytest.fixture
-def patched_embed_for_indexer(monkeypatch):
-    from app.config import config as app_config
-    dim = app_config.embedding_model_instance.dimension
-    mock = MagicMock(return_value=[0.1] * dim)
-    monkeypatch.setattr(_lfi_mod, "embed_text", mock)
-    return mock
-
-
-@pytest.fixture
-def patched_chunks_for_indexer(monkeypatch):
-    from app.db import Chunk
-    from app.config import config as app_config
-    dim = app_config.embedding_model_instance.dimension
-
-    async def mock_create_chunks(text):
-        return [Chunk(content="chunk", embedding=[0.1] * dim)]
-
-    monkeypatch.setattr(_lfi_mod, "create_document_chunks", mock_create_chunks)
-
-
-@pytest.fixture
-def patched_summary_for_indexer(monkeypatch):
-    monkeypatch.setattr(_lfi_mod, "get_user_long_context_llm", AsyncMock(return_value=None))
+UNIFIED_FIXTURES = (
+    "patched_summarize", "patched_embed_texts", "patched_chunk_text",
+)
 
 
 # ====================================================================
@@ -62,12 +31,7 @@ def patched_summary_for_indexer(monkeypatch):
 
 class TestFullIndexer:
 
-    @pytest.mark.usefixtures(
-        "patched_self_hosted",
-        "patched_embed_for_indexer",
-        "patched_chunks_for_indexer",
-        "patched_summary_for_indexer",
-    )
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_i1_new_file_indexed(
         self,
         db_session: AsyncSession,
@@ -103,12 +67,7 @@ class TestFullIndexer:
         assert docs[0].document_type == DocumentType.LOCAL_FOLDER_FILE
         assert DocumentStatus.is_state(docs[0].status, DocumentStatus.READY)
 
-    @pytest.mark.usefixtures(
-        "patched_self_hosted",
-        "patched_embed_for_indexer",
-        "patched_chunks_for_indexer",
-        "patched_summary_for_indexer",
-    )
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_i2_unchanged_skipped(
         self,
         db_session: AsyncSession,
@@ -130,7 +89,6 @@ class TestFullIndexer:
         )
         assert count1 == 1
 
-        # Second run — unchanged, pass root_folder_id from first run
         count2, _, _, _ = await index_local_folder(
             session=db_session,
             search_space_id=db_search_space.id,
@@ -151,12 +109,7 @@ class TestFullIndexer:
         ).scalar_one()
         assert total == 1
 
-    @pytest.mark.usefixtures(
-        "patched_self_hosted",
-        "patched_embed_for_indexer",
-        "patched_chunks_for_indexer",
-        "patched_summary_for_indexer",
-    )
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_i3_changed_reindexed(
         self,
         db_session: AsyncSession,
@@ -178,9 +131,7 @@ class TestFullIndexer:
             folder_name="test-folder",
         )
 
-        # Modify
         f.write_text("# Version 2\n\nUpdated.")
-        # Touch mtime to ensure it's detected as different
         os.utime(f, (f.stat().st_atime + 10, f.stat().st_mtime + 10))
 
         count, _, _, _ = await index_local_folder(
@@ -193,7 +144,6 @@ class TestFullIndexer:
         )
         assert count == 1
 
-        # Should have a version snapshot
         versions = (
             await db_session.execute(
                 select(DocumentVersion).join(Document).where(
@@ -204,12 +154,7 @@ class TestFullIndexer:
         ).scalars().all()
         assert len(versions) >= 1
 
-    @pytest.mark.usefixtures(
-        "patched_self_hosted",
-        "patched_embed_for_indexer",
-        "patched_chunks_for_indexer",
-        "patched_summary_for_indexer",
-    )
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_i4_deleted_removed(
         self,
         db_session: AsyncSession,
@@ -262,12 +207,7 @@ class TestFullIndexer:
         ).scalar_one()
         assert docs_after == 0
 
-    @pytest.mark.usefixtures(
-        "patched_self_hosted",
-        "patched_embed_for_indexer",
-        "patched_chunks_for_indexer",
-        "patched_summary_for_indexer",
-    )
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_i5_single_file_mode(
         self,
         db_session: AsyncSession,
@@ -305,18 +245,13 @@ class TestFullIndexer:
 
 
 # ====================================================================
-# Tier 4: Folder Mirroring (F1-F5)
+# Tier 4: Folder Mirroring (F1-F7)
 # ====================================================================
 
 
 class TestFolderMirroring:
 
-    @pytest.mark.usefixtures(
-        "patched_self_hosted",
-        "patched_embed_for_indexer",
-        "patched_chunks_for_indexer",
-        "patched_summary_for_indexer",
-    )
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_f1_root_folder_created(
         self,
         db_session: AsyncSession,
@@ -344,12 +279,7 @@ class TestFolderMirroring:
         ).scalar_one()
         assert root_folder.name == "test-folder"
 
-    @pytest.mark.usefixtures(
-        "patched_self_hosted",
-        "patched_embed_for_indexer",
-        "patched_chunks_for_indexer",
-        "patched_summary_for_indexer",
-    )
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_f2_nested_folder_rows(
         self,
         db_session: AsyncSession,
@@ -393,12 +323,7 @@ class TestFolderMirroring:
         assert daily_folder.parent_id == notes_folder.id
         assert weekly_folder.parent_id == notes_folder.id
 
-    @pytest.mark.usefixtures(
-        "patched_self_hosted",
-        "patched_embed_for_indexer",
-        "patched_chunks_for_indexer",
-        "patched_summary_for_indexer",
-    )
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_f3_resync_reuses_folders(
         self,
         db_session: AsyncSession,
@@ -428,7 +353,6 @@ class TestFolderMirroring:
         ).scalars().all()
         ids_before = {f.id for f in folders_before}
 
-        # Re-sync with root_folder_id from first run
         await index_local_folder(
             session=db_session,
             search_space_id=db_search_space.id,
@@ -447,12 +371,7 @@ class TestFolderMirroring:
 
         assert ids_before == ids_after
 
-    @pytest.mark.usefixtures(
-        "patched_self_hosted",
-        "patched_embed_for_indexer",
-        "patched_chunks_for_indexer",
-        "patched_summary_for_indexer",
-    )
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_f4_folder_id_assigned(
         self,
         db_session: AsyncSession,
@@ -496,15 +415,9 @@ class TestFolderMirroring:
 
         assert today_doc.folder_id == daily_folder.id
 
-        # Root doc should be in the root folder
         assert root_doc.folder_id == root_folder_id
 
-    @pytest.mark.usefixtures(
-        "patched_self_hosted",
-        "patched_embed_for_indexer",
-        "patched_chunks_for_indexer",
-        "patched_summary_for_indexer",
-    )
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_f5_empty_folder_cleanup(
         self,
         db_session: AsyncSession,
@@ -531,7 +444,6 @@ class TestFolderMirroring:
             folder_name="test-folder",
         )
 
-        # Verify weekly folder exists
         weekly_folder = (
             await db_session.execute(
                 select(Folder).where(Folder.name == "weekly")
@@ -539,7 +451,6 @@ class TestFolderMirroring:
         ).scalar_one_or_none()
         assert weekly_folder is not None
 
-        # Delete weekly directory + its file
         shutil.rmtree(weekly)
 
         await index_local_folder(
@@ -551,7 +462,6 @@ class TestFolderMirroring:
             root_folder_id=root_folder_id,
         )
 
-        # weekly Folder should be gone (empty, dir removed)
         weekly_after = (
             await db_session.execute(
                 select(Folder).where(Folder.name == "weekly")
@@ -559,7 +469,6 @@ class TestFolderMirroring:
         ).scalar_one_or_none()
         assert weekly_after is None
 
-        # daily should still exist
         daily_after = (
             await db_session.execute(
                 select(Folder).where(Folder.name == "daily")
@@ -567,12 +476,7 @@ class TestFolderMirroring:
         ).scalar_one_or_none()
         assert daily_after is not None
 
-    @pytest.mark.usefixtures(
-        "patched_self_hosted",
-        "patched_embed_for_indexer",
-        "patched_chunks_for_indexer",
-        "patched_summary_for_indexer",
-    )
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_f6_single_file_creates_subfolder(
         self,
         db_session: AsyncSession,
@@ -634,12 +538,7 @@ class TestFolderMirroring:
         assert daily_folder.parent_id == notes_folder.id
         assert notes_folder.parent_id == root_folder_id
 
-    @pytest.mark.usefixtures(
-        "patched_self_hosted",
-        "patched_embed_for_indexer",
-        "patched_chunks_for_indexer",
-        "patched_summary_for_indexer",
-    )
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_f7_single_file_delete_cleans_empty_folders(
         self,
         db_session: AsyncSession,
@@ -705,9 +604,7 @@ class TestFolderMirroring:
 
 class TestPipelineIntegration:
 
-    @pytest.mark.usefixtures(
-        "patched_summarize", "patched_embed_texts", "patched_chunk_text"
-    )
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_p1_local_folder_file_through_pipeline(
         self,
         db_session: AsyncSession,

From 25358fddcf17ff41c2f02a534bf0218eef96701f Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Thu, 2 Apr 2026 23:46:21 +0530
Subject: [PATCH 052/202] feat: implement local folder synchronization and
 versioning with new metadata handling and document_versions table

---
 ...7_add_local_folder_sync_and_versioning.py} | 25 +++++-
 surfsense_backend/app/db.py                   |  1 +
 .../app/routes/documents_routes.py            | 42 ++++++++++
 .../app/routes/folders_routes.py              | 27 +++++++
 surfsense_backend/app/schemas/folders.py      |  3 +
 .../components/documents/FolderNode.tsx       | 24 ++++--
 .../components/documents/FolderTreeView.tsx   | 11 ++-
 .../layout/ui/sidebar/DocumentsSidebar.tsx    | 79 +++++++++++++++++--
 surfsense_web/contracts/types/folder.types.ts |  1 +
 .../lib/apis/documents-api.service.ts         |  5 ++
 surfsense_web/lib/apis/folders-api.service.ts |  4 +
 11 files changed, 205 insertions(+), 17 deletions(-)
 rename surfsense_backend/alembic/versions/{117_add_local_folder_connector_and_versioning.py => 117_add_local_folder_sync_and_versioning.py} (82%)

diff --git a/surfsense_backend/alembic/versions/117_add_local_folder_connector_and_versioning.py b/surfsense_backend/alembic/versions/117_add_local_folder_sync_and_versioning.py
similarity index 82%
rename from surfsense_backend/alembic/versions/117_add_local_folder_connector_and_versioning.py
rename to surfsense_backend/alembic/versions/117_add_local_folder_sync_and_versioning.py
index a9da3beb4..e322a608d 100644
--- a/surfsense_backend/alembic/versions/117_add_local_folder_connector_and_versioning.py
+++ b/surfsense_backend/alembic/versions/117_add_local_folder_sync_and_versioning.py
@@ -1,4 +1,4 @@
-"""Add LOCAL_FOLDER_FILE document type and document_versions table
+"""Add LOCAL_FOLDER_FILE document type, folder metadata, and document_versions table
 
 Revision ID: 117
 Revises: 116
@@ -38,6 +38,19 @@ def upgrade() -> None:
     """
     )
 
+    # Add JSONB metadata column to folders table
+    col_exists = conn.execute(
+        sa.text(
+            "SELECT 1 FROM information_schema.columns "
+            "WHERE table_name = 'folders' AND column_name = 'metadata'"
+        )
+    ).fetchone()
+    if not col_exists:
+        op.add_column(
+            "folders",
+            sa.Column("metadata", sa.dialects.postgresql.JSONB, nullable=True),
+        )
+
     # Create document_versions table
     table_exists = conn.execute(
         sa.text(
@@ -124,3 +137,13 @@ def downgrade() -> None:
     op.execute("DROP INDEX IF EXISTS ix_document_versions_created_at")
     op.execute("DROP INDEX IF EXISTS ix_document_versions_document_id")
     op.execute("DROP TABLE IF EXISTS document_versions")
+
+    # Drop metadata column from folders
+    col_exists = conn.execute(
+        sa.text(
+            "SELECT 1 FROM information_schema.columns "
+            "WHERE table_name = 'folders' AND column_name = 'metadata'"
+        )
+    ).fetchone()
+    if col_exists:
+        op.drop_column("folders", "metadata")
diff --git a/surfsense_backend/app/db.py b/surfsense_backend/app/db.py
index 1a4d3ea06..077b7daa6 100644
--- a/surfsense_backend/app/db.py
+++ b/surfsense_backend/app/db.py
@@ -956,6 +956,7 @@ class Folder(BaseModel, TimestampMixin):
         onupdate=lambda: datetime.now(UTC),
         index=True,
     )
+    folder_metadata = Column("metadata", JSONB, nullable=True)
 
     parent = relationship("Folder", remote_side="Folder.id", backref="children")
     search_space = relationship("SearchSpace", back_populates="folders")
diff --git a/surfsense_backend/app/routes/documents_routes.py b/surfsense_backend/app/routes/documents_routes.py
index 05221b192..81bbb1477 100644
--- a/surfsense_backend/app/routes/documents_routes.py
+++ b/surfsense_backend/app/routes/documents_routes.py
@@ -1310,6 +1310,13 @@ async def folder_index(
         "You don't have permission to create documents in this search space",
     )
 
+    watched_metadata = {
+        "watched": True,
+        "folder_path": request.folder_path,
+        "exclude_patterns": request.exclude_patterns,
+        "file_extensions": request.file_extensions,
+    }
+
     root_folder_id = request.root_folder_id
     if root_folder_id:
         existing = (
@@ -1319,6 +1326,9 @@ async def folder_index(
         ).scalar_one_or_none()
         if not existing:
             root_folder_id = None
+        else:
+            existing.folder_metadata = watched_metadata
+            await session.commit()
 
     if not root_folder_id:
         root_folder = Folder(
@@ -1326,6 +1336,7 @@ async def folder_index(
             search_space_id=request.search_space_id,
             created_by_id=str(user.id),
             position="a0",
+            folder_metadata=watched_metadata,
         )
         session.add(root_folder)
         await session.flush()
@@ -1403,3 +1414,34 @@ async def folder_index_file(
         "message": "File indexing started",
         "status": "processing",
     }
+
+
+@router.get("/documents/watched-folders", response_model=list["FolderRead"])
+async def get_watched_folders(
+    search_space_id: int,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """Return root folders that are marked as watched (metadata->>'watched' = 'true')."""
+    from app.schemas import FolderRead  # noqa: F811
+
+    await check_permission(
+        session,
+        user,
+        search_space_id,
+        Permission.DOCUMENTS_READ.value,
+        "You don't have permission to read documents in this search space",
+    )
+
+    folders = (
+        await session.execute(
+            select(Folder).where(
+                Folder.search_space_id == search_space_id,
+                Folder.parent_id.is_(None),
+                Folder.folder_metadata.isnot(None),
+                Folder.folder_metadata["watched"].astext == "true",
+            )
+        )
+    ).scalars().all()
+
+    return folders
diff --git a/surfsense_backend/app/routes/folders_routes.py b/surfsense_backend/app/routes/folders_routes.py
index d688e692a..6e524d4a4 100644
--- a/surfsense_backend/app/routes/folders_routes.py
+++ b/surfsense_backend/app/routes/folders_routes.py
@@ -192,6 +192,33 @@ async def get_folder_breadcrumb(
         ) from e
 
 
+@router.patch("/folders/{folder_id}/watched")
+async def stop_watching_folder(
+    folder_id: int,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """Clear the watched flag from a folder's metadata."""
+    folder = await session.get(Folder, folder_id)
+    if not folder:
+        raise HTTPException(status_code=404, detail="Folder not found")
+
+    await check_permission(
+        session,
+        user,
+        folder.search_space_id,
+        Permission.DOCUMENTS_UPDATE.value,
+        "You don't have permission to update folders in this search space",
+    )
+
+    if folder.folder_metadata and isinstance(folder.folder_metadata, dict):
+        updated = {**folder.folder_metadata, "watched": False}
+        folder.folder_metadata = updated
+    await session.commit()
+
+    return {"message": "Folder watch status updated"}
+
+
 @router.put("/folders/{folder_id}", response_model=FolderRead)
 async def update_folder(
     folder_id: int,
diff --git a/surfsense_backend/app/schemas/folders.py b/surfsense_backend/app/schemas/folders.py
index 263817182..e8bdf3821 100644
--- a/surfsense_backend/app/schemas/folders.py
+++ b/surfsense_backend/app/schemas/folders.py
@@ -3,6 +3,8 @@
 from datetime import datetime
 from uuid import UUID
 
+from typing import Any
+
 from pydantic import BaseModel, ConfigDict, Field
 
 
@@ -34,6 +36,7 @@ class FolderRead(BaseModel):
     created_by_id: UUID | None
     created_at: datetime
     updated_at: datetime
+    metadata: dict[str, Any] | None = Field(default=None, validation_alias="folder_metadata")
 
     model_config = ConfigDict(from_attributes=True)
 
diff --git a/surfsense_web/components/documents/FolderNode.tsx b/surfsense_web/components/documents/FolderNode.tsx
index 1521c06fe..6780bd1e5 100644
--- a/surfsense_web/components/documents/FolderNode.tsx
+++ b/surfsense_web/components/documents/FolderNode.tsx
@@ -76,6 +76,7 @@ interface FolderNodeProps {
 	isWatched?: boolean;
 	onRescan?: (folder: FolderDisplay) => void;
 	onStopWatching?: (folder: FolderDisplay) => void;
+	onViewMetadata?: (folder: FolderDisplay) => void;
 }
 
 function getDropZone(
@@ -116,6 +117,7 @@ export const FolderNode = React.memo(function FolderNode({
 	isWatched,
 	onRescan,
 	onStopWatching,
+	onViewMetadata,
 }: FolderNodeProps) {
 	const [renameValue, setRenameValue] = useState(folder.name);
 	const inputRef = useRef<HTMLInputElement>(null);
@@ -251,13 +253,21 @@ export const FolderNode = React.memo(function FolderNode({
 						isOver && !canDrop && "cursor-not-allowed"
 					)}
 					style={{ paddingLeft: `${depth * 16 + 4}px` }}
-					onClick={() => onToggleExpand(folder.id)}
-					onKeyDown={(e) => {
-						if (e.key === "Enter" || e.key === " ") {
-							e.preventDefault();
-							onToggleExpand(folder.id);
-						}
-					}}
+				onClick={(e) => {
+					if ((e.ctrlKey || e.metaKey) && onViewMetadata) {
+						e.preventDefault();
+						e.stopPropagation();
+						onViewMetadata(folder);
+						return;
+					}
+					onToggleExpand(folder.id);
+				}}
+				onKeyDown={(e) => {
+					if (e.key === "Enter" || e.key === " ") {
+						e.preventDefault();
+						onToggleExpand(folder.id);
+					}
+				}}
 					onDoubleClick={(e) => {
 						e.stopPropagation();
 						startRename();
diff --git a/surfsense_web/components/documents/FolderTreeView.tsx b/surfsense_web/components/documents/FolderTreeView.tsx
index 5945edccb..f34b9a0c2 100644
--- a/surfsense_web/components/documents/FolderTreeView.tsx
+++ b/surfsense_web/components/documents/FolderTreeView.tsx
@@ -43,6 +43,7 @@ interface FolderTreeViewProps {
 	watchedFolderIds?: Set<number>;
 	onRescanFolder?: (folder: FolderDisplay) => void;
 	onStopWatchingFolder?: (folder: FolderDisplay) => void;
+	onViewFolderMetadata?: (folder: FolderDisplay) => void;
 }
 
 function groupBy<T>(items: T[], keyFn: (item: T) => string | number): Record<string | number, T[]> {
@@ -79,6 +80,7 @@ export function FolderTreeView({
 	watchedFolderIds,
 	onRescanFolder,
 	onStopWatchingFolder,
+	onViewFolderMetadata,
 }: FolderTreeViewProps) {
 	const foldersByParent = useMemo(() => groupBy(folders, (f) => f.parentId ?? "root"), [folders]);
 
@@ -210,10 +212,11 @@ export function FolderTreeView({
 					siblingPositions={siblingPositions}
 					contextMenuOpen={openContextMenuId === `folder-${f.id}`}
 					onContextMenuOpenChange={(open) => setOpenContextMenuId(open ? `folder-${f.id}` : null)}
-					isWatched={watchedFolderIds?.has(f.id)}
-					onRescan={onRescanFolder}
-					onStopWatching={onStopWatchingFolder}
-				/>
+				isWatched={watchedFolderIds?.has(f.id)}
+				onRescan={onRescanFolder}
+				onStopWatching={onStopWatchingFolder}
+				onViewMetadata={onViewFolderMetadata}
+			/>
 			);
 
 			if (isExpanded) {
diff --git a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
index 202d170d9..f9d32bf98 100644
--- a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
@@ -21,6 +21,7 @@ import type { DocumentNodeDoc } from "@/components/documents/DocumentNode";
 import type { FolderDisplay } from "@/components/documents/FolderNode";
 import { FolderPickerDialog } from "@/components/documents/FolderPickerDialog";
 import { FolderTreeView } from "@/components/documents/FolderTreeView";
+import { JsonMetadataViewer } from "@/components/json-metadata-viewer";
 import { EXPORT_FILE_EXTENSIONS } from "@/components/shared/ExportMenuItems";
 import {
 	AlertDialog,
@@ -95,12 +96,46 @@ export function DocumentsSidebar({
 	const [activeTypes, setActiveTypes] = useState<DocumentTypeEnum[]>([]);
 	const [watchedFolderIds, setWatchedFolderIds] = useState<Set<number>>(new Set());
 
+	const [metadataFolder, setMetadataFolder] = useState<FolderDisplay | null>(null);
+	const [metadataJson, setMetadataJson] = useState<Record<string, unknown> | null>(null);
+	const [metadataLoading, setMetadataLoading] = useState(false);
+
 	useEffect(() => {
 		const api = typeof window !== "undefined" ? window.electronAPI : null;
 		if (!api?.getWatchedFolders) return;
 
 		async function loadWatchedIds() {
 			const folders = await api!.getWatchedFolders();
+
+			if (folders.length === 0) {
+				try {
+					const backendFolders = await documentsApiService.getWatchedFolders(searchSpaceId);
+					for (const bf of backendFolders) {
+						const meta = bf.metadata as Record<string, unknown> | null;
+						if (!meta?.watched || !meta.folder_path) continue;
+						await api!.addWatchedFolder({
+							path: meta.folder_path as string,
+							name: bf.name,
+							rootFolderId: bf.id,
+							searchSpaceId: bf.search_space_id,
+							excludePatterns: (meta.exclude_patterns as string[]) ?? [],
+							fileExtensions: (meta.file_extensions as string[] | null) ?? null,
+							active: true,
+						});
+					}
+					const recovered = await api!.getWatchedFolders();
+					const ids = new Set(
+						recovered
+							.filter((f) => f.rootFolderId != null)
+							.map((f) => f.rootFolderId as number)
+					);
+					setWatchedFolderIds(ids);
+					return;
+				} catch (err) {
+					console.error("[DocumentsSidebar] Recovery from backend failed:", err);
+				}
+			}
+
 			const ids = new Set(
 				folders
 					.filter((f) => f.rootFolderId != null)
@@ -110,7 +145,7 @@ export function DocumentsSidebar({
 		}
 
 		loadWatchedIds();
-	}, []);
+	}, [searchSpaceId]);
 	const { mutateAsync: deleteDocumentMutation } = useAtomValue(deleteDocumentMutationAtom);
 
 	const [sidebarDocs, setSidebarDocs] = useAtom(sidebarSelectedDocumentsAtom);
@@ -318,11 +353,30 @@ export function DocumentsSidebar({
 			}
 
 			await api.removeWatchedFolder(matched.path);
+			try {
+				await foldersApiService.stopWatching(folder.id);
+			} catch (err) {
+				console.error("[DocumentsSidebar] Failed to clear watched metadata:", err);
+			}
 			toast.success(`Stopped watching: ${matched.name}`);
 		},
 		[]
 	);
 
+	const handleViewFolderMetadata = useCallback(async (folder: FolderDisplay) => {
+		setMetadataFolder(folder);
+		setMetadataLoading(true);
+		try {
+			const fullFolder = await foldersApiService.getFolder(folder.id);
+			setMetadataJson((fullFolder.metadata as Record<string, unknown>) ?? {});
+		} catch (err) {
+			console.error("[DocumentsSidebar] Failed to fetch folder metadata:", err);
+			setMetadataJson({ error: "Failed to load folder metadata" });
+		} finally {
+			setMetadataLoading(false);
+		}
+	}, []);
+
 	const handleRenameFolder = useCallback(async (folder: FolderDisplay, newName: string) => {
 		try {
 			await foldersApiService.updateFolder(folder.id, { name: newName });
@@ -801,11 +855,26 @@ export function DocumentsSidebar({
 				onReorderFolder={handleReorderFolder}
 				watchedFolderIds={watchedFolderIds}
 				onRescanFolder={handleRescanFolder}
-				onStopWatchingFolder={handleStopWatching}
-			/>
-			</div>
+			onStopWatchingFolder={handleStopWatching}
+			onViewFolderMetadata={handleViewFolderMetadata}
+		/>
+		</div>
 
-			<FolderPickerDialog
+		<JsonMetadataViewer
+			title={metadataFolder?.name ?? "Folder"}
+			metadata={metadataJson}
+			loading={metadataLoading}
+			open={!!metadataFolder}
+			onOpenChange={(open) => {
+				if (!open) {
+					setMetadataFolder(null);
+					setMetadataJson(null);
+					setMetadataLoading(false);
+				}
+			}}
+		/>
+
+		<FolderPickerDialog
 				open={folderPickerOpen}
 				onOpenChange={setFolderPickerOpen}
 				folders={treeFolders}
diff --git a/surfsense_web/contracts/types/folder.types.ts b/surfsense_web/contracts/types/folder.types.ts
index d33a3ddd7..60919bf46 100644
--- a/surfsense_web/contracts/types/folder.types.ts
+++ b/surfsense_web/contracts/types/folder.types.ts
@@ -9,6 +9,7 @@ export const folder = z.object({
 	created_by_id: z.string().nullable().optional(),
 	created_at: z.string(),
 	updated_at: z.string(),
+	metadata: z.record(z.unknown()).nullable().optional(),
 });
 
 export const folderCreateRequest = z.object({
diff --git a/surfsense_web/lib/apis/documents-api.service.ts b/surfsense_web/lib/apis/documents-api.service.ts
index a8e3831d4..e8b228d03 100644
--- a/surfsense_web/lib/apis/documents-api.service.ts
+++ b/surfsense_web/lib/apis/documents-api.service.ts
@@ -37,6 +37,7 @@ import {
 	uploadDocumentRequest,
 	uploadDocumentResponse,
 } from "@/contracts/types/document.types";
+import { folderListResponse } from "@/contracts/types/folder.types";
 import { ValidationError } from "../error";
 import { baseApiService } from "./base-api.service";
 
@@ -403,6 +404,10 @@ class DocumentsApiService {
 		return baseApiService.post(`/api/v1/documents/folder-index-file`, undefined, { body });
 	};
 
+	getWatchedFolders = async (searchSpaceId: number) => {
+		return baseApiService.get(`/api/v1/documents/watched-folders?search_space_id=${searchSpaceId}`, folderListResponse);
+	};
+
 	/**
 	 * Delete a document
 	 */
diff --git a/surfsense_web/lib/apis/folders-api.service.ts b/surfsense_web/lib/apis/folders-api.service.ts
index 99d9ad774..2e535d615 100644
--- a/surfsense_web/lib/apis/folders-api.service.ts
+++ b/surfsense_web/lib/apis/folders-api.service.ts
@@ -85,6 +85,10 @@ class FoldersApiService {
 		return baseApiService.delete(`/api/v1/folders/${folderId}`, folderDeleteResponse);
 	};
 
+	stopWatching = async (folderId: number) => {
+		return baseApiService.patch(`/api/v1/folders/${folderId}/watched`, undefined);
+	};
+
 	moveDocument = async (documentId: number, request: DocumentMoveRequest) => {
 		const parsed = documentMoveRequest.safeParse(request);
 		if (!parsed.success) {

From 9c1d9357c4e3b0fe5eb25f737069d6494cea2188 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Thu, 2 Apr 2026 20:19:16 +0200
Subject: [PATCH 053/202] refactor: fix dynamic tooltip resizing and split
 autocomplete into SRP modules

---
 surfsense_desktop/electron-builder.yml        |  12 +-
 surfsense_desktop/package.json                |   1 +
 surfsense_desktop/pnpm-lock.yaml              |   3 +
 surfsense_desktop/scripts/build-electron.mjs  |   2 +-
 surfsense_desktop/src/main.ts                 |   3 +-
 .../index.ts}                                 | 181 ++++++++----------
 .../modules/autocomplete/keystroke-buffer.ts  |  76 ++++++++
 .../modules/autocomplete/suggestion-window.ts | 103 ++++++++++
 surfsense_desktop/src/modules/platform.ts     |  49 -----
 .../app/desktop/permissions/page.tsx          |  13 +-
 surfsense_web/app/desktop/suggestion/page.tsx |   6 +-
 .../app/desktop/suggestion/suggestion.css     |  70 ++++---
 12 files changed, 326 insertions(+), 193 deletions(-)
 rename surfsense_desktop/src/modules/{autocomplete.ts => autocomplete/index.ts} (55%)
 create mode 100644 surfsense_desktop/src/modules/autocomplete/keystroke-buffer.ts
 create mode 100644 surfsense_desktop/src/modules/autocomplete/suggestion-window.ts

diff --git a/surfsense_desktop/electron-builder.yml b/surfsense_desktop/electron-builder.yml
index 74c69d223..115b69c8e 100644
--- a/surfsense_desktop/electron-builder.yml
+++ b/surfsense_desktop/electron-builder.yml
@@ -10,13 +10,13 @@ files:
   - dist/**/*
   - "!node_modules"
   - node_modules/uiohook-napi/**/*
-  - "!node_modules/uiohook-napi/build"
   - "!node_modules/uiohook-napi/src"
   - "!node_modules/uiohook-napi/libuiohook"
   - "!node_modules/uiohook-napi/binding.gyp"
   - node_modules/node-gyp-build/**/*
+  - node_modules/bindings/**/*
+  - node_modules/file-uri-to-path/**/*
   - node_modules/node-mac-permissions/**/*
-  - "!node_modules/node-mac-permissions/build"
   - "!node_modules/node-mac-permissions/src"
   - "!node_modules/node-mac-permissions/binding.gyp"
   - "!src"
@@ -41,13 +41,19 @@ asarUnpack:
   - "**/*.node"
   - "node_modules/uiohook-napi/**/*"
   - "node_modules/node-gyp-build/**/*"
+  - "node_modules/bindings/**/*"
+  - "node_modules/file-uri-to-path/**/*"
   - "node_modules/node-mac-permissions/**/*"
 mac:
   icon: assets/icon.icns
   category: public.app-category.productivity
   artifactName: "${productName}-${version}-${arch}.${ext}"
-  hardenedRuntime: true
+  hardenedRuntime: false
   gatekeeperAssess: false
+  extendInfo:
+    NSInputMonitoringUsageDescription: "SurfSense uses input monitoring to provide system-wide autocomplete suggestions as you type."
+    NSAccessibilityUsageDescription: "SurfSense uses accessibility features to read text fields and insert suggestions."
+    NSAppleEventsUsageDescription: "SurfSense uses Apple Events to read text from the active application and insert autocomplete suggestions."
   target:
     - target: dmg
       arch: [x64, arm64]
diff --git a/surfsense_desktop/package.json b/surfsense_desktop/package.json
index a2e452b7c..01a63b265 100644
--- a/surfsense_desktop/package.json
+++ b/surfsense_desktop/package.json
@@ -29,6 +29,7 @@
     "wait-on": "^9.0.4"
   },
   "dependencies": {
+    "bindings": "^1.5.0",
     "electron-updater": "^6.8.3",
     "get-port-please": "^3.2.0",
     "node-mac-permissions": "^2.5.0",
diff --git a/surfsense_desktop/pnpm-lock.yaml b/surfsense_desktop/pnpm-lock.yaml
index 82bad9456..d0b453d31 100644
--- a/surfsense_desktop/pnpm-lock.yaml
+++ b/surfsense_desktop/pnpm-lock.yaml
@@ -8,6 +8,9 @@ importers:
 
   .:
     dependencies:
+      bindings:
+        specifier: ^1.5.0
+        version: 1.5.0
       electron-updater:
         specifier: ^6.8.3
         version: 6.8.3
diff --git a/surfsense_desktop/scripts/build-electron.mjs b/surfsense_desktop/scripts/build-electron.mjs
index 83d941dd2..c2869ec46 100644
--- a/surfsense_desktop/scripts/build-electron.mjs
+++ b/surfsense_desktop/scripts/build-electron.mjs
@@ -104,7 +104,7 @@ async function buildElectron() {
     bundle: true,
     platform: 'node',
     target: 'node18',
-    external: ['electron', 'uiohook-napi', 'node-mac-permissions'],
+    external: ['electron', 'uiohook-napi', 'node-mac-permissions', 'bindings', 'file-uri-to-path'],
     sourcemap: true,
     minify: false,
     define: {
diff --git a/surfsense_desktop/src/main.ts b/surfsense_desktop/src/main.ts
index 9623be82e..c96453c6d 100644
--- a/surfsense_desktop/src/main.ts
+++ b/surfsense_desktop/src/main.ts
@@ -19,7 +19,8 @@ if (!setupDeepLinks()) {
 registerIpcHandlers();
 
 function getInitialPath(): string {
-  if (process.platform === 'darwin' && !allPermissionsGranted()) {
+  const granted = allPermissionsGranted();
+  if (process.platform === 'darwin' && !granted) {
     return '/desktop/permissions';
   }
   return '/dashboard';
diff --git a/surfsense_desktop/src/modules/autocomplete.ts b/surfsense_desktop/src/modules/autocomplete/index.ts
similarity index 55%
rename from surfsense_desktop/src/modules/autocomplete.ts
rename to surfsense_desktop/src/modules/autocomplete/index.ts
index 2b877723f..2ea37d051 100644
--- a/surfsense_desktop/src/modules/autocomplete.ts
+++ b/surfsense_desktop/src/modules/autocomplete/index.ts
@@ -1,20 +1,19 @@
-import { BrowserWindow, clipboard, ipcMain, screen, shell } from 'electron';
-import path from 'path';
-import { IPC_CHANNELS } from '../ipc/channels';
-import { allPermissionsGranted } from './permissions';
-import { getFieldContent, getFrontmostApp, hasAccessibilityPermission, simulatePaste } from './platform';
-import { getServerPort } from './server';
-import { getMainWindow } from './window';
+import { clipboard, ipcMain, screen } from 'electron';
+import { IPC_CHANNELS } from '../../ipc/channels';
+import { getFrontmostApp, hasAccessibilityPermission, simulatePaste } from '../platform';
+import { getMainWindow } from '../window';
+import {
+  appendToBuffer, buildKeycodeMap, getBuffer, getBufferTrimmed,
+  getLastTrackedApp, removeLastChar, resetBuffer, resolveChar, setLastTrackedApp,
+} from './keystroke-buffer';
+import { createSuggestionWindow, destroySuggestion, getSuggestionWindow } from './suggestion-window';
 
 const DEBOUNCE_MS = 600;
-const TOOLTIP_WIDTH = 420;
-const TOOLTIP_HEIGHT = 140;
 
 let uIOhook: any = null;
 let UiohookKey: any = {};
 let IGNORED_KEYCODES: Set<number> = new Set();
 
-let suggestionWindow: BrowserWindow | null = null;
 let debounceTimer: ReturnType<typeof setTimeout> | null = null;
 let hookStarted = false;
 let autocompleteEnabled = true;
@@ -38,12 +37,8 @@ function loadUiohook(): boolean {
       UiohookKey.F5, UiohookKey.F6, UiohookKey.F7, UiohookKey.F8,
       UiohookKey.F9, UiohookKey.F10, UiohookKey.F11, UiohookKey.F12,
       UiohookKey.PrintScreen,
-      UiohookKey.Insert, UiohookKey.Delete,
-      UiohookKey.Home, UiohookKey.End,
-      UiohookKey.PageUp, UiohookKey.PageDown,
-      UiohookKey.ArrowUp, UiohookKey.ArrowDown,
-      UiohookKey.ArrowLeft, UiohookKey.ArrowRight,
     ]);
+    buildKeycodeMap();
     console.log('[autocomplete] uiohook-napi loaded');
     return true;
   } catch (err) {
@@ -52,70 +47,6 @@ function loadUiohook(): boolean {
   }
 }
 
-function destroySuggestion(): void {
-  if (suggestionWindow && !suggestionWindow.isDestroyed()) {
-    suggestionWindow.close();
-  }
-  suggestionWindow = null;
-}
-
-function clampToScreen(x: number, y: number, w: number, h: number): { x: number; y: number } {
-  const display = screen.getDisplayNearestPoint({ x, y });
-  const { x: dx, y: dy, width: dw, height: dh } = display.workArea;
-  return {
-    x: Math.max(dx, Math.min(x, dx + dw - w)),
-    y: Math.max(dy, Math.min(y, dy + dh - h)),
-  };
-}
-
-function createSuggestionWindow(x: number, y: number): BrowserWindow {
-  destroySuggestion();
-
-  const pos = clampToScreen(x, y + 20, TOOLTIP_WIDTH, TOOLTIP_HEIGHT);
-
-  suggestionWindow = new BrowserWindow({
-    width: TOOLTIP_WIDTH,
-    height: TOOLTIP_HEIGHT,
-    x: pos.x,
-    y: pos.y,
-    frame: false,
-    transparent: true,
-    focusable: false,
-    alwaysOnTop: true,
-    skipTaskbar: true,
-    resizable: false,
-    hasShadow: true,
-    type: 'panel',
-    webPreferences: {
-      preload: path.join(__dirname, 'preload.js'),
-      contextIsolation: true,
-      nodeIntegration: false,
-      sandbox: true,
-    },
-    show: false,
-  });
-
-  suggestionWindow.loadURL(`http://localhost:${getServerPort()}/desktop/suggestion?t=${Date.now()}`);
-
-  suggestionWindow.once('ready-to-show', () => {
-    suggestionWindow?.showInactive();
-  });
-
-  suggestionWindow.webContents.setWindowOpenHandler(({ url }) => {
-    if (url.startsWith('http://localhost')) {
-      return { action: 'allow' };
-    }
-    shell.openExternal(url);
-    return { action: 'deny' };
-  });
-
-  suggestionWindow.on('closed', () => {
-    suggestionWindow = null;
-  });
-
-  return suggestionWindow;
-}
-
 function clearDebounce(): void {
   if (debounceTimer) {
     clearTimeout(debounceTimer);
@@ -128,10 +59,24 @@ function isSurfSenseWindow(): boolean {
   return app === 'Electron' || app === 'SurfSense' || app === 'surfsense-desktop';
 }
 
-function onKeyDown(event: { keycode: number; ctrlKey?: boolean; metaKey?: boolean; altKey?: boolean }): void {
+function onKeyDown(event: {
+  keycode: number;
+  shiftKey?: boolean;
+  ctrlKey?: boolean;
+  metaKey?: boolean;
+  altKey?: boolean;
+}): void {
   if (!autocompleteEnabled) return;
 
-  if (event.keycode === UiohookKey.Tab && suggestionWindow && !suggestionWindow.isDestroyed()) {
+  const currentApp = getFrontmostApp();
+  if (currentApp !== getLastTrackedApp()) {
+    resetBuffer();
+    setLastTrackedApp(currentApp);
+  }
+
+  const win = getSuggestionWindow();
+
+  if (event.keycode === UiohookKey.Tab && win && !win.isDestroyed()) {
     if (pendingSuggestionText) {
       acceptAndInject(pendingSuggestionText);
     }
@@ -139,7 +84,7 @@ function onKeyDown(event: { keycode: number; ctrlKey?: boolean; metaKey?: boolea
   }
 
   if (event.keycode === UiohookKey.Escape) {
-    if (suggestionWindow && !suggestionWindow.isDestroyed()) {
+    if (win && !win.isDestroyed()) {
       destroySuggestion();
       pendingSuggestionText = '';
     }
@@ -147,11 +92,41 @@ function onKeyDown(event: { keycode: number; ctrlKey?: boolean; metaKey?: boolea
     return;
   }
 
-  if (IGNORED_KEYCODES.has(event.keycode)) return;
-  if (event.ctrlKey || event.metaKey || event.altKey) return;
-  if (isSurfSenseWindow()) return;
+  if (currentApp === 'Electron' || currentApp === 'SurfSense' || currentApp === 'surfsense-desktop') {
+    return;
+  }
 
-  if (suggestionWindow && !suggestionWindow.isDestroyed()) {
+  if (event.ctrlKey || event.metaKey || event.altKey) {
+    resetBuffer();
+    clearDebounce();
+    return;
+  }
+
+  if (event.keycode === UiohookKey.Backspace) {
+    removeLastChar();
+  } else if (event.keycode === UiohookKey.Delete) {
+    // forward delete doesn't affect our trailing buffer
+  } else if (event.keycode === UiohookKey.Enter) {
+    appendToBuffer('\n');
+  } else if (event.keycode === UiohookKey.Space) {
+    appendToBuffer(' ');
+  } else if (
+    event.keycode === UiohookKey.ArrowLeft || event.keycode === UiohookKey.ArrowRight ||
+    event.keycode === UiohookKey.ArrowUp || event.keycode === UiohookKey.ArrowDown ||
+    event.keycode === UiohookKey.Home || event.keycode === UiohookKey.End ||
+    event.keycode === UiohookKey.PageUp || event.keycode === UiohookKey.PageDown
+  ) {
+    resetBuffer();
+    clearDebounce();
+    return;
+  } else if (IGNORED_KEYCODES.has(event.keycode)) {
+    return;
+  } else {
+    const ch = resolveChar(event.keycode, !!event.shiftKey);
+    if (ch) appendToBuffer(ch);
+  }
+
+  if (win && !win.isDestroyed()) {
     destroySuggestion();
   }
 
@@ -161,13 +136,16 @@ function onKeyDown(event: { keycode: number; ctrlKey?: boolean; metaKey?: boolea
   }, DEBOUNCE_MS);
 }
 
+function onMouseClick(): void {
+  resetBuffer();
+}
+
 async function triggerAutocomplete(): Promise<void> {
   if (!hasAccessibilityPermission()) return;
   if (isSurfSenseWindow()) return;
 
-  const fieldContent = getFieldContent();
-  if (!fieldContent || !fieldContent.text.trim()) return;
-  if (fieldContent.text.trim().length < 5) return;
+  const text = getBufferTrimmed();
+  if (!text || text.length < 5) return;
 
   sourceApp = getFrontmostApp();
   savedClipboard = clipboard.readText();
@@ -186,13 +164,16 @@ async function triggerAutocomplete(): Promise<void> {
   }
 
   win.webContents.once('did-finish-load', () => {
-    if (suggestionWindow && !suggestionWindow.isDestroyed()) {
-      suggestionWindow.webContents.send(IPC_CHANNELS.AUTOCOMPLETE_CONTEXT, {
-        text: fieldContent.text,
-        cursorPosition: fieldContent.cursorPosition,
-        searchSpaceId,
-      });
-    }
+    const sw = getSuggestionWindow();
+    setTimeout(() => {
+      if (sw && !sw.isDestroyed()) {
+        sw.webContents.send(IPC_CHANNELS.AUTOCOMPLETE_CONTEXT, {
+          text: getBuffer(),
+          cursorPosition: getBuffer().length,
+          searchSpaceId,
+        });
+      }
+    }, 300);
   });
 }
 
@@ -209,6 +190,7 @@ async function acceptAndInject(text: string): Promise<void> {
     simulatePaste();
     await new Promise((r) => setTimeout(r, 100));
     clipboard.writeText(savedClipboard);
+    appendToBuffer(text);
   } catch {
     clipboard.writeText(savedClipboard);
   }
@@ -238,21 +220,16 @@ function registerIpcHandlers(): void {
 export function registerAutocomplete(): void {
   registerIpcHandlers();
 
-  if (!allPermissionsGranted()) {
-    console.log('[autocomplete] Permissions not granted — hook not started');
-    return;
-  }
-
   if (!loadUiohook()) {
     console.error('[autocomplete] Cannot start: uiohook-napi failed to load');
     return;
   }
 
   uIOhook.on('keydown', onKeyDown);
+  uIOhook.on('click', onMouseClick);
   try {
     uIOhook.start();
     hookStarted = true;
-    console.log('[autocomplete] uIOhook started');
   } catch (err) {
     console.error('[autocomplete] uIOhook.start() failed:', err);
   }
diff --git a/surfsense_desktop/src/modules/autocomplete/keystroke-buffer.ts b/surfsense_desktop/src/modules/autocomplete/keystroke-buffer.ts
new file mode 100644
index 000000000..ca232d307
--- /dev/null
+++ b/surfsense_desktop/src/modules/autocomplete/keystroke-buffer.ts
@@ -0,0 +1,76 @@
+const MAX_BUFFER_LENGTH = 4000;
+const KEYCODE_TO_CHAR: Record<number, [string, string]> = {};
+
+let keystrokeBuffer = '';
+let lastTrackedApp = '';
+
+export function buildKeycodeMap(): void {
+  const letters: [string, number][] = [
+    ['q', 16], ['w', 17], ['e', 18], ['r', 19], ['t', 20],
+    ['y', 21], ['u', 22], ['i', 23], ['o', 24], ['p', 25],
+    ['a', 30], ['s', 31], ['d', 32], ['f', 33], ['g', 34],
+    ['h', 35], ['j', 36], ['k', 37], ['l', 38],
+    ['z', 44], ['x', 45], ['c', 46], ['v', 47],
+    ['b', 48], ['n', 49], ['m', 50],
+  ];
+  for (const [ch, code] of letters) {
+    KEYCODE_TO_CHAR[code] = [ch, ch.toUpperCase()];
+  }
+
+  const digits: [string, string, number][] = [
+    ['1', '!', 2], ['2', '@', 3], ['3', '#', 4], ['4', '$', 5],
+    ['5', '%', 6], ['6', '^', 7], ['7', '&', 8], ['8', '*', 9],
+    ['9', '(', 10], ['0', ')', 11],
+  ];
+  for (const [norm, shifted, code] of digits) {
+    KEYCODE_TO_CHAR[code] = [norm, shifted];
+  }
+
+  const punctuation: [string, string, number][] = [
+    [';', ':', 39], ['=', '+', 13], [',', '<', 51], ['-', '_', 12],
+    ['.', '>', 52], ['/', '?', 53], ['`', '~', 41], ['[', '{', 26],
+    ['\\', '|', 43], [']', '}', 27], ["'", '"', 40],
+  ];
+  for (const [norm, shifted, code] of punctuation) {
+    KEYCODE_TO_CHAR[code] = [norm, shifted];
+  }
+}
+
+export function resetBuffer(): void {
+  keystrokeBuffer = '';
+}
+
+export function appendToBuffer(char: string): void {
+  keystrokeBuffer += char;
+  if (keystrokeBuffer.length > MAX_BUFFER_LENGTH) {
+    keystrokeBuffer = keystrokeBuffer.slice(-MAX_BUFFER_LENGTH);
+  }
+}
+
+export function removeLastChar(): void {
+  if (keystrokeBuffer.length > 0) {
+    keystrokeBuffer = keystrokeBuffer.slice(0, -1);
+  }
+}
+
+export function getBuffer(): string {
+  return keystrokeBuffer;
+}
+
+export function getBufferTrimmed(): string {
+  return keystrokeBuffer.trim();
+}
+
+export function getLastTrackedApp(): string {
+  return lastTrackedApp;
+}
+
+export function setLastTrackedApp(app: string): void {
+  lastTrackedApp = app;
+}
+
+export function resolveChar(keycode: number, shift: boolean): string | null {
+  const mapping = KEYCODE_TO_CHAR[keycode];
+  if (!mapping) return null;
+  return shift ? mapping[1] : mapping[0];
+}
diff --git a/surfsense_desktop/src/modules/autocomplete/suggestion-window.ts b/surfsense_desktop/src/modules/autocomplete/suggestion-window.ts
new file mode 100644
index 000000000..f03930cf6
--- /dev/null
+++ b/surfsense_desktop/src/modules/autocomplete/suggestion-window.ts
@@ -0,0 +1,103 @@
+import { BrowserWindow, screen, shell } from 'electron';
+import path from 'path';
+import { getServerPort } from '../server';
+
+const TOOLTIP_WIDTH = 420;
+const TOOLTIP_HEIGHT = 38;
+const MAX_HEIGHT = 400;
+
+let suggestionWindow: BrowserWindow | null = null;
+let resizeTimer: ReturnType<typeof setInterval> | null = null;
+
+function clampToScreen(x: number, y: number, w: number, h: number): { x: number; y: number } {
+  const display = screen.getDisplayNearestPoint({ x, y });
+  const { x: dx, y: dy, width: dw, height: dh } = display.workArea;
+  return {
+    x: Math.max(dx, Math.min(x, dx + dw - w)),
+    y: Math.max(dy, Math.min(y, dy + dh - h)),
+  };
+}
+
+function stopResizePolling(): void {
+  if (resizeTimer) { clearInterval(resizeTimer); resizeTimer = null; }
+}
+
+function startResizePolling(win: BrowserWindow): void {
+  stopResizePolling();
+  let lastH = 0;
+  resizeTimer = setInterval(async () => {
+    if (!win || win.isDestroyed()) { stopResizePolling(); return; }
+    try {
+      const h: number = await win.webContents.executeJavaScript(
+        `document.body.scrollHeight`
+      );
+      if (h > 0 && h !== lastH) {
+        lastH = h;
+        const clamped = Math.min(h, MAX_HEIGHT);
+        const bounds = win.getBounds();
+        win.setBounds({ x: bounds.x, y: bounds.y, width: TOOLTIP_WIDTH, height: clamped });
+      }
+    } catch {}
+  }, 150);
+}
+
+export function getSuggestionWindow(): BrowserWindow | null {
+  return suggestionWindow;
+}
+
+export function destroySuggestion(): void {
+  stopResizePolling();
+  if (suggestionWindow && !suggestionWindow.isDestroyed()) {
+    suggestionWindow.close();
+  }
+  suggestionWindow = null;
+}
+
+export function createSuggestionWindow(x: number, y: number): BrowserWindow {
+  destroySuggestion();
+
+  const pos = clampToScreen(x, y + 20, TOOLTIP_WIDTH, TOOLTIP_HEIGHT);
+
+  suggestionWindow = new BrowserWindow({
+    width: TOOLTIP_WIDTH,
+    height: TOOLTIP_HEIGHT,
+    x: pos.x,
+    y: pos.y,
+    frame: false,
+    transparent: true,
+    focusable: false,
+    alwaysOnTop: true,
+    skipTaskbar: true,
+    hasShadow: true,
+    type: 'panel',
+    webPreferences: {
+      preload: path.join(__dirname, '..', 'preload.js'),
+      contextIsolation: true,
+      nodeIntegration: false,
+      sandbox: true,
+    },
+    show: false,
+  });
+
+  suggestionWindow.loadURL(`http://localhost:${getServerPort()}/desktop/suggestion?t=${Date.now()}`);
+
+  suggestionWindow.once('ready-to-show', () => {
+    suggestionWindow?.showInactive();
+    if (suggestionWindow) startResizePolling(suggestionWindow);
+  });
+
+  suggestionWindow.webContents.setWindowOpenHandler(({ url }) => {
+    if (url.startsWith('http://localhost')) {
+      return { action: 'allow' };
+    }
+    shell.openExternal(url);
+    return { action: 'deny' };
+  });
+
+  suggestionWindow.on('closed', () => {
+    stopResizePolling();
+    suggestionWindow = null;
+  });
+
+  return suggestionWindow;
+}
diff --git a/surfsense_desktop/src/modules/platform.ts b/surfsense_desktop/src/modules/platform.ts
index 262866d07..1ab0c38fb 100644
--- a/surfsense_desktop/src/modules/platform.ts
+++ b/surfsense_desktop/src/modules/platform.ts
@@ -19,20 +19,6 @@ export function getFrontmostApp(): string {
   return '';
 }
 
-export function getSelectedText(): string {
-  try {
-    if (process.platform === 'darwin') {
-      return execSync(
-        'osascript -e \'tell application "System Events" to get value of attribute "AXSelectedText" of focused UI element of first application process whose frontmost is true\''
-      ).toString().trim();
-    }
-    // Windows: no reliable accessibility API for selected text across apps
-  } catch {
-    return '';
-  }
-  return '';
-}
-
 export function simulateCopy(): void {
   if (process.platform === 'darwin') {
     execSync('osascript -e \'tell application "System Events" to keystroke "c" using command down\'');
@@ -58,38 +44,3 @@ export function hasAccessibilityPermission(): boolean {
   if (process.platform !== 'darwin') return true;
   return systemPreferences.isTrustedAccessibilityClient(false);
 }
-
-export interface FieldContent {
-  text: string;
-  cursorPosition: number;
-}
-
-export function getFieldContent(): FieldContent | null {
-  if (process.platform !== 'darwin') return null;
-
-  try {
-    const text = execSync(
-      'osascript -e \'tell application "System Events" to get value of attribute "AXValue" of focused UI element of first application process whose frontmost is true\'',
-      { timeout: 500 }
-    ).toString().trim();
-
-    let cursorPosition = text.length;
-    try {
-      const rangeStr = execSync(
-        'osascript -e \'tell application "System Events" to get value of attribute "AXSelectedTextRange" of focused UI element of first application process whose frontmost is true\'',
-        { timeout: 500 }
-      ).toString().trim();
-
-      const locationMatch = rangeStr.match(/location[:\s]*(\d+)/i);
-      if (locationMatch) {
-        cursorPosition = parseInt(locationMatch[1], 10);
-      }
-    } catch {
-      // Fall back to end of text
-    }
-
-    return { text, cursorPosition };
-  } catch {
-    return null;
-  }
-}
diff --git a/surfsense_web/app/desktop/permissions/page.tsx b/surfsense_web/app/desktop/permissions/page.tsx
index 2bcdc42df..8bde63357 100644
--- a/surfsense_web/app/desktop/permissions/page.tsx
+++ b/surfsense_web/app/desktop/permissions/page.tsx
@@ -169,11 +169,14 @@ export default function DesktopPermissionsPage() {
 										>
 											Open System Settings
 										</Button>
-										{status === "denied" && (
-											<p className="text-xs text-amber-700 dark:text-amber-400">
-												Toggle SurfSense on in System Settings to continue.
-											</p>
-										)}
+									{status === "denied" && (
+										<p className="text-xs text-amber-700 dark:text-amber-400">
+											Toggle SurfSense on in System Settings to continue.
+										</p>
+									)}
+									<p className="text-xs text-muted-foreground">
+										If SurfSense doesn&apos;t appear in the list, click <strong>+</strong> and select it from Applications.
+									</p>
 									</div>
 								)}
 							</div>
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index 14dfab3af..69a19e3f1 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -151,9 +151,9 @@ export default function SuggestionPage() {
 		<div className="suggestion-tooltip">
 			<p className="suggestion-text">{suggestion}</p>
 			<div className="suggestion-hint">
-				<span className="suggestion-key">Tab</span> accept
-				<span className="suggestion-separator">·</span>
-				<span className="suggestion-key">Esc</span> dismiss
+				<kbd>Tab</kbd> accept
+				<span className="suggestion-separator" />
+				<kbd>Esc</kbd> dismiss
 			</div>
 		</div>
 	);
diff --git a/surfsense_web/app/desktop/suggestion/suggestion.css b/surfsense_web/app/desktop/suggestion/suggestion.css
index e9471e7f8..0d3332103 100644
--- a/surfsense_web/app/desktop/suggestion/suggestion.css
+++ b/surfsense_web/app/desktop/suggestion/suggestion.css
@@ -1,8 +1,16 @@
+html, body {
+  margin: 0 !important;
+  padding: 0 !important;
+  background: transparent !important;
+  overflow: hidden !important;
+  height: auto !important;
+  width: 100% !important;
+}
+
 .suggestion-body {
   margin: 0;
   padding: 0;
   background: transparent;
-  overflow: hidden;
   font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
   -webkit-font-smoothing: antialiased;
   user-select: none;
@@ -10,69 +18,73 @@
 }
 
 .suggestion-tooltip {
-  background: rgba(30, 30, 30, 0.95);
-  backdrop-filter: blur(12px);
-  -webkit-backdrop-filter: blur(12px);
-  border: 1px solid rgba(255, 255, 255, 0.1);
-  border-radius: 10px;
-  padding: 10px 14px;
+  background: #1e1e1e;
+  border: 1px solid #3c3c3c;
+  border-radius: 8px;
+  padding: 8px 12px;
   margin: 4px;
   max-width: 400px;
-  box-shadow: 0 8px 32px rgba(0, 0, 0, 0.4),
-              0 2px 8px rgba(0, 0, 0, 0.2);
+  box-shadow: 0 4px 16px rgba(0, 0, 0, 0.5);
 }
 
 .suggestion-text {
-  color: rgba(255, 255, 255, 0.9);
+  color: #d4d4d4;
   font-size: 13px;
-  line-height: 1.5;
-  margin: 0 0 8px 0;
+  line-height: 1.45;
+  margin: 0 0 6px 0;
   word-wrap: break-word;
   white-space: pre-wrap;
 }
 
 .suggestion-hint {
-  color: rgba(255, 255, 255, 0.4);
+  color: #666;
   font-size: 11px;
   display: flex;
   align-items: center;
-  gap: 4px;
+  gap: 6px;
+  border-top: 1px solid #2a2a2a;
+  padding-top: 6px;
 }
 
-.suggestion-key {
-  background: rgba(255, 255, 255, 0.1);
-  border: 1px solid rgba(255, 255, 255, 0.15);
+.suggestion-hint kbd {
+  background: #2a2a2a;
+  border: 1px solid #3c3c3c;
   border-radius: 3px;
-  padding: 1px 5px;
+  padding: 0 4px;
+  font-family: inherit;
   font-size: 10px;
-  font-weight: 500;
-  color: rgba(255, 255, 255, 0.6);
+  font-weight: 600;
+  color: #999;
+  line-height: 18px;
 }
 
 .suggestion-separator {
-  margin: 0 2px;
+  width: 1px;
+  height: 10px;
+  background: #333;
 }
 
 .suggestion-error {
-  border-color: rgba(255, 80, 80, 0.3);
+  border-color: #5c2626;
 }
 
 .suggestion-error-text {
-  color: rgba(255, 120, 120, 0.9);
+  color: #f48771;
   font-size: 12px;
 }
 
 .suggestion-loading {
   display: flex;
-  gap: 4px;
-  padding: 4px 0;
+  gap: 5px;
+  padding: 2px 0;
+  justify-content: center;
 }
 
 .suggestion-dot {
-  width: 5px;
-  height: 5px;
+  width: 4px;
+  height: 4px;
   border-radius: 50%;
-  background: rgba(255, 255, 255, 0.4);
+  background: #666;
   animation: suggestion-pulse 1.2s infinite ease-in-out;
 }
 
@@ -91,6 +103,6 @@
   }
   40% {
     opacity: 1;
-    transform: scale(1);
+    transform: scale(1.1);
   }
 }

From 3e68d4aa3ed04c87f155a4da08a6610251755f74 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Thu, 2 Apr 2026 20:38:09 +0200
Subject: [PATCH 054/202] refactor: extract autocomplete service and fix
 tooltip screen-edge positioning

---
 .../app/routes/autocomplete_routes.py         | 109 +----------------
 .../app/services/autocomplete_service.py      | 110 ++++++++++++++++++
 .../modules/autocomplete/suggestion-window.ts |  27 +++--
 3 files changed, 130 insertions(+), 116 deletions(-)
 create mode 100644 surfsense_backend/app/services/autocomplete_service.py

diff --git a/surfsense_backend/app/routes/autocomplete_routes.py b/surfsense_backend/app/routes/autocomplete_routes.py
index 9a285a723..68c56d0e0 100644
--- a/surfsense_backend/app/routes/autocomplete_routes.py
+++ b/surfsense_backend/app/routes/autocomplete_routes.py
@@ -1,118 +1,14 @@
-import logging
-from typing import AsyncGenerator
-
 from fastapi import APIRouter, Depends, Query
 from fastapi.responses import StreamingResponse
-from langchain_core.messages import HumanMessage, SystemMessage
 from sqlalchemy.ext.asyncio import AsyncSession
 
 from app.db import User, get_async_session
-from app.retriever.chunks_hybrid_search import ChucksHybridSearchRetriever
-from app.services.llm_service import get_agent_llm
+from app.services.autocomplete_service import stream_autocomplete
 from app.services.new_streaming_service import VercelStreamingService
 from app.users import current_active_user
 
-logger = logging.getLogger(__name__)
-
 router = APIRouter(prefix="/autocomplete", tags=["autocomplete"])
 
-AUTOCOMPLETE_SYSTEM_PROMPT = """You are an inline text autocomplete engine. Your job is to complete the user's text naturally.
-
-Rules:
-- Output ONLY the continuation text. Do NOT repeat what the user already typed.
-- Keep completions concise: 1-3 sentences maximum.
-- Match the user's tone, style, and language.
-- If knowledge base context is provided, use it to make the completion factually accurate and personalized.
-- Do NOT add quotes, explanations, or meta-commentary.
-- Do NOT start with a space unless grammatically required.
-- If you cannot produce a useful completion, output nothing."""
-
-KB_CONTEXT_TEMPLATE = """
-Relevant knowledge base context (use this to personalize the completion):
----
-{kb_context}
----
-"""
-
-
-async def _stream_autocomplete(
-    text: str,
-    cursor_position: int,
-    search_space_id: int,
-    session: AsyncSession,
-) -> AsyncGenerator[str, None]:
-    """Stream an autocomplete response with KB context."""
-    streaming_service = VercelStreamingService()
-
-    try:
-        # Text before cursor is what we're completing
-        text_before_cursor = text[:cursor_position] if cursor_position >= 0 else text
-
-        if not text_before_cursor.strip():
-            yield streaming_service.format_message_start()
-            yield streaming_service.format_finish()
-            yield streaming_service.format_done()
-            return
-
-        # Fast KB lookup: vector-only search, top 3 chunks, no planner LLM
-        kb_context = ""
-        try:
-            retriever = ChucksHybridSearchRetriever(session)
-            chunks = await retriever.vector_search(
-                query_text=text_before_cursor[-200:],  # last 200 chars for relevance
-                top_k=3,
-                search_space_id=search_space_id,
-            )
-            if chunks:
-                kb_snippets = []
-                for chunk in chunks:
-                    content = getattr(chunk, "content", None) or getattr(chunk, "chunk_text", "")
-                    if content:
-                        kb_snippets.append(content[:300])
-                if kb_snippets:
-                    kb_context = KB_CONTEXT_TEMPLATE.format(
-                        kb_context="\n\n".join(kb_snippets)
-                    )
-        except Exception as e:
-            logger.warning(f"KB search failed for autocomplete, proceeding without context: {e}")
-
-        # Get the search space's configured LLM
-        llm = await get_agent_llm(session, search_space_id)
-        if not llm:
-            yield streaming_service.format_message_start()
-            error_msg = "No LLM configured for this search space"
-            yield streaming_service.format_error(error_msg)
-            yield streaming_service.format_done()
-            return
-
-        system_prompt = AUTOCOMPLETE_SYSTEM_PROMPT
-        if kb_context:
-            system_prompt += kb_context
-
-        messages = [
-            SystemMessage(content=system_prompt),
-            HumanMessage(content=f"Complete this text:\n{text_before_cursor}"),
-        ]
-
-        # Stream the response
-        yield streaming_service.format_message_start()
-        text_id = streaming_service.generate_text_id()
-        yield streaming_service.format_text_start(text_id)
-
-        async for chunk in llm.astream(messages):
-            token = chunk.content if hasattr(chunk, "content") else str(chunk)
-            if token:
-                yield streaming_service.format_text_delta(text_id, token)
-
-        yield streaming_service.format_text_end(text_id)
-        yield streaming_service.format_finish()
-        yield streaming_service.format_done()
-
-    except Exception as e:
-        logger.error(f"Autocomplete streaming error: {e}")
-        yield streaming_service.format_error(str(e))
-        yield streaming_service.format_done()
-
 
 @router.post("/stream")
 async def autocomplete_stream(
@@ -122,12 +18,11 @@ async def autocomplete_stream(
     user: User = Depends(current_active_user),
     session: AsyncSession = Depends(get_async_session),
 ):
-    """Stream an autocomplete suggestion based on the current text and KB context."""
     if cursor_position < 0:
         cursor_position = len(text)
 
     return StreamingResponse(
-        _stream_autocomplete(text, cursor_position, search_space_id, session),
+        stream_autocomplete(text, cursor_position, search_space_id, session),
         media_type="text/event-stream",
         headers={
             **VercelStreamingService.get_response_headers(),
diff --git a/surfsense_backend/app/services/autocomplete_service.py b/surfsense_backend/app/services/autocomplete_service.py
new file mode 100644
index 000000000..7c172275d
--- /dev/null
+++ b/surfsense_backend/app/services/autocomplete_service.py
@@ -0,0 +1,110 @@
+import logging
+from typing import AsyncGenerator
+
+from langchain_core.messages import HumanMessage, SystemMessage
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from app.retriever.chunks_hybrid_search import ChucksHybridSearchRetriever
+from app.services.llm_service import get_agent_llm
+from app.services.new_streaming_service import VercelStreamingService
+
+logger = logging.getLogger(__name__)
+
+SYSTEM_PROMPT = """You are an inline text autocomplete engine. Your job is to complete the user's text naturally.
+
+Rules:
+- Output ONLY the continuation text. Do NOT repeat what the user already typed.
+- Keep completions concise: 1-3 sentences maximum.
+- Match the user's tone, style, and language.
+- If knowledge base context is provided, use it to make the completion factually accurate and personalized.
+- Do NOT add quotes, explanations, or meta-commentary.
+- Do NOT start with a space unless grammatically required.
+- If you cannot produce a useful completion, output nothing."""
+
+KB_CONTEXT_TEMPLATE = """
+Relevant knowledge base context (use this to personalize the completion):
+---
+{kb_context}
+---
+"""
+
+
+async def _retrieve_kb_context(
+    session: AsyncSession,
+    text: str,
+    search_space_id: int,
+) -> str:
+    try:
+        retriever = ChucksHybridSearchRetriever(session)
+        chunks = await retriever.vector_search(
+            query_text=text[-200:],
+            top_k=3,
+            search_space_id=search_space_id,
+        )
+        if not chunks:
+            return ""
+        snippets = []
+        for chunk in chunks:
+            content = getattr(chunk, "content", None) or getattr(chunk, "chunk_text", "")
+            if content:
+                snippets.append(content[:300])
+        if not snippets:
+            return ""
+        return KB_CONTEXT_TEMPLATE.format(kb_context="\n\n".join(snippets))
+    except Exception as e:
+        logger.warning(f"KB search failed for autocomplete, proceeding without context: {e}")
+        return ""
+
+
+async def stream_autocomplete(
+    text: str,
+    cursor_position: int,
+    search_space_id: int,
+    session: AsyncSession,
+) -> AsyncGenerator[str, None]:
+    """Build context, call the LLM, and yield SSE-formatted tokens."""
+    streaming = VercelStreamingService()
+    text_before_cursor = text[:cursor_position] if cursor_position >= 0 else text
+
+    if not text_before_cursor.strip():
+        yield streaming.format_message_start()
+        yield streaming.format_finish()
+        yield streaming.format_done()
+        return
+
+    kb_context = await _retrieve_kb_context(session, text_before_cursor, search_space_id)
+
+    llm = await get_agent_llm(session, search_space_id)
+    if not llm:
+        yield streaming.format_message_start()
+        yield streaming.format_error("No LLM configured for this search space")
+        yield streaming.format_done()
+        return
+
+    system_prompt = SYSTEM_PROMPT
+    if kb_context:
+        system_prompt += kb_context
+
+    messages = [
+        SystemMessage(content=system_prompt),
+        HumanMessage(content=f"Complete this text:\n{text_before_cursor}"),
+    ]
+
+    try:
+        yield streaming.format_message_start()
+        text_id = streaming.generate_text_id()
+        yield streaming.format_text_start(text_id)
+
+        async for chunk in llm.astream(messages):
+            token = chunk.content if hasattr(chunk, "content") else str(chunk)
+            if token:
+                yield streaming.format_text_delta(text_id, token)
+
+        yield streaming.format_text_end(text_id)
+        yield streaming.format_finish()
+        yield streaming.format_done()
+
+    except Exception as e:
+        logger.error(f"Autocomplete streaming error: {e}")
+        yield streaming.format_error(str(e))
+        yield streaming.format_done()
diff --git a/surfsense_desktop/src/modules/autocomplete/suggestion-window.ts b/surfsense_desktop/src/modules/autocomplete/suggestion-window.ts
index f03930cf6..e8a2f3a91 100644
--- a/surfsense_desktop/src/modules/autocomplete/suggestion-window.ts
+++ b/surfsense_desktop/src/modules/autocomplete/suggestion-window.ts
@@ -8,14 +8,22 @@ const MAX_HEIGHT = 400;
 
 let suggestionWindow: BrowserWindow | null = null;
 let resizeTimer: ReturnType<typeof setInterval> | null = null;
+let cursorOrigin = { x: 0, y: 0 };
 
-function clampToScreen(x: number, y: number, w: number, h: number): { x: number; y: number } {
-  const display = screen.getDisplayNearestPoint({ x, y });
+const CURSOR_GAP = 20;
+
+function positionOnScreen(cursorX: number, cursorY: number, w: number, h: number): { x: number; y: number } {
+  const display = screen.getDisplayNearestPoint({ x: cursorX, y: cursorY });
   const { x: dx, y: dy, width: dw, height: dh } = display.workArea;
-  return {
-    x: Math.max(dx, Math.min(x, dx + dw - w)),
-    y: Math.max(dy, Math.min(y, dy + dh - h)),
-  };
+  // Places a w x h window near the cursor. Horizontally it is clamped into the display's work area.
+  const x = Math.max(dx, Math.min(cursorX, dx + dw - w));
+  // Vertically: sit CURSOR_GAP below the cursor when the full height fits there, otherwise flip above it.
+  const spaceBelow = (dy + dh) - (cursorY + CURSOR_GAP);
+  const y = spaceBelow >= h
+    ? cursorY + CURSOR_GAP
+    : cursorY - h - CURSOR_GAP;
+  // The flipped position may land above the work area; never return a y smaller than its top edge.
+  return { x, y: Math.max(dy, y) };
 }
 
 function stopResizePolling(): void {
@@ -34,8 +42,8 @@ function startResizePolling(win: BrowserWindow): void {
       if (h > 0 && h !== lastH) {
         lastH = h;
         const clamped = Math.min(h, MAX_HEIGHT);
-        const bounds = win.getBounds();
-        win.setBounds({ x: bounds.x, y: bounds.y, width: TOOLTIP_WIDTH, height: clamped });
+        const pos = positionOnScreen(cursorOrigin.x, cursorOrigin.y, TOOLTIP_WIDTH, clamped);
+        win.setBounds({ x: pos.x, y: pos.y, width: TOOLTIP_WIDTH, height: clamped });
       }
     } catch {}
   }, 150);
@@ -55,8 +63,9 @@ export function destroySuggestion(): void {
 
 export function createSuggestionWindow(x: number, y: number): BrowserWindow {
   destroySuggestion();
+  cursorOrigin = { x, y };
 
-  const pos = clampToScreen(x, y + 20, TOOLTIP_WIDTH, TOOLTIP_HEIGHT);
+  const pos = positionOnScreen(x, y, TOOLTIP_WIDTH, TOOLTIP_HEIGHT);
 
   suggestionWindow = new BrowserWindow({
     width: TOOLTIP_WIDTH,

From f0a7c7134a7e81a8ee202e854afbfc98d9ad182a Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 00:09:17 +0530
Subject: [PATCH 055/202] feat: move endpoint above to retrieve watched folders
 based on search space ID

---
 .../app/routes/documents_routes.py            | 60 ++++++++++---------
 1 file changed, 31 insertions(+), 29 deletions(-)

diff --git a/surfsense_backend/app/routes/documents_routes.py b/surfsense_backend/app/routes/documents_routes.py
index 81bbb1477..0acc1d30b 100644
--- a/surfsense_backend/app/routes/documents_routes.py
+++ b/surfsense_backend/app/routes/documents_routes.py
@@ -953,6 +953,37 @@ async def get_document_by_chunk_id(
         ) from e
 
 
+@router.get("/documents/watched-folders", response_model=list["FolderRead"])  # keep registered before /documents/{document_id}, which would otherwise capture this path
+async def get_watched_folders(
+    search_space_id: int,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """Return root folders that are marked as watched (metadata->>'watched' = 'true')."""
+    from app.schemas import FolderRead  # noqa: F811
+
+    await check_permission(
+        session,
+        user,
+        search_space_id,
+        Permission.DOCUMENTS_READ.value,
+        "You don't have permission to read documents in this search space",
+    )
+
+    folders = (
+        await session.execute(
+            select(Folder).where(
+                Folder.search_space_id == search_space_id,
+                Folder.parent_id.is_(None),  # root-level folders only
+                Folder.folder_metadata.isnot(None),
+                Folder.folder_metadata["watched"].astext == "true",  # JSON value compared as text
+            )
+        )
+    ).scalars().all()
+
+    return folders
+
+
 @router.get("/documents/{document_id}", response_model=DocumentRead)
 async def read_document(
     document_id: int,
@@ -1416,32 +1447,3 @@ async def folder_index_file(
     }
 
 
-@router.get("/documents/watched-folders", response_model=list["FolderRead"])
-async def get_watched_folders(
-    search_space_id: int,
-    session: AsyncSession = Depends(get_async_session),
-    user: User = Depends(current_active_user),
-):
-    """Return root folders that are marked as watched (metadata->>'watched' = 'true')."""
-    from app.schemas import FolderRead  # noqa: F811
-
-    await check_permission(
-        session,
-        user,
-        search_space_id,
-        Permission.DOCUMENTS_READ.value,
-        "You don't have permission to read documents in this search space",
-    )
-
-    folders = (
-        await session.execute(
-            select(Folder).where(
-                Folder.search_space_id == search_space_id,
-                Folder.parent_id.is_(None),
-                Folder.folder_metadata.isnot(None),
-                Folder.folder_metadata["watched"].astext == "true",
-            )
-        )
-    ).scalars().all()
-
-    return folders

From b46c5532b3fb02c3fd7277021d128e4f2f8a3180 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 00:28:24 +0530
Subject: [PATCH 056/202] feat: add unified file and folder browsing
 functionality with IPC channel integration

---
 surfsense_desktop/src/ipc/channels.ts         |   2 +
 surfsense_desktop/src/ipc/handlers.ts         |   8 +
 .../src/modules/folder-watcher.ts             |  68 +++++
 surfsense_desktop/src/preload.ts              |   4 +
 .../(manage)/components/DocumentsFilters.tsx  |  23 +-
 .../layout/ui/sidebar/DocumentsSidebar.tsx    |  51 +---
 .../components/sources/DocumentUploadTab.tsx  | 284 ++++++++++++++----
 surfsense_web/types/window.d.ts               |  15 +
 8 files changed, 335 insertions(+), 120 deletions(-)

diff --git a/surfsense_desktop/src/ipc/channels.ts b/surfsense_desktop/src/ipc/channels.ts
index 66788d90e..19c26607d 100644
--- a/surfsense_desktop/src/ipc/channels.ts
+++ b/surfsense_desktop/src/ipc/channels.ts
@@ -17,4 +17,6 @@ export const IPC_CHANNELS = {
   FOLDER_SYNC_PAUSE: 'folder-sync:pause',
   FOLDER_SYNC_RESUME: 'folder-sync:resume',
   FOLDER_SYNC_RENDERER_READY: 'folder-sync:renderer-ready',
+  BROWSE_FILE_OR_FOLDER: 'browse:file-or-folder',
+  READ_LOCAL_FILES: 'browse:read-local-files',
 } as const;
diff --git a/surfsense_desktop/src/ipc/handlers.ts b/surfsense_desktop/src/ipc/handlers.ts
index 19051e871..246f0f6ac 100644
--- a/surfsense_desktop/src/ipc/handlers.ts
+++ b/surfsense_desktop/src/ipc/handlers.ts
@@ -9,6 +9,8 @@ import {
   pauseWatcher,
   resumeWatcher,
   markRendererReady,
+  browseFileOrFolder,
+  readLocalFiles,
 } from '../modules/folder-watcher';
 
 export function registerIpcHandlers(): void {
@@ -49,4 +51,10 @@ export function registerIpcHandlers(): void {
   ipcMain.handle(IPC_CHANNELS.FOLDER_SYNC_RENDERER_READY, () => {
     markRendererReady();
   });
+
+  ipcMain.handle(IPC_CHANNELS.BROWSE_FILE_OR_FOLDER, () => browseFileOrFolder());
+
+  ipcMain.handle(IPC_CHANNELS.READ_LOCAL_FILES, (_event, paths: string[]) =>
+    readLocalFiles(paths)
+  );
 }
diff --git a/surfsense_desktop/src/modules/folder-watcher.ts b/surfsense_desktop/src/modules/folder-watcher.ts
index 81a835c22..1324858a0 100644
--- a/surfsense_desktop/src/modules/folder-watcher.ts
+++ b/surfsense_desktop/src/modules/folder-watcher.ts
@@ -391,3 +391,71 @@ export async function unregisterFolderWatcher(): Promise<void> {
   }
   watchers.clear();
 }
+
+export interface BrowseResult {
+  type: 'files' | 'folder'; // which kind of selection `paths` holds
+  paths: string[]; // paths returned by the open dialog; a single entry when type is 'folder'
+}
+
+/** Opens the native picker; resolves to one folder, a list of files, or null when cancelled. */
+export async function browseFileOrFolder(): Promise<BrowseResult | null> {
+  const result = await dialog.showOpenDialog({
+    properties: ['openFile', 'openDirectory', 'multiSelections'],
+    title: 'Select files or a folder',
+  });
+  if (result.canceled || result.filePaths.length === 0) return null;
+  // NOTE(review): per Electron docs, openFile + openDirectory together yields a directory-only picker on Windows/Linux.
+  const stats = await Promise.all(result.filePaths.map((p) => fs.promises.stat(p)));
+  if (stats[0].isDirectory()) return { type: 'folder', paths: [result.filePaths[0]] };
+  // First entry decides the kind; directories mixed into a file pick are dropped so they are never read as files.
+  return { type: 'files', paths: result.filePaths.filter((_, i) => !stats[i].isDirectory()) };
+}
+
+const MIME_MAP: Record<string, string> = { // lowercased extension (with dot) -> MIME type reported for a local file
+  '.pdf': 'application/pdf',
+  '.docx': 'application/vnd.openxmlformats-officedocument.wordprocessingml.document',
+  '.xlsx': 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet',
+  '.pptx': 'application/vnd.openxmlformats-officedocument.presentationml.presentation',
+  '.html': 'text/html', '.htm': 'text/html',
+  '.csv': 'text/csv',
+  '.txt': 'text/plain',
+  '.md': 'text/markdown', '.markdown': 'text/markdown',
+  '.mp3': 'audio/mpeg', '.mpeg': 'audio/mpeg', '.mpga': 'audio/mpeg',
+  '.mp4': 'audio/mp4', '.m4a': 'audio/mp4', // NOTE(review): .mp4 is mapped to an audio type — confirm intentional
+  '.wav': 'audio/wav',
+  '.webm': 'audio/webm', // NOTE(review): audio rather than video/webm — confirm intentional
+  '.jpg': 'image/jpeg', '.jpeg': 'image/jpeg',
+  '.png': 'image/png',
+  '.bmp': 'image/bmp',
+  '.webp': 'image/webp',
+  '.tiff': 'image/tiff',
+  '.doc': 'application/msword',
+  '.rtf': 'application/rtf',
+  '.xml': 'application/xml',
+  '.epub': 'application/epub+zip',
+  '.xls': 'application/vnd.ms-excel',
+  '.ppt': 'application/vnd.ms-powerpoint',
+  '.eml': 'message/rfc822',
+  '.odt': 'application/vnd.oasis.opendocument.text',
+  '.msg': 'application/vnd.ms-outlook',
+};
+
+export interface LocalFileData {
+  name: string; // file name without its directory (path.basename of the source path)
+  data: ArrayBuffer; // raw file contents
+  mimeType: string; // looked up from the extension in MIME_MAP, else 'application/octet-stream'
+  size: number; // byte length of the file contents
+}
+
+/** Synchronously loads each path's bytes, name, size and extension-based MIME type; read errors propagate. */
+export function readLocalFiles(filePaths: string[]): LocalFileData[] {
+  const loaded: LocalFileData[] = [];
+  for (const filePath of filePaths) {
+    const contents = fs.readFileSync(filePath);
+    // Slice to the Buffer's own window in case it is a view onto a larger ArrayBuffer.
+    const data = contents.buffer.slice(contents.byteOffset, contents.byteOffset + contents.byteLength);
+    const mimeType = MIME_MAP[path.extname(filePath).toLowerCase()] || 'application/octet-stream';
+    loaded.push({ name: path.basename(filePath), data, mimeType, size: contents.byteLength });
+  }
+  return loaded;
+}
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 7c190db10..08ca87f8f 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -45,4 +45,8 @@ contextBridge.exposeInMainWorld('electronAPI', {
   pauseWatcher: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_PAUSE),
   resumeWatcher: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_RESUME),
   signalRendererReady: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_RENDERER_READY),
+
+  // Unified browse (files + folders)
+  browseFileOrFolder: () => ipcRenderer.invoke(IPC_CHANNELS.BROWSE_FILE_OR_FOLDER),
+  readLocalFiles: (paths: string[]) => ipcRenderer.invoke(IPC_CHANNELS.READ_LOCAL_FILES, paths),
 });
diff --git a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
index fcd3a39da..150c119de 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { Eye, FolderPlus, ListFilter, Search, Upload, X } from "lucide-react";
+import { FolderPlus, ListFilter, Search, Upload, X } from "lucide-react";
 import { useTranslations } from "next-intl";
 import React, { useCallback, useMemo, useRef, useState } from "react";
 import { useDocumentUploadDialog } from "@/components/assistant-ui/document-upload-popup";
@@ -19,7 +19,6 @@ export function DocumentsFilters({
 	onToggleType,
 	activeTypes,
 	onCreateFolder,
-	onWatchFolder,
 }: {
 	typeCounts: Partial<Record<DocumentTypeEnum, number>>;
 	onSearch: (v: string) => void;
@@ -27,7 +26,6 @@ export function DocumentsFilters({
 	onToggleType: (type: DocumentTypeEnum, checked: boolean) => void;
 	activeTypes: DocumentTypeEnum[];
 	onCreateFolder?: () => void;
-	onWatchFolder?: () => void;
 }) {
 	const t = useTranslations("documents");
 	const id = React.useId();
@@ -216,24 +214,7 @@ export function DocumentsFilters({
 					</Tooltip>
 				)}
 
-			{/* Watch Folder Button (desktop only) */}
-			{onWatchFolder && (
-				<Tooltip>
-					<TooltipTrigger asChild>
-						<Button
-							variant="outline"
-							size="icon"
-							className="h-9 w-9 shrink-0 border-dashed border-sidebar-border text-sidebar-foreground/60 hover:text-sidebar-foreground hover:border-sidebar-border bg-sidebar"
-							onClick={onWatchFolder}
-						>
-							<Eye size={14} />
-						</Button>
-					</TooltipTrigger>
-					<TooltipContent>Watch folder</TooltipContent>
-				</Tooltip>
-			)}
-
-			{/* Upload Button */}
+		{/* Upload Button */}
 			<Button
 				data-joyride="upload-button"
 				onClick={openUploadDialog}
diff --git a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
index f9d32bf98..ed3a78786 100644
--- a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
@@ -279,40 +279,6 @@ export function DocumentsSidebar({
 
 	const isElectron = typeof window !== "undefined" && !!window.electronAPI;
 
-	const handleWatchFolder = useCallback(async () => {
-		const api = window.electronAPI;
-		if (!api) return;
-
-		const folderPath = await api.selectFolder();
-		if (!folderPath) return;
-
-		const folderName = folderPath.split("/").pop() || folderPath.split("\\").pop() || folderPath;
-
-		try {
-			const result = await documentsApiService.folderIndex(searchSpaceId, {
-				folder_path: folderPath,
-				folder_name: folderName,
-				search_space_id: searchSpaceId,
-			});
-
-			const rootFolderId = (result as { root_folder_id?: number })?.root_folder_id ?? null;
-
-			await api.addWatchedFolder({
-				path: folderPath,
-				name: folderName,
-				excludePatterns: [".git", "node_modules", "__pycache__", ".DS_Store", ".obsidian", ".trash"],
-				fileExtensions: null,
-				rootFolderId,
-				searchSpaceId,
-				active: true,
-			});
-
-			toast.success(`Watching folder: ${folderName}`);
-		} catch (err) {
-			toast.error((err as Error)?.message || "Failed to watch folder");
-		}
-	}, [searchSpaceId]);
-
 	const handleRescanFolder = useCallback(
 		async (folder: FolderDisplay) => {
 			const api = window.electronAPI;
@@ -795,15 +761,14 @@ export function DocumentsSidebar({
 
 			<div className="flex-1 min-h-0 overflow-x-hidden pt-0 flex flex-col">
 				<div className="px-4 pb-2">
-				<DocumentsFilters
-					typeCounts={typeCounts}
-					onSearch={setSearch}
-					searchValue={search}
-					onToggleType={onToggleType}
-					activeTypes={activeTypes}
-					onCreateFolder={() => handleCreateFolder(null)}
-					onWatchFolder={isElectron ? handleWatchFolder : undefined}
-				/>
+			<DocumentsFilters
+				typeCounts={typeCounts}
+				onSearch={setSearch}
+				searchValue={search}
+				onToggleType={onToggleType}
+				activeTypes={activeTypes}
+				onCreateFolder={() => handleCreateFolder(null)}
+			/>
 				</div>
 
 				{deletableSelectedIds.length > 0 && (
diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index 6817b19db..3fdf576b5 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { useAtom } from "jotai";
-import { CheckCircle2, FileType, Info, Upload, X } from "lucide-react";
+import { CheckCircle2, FileType, FolderOpen, Info, Upload, X } from "lucide-react";
 
 import { useTranslations } from "next-intl";
 import { useCallback, useMemo, useRef, useState } from "react";
@@ -19,9 +19,12 @@ import { Alert, AlertDescription } from "@/components/ui/alert";
 import { Badge } from "@/components/ui/badge";
 import { Button } from "@/components/ui/button";
 import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
+import { Label } from "@/components/ui/label";
 import { Progress } from "@/components/ui/progress";
 import { Separator } from "@/components/ui/separator";
 import { Spinner } from "@/components/ui/spinner";
+import { Switch } from "@/components/ui/switch";
+import { documentsApiService } from "@/lib/apis/documents-api.service";
 import {
 	trackDocumentUploadFailure,
 	trackDocumentUploadStarted,
@@ -29,6 +32,11 @@ import {
 } from "@/lib/posthog/events";
 import { GridPattern } from "./GridPattern";
 
+interface SelectedFolder {
+	path: string; // folder path as returned by the desktop browse dialog
+	name: string; // display name derived from the path; shown as the folder card title
+}
+
 interface DocumentUploadTabProps {
 	searchSpaceId: string;
 	onSuccess?: () => void;
@@ -135,6 +143,11 @@ export function DocumentUploadTab({
 	const { mutate: uploadDocuments, isPending: isUploading } = uploadDocumentMutation;
 	const fileInputRef = useRef<HTMLInputElement>(null);
 
+	const [selectedFolder, setSelectedFolder] = useState<SelectedFolder | null>(null);
+	const [watchFolder, setWatchFolder] = useState(true);
+	const [folderSubmitting, setFolderSubmitting] = useState(false);
+	const isElectron = typeof window !== "undefined" && !!window.electronAPI?.browseFileOrFolder;
+
 	const acceptedFileTypes = useMemo(() => {
 		const etlService = process.env.NEXT_PUBLIC_ETL_SERVICE;
 		return FILE_TYPE_CONFIG[etlService || "default"] || FILE_TYPE_CONFIG.default;
@@ -147,6 +160,7 @@ export function DocumentUploadTab({
 
 	const onDrop = useCallback(
 		(acceptedFiles: File[]) => {
+			setSelectedFolder(null);
 			setFiles((prev) => {
 				const newEntries = acceptedFiles.map((f) => ({
 					id: crypto.randomUUID?.() ?? `file-${Date.now()}-${Math.random().toString(36)}`,
@@ -179,15 +193,60 @@ export function DocumentUploadTab({
 		onDrop,
 		accept: acceptedFileTypes,
 		maxSize: 50 * 1024 * 1024, // 50MB per file
-		noClick: false,
+		noClick: !isElectron,
 		disabled: files.length >= MAX_FILES,
 	});
 
-	// Handle file input click to prevent event bubbling that might reopen dialog
 	const handleFileInputClick = useCallback((e: React.MouseEvent<HTMLInputElement>) => {
 		e.stopPropagation();
 	}, []);
 
+	// Desktop browse: opens the native picker and stages either one folder or a list of files for upload.
+	const handleBrowse = useCallback(async (e: React.MouseEvent) => {
+		e.stopPropagation();
+		e.preventDefault();
+		const api = window.electronAPI;
+		if (!api?.browseFileOrFolder) {
+			fileInputRef.current?.click();
+			return;
+		}
+
+		const result = await api.browseFileOrFolder();
+		if (!result) return;
+		if (result.type === "folder") {
+			const folderPath = result.paths[0];
+			// Split on both separators and skip empty segments so Windows paths and trailing slashes still yield a name.
+			const folderName = folderPath.split(/[\\/]/).filter(Boolean).pop() || folderPath;
+			setFiles([]);
+			setSelectedFolder({ path: folderPath, name: folderName });
+			setWatchFolder(true);
+		} else {
+			setSelectedFolder(null);
+			const fileDataList = await api.readLocalFiles(result.paths);
+			const newFiles: FileWithId[] = fileDataList.map((fd) => ({
+				id: crypto.randomUUID?.() ?? `file-${Date.now()}-${Math.random().toString(36)}`,
+				file: new File([fd.data], fd.name, { type: fd.mimeType }),
+			}));
+			setFiles((prev) => {
+				const merged = [...prev, ...newFiles];
+				if (merged.length > MAX_FILES) {
+					toast.error(t("max_files_exceeded"), {
+						description: t("max_files_exceeded_desc", { max: MAX_FILES }),
+					});
+					return prev;
+				}
+				const totalSize = merged.reduce((sum, e) => sum + e.file.size, 0);
+				if (totalSize > MAX_TOTAL_SIZE_BYTES) {
+					toast.error(t("max_size_exceeded"), {
+						description: t("max_size_exceeded_desc", { max: MAX_TOTAL_SIZE_MB }),
+					});
+					return prev;
+				}
+				return merged;
+			});
+		}
+	}, [t]);
+
 	const formatFileSize = (bytes: number) => {
 		if (bytes === 0) return "0 Bytes";
 		const k = 1024;
@@ -198,7 +257,6 @@ export function DocumentUploadTab({
 
 	const totalFileSize = files.reduce((total, entry) => total + entry.file.size, 0);
 
-	// Check if limits are reached
 	const isFileCountLimitReached = files.length >= MAX_FILES;
 	const isSizeLimitReached = totalFileSize >= MAX_TOTAL_SIZE_BYTES;
 	const remainingFiles = MAX_FILES - files.length;
@@ -207,7 +265,6 @@ export function DocumentUploadTab({
 		(MAX_TOTAL_SIZE_BYTES - totalFileSize) / (1024 * 1024)
 	).toFixed(1);
 
-	// Track accordion state changes
 	const handleAccordionChange = useCallback(
 		(value: string) => {
 			setAccordionValue(value);
@@ -216,6 +273,46 @@ export function DocumentUploadTab({
 		[onAccordionStateChange]
 	);
 
+	// Starts backend indexing for the selected folder and, when the toggle is on, registers a desktop watcher for it.
+	const handleFolderSubmit = useCallback(async () => {
+		if (!selectedFolder) return;
+		const api = window.electronAPI;
+		if (!api) return;
+		// The prop is a string; convert once so the request body gets the same numeric id as the other calls.
+		const spaceId = Number(searchSpaceId);
+
+		setFolderSubmitting(true);
+		try {
+			const result = await documentsApiService.folderIndex(spaceId, {
+				folder_path: selectedFolder.path,
+				folder_name: selectedFolder.name,
+				search_space_id: spaceId,
+				enable_summary: shouldSummarize,
+			});
+			const rootFolderId = (result as { root_folder_id?: number })?.root_folder_id ?? null;
+			if (watchFolder) {
+				await api.addWatchedFolder({
+					path: selectedFolder.path,
+					name: selectedFolder.name,
+					excludePatterns: [".git", "node_modules", "__pycache__", ".DS_Store", ".obsidian", ".trash"],
+					fileExtensions: null,
+					rootFolderId,
+					searchSpaceId: spaceId,
+					active: true,
+				});
+				toast.success(`Watching folder: ${selectedFolder.name}`);
+			} else {
+				toast.success(`Indexing folder: ${selectedFolder.name}`);
+			}
+			setSelectedFolder(null);
+			onSuccess?.();
+		} catch (err) {
+			toast.error((err as Error)?.message || "Failed to process folder");
+		} finally {
+			setFolderSubmitting(false);
+		}
+	}, [selectedFolder, watchFolder, searchSpaceId, shouldSummarize, onSuccess]);
+
 	const handleUpload = async () => {
 		setUploadProgress(0);
 		trackDocumentUploadStarted(Number(searchSpaceId), files.length, totalFileSize);
@@ -262,58 +359,68 @@ export function DocumentUploadTab({
 				</AlertDescription>
 			</Alert>
 
-			<Card className={`relative overflow-hidden ${cardClass}`}>
-				<div className="absolute inset-0 [mask-image:radial-gradient(ellipse_at_center,white,transparent)] opacity-30">
-					<GridPattern />
-				</div>
-				<CardContent className="p-4 sm:p-10 relative z-10">
-					<div
-						{...getRootProps()}
-						className={`flex flex-col items-center justify-center min-h-[200px] sm:min-h-[300px] border-2 border-dashed rounded-lg transition-colors ${
-							isFileCountLimitReached || isSizeLimitReached
-								? "border-destructive/50 bg-destructive/5 cursor-not-allowed"
-								: "border-border hover:border-primary/50 cursor-pointer"
-						}`}
-					>
-						<input
-							{...getInputProps()}
-							ref={fileInputRef}
-							className="hidden"
-							onClick={handleFileInputClick}
-						/>
-						{isFileCountLimitReached ? (
-							<div className="flex flex-col items-center gap-2 sm:gap-4 text-center px-4">
-								<Upload className="h-8 w-8 sm:h-12 sm:w-12 text-destructive/70" />
-								<div>
-									<p className="text-sm sm:text-lg font-medium text-destructive">
-										{t("file_limit_reached")}
-									</p>
-									<p className="text-xs sm:text-sm text-muted-foreground mt-1">
-										{t("file_limit_reached_desc", { max: MAX_FILES })}
-									</p>
-								</div>
+		<Card className={`relative overflow-hidden ${cardClass}`}>
+			<div className="absolute inset-0 [mask-image:radial-gradient(ellipse_at_center,white,transparent)] opacity-30">
+				<GridPattern />
+			</div>
+			<CardContent className="p-4 sm:p-10 relative z-10">
+				<div
+					{...getRootProps()}
+					className={`flex flex-col items-center justify-center min-h-[200px] sm:min-h-[300px] border-2 border-dashed rounded-lg transition-colors ${
+						isFileCountLimitReached || isSizeLimitReached
+							? "border-destructive/50 bg-destructive/5 cursor-not-allowed"
+							: "border-border hover:border-primary/50 cursor-pointer"
+					}`}
+				>
+					<input
+						{...getInputProps()}
+						ref={fileInputRef}
+						className="hidden"
+						onClick={handleFileInputClick}
+					/>
+					{isFileCountLimitReached ? (
+						<div className="flex flex-col items-center gap-2 sm:gap-4 text-center px-4">
+							<Upload className="h-8 w-8 sm:h-12 sm:w-12 text-destructive/70" />
+							<div>
+								<p className="text-sm sm:text-lg font-medium text-destructive">
+									{t("file_limit_reached")}
+								</p>
+								<p className="text-xs sm:text-sm text-muted-foreground mt-1">
+									{t("file_limit_reached_desc", { max: MAX_FILES })}
+								</p>
 							</div>
-						) : isDragActive ? (
-							<div className="flex flex-col items-center gap-2 sm:gap-4">
-								<Upload className="h-8 w-8 sm:h-12 sm:w-12 text-primary" />
-								<p className="text-sm sm:text-lg font-medium text-primary">{t("drop_files")}</p>
+						</div>
+					) : isDragActive ? (
+						<div className="flex flex-col items-center gap-2 sm:gap-4">
+							<Upload className="h-8 w-8 sm:h-12 sm:w-12 text-primary" />
+							<p className="text-sm sm:text-lg font-medium text-primary">{t("drop_files")}</p>
+						</div>
+					) : (
+						<div className="flex flex-col items-center gap-2 sm:gap-4">
+							<Upload className="h-8 w-8 sm:h-12 sm:w-12 text-muted-foreground" />
+							<div className="text-center">
+								<p className="text-sm sm:text-lg font-medium">{t("drag_drop")}</p>
+								<p className="text-xs sm:text-sm text-muted-foreground mt-1">{t("or_browse")}</p>
 							</div>
-						) : (
-							<div className="flex flex-col items-center gap-2 sm:gap-4">
-								<Upload className="h-8 w-8 sm:h-12 sm:w-12 text-muted-foreground" />
-								<div className="text-center">
-									<p className="text-sm sm:text-lg font-medium">{t("drag_drop")}</p>
-									<p className="text-xs sm:text-sm text-muted-foreground mt-1">{t("or_browse")}</p>
-								</div>
-								{files.length > 0 && (
-									<p className="text-xs text-muted-foreground">
-										{t("remaining_capacity", { files: remainingFiles, sizeMB: remainingSizeMB })}
-									</p>
-								)}
-							</div>
-						)}
-						{!isFileCountLimitReached && (
-							<div className="mt-2 sm:mt-4">
+							{files.length > 0 && (
+								<p className="text-xs text-muted-foreground">
+									{t("remaining_capacity", { files: remainingFiles, sizeMB: remainingSizeMB })}
+								</p>
+							)}
+						</div>
+					)}
+					{!isFileCountLimitReached && (
+						<div className="mt-2 sm:mt-4">
+							{isElectron ? (
+								<Button
+									variant="secondary"
+									size="sm"
+									className="text-xs sm:text-sm"
+									onClick={handleBrowse}
+								>
+									{t("browse_files")}
+								</Button>
+							) : (
 								<Button
 									variant="secondary"
 									size="sm"
@@ -326,11 +433,76 @@ export function DocumentUploadTab({
 								>
 									{t("browse_files")}
 								</Button>
+							)}
+						</div>
+					)}
+				</div>
+			</CardContent>
+		</Card>
+
+		{selectedFolder && (
+			<Card className={cardClass}>
+				<CardHeader className="p-4 sm:p-6">
+					<div className="flex items-center justify-between gap-2">
+						<div className="flex items-center gap-3 min-w-0 flex-1">
+							<FolderOpen className="h-5 w-5 text-primary flex-shrink-0" />
+							<div className="min-w-0 flex-1">
+								<CardTitle className="text-base sm:text-lg truncate">
+									{selectedFolder.name}
+								</CardTitle>
+								<CardDescription className="text-xs sm:text-sm truncate">
+									{selectedFolder.path}
+								</CardDescription>
 							</div>
-						)}
+						</div>
+						<Button
+							variant="ghost"
+							size="icon"
+							className="h-8 w-8 shrink-0"
+							onClick={() => setSelectedFolder(null)}
+							disabled={folderSubmitting}
+						>
+							<X className="h-4 w-4" />
+						</Button>
 					</div>
+				</CardHeader>
+				<CardContent className="p-4 sm:p-6 pt-0 space-y-4">
+					<div className="flex items-center justify-between rounded-lg border border-border p-3">
+						<Label htmlFor="watch-folder-toggle" className="flex flex-col gap-1 cursor-pointer">
+							<span className="text-sm font-medium">Watch folder</span>
+							<span className="text-xs text-muted-foreground font-normal">
+								Automatically sync changes when files are added, edited, or removed
+							</span>
+						</Label>
+						<Switch
+							id="watch-folder-toggle"
+							checked={watchFolder}
+							onCheckedChange={setWatchFolder}
+						/>
+					</div>
+
+					<SummaryConfig enabled={shouldSummarize} onEnabledChange={setShouldSummarize} />
+
+					<Button
+						className="w-full py-3 sm:py-6 text-xs sm:text-base font-medium"
+						onClick={handleFolderSubmit}
+						disabled={folderSubmitting}
+					>
+						{folderSubmitting ? (
+							<span className="flex items-center gap-2">
+								<Spinner size="sm" />
+								Processing...
+							</span>
+						) : (
+							<span className="flex items-center gap-2">
+								<CheckCircle2 className="h-4 w-4 sm:h-5 sm:w-5" />
+								{watchFolder ? "Watch & Index Folder" : "Index Folder"}
+							</span>
+						)}
+					</Button>
 				</CardContent>
 			</Card>
+		)}
 
 			{files.length > 0 && (
 				<Card className={cardClass}>
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index b399664d6..826a575c7 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -26,6 +26,18 @@ interface FolderSyncWatcherReadyEvent {
 	folderPath: string;
 }
 
+interface BrowseResult {
+	type: "files" | "folder"; // which kind of selection `paths` holds
+	paths: string[]; // selected paths as reported by the desktop app
+}
+
+interface LocalFileData {
+	name: string; // file name to give the reconstructed File
+	data: ArrayBuffer; // raw file contents received over IPC
+	mimeType: string; // MIME type chosen by the desktop app for this file
+	size: number; // size in bytes as reported by the desktop app
+}
+
 interface ElectronAPI {
 	versions: {
 		electron: string;
@@ -51,6 +63,9 @@ interface ElectronAPI {
 	pauseWatcher: () => Promise<void>;
 	resumeWatcher: () => Promise<void>;
 	signalRendererReady: () => Promise<void>;
+	// Unified browse
+	browseFileOrFolder: () => Promise<BrowseResult | null>;
+	readLocalFiles: (paths: string[]) => Promise<LocalFileData[]>;
 }
 
 declare global {

From e0b35cfbabe43add555771e19166558376b30ff7 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 00:40:49 +0530
Subject: [PATCH 057/202] feat: implement pending file event handling using
 durable queue with acknowledgment support in folder synchronization

---
 surfsense_desktop/src/ipc/channels.ts         |   2 +
 surfsense_desktop/src/ipc/handlers.ts         |  10 ++
 .../src/modules/folder-watcher.ts             | 111 +++++++++++++++---
 surfsense_desktop/src/preload.ts              |   2 +
 surfsense_web/hooks/use-folder-sync.ts        |  82 +++++++++----
 surfsense_web/types/window.d.ts               |   3 +
 6 files changed, 175 insertions(+), 35 deletions(-)

diff --git a/surfsense_desktop/src/ipc/channels.ts b/surfsense_desktop/src/ipc/channels.ts
index 19c26607d..2761960f7 100644
--- a/surfsense_desktop/src/ipc/channels.ts
+++ b/surfsense_desktop/src/ipc/channels.ts
@@ -17,6 +17,8 @@ export const IPC_CHANNELS = {
   FOLDER_SYNC_PAUSE: 'folder-sync:pause',
   FOLDER_SYNC_RESUME: 'folder-sync:resume',
   FOLDER_SYNC_RENDERER_READY: 'folder-sync:renderer-ready',
+  FOLDER_SYNC_GET_PENDING_EVENTS: 'folder-sync:get-pending-events',
+  FOLDER_SYNC_ACK_EVENTS: 'folder-sync:ack-events',
   BROWSE_FILE_OR_FOLDER: 'browse:file-or-folder',
   READ_LOCAL_FILES: 'browse:read-local-files',
 } as const;
diff --git a/surfsense_desktop/src/ipc/handlers.ts b/surfsense_desktop/src/ipc/handlers.ts
index 246f0f6ac..7194aaaff 100644
--- a/surfsense_desktop/src/ipc/handlers.ts
+++ b/surfsense_desktop/src/ipc/handlers.ts
@@ -6,6 +6,8 @@ import {
   removeWatchedFolder,
   getWatchedFolders,
   getWatcherStatus,
+  getPendingFileEvents,
+  acknowledgeFileEvents,
   pauseWatcher,
   resumeWatcher,
   markRendererReady,
@@ -52,6 +54,14 @@ export function registerIpcHandlers(): void {
     markRendererReady();
   });
 
+  ipcMain.handle(IPC_CHANNELS.FOLDER_SYNC_GET_PENDING_EVENTS, () =>
+    getPendingFileEvents()
+  );
+
+  ipcMain.handle(IPC_CHANNELS.FOLDER_SYNC_ACK_EVENTS, (_event, eventIds: string[]) =>
+    acknowledgeFileEvents(eventIds)
+  );
+
   ipcMain.handle(IPC_CHANNELS.BROWSE_FILE_OR_FOLDER, () => browseFileOrFolder());
 
   ipcMain.handle(IPC_CHANNELS.READ_LOCAL_FILES, (_event, paths: string[]) =>
diff --git a/surfsense_desktop/src/modules/folder-watcher.ts b/surfsense_desktop/src/modules/folder-watcher.ts
index 1324858a0..9cbdd9775 100644
--- a/surfsense_desktop/src/modules/folder-watcher.ts
+++ b/surfsense_desktop/src/modules/folder-watcher.ts
@@ -1,5 +1,6 @@
 import { BrowserWindow, dialog } from 'electron';
 import chokidar, { type FSWatcher } from 'chokidar';
+import { randomUUID } from 'crypto';
 import * as path from 'path';
 import * as fs from 'fs';
 import { IPC_CHANNELS } from '../ipc/channels';
@@ -20,12 +21,27 @@ interface WatcherEntry {
 }
 
 type MtimeMap = Record<string, number>;
+type FolderSyncAction = 'add' | 'change' | 'unlink';
+
+export interface FolderSyncFileChangedEvent {
+  id: string;
+  rootFolderId: number | null;
+  searchSpaceId: number;
+  folderPath: string;
+  folderName: string;
+  relativePath: string;
+  fullPath: string;
+  action: FolderSyncAction;
+  timestamp: number;
+}
 
 const STORE_KEY = 'watchedFolders';
+const OUTBOX_STORE_KEY = 'events';
 const MTIME_TOLERANCE_S = 1.0;
 
 let store: any = null;
 let mtimeStore: any = null;
+let outboxStore: any = null;
 let watchers: Map<string, WatcherEntry> = new Map();
 
 /**
@@ -35,22 +51,11 @@ let watchers: Map<string, WatcherEntry> = new Map();
 const mtimeMaps: Map<string, MtimeMap> = new Map();
 
 let rendererReady = false;
-const pendingEvents: any[] = [];
+const outboxEvents: Map<string, FolderSyncFileChangedEvent> = new Map();
+let outboxLoaded = false;
 
 export function markRendererReady() {
   rendererReady = true;
-  for (const event of pendingEvents) {
-    sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, event);
-  }
-  pendingEvents.length = 0;
-}
-
-function sendFileChangedEvent(data: any) {
-  if (rendererReady) {
-    sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, data);
-  } else {
-    pendingEvents.push(data);
-  }
 }
 
 async function getStore() {
@@ -77,6 +82,57 @@ async function getMtimeStore() {
   return mtimeStore;
 }
 
+async function getOutboxStore() {
+  if (!outboxStore) {
+    const { default: Store } = await import('electron-store');
+    outboxStore = new Store({
+      name: 'folder-sync-outbox',
+      defaults: {
+        [OUTBOX_STORE_KEY]: [] as FolderSyncFileChangedEvent[],
+      },
+    });
+  }
+  return outboxStore;
+}
+
+function makeEventKey(event: Pick<FolderSyncFileChangedEvent, 'folderPath' | 'relativePath'>): string {
+  return `${event.folderPath}:${event.relativePath}`;
+}
+
+function persistOutbox() {
+  getOutboxStore().then((s) => {
+    s.set(OUTBOX_STORE_KEY, Array.from(outboxEvents.values()));
+  });
+}
+
+async function loadOutbox() {
+  if (outboxLoaded) return;
+  const s = await getOutboxStore();
+  const stored: FolderSyncFileChangedEvent[] = s.get(OUTBOX_STORE_KEY, []);
+  outboxEvents.clear();
+  for (const event of stored) {
+    if (!event?.id || !event.folderPath || !event.relativePath) continue;
+    outboxEvents.set(makeEventKey(event), event);
+  }
+  outboxLoaded = true;
+}
+
+function sendFileChangedEvent(
+  data: Omit<FolderSyncFileChangedEvent, 'id'>
+) {
+  const event: FolderSyncFileChangedEvent = {
+    id: randomUUID(),
+    ...data,
+  };
+
+  outboxEvents.set(makeEventKey(event), event);
+  persistOutbox();
+
+  if (rendererReady) {
+    sendToRenderer(IPC_CHANNELS.FOLDER_SYNC_FILE_CHANGED, event);
+  }
+}
+
 function loadMtimeMap(folderPath: string): MtimeMap {
   return mtimeMaps.get(folderPath) ?? {};
 }
@@ -235,7 +291,7 @@ async function startWatcher(config: WatchedFolderConfig) {
     });
   });
 
-  const handleFileEvent = (filePath: string, action: string) => {
+  const handleFileEvent = (filePath: string, action: FolderSyncAction) => {
     if (!ready) return;
 
     const relativePath = path.relative(config.path, filePath);
@@ -357,6 +413,32 @@ export async function getWatcherStatus(): Promise<
   }));
 }
 
+export async function getPendingFileEvents(): Promise<FolderSyncFileChangedEvent[]> {
+  await loadOutbox();
+  return Array.from(outboxEvents.values()).sort((a, b) => a.timestamp - b.timestamp);
+}
+
+export async function acknowledgeFileEvents(eventIds: string[]): Promise<{ acknowledged: number }> {
+  if (!eventIds || eventIds.length === 0) return { acknowledged: 0 };
+  await loadOutbox();
+
+  const ackSet = new Set(eventIds);
+  let acknowledged = 0;
+
+  for (const [key, event] of outboxEvents.entries()) {
+    if (ackSet.has(event.id)) {
+      outboxEvents.delete(key);
+      acknowledged += 1;
+    }
+  }
+
+  if (acknowledged > 0) {
+    persistOutbox();
+  }
+
+  return { acknowledged };
+}
+
 export async function pauseWatcher(): Promise<void> {
   for (const [, entry] of watchers) {
     if (entry.watcher) {
@@ -375,6 +457,7 @@ export async function resumeWatcher(): Promise<void> {
 }
 
 export async function registerFolderWatcher(): Promise<void> {
+  await loadOutbox();
   const s = await getStore();
   const folders: WatchedFolderConfig[] = s.get(STORE_KEY, []);
 
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 08ca87f8f..6a2610dc8 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -45,6 +45,8 @@ contextBridge.exposeInMainWorld('electronAPI', {
   pauseWatcher: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_PAUSE),
   resumeWatcher: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_RESUME),
   signalRendererReady: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_RENDERER_READY),
+  getPendingFileEvents: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_GET_PENDING_EVENTS),
+  acknowledgeFileEvents: (eventIds: string[]) => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_ACK_EVENTS, eventIds),
 
   // Unified browse (files + folders)
   browseFileOrFolder: () => ipcRenderer.invoke(IPC_CHANNELS.BROWSE_FILE_OR_FOLDER),
diff --git a/surfsense_web/hooks/use-folder-sync.ts b/surfsense_web/hooks/use-folder-sync.ts
index f051b7df6..59c061afb 100644
--- a/surfsense_web/hooks/use-folder-sync.ts
+++ b/surfsense_web/hooks/use-folder-sync.ts
@@ -4,6 +4,7 @@ import { useEffect, useRef } from "react";
 import { documentsApiService } from "@/lib/apis/documents-api.service";
 
 interface FileChangedEvent {
+	id: string;
 	rootFolderId: number | null;
 	searchSpaceId: number;
 	folderPath: string;
@@ -15,25 +16,35 @@ interface FileChangedEvent {
 }
 
 const DEBOUNCE_MS = 2000;
+interface QueueItem {
+	event: FileChangedEvent;
+	ackIds: string[];
+}
 
 export function useFolderSync() {
-	const queueRef = useRef<FileChangedEvent[]>([]);
+	const queueRef = useRef<QueueItem[]>([]);
 	const processingRef = useRef(false);
 	const debounceTimers = useRef<Map<string, ReturnType<typeof setTimeout>>>(new Map());
+	const pendingByKey = useRef<Map<string, QueueItem>>(new Map());
+	const isMountedRef = useRef(false);
 
 	async function processQueue() {
 		if (processingRef.current) return;
 		processingRef.current = true;
 		while (queueRef.current.length > 0) {
-			const event = queueRef.current.shift()!;
+			const item = queueRef.current.shift()!;
 			try {
-				await documentsApiService.folderIndexFile(event.searchSpaceId, {
-					folder_path: event.folderPath,
-					folder_name: event.folderName,
-					search_space_id: event.searchSpaceId,
-					target_file_path: event.fullPath,
-					root_folder_id: event.rootFolderId,
+				await documentsApiService.folderIndexFile(item.event.searchSpaceId, {
+					folder_path: item.event.folderPath,
+					folder_name: item.event.folderName,
+					search_space_id: item.event.searchSpaceId,
+					target_file_path: item.event.fullPath,
+					root_folder_id: item.event.rootFolderId,
 				});
+				const api = typeof window !== "undefined" ? window.electronAPI : null;
+				if (api?.acknowledgeFileEvents && item.ackIds.length > 0) {
+					await api.acknowledgeFileEvents(item.ackIds);
+				}
 			} catch (err) {
 				console.error("[FolderSync] Failed to trigger re-index:", err);
 			}
@@ -41,34 +52,63 @@ export function useFolderSync() {
 		processingRef.current = false;
 	}
 
+	function enqueueWithDebounce(event: FileChangedEvent) {
+		const key = `${event.folderPath}:${event.relativePath}`;
+		const existing = pendingByKey.current.get(key);
+		const ackSet = new Set(existing?.ackIds ?? []);
+		ackSet.add(event.id);
+		pendingByKey.current.set(key, {
+			event,
+			ackIds: Array.from(ackSet),
+		});
+
+		const existingTimeout = debounceTimers.current.get(key);
+		if (existingTimeout) clearTimeout(existingTimeout);
+
+		const timeout = setTimeout(() => {
+			debounceTimers.current.delete(key);
+			const pending = pendingByKey.current.get(key);
+			if (!pending) return;
+			pendingByKey.current.delete(key);
+			queueRef.current.push(pending);
+			processQueue();
+		}, DEBOUNCE_MS);
+
+		debounceTimers.current.set(key, timeout);
+	}
+
 	useEffect(() => {
+		isMountedRef.current = true;
 		const api = typeof window !== "undefined" ? window.electronAPI : null;
-		if (!api?.onFileChanged) return;
+		if (!api?.onFileChanged) {
+			return () => {
+				isMountedRef.current = false;
+			};
+		}
 
 		// Signal to main process that the renderer is ready to receive events
 		api.signalRendererReady?.();
 
+		// Drain durable outbox first so events survive renderer startup gaps and restarts
+		void api.getPendingFileEvents?.().then((pendingEvents) => {
+			if (!isMountedRef.current || !pendingEvents?.length) return;
+			for (const event of pendingEvents) {
+				enqueueWithDebounce(event);
+			}
+		});
+
 		const cleanup = api.onFileChanged((event: FileChangedEvent) => {
-			const key = `${event.folderPath}:${event.fullPath}`;
-
-			const existing = debounceTimers.current.get(key);
-			if (existing) clearTimeout(existing);
-
-			const timeout = setTimeout(() => {
-				debounceTimers.current.delete(key);
-				queueRef.current.push(event);
-				processQueue();
-			}, DEBOUNCE_MS);
-
-			debounceTimers.current.set(key, timeout);
+			enqueueWithDebounce(event);
 		});
 
 		return () => {
+			isMountedRef.current = false;
 			cleanup();
 			for (const timeout of debounceTimers.current.values()) {
 				clearTimeout(timeout);
 			}
 			debounceTimers.current.clear();
+			pendingByKey.current.clear();
 		};
 	}, []);
 }
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 826a575c7..719373e02 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -11,6 +11,7 @@ interface WatchedFolderConfig {
 }
 
 interface FolderSyncFileChangedEvent {
+	id: string;
 	rootFolderId: number | null;
 	searchSpaceId: number;
 	folderPath: string;
@@ -63,6 +64,8 @@ interface ElectronAPI {
 	pauseWatcher: () => Promise<void>;
 	resumeWatcher: () => Promise<void>;
 	signalRendererReady: () => Promise<void>;
+	getPendingFileEvents: () => Promise<FolderSyncFileChangedEvent[]>;
+	acknowledgeFileEvents: (eventIds: string[]) => Promise<{ acknowledged: number }>;
 	// Unified browse
 	browseFileOrFolder: () => Promise<BrowseResult | null>;
 	readLocalFiles: (paths: string[]) => Promise<LocalFileData[]>;

From a99d999a3658c09ce133940cc0dd15a3353d6cd7 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Thu, 2 Apr 2026 21:29:05 +0200
Subject: [PATCH 058/202] fix: correct preload.js path after autocomplete
 module restructure

---
 surfsense_desktop/src/modules/autocomplete/suggestion-window.ts | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/surfsense_desktop/src/modules/autocomplete/suggestion-window.ts b/surfsense_desktop/src/modules/autocomplete/suggestion-window.ts
index e8a2f3a91..8f61b2901 100644
--- a/surfsense_desktop/src/modules/autocomplete/suggestion-window.ts
+++ b/surfsense_desktop/src/modules/autocomplete/suggestion-window.ts
@@ -80,7 +80,7 @@ export function createSuggestionWindow(x: number, y: number): BrowserWindow {
     hasShadow: true,
     type: 'panel',
     webPreferences: {
-      preload: path.join(__dirname, '..', 'preload.js'),
+      preload: path.join(__dirname, 'preload.js'),
       contextIsolation: true,
       nodeIntegration: false,
       sandbox: true,

From 530db1053939cd69a6ce41107a6169babab1f707 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 02:56:24 +0530
Subject: [PATCH 059/202] refactor: remove unused Electron API check and update
 search space ID handling in document upload

---
 surfsense_desktop/src/ipc/channels.ts         |   2 +-
 surfsense_desktop/src/ipc/handlers.ts         |   4 +-
 .../src/modules/folder-watcher.ts             |  18 +-
 surfsense_desktop/src/preload.ts              |   4 +-
 .../layout/ui/sidebar/DocumentsSidebar.tsx    |   2 -
 .../components/sources/DocumentUploadTab.tsx  | 162 ++++++++++--------
 surfsense_web/types/window.d.ts               |   9 +-
 7 files changed, 100 insertions(+), 101 deletions(-)

diff --git a/surfsense_desktop/src/ipc/channels.ts b/surfsense_desktop/src/ipc/channels.ts
index 2761960f7..2000964c7 100644
--- a/surfsense_desktop/src/ipc/channels.ts
+++ b/surfsense_desktop/src/ipc/channels.ts
@@ -19,6 +19,6 @@ export const IPC_CHANNELS = {
   FOLDER_SYNC_RENDERER_READY: 'folder-sync:renderer-ready',
   FOLDER_SYNC_GET_PENDING_EVENTS: 'folder-sync:get-pending-events',
   FOLDER_SYNC_ACK_EVENTS: 'folder-sync:ack-events',
-  BROWSE_FILE_OR_FOLDER: 'browse:file-or-folder',
+  BROWSE_FILES: 'browse:files',
   READ_LOCAL_FILES: 'browse:read-local-files',
 } as const;
diff --git a/surfsense_desktop/src/ipc/handlers.ts b/surfsense_desktop/src/ipc/handlers.ts
index 7194aaaff..c4251b30b 100644
--- a/surfsense_desktop/src/ipc/handlers.ts
+++ b/surfsense_desktop/src/ipc/handlers.ts
@@ -11,7 +11,7 @@ import {
   pauseWatcher,
   resumeWatcher,
   markRendererReady,
-  browseFileOrFolder,
+  browseFiles,
   readLocalFiles,
 } from '../modules/folder-watcher';
 
@@ -62,7 +62,7 @@ export function registerIpcHandlers(): void {
     acknowledgeFileEvents(eventIds)
   );
 
-  ipcMain.handle(IPC_CHANNELS.BROWSE_FILE_OR_FOLDER, () => browseFileOrFolder());
+  ipcMain.handle(IPC_CHANNELS.BROWSE_FILES, () => browseFiles());
 
   ipcMain.handle(IPC_CHANNELS.READ_LOCAL_FILES, (_event, paths: string[]) =>
     readLocalFiles(paths)
diff --git a/surfsense_desktop/src/modules/folder-watcher.ts b/surfsense_desktop/src/modules/folder-watcher.ts
index 9cbdd9775..969dabe97 100644
--- a/surfsense_desktop/src/modules/folder-watcher.ts
+++ b/surfsense_desktop/src/modules/folder-watcher.ts
@@ -475,23 +475,13 @@ export async function unregisterFolderWatcher(): Promise<void> {
   watchers.clear();
 }
 
-export interface BrowseResult {
-  type: 'files' | 'folder';
-  paths: string[];
-}
-
-export async function browseFileOrFolder(): Promise<BrowseResult | null> {
+export async function browseFiles(): Promise<string[] | null> {
   const result = await dialog.showOpenDialog({
-    properties: ['openFile', 'openDirectory', 'multiSelections'],
-    title: 'Select files or a folder',
+    properties: ['openFile', 'multiSelections'],
+    title: 'Select files',
   });
   if (result.canceled || result.filePaths.length === 0) return null;
-
-  const stat = fs.statSync(result.filePaths[0]);
-  if (stat.isDirectory()) {
-    return { type: 'folder', paths: [result.filePaths[0]] };
-  }
-  return { type: 'files', paths: result.filePaths };
+  return result.filePaths;
 }
 
 const MIME_MAP: Record<string, string> = {
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 6a2610dc8..6fbfd354a 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -48,7 +48,7 @@ contextBridge.exposeInMainWorld('electronAPI', {
   getPendingFileEvents: () => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_GET_PENDING_EVENTS),
   acknowledgeFileEvents: (eventIds: string[]) => ipcRenderer.invoke(IPC_CHANNELS.FOLDER_SYNC_ACK_EVENTS, eventIds),
 
-  // Unified browse (files + folders)
-  browseFileOrFolder: () => ipcRenderer.invoke(IPC_CHANNELS.BROWSE_FILE_OR_FOLDER),
+  // Browse files via native dialog
+  browseFiles: () => ipcRenderer.invoke(IPC_CHANNELS.BROWSE_FILES),
   readLocalFiles: (paths: string[]) => ipcRenderer.invoke(IPC_CHANNELS.READ_LOCAL_FILES, paths),
 });
diff --git a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
index ed3a78786..f8b774d26 100644
--- a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
@@ -277,8 +277,6 @@ export function DocumentsSidebar({
 		[createFolderParentId, searchSpaceId, setExpandedFolderMap]
 	);
 
-	const isElectron = typeof window !== "undefined" && !!window.electronAPI;
-
 	const handleRescanFolder = useCallback(
 		async (folder: FolderDisplay) => {
 			const api = window.electronAPI;
diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index 3fdf576b5..d5ac2770a 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { useAtom } from "jotai";
-import { CheckCircle2, FileType, FolderOpen, Info, Upload, X } from "lucide-react";
+import { CheckCircle2, ChevronDown, File as FileIcon, FileType, FolderOpen, Info, Upload, X } from "lucide-react";
 
 import { useTranslations } from "next-intl";
 import { useCallback, useMemo, useRef, useState } from "react";
@@ -19,6 +19,12 @@ import { Alert, AlertDescription } from "@/components/ui/alert";
 import { Badge } from "@/components/ui/badge";
 import { Button } from "@/components/ui/button";
 import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
+import {
+	DropdownMenu,
+	DropdownMenuContent,
+	DropdownMenuItem,
+	DropdownMenuTrigger,
+} from "@/components/ui/dropdown-menu";
 import { Label } from "@/components/ui/label";
 import { Progress } from "@/components/ui/progress";
 import { Separator } from "@/components/ui/separator";
@@ -146,7 +152,7 @@ export function DocumentUploadTab({
 	const [selectedFolder, setSelectedFolder] = useState<SelectedFolder | null>(null);
 	const [watchFolder, setWatchFolder] = useState(true);
 	const [folderSubmitting, setFolderSubmitting] = useState(false);
-	const isElectron = typeof window !== "undefined" && !!window.electronAPI?.browseFileOrFolder;
+	const isElectron = typeof window !== "undefined" && !!window.electronAPI?.browseFiles;
 
 	const acceptedFileTypes = useMemo(() => {
 		const etlService = process.env.NEXT_PUBLIC_ETL_SERVICE;
@@ -193,7 +199,7 @@ export function DocumentUploadTab({
 		onDrop,
 		accept: acceptedFileTypes,
 		maxSize: 50 * 1024 * 1024, // 50MB per file
-		noClick: !isElectron,
+		noClick: isElectron,
 		disabled: files.length >= MAX_FILES,
 	});
 
@@ -201,52 +207,51 @@ export function DocumentUploadTab({
 		e.stopPropagation();
 	}, []);
 
-	const handleBrowse = useCallback(async (e: React.MouseEvent) => {
-		e.stopPropagation();
-		e.preventDefault();
-
+	const handleBrowseFiles = useCallback(async () => {
 		const api = window.electronAPI;
-		if (!api?.browseFileOrFolder) {
-			fileInputRef.current?.click();
-			return;
-		}
+		if (!api?.browseFiles) return;
 
-		const result = await api.browseFileOrFolder();
-		if (!result) return;
+		const paths = await api.browseFiles();
+		if (!paths || paths.length === 0) return;
 
-		if (result.type === "folder") {
-			const folderPath = result.paths[0];
-			const folderName = folderPath.split("/").pop() || folderPath.split("\\").pop() || folderPath;
-			setFiles([]);
-			setSelectedFolder({ path: folderPath, name: folderName });
-			setWatchFolder(true);
-		} else {
-			setSelectedFolder(null);
-			const fileDataList = await api.readLocalFiles(result.paths);
-			const newFiles: FileWithId[] = fileDataList.map((fd) => ({
-				id: crypto.randomUUID?.() ?? `file-${Date.now()}-${Math.random().toString(36)}`,
-				file: new File([fd.data], fd.name, { type: fd.mimeType }),
-			}));
-			setFiles((prev) => {
-				const merged = [...prev, ...newFiles];
-				if (merged.length > MAX_FILES) {
-					toast.error(t("max_files_exceeded"), {
-						description: t("max_files_exceeded_desc", { max: MAX_FILES }),
-					});
-					return prev;
-				}
-				const totalSize = merged.reduce((sum, e) => sum + e.file.size, 0);
-				if (totalSize > MAX_TOTAL_SIZE_BYTES) {
-					toast.error(t("max_size_exceeded"), {
-						description: t("max_size_exceeded_desc", { max: MAX_TOTAL_SIZE_MB }),
-					});
-					return prev;
-				}
-				return merged;
-			});
-		}
+		setSelectedFolder(null);
+		const fileDataList = await api.readLocalFiles(paths);
+		const newFiles: FileWithId[] = fileDataList.map((fd) => ({
+			id: crypto.randomUUID?.() ?? `file-${Date.now()}-${Math.random().toString(36)}`,
+			file: new File([fd.data], fd.name, { type: fd.mimeType }),
+		}));
+		setFiles((prev) => {
+			const merged = [...prev, ...newFiles];
+			if (merged.length > MAX_FILES) {
+				toast.error(t("max_files_exceeded"), {
+					description: t("max_files_exceeded_desc", { max: MAX_FILES }),
+				});
+				return prev;
+			}
+			const totalSize = merged.reduce((sum, e) => sum + e.file.size, 0);
+			if (totalSize > MAX_TOTAL_SIZE_BYTES) {
+				toast.error(t("max_size_exceeded"), {
+					description: t("max_size_exceeded_desc", { max: MAX_TOTAL_SIZE_MB }),
+				});
+				return prev;
+			}
+			return merged;
+		});
 	}, [t]);
 
+	const handleBrowseFolder = useCallback(async () => {
+		const api = window.electronAPI;
+		if (!api?.selectFolder) return;
+
+		const folderPath = await api.selectFolder();
+		if (!folderPath) return;
+
+		const folderName = folderPath.split("/").pop() || folderPath.split("\\").pop() || folderPath;
+		setFiles([]);
+		setSelectedFolder({ path: folderPath, name: folderName });
+		setWatchFolder(true);
+	}, []);
+
 	const formatFileSize = (bytes: number) => {
 		if (bytes === 0) return "0 Bytes";
 		const k = 1024;
@@ -280,10 +285,11 @@ export function DocumentUploadTab({
 
 		setFolderSubmitting(true);
 		try {
-			const result = await documentsApiService.folderIndex(Number(searchSpaceId), {
+			const numericSpaceId = Number(searchSpaceId);
+			const result = await documentsApiService.folderIndex(numericSpaceId, {
 				folder_path: selectedFolder.path,
 				folder_name: selectedFolder.name,
-				search_space_id: searchSpaceId,
+				search_space_id: numericSpaceId,
 				enable_summary: shouldSummarize,
 			});
 
@@ -409,33 +415,43 @@ export function DocumentUploadTab({
 							)}
 						</div>
 					)}
-					{!isFileCountLimitReached && (
-						<div className="mt-2 sm:mt-4">
-							{isElectron ? (
-								<Button
-									variant="secondary"
-									size="sm"
-									className="text-xs sm:text-sm"
-									onClick={handleBrowse}
-								>
-									{t("browse_files")}
-								</Button>
-							) : (
-								<Button
-									variant="secondary"
-									size="sm"
-									className="text-xs sm:text-sm"
-									onClick={(e) => {
-										e.stopPropagation();
-										e.preventDefault();
-										fileInputRef.current?.click();
-									}}
-								>
-									{t("browse_files")}
-								</Button>
-							)}
-						</div>
-					)}
+				{!isFileCountLimitReached && (
+					<div className="mt-2 sm:mt-4">
+						{isElectron ? (
+							<DropdownMenu>
+								<DropdownMenuTrigger asChild onClick={(e) => e.stopPropagation()}>
+									<Button variant="secondary" size="sm" className="text-xs sm:text-sm gap-1">
+										{t("browse_files")}
+										<ChevronDown className="h-3 w-3 opacity-60" />
+									</Button>
+								</DropdownMenuTrigger>
+								<DropdownMenuContent align="center" onClick={(e) => e.stopPropagation()}>
+									<DropdownMenuItem onClick={handleBrowseFiles}>
+										<FileIcon className="h-4 w-4 mr-2" />
+										Files
+									</DropdownMenuItem>
+									<DropdownMenuItem onClick={handleBrowseFolder}>
+										<FolderOpen className="h-4 w-4 mr-2" />
+										Folder
+									</DropdownMenuItem>
+								</DropdownMenuContent>
+							</DropdownMenu>
+						) : (
+							<Button
+								variant="secondary"
+								size="sm"
+								className="text-xs sm:text-sm"
+								onClick={(e) => {
+									e.stopPropagation();
+									e.preventDefault();
+									fileInputRef.current?.click();
+								}}
+							>
+								{t("browse_files")}
+							</Button>
+						)}
+					</div>
+				)}
 				</div>
 			</CardContent>
 		</Card>
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 719373e02..0842ed655 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -27,11 +27,6 @@ interface FolderSyncWatcherReadyEvent {
 	folderPath: string;
 }
 
-interface BrowseResult {
-	type: "files" | "folder";
-	paths: string[];
-}
-
 interface LocalFileData {
 	name: string;
 	data: ArrayBuffer;
@@ -66,8 +61,8 @@ interface ElectronAPI {
 	signalRendererReady: () => Promise<void>;
 	getPendingFileEvents: () => Promise<FolderSyncFileChangedEvent[]>;
 	acknowledgeFileEvents: (eventIds: string[]) => Promise<{ acknowledged: number }>;
-	// Unified browse
-	browseFileOrFolder: () => Promise<BrowseResult | null>;
+	// Browse files/folders via native dialogs
+	browseFiles: () => Promise<string[] | null>;
 	readLocalFiles: (paths: string[]) => Promise<LocalFileData[]>;
 }
 

From bd21c2842dec8dfeae80a00a040c4b1513c1cf3d Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 04:14:09 +0530
Subject: [PATCH 060/202] feat: enhance document upload and folder
 synchronization UI with improved processing state indicators and responsive
 design adjustments

---
 .../app/routes/documents_routes.py            |   5 +-
 .../assistant-ui/document-upload-popup.tsx    |  29 +-
 .../components/documents/DocumentNode.tsx     |  14 +-
 .../components/documents/FolderNode.tsx       |  48 +-
 .../components/documents/FolderTreeView.tsx   |  30 +
 .../components/sources/DocumentUploadTab.tsx  | 514 +++++++++---------
 .../contracts/enums/connectorIcons.tsx        |   2 +
 7 files changed, 359 insertions(+), 283 deletions(-)

diff --git a/surfsense_backend/app/routes/documents_routes.py b/surfsense_backend/app/routes/documents_routes.py
index 0acc1d30b..edb01d4cc 100644
--- a/surfsense_backend/app/routes/documents_routes.py
+++ b/surfsense_backend/app/routes/documents_routes.py
@@ -29,6 +29,7 @@ from app.schemas import (
     DocumentTitleSearchResponse,
     DocumentUpdate,
     DocumentWithChunksRead,
+    FolderRead,
     PaginatedResponse,
 )
 from app.services.task_dispatcher import TaskDispatcher, get_task_dispatcher
@@ -953,15 +954,13 @@ async def get_document_by_chunk_id(
         ) from e
 
 
-@router.get("/documents/watched-folders", response_model=list["FolderRead"])
+@router.get("/documents/watched-folders", response_model=list[FolderRead])
 async def get_watched_folders(
     search_space_id: int,
     session: AsyncSession = Depends(get_async_session),
     user: User = Depends(current_active_user),
 ):
     """Return root folders that are marked as watched (metadata->>'watched' = 'true')."""
-    from app.schemas import FolderRead  # noqa: F811
-
     await check_permission(
         session,
         user,
diff --git a/surfsense_web/components/assistant-ui/document-upload-popup.tsx b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
index 06b0d38e7..78600be47 100644
--- a/surfsense_web/components/assistant-ui/document-upload-popup.tsx
+++ b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
@@ -125,29 +125,23 @@ const DocumentUploadPopupContent: FC<{
 				onPointerDownOutside={(e) => e.preventDefault()}
 				onInteractOutside={(e) => e.preventDefault()}
 				onEscapeKeyDown={(e) => e.preventDefault()}
-				className="select-none max-w-4xl w-[95vw] sm:w-full h-[calc(100dvh-2rem)] sm:h-[85vh] flex flex-col p-0 gap-0 overflow-hidden border border-border ring-0 bg-muted dark:bg-muted text-foreground [&>button]:right-3 sm:[&>button]:right-12 [&>button]:top-3 sm:[&>button]:top-10 [&>button]:opacity-80 hover:[&>button]:opacity-100 [&>button]:z-[100] [&>button_svg]:size-4 sm:[&>button_svg]:size-5"
+				className="select-none max-w-2xl w-[95vw] sm:w-[640px] h-[min(460px,75dvh)] sm:h-[min(520px,80vh)] flex flex-col p-0 gap-0 overflow-hidden border border-border ring-0 bg-muted dark:bg-muted text-foreground [&>button]:right-3 sm:[&>button]:right-6 [&>button]:top-3 sm:[&>button]:top-5 [&>button]:opacity-80 hover:[&>button]:opacity-100 [&>button]:z-[100] [&>button_svg]:size-4 sm:[&>button_svg]:size-5"
 			>
 				<DialogTitle className="sr-only">Upload Document</DialogTitle>
 
-				{/* Scrollable container for mobile */}
 				<div className="flex-1 min-h-0 overflow-y-auto overscroll-contain">
-					{/* Header - scrolls with content on mobile */}
-					<div className="sticky top-0 z-20 bg-muted px-4 sm:px-12 pt-4 sm:pt-10 pb-2 sm:pb-0">
-						{/* Upload header */}
-						<div className="flex items-center gap-2 sm:gap-4 mb-2 sm:mb-6">
-							<div className="flex-1 min-w-0 pr-8 sm:pr-0">
-								<h2 className="text-base sm:text-2xl font-semibold tracking-tight">
-									Upload Documents
-								</h2>
-								<p className="text-xs sm:text-base text-muted-foreground mt-0.5 sm:mt-1 line-clamp-1 sm:line-clamp-none">
-									Upload and sync your documents to your search space
-								</p>
-							</div>
+					<div className="sticky top-0 z-20 bg-muted px-4 sm:px-6 pt-4 sm:pt-5 pb-10">
+						<div className="flex items-center gap-2 mb-1 pr-8 sm:pr-0">
+							<h2 className="text-base sm:text-lg font-semibold tracking-tight">
+								Upload Documents
+							</h2>
 						</div>
+						<p className="text-xs sm:text-sm text-muted-foreground line-clamp-1">
+							Upload and sync your documents to your search space
+						</p>
 					</div>
 
-					{/* Content */}
-					<div className="px-4 sm:px-12 pb-4 sm:pb-16">
+					<div className="px-4 sm:px-6 pb-4 sm:pb-6">
 						{!isLoading && !hasDocumentSummaryLLM ? (
 							<Alert variant="destructive" className="mb-4 bg-muted/50 rounded-xl border-destructive/30">
 								<AlertTriangle className="h-4 w-4" />
@@ -179,9 +173,6 @@ const DocumentUploadPopupContent: FC<{
 						)}
 					</div>
 				</div>
-
-				{/* Bottom fade shadow - hidden on very small screens */}
-				<div className="hidden sm:block absolute bottom-0 left-0 right-0 h-7 bg-gradient-to-t from-muted via-muted/80 to-transparent pointer-events-none z-10" />
 			</DialogContent>
 		</Dialog>
 	);
diff --git a/surfsense_web/components/documents/DocumentNode.tsx b/surfsense_web/components/documents/DocumentNode.tsx
index 691a6eb0d..7a3b3e0ca 100644
--- a/surfsense_web/components/documents/DocumentNode.tsx
+++ b/surfsense_web/components/documents/DocumentNode.tsx
@@ -195,12 +195,14 @@ export const DocumentNode = React.memo(function DocumentNode({
 
 					<span className="flex-1 min-w-0 truncate">{doc.title}</span>
 
-					<span className="shrink-0">
-						{getDocumentTypeIcon(
-							doc.document_type as DocumentTypeEnum,
-							"h-3.5 w-3.5 text-muted-foreground"
-						)}
-					</span>
+					{getDocumentTypeIcon(doc.document_type as DocumentTypeEnum, "h-3.5 w-3.5 text-muted-foreground") && (
+						<span className="shrink-0">
+							{getDocumentTypeIcon(
+								doc.document_type as DocumentTypeEnum,
+								"h-3.5 w-3.5 text-muted-foreground"
+							)}
+						</span>
+					)}
 
 					<DropdownMenu open={dropdownOpen} onOpenChange={setDropdownOpen}>
 						<DropdownMenuTrigger asChild>
diff --git a/surfsense_web/components/documents/FolderNode.tsx b/surfsense_web/components/documents/FolderNode.tsx
index 6780bd1e5..41c1d8f73 100644
--- a/surfsense_web/components/documents/FolderNode.tsx
+++ b/surfsense_web/components/documents/FolderNode.tsx
@@ -1,6 +1,7 @@
 "use client";
 
 import {
+	AlertCircle,
 	ChevronDown,
 	ChevronRight,
 	Eye,
@@ -30,6 +31,8 @@ import {
 	DropdownMenuItem,
 	DropdownMenuTrigger,
 } from "@/components/ui/dropdown-menu";
+import { Spinner } from "@/components/ui/spinner";
+import { Tooltip, TooltipContent, TooltipTrigger } from "@/components/ui/tooltip";
 import { cn } from "@/lib/utils";
 import type { FolderSelectionState } from "./FolderTreeView";
 
@@ -55,6 +58,7 @@ interface FolderNodeProps {
 	isRenaming: boolean;
 	childCount: number;
 	selectionState: FolderSelectionState;
+	processingState: "idle" | "processing" | "failed";
 	onToggleSelect: (folderId: number, selectAll: boolean) => void;
 	onToggleExpand: (folderId: number) => void;
 	onRename: (folder: FolderDisplay, newName: string) => void;
@@ -100,6 +104,7 @@ export const FolderNode = React.memo(function FolderNode({
 	isRenaming,
 	childCount,
 	selectionState,
+	processingState,
 	onToggleSelect,
 	onToggleExpand,
 	onRename,
@@ -281,14 +286,41 @@ export const FolderNode = React.memo(function FolderNode({
 						)}
 					</span>
 
-					<Checkbox
-						checked={
-							selectionState === "all" ? true : selectionState === "some" ? "indeterminate" : false
-						}
-						onCheckedChange={handleCheckChange}
-						onClick={(e) => e.stopPropagation()}
-						className="h-3.5 w-3.5 shrink-0"
-					/>
+					{processingState !== "idle" && selectionState === "none" ? (
+						<>
+							<Tooltip>
+								<TooltipTrigger asChild>
+									<span className="flex h-3.5 w-3.5 shrink-0 items-center justify-center group-hover:hidden">
+										{processingState === "processing" ? (
+											<Spinner size="xs" className="text-primary" />
+										) : (
+											<AlertCircle className="h-3.5 w-3.5 text-destructive" />
+										)}
+									</span>
+								</TooltipTrigger>
+								<TooltipContent side="top">
+									{processingState === "processing"
+										? "Syncing folder contents"
+										: "Some files failed to process"}
+								</TooltipContent>
+							</Tooltip>
+							<Checkbox
+								checked={false}
+								onCheckedChange={handleCheckChange}
+								onClick={(e) => e.stopPropagation()}
+								className="h-3.5 w-3.5 shrink-0 hidden group-hover:flex"
+							/>
+						</>
+					) : (
+						<Checkbox
+							checked={
+								selectionState === "all" ? true : selectionState === "some" ? "indeterminate" : false
+							}
+							onCheckedChange={handleCheckChange}
+							onClick={(e) => e.stopPropagation()}
+							className="h-3.5 w-3.5 shrink-0"
+						/>
+					)}
 
 					<FolderIcon className="h-4 w-4 shrink-0 text-muted-foreground" />
 
diff --git a/surfsense_web/components/documents/FolderTreeView.tsx b/surfsense_web/components/documents/FolderTreeView.tsx
index f34b9a0c2..01af73edc 100644
--- a/surfsense_web/components/documents/FolderTreeView.tsx
+++ b/surfsense_web/components/documents/FolderTreeView.tsx
@@ -166,6 +166,35 @@ export function FolderTreeView({
 		return states;
 	}, [folders, docsByFolder, foldersByParent, mentionedDocIds]);
 
+	const folderProcessingStates = useMemo(() => {
+		const states: Record<number, "idle" | "processing" | "failed"> = {};
+
+		function compute(folderId: number): { hasProcessing: boolean; hasFailed: boolean } {
+			const directDocs = docsByFolder[folderId] ?? [];
+			let hasProcessing = directDocs.some(
+				(d) => d.status?.state === "pending" || d.status?.state === "processing"
+			);
+			let hasFailed = directDocs.some((d) => d.status?.state === "failed");
+
+			for (const child of foldersByParent[folderId] ?? []) {
+				const sub = compute(child.id);
+				hasProcessing = hasProcessing || sub.hasProcessing;
+				hasFailed = hasFailed || sub.hasFailed;
+			}
+
+			if (hasProcessing) states[folderId] = "processing";
+			else if (hasFailed) states[folderId] = "failed";
+			else states[folderId] = "idle";
+
+			return { hasProcessing, hasFailed };
+		}
+
+		for (const f of folders) {
+			if (states[f.id] === undefined) compute(f.id);
+		}
+		return states;
+	}, [folders, docsByFolder, foldersByParent]);
+
 	function renderLevel(parentId: number | null, depth: number): React.ReactNode[] {
 		const key = parentId ?? "root";
 		const childFolders = (foldersByParent[key] ?? [])
@@ -199,6 +228,7 @@ export function FolderTreeView({
 					isRenaming={renamingFolderId === f.id}
 					childCount={folderChildCounts[f.id] ?? 0}
 					selectionState={folderSelectionStates[f.id] ?? "none"}
+					processingState={folderProcessingStates[f.id] ?? "idle"}
 					onToggleSelect={onToggleFolderSelect}
 					onToggleExpand={onToggleExpand}
 					onRename={onRenameFolder}
diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index d5ac2770a..7176afae5 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -1,24 +1,21 @@
 "use client";
 
 import { useAtom } from "jotai";
-import { CheckCircle2, ChevronDown, File as FileIcon, FileType, FolderOpen, Info, Upload, X } from "lucide-react";
+import { CheckCircle2, ChevronDown, File as FileIcon, FileType, FolderOpen, Plus, Upload, X } from "lucide-react";
 
 import { useTranslations } from "next-intl";
 import { useCallback, useMemo, useRef, useState } from "react";
 import { useDropzone } from "react-dropzone";
 import { toast } from "sonner";
 import { uploadDocumentMutationAtom } from "@/atoms/documents/document-mutation.atoms";
-import { SummaryConfig } from "@/components/assistant-ui/connector-popup/components/summary-config";
 import {
 	Accordion,
 	AccordionContent,
 	AccordionItem,
 	AccordionTrigger,
 } from "@/components/ui/accordion";
-import { Alert, AlertDescription } from "@/components/ui/alert";
 import { Badge } from "@/components/ui/badge";
 import { Button } from "@/components/ui/button";
-import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
 import {
 	DropdownMenu,
 	DropdownMenuContent,
@@ -27,7 +24,6 @@ import {
 } from "@/components/ui/dropdown-menu";
 import { Label } from "@/components/ui/label";
 import { Progress } from "@/components/ui/progress";
-import { Separator } from "@/components/ui/separator";
 import { Spinner } from "@/components/ui/spinner";
 import { Switch } from "@/components/ui/switch";
 import { documentsApiService } from "@/lib/apis/documents-api.service";
@@ -36,7 +32,6 @@ import {
 	trackDocumentUploadStarted,
 	trackDocumentUploadSuccess,
 } from "@/lib/posthog/events";
-import { GridPattern } from "./GridPattern";
 
 interface SelectedFolder {
 	path: string;
@@ -128,13 +123,12 @@ interface FileWithId {
 	file: File;
 }
 
-const cardClass = "border border-border bg-slate-400/5 dark:bg-white/5";
-
-// Upload limits — files are sent in batches of 5 to avoid proxy timeouts
 const MAX_FILES = 50;
 const MAX_TOTAL_SIZE_MB = 200;
 const MAX_TOTAL_SIZE_BYTES = MAX_TOTAL_SIZE_MB * 1024 * 1024;
 
+const toggleRowClass = "flex items-center justify-between rounded-lg bg-slate-400/5 dark:bg-white/5 p-3";
+
 export function DocumentUploadTab({
 	searchSpaceId,
 	onSuccess,
@@ -198,7 +192,7 @@ export function DocumentUploadTab({
 	const { getRootProps, getInputProps, isDragActive } = useDropzone({
 		onDrop,
 		accept: acceptedFileTypes,
-		maxSize: 50 * 1024 * 1024, // 50MB per file
+		maxSize: 50 * 1024 * 1024,
 		noClick: isElectron,
 		disabled: files.length >= MAX_FILES,
 	});
@@ -270,6 +264,8 @@ export function DocumentUploadTab({
 		(MAX_TOTAL_SIZE_BYTES - totalFileSize) / (1024 * 1024)
 	).toFixed(1);
 
+	const hasContent = files.length > 0 || selectedFolder !== null;
+
 	const handleAccordionChange = useCallback(
 		(value: string) => {
 			setAccordionValue(value);
@@ -307,7 +303,7 @@ export function DocumentUploadTab({
 				});
 				toast.success(`Watching folder: ${selectedFolder.name}`);
 			} else {
-				toast.success(`Indexing folder: ${selectedFolder.name}`);
+				toast.success(`Syncing folder: ${selectedFolder.name}`);
 			}
 
 			setSelectedFolder(null);
@@ -355,139 +351,180 @@ export function DocumentUploadTab({
 		);
 	};
 
-	return (
-		<div className="space-y-3 sm:space-y-6 max-w-4xl mx-auto pt-0">
-			<Alert className="border border-border bg-slate-400/5 dark:bg-white/5">
-				<Info className="h-4 w-4 shrink-0 mt-0.5" />
-				<AlertDescription className="text-xs sm:text-sm leading-relaxed pt-0.5">
-					{t("file_size_limit")}{" "}
-					{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}
-				</AlertDescription>
-			</Alert>
+	const renderBrowseButton = (options?: { compact?: boolean; fullWidth?: boolean }) => {
+		const { compact, fullWidth } = options ?? {};
+		if (isFileCountLimitReached) return null;
 
-		<Card className={`relative overflow-hidden ${cardClass}`}>
-			<div className="absolute inset-0 [mask-image:radial-gradient(ellipse_at_center,white,transparent)] opacity-30">
-				<GridPattern />
-			</div>
-			<CardContent className="p-4 sm:p-10 relative z-10">
-				<div
-					{...getRootProps()}
-					className={`flex flex-col items-center justify-center min-h-[200px] sm:min-h-[300px] border-2 border-dashed rounded-lg transition-colors ${
-						isFileCountLimitReached || isSizeLimitReached
-							? "border-destructive/50 bg-destructive/5 cursor-not-allowed"
-							: "border-border hover:border-primary/50 cursor-pointer"
-					}`}
-				>
-					<input
-						{...getInputProps()}
-						ref={fileInputRef}
-						className="hidden"
-						onClick={handleFileInputClick}
-					/>
-					{isFileCountLimitReached ? (
-						<div className="flex flex-col items-center gap-2 sm:gap-4 text-center px-4">
-							<Upload className="h-8 w-8 sm:h-12 sm:w-12 text-destructive/70" />
-							<div>
-								<p className="text-sm sm:text-lg font-medium text-destructive">
-									{t("file_limit_reached")}
-								</p>
-								<p className="text-xs sm:text-sm text-muted-foreground mt-1">
-									{t("file_limit_reached_desc", { max: MAX_FILES })}
-								</p>
+		const sizeClass = compact ? "h-7" : "h-8";
+		const widthClass = fullWidth ? "w-full" : "";
+
+		if (isElectron) {
+			return (
+				<DropdownMenu>
+					<DropdownMenuTrigger asChild onClick={(e) => e.stopPropagation()}>
+						<Button variant="secondary" size="sm" className={`text-xs gap-1 ${sizeClass} ${widthClass}`}>
+							Browse
+							<ChevronDown className="h-3 w-3 opacity-60" />
+						</Button>
+					</DropdownMenuTrigger>
+					<DropdownMenuContent align="center" onClick={(e) => e.stopPropagation()}>
+						<DropdownMenuItem onClick={handleBrowseFiles}>
+							<FileIcon className="h-4 w-4 mr-2" />
+							Files
+						</DropdownMenuItem>
+						<DropdownMenuItem onClick={handleBrowseFolder}>
+							<FolderOpen className="h-4 w-4 mr-2" />
+							Folder
+						</DropdownMenuItem>
+					</DropdownMenuContent>
+				</DropdownMenu>
+			);
+		}
+
+		return (
+			<Button
+				variant="secondary"
+				size="sm"
+				className={`text-xs ${sizeClass} ${widthClass}`}
+				onClick={(e) => {
+					e.stopPropagation();
+					e.preventDefault();
+					fileInputRef.current?.click();
+				}}
+			>
+				{t("browse_files")}
+			</Button>
+		);
+	};
+
+	return (
+		<div className="space-y-2 w-full mx-auto">
+			{/* Hidden file input for mobile browse */}
+			<input
+				{...getInputProps()}
+				ref={fileInputRef}
+				className="hidden"
+				onClick={handleFileInputClick}
+			/>
+
+			{/* MOBILE DROP ZONE */}
+			<div className="sm:hidden">
+				{hasContent ? (
+					!selectedFolder && !isFileCountLimitReached && (
+						isElectron ? (
+							<div className="w-full">
+								{renderBrowseButton({ compact: true, fullWidth: true })}
 							</div>
-						</div>
-					) : isDragActive ? (
-						<div className="flex flex-col items-center gap-2 sm:gap-4">
-							<Upload className="h-8 w-8 sm:h-12 sm:w-12 text-primary" />
-							<p className="text-sm sm:text-lg font-medium text-primary">{t("drop_files")}</p>
-						</div>
-					) : (
-						<div className="flex flex-col items-center gap-2 sm:gap-4">
-							<Upload className="h-8 w-8 sm:h-12 sm:w-12 text-muted-foreground" />
-							<div className="text-center">
-								<p className="text-sm sm:text-lg font-medium">{t("drag_drop")}</p>
-								<p className="text-xs sm:text-sm text-muted-foreground mt-1">{t("or_browse")}</p>
-							</div>
-							{files.length > 0 && (
-								<p className="text-xs text-muted-foreground">
-									{t("remaining_capacity", { files: remainingFiles, sizeMB: remainingSizeMB })}
-								</p>
-							)}
-						</div>
-					)}
-				{!isFileCountLimitReached && (
-					<div className="mt-2 sm:mt-4">
-						{isElectron ? (
-							<DropdownMenu>
-								<DropdownMenuTrigger asChild onClick={(e) => e.stopPropagation()}>
-									<Button variant="secondary" size="sm" className="text-xs sm:text-sm gap-1">
-										{t("browse_files")}
-										<ChevronDown className="h-3 w-3 opacity-60" />
-									</Button>
-								</DropdownMenuTrigger>
-								<DropdownMenuContent align="center" onClick={(e) => e.stopPropagation()}>
-									<DropdownMenuItem onClick={handleBrowseFiles}>
-										<FileIcon className="h-4 w-4 mr-2" />
-										Files
-									</DropdownMenuItem>
-									<DropdownMenuItem onClick={handleBrowseFolder}>
-										<FolderOpen className="h-4 w-4 mr-2" />
-										Folder
-									</DropdownMenuItem>
-								</DropdownMenuContent>
-							</DropdownMenu>
 						) : (
 							<Button
-								variant="secondary"
+								variant="outline"
 								size="sm"
-								className="text-xs sm:text-sm"
-								onClick={(e) => {
-									e.stopPropagation();
-									e.preventDefault();
-									fileInputRef.current?.click();
-								}}
+								className="w-full text-xs h-8 gap-1.5 border-dashed border-muted-foreground/30"
+								onClick={() => fileInputRef.current?.click()}
 							>
-								{t("browse_files")}
+								<Plus className="h-3.5 w-3.5" />
+								Add more files
 							</Button>
+						)
+					)
+				) : (
+					<div
+						className="flex flex-col items-center gap-3 py-6 px-4 cursor-pointer"
+						onClick={() => {
+							if (!isElectron) fileInputRef.current?.click();
+						}}
+					>
+						<Upload className="h-7 w-7 text-muted-foreground" />
+						<div className="text-center space-y-1">
+							<p className="text-sm font-medium">
+								{isElectron ? "Select files or folder" : "Tap to select files"}
+							</p>
+							<p className="text-xs text-muted-foreground">
+								{t("file_size_limit")}{" "}
+								{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}
+							</p>
+						</div>
+						{isElectron && (
+							<div className="w-full mt-1" onClick={(e) => e.stopPropagation()}>
+								{renderBrowseButton({ fullWidth: true })}
+							</div>
 						)}
 					</div>
 				)}
-				</div>
-			</CardContent>
-		</Card>
+			</div>
 
-		{selectedFolder && (
-			<Card className={cardClass}>
-				<CardHeader className="p-4 sm:p-6">
-					<div className="flex items-center justify-between gap-2">
-						<div className="flex items-center gap-3 min-w-0 flex-1">
-							<FolderOpen className="h-5 w-5 text-primary flex-shrink-0" />
-							<div className="min-w-0 flex-1">
-								<CardTitle className="text-base sm:text-lg truncate">
-									{selectedFolder.name}
-								</CardTitle>
-								<CardDescription className="text-xs sm:text-sm truncate">
-									{selectedFolder.path}
-								</CardDescription>
-							</div>
+			{/* DESKTOP DROP ZONE */}
+			<div
+				{...getRootProps()}
+				className={`hidden sm:block border-2 border-dashed rounded-lg transition-colors ${
+					isFileCountLimitReached || isSizeLimitReached
+						? "border-destructive/50 bg-destructive/5 cursor-not-allowed"
+						: "border-muted-foreground/30 hover:border-foreground/70 cursor-pointer"
+				} ${hasContent ? "p-3" : "py-20 px-4"}`}
+			>
+				{hasContent ? (
+					<div className="flex items-center gap-3">
+						<Upload className="h-4 w-4 text-muted-foreground shrink-0" />
+						<span className="text-xs text-muted-foreground flex-1 truncate">
+							{isDragActive
+								? t("drop_files")
+								: isFileCountLimitReached
+									? t("file_limit_reached")
+									: t("remaining_capacity", { files: remainingFiles, sizeMB: remainingSizeMB })}
+						</span>
+						{renderBrowseButton({ compact: true })}
+					</div>
+				) : isFileCountLimitReached ? (
+					<div className="flex flex-col items-center gap-2 text-center">
+						<Upload className="h-8 w-8 text-destructive/70" />
+						<p className="text-sm font-medium text-destructive">{t("file_limit_reached")}</p>
+						<p className="text-xs text-muted-foreground">
+							{t("file_limit_reached_desc", { max: MAX_FILES })}
+						</p>
+					</div>
+				) : isDragActive ? (
+					<div className="flex flex-col items-center gap-2">
+						<Upload className="h-8 w-8 text-primary" />
+						<p className="text-sm font-medium text-primary">{t("drop_files")}</p>
+					</div>
+				) : (
+					<div className="flex flex-col items-center gap-2">
+						<Upload className="h-8 w-8 text-muted-foreground" />
+						<p className="text-sm font-medium">{t("drag_drop")}</p>
+						<p className="text-xs text-muted-foreground text-center">
+							{t("file_size_limit")}{" "}
+							{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}
+						</p>
+						<div className="mt-1">{renderBrowseButton()}</div>
+					</div>
+				)}
+			</div>
+
+			{/* FOLDER SELECTED */}
+			{selectedFolder && (
+				<div className="rounded-lg border border-border p-3 space-y-2">
+					<div className="flex items-center gap-2">
+						<FolderOpen className="h-4 w-4 text-primary shrink-0" />
+						<div className="min-w-0 flex-1">
+							<p className="text-sm font-medium truncate">{selectedFolder.name}</p>
+							<p className="text-xs text-muted-foreground truncate">{selectedFolder.path}</p>
 						</div>
 						<Button
 							variant="ghost"
 							size="icon"
-							className="h-8 w-8 shrink-0"
+							className="h-7 w-7 shrink-0"
 							onClick={() => setSelectedFolder(null)}
 							disabled={folderSubmitting}
 						>
-							<X className="h-4 w-4" />
+							<X className="h-3.5 w-3.5" />
 						</Button>
 					</div>
-				</CardHeader>
-				<CardContent className="p-4 sm:p-6 pt-0 space-y-4">
-					<div className="flex items-center justify-between rounded-lg border border-border p-3">
-						<Label htmlFor="watch-folder-toggle" className="flex flex-col gap-1 cursor-pointer">
+
+					<div className={toggleRowClass}>
+						<Label htmlFor="watch-folder-toggle" className="flex flex-col gap-0.5 cursor-pointer">
 							<span className="text-sm font-medium">Watch folder</span>
 							<span className="text-xs text-muted-foreground font-normal">
-								Automatically sync changes when files are added, edited, or removed
+								Auto-sync when files change
 							</span>
 						</Label>
 						<Switch
@@ -497,150 +534,133 @@ export function DocumentUploadTab({
 						/>
 					</div>
 
-					<SummaryConfig enabled={shouldSummarize} onEnabledChange={setShouldSummarize} />
+					<div className={toggleRowClass}>
+						<div className="space-y-0.5">
+							<p className="font-medium text-sm">Enable AI Summary</p>
+							<p className="text-xs text-muted-foreground">
+								Improves search quality but adds latency
+							</p>
+						</div>
+						<Switch checked={shouldSummarize} onCheckedChange={setShouldSummarize} />
+					</div>
 
 					<Button
-						className="w-full py-3 sm:py-6 text-xs sm:text-base font-medium"
+						className="w-full relative"
 						onClick={handleFolderSubmit}
 						disabled={folderSubmitting}
 					>
-						{folderSubmitting ? (
-							<span className="flex items-center gap-2">
+						<span className={folderSubmitting ? "invisible" : ""}>
+							{watchFolder ? "Sync & Watch for Changes" : "Sync Folder"}
+						</span>
+						{folderSubmitting && (
+							<span className="absolute inset-0 flex items-center justify-center">
 								<Spinner size="sm" />
-								Processing...
-							</span>
-						) : (
-							<span className="flex items-center gap-2">
-								<CheckCircle2 className="h-4 w-4 sm:h-5 sm:w-5" />
-								{watchFolder ? "Watch & Index Folder" : "Index Folder"}
 							</span>
 						)}
 					</Button>
-				</CardContent>
-			</Card>
-		)}
-
-			{files.length > 0 && (
-				<Card className={cardClass}>
-					<CardHeader className="p-4 sm:p-6">
-						<div className="flex items-center justify-between gap-2">
-							<div className="min-w-0 flex-1">
-								<CardTitle className="text-base sm:text-2xl">
-									{t("selected_files", { count: files.length })}
-								</CardTitle>
-								<CardDescription className="text-xs sm:text-sm">
-									{t("total_size")}: {formatFileSize(totalFileSize)}
-								</CardDescription>
-							</div>
-							<Button
-								variant="outline"
-								size="sm"
-								className="text-xs sm:text-sm shrink-0"
-								onClick={() => setFiles([])}
-								disabled={isUploading}
-							>
-								{t("clear_all")}
-							</Button>
-						</div>
-					</CardHeader>
-					<CardContent className="p-4 sm:p-6 pt-0">
-						<div className="space-y-2 sm:space-y-3 max-h-[250px] sm:max-h-[400px] overflow-y-auto">
-							{files.map((entry) => (
-								<div
-									key={entry.id}
-									className={`flex items-center justify-between p-2 sm:p-4 rounded-lg border border-border ${cardClass} hover:bg-slate-400/10 dark:hover:bg-white/10 transition-colors`}
-								>
-									<div className="flex items-center gap-3 flex-1 min-w-0">
-										<FileType className="h-5 w-5 text-muted-foreground flex-shrink-0" />
-										<div className="flex-1 min-w-0">
-											<p className="text-sm sm:text-base font-medium truncate">{entry.file.name}</p>
-											<div className="flex items-center gap-2 mt-1">
-												<Badge variant="secondary" className="text-xs">
-													{formatFileSize(entry.file.size)}
-												</Badge>
-												<Badge variant="outline" className="text-xs">
-													{entry.file.type || "Unknown type"}
-												</Badge>
-											</div>
-										</div>
-									</div>
-									<Button
-										variant="ghost"
-										size="icon"
-										onClick={() => setFiles((prev) => prev.filter((e) => e.id !== entry.id))}
-										disabled={isUploading}
-										className="h-8 w-8"
-									>
-										<X className="h-4 w-4" />
-									</Button>
-								</div>
-							))}
-						</div>
-
-						{isUploading && (
-							<div className="mt-3 sm:mt-6 space-y-2 sm:space-y-3">
-								<Separator className="bg-border" />
-								<div className="space-y-2">
-									<div className="flex items-center justify-between text-xs sm:text-sm">
-										<span>{t("uploading_files")}</span>
-										<span>{Math.round(uploadProgress)}%</span>
-									</div>
-									<Progress value={uploadProgress} className="h-2" />
-								</div>
-							</div>
-						)}
-
-						<div className="mt-3 sm:mt-6">
-							<SummaryConfig enabled={shouldSummarize} onEnabledChange={setShouldSummarize} />
-						</div>
-
-						<div className="mt-3 sm:mt-6">
-							<Button
-								className="w-full py-3 sm:py-6 text-xs sm:text-base font-medium"
-								onClick={handleUpload}
-								disabled={isUploading || files.length === 0}
-							>
-								{isUploading ? (
-									<span className="flex items-center gap-2">
-										<Spinner size="sm" />
-										{t("uploading")}
-									</span>
-								) : (
-									<span className="flex items-center gap-2">
-										<CheckCircle2 className="h-4 w-4 sm:h-5 sm:w-5" />
-										{t("upload_button", { count: files.length })}
-									</span>
-								)}
-							</Button>
-						</div>
-					</CardContent>
-				</Card>
+				</div>
 			)}
 
+			{/* FILES SELECTED */}
+			{files.length > 0 && (
+				<div className="rounded-lg border border-border p-3 space-y-2">
+					<div className="flex items-center justify-between">
+						<p className="text-sm font-medium">
+							{t("selected_files", { count: files.length })} &middot; {formatFileSize(totalFileSize)}
+						</p>
+						<Button
+							variant="ghost"
+							size="sm"
+							className="h-7 text-xs text-muted-foreground hover:text-foreground"
+							onClick={() => setFiles([])}
+							disabled={isUploading}
+						>
+							{t("clear_all")}
+						</Button>
+					</div>
+
+					<div className="max-h-[160px] sm:max-h-[200px] overflow-y-auto -mx-1">
+						{files.map((entry) => (
+							<div
+								key={entry.id}
+								className="flex items-center gap-2 py-1.5 px-2 rounded-md hover:bg-slate-400/5 dark:hover:bg-white/5 group"
+							>
+								<FileType className="h-4 w-4 text-muted-foreground shrink-0" />
+								<span className="text-sm truncate flex-1 min-w-0">{entry.file.name}</span>
+								<span className="text-xs text-muted-foreground shrink-0">
+									{formatFileSize(entry.file.size)}
+								</span>
+								<Button
+									variant="ghost"
+									size="icon"
+									className="h-6 w-6 shrink-0"
+									onClick={() => setFiles((prev) => prev.filter((e) => e.id !== entry.id))}
+									disabled={isUploading}
+								>
+									<X className="h-3 w-3" />
+								</Button>
+							</div>
+						))}
+					</div>
+
+					{isUploading && (
+						<div className="space-y-1">
+							<div className="flex items-center justify-between text-xs">
+								<span>{t("uploading_files")}</span>
+								<span>{Math.round(uploadProgress)}%</span>
+							</div>
+							<Progress value={uploadProgress} className="h-1.5" />
+						</div>
+					)}
+
+					<div className={toggleRowClass}>
+						<div className="space-y-0.5">
+							<p className="font-medium text-sm">Enable AI Summary</p>
+							<p className="text-xs text-muted-foreground">
+								Improves search quality but adds latency
+							</p>
+						</div>
+						<Switch checked={shouldSummarize} onCheckedChange={setShouldSummarize} />
+					</div>
+
+					<Button
+						className="w-full"
+						onClick={handleUpload}
+						disabled={isUploading || files.length === 0}
+					>
+						{isUploading ? (
+							<span className="flex items-center gap-2">
+								<Spinner size="sm" />
+								{t("uploading")}
+							</span>
+						) : (
+							<span className="flex items-center gap-2">
+								<CheckCircle2 className="h-4 w-4" />
+								{t("upload_button", { count: files.length })}
+							</span>
+						)}
+					</Button>
+				</div>
+			)}
+
+			{/* SUPPORTED FORMATS */}
 			<Accordion
 				type="single"
 				collapsible
 				value={accordionValue}
 				onValueChange={handleAccordionChange}
-				className={`w-full ${cardClass} border border-border rounded-lg mb-0`}
+				className="w-full"
 			>
-				<AccordionItem value="supported-file-types" className="border-0">
-					<AccordionTrigger className="px-3 sm:px-6 py-3 sm:py-4 hover:no-underline !items-center [&>svg]:!translate-y-0">
-						<div className="flex items-center gap-2 flex-1">
-							<div className="text-left min-w-0">
-								<div className="font-semibold text-sm sm:text-base">
-									{t("supported_file_types")}
-								</div>
-								<div className="text-xs sm:text-sm text-muted-foreground font-normal">
-									{t("file_types_desc")}
-								</div>
-							</div>
-						</div>
+				<AccordionItem value="supported-file-types" className="border border-border rounded-lg">
+					<AccordionTrigger className="px-3 py-2.5 hover:no-underline !items-center [&>svg]:!translate-y-0">
+						<span className="text-xs sm:text-sm text-muted-foreground font-normal">
+							{t("supported_file_types")}
+						</span>
 					</AccordionTrigger>
-					<AccordionContent className="px-3 sm:px-6 pb-3 sm:pb-6">
-						<div className="flex flex-wrap gap-2">
+					<AccordionContent className="px-3 pb-3">
+						<div className="flex flex-wrap gap-1">
 							{supportedExtensions.map((ext) => (
-								<Badge key={ext} variant="outline" className="text-xs">
+								<Badge key={ext} variant="outline" className="text-[10px] px-1.5 py-0">
 									{ext}
 								</Badge>
 							))}
diff --git a/surfsense_web/contracts/enums/connectorIcons.tsx b/surfsense_web/contracts/enums/connectorIcons.tsx
index 2e609b060..ab71d58b5 100644
--- a/surfsense_web/contracts/enums/connectorIcons.tsx
+++ b/surfsense_web/contracts/enums/connectorIcons.tsx
@@ -126,6 +126,8 @@ export const getConnectorIcon = (connectorType: EnumConnectorName | string, clas
 			return <Microscope {...iconProps} />;
 		case "DEEPEST":
 			return <Telescope {...iconProps} />;
+		case "LOCAL_FOLDER_FILE":
+			return null;
 		default:
 			return <Search {...iconProps} />;
 	}

From 44e39792da6fc7a35edbe8ae1cb68807e4ac3b3f Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 04:14:28 +0530
Subject: [PATCH 061/202] feat: assign folder_id to documents before indexing
 to ensure correct folder visibility during processing

---
 .../local_folder_indexer.py                   | 37 ++++++++++++-------
 1 file changed, 23 insertions(+), 14 deletions(-)

diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
index a3281eaea..041df71fc 100644
--- a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -719,6 +719,21 @@ async def index_local_folder(
             }
             documents = await pipeline.prepare_for_indexing(connector_docs)
 
+            # Assign folder_id immediately so docs appear in the correct
+            # folder while still pending/processing (visible via Zero sync).
+            for document in documents:
+                cd = doc_map.get(document.unique_identifier_hash)
+                if cd is None:
+                    continue
+                rel_path = (cd.metadata or {}).get("file_path", "")
+                parent_dir = str(Path(rel_path).parent) if rel_path else ""
+                if parent_dir == ".":
+                    parent_dir = ""
+                document.folder_id = folder_mapping.get(
+                    parent_dir, folder_mapping.get("")
+                )
+            await session.commit()
+
             llm = await get_user_long_context_llm(session, user_id, search_space_id)
 
             for document in documents:
@@ -732,17 +747,9 @@ async def index_local_folder(
                 if DocumentStatus.is_state(result.status, DocumentStatus.READY):
                     indexed_count += 1
 
-                    # Assign folder_id and mtime post-pipeline
-                    rel_path = (connector_doc.metadata or {}).get("file_path", "")
-                    parent_dir = str(Path(rel_path).parent) if rel_path else ""
-                    if parent_dir == ".":
-                        parent_dir = ""
-                    fid = folder_mapping.get(parent_dir, folder_mapping.get(""))
-
                     unique_id = connector_doc.unique_id
                     mtime_info = file_meta_map.get(unique_id, {})
 
-                    result.folder_id = fid
                     doc_meta = dict(result.document_metadata or {})
                     doc_meta["mtime"] = mtime_info.get("mtime")
                     result.document_metadata = doc_meta
@@ -894,16 +901,18 @@ async def _index_single_file(
             return 0, 1, None
 
         db_doc = documents[0]
-        await pipeline.index(db_doc, connector_doc, llm)
 
-        # Post-pipeline: assign folder_id and mtime
-        await session.refresh(db_doc)
-        folder_id = None
+        # Assign folder_id before indexing so the doc appears in the
+        # correct folder while still pending/processing.
         if root_folder_id:
-            folder_id = await _resolve_folder_for_file(
+            db_doc.folder_id = await _resolve_folder_for_file(
                 session, rel_path, root_folder_id, search_space_id, user_id
             )
-        db_doc.folder_id = folder_id
+            await session.commit()
+
+        await pipeline.index(db_doc, connector_doc, llm)
+
+        await session.refresh(db_doc)
         doc_meta = dict(db_doc.document_metadata or {})
         doc_meta["mtime"] = mtime
         db_doc.document_metadata = doc_meta

From fe7fcaae5dada13d12bf5883b5722c54dcd5f425 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 04:16:19 +0530
Subject: [PATCH 062/202] feat: update folder deletion process to queue
 document deletions first and handle folder cleanup in Celery task

---
 .../app/routes/folders_routes.py              | 31 +++++++++----------
 .../app/tasks/celery_tasks/document_tasks.py  | 27 ++++++++++++----
 .../layout/ui/sidebar/DocumentsSidebar.tsx    |  7 ++++-
 3 files changed, 42 insertions(+), 23 deletions(-)

diff --git a/surfsense_backend/app/routes/folders_routes.py b/surfsense_backend/app/routes/folders_routes.py
index 6e524d4a4..2dc9bceac 100644
--- a/surfsense_backend/app/routes/folders_routes.py
+++ b/surfsense_backend/app/routes/folders_routes.py
@@ -367,7 +367,7 @@ async def delete_folder(
     session: AsyncSession = Depends(get_async_session),
     user: User = Depends(current_active_user),
 ):
-    """Delete a folder and cascade-delete subfolders. Documents are async-deleted via Celery."""
+    """Mark documents for deletion and dispatch Celery to delete docs first, then folders."""
     try:
         folder = await session.get(Folder, folder_id)
         if not folder:
@@ -399,30 +399,29 @@ async def delete_folder(
             )
             await session.commit()
 
-        await session.execute(Folder.__table__.delete().where(Folder.id == folder_id))
-        await session.commit()
+        try:
+            from app.tasks.celery_tasks.document_tasks import (
+                delete_folder_documents_task,
+            )
 
-        if document_ids:
-            try:
-                from app.tasks.celery_tasks.document_tasks import (
-                    delete_folder_documents_task,
-                )
-
-                delete_folder_documents_task.delay(document_ids)
-            except Exception as err:
+            delete_folder_documents_task.delay(
+                document_ids, folder_subtree_ids=list(subtree_ids)
+            )
+        except Exception as err:
+            if document_ids:
                 await session.execute(
                     Document.__table__.update()
                     .where(Document.id.in_(document_ids))
                     .values(status={"state": "ready"})
                 )
                 await session.commit()
-                raise HTTPException(
-                    status_code=503,
-                    detail="Folder deleted but document cleanup could not be queued. Documents have been restored.",
-                ) from err
+            raise HTTPException(
+                status_code=503,
+                detail="Could not queue folder deletion. Documents have been restored.",
+            ) from err
 
         return {
-            "message": "Folder deleted successfully",
+            "message": "Folder deletion started",
             "documents_queued_for_deletion": len(document_ids),
         }
 
diff --git a/surfsense_backend/app/tasks/celery_tasks/document_tasks.py b/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
index 110f3deee..4701d9911 100644
--- a/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
+++ b/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
@@ -142,21 +142,30 @@ async def _delete_document_background(document_id: int) -> None:
     retry_backoff_max=300,
     max_retries=5,
 )
-def delete_folder_documents_task(self, document_ids: list[int]):
-    """Celery task to batch-delete documents orphaned by folder deletion."""
+def delete_folder_documents_task(
+    self,
+    document_ids: list[int],
+    folder_subtree_ids: list[int] | None = None,
+):
+    """Celery task to delete documents first, then the folder rows."""
     loop = asyncio.new_event_loop()
     asyncio.set_event_loop(loop)
     try:
-        loop.run_until_complete(_delete_folder_documents(document_ids))
+        loop.run_until_complete(
+            _delete_folder_documents(document_ids, folder_subtree_ids)
+        )
     finally:
         loop.close()
 
 
-async def _delete_folder_documents(document_ids: list[int]) -> None:
-    """Delete chunks in batches, then document rows for each orphaned document."""
+async def _delete_folder_documents(
+    document_ids: list[int],
+    folder_subtree_ids: list[int] | None = None,
+) -> None:
+    """Delete chunks in batches, then document rows, then folder rows."""
     from sqlalchemy import delete as sa_delete, select
 
-    from app.db import Chunk, Document
+    from app.db import Chunk, Document, Folder
 
     async with get_celery_session_maker()() as session:
         batch_size = 500
@@ -178,6 +187,12 @@ async def _delete_folder_documents(document_ids: list[int]) -> None:
                 await session.delete(doc)
                 await session.commit()
 
+        if folder_subtree_ids:
+            await session.execute(
+                sa_delete(Folder).where(Folder.id.in_(folder_subtree_ids))
+            )
+            await session.commit()
+
 
 @celery_app.task(
     name="delete_search_space_background",
diff --git a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
index f8b774d26..8dce68eeb 100644
--- a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
@@ -188,7 +188,12 @@ export function DocumentsSidebar({
 
 	const treeDocuments: DocumentNodeDoc[] = useMemo(() => {
 		const zeroDocs = (zeroAllDocs ?? [])
-			.filter((d) => d.title && d.title.trim() !== "")
+			.filter((d) => {
+				if (!d.title || d.title.trim() === "") return false;
+				const state = (d.status as { state?: string } | undefined)?.state;
+				if (state === "deleting") return false;
+				return true;
+			})
 			.map((d) => ({
 				id: d.id,
 				title: d.title,

From 62e698d8aae9e6f556203ab8b1e5949b1749a994 Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Thu, 2 Apr 2026 19:39:10 -0700
Subject: [PATCH 063/202] refactor: streamline document upload limits and
 enhance handling of mentioned documents

- Updated maximum file size limit to 500 MB per file.
- Removed restrictions on the number of files per upload and total upload size.
- Enhanced handling of user-mentioned documents in the knowledge base search middleware.
- Improved document reading and processing logic to accommodate new features and optimizations.
---
 .../versions/116_create_zero_publication.py   |    4 +-
 ..._optimize_zero_publication_column_lists.py |  102 +
 .../app/agents/new_chat/chat_deepagent.py     |    2 +
 .../agents/new_chat/middleware/filesystem.py  |   10 +
 .../new_chat/middleware/knowledge_search.py   |  178 +-
 .../app/routes/documents_routes.py            |  169 +-
 surfsense_backend/app/routes/editor_routes.py |  161 +-
 surfsense_backend/app/schemas/documents.py    |   11 +-
 .../app/tasks/chat/stream_new_chat.py         |  108 +-
 .../app/tasks/document_processors/__init__.py |   10 +-
 .../tasks/document_processors/_constants.py   |   74 +
 .../document_processors/_direct_converters.py |   90 +
 .../app/tasks/document_processors/_etl.py     |  209 ++
 .../app/tasks/document_processors/_helpers.py |  218 ++
 .../app/tasks/document_processors/_save.py    |  285 ++
 .../document_processors/file_processors.py    | 2753 ++++++-----------
 .../document_processors/markdown_processor.py |   81 +-
 .../document_upload/test_upload_limits.py     |   88 +-
 .../unit/middleware/test_knowledge_search.py  |    6 +-
 .../components/DocumentsTableShell.tsx        |   44 +-
 .../documents/(manage)/components/types.ts    |    2 +-
 .../components/editor-panel/editor-panel.tsx  |   72 +-
 .../layout/ui/tabs/DocumentTabContent.tsx     |   78 +-
 surfsense_web/components/markdown-viewer.tsx  |   12 +-
 .../new-chat/source-detail-panel.tsx          |  206 +-
 .../components/sources/DocumentUploadTab.tsx  |  180 +-
 .../contracts/types/document.types.ts         |   32 +
 .../lib/apis/documents-api.service.ts         |   42 +-
 surfsense_web/messages/en.json                |   21 +-
 surfsense_web/messages/es.json                |   21 +-
 surfsense_web/messages/hi.json                |   21 +-
 surfsense_web/messages/pt.json                |   21 +-
 surfsense_web/messages/zh.json                |   21 +-
 33 files changed, 2889 insertions(+), 2443 deletions(-)
 create mode 100644 surfsense_backend/alembic/versions/117_optimize_zero_publication_column_lists.py
 create mode 100644 surfsense_backend/app/tasks/document_processors/_constants.py
 create mode 100644 surfsense_backend/app/tasks/document_processors/_direct_converters.py
 create mode 100644 surfsense_backend/app/tasks/document_processors/_etl.py
 create mode 100644 surfsense_backend/app/tasks/document_processors/_helpers.py
 create mode 100644 surfsense_backend/app/tasks/document_processors/_save.py

diff --git a/surfsense_backend/alembic/versions/116_create_zero_publication.py b/surfsense_backend/alembic/versions/116_create_zero_publication.py
index 8f0d7b5d3..ff74952a9 100644
--- a/surfsense_backend/alembic/versions/116_create_zero_publication.py
+++ b/surfsense_backend/alembic/versions/116_create_zero_publication.py
@@ -42,9 +42,7 @@ def upgrade() -> None:
     if not exists:
         table_list = ", ".join(TABLES)
         conn.execute(
-            sa.text(
-                f"CREATE PUBLICATION {PUBLICATION_NAME} FOR TABLE {table_list}"
-            )
+            sa.text(f"CREATE PUBLICATION {PUBLICATION_NAME} FOR TABLE {table_list}")
         )
 
 
diff --git a/surfsense_backend/alembic/versions/117_optimize_zero_publication_column_lists.py b/surfsense_backend/alembic/versions/117_optimize_zero_publication_column_lists.py
new file mode 100644
index 000000000..3c2d34c76
--- /dev/null
+++ b/surfsense_backend/alembic/versions/117_optimize_zero_publication_column_lists.py
@@ -0,0 +1,102 @@
+"""optimize zero_publication with column lists
+
+Recreates the zero_publication using column lists for the documents
+table so that large text columns (content, source_markdown,
+blocknote_document, etc.) are excluded from WAL replication.
+This prevents RangeError: Invalid string length in zero-cache's
+change-streamer when documents have very large content.
+
+Also resets REPLICA IDENTITY to DEFAULT on tables that had it set
+to FULL for the old Electric SQL setup (migration 66/75/76).
+With DEFAULT (primary-key) identity, column-list publications
+only need to include the PK — not every column.
+
+After running this migration you MUST:
+  1. Stop zero-cache
+  2. Delete / reset the zero-cache data volume
+  3. Restart zero-cache  (it will do a fresh initial sync)
+
+Revision ID: 117
+Revises: 116
+"""
+
+from collections.abc import Sequence
+
+import sqlalchemy as sa
+
+from alembic import op
+
+revision: str = "117"
+down_revision: str | None = "116"
+branch_labels: str | Sequence[str] | None = None
+depends_on: str | Sequence[str] | None = None
+
+PUBLICATION_NAME = "zero_publication"
+
+TABLES_WITH_FULL_IDENTITY = [
+    "documents",
+    "notifications",
+    "search_source_connectors",
+    "new_chat_messages",
+    "chat_comments",
+    "chat_session_state",
+]
+
+DOCUMENT_COLS = [
+    "id",
+    "title",
+    "document_type",
+    "search_space_id",
+    "folder_id",
+    "created_by_id",
+    "status",
+    "created_at",
+    "updated_at",
+]
+
+PUBLICATION_DDL_FULL = f"""\
+CREATE PUBLICATION {PUBLICATION_NAME} FOR TABLE
+  notifications, documents, folders,
+  search_source_connectors, new_chat_messages,
+  chat_comments, chat_session_state
+"""
+
+
+def upgrade() -> None:
+    conn = op.get_bind()
+
+    for tbl in TABLES_WITH_FULL_IDENTITY:
+        conn.execute(sa.text(f'ALTER TABLE "{tbl}" REPLICA IDENTITY DEFAULT'))
+
+    conn.execute(sa.text(f"DROP PUBLICATION IF EXISTS {PUBLICATION_NAME}"))
+
+    has_zero_ver = conn.execute(
+        sa.text(
+            "SELECT 1 FROM information_schema.columns "
+            "WHERE table_name = 'documents' AND column_name = '_0_version'"
+        )
+    ).fetchone()
+
+    cols = DOCUMENT_COLS + (['"_0_version"'] if has_zero_ver else [])
+    col_list = ", ".join(cols)
+
+    conn.execute(
+        sa.text(
+            f"CREATE PUBLICATION {PUBLICATION_NAME} FOR TABLE "
+            f"notifications, "
+            f"documents ({col_list}), "
+            f"folders, "
+            f"search_source_connectors, "
+            f"new_chat_messages, "
+            f"chat_comments, "
+            f"chat_session_state"
+        )
+    )
+
+
+def downgrade() -> None:
+    conn = op.get_bind()
+    conn.execute(sa.text(f"DROP PUBLICATION IF EXISTS {PUBLICATION_NAME}"))
+    conn.execute(sa.text(PUBLICATION_DDL_FULL))
+    for tbl in TABLES_WITH_FULL_IDENTITY:
+        conn.execute(sa.text(f'ALTER TABLE "{tbl}" REPLICA IDENTITY FULL'))
diff --git a/surfsense_backend/app/agents/new_chat/chat_deepagent.py b/surfsense_backend/app/agents/new_chat/chat_deepagent.py
index ccc06f272..fc1e80d28 100644
--- a/surfsense_backend/app/agents/new_chat/chat_deepagent.py
+++ b/surfsense_backend/app/agents/new_chat/chat_deepagent.py
@@ -159,6 +159,7 @@ async def create_surfsense_deep_agent(
     additional_tools: Sequence[BaseTool] | None = None,
     firecrawl_api_key: str | None = None,
     thread_visibility: ChatVisibility | None = None,
+    mentioned_document_ids: list[int] | None = None,
 ):
     """
     Create a SurfSense deep agent with configurable tools and prompts.
@@ -451,6 +452,7 @@ async def create_surfsense_deep_agent(
             search_space_id=search_space_id,
             available_connectors=available_connectors,
             available_document_types=available_document_types,
+            mentioned_document_ids=mentioned_document_ids,
         ),
         SurfSenseFilesystemMiddleware(
             search_space_id=search_space_id,
diff --git a/surfsense_backend/app/agents/new_chat/middleware/filesystem.py b/surfsense_backend/app/agents/new_chat/middleware/filesystem.py
index 41b24f88b..d7697ef15 100644
--- a/surfsense_backend/app/agents/new_chat/middleware/filesystem.py
+++ b/surfsense_backend/app/agents/new_chat/middleware/filesystem.py
@@ -66,6 +66,16 @@ the `<chunk_index>`, identify chunks marked `matched="true"`, then use
 those sections instead of reading the entire file sequentially.
 
 Use `<chunk id='...'>` values as citation IDs in your answers.
+
+## User-Mentioned Documents
+
+When the `ls` output tags a file with `[MENTIONED BY USER — read deeply]`,
+the user **explicitly selected** that document. These files are your highest-
+priority sources:
+1. **Always read them thoroughly** — scan the full `<chunk_index>`, then read
+   all major sections, not just matched chunks.
+2. **Prefer their content** over other search results when answering.
+3. **Cite from them first** whenever applicable.
 """
 
 # =============================================================================
diff --git a/surfsense_backend/app/agents/new_chat/middleware/knowledge_search.py b/surfsense_backend/app/agents/new_chat/middleware/knowledge_search.py
index 3728f229c..7b0dd2f71 100644
--- a/surfsense_backend/app/agents/new_chat/middleware/knowledge_search.py
+++ b/surfsense_backend/app/agents/new_chat/middleware/knowledge_search.py
@@ -28,7 +28,13 @@ from sqlalchemy import select
 from sqlalchemy.ext.asyncio import AsyncSession
 
 from app.agents.new_chat.utils import parse_date_or_datetime, resolve_date_range
-from app.db import NATIVE_TO_LEGACY_DOCTYPE, Document, Folder, shielded_async_session
+from app.db import (
+    NATIVE_TO_LEGACY_DOCTYPE,
+    Chunk,
+    Document,
+    Folder,
+    shielded_async_session,
+)
 from app.retriever.chunks_hybrid_search import ChucksHybridSearchRetriever
 from app.utils.document_converters import embed_texts
 from app.utils.perf import get_perf_logger
@@ -430,21 +436,36 @@ async def _get_folder_paths(
 def _build_synthetic_ls(
     existing_files: dict[str, Any] | None,
     new_files: dict[str, Any],
+    *,
+    mentioned_paths: set[str] | None = None,
 ) -> tuple[AIMessage, ToolMessage]:
     """Build a synthetic ls("/documents") tool-call + result for the LLM context.
 
-    Paths are listed with *new* (rank-ordered) files first, then existing files
-    that were already in state from prior turns.
+    Mentioned files are listed first.  A separate header tells the LLM which
+    files the user explicitly selected; the path list itself stays clean so
+    paths can be passed directly to ``read_file`` without stripping tags.
     """
+    _mentioned = mentioned_paths or set()
     merged: dict[str, Any] = {**(existing_files or {}), **new_files}
     doc_paths = [
         p for p, v in merged.items() if p.startswith("/documents/") and v is not None
     ]
 
     new_set = set(new_files)
-    new_paths = [p for p in doc_paths if p in new_set]
+    mentioned_list = [p for p in doc_paths if p in _mentioned]
+    new_non_mentioned = [p for p in doc_paths if p in new_set and p not in _mentioned]
     old_paths = [p for p in doc_paths if p not in new_set]
-    ordered = new_paths + old_paths
+    ordered = mentioned_list + new_non_mentioned + old_paths
+
+    parts: list[str] = []
+    if mentioned_list:
+        parts.append(
+            "USER-MENTIONED documents (read these thoroughly before answering):"
+        )
+        for p in mentioned_list:
+            parts.append(f"  {p}")
+        parts.append("")
+    parts.append(str(ordered) if ordered else "No documents found.")
 
     tool_call_id = f"auto_ls_{uuid.uuid4().hex[:12]}"
     ai_msg = AIMessage(
@@ -452,7 +473,7 @@ def _build_synthetic_ls(
         tool_calls=[{"name": "ls", "args": {"path": "/documents"}, "id": tool_call_id}],
     )
     tool_msg = ToolMessage(
-        content=str(ordered) if ordered else "No documents found.",
+        content="\n".join(parts),
         tool_call_id=tool_call_id,
     )
     return ai_msg, tool_msg
@@ -524,12 +545,92 @@ async def search_knowledge_base(
     return results[:top_k]
 
 
+async def fetch_mentioned_documents(
+    *,
+    document_ids: list[int],
+    search_space_id: int,
+) -> list[dict[str, Any]]:
+    """Fetch explicitly mentioned documents with *all* their chunks.
+
+    Returns the same dict structure as ``search_knowledge_base`` so results
+    can be merged directly into ``build_scoped_filesystem``.  Unlike search
+    results, every chunk is included (no top-K limiting) and none are marked
+    as ``matched`` since the entire document is relevant by virtue of the
+    user's explicit mention.
+    """
+    if not document_ids:
+        return []
+
+    async with shielded_async_session() as session:
+        doc_result = await session.execute(
+            select(Document).where(
+                Document.id.in_(document_ids),
+                Document.search_space_id == search_space_id,
+            )
+        )
+        docs = {doc.id: doc for doc in doc_result.scalars().all()}
+
+        if not docs:
+            return []
+
+        chunk_result = await session.execute(
+            select(Chunk.id, Chunk.content, Chunk.document_id)
+            .where(Chunk.document_id.in_(list(docs.keys())))
+            .order_by(Chunk.document_id, Chunk.id)
+        )
+        chunks_by_doc: dict[int, list[dict[str, Any]]] = {doc_id: [] for doc_id in docs}
+        for row in chunk_result.all():
+            if row.document_id in chunks_by_doc:
+                chunks_by_doc[row.document_id].append(
+                    {"chunk_id": row.id, "content": row.content}
+                )
+
+    results: list[dict[str, Any]] = []
+    for doc_id in document_ids:
+        doc = docs.get(doc_id)
+        if doc is None:
+            continue
+        metadata = doc.document_metadata or {}
+        results.append(
+            {
+                "document_id": doc.id,
+                "content": "",
+                "score": 1.0,
+                "chunks": chunks_by_doc.get(doc.id, []),
+                "matched_chunk_ids": [],
+                "document": {
+                    "id": doc.id,
+                    "title": doc.title,
+                    "document_type": (
+                        doc.document_type.value
+                        if getattr(doc, "document_type", None)
+                        else None
+                    ),
+                    "metadata": metadata,
+                },
+                "source": (
+                    doc.document_type.value
+                    if getattr(doc, "document_type", None)
+                    else None
+                ),
+                "_user_mentioned": True,
+            }
+        )
+    return results
+
+
 async def build_scoped_filesystem(
     *,
     documents: Sequence[dict[str, Any]],
     search_space_id: int,
-) -> dict[str, dict[str, str]]:
-    """Build a StateBackend-compatible files dict from search results."""
+) -> tuple[dict[str, dict[str, str]], dict[int, str]]:
+    """Build a StateBackend-compatible files dict from search results.
+
+    Returns ``(files, doc_id_to_path)`` so callers can reliably map a
+    document id back to its filesystem path without guessing by title.
+    Paths are collision-proof: when two documents resolve to the same
+    path the doc-id is appended to disambiguate.
+    """
     async with shielded_async_session() as session:
         folder_paths = await _get_folder_paths(session, search_space_id)
         doc_ids = [
@@ -551,6 +652,7 @@ async def build_scoped_filesystem(
             }
 
     files: dict[str, dict[str, str]] = {}
+    doc_id_to_path: dict[int, str] = {}
     for document in documents:
         doc_meta = document.get("document") or {}
         title = str(doc_meta.get("title") or "untitled")
@@ -559,6 +661,9 @@ async def build_scoped_filesystem(
         base_folder = folder_paths.get(folder_id, "/documents")
         file_name = _safe_filename(title)
         path = f"{base_folder}/{file_name}"
+        if path in files:
+            stem = file_name.removesuffix(".xml")
+            path = f"{base_folder}/{stem} ({doc_id}).xml"
         matched_ids = set(document.get("matched_chunk_ids") or [])
         xml_content = _build_document_xml(document, matched_chunk_ids=matched_ids)
         files[path] = {
@@ -567,7 +672,9 @@ async def build_scoped_filesystem(
             "created_at": "",
             "modified_at": "",
         }
-    return files
+        if isinstance(doc_id, int):
+            doc_id_to_path[doc_id] = path
+    return files, doc_id_to_path
 
 
 class KnowledgeBaseSearchMiddleware(AgentMiddleware):  # type: ignore[type-arg]
@@ -583,12 +690,14 @@ class KnowledgeBaseSearchMiddleware(AgentMiddleware):  # type: ignore[type-arg]
         available_connectors: list[str] | None = None,
         available_document_types: list[str] | None = None,
         top_k: int = 10,
+        mentioned_document_ids: list[int] | None = None,
     ) -> None:
         self.llm = llm
         self.search_space_id = search_space_id
         self.available_connectors = available_connectors
         self.available_document_types = available_document_types
         self.top_k = top_k
+        self.mentioned_document_ids = mentioned_document_ids or []
 
     async def _plan_search_inputs(
         self,
@@ -680,6 +789,18 @@ class KnowledgeBaseSearchMiddleware(AgentMiddleware):  # type: ignore[type-arg]
             user_text=user_text,
         )
 
+        # --- 1. Fetch mentioned documents (user-selected, all chunks) ---
+        mentioned_results: list[dict[str, Any]] = []
+        if self.mentioned_document_ids:
+            mentioned_results = await fetch_mentioned_documents(
+                document_ids=self.mentioned_document_ids,
+                search_space_id=self.search_space_id,
+            )
+            # Clear after first turn so they are not re-fetched on subsequent
+            # messages within the same agent instance.
+            self.mentioned_document_ids = []
+
+        # --- 2. Run KB hybrid search ---
         search_results = await search_knowledge_base(
             query=planned_query,
             search_space_id=self.search_space_id,
@@ -689,19 +810,50 @@ class KnowledgeBaseSearchMiddleware(AgentMiddleware):  # type: ignore[type-arg]
             start_date=start_date,
             end_date=end_date,
         )
-        new_files = await build_scoped_filesystem(
-            documents=search_results,
+
+        # --- 3. Merge: mentioned first, then search (dedup by doc id) ---
+        seen_doc_ids: set[int] = set()
+        merged: list[dict[str, Any]] = []
+        for doc in mentioned_results:
+            doc_id = (doc.get("document") or {}).get("id")
+            if doc_id is not None:
+                seen_doc_ids.add(doc_id)
+            merged.append(doc)
+        for doc in search_results:
+            doc_id = (doc.get("document") or {}).get("id")
+            if doc_id is not None and doc_id in seen_doc_ids:
+                continue
+            merged.append(doc)
+
+        # --- 4. Build scoped filesystem ---
+        new_files, doc_id_to_path = await build_scoped_filesystem(
+            documents=merged,
             search_space_id=self.search_space_id,
         )
 
-        ai_msg, tool_msg = _build_synthetic_ls(existing_files, new_files)
+        # Identify which paths belong to user-mentioned documents using
+        # the authoritative doc_id -> path mapping (no title guessing).
+        mentioned_doc_ids = {
+            (d.get("document") or {}).get("id") for d in mentioned_results
+        }
+        mentioned_paths = {
+            doc_id_to_path[did] for did in mentioned_doc_ids if did in doc_id_to_path
+        }
+
+        ai_msg, tool_msg = _build_synthetic_ls(
+            existing_files,
+            new_files,
+            mentioned_paths=mentioned_paths,
+        )
 
         if t0 is not None:
             _perf_log.info(
-                "[kb_fs_middleware] completed in %.3fs query=%r optimized=%r new_files=%d total=%d",
+                "[kb_fs_middleware] completed in %.3fs query=%r optimized=%r "
+                "mentioned=%d new_files=%d total=%d",
                 asyncio.get_event_loop().time() - t0,
                 user_text[:80],
                 planned_query[:120],
+                len(mentioned_results),
                 len(new_files),
                 len(new_files) + len(existing_files or {}),
             )
diff --git a/surfsense_backend/app/routes/documents_routes.py b/surfsense_backend/app/routes/documents_routes.py
index 6e69218f1..f53c81bb6 100644
--- a/surfsense_backend/app/routes/documents_routes.py
+++ b/surfsense_backend/app/routes/documents_routes.py
@@ -1,7 +1,7 @@
 # Force asyncio to use standard event loop before unstructured imports
 import asyncio
 
-from fastapi import APIRouter, Depends, Form, HTTPException, UploadFile
+from fastapi import APIRouter, Depends, Form, HTTPException, Query, UploadFile
 from sqlalchemy.ext.asyncio import AsyncSession
 from sqlalchemy.future import select
 from sqlalchemy.orm import selectinload
@@ -17,6 +17,7 @@ from app.db import (
     get_async_session,
 )
 from app.schemas import (
+    ChunkRead,
     DocumentRead,
     DocumentsCreate,
     DocumentStatusBatchResponse,
@@ -45,9 +46,7 @@ os.environ["UNSTRUCTURED_HAS_PATCHED_LOOP"] = "1"
 
 router = APIRouter()
 
-MAX_FILES_PER_UPLOAD = 10
-MAX_FILE_SIZE_BYTES = 50 * 1024 * 1024  # 50 MB per file
-MAX_TOTAL_SIZE_BYTES = 200 * 1024 * 1024  # 200 MB total
+MAX_FILE_SIZE_BYTES = 500 * 1024 * 1024  # 500 MB per file
 
 
 @router.post("/documents")
@@ -156,13 +155,6 @@ async def create_documents_file_upload(
         if not files:
             raise HTTPException(status_code=400, detail="No files provided")
 
-        if len(files) > MAX_FILES_PER_UPLOAD:
-            raise HTTPException(
-                status_code=413,
-                detail=f"Too many files. Maximum {MAX_FILES_PER_UPLOAD} files per upload.",
-            )
-
-        total_size = 0
         for file in files:
             file_size = file.size or 0
             if file_size > MAX_FILE_SIZE_BYTES:
@@ -171,14 +163,6 @@ async def create_documents_file_upload(
                     detail=f"File '{file.filename}' ({file_size / (1024 * 1024):.1f} MB) "
                     f"exceeds the {MAX_FILE_SIZE_BYTES // (1024 * 1024)} MB per-file limit.",
                 )
-            total_size += file_size
-
-        if total_size > MAX_TOTAL_SIZE_BYTES:
-            raise HTTPException(
-                status_code=413,
-                detail=f"Total upload size ({total_size / (1024 * 1024):.1f} MB) "
-                f"exceeds the {MAX_TOTAL_SIZE_BYTES // (1024 * 1024)} MB limit.",
-            )
 
         # ===== Read all files concurrently to avoid blocking the event loop =====
         async def _read_and_save(file: UploadFile) -> tuple[str, str, int]:
@@ -206,16 +190,6 @@ async def create_documents_file_upload(
 
         saved_files = await asyncio.gather(*(_read_and_save(f) for f in files))
 
-        actual_total_size = sum(size for _, _, size in saved_files)
-        if actual_total_size > MAX_TOTAL_SIZE_BYTES:
-            for temp_path, _, _ in saved_files:
-                os.unlink(temp_path)
-            raise HTTPException(
-                status_code=413,
-                detail=f"Total upload size ({actual_total_size / (1024 * 1024):.1f} MB) "
-                f"exceeds the {MAX_TOTAL_SIZE_BYTES // (1024 * 1024)} MB limit.",
-            )
-
         # ===== PHASE 1: Create pending documents for all files =====
         created_documents: list[Document] = []
         files_to_process: list[tuple[Document, str, str]] = []
@@ -451,13 +425,15 @@ async def read_documents(
                     reason=doc.status.get("reason"),
                 )
 
+            raw_content = doc.content or ""
             api_documents.append(
                 DocumentRead(
                     id=doc.id,
                     title=doc.title,
                     document_type=doc.document_type,
                     document_metadata=doc.document_metadata,
-                    content=doc.content,
+                    content="",
+                    content_preview=raw_content[:300],
                     content_hash=doc.content_hash,
                     unique_identifier_hash=doc.unique_identifier_hash,
                     created_at=doc.created_at,
@@ -609,13 +585,15 @@ async def search_documents(
                     reason=doc.status.get("reason"),
                 )
 
+            raw_content = doc.content or ""
             api_documents.append(
                 DocumentRead(
                     id=doc.id,
                     title=doc.title,
                     document_type=doc.document_type,
                     document_metadata=doc.document_metadata,
-                    content=doc.content,
+                    content="",
+                    content_preview=raw_content[:300],
                     content_hash=doc.content_hash,
                     unique_identifier_hash=doc.unique_identifier_hash,
                     created_at=doc.created_at,
@@ -884,16 +862,19 @@ async def get_document_type_counts(
 @router.get("/documents/by-chunk/{chunk_id}", response_model=DocumentWithChunksRead)
 async def get_document_by_chunk_id(
     chunk_id: int,
+    chunk_window: int = Query(
+        5, ge=0, description="Number of chunks before/after the cited chunk to include"
+    ),
     session: AsyncSession = Depends(get_async_session),
     user: User = Depends(current_active_user),
 ):
     """
-    Retrieves a document based on a chunk ID, including all its chunks ordered by creation time.
-    Requires DOCUMENTS_READ permission for the search space.
-    The document's embedding and chunk embeddings are excluded from the response.
+    Retrieves a document based on a chunk ID, including a window of chunks around the cited one.
+    Uses SQL-level pagination to avoid loading all chunks into memory.
     """
     try:
-        # First, get the chunk and verify it exists
+        from sqlalchemy import and_, func, or_
+
         chunk_result = await session.execute(select(Chunk).filter(Chunk.id == chunk_id))
         chunk = chunk_result.scalars().first()
 
@@ -902,11 +883,8 @@ async def get_document_by_chunk_id(
                 status_code=404, detail=f"Chunk with id {chunk_id} not found"
             )
 
-        # Get the associated document
         document_result = await session.execute(
-            select(Document)
-            .options(selectinload(Document.chunks))
-            .filter(Document.id == chunk.document_id)
+            select(Document).filter(Document.id == chunk.document_id)
         )
         document = document_result.scalars().first()
 
@@ -916,7 +894,6 @@ async def get_document_by_chunk_id(
                 detail="Document not found",
             )
 
-        # Check permission for the search space
         await check_permission(
             session,
             user,
@@ -925,10 +902,38 @@ async def get_document_by_chunk_id(
             "You don't have permission to read documents in this search space",
         )
 
-        # Sort chunks by creation time
-        sorted_chunks = sorted(document.chunks, key=lambda x: x.created_at)
+        total_result = await session.execute(
+            select(func.count())
+            .select_from(Chunk)
+            .filter(Chunk.document_id == document.id)
+        )
+        total_chunks = total_result.scalar() or 0
+
+        cited_idx_result = await session.execute(
+            select(func.count())
+            .select_from(Chunk)
+            .filter(
+                Chunk.document_id == document.id,
+                or_(
+                    Chunk.created_at < chunk.created_at,
+                    and_(Chunk.created_at == chunk.created_at, Chunk.id < chunk.id),
+                ),
+            )
+        )
+        cited_idx = cited_idx_result.scalar() or 0
+
+        start = max(0, cited_idx - chunk_window)
+        end = min(total_chunks, cited_idx + chunk_window + 1)
+
+        windowed_result = await session.execute(
+            select(Chunk)
+            .filter(Chunk.document_id == document.id)
+            .order_by(Chunk.created_at, Chunk.id)
+            .offset(start)
+            .limit(end - start)
+        )
+        windowed_chunks = windowed_result.scalars().all()
 
-        # Return the document with its chunks
         return DocumentWithChunksRead(
             id=document.id,
             title=document.title,
@@ -940,7 +945,9 @@ async def get_document_by_chunk_id(
             created_at=document.created_at,
             updated_at=document.updated_at,
             search_space_id=document.search_space_id,
-            chunks=sorted_chunks,
+            chunks=windowed_chunks,
+            total_chunks=total_chunks,
+            chunk_start_index=start,
         )
     except HTTPException:
         raise
@@ -950,6 +957,75 @@ async def get_document_by_chunk_id(
         ) from e
 
 
+@router.get(
+    "/documents/{document_id}/chunks",
+    response_model=PaginatedResponse[ChunkRead],
+)
+async def get_document_chunks_paginated(
+    document_id: int,
+    page: int = Query(0, ge=0),
+    page_size: int = Query(20, ge=1, le=100),
+    start_offset: int | None = Query(
+        None, ge=0, description="Direct offset; overrides page * page_size"
+    ),
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """
+    Paginated chunk loading for a document.
+    Supports both page-based and offset-based access.
+    """
+    try:
+        from sqlalchemy import func
+
+        doc_result = await session.execute(
+            select(Document).filter(Document.id == document_id)
+        )
+        document = doc_result.scalars().first()
+
+        if not document:
+            raise HTTPException(status_code=404, detail="Document not found")
+
+        await check_permission(
+            session,
+            user,
+            document.search_space_id,
+            Permission.DOCUMENTS_READ.value,
+            "You don't have permission to read documents in this search space",
+        )
+
+        total_result = await session.execute(
+            select(func.count())
+            .select_from(Chunk)
+            .filter(Chunk.document_id == document_id)
+        )
+        total = total_result.scalar() or 0
+
+        offset = start_offset if start_offset is not None else page * page_size
+        chunks_result = await session.execute(
+            select(Chunk)
+            .filter(Chunk.document_id == document_id)
+            .order_by(Chunk.created_at, Chunk.id)
+            .offset(offset)
+            .limit(page_size)
+        )
+        chunks = chunks_result.scalars().all()
+
+        return PaginatedResponse(
+            items=chunks,
+            total=total,
+            page=offset // page_size if page_size else page,
+            page_size=page_size,
+            has_more=(offset + len(chunks)) < total,
+        )
+    except HTTPException:
+        raise
+    except Exception as e:
+        raise HTTPException(
+            status_code=500, detail=f"Failed to fetch chunks: {e!s}"
+        ) from e
+
+
 @router.get("/documents/{document_id}", response_model=DocumentRead)
 async def read_document(
     document_id: int,
@@ -980,13 +1056,14 @@ async def read_document(
             "You don't have permission to read documents in this search space",
         )
 
-        # Convert database object to API-friendly format
+        raw_content = document.content or ""
         return DocumentRead(
             id=document.id,
             title=document.title,
             document_type=document.document_type,
             document_metadata=document.document_metadata,
-            content=document.content,
+            content=raw_content,
+            content_preview=raw_content[:300],
             content_hash=document.content_hash,
             unique_identifier_hash=document.unique_identifier_hash,
             created_at=document.created_at,
diff --git a/surfsense_backend/app/routes/editor_routes.py b/surfsense_backend/app/routes/editor_routes.py
index f54f18def..09a35c619 100644
--- a/surfsense_backend/app/routes/editor_routes.py
+++ b/surfsense_backend/app/routes/editor_routes.py
@@ -15,11 +15,10 @@ import pypandoc
 import typst
 from fastapi import APIRouter, Depends, HTTPException, Query
 from fastapi.responses import StreamingResponse
-from sqlalchemy import select
+from sqlalchemy import func, select
 from sqlalchemy.ext.asyncio import AsyncSession
-from sqlalchemy.orm import selectinload
 
-from app.db import Document, DocumentType, Permission, User, get_async_session
+from app.db import Chunk, Document, DocumentType, Permission, User, get_async_session
 from app.routes.reports_routes import (
     _FILE_EXTENSIONS,
     _MEDIA_TYPES,
@@ -44,6 +43,9 @@ router = APIRouter()
 async def get_editor_content(
     search_space_id: int,
     document_id: int,
+    max_length: int | None = Query(
+        None, description="Truncate source_markdown to this many characters"
+    ),
     session: AsyncSession = Depends(get_async_session),
     user: User = Depends(current_active_user),
 ):
@@ -65,9 +67,7 @@ async def get_editor_content(
     )
 
     result = await session.execute(
-        select(Document)
-        .options(selectinload(Document.chunks))
-        .filter(
+        select(Document).filter(
             Document.id == document_id,
             Document.search_space_id == search_space_id,
         )
@@ -77,62 +77,63 @@ async def get_editor_content(
     if not document:
         raise HTTPException(status_code=404, detail="Document not found")
 
-    # Priority 1: Return source_markdown if it exists (check `is not None` to allow empty strings)
-    if document.source_markdown is not None:
+    count_result = await session.execute(
+        select(func.count()).select_from(Chunk).filter(Chunk.document_id == document_id)
+    )
+    chunk_count = count_result.scalar() or 0
+
+    def _build_response(md: str) -> dict:
+        size_bytes = len(md.encode("utf-8"))
+        truncated = False
+        output_md = md
+        if max_length is not None and size_bytes > max_length:
+            output_md = md[:max_length]
+            truncated = True
         return {
             "document_id": document.id,
             "title": document.title,
             "document_type": document.document_type.value,
-            "source_markdown": document.source_markdown,
+            "source_markdown": output_md,
+            "content_size_bytes": size_bytes,
+            "chunk_count": chunk_count,
+            "truncated": truncated,
             "updated_at": document.updated_at.isoformat()
             if document.updated_at
             else None,
         }
 
-    # Priority 2: Lazy-migrate from blocknote_document (pure Python, no external deps)
+    if document.source_markdown is not None:
+        return _build_response(document.source_markdown)
+
     if document.blocknote_document:
         from app.utils.blocknote_to_markdown import blocknote_to_markdown
 
         markdown = blocknote_to_markdown(document.blocknote_document)
         if markdown:
-            # Persist the migration so we don't repeat it
             document.source_markdown = markdown
             await session.commit()
-            return {
-                "document_id": document.id,
-                "title": document.title,
-                "document_type": document.document_type.value,
-                "source_markdown": markdown,
-                "updated_at": document.updated_at.isoformat()
-                if document.updated_at
-                else None,
-            }
+            return _build_response(markdown)
 
-    # Priority 3: For NOTE type with no content, return empty markdown
     if document.document_type == DocumentType.NOTE:
         empty_markdown = ""
         document.source_markdown = empty_markdown
         await session.commit()
-        return {
-            "document_id": document.id,
-            "title": document.title,
-            "document_type": document.document_type.value,
-            "source_markdown": empty_markdown,
-            "updated_at": document.updated_at.isoformat()
-            if document.updated_at
-            else None,
-        }
+        return _build_response(empty_markdown)
 
-    # Priority 4: Reconstruct from chunks
-    chunks = sorted(document.chunks, key=lambda c: c.id)
+    chunk_contents_result = await session.execute(
+        select(Chunk.content)
+        .filter(Chunk.document_id == document_id)
+        .order_by(Chunk.id)
+    )
+    chunk_contents = chunk_contents_result.scalars().all()
 
-    if not chunks:
+    if not chunk_contents:
         raise HTTPException(
             status_code=400,
             detail="This document has no content and cannot be edited. Please re-upload to enable editing.",
         )
 
-    markdown_content = "\n\n".join(chunk.content for chunk in chunks)
+    markdown_content = "\n\n".join(chunk_contents)
 
     if not markdown_content.strip():
         raise HTTPException(
@@ -140,17 +141,77 @@ async def get_editor_content(
             detail="This document has empty content and cannot be edited.",
         )
 
-    # Persist the lazy migration
     document.source_markdown = markdown_content
     await session.commit()
 
-    return {
-        "document_id": document.id,
-        "title": document.title,
-        "document_type": document.document_type.value,
-        "source_markdown": markdown_content,
-        "updated_at": document.updated_at.isoformat() if document.updated_at else None,
-    }
+    return _build_response(markdown_content)
+
+
+@router.get(
+    "/search-spaces/{search_space_id}/documents/{document_id}/download-markdown"
+)
+async def download_document_markdown(
+    search_space_id: int,
+    document_id: int,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """
+    Download the full document content as a .md file.
+    Reconstructs markdown from source_markdown or chunks.
+    """
+    await check_permission(
+        session,
+        user,
+        search_space_id,
+        Permission.DOCUMENTS_READ.value,
+        "You don't have permission to read documents in this search space",
+    )
+
+    result = await session.execute(
+        select(Document).filter(
+            Document.id == document_id,
+            Document.search_space_id == search_space_id,
+        )
+    )
+    document = result.scalars().first()
+
+    if not document:
+        raise HTTPException(status_code=404, detail="Document not found")
+
+    markdown: str | None = document.source_markdown
+    if markdown is None and document.blocknote_document:
+        from app.utils.blocknote_to_markdown import blocknote_to_markdown
+
+        markdown = blocknote_to_markdown(document.blocknote_document)
+    if markdown is None:
+        chunk_contents_result = await session.execute(
+            select(Chunk.content)
+            .filter(Chunk.document_id == document_id)
+            .order_by(Chunk.id)
+        )
+        chunk_contents = chunk_contents_result.scalars().all()
+        if chunk_contents:
+            markdown = "\n\n".join(chunk_contents)
+
+    if not markdown or not markdown.strip():
+        raise HTTPException(
+            status_code=400, detail="Document has no content to download"
+        )
+
+    safe_title = (
+        "".join(
+            c if c.isalnum() or c in " -_" else "_"
+            for c in (document.title or "document")
+        ).strip()[:80]
+        or "document"
+    )
+
+    return StreamingResponse(
+        io.BytesIO(markdown.encode("utf-8")),
+        media_type="text/markdown; charset=utf-8",
+        headers={"Content-Disposition": f'attachment; filename="{safe_title}.md"'},
+    )
 
 
 @router.post("/search-spaces/{search_space_id}/documents/{document_id}/save")
@@ -258,9 +319,7 @@ async def export_document(
     )
 
     result = await session.execute(
-        select(Document)
-        .options(selectinload(Document.chunks))
-        .filter(
+        select(Document).filter(
             Document.id == document_id,
             Document.search_space_id == search_space_id,
         )
@@ -269,16 +328,20 @@ async def export_document(
     if not document:
         raise HTTPException(status_code=404, detail="Document not found")
 
-    # Resolve markdown content (same priority as editor-content endpoint)
     markdown_content: str | None = document.source_markdown
     if markdown_content is None and document.blocknote_document:
         from app.utils.blocknote_to_markdown import blocknote_to_markdown
 
         markdown_content = blocknote_to_markdown(document.blocknote_document)
     if markdown_content is None:
-        chunks = sorted(document.chunks, key=lambda c: c.id)
-        if chunks:
-            markdown_content = "\n\n".join(chunk.content for chunk in chunks)
+        chunk_contents_result = await session.execute(
+            select(Chunk.content)
+            .filter(Chunk.document_id == document_id)
+            .order_by(Chunk.id)
+        )
+        chunk_contents = chunk_contents_result.scalars().all()
+        if chunk_contents:
+            markdown_content = "\n\n".join(chunk_contents)
 
     if not markdown_content or not markdown_content.strip():
         raise HTTPException(status_code=400, detail="Document has no content to export")
diff --git a/surfsense_backend/app/schemas/documents.py b/surfsense_backend/app/schemas/documents.py
index c022a09d2..49d2836b2 100644
--- a/surfsense_backend/app/schemas/documents.py
+++ b/surfsense_backend/app/schemas/documents.py
@@ -53,25 +53,26 @@ class DocumentRead(BaseModel):
     title: str
     document_type: DocumentType
     document_metadata: dict
-    content: str  # Changed to string to match frontend
+    content: str = ""
+    content_preview: str = ""
     content_hash: str
     unique_identifier_hash: str | None
     created_at: datetime
     updated_at: datetime | None
     search_space_id: int
     folder_id: int | None = None
-    created_by_id: UUID | None = None  # User who created/uploaded this document
+    created_by_id: UUID | None = None
     created_by_name: str | None = None
     created_by_email: str | None = None
-    status: DocumentStatusSchema | None = (
-        None  # Processing status (ready, processing, failed)
-    )
+    status: DocumentStatusSchema | None = None
 
     model_config = ConfigDict(from_attributes=True)
 
 
 class DocumentWithChunksRead(DocumentRead):
     chunks: list[ChunkRead] = []
+    total_chunks: int = 0
+    chunk_start_index: int = 0
 
     model_config = ConfigDict(from_attributes=True)
 
diff --git a/surfsense_backend/app/tasks/chat/stream_new_chat.py b/surfsense_backend/app/tasks/chat/stream_new_chat.py
index 7c1e3b7ea..5ff907459 100644
--- a/surfsense_backend/app/tasks/chat/stream_new_chat.py
+++ b/surfsense_backend/app/tasks/chat/stream_new_chat.py
@@ -39,7 +39,6 @@ from app.agents.new_chat.llm_config import (
 )
 from app.db import (
     ChatVisibility,
-    Document,
     NewChatMessage,
     NewChatThread,
     Report,
@@ -63,74 +62,6 @@ _perf_log = get_perf_logger()
 _background_tasks: set[asyncio.Task] = set()
 
 
-def format_mentioned_documents_as_context(documents: list[Document]) -> str:
-    """
-    Format mentioned documents as context for the agent.
-
-    Uses the same XML structure as knowledge_base.format_documents_for_context
-    to ensure citations work properly with chunk IDs.
-    """
-    if not documents:
-        return ""
-
-    context_parts = ["<mentioned_documents>"]
-    context_parts.append(
-        "The user has explicitly mentioned the following documents from their knowledge base. "
-        "These documents are directly relevant to the query and should be prioritized as primary sources. "
-        "Use [citation:CHUNK_ID] format for citations (e.g., [citation:123])."
-    )
-    context_parts.append("")
-
-    for doc in documents:
-        # Build metadata JSON
-        metadata = doc.document_metadata or {}
-        metadata_json = json.dumps(metadata, ensure_ascii=False)
-
-        # Get URL from metadata
-        url = (
-            metadata.get("url")
-            or metadata.get("source")
-            or metadata.get("page_url")
-            or ""
-        )
-
-        context_parts.append("<document>")
-        context_parts.append("<document_metadata>")
-        context_parts.append(f"  <document_id>{doc.id}</document_id>")
-        context_parts.append(
-            f"  <document_type>{doc.document_type.value}</document_type>"
-        )
-        context_parts.append(f"  <title><![CDATA[{doc.title}]]></title>")
-        context_parts.append(f"  <url><![CDATA[{url}]]></url>")
-        context_parts.append(
-            f"  <metadata_json><![CDATA[{metadata_json}]]></metadata_json>"
-        )
-        context_parts.append("</document_metadata>")
-        context_parts.append("")
-        context_parts.append("<document_content>")
-
-        # Use chunks if available (preferred for proper citations)
-        if hasattr(doc, "chunks") and doc.chunks:
-            for chunk in doc.chunks:
-                context_parts.append(
-                    f"  <chunk id='{chunk.id}'><![CDATA[{chunk.content}]]></chunk>"
-                )
-        else:
-            # Fallback to document content if chunks not loaded
-            # Use document ID as chunk ID prefix for consistency
-            context_parts.append(
-                f"  <chunk id='{doc.id}'><![CDATA[{doc.content}]]></chunk>"
-            )
-
-        context_parts.append("</document_content>")
-        context_parts.append("</document>")
-        context_parts.append("")
-
-    context_parts.append("</mentioned_documents>")
-
-    return "\n".join(context_parts)
-
-
 def format_mentioned_surfsense_docs_as_context(
     documents: list[SurfsenseDocsDocument],
 ) -> str:
@@ -1317,6 +1248,7 @@ async def stream_new_chat(
             firecrawl_api_key=firecrawl_api_key,
             thread_visibility=visibility,
             disabled_tools=disabled_tools,
+            mentioned_document_ids=mentioned_document_ids,
         )
         _perf_log.info(
             "[stream_new_chat] Agent created in %.3fs", time.perf_counter() - _t0
@@ -1340,18 +1272,9 @@ async def stream_new_chat(
                 thread.needs_history_bootstrap = False
                 await session.commit()
 
-        # Fetch mentioned documents if any (with chunks for proper citations)
-        mentioned_documents: list[Document] = []
-        if mentioned_document_ids:
-            result = await session.execute(
-                select(Document)
-                .options(selectinload(Document.chunks))
-                .filter(
-                    Document.id.in_(mentioned_document_ids),
-                    Document.search_space_id == search_space_id,
-                )
-            )
-            mentioned_documents = list(result.scalars().all())
+        # Mentioned KB documents are now handled by KnowledgeBaseSearchMiddleware
+        # which merges them into the scoped filesystem with full document
+        # structure. Only SurfSense docs and report context are inlined here.
 
         # Fetch mentioned SurfSense docs if any
         mentioned_surfsense_docs: list[SurfsenseDocsDocument] = []
@@ -1379,15 +1302,10 @@ async def stream_new_chat(
         )
         recent_reports = list(recent_reports_result.scalars().all())
 
-        # Format the user query with context (mentioned documents + SurfSense docs)
+        # Format the user query with context (SurfSense docs + reports only)
         final_query = user_query
         context_parts = []
 
-        if mentioned_documents:
-            context_parts.append(
-                format_mentioned_documents_as_context(mentioned_documents)
-            )
-
         if mentioned_surfsense_docs:
             context_parts.append(
                 format_mentioned_surfsense_docs_as_context(mentioned_surfsense_docs)
@@ -1479,7 +1397,7 @@ async def stream_new_chat(
         yield streaming_service.format_start_step()
 
         # Initial thinking step - analyzing the request
-        if mentioned_documents or mentioned_surfsense_docs:
+        if mentioned_surfsense_docs:
             initial_title = "Analyzing referenced content"
             action_verb = "Analyzing"
         else:
@@ -1490,18 +1408,6 @@ async def stream_new_chat(
         query_text = user_query[:80] + ("..." if len(user_query) > 80 else "")
         processing_parts.append(query_text)
 
-        if mentioned_documents:
-            doc_names = []
-            for doc in mentioned_documents:
-                title = doc.title
-                if len(title) > 30:
-                    title = title[:27] + "..."
-                doc_names.append(title)
-            if len(doc_names) == 1:
-                processing_parts.append(f"[{doc_names[0]}]")
-            else:
-                processing_parts.append(f"[{len(doc_names)} documents]")
-
         if mentioned_surfsense_docs:
             doc_names = []
             for doc in mentioned_surfsense_docs:
@@ -1527,7 +1433,7 @@ async def stream_new_chat(
         # These ORM objects (with eagerly-loaded chunks) can be very large.
         # They're only needed to build context strings already copied into
         # final_query / langchain_messages — release them before streaming.
-        del mentioned_documents, mentioned_surfsense_docs, recent_reports
+        del mentioned_surfsense_docs, recent_reports
         del langchain_messages, final_query
 
         # Check if this is the first assistant response so we can generate
diff --git a/surfsense_backend/app/tasks/document_processors/__init__.py b/surfsense_backend/app/tasks/document_processors/__init__.py
index e70c41cb4..2b5690d02 100644
--- a/surfsense_backend/app/tasks/document_processors/__init__.py
+++ b/surfsense_backend/app/tasks/document_processors/__init__.py
@@ -12,16 +12,14 @@ Available processors:
 - YouTube processor: Process YouTube videos and extract transcripts
 """
 
-# URL crawler
 # Extension processor
-from .extension_processor import add_extension_received_document
-
-# File processors
-from .file_processors import (
+# File processors (backward-compatible re-exports from _save)
+from ._save import (
     add_received_file_document_using_docling,
     add_received_file_document_using_llamacloud,
     add_received_file_document_using_unstructured,
 )
+from .extension_processor import add_extension_received_document
 
 # Markdown processor
 from .markdown_processor import add_received_markdown_file_document
@@ -32,9 +30,9 @@ from .youtube_processor import add_youtube_video_document
 __all__ = [
     # Extension processing
     "add_extension_received_document",
+    # File processing with different ETL services
     "add_received_file_document_using_docling",
     "add_received_file_document_using_llamacloud",
-    # File processing with different ETL services
     "add_received_file_document_using_unstructured",
     # Markdown file processing
     "add_received_markdown_file_document",
diff --git a/surfsense_backend/app/tasks/document_processors/_constants.py b/surfsense_backend/app/tasks/document_processors/_constants.py
new file mode 100644
index 000000000..f74d7acce
--- /dev/null
+++ b/surfsense_backend/app/tasks/document_processors/_constants.py
@@ -0,0 +1,74 @@
+"""
+Constants for file document processing.
+
+Centralizes file type classification, LlamaCloud retry configuration,
+and timeout calculation parameters.
+"""
+
+import ssl
+from enum import Enum
+
+import httpx
+
+# ---------------------------------------------------------------------------
+# File type classification
+# ---------------------------------------------------------------------------
+
+MARKDOWN_EXTENSIONS = (".md", ".markdown", ".txt")
+AUDIO_EXTENSIONS = (".mp3", ".mp4", ".mpeg", ".mpga", ".m4a", ".wav", ".webm")
+DIRECT_CONVERT_EXTENSIONS = (".csv", ".tsv", ".html", ".htm")
+
+
+class FileCategory(Enum):
+    MARKDOWN = "markdown"
+    AUDIO = "audio"
+    DIRECT_CONVERT = "direct_convert"
+    DOCUMENT = "document"
+
+
+def classify_file(filename: str) -> FileCategory:
+    """Classify a file by its extension into a processing category."""
+    lower = filename.lower()
+    if lower.endswith(MARKDOWN_EXTENSIONS):
+        return FileCategory.MARKDOWN
+    if lower.endswith(AUDIO_EXTENSIONS):
+        return FileCategory.AUDIO
+    if lower.endswith(DIRECT_CONVERT_EXTENSIONS):
+        return FileCategory.DIRECT_CONVERT
+    return FileCategory.DOCUMENT
+
+
+# ---------------------------------------------------------------------------
+# LlamaCloud retry configuration
+# ---------------------------------------------------------------------------
+
+LLAMACLOUD_MAX_RETRIES = 5
+LLAMACLOUD_BASE_DELAY = 10  # seconds (exponential backoff base)
+LLAMACLOUD_MAX_DELAY = 120  # max delay between retries (2 minutes)
+LLAMACLOUD_RETRYABLE_EXCEPTIONS = (
+    ssl.SSLError,
+    httpx.ConnectError,
+    httpx.ConnectTimeout,
+    httpx.ReadError,
+    httpx.ReadTimeout,
+    httpx.WriteError,
+    httpx.WriteTimeout,
+    httpx.RemoteProtocolError,
+    httpx.LocalProtocolError,
+    ConnectionError,
+    ConnectionResetError,
+    TimeoutError,
+    OSError,
+)
+
+# ---------------------------------------------------------------------------
+# Timeout calculation constants
+# ---------------------------------------------------------------------------
+
+UPLOAD_BYTES_PER_SECOND_SLOW = (
+    100 * 1024
+)  # 100 KB/s (conservative for slow connections)
+MIN_UPLOAD_TIMEOUT = 120  # Minimum 2 minutes for any file
+MAX_UPLOAD_TIMEOUT = 1800  # Maximum 30 minutes for very large files
+BASE_JOB_TIMEOUT = 600  # 10 minutes base for job processing
+PER_PAGE_JOB_TIMEOUT = 60  # 1 minute per page for processing
diff --git a/surfsense_backend/app/tasks/document_processors/_direct_converters.py b/surfsense_backend/app/tasks/document_processors/_direct_converters.py
new file mode 100644
index 000000000..b1a69ef4f
--- /dev/null
+++ b/surfsense_backend/app/tasks/document_processors/_direct_converters.py
@@ -0,0 +1,90 @@
+"""
+Lossless file-to-markdown converters for text-based formats.
+
+These converters handle file types that can be faithfully represented as
+markdown without any external ETL/OCR service:
+
+- CSV / TSV  → markdown table  (stdlib ``csv``)
+- HTML / HTM → markdown        (``markdownify``)
+"""
+
+from __future__ import annotations
+
+import csv
+from collections.abc import Callable
+from pathlib import Path
+
+from markdownify import markdownify
+
+# The stdlib csv module defaults to a 128 KB field-size limit which is too
+# small for real-world exports (e.g. chat logs, CRM dumps).  We raise it once
+# at import time so every csv.reader call in this module can handle large fields.
+csv.field_size_limit(2**31 - 1)
+
+
+def _escape_pipe(cell: str) -> str:
+    """Escape literal pipe characters inside a markdown table cell."""
+    return cell.replace("|", "\\|")
+
+
+def csv_to_markdown(file_path: str, *, delimiter: str = ",") -> str:
+    """Convert a CSV (or TSV) file to a markdown table.
+
+    The first row is treated as the header.  An empty file returns an
+    empty string so the caller can decide how to handle it.
+    """
+    with open(file_path, encoding="utf-8", newline="") as fh:
+        reader = csv.reader(fh, delimiter=delimiter)
+        rows = list(reader)
+
+    if not rows:
+        return ""
+
+    header, *body = rows
+    col_count = len(header)
+
+    lines: list[str] = []
+
+    header_cells = [_escape_pipe(c.strip()) for c in header]
+    lines.append("| " + " | ".join(header_cells) + " |")
+    lines.append("| " + " | ".join(["---"] * col_count) + " |")
+
+    for row in body:
+        padded = row + [""] * (col_count - len(row))
+        cells = [_escape_pipe(c.strip()) for c in padded[:col_count]]
+        lines.append("| " + " | ".join(cells) + " |")
+
+    return "\n".join(lines) + "\n"
+
+
+def tsv_to_markdown(file_path: str) -> str:
+    """Convert a TSV file to a markdown table."""
+    return csv_to_markdown(file_path, delimiter="\t")
+
+
+def html_to_markdown(file_path: str) -> str:
+    """Convert an HTML file to markdown via ``markdownify``."""
+    html = Path(file_path).read_text(encoding="utf-8")
+    return markdownify(html).strip()
+
+
+_CONVERTER_MAP: dict[str, Callable[..., str]] = {
+    ".csv": csv_to_markdown,
+    ".tsv": tsv_to_markdown,
+    ".html": html_to_markdown,
+    ".htm": html_to_markdown,
+}
+
+
+def convert_file_directly(file_path: str, filename: str) -> str:
+    """Dispatch to the appropriate lossless converter based on file extension.
+
+    Raises ``ValueError`` if the extension is not supported.
+    """
+    suffix = Path(filename).suffix.lower()
+    converter = _CONVERTER_MAP.get(suffix)
+    if converter is None:
+        raise ValueError(
+            f"No direct converter for extension '{suffix}' (file: {filename})"
+        )
+    return converter(file_path)
diff --git a/surfsense_backend/app/tasks/document_processors/_etl.py b/surfsense_backend/app/tasks/document_processors/_etl.py
new file mode 100644
index 000000000..cc3a8b1ac
--- /dev/null
+++ b/surfsense_backend/app/tasks/document_processors/_etl.py
@@ -0,0 +1,209 @@
+"""
+ETL parsing strategies for different document processing services.
+
+Provides parse functions for Unstructured, LlamaCloud, and Docling, along with
+LlamaCloud retry logic and dynamic timeout calculations.
+"""
+
+import asyncio
+import logging
+import os
+import random
+import warnings
+from logging import ERROR, getLogger
+
+import httpx
+
+from app.config import config as app_config
+from app.db import Log
+from app.services.task_logging_service import TaskLoggingService
+
+from ._constants import (
+    LLAMACLOUD_BASE_DELAY,
+    LLAMACLOUD_MAX_DELAY,
+    LLAMACLOUD_MAX_RETRIES,
+    LLAMACLOUD_RETRYABLE_EXCEPTIONS,
+    PER_PAGE_JOB_TIMEOUT,
+)
+from ._helpers import calculate_job_timeout, calculate_upload_timeout
+
+# ---------------------------------------------------------------------------
+# LlamaCloud parsing with retry
+# ---------------------------------------------------------------------------
+
+
+async def parse_with_llamacloud_retry(
+    file_path: str,
+    estimated_pages: int,
+    task_logger: TaskLoggingService | None = None,
+    log_entry: Log | None = None,
+):
+    """
+    Parse a file with LlamaCloud, retrying on ``LLAMACLOUD_RETRYABLE_EXCEPTIONS``.
+
+    Timeouts are derived from the file size and ``estimated_pages``. Failed
+    attempts back off exponentially (capped, +/-25% jitter) and are reported via
+    ``task_logger`` when it and ``log_entry`` are both given, else logged.
+
+    Returns:
+        The result of ``LlamaParse.aparse`` for ``file_path``.
+
+    Raises the last retryable error once attempts run out; others propagate.
+    """
+    from llama_cloud_services import LlamaParse
+    from llama_cloud_services.parse.utils import ResultType
+
+    file_size_bytes = os.path.getsize(file_path)
+    file_size_mb = file_size_bytes / (1024 * 1024)
+
+    upload_timeout = calculate_upload_timeout(file_size_bytes)
+    job_timeout = calculate_job_timeout(estimated_pages, file_size_bytes)
+
+    custom_timeout = httpx.Timeout(
+        connect=120.0,
+        read=upload_timeout,
+        write=upload_timeout,
+        pool=120.0,
+    )
+
+    logging.info(
+        f"LlamaCloud upload configured: file_size={file_size_mb:.1f}MB, "
+        f"pages={estimated_pages}, upload_timeout={upload_timeout:.0f}s, "
+        f"job_timeout={job_timeout:.0f}s"
+    )
+
+    last_exception = None
+    attempt_errors: list[str] = []
+
+    for attempt in range(1, LLAMACLOUD_MAX_RETRIES + 1):
+        try:
+            async with httpx.AsyncClient(timeout=custom_timeout) as custom_client:
+                parser = LlamaParse(
+                    api_key=app_config.LLAMA_CLOUD_API_KEY,
+                    num_workers=1,
+                    verbose=True,
+                    language="en",
+                    result_type=ResultType.MD,
+                    max_timeout=int(max(2000, job_timeout + upload_timeout)),
+                    job_timeout_in_seconds=job_timeout,
+                    job_timeout_extra_time_per_page_in_seconds=PER_PAGE_JOB_TIMEOUT,
+                    custom_client=custom_client,
+                )
+                result = await parser.aparse(file_path)
+
+                if attempt > 1:
+                    logging.info(
+                        f"LlamaCloud upload succeeded on attempt {attempt} after "
+                        f"{len(attempt_errors)} failures"
+                    )
+                return result
+
+        except LLAMACLOUD_RETRYABLE_EXCEPTIONS as e:
+            last_exception = e
+            error_type = type(e).__name__
+            error_msg = str(e)[:200]
+            attempt_errors.append(f"Attempt {attempt}: {error_type} - {error_msg}")
+
+            if attempt < LLAMACLOUD_MAX_RETRIES:
+                base_delay = min(
+                    LLAMACLOUD_BASE_DELAY * (2 ** (attempt - 1)),
+                    LLAMACLOUD_MAX_DELAY,
+                )
+                jitter = base_delay * 0.25 * (2 * random.random() - 1)
+                delay = base_delay + jitter
+
+                if task_logger and log_entry:
+                    await task_logger.log_task_progress(
+                        log_entry,
+                        f"LlamaCloud upload failed "
+                        f"(attempt {attempt}/{LLAMACLOUD_MAX_RETRIES}), "
+                        f"retrying in {delay:.0f}s",
+                        {
+                            "error_type": error_type,
+                            "error_message": error_msg,
+                            "attempt": attempt,
+                            "retry_delay": delay,
+                            "file_size_mb": round(file_size_mb, 1),
+                            "upload_timeout": upload_timeout,
+                        },
+                    )
+                else:
+                    logging.warning(
+                        f"LlamaCloud upload failed "
+                        f"(attempt {attempt}/{LLAMACLOUD_MAX_RETRIES}): "
+                        f"{error_type}. File: {file_size_mb:.1f}MB. "
+                        f"Retrying in {delay:.0f}s..."
+                    )
+
+                await asyncio.sleep(delay)
+            else:
+                logging.error(
+                    f"LlamaCloud upload failed after {LLAMACLOUD_MAX_RETRIES} "
+                    f"attempts. File size: {file_size_mb:.1f}MB, "
+                    f"Pages: {estimated_pages}. "
+                    f"Errors: {'; '.join(attempt_errors)}"
+                )
+
+        except Exception:
+            raise
+
+    raise last_exception or RuntimeError(
+        f"LlamaCloud parsing failed after {LLAMACLOUD_MAX_RETRIES} retries. "
+        f"File size: {file_size_mb:.1f}MB"
+    )
+
+
+# ---------------------------------------------------------------------------
+# Per-service parse functions
+# ---------------------------------------------------------------------------
+
+
+async def parse_with_unstructured(file_path: str):
+    """
+    Load ``file_path`` through the Unstructured ETL service.
+
+    Returns:
+        The elements produced by ``UnstructuredLoader.aload``.
+    """
+    from langchain_unstructured import UnstructuredLoader
+
+    loader_options = {
+        "mode": "elements",
+        "post_processors": [],
+        "languages": ["eng"],
+        "include_orig_elements": False,
+        "include_metadata": False,
+        "strategy": "auto",
+    }
+
+    return await UnstructuredLoader(file_path, **loader_options).aload()
+
+
+async def parse_with_docling(file_path: str, filename: str) -> str:
+    """
+    Convert a file to markdown with the Docling service wrapper.
+
+    pdfminer warnings and sub-ERROR logs are muted while the service runs.
+    """
+    from app.services.docling_service import create_docling_service
+
+    service = create_docling_service()
+
+    noisy_logger = getLogger("pdfminer")
+    previous_level = noisy_logger.level
+    ignored_messages = (
+        ".*Cannot set gray non-stroke color.*",
+        ".*invalid float value.*",
+    )
+
+    with warnings.catch_warnings():
+        warnings.filterwarnings("ignore", category=UserWarning, module="pdfminer")
+        for pattern in ignored_messages:
+            warnings.filterwarnings("ignore", message=pattern)
+        noisy_logger.setLevel(ERROR)
+        try:
+            parsed = await service.process_document(file_path, filename)
+        finally:
+            noisy_logger.setLevel(previous_level)
+
+    return parsed["content"]
diff --git a/surfsense_backend/app/tasks/document_processors/_helpers.py b/surfsense_backend/app/tasks/document_processors/_helpers.py
new file mode 100644
index 000000000..7ac05932c
--- /dev/null
+++ b/surfsense_backend/app/tasks/document_processors/_helpers.py
@@ -0,0 +1,218 @@
+"""
+Document helper functions for deduplication, migration, and connector updates.
+
+Provides reusable logic shared across file processors and ETL strategies.
+"""
+
+import logging
+
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from app.db import Document, DocumentStatus, DocumentType
+from app.utils.document_converters import generate_unique_identifier_hash
+
+from ._constants import (
+    BASE_JOB_TIMEOUT,
+    MAX_UPLOAD_TIMEOUT,
+    MIN_UPLOAD_TIMEOUT,
+    PER_PAGE_JOB_TIMEOUT,
+    UPLOAD_BYTES_PER_SECOND_SLOW,
+)
+from .base import (
+    check_document_by_unique_identifier,
+    check_duplicate_document,
+)
+
+# ---------------------------------------------------------------------------
+# Unique identifier helpers
+# ---------------------------------------------------------------------------
+
+
+def get_google_drive_unique_identifier(
+    connector: dict | None,
+    filename: str,
+    search_space_id: int,
+) -> tuple[str, str | None]:
+    """
+    Build the unique-identifier hash(es) used to look a file up.
+
+    Google Drive connectors carrying a ``google_drive_file_id`` are keyed by
+    that id; the filename-based Drive hash is returned too, as the legacy hash.
+    Everything else is keyed by filename under ``DocumentType.FILE``.
+
+    Returns:
+        Tuple of ``(primary_hash, legacy_hash or None)``.
+    """
+    drive_file_id = None
+    if connector and connector.get("type") == DocumentType.GOOGLE_DRIVE_FILE:
+        drive_file_id = connector.get("metadata", {}).get("google_drive_file_id")
+
+    if not drive_file_id:
+        filename_hash = generate_unique_identifier_hash(
+            DocumentType.FILE, filename, search_space_id
+        )
+        return filename_hash, None
+
+    drive_type = DocumentType.GOOGLE_DRIVE_FILE
+    return (
+        generate_unique_identifier_hash(drive_type, drive_file_id, search_space_id),
+        generate_unique_identifier_hash(drive_type, filename, search_space_id),
+    )
+
+
+# ---------------------------------------------------------------------------
+# Document deduplication and migration
+# ---------------------------------------------------------------------------
+
+
+async def handle_existing_document_update(
+    session: AsyncSession,
+    existing_document: Document,
+    content_hash: str,
+    connector: dict | None,
+    filename: str,
+    primary_hash: str,
+) -> tuple[bool, Document | None]:
+    """
+    Decide whether an existing document needs re-processing.
+
+    Re-points ``unique_identifier_hash`` to ``primary_hash`` first, then returns:
+        - (True, document): content unchanged, or identical content exists elsewhere
+        - (True, None): duplicate of another document; pending/processing row deleted
+        - (False, None): content changed, needs re-processing
+    """
+    if existing_document.unique_identifier_hash != primary_hash:
+        existing_document.unique_identifier_hash = primary_hash
+        logging.info(f"Migrated document to file_id-based identifier: {filename}")
+
+    if existing_document.content_hash == content_hash:
+        if connector and connector.get("type") == DocumentType.GOOGLE_DRIVE_FILE:
+            connector_metadata = connector.get("metadata", {})
+            new_name = connector_metadata.get("google_drive_file_name")
+            doc_metadata = existing_document.document_metadata or {}
+            old_name = doc_metadata.get("FILE_NAME") or doc_metadata.get(
+                "google_drive_file_name"
+            )
+
+            if new_name and old_name and old_name != new_name:
+                from sqlalchemy.orm.attributes import flag_modified
+
+                existing_document.title = new_name
+                if not existing_document.document_metadata:
+                    existing_document.document_metadata = {}
+                existing_document.document_metadata["FILE_NAME"] = new_name
+                existing_document.document_metadata["google_drive_file_name"] = new_name
+                flag_modified(existing_document, "document_metadata")
+                await session.commit()
+                logging.info(
+                    f"File renamed in Google Drive: '{old_name}' → '{new_name}' "
+                    f"(no re-processing needed)"
+                )
+
+        logging.info(f"Document for file {filename} unchanged. Skipping.")
+        return True, existing_document
+
+    # Content has changed — guard against content_hash collision before
+    # expensive ETL processing.
+    collision_doc = await check_duplicate_document(session, content_hash)
+    if collision_doc and collision_doc.id != existing_document.id:
+        logging.warning(
+            "Content-hash collision for %s: identical content exists in "
+            "document #%s (%s). Skipping re-processing.",
+            filename,
+            collision_doc.id,
+            collision_doc.document_type,
+        )
+        if DocumentStatus.is_state(
+            existing_document.status, DocumentStatus.PENDING
+        ) or DocumentStatus.is_state(
+            existing_document.status, DocumentStatus.PROCESSING
+        ):
+            await session.delete(existing_document)
+            await session.commit()
+            return True, None
+
+        return True, existing_document
+
+    logging.info(f"Content changed for file {filename}. Updating document.")
+    return False, None
+
+
+async def find_existing_document_with_migration(
+    session: AsyncSession,
+    primary_hash: str,
+    legacy_hash: str | None,
+    content_hash: str | None = None,
+) -> Document | None:
+    """
+    Return the first document matched by primary hash, then legacy hash, then
+    content hash; the two fallbacks are skipped when their hash is not given.
+    """
+    existing_document = await check_document_by_unique_identifier(session, primary_hash)
+    if existing_document:
+        return existing_document
+
+    if legacy_hash:
+        existing_document = await check_document_by_unique_identifier(
+            session, legacy_hash
+        )
+        if existing_document:
+            logging.info(
+                "Found legacy document (filename-based hash), "
+                "will migrate to file_id-based hash"
+            )
+            return existing_document
+
+    if content_hash:
+        existing_document = await check_duplicate_document(session, content_hash)
+        if existing_document:
+            logging.info(
+                f"Found duplicate content from different source (content_hash match). "
+                f"Original document ID: {existing_document.id}, "
+                f"type: {existing_document.document_type}"
+            )
+    return existing_document
+
+
+# ---------------------------------------------------------------------------
+# Connector helpers
+# ---------------------------------------------------------------------------
+
+
+async def update_document_from_connector(
+    document: Document | None,
+    connector: dict | None,
+    session: AsyncSession,
+) -> None:
+    """Apply the connector's type, metadata and connector_id, then commit."""
+    if not (document and connector):
+        return
+
+    if "type" in connector:
+        document.document_type = connector["type"]
+    if "metadata" in connector:
+        current = document.document_metadata
+        incoming = connector["metadata"]
+        document.document_metadata = {**current, **incoming} if current else incoming
+    if "connector_id" in connector:
+        document.connector_id = connector["connector_id"]
+
+    await session.commit()
+
+
+# ---------------------------------------------------------------------------
+# Timeout calculations
+# ---------------------------------------------------------------------------
+
+
+def calculate_upload_timeout(file_size_bytes: int) -> float:
+    """Estimate the upload time at the slow rate (x1.5), clamped to the limits."""
+    padded_estimate = (file_size_bytes / UPLOAD_BYTES_PER_SECOND_SLOW) * 1.5
+    return max(MIN_UPLOAD_TIMEOUT, min(padded_estimate, MAX_UPLOAD_TIMEOUT))
+
+
+def calculate_job_timeout(estimated_pages: int, file_size_bytes: int) -> float:
+    """Return the larger of the page-count-based and file-size-based timeouts."""
+    by_pages = BASE_JOB_TIMEOUT + (estimated_pages * PER_PAGE_JOB_TIMEOUT)
+    by_size = BASE_JOB_TIMEOUT + (file_size_bytes / (10 * 1024 * 1024)) * 60
+    return max(by_pages, by_size)
diff --git a/surfsense_backend/app/tasks/document_processors/_save.py b/surfsense_backend/app/tasks/document_processors/_save.py
new file mode 100644
index 000000000..5088ad004
--- /dev/null
+++ b/surfsense_backend/app/tasks/document_processors/_save.py
@@ -0,0 +1,285 @@
+"""
+Unified document save/update logic for file processors.
+
+Replaces the three nearly-identical ``add_received_file_document_using_*``
+functions with a single ``save_file_document`` function plus thin wrappers
+for backward compatibility.
+"""
+
+import logging
+
+from langchain_core.documents import Document as LangChainDocument
+from sqlalchemy.exc import SQLAlchemyError
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from app.db import Document, DocumentStatus, DocumentType
+from app.services.llm_service import get_user_long_context_llm
+from app.utils.document_converters import (
+    create_document_chunks,
+    embed_text,
+    generate_content_hash,
+    generate_document_summary,
+)
+
+from ._helpers import (
+    find_existing_document_with_migration,
+    get_google_drive_unique_identifier,
+    handle_existing_document_update,
+)
+from .base import get_current_timestamp, safe_set_chunks
+
+# ---------------------------------------------------------------------------
+# Summary generation
+# ---------------------------------------------------------------------------
+
+
+async def _generate_summary(
+    markdown_content: str,
+    file_name: str,
+    etl_service: str,
+    user_llm,
+    enable_summary: bool,
+) -> tuple[str, list[float]]:
+    """
+    Produce the summary text for a file together with that text's embedding.
+
+    - Summaries disabled: the file name followed by the first 4000 characters
+      of the markdown.
+    - ``DOCLING``: the Docling service's large-document summary, prefixed
+      with a metadata header.
+    - Anything else: delegated to ``generate_document_summary``.
+    """
+    if not enable_summary:
+        summary = f"File: {file_name}\n\n{markdown_content[:4000]}"
+        return summary, embed_text(summary)
+
+    meta = {
+        "file_name": file_name,
+        "etl_service": etl_service,
+        "document_type": "File Document",
+    }
+
+    if etl_service != "DOCLING":
+        # Standard summary (Unstructured / LlamaCloud / others)
+        return await generate_document_summary(markdown_content, user_llm, meta)
+
+    from app.services.docling_service import create_docling_service
+
+    docling_service = create_docling_service()
+    summary_text = await docling_service.process_large_document_summary(
+        content=markdown_content, llm=user_llm, document_title=file_name
+    )
+
+    parts = ["# DOCUMENT METADATA"]
+    for key, value in meta.items():
+        if not value:
+            continue
+        formatted_key = key.replace("_", " ").title()
+        parts.append(f"**{formatted_key}:** {value}")
+
+    enhanced = "\n".join(parts) + "\n\n# DOCUMENT SUMMARY\n\n" + summary_text
+    return enhanced, embed_text(enhanced)
+
+
+# ---------------------------------------------------------------------------
+# Unified save function
+# ---------------------------------------------------------------------------
+
+
+async def save_file_document(
+    session: AsyncSession,
+    file_name: str,
+    markdown_content: str,
+    search_space_id: int,
+    user_id: str,
+    etl_service: str,
+    connector: dict | None = None,
+    enable_summary: bool = True,
+) -> Document | None:
+    """
+    Create or update the stored document for a processed file.
+
+    This is the single implementation behind the per-ETL-service wrappers.
+
+    Args:
+        session: Database session
+        file_name: Name of the processed file
+        markdown_content: Markdown content to store
+        search_space_id: ID of the search space
+        user_id: ID of the user
+        etl_service: Name of the ETL service (UNSTRUCTURED, LLAMACLOUD, DOCLING)
+        connector: Optional connector info for Google Drive files
+        enable_summary: Whether to generate an AI summary
+
+    Returns the saved or unchanged Document, or None for a skipped duplicate.
+    SQLAlchemy errors other than a content-hash index collision are re-raised
+    after rollback; anything else, e.g. a missing LLM, becomes ``RuntimeError``.
+    """
+    try:
+        primary_hash, legacy_hash = get_google_drive_unique_identifier(
+            connector, file_name, search_space_id
+        )
+        content_hash = generate_content_hash(markdown_content, search_space_id)
+
+        existing_document = await find_existing_document_with_migration(
+            session, primary_hash, legacy_hash, content_hash
+        )
+
+        if existing_document:
+            should_skip, doc = await handle_existing_document_update(
+                session,
+                existing_document,
+                content_hash,
+                connector,
+                file_name,
+                primary_hash,
+            )
+            if should_skip:
+                return doc
+
+        user_llm = await get_user_long_context_llm(session, user_id, search_space_id)
+        if not user_llm:
+            raise RuntimeError(
+                f"No long context LLM configured for user {user_id} "
+                f"in search space {search_space_id}"
+            )
+
+        summary_content, summary_embedding = await _generate_summary(
+            markdown_content, file_name, etl_service, user_llm, enable_summary
+        )
+        chunks = await create_document_chunks(markdown_content)
+        doc_metadata = {"FILE_NAME": file_name, "ETL_SERVICE": etl_service}
+
+        if existing_document:
+            existing_document.title = file_name
+            existing_document.content = summary_content
+            existing_document.content_hash = content_hash
+            existing_document.embedding = summary_embedding
+            existing_document.document_metadata = doc_metadata
+            await safe_set_chunks(session, existing_document, chunks)
+            existing_document.source_markdown = markdown_content
+            existing_document.content_needs_reindexing = False
+            existing_document.updated_at = get_current_timestamp()
+            existing_document.status = DocumentStatus.ready()
+
+            await session.commit()
+            await session.refresh(existing_document)
+            return existing_document
+
+        doc_type = DocumentType.FILE
+        if connector and connector.get("type") == DocumentType.GOOGLE_DRIVE_FILE:
+            doc_type = DocumentType.GOOGLE_DRIVE_FILE
+
+        document = Document(
+            search_space_id=search_space_id,
+            title=file_name,
+            document_type=doc_type,
+            document_metadata=doc_metadata,
+            content=summary_content,
+            embedding=summary_embedding,
+            chunks=chunks,
+            content_hash=content_hash,
+            unique_identifier_hash=primary_hash,
+            source_markdown=markdown_content,
+            content_needs_reindexing=False,
+            updated_at=get_current_timestamp(),
+            created_by_id=user_id,
+            connector_id=connector.get("connector_id") if connector else None,
+            status=DocumentStatus.ready(),
+        )
+        session.add(document)
+        await session.commit()
+        await session.refresh(document)
+        return document
+
+    except SQLAlchemyError as db_error:
+        await session.rollback()
+        if "ix_documents_content_hash" in str(db_error):
+            logging.warning(
+                "content_hash collision during commit for %s (%s). Skipping.",
+                file_name,
+                etl_service,
+            )
+            return None
+        raise db_error
+    except Exception as e:
+        await session.rollback()
+        raise RuntimeError(
+            f"Failed to process file document using {etl_service}: {e!s}"
+        ) from e
+
+
+# ---------------------------------------------------------------------------
+# Backward-compatible wrapper functions
+# ---------------------------------------------------------------------------
+
+
+async def add_received_file_document_using_unstructured(
+    session: AsyncSession,
+    file_name: str,
+    unstructured_processed_elements: list[LangChainDocument],
+    search_space_id: int,
+    user_id: str,
+    connector: dict | None = None,
+    enable_summary: bool = True,
+) -> Document | None:
+    """Convert Unstructured elements to markdown and save them as a file document."""
+    from app.utils.document_converters import convert_document_to_markdown
+
+    elements_markdown = await convert_document_to_markdown(
+        unstructured_processed_elements
+    )
+    return await save_file_document(
+        session=session,
+        file_name=file_name,
+        markdown_content=elements_markdown,
+        search_space_id=search_space_id,
+        user_id=user_id,
+        etl_service="UNSTRUCTURED",
+        connector=connector,
+        enable_summary=enable_summary,
+    )
+
+
+async def add_received_file_document_using_llamacloud(
+    session: AsyncSession,
+    file_name: str,
+    llamacloud_markdown_document: str,
+    search_space_id: int,
+    user_id: str,
+    connector: dict | None = None,
+    enable_summary: bool = True,
+) -> Document | None:
+    """Save LlamaCloud-parsed markdown as a file document."""
+    return await save_file_document(
+        session=session,
+        file_name=file_name,
+        markdown_content=llamacloud_markdown_document,
+        search_space_id=search_space_id,
+        user_id=user_id,
+        etl_service="LLAMACLOUD",
+        connector=connector,
+        enable_summary=enable_summary,
+    )
+
+
+async def add_received_file_document_using_docling(
+    session: AsyncSession,
+    file_name: str,
+    docling_markdown_document: str,
+    search_space_id: int,
+    user_id: str,
+    connector: dict | None = None,
+    enable_summary: bool = True,
+) -> Document | None:
+    """Save Docling-parsed markdown as a file document."""
+    return await save_file_document(
+        session=session,
+        file_name=file_name,
+        markdown_content=docling_markdown_document,
+        search_space_id=search_space_id,
+        user_id=user_id,
+        etl_service="DOCLING",
+        connector=connector,
+        enable_summary=enable_summary,
+    )
diff --git a/surfsense_backend/app/tasks/document_processors/file_processors.py b/surfsense_backend/app/tasks/document_processors/file_processors.py
index 6c0ae1870..0c1cad52d 100644
--- a/surfsense_backend/app/tasks/document_processors/file_processors.py
+++ b/surfsense_backend/app/tasks/document_processors/file_processors.py
@@ -1,905 +1,685 @@
 """
-File document processors for different ETL services (Unstructured, LlamaCloud, Docling).
+File document processors orchestrating content extraction and indexing.
+
+This module is the public entry point for file processing.  It delegates to
+specialised sub-modules that each own a single concern:
+
+- ``_constants``          — file type classification and configuration constants
+- ``_helpers``            — document deduplication, migration, connector helpers
+- ``_direct_converters``  — lossless file-to-markdown for csv/tsv/html
+- ``_etl``               — ETL parsing strategies (Unstructured, LlamaCloud, Docling)
+- ``_save``              — unified document creation / update logic
 """
 
-import asyncio
+from __future__ import annotations
+
 import contextlib
 import logging
-import ssl
-import warnings
+import os
+from dataclasses import dataclass, field
 from logging import ERROR, getLogger
 
-import httpx
 from fastapi import HTTPException
-from langchain_core.documents import Document as LangChainDocument
-from litellm import atranscription
-from sqlalchemy.exc import SQLAlchemyError
 from sqlalchemy.ext.asyncio import AsyncSession
 
 from app.config import config as app_config
-from app.db import Document, DocumentStatus, DocumentType, Log, Notification
-from app.indexing_pipeline.adapters.file_upload_adapter import UploadDocumentAdapter
-from app.services.llm_service import get_user_long_context_llm
+from app.db import Document, Log, Notification
 from app.services.notification_service import NotificationService
 from app.services.task_logging_service import TaskLoggingService
-from app.utils.document_converters import (
-    convert_document_to_markdown,
-    create_document_chunks,
-    embed_text,
-    generate_content_hash,
-    generate_document_summary,
-    generate_unique_identifier_hash,
-)
 
-from .base import (
-    check_document_by_unique_identifier,
-    check_duplicate_document,
-    get_current_timestamp,
-    safe_set_chunks,
+from ._constants import FileCategory, classify_file
+from ._direct_converters import convert_file_directly
+from ._etl import (
+    parse_with_docling,
+    parse_with_llamacloud_retry,
+    parse_with_unstructured,
+)
+from ._helpers import update_document_from_connector
+from ._save import (
+    add_received_file_document_using_docling,
+    add_received_file_document_using_llamacloud,
+    add_received_file_document_using_unstructured,
+    save_file_document,
 )
 from .markdown_processor import add_received_markdown_file_document
 
-# Constants for LlamaCloud retry configuration
-LLAMACLOUD_MAX_RETRIES = 5  # Increased from 3 for large file resilience
-LLAMACLOUD_BASE_DELAY = 10  # Base delay in seconds for exponential backoff
-LLAMACLOUD_MAX_DELAY = 120  # Maximum delay between retries (2 minutes)
-LLAMACLOUD_RETRYABLE_EXCEPTIONS = (
-    ssl.SSLError,
-    httpx.ConnectError,
-    httpx.ConnectTimeout,
-    httpx.ReadTimeout,
-    httpx.WriteTimeout,
-    httpx.RemoteProtocolError,
-    httpx.LocalProtocolError,
-    ConnectionError,
-    ConnectionResetError,
-    TimeoutError,
-    OSError,  # Catches various network-level errors
-)
-
-# Timeout calculation constants
-UPLOAD_BYTES_PER_SECOND_SLOW = (
-    100 * 1024
-)  # 100 KB/s (conservative for slow connections)
-MIN_UPLOAD_TIMEOUT = 120  # Minimum 2 minutes for any file
-MAX_UPLOAD_TIMEOUT = 1800  # Maximum 30 minutes for very large files
-BASE_JOB_TIMEOUT = 600  # 10 minutes base for job processing
-PER_PAGE_JOB_TIMEOUT = 60  # 1 minute per page for processing
+# Re-export public API so existing ``from file_processors import …`` keeps working.
+__all__ = [
+    "add_received_file_document_using_docling",
+    "add_received_file_document_using_llamacloud",
+    "add_received_file_document_using_unstructured",
+    "parse_with_llamacloud_retry",
+    "process_file_in_background",
+    "process_file_in_background_with_document",
+    "save_file_document",
+]
 
 
-def get_google_drive_unique_identifier(
-    connector: dict | None,
-    filename: str,
-    search_space_id: int,
-) -> tuple[str, str | None]:
-    """
-    Get unique identifier hash for a file, with special handling for Google Drive.
-
-    For Google Drive files, uses file_id as the unique identifier (doesn't change on rename).
-    For other files, uses filename.
-
-    Args:
-        connector: Optional connector info dict with type and metadata
-        filename: The filename (used for non-Google Drive files or as fallback)
-        search_space_id: The search space ID
-
-    Returns:
-        Tuple of (primary_hash, legacy_hash or None)
-        - For Google Drive: (file_id_based_hash, filename_based_hash for migration)
-        - For other sources: (filename_based_hash, None)
-    """
-    if connector and connector.get("type") == DocumentType.GOOGLE_DRIVE_FILE:
-        metadata = connector.get("metadata", {})
-        file_id = metadata.get("google_drive_file_id")
-
-        if file_id:
-            # New method: use file_id as unique identifier (doesn't change on rename)
-            primary_hash = generate_unique_identifier_hash(
-                DocumentType.GOOGLE_DRIVE_FILE, file_id, search_space_id
-            )
-            # Legacy method: for backward compatibility with existing documents
-            # that were indexed with filename-based hash
-            legacy_hash = generate_unique_identifier_hash(
-                DocumentType.GOOGLE_DRIVE_FILE, filename, search_space_id
-            )
-            return primary_hash, legacy_hash
-
-    # For non-Google Drive files, use filename as before
-    primary_hash = generate_unique_identifier_hash(
-        DocumentType.FILE, filename, search_space_id
-    )
-    return primary_hash, None
+# ---------------------------------------------------------------------------
+# Processing context (bundles parameters shared across handler functions)
+# ---------------------------------------------------------------------------
 
 
-async def handle_existing_document_update(
-    session: AsyncSession,
-    existing_document: Document,
-    content_hash: str,
-    connector: dict | None,
-    filename: str,
-    primary_hash: str,
-) -> tuple[bool, Document | None]:
-    """
-    Handle update logic for an existing document.
+@dataclass
+class _ProcessingContext:
+    session: AsyncSession
+    file_path: str
+    filename: str
+    search_space_id: int
+    user_id: str
+    task_logger: TaskLoggingService
+    log_entry: Log
+    connector: dict | None = None  # optional; may carry an "enable_summary" key
+    notification: Notification | None = None
+    enable_summary: bool = field(init=False)  # not an __init__ arg; set in __post_init__
 
-    Args:
-        session: Database session
-        existing_document: The existing document found in database
-        content_hash: Hash of the new content
-        connector: Optional connector info
-        filename: Current filename
-        primary_hash: The primary hash (file_id based for Google Drive)
-
-    Returns:
-        Tuple of (should_skip_processing, document_to_return)
-        - (True, document): Content unchanged, just return existing document
-        - (False, None): Content changed, need to re-process
-    """
-    # Check if this document needs hash migration (found via legacy hash)
-    if existing_document.unique_identifier_hash != primary_hash:
-        existing_document.unique_identifier_hash = primary_hash
-        logging.info(f"Migrated document to file_id-based identifier: {filename}")
-
-    # Check if content has changed
-    if existing_document.content_hash == content_hash:
-        # Content unchanged - check if we need to update metadata (e.g., filename changed)
-        if connector and connector.get("type") == DocumentType.GOOGLE_DRIVE_FILE:
-            connector_metadata = connector.get("metadata", {})
-            new_name = connector_metadata.get("google_drive_file_name")
-            # Check both possible keys for old name (FILE_NAME is used in stored documents)
-            doc_metadata = existing_document.document_metadata or {}
-            old_name = doc_metadata.get("FILE_NAME") or doc_metadata.get(
-                "google_drive_file_name"
-            )
-
-            if new_name and old_name and old_name != new_name:
-                # File was renamed - update title and metadata, skip expensive processing
-                from sqlalchemy.orm.attributes import flag_modified
-
-                existing_document.title = new_name
-                if not existing_document.document_metadata:
-                    existing_document.document_metadata = {}
-                existing_document.document_metadata["FILE_NAME"] = new_name
-                existing_document.document_metadata["google_drive_file_name"] = new_name
-                flag_modified(existing_document, "document_metadata")
-                await session.commit()
-                logging.info(
-                    f"File renamed in Google Drive: '{old_name}' → '{new_name}' (no re-processing needed)"
-                )
-
-        logging.info(f"Document for file {filename} unchanged. Skipping.")
-        return True, existing_document
-    else:
-        # Content has changed — guard against content_hash collision before
-        # expensive ETL processing.  A collision means the exact same content
-        # already lives in a *different* document (e.g. a manual upload of the
-        # same file).  Proceeding would trigger a unique-constraint violation
-        # on ix_documents_content_hash.
-        collision_doc = await check_duplicate_document(session, content_hash)
-        if collision_doc and collision_doc.id != existing_document.id:
-            logging.warning(
-                "Content-hash collision for %s: identical content exists in "
-                "document #%s (%s). Skipping re-processing.",
-                filename,
-                collision_doc.id,
-                collision_doc.document_type,
-            )
-            if DocumentStatus.is_state(
-                existing_document.status, DocumentStatus.PENDING
-            ) or DocumentStatus.is_state(
-                existing_document.status, DocumentStatus.PROCESSING
-            ):
-                # Pending/processing doc has no real content yet — remove it
-                # so the UI doesn't show a contentless entry.
-                await session.delete(existing_document)
-                await session.commit()
-                return True, None
-
-            # Document already has valid content — keep it as-is.
-            return True, existing_document
-
-        logging.info(f"Content changed for file {filename}. Updating document.")
-        return False, None
-
-
-async def find_existing_document_with_migration(
-    session: AsyncSession,
-    primary_hash: str,
-    legacy_hash: str | None,
-    content_hash: str | None = None,
-) -> Document | None:
-    """
-    Find existing document, checking both new hash and legacy hash for migration,
-    with fallback to content_hash for cross-source deduplication.
-
-    Args:
-        session: Database session
-        primary_hash: The primary hash (file_id based for Google Drive)
-        legacy_hash: The legacy hash (filename based) for migration, or None
-        content_hash: The content hash for fallback deduplication, or None
-
-    Returns:
-        Existing document if found, None otherwise
-    """
-    # First check with primary hash (new method)
-    existing_document = await check_document_by_unique_identifier(session, primary_hash)
-
-    # If not found and we have a legacy hash, check with that (migration path)
-    if not existing_document and legacy_hash:
-        existing_document = await check_document_by_unique_identifier(
-            session, legacy_hash
-        )
-        if existing_document:
-            logging.info(
-                "Found legacy document (filename-based hash), will migrate to file_id-based hash"
-            )
-
-    # Fallback: check by content_hash to catch duplicates from different sources
-    # This prevents unique constraint violations when the same content exists
-    # under a different unique_identifier (e.g., manual upload vs Google Drive)
-    if not existing_document and content_hash:
-        existing_document = await check_duplicate_document(session, content_hash)
-        if existing_document:
-            logging.info(
-                f"Found duplicate content from different source (content_hash match). "
-                f"Original document ID: {existing_document.id}, type: {existing_document.document_type}"
-            )
-
-    return existing_document
-
-
-def calculate_upload_timeout(file_size_bytes: int) -> float:
-    """
-    Calculate appropriate upload timeout based on file size.
-
-    Assumes a conservative slow connection speed to handle worst-case scenarios.
-
-    Args:
-        file_size_bytes: Size of the file in bytes
-
-    Returns:
-        Timeout in seconds
-    """
-    # Calculate time needed at slow connection speed
-    # Add 50% buffer for network variability and SSL overhead
-    estimated_time = (file_size_bytes / UPLOAD_BYTES_PER_SECOND_SLOW) * 1.5
-
-    # Clamp to reasonable bounds
-    return max(MIN_UPLOAD_TIMEOUT, min(estimated_time, MAX_UPLOAD_TIMEOUT))
-
-
-def calculate_job_timeout(estimated_pages: int, file_size_bytes: int) -> float:
-    """
-    Calculate job processing timeout based on page count and file size.
-
-    Args:
-        estimated_pages: Estimated number of pages
-        file_size_bytes: Size of the file in bytes
-
-    Returns:
-        Timeout in seconds
-    """
-    # Base timeout + time per page
-    page_based_timeout = BASE_JOB_TIMEOUT + (estimated_pages * PER_PAGE_JOB_TIMEOUT)
-
-    # Also consider file size (large images take longer to process)
-    # ~1 minute per 10MB of file size
-    size_based_timeout = BASE_JOB_TIMEOUT + (file_size_bytes / (10 * 1024 * 1024)) * 60
-
-    # Use the larger of the two estimates
-    return max(page_based_timeout, size_based_timeout)
-
-
-async def parse_with_llamacloud_retry(
-    file_path: str,
-    estimated_pages: int,
-    task_logger: TaskLoggingService | None = None,
-    log_entry: Log | None = None,
-):
-    """
-    Parse a file with LlamaCloud with retry logic for transient SSL/connection errors.
-
-    Uses dynamic timeout calculations based on file size and page count to handle
-    very large files reliably.
-
-    Args:
-        file_path: Path to the file to parse
-        estimated_pages: Estimated number of pages for timeout calculation
-        task_logger: Optional task logger for progress updates
-        log_entry: Optional log entry for progress updates
-
-    Returns:
-        LlamaParse result object
-
-    Raises:
-        Exception: If all retries fail
-    """
-    import os
-    import random
-
-    from llama_cloud_services import LlamaParse
-    from llama_cloud_services.parse.utils import ResultType
-
-    # Get file size for timeout calculations
-    file_size_bytes = os.path.getsize(file_path)
-    file_size_mb = file_size_bytes / (1024 * 1024)
-
-    # Calculate dynamic timeouts based on file size and page count
-    upload_timeout = calculate_upload_timeout(file_size_bytes)
-    job_timeout = calculate_job_timeout(estimated_pages, file_size_bytes)
-
-    # HTTP client timeouts - scaled based on file size
-    # Write timeout is critical for large file uploads
-    custom_timeout = httpx.Timeout(
-        connect=120.0,  # 2 minutes to establish connection (handles slow DNS, etc.)
-        read=upload_timeout,  # Dynamic based on file size
-        write=upload_timeout,  # Dynamic based on file size (upload time)
-        pool=120.0,  # 2 minutes to acquire connection from pool
-    )
-
-    logging.info(
-        f"LlamaCloud upload configured: file_size={file_size_mb:.1f}MB, "
-        f"pages={estimated_pages}, upload_timeout={upload_timeout:.0f}s, "
-        f"job_timeout={job_timeout:.0f}s"
-    )
-
-    last_exception = None
-    attempt_errors = []
-
-    for attempt in range(1, LLAMACLOUD_MAX_RETRIES + 1):
-        try:
-            # Create a fresh httpx client for each attempt
-            async with httpx.AsyncClient(timeout=custom_timeout) as custom_client:
-                # Create LlamaParse parser instance with optimized settings
-                parser = LlamaParse(
-                    api_key=app_config.LLAMA_CLOUD_API_KEY,
-                    num_workers=1,  # Use single worker for file processing
-                    verbose=True,
-                    language="en",
-                    result_type=ResultType.MD,
-                    # Timeout settings for large files
-                    max_timeout=int(max(2000, job_timeout + upload_timeout)),
-                    job_timeout_in_seconds=job_timeout,
-                    job_timeout_extra_time_per_page_in_seconds=PER_PAGE_JOB_TIMEOUT,
-                    # Use our custom client with larger timeouts
-                    custom_client=custom_client,
-                )
-
-                # Parse the file asynchronously
-                result = await parser.aparse(file_path)
-
-                # Success - log if we had previous failures
-                if attempt > 1:
-                    logging.info(
-                        f"LlamaCloud upload succeeded on attempt {attempt} after "
-                        f"{len(attempt_errors)} failures"
-                    )
-
-                return result
-
-        except LLAMACLOUD_RETRYABLE_EXCEPTIONS as e:
-            last_exception = e
-            error_type = type(e).__name__
-            error_msg = str(e)[:200]
-            attempt_errors.append(f"Attempt {attempt}: {error_type} - {error_msg}")
-
-            if attempt < LLAMACLOUD_MAX_RETRIES:
-                # Calculate exponential backoff with jitter
-                # Base delay doubles each attempt, capped at max delay
-                base_delay = min(
-                    LLAMACLOUD_BASE_DELAY * (2 ** (attempt - 1)), LLAMACLOUD_MAX_DELAY
-                )
-                # Add random jitter (±25%) to prevent thundering herd
-                jitter = base_delay * 0.25 * (2 * random.random() - 1)
-                delay = base_delay + jitter
-
-                if task_logger and log_entry:
-                    await task_logger.log_task_progress(
-                        log_entry,
-                        f"LlamaCloud upload failed (attempt {attempt}/{LLAMACLOUD_MAX_RETRIES}), retrying in {delay:.0f}s",
-                        {
-                            "error_type": error_type,
-                            "error_message": error_msg,
-                            "attempt": attempt,
-                            "retry_delay": delay,
-                            "file_size_mb": round(file_size_mb, 1),
-                            "upload_timeout": upload_timeout,
-                        },
-                    )
-                else:
-                    logging.warning(
-                        f"LlamaCloud upload failed (attempt {attempt}/{LLAMACLOUD_MAX_RETRIES}): "
-                        f"{error_type}. File: {file_size_mb:.1f}MB. Retrying in {delay:.0f}s..."
-                    )
-
-                await asyncio.sleep(delay)
-            else:
-                logging.error(
-                    f"LlamaCloud upload failed after {LLAMACLOUD_MAX_RETRIES} attempts. "
-                    f"File size: {file_size_mb:.1f}MB, Pages: {estimated_pages}. "
-                    f"Errors: {'; '.join(attempt_errors)}"
-                )
-
-        except Exception:
-            # Non-retryable exception, raise immediately
-            raise
-
-    # All retries exhausted
-    raise last_exception or RuntimeError(
-        f"LlamaCloud parsing failed after {LLAMACLOUD_MAX_RETRIES} retries. "
-        f"File size: {file_size_mb:.1f}MB"
-    )
-
-
-async def add_received_file_document_using_unstructured(
-    session: AsyncSession,
-    file_name: str,
-    unstructured_processed_elements: list[LangChainDocument],
-    search_space_id: int,
-    user_id: str,
-    connector: dict | None = None,
-    enable_summary: bool = True,
-) -> Document | None:
-    """
-    Process and store a file document using Unstructured service.
-
-    Args:
-        session: Database session
-        file_name: Name of the processed file
-        unstructured_processed_elements: Processed elements from Unstructured
-        search_space_id: ID of the search space
-        user_id: ID of the user
-        connector: Optional connector info for Google Drive files
-
-    Returns:
-        Document object if successful, None if failed
-    """
-    try:
-        file_in_markdown = await convert_document_to_markdown(
-            unstructured_processed_elements
+    def __post_init__(self) -> None:  # derive enable_summary from the connector dict
+        self.enable_summary = (
+            self.connector.get("enable_summary", True) if self.connector else True
+        )  # True when there is no connector or the key is absent
 
-        # Generate unique identifier hash (uses file_id for Google Drive, filename for others)
-        primary_hash, legacy_hash = get_google_drive_unique_identifier(
-            connector, file_name, search_space_id
-        )
 
-        # Generate content hash
-        content_hash = generate_content_hash(file_in_markdown, search_space_id)
-
-        # Check if document exists (with migration support for Google Drive and content_hash fallback)
-        existing_document = await find_existing_document_with_migration(
-            session, primary_hash, legacy_hash, content_hash
-        )
-
-        if existing_document:
-            # Handle existing document (rename detection, content change check)
-            should_skip, doc = await handle_existing_document_update(
-                session,
-                existing_document,
-                content_hash,
-                connector,
-                file_name,
-                primary_hash,
-            )
-            if should_skip:
-                return doc
-            # Content changed - continue to update
-
-        # Get user's long context LLM (needed for both create and update)
-        user_llm = await get_user_long_context_llm(session, user_id, search_space_id)
-        if not user_llm:
-            raise RuntimeError(
-                f"No long context LLM configured for user {user_id} in search space {search_space_id}"
-            )
-
-        # Generate summary with metadata
-        document_metadata = {
-            "file_name": file_name,
-            "etl_service": "UNSTRUCTURED",
-            "document_type": "File Document",
-        }
-        if enable_summary:
-            summary_content, summary_embedding = await generate_document_summary(
-                file_in_markdown, user_llm, document_metadata
-            )
-        else:
-            summary_content = f"File: {file_name}\n\n{file_in_markdown[:4000]}"
-            summary_embedding = embed_text(summary_content)
-
-        # Process chunks
-        chunks = await create_document_chunks(file_in_markdown)
-
-        # Update or create document
-        if existing_document:
-            # Update existing document
-            existing_document.title = file_name
-            existing_document.content = summary_content
-            existing_document.content_hash = content_hash
-            existing_document.embedding = summary_embedding
-            existing_document.document_metadata = {
-                "FILE_NAME": file_name,
-                "ETL_SERVICE": "UNSTRUCTURED",
-            }
-            await safe_set_chunks(session, existing_document, chunks)
-            existing_document.source_markdown = file_in_markdown
-            existing_document.content_needs_reindexing = False
-            existing_document.updated_at = get_current_timestamp()
-            existing_document.status = DocumentStatus.ready()
-
-            await session.commit()
-            await session.refresh(existing_document)
-            document = existing_document
-        else:
-            # Create new document
-            doc_type = DocumentType.FILE
-            if connector and connector.get("type") == DocumentType.GOOGLE_DRIVE_FILE:
-                doc_type = DocumentType.GOOGLE_DRIVE_FILE
-
-            document = Document(
-                search_space_id=search_space_id,
-                title=file_name,
-                document_type=doc_type,
-                document_metadata={
-                    "FILE_NAME": file_name,
-                    "ETL_SERVICE": "UNSTRUCTURED",
-                },
-                content=summary_content,
-                embedding=summary_embedding,
-                chunks=chunks,
-                content_hash=content_hash,
-                unique_identifier_hash=primary_hash,
-                source_markdown=file_in_markdown,
-                content_needs_reindexing=False,
-                updated_at=get_current_timestamp(),
-                created_by_id=user_id,
-                connector_id=connector.get("connector_id") if connector else None,
-                status=DocumentStatus.ready(),
-            )
-
-            session.add(document)
-            await session.commit()
-            await session.refresh(document)
-
-        return document
-    except SQLAlchemyError as db_error:
-        await session.rollback()
-        if "ix_documents_content_hash" in str(db_error):
-            logging.warning(
-                "content_hash collision during commit for %s (Unstructured). Skipping.",
-                file_name,
-            )
-            return None
-        raise db_error
-    except Exception as e:
-        await session.rollback()
-        raise RuntimeError(f"Failed to process file document: {e!s}") from e
+# ---------------------------------------------------------------------------
+# Notification helper
+# ---------------------------------------------------------------------------
 
 
-async def add_received_file_document_using_llamacloud(
-    session: AsyncSession,
-    file_name: str,
-    llamacloud_markdown_document: str,
-    search_space_id: int,
-    user_id: str,
-    connector: dict | None = None,
-    enable_summary: bool = True,
-) -> Document | None:
-    """
-    Process and store document content parsed by LlamaCloud.
-
-    Args:
-        session: Database session
-        file_name: Name of the processed file
-        llamacloud_markdown_document: Markdown content from LlamaCloud parsing
-        search_space_id: ID of the search space
-        user_id: ID of the user
-        connector: Optional connector info for Google Drive files
-
-    Returns:
-        Document object if successful, None if failed
-    """
-    try:
-        # Combine all markdown documents into one
-        file_in_markdown = llamacloud_markdown_document
-
-        # Generate unique identifier hash (uses file_id for Google Drive, filename for others)
-        primary_hash, legacy_hash = get_google_drive_unique_identifier(
-            connector, file_name, search_space_id
-        )
-
-        # Generate content hash
-        content_hash = generate_content_hash(file_in_markdown, search_space_id)
-
-        # Check if document exists (with migration support for Google Drive and content_hash fallback)
-        existing_document = await find_existing_document_with_migration(
-            session, primary_hash, legacy_hash, content_hash
-        )
-
-        if existing_document:
-            # Handle existing document (rename detection, content change check)
-            should_skip, doc = await handle_existing_document_update(
-                session,
-                existing_document,
-                content_hash,
-                connector,
-                file_name,
-                primary_hash,
-            )
-            if should_skip:
-                return doc
-            # Content changed - continue to update
-
-        # Get user's long context LLM (needed for both create and update)
-        user_llm = await get_user_long_context_llm(session, user_id, search_space_id)
-        if not user_llm:
-            raise RuntimeError(
-                f"No long context LLM configured for user {user_id} in search space {search_space_id}"
-            )
-
-        # Generate summary with metadata
-        document_metadata = {
-            "file_name": file_name,
-            "etl_service": "LLAMACLOUD",
-            "document_type": "File Document",
-        }
-        if enable_summary:
-            summary_content, summary_embedding = await generate_document_summary(
-                file_in_markdown, user_llm, document_metadata
-            )
-        else:
-            summary_content = f"File: {file_name}\n\n{file_in_markdown[:4000]}"
-            summary_embedding = embed_text(summary_content)
-
-        # Process chunks
-        chunks = await create_document_chunks(file_in_markdown)
-
-        # Update or create document
-        if existing_document:
-            existing_document.title = file_name
-            existing_document.content = summary_content
-            existing_document.content_hash = content_hash
-            existing_document.embedding = summary_embedding
-            existing_document.document_metadata = {
-                "FILE_NAME": file_name,
-                "ETL_SERVICE": "LLAMACLOUD",
-            }
-            await safe_set_chunks(session, existing_document, chunks)
-            existing_document.source_markdown = file_in_markdown
-            existing_document.content_needs_reindexing = False
-            existing_document.updated_at = get_current_timestamp()
-            existing_document.status = DocumentStatus.ready()
-
-            await session.commit()
-            await session.refresh(existing_document)
-            document = existing_document
-        else:
-            doc_type = DocumentType.FILE
-            if connector and connector.get("type") == DocumentType.GOOGLE_DRIVE_FILE:
-                doc_type = DocumentType.GOOGLE_DRIVE_FILE
-
-            document = Document(
-                search_space_id=search_space_id,
-                title=file_name,
-                document_type=doc_type,
-                document_metadata={
-                    "FILE_NAME": file_name,
-                    "ETL_SERVICE": "LLAMACLOUD",
-                },
-                content=summary_content,
-                embedding=summary_embedding,
-                chunks=chunks,
-                content_hash=content_hash,
-                unique_identifier_hash=primary_hash,
-                source_markdown=file_in_markdown,
-                content_needs_reindexing=False,
-                updated_at=get_current_timestamp(),
-                created_by_id=user_id,
-                connector_id=connector.get("connector_id") if connector else None,
-                status=DocumentStatus.ready(),
-            )
-
-            session.add(document)
-            await session.commit()
-            await session.refresh(document)
-
-        return document
-    except SQLAlchemyError as db_error:
-        await session.rollback()
-        if "ix_documents_content_hash" in str(db_error):
-            logging.warning(
-                "content_hash collision during commit for %s (LlamaCloud). Skipping.",
-                file_name,
-            )
-            return None
-        raise db_error
-    except Exception as e:
-        await session.rollback()
-        raise RuntimeError(
-            f"Failed to process file document using LlamaCloud: {e!s}"
-        ) from e
-
-
-async def add_received_file_document_using_docling(
-    session: AsyncSession,
-    file_name: str,
-    docling_markdown_document: str,
-    search_space_id: int,
-    user_id: str,
-    connector: dict | None = None,
-    enable_summary: bool = True,
-) -> Document | None:
-    """
-    Process and store document content parsed by Docling.
-
-    Args:
-        session: Database session
-        file_name: Name of the processed file
-        docling_markdown_document: Markdown content from Docling parsing
-        search_space_id: ID of the search space
-        user_id: ID of the user
-        connector: Optional connector info for Google Drive files
-
-    Returns:
-        Document object if successful, None if failed
-    """
-    try:
-        file_in_markdown = docling_markdown_document
-
-        # Generate unique identifier hash (uses file_id for Google Drive, filename for others)
-        primary_hash, legacy_hash = get_google_drive_unique_identifier(
-            connector, file_name, search_space_id
-        )
-
-        # Generate content hash
-        content_hash = generate_content_hash(file_in_markdown, search_space_id)
-
-        # Check if document exists (with migration support for Google Drive and content_hash fallback)
-        existing_document = await find_existing_document_with_migration(
-            session, primary_hash, legacy_hash, content_hash
-        )
-
-        if existing_document:
-            # Handle existing document (rename detection, content change check)
-            should_skip, doc = await handle_existing_document_update(
-                session,
-                existing_document,
-                content_hash,
-                connector,
-                file_name,
-                primary_hash,
-            )
-            if should_skip:
-                return doc
-            # Content changed - continue to update
-
-        # Get user's long context LLM (needed for both create and update)
-        user_llm = await get_user_long_context_llm(session, user_id, search_space_id)
-        if not user_llm:
-            raise RuntimeError(
-                f"No long context LLM configured for user {user_id} in search_space {search_space_id}"
-            )
-
-        if enable_summary:
-            from app.services.docling_service import create_docling_service
-
-            docling_service = create_docling_service()
-
-            summary_content = await docling_service.process_large_document_summary(
-                content=file_in_markdown, llm=user_llm, document_title=file_name
-            )
-
-            document_metadata = {
-                "file_name": file_name,
-                "etl_service": "DOCLING",
-                "document_type": "File Document",
-            }
-            metadata_parts = ["# DOCUMENT METADATA"]
-            for key, value in document_metadata.items():
-                if value:
-                    formatted_key = key.replace("_", " ").title()
-                    metadata_parts.append(f"**{formatted_key}:** {value}")
-
-            metadata_section = "\n".join(metadata_parts)
-            enhanced_summary_content = (
-                f"{metadata_section}\n\n# DOCUMENT SUMMARY\n\n{summary_content}"
-            )
-        else:
-            enhanced_summary_content = f"File: {file_name}\n\n{file_in_markdown[:4000]}"
-
-        summary_embedding = embed_text(enhanced_summary_content)
-
-        # Process chunks
-        chunks = await create_document_chunks(file_in_markdown)
-
-        # Update or create document
-        if existing_document:
-            # Update existing document
-            existing_document.title = file_name
-            existing_document.content = enhanced_summary_content
-            existing_document.content_hash = content_hash
-            existing_document.embedding = summary_embedding
-            existing_document.document_metadata = {
-                "FILE_NAME": file_name,
-                "ETL_SERVICE": "DOCLING",
-            }
-            await safe_set_chunks(session, existing_document, chunks)
-            existing_document.source_markdown = file_in_markdown
-            existing_document.content_needs_reindexing = False
-            existing_document.updated_at = get_current_timestamp()
-            existing_document.status = DocumentStatus.ready()  # Mark as ready
-
-            await session.commit()
-            await session.refresh(existing_document)
-            document = existing_document
-        else:
-            # Create new document
-            # Determine document type based on connector
-            doc_type = DocumentType.FILE
-            if connector and connector.get("type") == DocumentType.GOOGLE_DRIVE_FILE:
-                doc_type = DocumentType.GOOGLE_DRIVE_FILE
-
-            document = Document(
-                search_space_id=search_space_id,
-                title=file_name,
-                document_type=doc_type,
-                document_metadata={
-                    "FILE_NAME": file_name,
-                    "ETL_SERVICE": "DOCLING",
-                },
-                content=enhanced_summary_content,
-                embedding=summary_embedding,
-                chunks=chunks,
-                content_hash=content_hash,
-                unique_identifier_hash=primary_hash,
-                source_markdown=file_in_markdown,
-                content_needs_reindexing=False,
-                updated_at=get_current_timestamp(),
-                created_by_id=user_id,
-                connector_id=connector.get("connector_id") if connector else None,
-                status=DocumentStatus.ready(),  # Mark as ready
-            )
-
-            session.add(document)
-            await session.commit()
-            await session.refresh(document)
-
-        return document
-    except SQLAlchemyError as db_error:
-        await session.rollback()
-        if "ix_documents_content_hash" in str(db_error):
-            logging.warning(
-                "content_hash collision during commit for %s (Docling). Skipping.",
-                file_name,
-            )
-            return None
-        raise db_error
-    except Exception as e:
-        await session.rollback()
-        raise RuntimeError(
-            f"Failed to process file document using Docling: {e!s}"
-        ) from e
-
-
-async def _update_document_from_connector(
-    document: Document | None, connector: dict | None, session: AsyncSession
+async def _notify(
+    ctx: _ProcessingContext,
+    stage: str,
+    stage_message: str | None = None,
+    **kwargs,
 ) -> None:
-    """Helper to update document type, metadata, and connector_id from connector info."""
-    if document and connector:
-        if "type" in connector:
-            document.document_type = connector["type"]
-        if "metadata" in connector:
-            # Merge with existing document_metadata (the actual column name)
-            if not document.document_metadata:
-                document.document_metadata = connector["metadata"]
-            else:
-                # Expand existing metadata with connector metadata
-                merged = {**document.document_metadata, **connector["metadata"]}
-                document.document_metadata = merged
-        # Set connector_id if provided for de-indexing support
-        if "connector_id" in connector:
-            document.connector_id = connector["connector_id"]
-        await session.commit()
+    """Send a processing-progress notification if one is attached."""
+    if not ctx.notification:
+        return
+    await NotificationService.document_processing.notify_processing_progress(
+        ctx.session,
+        ctx.notification,
+        stage=stage,
+        stage_message=stage_message,
+        **kwargs,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Page-limit helpers
+# ---------------------------------------------------------------------------
+
+
+def _estimate_pages_safe(page_limit_service, file_path: str) -> int:
+    """Estimate page count with a file-size fallback."""
+    try:
+        return page_limit_service.estimate_pages_before_processing(file_path)
+    except Exception:
+        file_size = os.path.getsize(file_path)
+        return max(1, file_size // (80 * 1024))
+
+
+async def _log_page_divergence(
+    task_logger: TaskLoggingService,
+    log_entry: Log,
+    filename: str,
+    estimated: int,
+    actual: int,
+    final: int,
+) -> None:
+    """Log a warning when the actual page count far exceeds the pre-estimate."""
+    if actual > estimated * 1.5:
+        await task_logger.log_task_progress(
+            log_entry,
+            f"Actual page count higher than estimate: {filename}",
+            {
+                "estimated_before": estimated,
+                "actual_pages": actual,
+                "using_count": final,
+            },
+        )
+
+
+# ===================================================================
+# Handlers for process_file_in_background (legacy / connector path)
+# ===================================================================
+
+
+async def _process_markdown_upload(ctx: _ProcessingContext) -> Document | None:
+    """Read a markdown / text file and create or update a document."""
+    await _notify(ctx, "parsing", "Reading file")
+    await ctx.task_logger.log_task_progress(
+        ctx.log_entry,
+        f"Processing markdown/text file: {ctx.filename}",
+        {"file_type": "markdown", "processing_stage": "reading_file"},
+    )
+
+    with open(ctx.file_path, encoding="utf-8") as f:
+        markdown_content = f.read()
+
+    with contextlib.suppress(Exception):
+        os.unlink(ctx.file_path)
+
+    await _notify(ctx, "chunking")
+    await ctx.task_logger.log_task_progress(
+        ctx.log_entry,
+        f"Creating document from markdown content: {ctx.filename}",
+        {
+            "processing_stage": "creating_document",
+            "content_length": len(markdown_content),
+        },
+    )
+
+    result = await add_received_markdown_file_document(
+        ctx.session,
+        ctx.filename,
+        markdown_content,
+        ctx.search_space_id,
+        ctx.user_id,
+        ctx.connector,
+    )
+    if ctx.connector:
+        await update_document_from_connector(result, ctx.connector, ctx.session)
+
+    if result:
+        await ctx.task_logger.log_task_success(
+            ctx.log_entry,
+            f"Successfully processed markdown file: {ctx.filename}",
+            {
+                "document_id": result.id,
+                "content_hash": result.content_hash,
+                "file_type": "markdown",
+            },
+        )
+    else:
+        await ctx.task_logger.log_task_success(
+            ctx.log_entry,
+            f"Markdown file already exists (duplicate): {ctx.filename}",
+            {"duplicate_detected": True, "file_type": "markdown"},
+        )
+    return result
+
+
+async def _process_direct_convert_upload(ctx: _ProcessingContext) -> Document | None:
+    """Convert a text-based file (csv/tsv/html) to markdown without ETL."""
+    await _notify(ctx, "parsing", "Converting file")
+    await ctx.task_logger.log_task_progress(
+        ctx.log_entry,
+        f"Direct-converting file to markdown: {ctx.filename}",
+        {"file_type": "direct_convert", "processing_stage": "converting"},
+    )
+
+    markdown_content = convert_file_directly(ctx.file_path, ctx.filename)
+
+    with contextlib.suppress(Exception):
+        os.unlink(ctx.file_path)
+
+    await _notify(ctx, "chunking")
+    await ctx.task_logger.log_task_progress(
+        ctx.log_entry,
+        f"Creating document from converted content: {ctx.filename}",
+        {
+            "processing_stage": "creating_document",
+            "content_length": len(markdown_content),
+        },
+    )
+
+    result = await add_received_markdown_file_document(
+        ctx.session,
+        ctx.filename,
+        markdown_content,
+        ctx.search_space_id,
+        ctx.user_id,
+        ctx.connector,
+    )
+    if ctx.connector:
+        await update_document_from_connector(result, ctx.connector, ctx.session)
+
+    if result:
+        await ctx.task_logger.log_task_success(
+            ctx.log_entry,
+            f"Successfully direct-converted file: {ctx.filename}",
+            {
+                "document_id": result.id,
+                "content_hash": result.content_hash,
+                "file_type": "direct_convert",
+            },
+        )
+    else:
+        await ctx.task_logger.log_task_success(
+            ctx.log_entry,
+            f"Direct-converted file already exists (duplicate): {ctx.filename}",
+            {"duplicate_detected": True, "file_type": "direct_convert"},
+        )
+    return result
+
+
+async def _process_audio_upload(ctx: _ProcessingContext) -> Document | None:
+    """Transcribe an audio file and create or update a document."""
+    await _notify(ctx, "parsing", "Transcribing audio")
+    await ctx.task_logger.log_task_progress(
+        ctx.log_entry,
+        f"Processing audio file for transcription: {ctx.filename}",
+        {"file_type": "audio", "processing_stage": "starting_transcription"},
+    )
+
+    stt_service_type = (
+        "local"
+        if app_config.STT_SERVICE and app_config.STT_SERVICE.startswith("local/")
+        else "external"
+    )
+
+    if stt_service_type == "local":
+        from app.services.stt_service import stt_service
+
+        try:
+            stt_result = stt_service.transcribe_file(ctx.file_path)
+            transcribed_text = stt_result.get("text", "")
+            if not transcribed_text:
+                raise ValueError("Transcription returned empty text")
+            transcribed_text = (
+                f"# Transcription of {ctx.filename}\n\n{transcribed_text}"
+            )
+        except Exception as e:
+            raise HTTPException(
+                status_code=422,
+                detail=f"Failed to transcribe audio file {ctx.filename}: {e!s}",
+            ) from e
+
+        await ctx.task_logger.log_task_progress(
+            ctx.log_entry,
+            f"Local STT transcription completed: {ctx.filename}",
+            {
+                "processing_stage": "local_transcription_complete",
+                "language": stt_result.get("language"),
+                "confidence": stt_result.get("language_probability"),
+                "duration": stt_result.get("duration"),
+            },
+        )
+    else:
+        from litellm import atranscription
+
+        with open(ctx.file_path, "rb") as audio_file:
+            transcription_kwargs: dict = {
+                "model": app_config.STT_SERVICE,
+                "file": audio_file,
+                "api_key": app_config.STT_SERVICE_API_KEY,
+            }
+            if app_config.STT_SERVICE_API_BASE:
+                transcription_kwargs["api_base"] = app_config.STT_SERVICE_API_BASE
+
+            transcription_response = await atranscription(**transcription_kwargs)
+            transcribed_text = transcription_response.get("text", "")
+            if not transcribed_text:
+                raise ValueError("Transcription returned empty text")
+
+        transcribed_text = f"# Transcription of {ctx.filename}\n\n{transcribed_text}"
+
+    await ctx.task_logger.log_task_progress(
+        ctx.log_entry,
+        f"Transcription completed, creating document: {ctx.filename}",
+        {
+            "processing_stage": "transcription_complete",
+            "transcript_length": len(transcribed_text),
+        },
+    )
+
+    await _notify(ctx, "chunking")
+
+    with contextlib.suppress(Exception):
+        os.unlink(ctx.file_path)
+
+    result = await add_received_markdown_file_document(
+        ctx.session,
+        ctx.filename,
+        transcribed_text,
+        ctx.search_space_id,
+        ctx.user_id,
+        ctx.connector,
+    )
+    if ctx.connector:
+        await update_document_from_connector(result, ctx.connector, ctx.session)
+
+    if result:
+        await ctx.task_logger.log_task_success(
+            ctx.log_entry,
+            f"Successfully transcribed and processed audio file: {ctx.filename}",
+            {
+                "document_id": result.id,
+                "content_hash": result.content_hash,
+                "file_type": "audio",
+                "transcript_length": len(transcribed_text),
+                "stt_service": stt_service_type,
+            },
+        )
+    else:
+        await ctx.task_logger.log_task_success(
+            ctx.log_entry,
+            f"Audio file transcript already exists (duplicate): {ctx.filename}",
+            {"duplicate_detected": True, "file_type": "audio"},
+        )
+    return result
+
+
+# ---------------------------------------------------------------------------
+# Document file processing (ETL service dispatch)
+# ---------------------------------------------------------------------------
+
+
+async def _etl_unstructured(
+    ctx: _ProcessingContext,
+    page_limit_service,
+    estimated_pages: int,
+) -> Document | None:
+    """Parse and save via the Unstructured ETL service."""
+    await _notify(ctx, "parsing", "Extracting content")
+    await ctx.task_logger.log_task_progress(
+        ctx.log_entry,
+        f"Processing file with Unstructured ETL: {ctx.filename}",
+        {
+            "file_type": "document",
+            "etl_service": "UNSTRUCTURED",
+            "processing_stage": "loading",
+        },
+    )
+
+    docs = await parse_with_unstructured(ctx.file_path)
+
+    await _notify(ctx, "chunking", chunks_count=len(docs))
+    await ctx.task_logger.log_task_progress(
+        ctx.log_entry,
+        f"Unstructured ETL completed, creating document: {ctx.filename}",
+        {"processing_stage": "etl_complete", "elements_count": len(docs)},
+    )
+
+    actual_pages = page_limit_service.estimate_pages_from_elements(docs)
+    final_pages = max(estimated_pages, actual_pages)
+    await _log_page_divergence(
+        ctx.task_logger,
+        ctx.log_entry,
+        ctx.filename,
+        estimated_pages,
+        actual_pages,
+        final_pages,
+    )
+
+    with contextlib.suppress(Exception):
+        os.unlink(ctx.file_path)
+
+    result = await add_received_file_document_using_unstructured(
+        ctx.session,
+        ctx.filename,
+        docs,
+        ctx.search_space_id,
+        ctx.user_id,
+        ctx.connector,
+        enable_summary=ctx.enable_summary,
+    )
+    if ctx.connector:
+        await update_document_from_connector(result, ctx.connector, ctx.session)
+
+    if result:
+        await page_limit_service.update_page_usage(
+            ctx.user_id, final_pages, allow_exceed=True
+        )
+        await ctx.task_logger.log_task_success(
+            ctx.log_entry,
+            f"Successfully processed file with Unstructured: {ctx.filename}",
+            {
+                "document_id": result.id,
+                "content_hash": result.content_hash,
+                "file_type": "document",
+                "etl_service": "UNSTRUCTURED",
+                "pages_processed": final_pages,
+            },
+        )
+    else:
+        await ctx.task_logger.log_task_success(
+            ctx.log_entry,
+            f"Document already exists (duplicate): {ctx.filename}",
+            {
+                "duplicate_detected": True,
+                "file_type": "document",
+                "etl_service": "UNSTRUCTURED",
+            },
+        )
+    return result
+
+
+async def _etl_llamacloud(
+    ctx: _ProcessingContext,
+    page_limit_service,
+    estimated_pages: int,
+) -> Document | None:
+    """Parse and save via the LlamaCloud ETL service."""
+    await _notify(ctx, "parsing", "Extracting content")
+    await ctx.task_logger.log_task_progress(
+        ctx.log_entry,
+        f"Processing file with LlamaCloud ETL: {ctx.filename}",
+        {
+            "file_type": "document",
+            "etl_service": "LLAMACLOUD",
+            "processing_stage": "parsing",
+            "estimated_pages": estimated_pages,
+        },
+    )
+
+    raw_result = await parse_with_llamacloud_retry(
+        file_path=ctx.file_path,
+        estimated_pages=estimated_pages,
+        task_logger=ctx.task_logger,
+        log_entry=ctx.log_entry,
+    )
+
+    with contextlib.suppress(Exception):
+        os.unlink(ctx.file_path)
+
+    markdown_documents = await raw_result.aget_markdown_documents(split_by_page=False)
+
+    await _notify(ctx, "chunking", chunks_count=len(markdown_documents))
+    await ctx.task_logger.log_task_progress(
+        ctx.log_entry,
+        f"LlamaCloud parsing completed, creating documents: {ctx.filename}",
+        {
+            "processing_stage": "parsing_complete",
+            "documents_count": len(markdown_documents),
+        },
+    )
+
+    if not markdown_documents:
+        await ctx.task_logger.log_task_failure(
+            ctx.log_entry,
+            f"LlamaCloud parsing returned no documents: {ctx.filename}",
+            "ETL service returned empty document list",
+            {"error_type": "EmptyDocumentList", "etl_service": "LLAMACLOUD"},
+        )
+        raise ValueError(f"LlamaCloud parsing returned no documents for {ctx.filename}")
+
+    actual_pages = page_limit_service.estimate_pages_from_markdown(markdown_documents)
+    final_pages = max(estimated_pages, actual_pages)
+    await _log_page_divergence(
+        ctx.task_logger,
+        ctx.log_entry,
+        ctx.filename,
+        estimated_pages,
+        actual_pages,
+        final_pages,
+    )
+
+    any_created = False
+    last_doc: Document | None = None
+
+    for doc in markdown_documents:
+        doc_result = await add_received_file_document_using_llamacloud(
+            ctx.session,
+            ctx.filename,
+            llamacloud_markdown_document=doc.text,
+            search_space_id=ctx.search_space_id,
+            user_id=ctx.user_id,
+            connector=ctx.connector,
+            enable_summary=ctx.enable_summary,
+        )
+        if doc_result:
+            any_created = True
+            last_doc = doc_result
+
+    if any_created:
+        await page_limit_service.update_page_usage(
+            ctx.user_id, final_pages, allow_exceed=True
+        )
+        if ctx.connector:
+            await update_document_from_connector(last_doc, ctx.connector, ctx.session)
+        await ctx.task_logger.log_task_success(
+            ctx.log_entry,
+            f"Successfully processed file with LlamaCloud: {ctx.filename}",
+            {
+                "document_id": last_doc.id,
+                "content_hash": last_doc.content_hash,
+                "file_type": "document",
+                "etl_service": "LLAMACLOUD",
+                "pages_processed": final_pages,
+                "documents_count": len(markdown_documents),
+            },
+        )
+        return last_doc
+
+    await ctx.task_logger.log_task_success(
+        ctx.log_entry,
+        f"Document already exists (duplicate): {ctx.filename}",
+        {
+            "duplicate_detected": True,
+            "file_type": "document",
+            "etl_service": "LLAMACLOUD",
+            "documents_count": len(markdown_documents),
+        },
+    )
+    return None
+
+
+async def _etl_docling(
+    ctx: _ProcessingContext,
+    page_limit_service,
+    estimated_pages: int,
+) -> Document | None:
+    """Parse and save via the Docling ETL service."""
+    await _notify(ctx, "parsing", "Extracting content")
+    await ctx.task_logger.log_task_progress(
+        ctx.log_entry,
+        f"Processing file with Docling ETL: {ctx.filename}",
+        {
+            "file_type": "document",
+            "etl_service": "DOCLING",
+            "processing_stage": "parsing",
+        },
+    )
+
+    content = await parse_with_docling(ctx.file_path, ctx.filename)
+
+    with contextlib.suppress(Exception):
+        os.unlink(ctx.file_path)
+
+    await ctx.task_logger.log_task_progress(
+        ctx.log_entry,
+        f"Docling parsing completed, creating document: {ctx.filename}",
+        {"processing_stage": "parsing_complete", "content_length": len(content)},
+    )
+
+    actual_pages = page_limit_service.estimate_pages_from_content_length(len(content))
+    final_pages = max(estimated_pages, actual_pages)
+    await _log_page_divergence(
+        ctx.task_logger,
+        ctx.log_entry,
+        ctx.filename,
+        estimated_pages,
+        actual_pages,
+        final_pages,
+    )
+
+    await _notify(ctx, "chunking")
+
+    result = await add_received_file_document_using_docling(
+        ctx.session,
+        ctx.filename,
+        docling_markdown_document=content,
+        search_space_id=ctx.search_space_id,
+        user_id=ctx.user_id,
+        connector=ctx.connector,
+        enable_summary=ctx.enable_summary,
+    )
+
+    if result:
+        await page_limit_service.update_page_usage(
+            ctx.user_id, final_pages, allow_exceed=True
+        )
+        if ctx.connector:
+            await update_document_from_connector(result, ctx.connector, ctx.session)
+        await ctx.task_logger.log_task_success(
+            ctx.log_entry,
+            f"Successfully processed file with Docling: {ctx.filename}",
+            {
+                "document_id": result.id,
+                "content_hash": result.content_hash,
+                "file_type": "document",
+                "etl_service": "DOCLING",
+                "pages_processed": final_pages,
+            },
+        )
+    else:
+        await ctx.task_logger.log_task_success(
+            ctx.log_entry,
+            f"Document already exists (duplicate): {ctx.filename}",
+            {
+                "duplicate_detected": True,
+                "file_type": "document",
+                "etl_service": "DOCLING",
+            },
+        )
+    return result
+
+
+async def _process_document_upload(ctx: _ProcessingContext) -> Document | None:
+    """Route a document file to the configured ETL service."""
+    from app.services.page_limit_service import PageLimitExceededError, PageLimitService
+
+    page_limit_service = PageLimitService(ctx.session)
+    estimated_pages = _estimate_pages_safe(page_limit_service, ctx.file_path)
+
+    await ctx.task_logger.log_task_progress(
+        ctx.log_entry,
+        f"Estimated {estimated_pages} pages for file: {ctx.filename}",
+        {"estimated_pages": estimated_pages, "file_type": "document"},
+    )
+
+    try:
+        await page_limit_service.check_page_limit(ctx.user_id, estimated_pages)
+    except PageLimitExceededError as e:
+        await ctx.task_logger.log_task_failure(
+            ctx.log_entry,
+            f"Page limit exceeded before processing: {ctx.filename}",
+            str(e),
+            {
+                "error_type": "PageLimitExceeded",
+                "pages_used": e.pages_used,
+                "pages_limit": e.pages_limit,
+                "estimated_pages": estimated_pages,
+            },
+        )
+        with contextlib.suppress(Exception):
+            os.unlink(ctx.file_path)
+        raise HTTPException(status_code=403, detail=str(e)) from e
+
+    etl_dispatch = {
+        "UNSTRUCTURED": _etl_unstructured,
+        "LLAMACLOUD": _etl_llamacloud,
+        "DOCLING": _etl_docling,
+    }
+    handler = etl_dispatch.get(app_config.ETL_SERVICE)
+    if handler is None:
+        raise RuntimeError(f"Unknown ETL_SERVICE: {app_config.ETL_SERVICE}")
+
+    return await handler(ctx, page_limit_service, estimated_pages)
+
+
+# ===================================================================
+# Public orchestrators
+# ===================================================================
 
 
 async def process_file_in_background(
@@ -910,726 +690,35 @@ async def process_file_in_background(
     session: AsyncSession,
     task_logger: TaskLoggingService,
     log_entry: Log,
-    connector: dict
-    | None = None,  # Optional: {"type": "GOOGLE_DRIVE_FILE", "metadata": {...}}
-    notification: Notification
-    | None = None,  # Optional notification for progress updates
+    connector: dict | None = None,
+    notification: Notification | None = None,
 ) -> Document | None:
+    ctx = _ProcessingContext(
+        session=session,
+        file_path=file_path,
+        filename=filename,
+        search_space_id=search_space_id,
+        user_id=user_id,
+        task_logger=task_logger,
+        log_entry=log_entry,
+        connector=connector,
+        notification=notification,
+    )
+
     try:
-        # Check if the file is a markdown or text file
-        if filename.lower().endswith((".md", ".markdown", ".txt")):
-            # Update notification: parsing stage
-            if notification:
-                await (
-                    NotificationService.document_processing.notify_processing_progress(
-                        session,
-                        notification,
-                        stage="parsing",
-                        stage_message="Reading file",
-                    )
-                )
+        category = classify_file(filename)
 
-            await task_logger.log_task_progress(
-                log_entry,
-                f"Processing markdown/text file: {filename}",
-                {"file_type": "markdown", "processing_stage": "reading_file"},
-            )
+        if category == FileCategory.MARKDOWN:
+            return await _process_markdown_upload(ctx)
+        if category == FileCategory.DIRECT_CONVERT:
+            return await _process_direct_convert_upload(ctx)
+        if category == FileCategory.AUDIO:
+            return await _process_audio_upload(ctx)
+        return await _process_document_upload(ctx)
 
-            # For markdown files, read the content directly
-            with open(file_path, encoding="utf-8") as f:
-                markdown_content = f.read()
-
-            # Clean up the temp file
-            import os
-
-            try:
-                os.unlink(file_path)
-            except Exception as e:
-                print("Error deleting temp file", e)
-                pass
-
-            # Update notification: chunking stage
-            if notification:
-                await (
-                    NotificationService.document_processing.notify_processing_progress(
-                        session, notification, stage="chunking"
-                    )
-                )
-
-            await task_logger.log_task_progress(
-                log_entry,
-                f"Creating document from markdown content: {filename}",
-                {
-                    "processing_stage": "creating_document",
-                    "content_length": len(markdown_content),
-                },
-            )
-
-            # Process markdown directly through specialized function
-            result = await add_received_markdown_file_document(
-                session, filename, markdown_content, search_space_id, user_id, connector
-            )
-
-            if connector:
-                await _update_document_from_connector(result, connector, session)
-
-            if result:
-                await task_logger.log_task_success(
-                    log_entry,
-                    f"Successfully processed markdown file: {filename}",
-                    {
-                        "document_id": result.id,
-                        "content_hash": result.content_hash,
-                        "file_type": "markdown",
-                    },
-                )
-                return result
-            else:
-                await task_logger.log_task_success(
-                    log_entry,
-                    f"Markdown file already exists (duplicate): {filename}",
-                    {"duplicate_detected": True, "file_type": "markdown"},
-                )
-                return None
-
-        # Check if the file is an audio file
-        elif filename.lower().endswith(
-            (".mp3", ".mp4", ".mpeg", ".mpga", ".m4a", ".wav", ".webm")
-        ):
-            # Update notification: parsing stage (transcription)
-            if notification:
-                await (
-                    NotificationService.document_processing.notify_processing_progress(
-                        session,
-                        notification,
-                        stage="parsing",
-                        stage_message="Transcribing audio",
-                    )
-                )
-
-            await task_logger.log_task_progress(
-                log_entry,
-                f"Processing audio file for transcription: {filename}",
-                {"file_type": "audio", "processing_stage": "starting_transcription"},
-            )
-
-            # Determine STT service type
-            stt_service_type = (
-                "local"
-                if app_config.STT_SERVICE
-                and app_config.STT_SERVICE.startswith("local/")
-                else "external"
-            )
-
-            # Check if using local STT service
-            if stt_service_type == "local":
-                # Use local Faster-Whisper for transcription
-                from app.services.stt_service import stt_service
-
-                try:
-                    result = stt_service.transcribe_file(file_path)
-                    transcribed_text = result.get("text", "")
-
-                    if not transcribed_text:
-                        raise ValueError("Transcription returned empty text")
-
-                    # Add metadata about the transcription
-                    transcribed_text = (
-                        f"# Transcription of {filename}\n\n{transcribed_text}"
-                    )
-                except Exception as e:
-                    raise HTTPException(
-                        status_code=422,
-                        detail=f"Failed to transcribe audio file {filename}: {e!s}",
-                    ) from e
-
-                await task_logger.log_task_progress(
-                    log_entry,
-                    f"Local STT transcription completed: {filename}",
-                    {
-                        "processing_stage": "local_transcription_complete",
-                        "language": result.get("language"),
-                        "confidence": result.get("language_probability"),
-                        "duration": result.get("duration"),
-                    },
-                )
-            else:
-                # Use LiteLLM for audio transcription
-                with open(file_path, "rb") as audio_file:
-                    transcription_kwargs = {
-                        "model": app_config.STT_SERVICE,
-                        "file": audio_file,
-                        "api_key": app_config.STT_SERVICE_API_KEY,
-                    }
-                    if app_config.STT_SERVICE_API_BASE:
-                        transcription_kwargs["api_base"] = (
-                            app_config.STT_SERVICE_API_BASE
-                        )
-
-                    transcription_response = await atranscription(
-                        **transcription_kwargs
-                    )
-
-                    # Extract the transcribed text
-                    transcribed_text = transcription_response.get("text", "")
-
-                    if not transcribed_text:
-                        raise ValueError("Transcription returned empty text")
-
-                # Add metadata about the transcription
-                transcribed_text = (
-                    f"# Transcription of {filename}\n\n{transcribed_text}"
-                )
-
-            await task_logger.log_task_progress(
-                log_entry,
-                f"Transcription completed, creating document: {filename}",
-                {
-                    "processing_stage": "transcription_complete",
-                    "transcript_length": len(transcribed_text),
-                },
-            )
-
-            # Update notification: chunking stage
-            if notification:
-                await (
-                    NotificationService.document_processing.notify_processing_progress(
-                        session, notification, stage="chunking"
-                    )
-                )
-
-            # Clean up the temp file
-            try:
-                os.unlink(file_path)
-            except Exception as e:
-                print("Error deleting temp file", e)
-                pass
-
-            # Process transcription as markdown document
-            result = await add_received_markdown_file_document(
-                session, filename, transcribed_text, search_space_id, user_id, connector
-            )
-
-            if connector:
-                await _update_document_from_connector(result, connector, session)
-
-            if result:
-                await task_logger.log_task_success(
-                    log_entry,
-                    f"Successfully transcribed and processed audio file: {filename}",
-                    {
-                        "document_id": result.id,
-                        "content_hash": result.content_hash,
-                        "file_type": "audio",
-                        "transcript_length": len(transcribed_text),
-                        "stt_service": stt_service_type,
-                    },
-                )
-                return result
-            else:
-                await task_logger.log_task_success(
-                    log_entry,
-                    f"Audio file transcript already exists (duplicate): {filename}",
-                    {"duplicate_detected": True, "file_type": "audio"},
-                )
-                return None
-
-        else:
-            # Import page limit service
-            from app.services.page_limit_service import (
-                PageLimitExceededError,
-                PageLimitService,
-            )
-
-            # Initialize page limit service
-            page_limit_service = PageLimitService(session)
-
-            # CRITICAL: Estimate page count BEFORE making expensive ETL API calls
-            # This prevents users from incurring costs on files that would exceed their limit
-            try:
-                estimated_pages_before = (
-                    page_limit_service.estimate_pages_before_processing(file_path)
-                )
-            except Exception:
-                # If estimation fails, use a conservative estimate based on file size
-                import os
-
-                file_size = os.path.getsize(file_path)
-                estimated_pages_before = max(
-                    1, file_size // (80 * 1024)
-                )  # ~80KB per page
-
-            await task_logger.log_task_progress(
-                log_entry,
-                f"Estimated {estimated_pages_before} pages for file: {filename}",
-                {
-                    "estimated_pages": estimated_pages_before,
-                    "file_type": "document",
-                },
-            )
-
-            # Check page limit BEFORE calling ETL service to avoid unnecessary costs
-            try:
-                await page_limit_service.check_page_limit(
-                    user_id, estimated_pages_before
-                )
-            except PageLimitExceededError as e:
-                await task_logger.log_task_failure(
-                    log_entry,
-                    f"Page limit exceeded before processing: {filename}",
-                    str(e),
-                    {
-                        "error_type": "PageLimitExceeded",
-                        "pages_used": e.pages_used,
-                        "pages_limit": e.pages_limit,
-                        "estimated_pages": estimated_pages_before,
-                    },
-                )
-                # Clean up the temp file
-                import os
-
-                with contextlib.suppress(Exception):
-                    os.unlink(file_path)
-
-                raise HTTPException(
-                    status_code=403,
-                    detail=str(e),
-                ) from e
-
-            if app_config.ETL_SERVICE == "UNSTRUCTURED":
-                # Update notification: parsing stage
-                if notification:
-                    await NotificationService.document_processing.notify_processing_progress(
-                        session,
-                        notification,
-                        stage="parsing",
-                        stage_message="Extracting content",
-                    )
-
-                await task_logger.log_task_progress(
-                    log_entry,
-                    f"Processing file with Unstructured ETL: {filename}",
-                    {
-                        "file_type": "document",
-                        "etl_service": "UNSTRUCTURED",
-                        "processing_stage": "loading",
-                    },
-                )
-
-                from langchain_unstructured import UnstructuredLoader
-
-                # Process the file
-                loader = UnstructuredLoader(
-                    file_path,
-                    mode="elements",
-                    post_processors=[],
-                    languages=["eng"],
-                    include_orig_elements=False,
-                    include_metadata=False,
-                    strategy="auto",
-                )
-
-                docs = await loader.aload()
-
-                # Update notification: chunking stage
-                if notification:
-                    await NotificationService.document_processing.notify_processing_progress(
-                        session, notification, stage="chunking", chunks_count=len(docs)
-                    )
-
-                await task_logger.log_task_progress(
-                    log_entry,
-                    f"Unstructured ETL completed, creating document: {filename}",
-                    {"processing_stage": "etl_complete", "elements_count": len(docs)},
-                )
-
-                # Verify actual page count from parsed documents
-                actual_pages = page_limit_service.estimate_pages_from_elements(docs)
-
-                # Use the higher of the two estimates for safety (in case pre-estimate was too low)
-                final_page_count = max(estimated_pages_before, actual_pages)
-
-                # If actual is significantly higher than estimate, log a warning
-                if actual_pages > estimated_pages_before * 1.5:
-                    await task_logger.log_task_progress(
-                        log_entry,
-                        f"Actual page count higher than estimate: {filename}",
-                        {
-                            "estimated_before": estimated_pages_before,
-                            "actual_pages": actual_pages,
-                            "using_count": final_page_count,
-                        },
-                    )
-
-                # Clean up the temp file
-                import os
-
-                try:
-                    os.unlink(file_path)
-                except Exception as e:
-                    print("Error deleting temp file", e)
-                    pass
-
-                enable_summary = (
-                    connector.get("enable_summary", True) if connector else True
-                )
-                result = await add_received_file_document_using_unstructured(
-                    session,
-                    filename,
-                    docs,
-                    search_space_id,
-                    user_id,
-                    connector,
-                    enable_summary=enable_summary,
-                )
-
-                if connector:
-                    await _update_document_from_connector(result, connector, session)
-
-                if result:
-                    # Update page usage after successful processing
-                    # allow_exceed=True because document was already created after passing initial check
-                    await page_limit_service.update_page_usage(
-                        user_id, final_page_count, allow_exceed=True
-                    )
-
-                    await task_logger.log_task_success(
-                        log_entry,
-                        f"Successfully processed file with Unstructured: {filename}",
-                        {
-                            "document_id": result.id,
-                            "content_hash": result.content_hash,
-                            "file_type": "document",
-                            "etl_service": "UNSTRUCTURED",
-                            "pages_processed": final_page_count,
-                        },
-                    )
-                    return result
-                else:
-                    await task_logger.log_task_success(
-                        log_entry,
-                        f"Document already exists (duplicate): {filename}",
-                        {
-                            "duplicate_detected": True,
-                            "file_type": "document",
-                            "etl_service": "UNSTRUCTURED",
-                        },
-                    )
-                    return None
-
-            elif app_config.ETL_SERVICE == "LLAMACLOUD":
-                # Update notification: parsing stage
-                if notification:
-                    await NotificationService.document_processing.notify_processing_progress(
-                        session,
-                        notification,
-                        stage="parsing",
-                        stage_message="Extracting content",
-                    )
-
-                await task_logger.log_task_progress(
-                    log_entry,
-                    f"Processing file with LlamaCloud ETL: {filename}",
-                    {
-                        "file_type": "document",
-                        "etl_service": "LLAMACLOUD",
-                        "processing_stage": "parsing",
-                        "estimated_pages": estimated_pages_before,
-                    },
-                )
-
-                # Parse file with retry logic for SSL/connection errors (common with large files)
-                result = await parse_with_llamacloud_retry(
-                    file_path=file_path,
-                    estimated_pages=estimated_pages_before,
-                    task_logger=task_logger,
-                    log_entry=log_entry,
-                )
-
-                # Clean up the temp file
-                import os
-
-                try:
-                    os.unlink(file_path)
-                except Exception as e:
-                    print("Error deleting temp file", e)
-                    pass
-
-                # Get markdown documents from the result
-                markdown_documents = await result.aget_markdown_documents(
-                    split_by_page=False
-                )
-
-                # Update notification: chunking stage
-                if notification:
-                    await NotificationService.document_processing.notify_processing_progress(
-                        session,
-                        notification,
-                        stage="chunking",
-                        chunks_count=len(markdown_documents),
-                    )
-
-                await task_logger.log_task_progress(
-                    log_entry,
-                    f"LlamaCloud parsing completed, creating documents: {filename}",
-                    {
-                        "processing_stage": "parsing_complete",
-                        "documents_count": len(markdown_documents),
-                    },
-                )
-
-                # Check if LlamaCloud returned any documents
-                if not markdown_documents or len(markdown_documents) == 0:
-                    await task_logger.log_task_failure(
-                        log_entry,
-                        f"LlamaCloud parsing returned no documents: {filename}",
-                        "ETL service returned empty document list",
-                        {
-                            "error_type": "EmptyDocumentList",
-                            "etl_service": "LLAMACLOUD",
-                        },
-                    )
-                    raise ValueError(
-                        f"LlamaCloud parsing returned no documents for {filename}"
-                    )
-
-                # Verify actual page count from parsed markdown documents
-                actual_pages = page_limit_service.estimate_pages_from_markdown(
-                    markdown_documents
-                )
-
-                # Use the higher of the two estimates for safety (in case pre-estimate was too low)
-                final_page_count = max(estimated_pages_before, actual_pages)
-
-                # If actual is significantly higher than estimate, log a warning
-                if actual_pages > estimated_pages_before * 1.5:
-                    await task_logger.log_task_progress(
-                        log_entry,
-                        f"Actual page count higher than estimate: {filename}",
-                        {
-                            "estimated_before": estimated_pages_before,
-                            "actual_pages": actual_pages,
-                            "using_count": final_page_count,
-                        },
-                    )
-
-                # Track if any document was successfully created (not a duplicate)
-                any_doc_created = False
-                last_created_doc = None
-
-                for doc in markdown_documents:
-                    # Extract text content from the markdown documents
-                    markdown_content = doc.text
-
-                    enable_summary = (
-                        connector.get("enable_summary", True) if connector else True
-                    )
-                    doc_result = await add_received_file_document_using_llamacloud(
-                        session,
-                        filename,
-                        llamacloud_markdown_document=markdown_content,
-                        search_space_id=search_space_id,
-                        user_id=user_id,
-                        connector=connector,
-                        enable_summary=enable_summary,
-                    )
-
-                    # Track if this document was successfully created
-                    if doc_result:
-                        any_doc_created = True
-                        last_created_doc = doc_result
-
-                # Update page usage once after processing all documents
-                # Only update if at least one document was created (not all duplicates)
-                if any_doc_created:
-                    # Update page usage after successful processing
-                    # allow_exceed=True because document was already created after passing initial check
-                    await page_limit_service.update_page_usage(
-                        user_id, final_page_count, allow_exceed=True
-                    )
-
-                    if connector:
-                        await _update_document_from_connector(
-                            last_created_doc, connector, session
-                        )
-
-                    await task_logger.log_task_success(
-                        log_entry,
-                        f"Successfully processed file with LlamaCloud: {filename}",
-                        {
-                            "document_id": last_created_doc.id,
-                            "content_hash": last_created_doc.content_hash,
-                            "file_type": "document",
-                            "etl_service": "LLAMACLOUD",
-                            "pages_processed": final_page_count,
-                            "documents_count": len(markdown_documents),
-                        },
-                    )
-                    return last_created_doc
-                else:
-                    # All documents were duplicates (markdown_documents was not empty, but all returned None)
-                    await task_logger.log_task_success(
-                        log_entry,
-                        f"Document already exists (duplicate): {filename}",
-                        {
-                            "duplicate_detected": True,
-                            "file_type": "document",
-                            "etl_service": "LLAMACLOUD",
-                            "documents_count": len(markdown_documents),
-                        },
-                    )
-                    return None
-
-            elif app_config.ETL_SERVICE == "DOCLING":
-                # Update notification: parsing stage
-                if notification:
-                    await NotificationService.document_processing.notify_processing_progress(
-                        session,
-                        notification,
-                        stage="parsing",
-                        stage_message="Extracting content",
-                    )
-
-                await task_logger.log_task_progress(
-                    log_entry,
-                    f"Processing file with Docling ETL: {filename}",
-                    {
-                        "file_type": "document",
-                        "etl_service": "DOCLING",
-                        "processing_stage": "parsing",
-                    },
-                )
-
-                # Use Docling service for document processing
-                from app.services.docling_service import create_docling_service
-
-                # Create Docling service
-                docling_service = create_docling_service()
-
-                # Suppress pdfminer warnings that can cause processing to hang
-                # These warnings are harmless but can spam logs and potentially halt processing
-                # Suppress both Python warnings and logging warnings from pdfminer
-                pdfminer_logger = getLogger("pdfminer")
-                original_level = pdfminer_logger.level
-
-                with warnings.catch_warnings():
-                    warnings.filterwarnings(
-                        "ignore", category=UserWarning, module="pdfminer"
-                    )
-                    warnings.filterwarnings(
-                        "ignore",
-                        message=".*Cannot set gray non-stroke color.*",
-                    )
-                    warnings.filterwarnings("ignore", message=".*invalid float value.*")
-
-                    # Temporarily suppress pdfminer logging warnings
-                    pdfminer_logger.setLevel(ERROR)
-
-                    try:
-                        # Process the document
-                        result = await docling_service.process_document(
-                            file_path, filename
-                        )
-                    finally:
-                        # Restore original logging level
-                        pdfminer_logger.setLevel(original_level)
-
-                # Clean up the temp file
-                import os
-
-                try:
-                    os.unlink(file_path)
-                except Exception as e:
-                    print("Error deleting temp file", e)
-                    pass
-
-                await task_logger.log_task_progress(
-                    log_entry,
-                    f"Docling parsing completed, creating document: {filename}",
-                    {
-                        "processing_stage": "parsing_complete",
-                        "content_length": len(result["content"]),
-                    },
-                )
-
-                # Verify actual page count from content length
-                actual_pages = page_limit_service.estimate_pages_from_content_length(
-                    len(result["content"])
-                )
-
-                # Use the higher of the two estimates for safety (in case pre-estimate was too low)
-                final_page_count = max(estimated_pages_before, actual_pages)
-
-                # If actual is significantly higher than estimate, log a warning
-                if actual_pages > estimated_pages_before * 1.5:
-                    await task_logger.log_task_progress(
-                        log_entry,
-                        f"Actual page count higher than estimate: {filename}",
-                        {
-                            "estimated_before": estimated_pages_before,
-                            "actual_pages": actual_pages,
-                            "using_count": final_page_count,
-                        },
-                    )
-
-                # Update notification: chunking stage
-                if notification:
-                    await NotificationService.document_processing.notify_processing_progress(
-                        session, notification, stage="chunking"
-                    )
-
-                enable_summary = (
-                    connector.get("enable_summary", True) if connector else True
-                )
-                doc_result = await add_received_file_document_using_docling(
-                    session,
-                    filename,
-                    docling_markdown_document=result["content"],
-                    search_space_id=search_space_id,
-                    user_id=user_id,
-                    connector=connector,
-                    enable_summary=enable_summary,
-                )
-
-                if doc_result:
-                    # Update page usage after successful processing
-                    # allow_exceed=True because document was already created after passing initial check
-                    await page_limit_service.update_page_usage(
-                        user_id, final_page_count, allow_exceed=True
-                    )
-
-                    if connector:
-                        await _update_document_from_connector(
-                            doc_result, connector, session
-                        )
-
-                    await task_logger.log_task_success(
-                        log_entry,
-                        f"Successfully processed file with Docling: {filename}",
-                        {
-                            "document_id": doc_result.id,
-                            "content_hash": doc_result.content_hash,
-                            "file_type": "document",
-                            "etl_service": "DOCLING",
-                            "pages_processed": final_page_count,
-                        },
-                    )
-                    return doc_result
-                else:
-                    await task_logger.log_task_success(
-                        log_entry,
-                        f"Document already exists (duplicate): {filename}",
-                        {
-                            "duplicate_detected": True,
-                            "file_type": "document",
-                            "etl_service": "DOCLING",
-                        },
-                    )
-                    return None
     except Exception as e:
         await session.rollback()
 
-        # For page limit errors, use the detailed message from the exception
         from app.services.page_limit_service import PageLimitExceededError
 
         if isinstance(e, PageLimitExceededError):
@@ -1645,10 +734,225 @@ async def process_file_in_background(
             str(e),
             {"error_type": type(e).__name__, "filename": filename},
         )
-        import logging
-
         logging.error(f"Error processing file in background: {error_message}")
-        raise  # Re-raise so the wrapper can also handle it
+        raise
+
+
+# ===================================================================
+# 2-phase handler (process_file_in_background_with_document)
+# ===================================================================
+
+
+async def _extract_file_content(
+    file_path: str,
+    filename: str,
+    session: AsyncSession,
+    user_id: str,
+    task_logger: TaskLoggingService,
+    log_entry: Log,
+    notification: Notification | None,  # progress updates are skipped when None
+) -> tuple[str, str]:
+    """
+    Extract markdown from a file per its classify_file() category, then unlink it.
+
+    Returns:
+        Tuple of (markdown_content, etl_service_name).
+    """
+    category = classify_file(filename)  # routing uses the filename only
+
+    if category == FileCategory.MARKDOWN:
+        if notification:
+            await NotificationService.document_processing.notify_processing_progress(
+                session,
+                notification,
+                stage="parsing",
+                stage_message="Reading file",
+            )
+        await task_logger.log_task_progress(
+            log_entry,
+            f"Processing markdown/text file: {filename}",
+            {"file_type": "markdown", "processing_stage": "reading_file"},
+        )
+        with open(file_path, encoding="utf-8") as f:  # file is decoded as UTF-8
+            content = f.read()
+        with contextlib.suppress(Exception):  # best-effort cleanup; errors ignored
+            os.unlink(file_path)  # not reached if the read above raised
+        return content, "MARKDOWN"
+
+    if category == FileCategory.DIRECT_CONVERT:
+        if notification:
+            await NotificationService.document_processing.notify_processing_progress(
+                session,
+                notification,
+                stage="parsing",
+                stage_message="Converting file",
+            )
+        await task_logger.log_task_progress(
+            log_entry,
+            f"Direct-converting file to markdown: {filename}",
+            {"file_type": "direct_convert", "processing_stage": "converting"},
+        )
+        content = convert_file_directly(file_path, filename)  # called without await
+        with contextlib.suppress(Exception):  # best-effort cleanup; errors ignored
+            os.unlink(file_path)
+        return content, "DIRECT_CONVERT"
+
+    if category == FileCategory.AUDIO:
+        if notification:
+            await NotificationService.document_processing.notify_processing_progress(
+                session,
+                notification,
+                stage="parsing",
+                stage_message="Transcribing audio",
+            )
+        await task_logger.log_task_progress(
+            log_entry,
+            f"Processing audio file for transcription: {filename}",
+            {"file_type": "audio", "processing_stage": "starting_transcription"},
+        )
+        transcribed_text = await _transcribe_audio(file_path, filename)
+        with contextlib.suppress(Exception):  # best-effort cleanup; errors ignored
+            os.unlink(file_path)
+        return transcribed_text, "AUDIO_TRANSCRIPTION"
+
+    # Document file — use ETL service (that helper unlinks file_path itself)
+    return await _extract_document_content(
+        file_path,
+        filename,
+        session,
+        user_id,
+        task_logger,
+        log_entry,
+        notification,
+    )
+
+
+async def _transcribe_audio(file_path: str, filename: str) -> str:
+    """Transcribe audio via local or LiteLLM STT; raise ValueError on empty text."""
+    stt_service_type = (
+        "local"  # chosen only when STT_SERVICE is set and starts with "local/"
+        if app_config.STT_SERVICE and app_config.STT_SERVICE.startswith("local/")
+        else "external"  # unset STT_SERVICE or any other value
+    )
+
+    if stt_service_type == "local":
+        from app.services.stt_service import stt_service
+
+        result = stt_service.transcribe_file(file_path)  # called without await
+        text = result.get("text", "")
+        if not text:
+            raise ValueError("Transcription returned empty text")
+    else:
+        from litellm import atranscription
+
+        with open(file_path, "rb") as audio_file:  # stays open for the API call
+            kwargs: dict = {
+                "model": app_config.STT_SERVICE,
+                "file": audio_file,
+                "api_key": app_config.STT_SERVICE_API_KEY,
+            }
+            if app_config.STT_SERVICE_API_BASE:  # api_base is sent only when set
+                kwargs["api_base"] = app_config.STT_SERVICE_API_BASE
+            response = await atranscription(**kwargs)
+            text = response.get("text", "")
+            if not text:
+                raise ValueError("Transcription returned empty text")
+
+    return f"# Transcription of {filename}\n\n{text}"  # heading line + transcript
+
+
+async def _extract_document_content(
+    file_path: str,
+    filename: str,
+    session: AsyncSession,
+    user_id: str,
+    task_logger: TaskLoggingService,
+    log_entry: Log,
+    notification: Notification | None,  # progress update is skipped when None
+) -> tuple[str, str]:
+    """
+    Parse a document via app_config.ETL_SERVICE after a page-limit check.
+
+    Returns:
+        Tuple of (markdown_content, etl_service_name).
+    """
+    from app.services.page_limit_service import PageLimitService
+
+    page_limit_service = PageLimitService(session)
+
+    try:
+        estimated_pages = page_limit_service.estimate_pages_before_processing(file_path)
+    except Exception:  # estimator failed: fall back to a size-based guess
+        file_size = os.path.getsize(file_path)
+        estimated_pages = max(1, file_size // (80 * 1024))  # 1 page per 80 KiB
+    # NOTE(review): presumably raises when the user is over quota — confirm
+    await page_limit_service.check_page_limit(user_id, estimated_pages)
+
+    etl_service = app_config.ETL_SERVICE
+    markdown_content: str | None = None
+
+    if notification:
+        await NotificationService.document_processing.notify_processing_progress(
+            session,
+            notification,
+            stage="parsing",
+            stage_message="Extracting content",
+        )
+
+    if etl_service == "UNSTRUCTURED":
+        from app.utils.document_converters import convert_document_to_markdown
+
+        docs = await parse_with_unstructured(file_path)
+        markdown_content = await convert_document_to_markdown(docs)
+        actual_pages = page_limit_service.estimate_pages_from_elements(docs)
+        final_pages = max(estimated_pages, actual_pages)  # record the larger count
+        await page_limit_service.update_page_usage(
+            user_id, final_pages, allow_exceed=True
+        )
+
+    elif etl_service == "LLAMACLOUD":
+        raw_result = await parse_with_llamacloud_retry(
+            file_path=file_path,
+            estimated_pages=estimated_pages,
+            task_logger=task_logger,
+            log_entry=log_entry,
+        )
+        markdown_documents = await raw_result.aget_markdown_documents(
+            split_by_page=False
+        )
+        if not markdown_documents:
+            raise RuntimeError(f"LlamaCloud parsing returned no documents: {filename}")
+        markdown_content = markdown_documents[0].text  # first document only
+        await page_limit_service.update_page_usage(
+            user_id, estimated_pages, allow_exceed=True
+        )
+
+    elif etl_service == "DOCLING":
+        getLogger("docling.pipeline.base_pipeline").setLevel(ERROR)  # quiet Docling
+        getLogger("docling.document_converter").setLevel(ERROR)
+        getLogger("docling_core.transforms.chunker.hierarchical_chunker").setLevel(
+            ERROR
+        )
+
+        from docling.document_converter import DocumentConverter
+
+        converter = DocumentConverter()  # a new converter is built on every call
+        result = converter.convert(file_path)  # called without await
+        markdown_content = result.document.export_to_markdown()
+        await page_limit_service.update_page_usage(
+            user_id, estimated_pages, allow_exceed=True
+        )
+
+    else:
+        raise RuntimeError(f"Unknown ETL_SERVICE: {etl_service}")
+
+    with contextlib.suppress(Exception):  # best-effort cleanup; errors ignored
+        os.unlink(file_path)  # not reached if any step above raised
+
+    if not markdown_content:  # runs after page usage was already updated
+        raise RuntimeError(f"Failed to extract content from file: {filename}")
+
+    return markdown_content, etl_service
 
 
 async def process_file_in_background_with_document(
@@ -1667,272 +971,50 @@ async def process_file_in_background_with_document(
     """
     Process file and update existing pending document (2-phase pattern).
 
-    This function is Phase 2 of the real-time document status updates:
-    - Phase 1 (API): Created document with pending status
-    - Phase 2 (this): Process file and update document to ready/failed
-
-    The document already exists with pending status. This function:
-    1. Parses the file content (markdown, audio, or ETL services)
-    2. Updates the document with content, embeddings, and chunks
-    3. Sets status to 'ready' on success
-
-    Args:
-        document: Existing document with pending status
-        file_path: Path to the uploaded file
-        filename: Original filename
-        search_space_id: ID of the search space
-        user_id: ID of the user
-        session: Database session
-        task_logger: Task logging service
-        log_entry: Log entry for this task
-        connector: Optional connector info for Google Drive files
-        notification: Optional notification for progress updates
-
-    Returns:
-        Updated Document object if successful, None if duplicate content detected
+    Phase 1 (API layer): Created document with pending status.
+    Phase 2 (this function): Process file and update document to ready/failed.
     """
-    import os
-
-    from app.config import config as app_config
+    from app.indexing_pipeline.adapters.file_upload_adapter import (
+        UploadDocumentAdapter,
+    )
     from app.services.llm_service import get_user_long_context_llm
+    from app.utils.document_converters import generate_content_hash
+
+    from .base import check_duplicate_document
 
     doc_id = document.id
 
     try:
-        markdown_content = None
-        etl_service = None
-
-        # ===== STEP 1: Parse file content based on type =====
-
-        # Check if the file is a markdown or text file
-        if filename.lower().endswith((".md", ".markdown", ".txt")):
-            # Update notification: parsing stage
-            if notification:
-                await (
-                    NotificationService.document_processing.notify_processing_progress(
-                        session,
-                        notification,
-                        stage="parsing",
-                        stage_message="Reading file",
-                    )
-                )
-
-            await task_logger.log_task_progress(
-                log_entry,
-                f"Processing markdown/text file: {filename}",
-                {"file_type": "markdown", "processing_stage": "reading_file"},
-            )
-
-            # Read markdown content directly
-            with open(file_path, encoding="utf-8") as f:
-                markdown_content = f.read()
-            etl_service = "MARKDOWN"
-
-            # Clean up temp file
-            with contextlib.suppress(Exception):
-                os.unlink(file_path)
-
-        # Check if the file is an audio file
-        elif filename.lower().endswith(
-            (".mp3", ".mp4", ".mpeg", ".mpga", ".m4a", ".wav", ".webm")
-        ):
-            # Update notification: parsing stage (transcription)
-            if notification:
-                await (
-                    NotificationService.document_processing.notify_processing_progress(
-                        session,
-                        notification,
-                        stage="parsing",
-                        stage_message="Transcribing audio",
-                    )
-                )
-
-            await task_logger.log_task_progress(
-                log_entry,
-                f"Processing audio file for transcription: {filename}",
-                {"file_type": "audio", "processing_stage": "starting_transcription"},
-            )
-
-            # Transcribe audio
-            stt_service_type = (
-                "local"
-                if app_config.STT_SERVICE
-                and app_config.STT_SERVICE.startswith("local/")
-                else "external"
-            )
-
-            if stt_service_type == "local":
-                from app.services.stt_service import stt_service
-
-                result = stt_service.transcribe_file(file_path)
-                transcribed_text = result.get("text", "")
-                if not transcribed_text:
-                    raise ValueError("Transcription returned empty text")
-                markdown_content = (
-                    f"# Transcription of {filename}\n\n{transcribed_text}"
-                )
-            else:
-                with open(file_path, "rb") as audio_file:
-                    transcription_kwargs = {
-                        "model": app_config.STT_SERVICE,
-                        "file": audio_file,
-                        "api_key": app_config.STT_SERVICE_API_KEY,
-                    }
-                    if app_config.STT_SERVICE_API_BASE:
-                        transcription_kwargs["api_base"] = (
-                            app_config.STT_SERVICE_API_BASE
-                        )
-                    transcription_response = await atranscription(
-                        **transcription_kwargs
-                    )
-                    transcribed_text = transcription_response.get("text", "")
-                    if not transcribed_text:
-                        raise ValueError("Transcription returned empty text")
-                markdown_content = (
-                    f"# Transcription of {filename}\n\n{transcribed_text}"
-                )
-
-            etl_service = "AUDIO_TRANSCRIPTION"
-            # Clean up temp file
-            with contextlib.suppress(Exception):
-                os.unlink(file_path)
-
-        else:
-            # Document files - use ETL service
-            from app.services.page_limit_service import (
-                PageLimitExceededError,
-                PageLimitService,
-            )
-
-            page_limit_service = PageLimitService(session)
-
-            # Estimate page count
-            try:
-                estimated_pages = page_limit_service.estimate_pages_before_processing(
-                    file_path
-                )
-            except Exception:
-                file_size = os.path.getsize(file_path)
-                estimated_pages = max(1, file_size // (80 * 1024))
-
-            # Check page limit
-            await page_limit_service.check_page_limit(user_id, estimated_pages)
-
-            if app_config.ETL_SERVICE == "UNSTRUCTURED":
-                if notification:
-                    await NotificationService.document_processing.notify_processing_progress(
-                        session,
-                        notification,
-                        stage="parsing",
-                        stage_message="Extracting content",
-                    )
-
-                from langchain_unstructured import UnstructuredLoader
-
-                loader = UnstructuredLoader(
-                    file_path,
-                    mode="elements",
-                    post_processors=[],
-                    languages=["eng"],
-                    include_orig_elements=False,
-                    include_metadata=False,
-                    strategy="auto",
-                )
-                docs = await loader.aload()
-                markdown_content = await convert_document_to_markdown(docs)
-                actual_pages = page_limit_service.estimate_pages_from_elements(docs)
-                final_page_count = max(estimated_pages, actual_pages)
-                etl_service = "UNSTRUCTURED"
-
-                # Update page usage
-                await page_limit_service.update_page_usage(
-                    user_id, final_page_count, allow_exceed=True
-                )
-
-            elif app_config.ETL_SERVICE == "LLAMACLOUD":
-                if notification:
-                    await NotificationService.document_processing.notify_processing_progress(
-                        session,
-                        notification,
-                        stage="parsing",
-                        stage_message="Extracting content",
-                    )
-
-                result = await parse_with_llamacloud_retry(
-                    file_path=file_path,
-                    estimated_pages=estimated_pages,
-                    task_logger=task_logger,
-                    log_entry=log_entry,
-                )
-                markdown_documents = await result.aget_markdown_documents(
-                    split_by_page=False
-                )
-                if not markdown_documents:
-                    raise RuntimeError(
-                        f"LlamaCloud parsing returned no documents: {filename}"
-                    )
-                markdown_content = markdown_documents[0].text
-                etl_service = "LLAMACLOUD"
-
-                # Update page usage
-                await page_limit_service.update_page_usage(
-                    user_id, estimated_pages, allow_exceed=True
-                )
-
-            elif app_config.ETL_SERVICE == "DOCLING":
-                if notification:
-                    await NotificationService.document_processing.notify_processing_progress(
-                        session,
-                        notification,
-                        stage="parsing",
-                        stage_message="Extracting content",
-                    )
-
-                # Suppress logging during Docling import
-                getLogger("docling.pipeline.base_pipeline").setLevel(ERROR)
-                getLogger("docling.document_converter").setLevel(ERROR)
-                getLogger(
-                    "docling_core.transforms.chunker.hierarchical_chunker"
-                ).setLevel(ERROR)
-
-                from docling.document_converter import DocumentConverter
-
-                converter = DocumentConverter()
-                result = converter.convert(file_path)
-                markdown_content = result.document.export_to_markdown()
-                etl_service = "DOCLING"
-
-                # Update page usage
-                await page_limit_service.update_page_usage(
-                    user_id, estimated_pages, allow_exceed=True
-                )
-
-            else:
-                raise RuntimeError(f"Unknown ETL_SERVICE: {app_config.ETL_SERVICE}")
-
-            # Clean up temp file
-            with contextlib.suppress(Exception):
-                os.unlink(file_path)
+        # Step 1: extract content
+        markdown_content, etl_service = await _extract_file_content(
+            file_path,
+            filename,
+            session,
+            user_id,
+            task_logger,
+            log_entry,
+            notification,
+        )
 
         if not markdown_content:
             raise RuntimeError(f"Failed to extract content from file: {filename}")
 
-        # ===== STEP 2: Check for duplicate content =====
+        # Step 2: duplicate check
         content_hash = generate_content_hash(markdown_content, search_space_id)
-
         existing_by_content = await check_duplicate_document(session, content_hash)
         if existing_by_content and existing_by_content.id != doc_id:
-            # Duplicate content found - mark this document as failed
             logging.info(
                 f"Duplicate content detected for {filename}, "
                 f"matches document {existing_by_content.id}"
             )
             return None
 
-        # ===== STEP 3+4: Index via pipeline =====
+        # Step 3: index via pipeline
         if notification:
             await NotificationService.document_processing.notify_processing_progress(
-                session, notification, stage="chunking"
+                session,
+                notification,
+                stage="chunking",
             )
 
         user_llm = await get_user_long_context_llm(session, user_id, search_space_id)
@@ -1957,7 +1039,6 @@ async def process_file_in_background_with_document(
                 "file_type": etl_service,
             },
         )
-
         return document
 
     except Exception as e:
diff --git a/surfsense_backend/app/tasks/document_processors/markdown_processor.py b/surfsense_backend/app/tasks/document_processors/markdown_processor.py
index 2fb711bf8..0ff340c0e 100644
--- a/surfsense_backend/app/tasks/document_processors/markdown_processor.py
+++ b/surfsense_backend/app/tasks/document_processors/markdown_processor.py
@@ -14,88 +14,19 @@ from app.utils.document_converters import (
     create_document_chunks,
     generate_content_hash,
     generate_document_summary,
-    generate_unique_identifier_hash,
 )
 
+from ._helpers import (
+    find_existing_document_with_migration,
+    get_google_drive_unique_identifier,
+)
 from .base import (
-    check_document_by_unique_identifier,
     check_duplicate_document,
     get_current_timestamp,
     safe_set_chunks,
 )
 
 
-def _get_google_drive_unique_identifier(
-    connector: dict | None,
-    filename: str,
-    search_space_id: int,
-) -> tuple[str, str | None]:
-    """
-    Get unique identifier hash for a file, with special handling for Google Drive.
-
-    For Google Drive files, uses file_id as the unique identifier (doesn't change on rename).
-    For other files, uses filename.
-
-    Args:
-        connector: Optional connector info dict with type and metadata
-        filename: The filename (used for non-Google Drive files or as fallback)
-        search_space_id: The search space ID
-
-    Returns:
-        Tuple of (primary_hash, legacy_hash or None)
-    """
-    if connector and connector.get("type") == DocumentType.GOOGLE_DRIVE_FILE:
-        metadata = connector.get("metadata", {})
-        file_id = metadata.get("google_drive_file_id")
-
-        if file_id:
-            primary_hash = generate_unique_identifier_hash(
-                DocumentType.GOOGLE_DRIVE_FILE, file_id, search_space_id
-            )
-            legacy_hash = generate_unique_identifier_hash(
-                DocumentType.GOOGLE_DRIVE_FILE, filename, search_space_id
-            )
-            return primary_hash, legacy_hash
-
-    primary_hash = generate_unique_identifier_hash(
-        DocumentType.FILE, filename, search_space_id
-    )
-    return primary_hash, None
-
-
-async def _find_existing_document_with_migration(
-    session: AsyncSession,
-    primary_hash: str,
-    legacy_hash: str | None,
-    content_hash: str | None = None,
-) -> Document | None:
-    """
-    Find existing document, checking both new hash and legacy hash for migration,
-    with fallback to content_hash for cross-source deduplication.
-    """
-    existing_document = await check_document_by_unique_identifier(session, primary_hash)
-
-    if not existing_document and legacy_hash:
-        existing_document = await check_document_by_unique_identifier(
-            session, legacy_hash
-        )
-        if existing_document:
-            logging.info(
-                "Found legacy document (filename-based hash), will migrate to file_id-based hash"
-            )
-
-    # Fallback: check by content_hash to catch duplicates from different sources
-    if not existing_document and content_hash:
-        existing_document = await check_duplicate_document(session, content_hash)
-        if existing_document:
-            logging.info(
-                f"Found duplicate content from different source (content_hash match). "
-                f"Original document ID: {existing_document.id}, type: {existing_document.document_type}"
-            )
-
-    return existing_document
-
-
 async def _handle_existing_document_update(
     session: AsyncSession,
     existing_document: Document,
@@ -224,7 +155,7 @@ async def add_received_markdown_file_document(
 
     try:
         # Generate unique identifier hash (uses file_id for Google Drive, filename for others)
-        primary_hash, legacy_hash = _get_google_drive_unique_identifier(
+        primary_hash, legacy_hash = get_google_drive_unique_identifier(
             connector, file_name, search_space_id
         )
 
@@ -232,7 +163,7 @@ async def add_received_markdown_file_document(
         content_hash = generate_content_hash(file_in_markdown, search_space_id)
 
         # Check if document exists (with migration support for Google Drive and content_hash fallback)
-        existing_document = await _find_existing_document_with_migration(
+        existing_document = await find_existing_document_with_migration(
             session, primary_hash, legacy_hash, content_hash
         )
 
diff --git a/surfsense_backend/tests/integration/document_upload/test_upload_limits.py b/surfsense_backend/tests/integration/document_upload/test_upload_limits.py
index a8dab43f0..a56398baa 100644
--- a/surfsense_backend/tests/integration/document_upload/test_upload_limits.py
+++ b/surfsense_backend/tests/integration/document_upload/test_upload_limits.py
@@ -2,12 +2,11 @@
 Integration tests for backend file upload limit enforcement.
 
 These tests verify that the API rejects uploads that exceed:
-  - Max files per upload (10)
-  - Max per-file size (50 MB)
-  - Max total upload size (200 MB)
+  - Max per-file size (500 MB)
 
-The limits mirror the frontend's DocumentUploadTab.tsx constants and are
-enforced server-side to protect against direct API calls.
+No file count or total size limits are enforced — the frontend batches
+uploads in groups of 5 and there is no cap on how many files a user can
+upload in a single session.
 
 Prerequisites:
   - PostgreSQL + pgvector
@@ -24,60 +23,12 @@ pytestmark = pytest.mark.integration
 
 
 # ---------------------------------------------------------------------------
-# Test A: File count limit
-# ---------------------------------------------------------------------------
-
-
-class TestFileCountLimit:
-    """Uploading more than 10 files in a single request should be rejected."""
-
-    async def test_11_files_returns_413(
-        self,
-        client: httpx.AsyncClient,
-        headers: dict[str, str],
-        search_space_id: int,
-    ):
-        files = [
-            ("files", (f"file_{i}.txt", io.BytesIO(b"test content"), "text/plain"))
-            for i in range(11)
-        ]
-        resp = await client.post(
-            "/api/v1/documents/fileupload",
-            headers=headers,
-            files=files,
-            data={"search_space_id": str(search_space_id)},
-        )
-        assert resp.status_code == 413
-        assert "too many files" in resp.json()["detail"].lower()
-
-    async def test_10_files_accepted(
-        self,
-        client: httpx.AsyncClient,
-        headers: dict[str, str],
-        search_space_id: int,
-        cleanup_doc_ids: list[int],
-    ):
-        files = [
-            ("files", (f"file_{i}.txt", io.BytesIO(b"test content"), "text/plain"))
-            for i in range(10)
-        ]
-        resp = await client.post(
-            "/api/v1/documents/fileupload",
-            headers=headers,
-            files=files,
-            data={"search_space_id": str(search_space_id)},
-        )
-        assert resp.status_code == 200
-        cleanup_doc_ids.extend(resp.json().get("document_ids", []))
-
-
-# ---------------------------------------------------------------------------
-# Test B: Per-file size limit
+# Test: Per-file size limit (500 MB)
 # ---------------------------------------------------------------------------
 
 
 class TestPerFileSizeLimit:
-    """A single file exceeding 50 MB should be rejected."""
+    """A single file exceeding 500 MB should be rejected."""
 
     async def test_oversized_file_returns_413(
         self,
@@ -85,7 +36,7 @@ class TestPerFileSizeLimit:
         headers: dict[str, str],
         search_space_id: int,
     ):
-        oversized = io.BytesIO(b"\x00" * (50 * 1024 * 1024 + 1))
+        oversized = io.BytesIO(b"\x00" * (500 * 1024 * 1024 + 1))
         resp = await client.post(
             "/api/v1/documents/fileupload",
             headers=headers,
@@ -102,11 +53,11 @@ class TestPerFileSizeLimit:
         search_space_id: int,
         cleanup_doc_ids: list[int],
     ):
-        at_limit = io.BytesIO(b"\x00" * (50 * 1024 * 1024))
+        at_limit = io.BytesIO(b"\x00" * (500 * 1024 * 1024))
         resp = await client.post(
             "/api/v1/documents/fileupload",
             headers=headers,
-            files=[("files", ("exact50mb.txt", at_limit, "text/plain"))],
+            files=[("files", ("exact500mb.txt", at_limit, "text/plain"))],
             data={"search_space_id": str(search_space_id)},
         )
         assert resp.status_code == 200
@@ -114,26 +65,23 @@ class TestPerFileSizeLimit:
 
 
 # ---------------------------------------------------------------------------
-# Test C: Total upload size limit
+# Test: Multiple files accepted without count limit
 # ---------------------------------------------------------------------------
 
 
-class TestTotalSizeLimit:
-    """Multiple files whose combined size exceeds 200 MB should be rejected."""
+class TestNoFileCountLimit:
+    """Many files in a single request should be accepted."""
 
-    async def test_total_size_over_200mb_returns_413(
+    async def test_many_files_accepted(
         self,
         client: httpx.AsyncClient,
         headers: dict[str, str],
         search_space_id: int,
+        cleanup_doc_ids: list[int],
     ):
-        chunk_size = 45 * 1024 * 1024  # 45 MB each
         files = [
-            (
-                "files",
-                (f"chunk_{i}.txt", io.BytesIO(b"\x00" * chunk_size), "text/plain"),
-            )
-            for i in range(5)  # 5 x 45 MB = 225 MB > 200 MB
+            ("files", (f"file_{i}.txt", io.BytesIO(b"test content"), "text/plain"))
+            for i in range(20)
         ]
         resp = await client.post(
             "/api/v1/documents/fileupload",
@@ -141,5 +89,5 @@ class TestTotalSizeLimit:
             files=files,
             data={"search_space_id": str(search_space_id)},
         )
-        assert resp.status_code == 413
-        assert "total upload size" in resp.json()["detail"].lower()
+        assert resp.status_code == 200
+        cleanup_doc_ids.extend(resp.json().get("document_ids", []))
diff --git a/surfsense_backend/tests/unit/middleware/test_knowledge_search.py b/surfsense_backend/tests/unit/middleware/test_knowledge_search.py
index 163dd0d1d..a8cf5c93b 100644
--- a/surfsense_backend/tests/unit/middleware/test_knowledge_search.py
+++ b/surfsense_backend/tests/unit/middleware/test_knowledge_search.py
@@ -248,7 +248,7 @@ class TestKnowledgeBaseSearchMiddlewarePlanner:
             return []
 
         async def fake_build_scoped_filesystem(**kwargs):
-            return {}
+            return {}, {}
 
         monkeypatch.setattr(
             "app.agents.new_chat.middleware.knowledge_search.search_knowledge_base",
@@ -298,7 +298,7 @@ class TestKnowledgeBaseSearchMiddlewarePlanner:
             return []
 
         async def fake_build_scoped_filesystem(**kwargs):
-            return {}
+            return {}, {}
 
         monkeypatch.setattr(
             "app.agents.new_chat.middleware.knowledge_search.search_knowledge_base",
@@ -334,7 +334,7 @@ class TestKnowledgeBaseSearchMiddlewarePlanner:
             return []
 
         async def fake_build_scoped_filesystem(**kwargs):
-            return {}
+            return {}, {}
 
         monkeypatch.setattr(
             "app.agents.new_chat.middleware.knowledge_search.search_knowledge_base",
diff --git a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
index 4e0c36267..1c246ed71 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
@@ -329,14 +329,15 @@ export function DocumentsTableShell({
 
 	const handleViewDocument = useCallback(async (doc: Document) => {
 		setViewingDoc(doc);
-		if (doc.content) {
-			setViewingContent(doc.content);
+		const preview = doc.content_preview || doc.content;
+		if (preview) {
+			setViewingContent(preview);
 			return;
 		}
 		setViewingLoading(true);
 		try {
 			const fullDoc = await documentsApiService.getDocument({ id: doc.id });
-			setViewingContent(fullDoc.content);
+			setViewingContent(fullDoc.content_preview || fullDoc.content);
 		} catch (err) {
 			console.error("[DocumentsTableShell] Failed to fetch document content:", err);
 			setViewingContent("Failed to load document content.");
@@ -946,13 +947,36 @@ export function DocumentsTableShell({
 							WebkitMaskImage: `linear-gradient(to bottom, ${previewScrollPos === "top" ? "black" : "transparent"}, black 16px, black calc(100% - 16px), ${previewScrollPos === "bottom" ? "black" : "transparent"})`,
 						}}
 					>
-						{viewingLoading ? (
-							<div className="flex items-center justify-center py-12">
-								<Spinner size="lg" className="text-muted-foreground" />
-							</div>
-						) : (
-							<MarkdownViewer content={viewingContent} />
-						)}
+					{viewingLoading ? (
+						<div className="flex items-center justify-center py-12">
+							<Spinner size="lg" className="text-muted-foreground" />
+						</div>
+					) : (
+						<>
+							<MarkdownViewer content={viewingContent} maxLength={50_000} />
+							{viewingDoc && (
+								<div className="mt-4 flex justify-center">
+									<Button
+										variant="outline"
+										size="sm"
+										onClick={() => {
+											if (viewingDoc) {
+												openEditor({
+													documentId: viewingDoc.id,
+													searchSpaceId: Number(searchSpaceId),
+													title: viewingDoc.title,
+												});
+												handleCloseViewer();
+											}
+										}}
+									>
+										<Eye className="h-3.5 w-3.5 mr-1.5" />
+										View full document
+									</Button>
+								</div>
+							)}
+						</>
+					)}
 					</div>
 				</DrawerContent>
 			</Drawer>
diff --git a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/types.ts b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/types.ts
index d87f7374b..88914bd4f 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/types.ts
+++ b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/types.ts
@@ -9,9 +9,9 @@ export type Document = {
 	id: number;
 	title: string;
 	document_type: DocumentType;
-	// Optional: Only needed when viewing document details (lazy loaded)
 	document_metadata?: any;
 	content?: string;
+	content_preview?: string;
 	created_at: string;
 	search_space_id: number;
 	created_by_id?: string | null;
diff --git a/surfsense_web/components/editor-panel/editor-panel.tsx b/surfsense_web/components/editor-panel/editor-panel.tsx
index 3ea36f800..4b7079aef 100644
--- a/surfsense_web/components/editor-panel/editor-panel.tsx
+++ b/surfsense_web/components/editor-panel/editor-panel.tsx
@@ -1,12 +1,13 @@
 "use client";
 
 import { useAtomValue, useSetAtom } from "jotai";
-import { AlertCircle, XIcon } from "lucide-react";
+import { AlertCircle, Download, FileText, Loader2, XIcon } from "lucide-react";
 import dynamic from "next/dynamic";
 import { useCallback, useEffect, useRef, useState } from "react";
 import { toast } from "sonner";
 import { closeEditorPanelAtom, editorPanelAtom } from "@/atoms/editor/editor-panel.atom";
 import { MarkdownViewer } from "@/components/markdown-viewer";
+import { Alert, AlertDescription } from "@/components/ui/alert";
 import { Button } from "@/components/ui/button";
 import { Drawer, DrawerContent, DrawerHandle, DrawerTitle } from "@/components/ui/drawer";
 import { Skeleton } from "@/components/ui/skeleton";
@@ -18,11 +19,16 @@ const PlateEditor = dynamic(
 	{ ssr: false, loading: () => <Skeleton className="h-64 w-full" /> }
 );
 
+const LARGE_DOCUMENT_THRESHOLD = 2 * 1024 * 1024; // 2MB
+
 interface EditorContent {
 	document_id: number;
 	title: string;
 	document_type?: string;
 	source_markdown: string;
+	content_size_bytes?: number; // compared against LARGE_DOCUMENT_THRESHOLD to decide whether to show the read-only preview
+	chunk_count?: number; // displayed in the "too large for the editor" banner
+	truncated?: boolean; // NOTE(review): not read in this component; presumably set when source_markdown was cut to max_length — confirm against the API
 }
 
 const EDITABLE_DOCUMENT_TYPES = new Set(["FILE", "NOTE"]);
@@ -62,6 +68,7 @@ export function EditorPanelContent({
 	const [isLoading, setIsLoading] = useState(true);
 	const [error, setError] = useState<string | null>(null);
 	const [saving, setSaving] = useState(false);
+	const [downloading, setDownloading] = useState(false);
 
 	const [editedMarkdown, setEditedMarkdown] = useState<string | null>(null);
 	const markdownRef = useRef<string>("");
@@ -69,6 +76,8 @@ export function EditorPanelContent({
 	const changeCountRef = useRef(0);
 	const [displayTitle, setDisplayTitle] = useState(title || "Untitled");
 
+	const isLargeDocument = (editorDoc?.content_size_bytes ?? 0) > LARGE_DOCUMENT_THRESHOLD;
+
 	useEffect(() => {
 		let cancelled = false;
 		setIsLoading(true);
@@ -86,10 +95,12 @@ export function EditorPanelContent({
 			}
 
 			try {
-				const response = await authenticatedFetch(
-					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`,
-					{ method: "GET" }
+				const url = new URL(
+					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`
 				);
+				url.searchParams.set("max_length", String(LARGE_DOCUMENT_THRESHOLD));
+
+				const response = await authenticatedFetch(url.toString(), { method: "GET" });
 
 				if (cancelled) return;
 
@@ -175,7 +186,7 @@ export function EditorPanelContent({
 	}, [documentId, searchSpaceId]);
 
 	const isEditableType = editorDoc
-		? EDITABLE_DOCUMENT_TYPES.has(editorDoc.document_type ?? "")
+		? EDITABLE_DOCUMENT_TYPES.has(editorDoc.document_type ?? "") && !isLargeDocument
 		: false;
 
 	return (
@@ -206,6 +217,57 @@ export function EditorPanelContent({
 							<p className="text-sm text-red-500 mt-1">{error || "An unknown error occurred"}</p>
 						</div>
 					</div>
+				) : isLargeDocument ? (
+					<div className="h-full overflow-y-auto px-5 py-4">
+						<Alert className="mb-4">
+							<FileText className="size-4" />
+							<AlertDescription className="flex items-center justify-between gap-4">
+								<span>
+									This document is too large for the editor ({Math.round((editorDoc.content_size_bytes ?? 0) / 1024 / 1024)}MB, {editorDoc.chunk_count ?? 0} chunks). Showing a preview below.
+								</span>
+								<Button
+									variant="outline"
+									size="sm"
+									className="shrink-0 gap-1.5"
+									disabled={downloading}
+									onClick={async () => { // Fetch the full markdown from the backend and hand it to the browser as a file download.
+										setDownloading(true); // disables the button and swaps the icon for a spinner
+										try {
+											const response = await authenticatedFetch(
+												`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/download-markdown`,
+												{ method: "GET" }
+											);
+											if (!response.ok) throw new Error("Download failed"); // surfaces as the generic failure toast in the catch below
+											const blob = await response.blob();
+											const url = URL.createObjectURL(blob);
+											const a = document.createElement("a"); // temporary anchor used only to trigger the download
+											a.href = url;
+											const disposition = response.headers.get("content-disposition"); // NOTE(review): cross-origin responses expose this header only if the backend lists it in Access-Control-Expose-Headers — confirm
+											const match = disposition?.match(/filename="([^"]+)"/); // stop at the closing quote so later quoted header parameters are not captured
+											a.download = match?.[1] ?? `${editorDoc.title || "document"}.md`; // fall back to the document title when no quoted filename is present
+											document.body.appendChild(a);
+											a.click();
+											a.remove();
+											URL.revokeObjectURL(url); // release the blob URL once the click has been dispatched
+											toast.success("Download started");
+										} catch {
+											toast.error("Failed to download document");
+										} finally {
+											setDownloading(false); // re-enable the button on success and on failure
+										}
+									}}
+								>
+									{downloading ? (
+										<Loader2 className="size-3.5 animate-spin" />
+									) : (
+										<Download className="size-3.5" />
+									)}
+									{downloading ? "Preparing..." : "Download .md"}
+								</Button>
+							</AlertDescription>
+						</Alert>
+						<MarkdownViewer content={editorDoc.source_markdown} />
+					</div>
 				) : isEditableType ? (
 					<PlateEditor
 						key={documentId}
diff --git a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
index ac279cd4d..ad48c89de 100644
--- a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
+++ b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
@@ -1,18 +1,24 @@
 "use client";
 
-import { AlertCircle, Pencil } from "lucide-react";
+import { AlertCircle, Download, FileText, Loader2, Pencil } from "lucide-react";
 import { useCallback, useEffect, useRef, useState } from "react";
 import { toast } from "sonner";
 import { PlateEditor } from "@/components/editor/plate-editor";
 import { MarkdownViewer } from "@/components/markdown-viewer";
+import { Alert, AlertDescription } from "@/components/ui/alert";
 import { Button } from "@/components/ui/button";
 import { authenticatedFetch, getBearerToken, redirectToLogin } from "@/lib/auth-utils";
 
+const LARGE_DOCUMENT_THRESHOLD = 2 * 1024 * 1024; // 2MB
+
 interface DocumentContent {
 	document_id: number;
 	title: string;
 	document_type?: string;
 	source_markdown: string;
+	content_size_bytes?: number; // compared against LARGE_DOCUMENT_THRESHOLD to decide whether editing is disabled and the preview banner is shown
+	chunk_count?: number; // displayed in the "too large for the editor" banner
+	truncated?: boolean; // NOTE(review): not read in this component; presumably set when source_markdown was cut to max_length — confirm against the API
 }
 
 function DocumentSkeleton() {
@@ -49,11 +55,14 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 	const [error, setError] = useState<string | null>(null);
 	const [isEditing, setIsEditing] = useState(false);
 	const [saving, setSaving] = useState(false);
+	const [downloading, setDownloading] = useState(false);
 	const [editedMarkdown, setEditedMarkdown] = useState<string | null>(null);
 	const markdownRef = useRef<string>("");
 	const initialLoadDone = useRef(false);
 	const changeCountRef = useRef(0);
 
+	const isLargeDocument = (doc?.content_size_bytes ?? 0) > LARGE_DOCUMENT_THRESHOLD;
+
 	useEffect(() => {
 		let cancelled = false;
 		setIsLoading(true);
@@ -72,10 +81,12 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 			}
 
 			try {
-				const response = await authenticatedFetch(
-					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`,
-					{ method: "GET" }
+				const url = new URL(
+					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`
 				);
+				url.searchParams.set("max_length", String(LARGE_DOCUMENT_THRESHOLD));
+
+				const response = await authenticatedFetch(url.toString(), { method: "GET" });
 
 				if (cancelled) return;
 
@@ -173,9 +184,9 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 		);
 	}
 
-	const isEditable = EDITABLE_DOCUMENT_TYPES.has(doc.document_type ?? "");
+	const isEditable = EDITABLE_DOCUMENT_TYPES.has(doc.document_type ?? "") && !isLargeDocument;
 
-	if (isEditing) {
+	if (isEditing && !isLargeDocument) {
 		return (
 			<div className="flex flex-col h-full overflow-hidden">
 				<div className="flex items-center justify-between px-6 py-3 border-b shrink-0">
@@ -236,7 +247,60 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 			</div>
 			<div className="flex-1 overflow-auto">
 				<div className="max-w-4xl mx-auto px-6 py-6">
-					<MarkdownViewer content={doc.source_markdown} />
+					{isLargeDocument ? (
+						<>
+							<Alert className="mb-4">
+								<FileText className="size-4" />
+								<AlertDescription className="flex items-center justify-between gap-4">
+									<span>
+										This document is too large for the editor ({Math.round((doc.content_size_bytes ?? 0) / 1024 / 1024)}MB, {doc.chunk_count ?? 0} chunks). Showing a preview below.
+									</span>
+									<Button
+										variant="outline"
+										size="sm"
+										className="shrink-0 gap-1.5"
+										disabled={downloading}
+										onClick={async () => { // Fetch the full markdown from the backend and hand it to the browser as a file download.
+											setDownloading(true); // disables the button and swaps the icon for a spinner
+											try {
+												const response = await authenticatedFetch(
+													`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/download-markdown`,
+													{ method: "GET" }
+												);
+												if (!response.ok) throw new Error("Download failed"); // surfaces as the generic failure toast in the catch below
+												const blob = await response.blob();
+												const url = URL.createObjectURL(blob);
+												const a = document.createElement("a"); // temporary anchor used only to trigger the download
+												a.href = url;
+												const disposition = response.headers.get("content-disposition"); // NOTE(review): cross-origin responses expose this header only if the backend lists it in Access-Control-Expose-Headers — confirm
+												const match = disposition?.match(/filename="([^"]+)"/); // stop at the closing quote so later quoted header parameters are not captured
+												a.download = match?.[1] ?? `${doc.title || "document"}.md`; // fall back to the document title when no quoted filename is present
+												document.body.appendChild(a);
+												a.click();
+												a.remove();
+												URL.revokeObjectURL(url); // release the blob URL once the click has been dispatched
+												toast.success("Download started");
+											} catch {
+												toast.error("Failed to download document");
+											} finally {
+												setDownloading(false); // re-enable the button on success and on failure
+											}
+										}}
+									>
+										{downloading ? (
+											<Loader2 className="size-3.5 animate-spin" />
+										) : (
+											<Download className="size-3.5" />
+										)}
+										{downloading ? "Preparing..." : "Download .md"}
+									</Button>
+								</AlertDescription>
+							</Alert>
+							<MarkdownViewer content={doc.source_markdown} />
+						</>
+					) : (
+						<MarkdownViewer content={doc.source_markdown} />
+					)}
 				</div>
 			</div>
 		</div>
diff --git a/surfsense_web/components/markdown-viewer.tsx b/surfsense_web/components/markdown-viewer.tsx
index e22df8998..abd999301 100644
--- a/surfsense_web/components/markdown-viewer.tsx
+++ b/surfsense_web/components/markdown-viewer.tsx
@@ -15,6 +15,7 @@ const math = createMathPlugin({
 interface MarkdownViewerProps {
 	content: string;
 	className?: string;
+	maxLength?: number;
 }
 
 /**
@@ -79,8 +80,10 @@ function convertLatexDelimiters(content: string): string {
 	return content;
 }
 
-export function MarkdownViewer({ content, className }: MarkdownViewerProps) {
-	const processedContent = convertLatexDelimiters(stripOuterMarkdownFence(content));
+export function MarkdownViewer({ content, className, maxLength }: MarkdownViewerProps) {
+	const isTruncated = maxLength != null && content.length > maxLength;
+	const displayContent = isTruncated ? content.slice(0, maxLength) : content;
+	const processedContent = convertLatexDelimiters(stripOuterMarkdownFence(displayContent));
 	const components: StreamdownProps["components"] = {
 		p: ({ children, ...props }) => (
 			<p className="my-2" {...props}>
@@ -171,6 +174,11 @@ export function MarkdownViewer({ content, className }: MarkdownViewerProps) {
 			>
 				{processedContent}
 			</Streamdown>
+			{isTruncated && (
+				<p className="mt-4 text-sm text-muted-foreground italic">
+					Content truncated ({Math.round(content.length / 1024)}KB total). Showing first {Math.round(maxLength / 1024)}KB.
+				</p>
+			)}
 		</div>
 	);
 }
diff --git a/surfsense_web/components/new-chat/source-detail-panel.tsx b/surfsense_web/components/new-chat/source-detail-panel.tsx
index b02b2e217..c17616c53 100644
--- a/surfsense_web/components/new-chat/source-detail-panel.tsx
+++ b/surfsense_web/components/new-chat/source-detail-panel.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { useQuery } from "@tanstack/react-query";
-import { BookOpen, ChevronDown, ExternalLink, FileText, Hash, Sparkles, X } from "lucide-react";
+import { BookOpen, ChevronDown, ChevronUp, ExternalLink, FileText, Hash, Loader2, Sparkles, X } from "lucide-react";
 import { AnimatePresence, motion, useReducedMotion } from "motion/react";
 import { useTranslations } from "next-intl";
 import type React from "react";
@@ -10,7 +10,6 @@ import { createPortal } from "react-dom";
 import { MarkdownViewer } from "@/components/markdown-viewer";
 import { Badge } from "@/components/ui/badge";
 import { Button } from "@/components/ui/button";
-import { Collapsible, CollapsibleContent, CollapsibleTrigger } from "@/components/ui/collapsible";
 import { ScrollArea } from "@/components/ui/scroll-area";
 import { Spinner } from "@/components/ui/spinner";
 import type {
@@ -48,7 +47,8 @@ const formatDocumentType = (type: string) => {
 // which break auto-scroll functionality
 interface ChunkCardProps {
 	chunk: { id: number; content: string };
-	index: number;
+	localIndex: number;
+	chunkNumber: number;
 	totalChunks: number;
 	isCited: boolean;
 	isActive: boolean;
@@ -56,11 +56,11 @@ interface ChunkCardProps {
 }
 
 const ChunkCard = memo(
-	forwardRef<HTMLDivElement, ChunkCardProps>(({ chunk, index, totalChunks, isCited }, ref) => {
+	forwardRef<HTMLDivElement, ChunkCardProps>(({ chunk, localIndex, chunkNumber, totalChunks, isCited }, ref) => {
 		return (
 			<div
 				ref={ref}
-				data-chunk-index={index}
+				data-chunk-index={localIndex}
 				className={cn(
 					"group relative rounded-2xl border-2 transition-all duration-300",
 					isCited
@@ -68,10 +68,8 @@ const ChunkCard = memo(
 						: "bg-card border-border/50 hover:border-border hover:shadow-md"
 				)}
 			>
-				{/* Cited indicator glow effect */}
 				{isCited && <div className="absolute inset-0 rounded-2xl bg-primary/5 blur-xl -z-10" />}
 
-				{/* Header */}
 				<div className="flex items-center justify-between px-5 py-4 border-b border-border/50">
 					<div className="flex items-center gap-3">
 						<div
@@ -82,9 +80,9 @@ const ChunkCard = memo(
 									: "bg-muted text-muted-foreground group-hover:bg-muted/80"
 							)}
 						>
-							{index + 1}
+							{chunkNumber}
 						</div>
-						<span className="text-sm text-muted-foreground">of {totalChunks} chunks</span>
+						<span className="text-sm text-muted-foreground">Chunk {chunkNumber} of {totalChunks}</span>
 					</div>
 					{isCited && (
 						<Badge variant="default" className="gap-1.5 px-3 py-1">
@@ -94,9 +92,8 @@ const ChunkCard = memo(
 					)}
 				</div>
 
-				{/* Content */}
 				<div className="p-5 overflow-hidden">
-					<MarkdownViewer content={chunk.content} />
+					<MarkdownViewer content={chunk.content} maxLength={100_000} />
 				</div>
 			</div>
 		);
@@ -118,7 +115,6 @@ export function SourceDetailPanel({
 	const t = useTranslations("dashboard");
 	const scrollAreaRef = useRef<HTMLDivElement>(null);
 	const hasScrolledRef = useRef(false); // Use ref to avoid stale closures
-	const [summaryOpen, setSummaryOpen] = useState(false);
 	const [activeChunkIndex, setActiveChunkIndex] = useState<number | null>(null);
 	const [mounted, setMounted] = useState(false);
 	const [_hasScrolledToCited, setHasScrolledToCited] = useState(false);
@@ -140,20 +136,88 @@ export function SourceDetailPanel({
 			if (isDocsChunk) {
 				return documentsApiService.getSurfsenseDocByChunk(chunkId);
 			}
-			return documentsApiService.getDocumentByChunk({ chunk_id: chunkId });
+			return documentsApiService.getDocumentByChunk({ chunk_id: chunkId, chunk_window: 5 });
 		},
 		enabled: !!chunkId && open,
 		staleTime: 5 * 60 * 1000,
 	});
 
+	const totalChunks = (documentData && "total_chunks" in documentData)
+		? (documentData.total_chunks ?? documentData.chunks.length)
+		: (documentData?.chunks?.length ?? 0);
+	const [beforeChunks, setBeforeChunks] = useState<Array<{ id: number; content: string; created_at: string }>>([]);
+	const [afterChunks, setAfterChunks] = useState<Array<{ id: number; content: string; created_at: string }>>([]);
+	const [loadingBefore, setLoadingBefore] = useState(false);
+	const [loadingAfter, setLoadingAfter] = useState(false);
+
+	useEffect(() => {
+		setBeforeChunks([]);
+		setAfterChunks([]);
+	}, [chunkId, open]);
+
+	const chunkStartIndex = (documentData && "chunk_start_index" in documentData)
+		? (documentData.chunk_start_index ?? 0) : 0;
+	const initialChunks = documentData?.chunks ?? [];
+	const allChunks = [...beforeChunks, ...initialChunks, ...afterChunks];
+	const absoluteStart = chunkStartIndex - beforeChunks.length;
+	const absoluteEnd = chunkStartIndex + initialChunks.length + afterChunks.length;
+	const canLoadBefore = absoluteStart > 0;
+	const canLoadAfter = absoluteEnd < totalChunks;
+
+	const EXPAND_SIZE = 10;
+
+	const loadBefore = useCallback(async () => { // Fetch up to EXPAND_SIZE chunks that precede the currently loaded window and prepend them.
+		if (!documentData || !("search_space_id" in documentData) || !canLoadBefore) return; // NOTE(review): the "search_space_id" check presumably excludes Surfsense docs results — confirm
+		setLoadingBefore(true);
+		try {
+			const count = Math.min(EXPAND_SIZE, absoluteStart); // never request more chunks than exist before the window
+			const result = await documentsApiService.getDocumentChunks({
+				document_id: documentData.id,
+				page: 0,
+				page_size: count,
+				start_offset: absoluteStart - count, // index of the first chunk to fetch, ending right where the window starts
+			});
+			const existingIds = new Set(allChunks.map(c => c.id)); // ids already rendered, used to drop duplicates
+			const newChunks = result.items
+				.filter(c => !existingIds.has(c.id))
+				.map(c => ({ id: c.id, content: c.content, created_at: c.created_at })); // keep only the fields stored in beforeChunks
+			setBeforeChunks(prev => [...newChunks, ...prev]); // earlier chunks go in front to preserve document order
+		} catch (err) {
+			console.error("Failed to load earlier chunks:", err); // logged only; no user-facing error is shown here
+		} finally {
+			setLoadingBefore(false);
+		}
+	}, [documentData, absoluteStart, canLoadBefore, allChunks]);
+
+	const loadAfter = useCallback(async () => { // Fetch up to EXPAND_SIZE chunks that follow the currently loaded window and append them.
+		if (!documentData || !("search_space_id" in documentData) || !canLoadAfter) return; // NOTE(review): the "search_space_id" check presumably excludes Surfsense docs results — confirm
+		setLoadingAfter(true);
+		try {
+			const result = await documentsApiService.getDocumentChunks({
+				document_id: documentData.id,
+				page: 0,
+				page_size: EXPAND_SIZE,
+				start_offset: absoluteEnd, // absoluteEnd is exclusive, so this is the first chunk after the window
+			});
+			const existingIds = new Set(allChunks.map(c => c.id)); // ids already rendered, used to drop duplicates
+			const newChunks = result.items
+				.filter(c => !existingIds.has(c.id))
+				.map(c => ({ id: c.id, content: c.content, created_at: c.created_at })); // keep only the fields stored in afterChunks
+			setAfterChunks(prev => [...prev, ...newChunks]); // later chunks go at the end to preserve document order
+		} catch (err) {
+			console.error("Failed to load later chunks:", err); // logged only; no user-facing error is shown here
+		} finally {
+			setLoadingAfter(false);
+		}
+	}, [documentData, absoluteEnd, canLoadAfter, allChunks]);
+
 	const isDirectRenderSource =
 		sourceType === "TAVILY_API" ||
 		sourceType === "LINKUP_API" ||
 		sourceType === "SEARXNG_API" ||
 		sourceType === "BAIDU_SEARCH_API";
 
-	// Find cited chunk index
-	const citedChunkIndex = documentData?.chunks?.findIndex((chunk) => chunk.id === chunkId) ?? -1;
+	const citedChunkIndex = allChunks.findIndex((chunk) => chunk.id === chunkId);
 
 	// Simple scroll function that scrolls to a chunk by index
 	const scrollToChunkByIndex = useCallback(
@@ -336,12 +400,12 @@ export function SourceDetailPanel({
 									{documentData && "document_type" in documentData
 										? formatDocumentType(documentData.document_type)
 										: sourceType && formatDocumentType(sourceType)}
-									{documentData?.chunks && (
-										<span className="ml-2">
-											• {documentData.chunks.length} chunk
-											{documentData.chunks.length !== 1 ? "s" : ""}
-										</span>
-									)}
+								{totalChunks > 0 && (
+									<span className="ml-2">
+										• {totalChunks} chunk{totalChunks !== 1 ? "s" : ""}
+										{allChunks.length < totalChunks && ` (showing ${allChunks.length})`}
+									</span>
+								)}
 								</p>
 							</div>
 							<div className="flex items-center gap-3 shrink-0">
@@ -450,7 +514,7 @@ export function SourceDetailPanel({
 						{!isDirectRenderSource && documentData && (
 							<div className="flex-1 flex overflow-hidden">
 								{/* Chunk Navigation Sidebar */}
-								{documentData.chunks.length > 1 && (
+								{allChunks.length > 1 && (
 									<motion.div
 										initial={{ opacity: 0, x: -20 }}
 										animate={{ opacity: 1, x: 0 }}
@@ -459,7 +523,8 @@ export function SourceDetailPanel({
 									>
 										<ScrollArea className="flex-1 h-full">
 											<div className="p-2 pt-3 flex flex-col gap-1.5">
-												{documentData.chunks.map((chunk, idx) => {
+												{allChunks.map((chunk, idx) => {
+													const absNum = absoluteStart + idx + 1;
 													const isCited = chunk.id === chunkId;
 													const isActive = activeChunkIndex === idx;
 													return (
@@ -478,9 +543,9 @@ export function SourceDetailPanel({
 																		? "bg-muted text-foreground"
 																		: "bg-muted/50 text-muted-foreground hover:bg-muted hover:text-foreground"
 															)}
-															title={isCited ? `Chunk ${idx + 1} (Cited)` : `Chunk ${idx + 1}`}
+															title={isCited ? `Chunk ${absNum} (Cited)` : `Chunk ${absNum}`}
 														>
-															{idx + 1}
+															{absNum}
 															{isCited && (
 																<span className="absolute -top-1.5 -right-1.5 flex items-center justify-center w-4 h-4 bg-primary rounded-full border-2 border-background shadow-sm">
 																	<Sparkles className="h-2.5 w-2.5 text-primary-foreground" />
@@ -524,44 +589,11 @@ export function SourceDetailPanel({
 												</motion.div>
 											)}
 
-										{/* Summary Collapsible */}
-										{documentData.content && (
-											<motion.div
-												initial={{ opacity: 0, y: 10 }}
-												animate={{ opacity: 1, y: 0 }}
-												transition={{ delay: 0.15 }}
-											>
-												<Collapsible open={summaryOpen} onOpenChange={setSummaryOpen}>
-													<CollapsibleTrigger className="w-full flex items-center justify-between p-5 rounded-2xl bg-linear-to-r from-muted/50 to-muted/30 border hover:from-muted/70 hover:to-muted/50 transition-all duration-200">
-														<span className="font-semibold flex items-center gap-2">
-															<BookOpen className="h-4 w-4" />
-															Document Summary
-														</span>
-														<motion.div
-															animate={{ rotate: summaryOpen ? 180 : 0 }}
-															transition={{ duration: 0.2 }}
-														>
-															<ChevronDown className="h-5 w-5 text-muted-foreground" />
-														</motion.div>
-													</CollapsibleTrigger>
-													<CollapsibleContent>
-														<motion.div
-															initial={{ opacity: 0 }}
-															animate={{ opacity: 1 }}
-															className="mt-3 p-5 bg-muted/20 rounded-2xl border"
-														>
-															<MarkdownViewer content={documentData.content} />
-														</motion.div>
-													</CollapsibleContent>
-												</Collapsible>
-											</motion.div>
-										)}
-
 										{/* Chunks Header */}
-										<div className="flex items-center justify-between pt-4">
+										<div className="flex items-center justify-between pt-2">
 											<h3 className="text-sm font-semibold text-muted-foreground uppercase tracking-wider flex items-center gap-2">
 												<Hash className="h-4 w-4" />
-												Content Chunks
+												Chunks {absoluteStart + 1}–{absoluteEnd} of {totalChunks}
 											</h3>
 											{citedChunkIndex !== -1 && (
 												<Button
@@ -576,24 +608,70 @@ export function SourceDetailPanel({
 											)}
 										</div>
 
+										{/* Load Earlier */}
+										{canLoadBefore && (
+											<div className="flex items-center justify-center">
+												<Button
+													variant="outline"
+													size="sm"
+													onClick={loadBefore}
+													disabled={loadingBefore}
+													className="gap-2"
+												>
+													{loadingBefore ? (
+														<Loader2 className="h-3.5 w-3.5 animate-spin" />
+													) : (
+														<ChevronUp className="h-3.5 w-3.5" />
+													)}
+													{loadingBefore
+														? "Loading..."
+														: `Load ${Math.min(EXPAND_SIZE, absoluteStart)} earlier chunks`}
+												</Button>
+											</div>
+										)}
+
 										{/* Chunks */}
 										<div className="space-y-4">
-											{documentData.chunks.map((chunk, idx) => {
+											{allChunks.map((chunk, idx) => {
 												const isCited = chunk.id === chunkId;
+												const chunkNumber = absoluteStart + idx + 1;
 												return (
 													<ChunkCard
 														key={chunk.id}
 														ref={isCited ? citedChunkRefCallback : undefined}
 														chunk={chunk}
-														index={idx}
-														totalChunks={documentData.chunks.length}
+														localIndex={idx}
+														chunkNumber={chunkNumber}
+														totalChunks={totalChunks}
 														isCited={isCited}
 														isActive={activeChunkIndex === idx}
-														disableLayoutAnimation={documentData.chunks.length > 30}
+														disableLayoutAnimation={allChunks.length > 30}
 													/>
 												);
 											})}
 										</div>
+
+										{/* Load Later */}
+										{canLoadAfter && (
+											<div className="flex items-center justify-center py-3">
+												<Button
+													variant="outline"
+													size="sm"
+													onClick={loadAfter}
+													disabled={loadingAfter}
+													className="gap-2"
+												>
+													{loadingAfter ? (
+														<Loader2 className="h-3.5 w-3.5 animate-spin" />
+													) : (
+														<ChevronDown className="h-3.5 w-3.5" />
+													)}
+													{loadingAfter
+														? "Loading..."
+														: `Load ${Math.min(EXPAND_SIZE, totalChunks - absoluteEnd)} later chunks`}
+												</Button>
+											</div>
+										)}
 									</div>
 								</ScrollArea>
 							</div>
diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index 6817b19db..faa042d8e 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -1,10 +1,10 @@
 "use client";
 
 import { useAtom } from "jotai";
-import { CheckCircle2, FileType, Info, Upload, X } from "lucide-react";
+import { CheckCircle2, FileType, FolderOpen, Info, Upload, X } from "lucide-react";
 
 import { useTranslations } from "next-intl";
-import { useCallback, useMemo, useRef, useState } from "react";
+import { type ChangeEvent, useCallback, useMemo, useRef, useState } from "react";
 import { useDropzone } from "react-dropzone";
 import { toast } from "sonner";
 import { uploadDocumentMutationAtom } from "@/atoms/documents/document-mutation.atoms";
@@ -51,6 +51,7 @@ const commonTypes = {
 	"application/vnd.openxmlformats-officedocument.presentationml.presentation": [".pptx"],
 	"text/html": [".html", ".htm"],
 	"text/csv": [".csv"],
+	"text/tab-separated-values": [".tsv"],
 	"image/jpeg": [".jpg", ".jpeg"],
 	"image/png": [".png"],
 	"image/bmp": [".bmp"],
@@ -76,7 +77,6 @@ const FILE_TYPE_CONFIG: Record<string, Record<string, string[]>> = {
 		"application/rtf": [".rtf"],
 		"application/xml": [".xml"],
 		"application/epub+zip": [".epub"],
-		"text/tab-separated-values": [".tsv"],
 		"text/html": [".html", ".htm", ".web"],
 		"image/gif": [".gif"],
 		"image/svg+xml": [".svg"],
@@ -102,7 +102,6 @@ const FILE_TYPE_CONFIG: Record<string, Record<string, string[]>> = {
 		"application/vnd.ms-powerpoint": [".ppt"],
 		"text/x-rst": [".rst"],
 		"application/rtf": [".rtf"],
-		"text/tab-separated-values": [".tsv"],
 		"application/vnd.ms-excel": [".xls"],
 		"application/xml": [".xml"],
 		...audioFileTypes,
@@ -116,10 +115,8 @@ interface FileWithId {
 
 const cardClass = "border border-border bg-slate-400/5 dark:bg-white/5";
 
-// Upload limits — files are sent in batches of 5 to avoid proxy timeouts
-const MAX_FILES = 50;
-const MAX_TOTAL_SIZE_MB = 200;
-const MAX_TOTAL_SIZE_BYTES = MAX_TOTAL_SIZE_MB * 1024 * 1024;
+const MAX_FILE_SIZE_MB = 500;
+const MAX_FILE_SIZE_BYTES = MAX_FILE_SIZE_MB * 1024 * 1024;
 
 export function DocumentUploadTab({
 	searchSpaceId,
@@ -134,6 +131,7 @@ export function DocumentUploadTab({
 	const [uploadDocumentMutation] = useAtom(uploadDocumentMutationAtom);
 	const { mutate: uploadDocuments, isPending: isUploading } = uploadDocumentMutation;
 	const fileInputRef = useRef<HTMLInputElement>(null);
+	const folderInputRef = useRef<HTMLInputElement>(null);
 
 	const acceptedFileTypes = useMemo(() => {
 		const etlService = process.env.NEXT_PUBLIC_ETL_SERVICE;
@@ -145,49 +143,76 @@ export function DocumentUploadTab({
 		[acceptedFileTypes]
 	);
 
-	const onDrop = useCallback(
-		(acceptedFiles: File[]) => {
+	const supportedExtensionsSet = useMemo(
+		() => new Set(supportedExtensions.map((ext) => ext.toLowerCase())),
+		[supportedExtensions]
+	);
+
+	const addFiles = useCallback(
+		(incoming: File[]) => {
+			const oversized = incoming.filter((f) => f.size > MAX_FILE_SIZE_BYTES);
+			if (oversized.length > 0) {
+				toast.error(t("file_too_large"), {
+					description: t("file_too_large_desc", {
+						name: oversized[0].name,
+						maxMB: MAX_FILE_SIZE_MB,
+					}),
+				});
+			}
+			const valid = incoming.filter((f) => f.size <= MAX_FILE_SIZE_BYTES);
+			if (valid.length === 0) return;
+			// Append the size-checked files to the current selection, each wrapped with a generated id.
 			setFiles((prev) => {
-				const newEntries = acceptedFiles.map((f) => ({
+				const newEntries = valid.map((f) => ({
 					id: crypto.randomUUID?.() ?? `file-${Date.now()}-${Math.random().toString(36)}`,
 					file: f,
 				}));
-				const newFiles = [...prev, ...newEntries];
-
-				if (newFiles.length > MAX_FILES) {
-					toast.error(t("max_files_exceeded"), {
-						description: t("max_files_exceeded_desc", { max: MAX_FILES }),
-					});
-					return prev;
-				}
-
-				const newTotalSize = newFiles.reduce((sum, entry) => sum + entry.file.size, 0);
-				if (newTotalSize > MAX_TOTAL_SIZE_BYTES) {
-					toast.error(t("max_size_exceeded"), {
-						description: t("max_size_exceeded_desc", { max: MAX_TOTAL_SIZE_MB }),
-					});
-					return prev;
-				}
-
-				return newFiles;
+				return [...prev, ...newEntries];
 			});
 		},
 		[t]
 	);
 
+	const onDrop = useCallback(
+		(acceptedFiles: File[]) => {
+			addFiles(acceptedFiles);
+		},
+		[addFiles]
+	);
+
 	const { getRootProps, getInputProps, isDragActive } = useDropzone({
 		onDrop,
 		accept: acceptedFileTypes,
-		maxSize: 50 * 1024 * 1024, // 50MB per file
+		// No maxSize: dropzone rejects oversized files silently; addFiles enforces it with a toast.
 		noClick: false,
-		disabled: files.length >= MAX_FILES,
 	});
 
-	// Handle file input click to prevent event bubbling that might reopen dialog
 	const handleFileInputClick = useCallback((e: React.MouseEvent<HTMLInputElement>) => {
 		e.stopPropagation();
 	}, []);
 
+	const handleFolderChange = useCallback(
+		(e: ChangeEvent<HTMLInputElement>) => {
+			const fileList = e.target.files;
+			if (!fileList || fileList.length === 0) return;
+			// Keep files whose final extension (lower-cased, with leading dot) is in the supported set.
+			const folderFiles = Array.from(fileList).filter((f) => {
+				const ext = f.name.includes(".") ? `.${f.name.split(".").pop()?.toLowerCase()}` : "";
+				return ext !== "" && supportedExtensionsSet.has(ext);
+			});
+
+			if (folderFiles.length === 0) {
+				toast.error(t("no_supported_files_in_folder"));
+				e.target.value = "";
+				return;
+			}
+			// Value is cleared after handling (presumably so re-picking the same folder fires onChange).
+			addFiles(folderFiles);
+			e.target.value = "";
+		},
+		[addFiles, supportedExtensionsSet, t]
+	);
+
 	const formatFileSize = (bytes: number) => {
 		if (bytes === 0) return "0 Bytes";
 		const k = 1024;
@@ -198,15 +223,6 @@ export function DocumentUploadTab({
 
 	const totalFileSize = files.reduce((total, entry) => total + entry.file.size, 0);
 
-	// Check if limits are reached
-	const isFileCountLimitReached = files.length >= MAX_FILES;
-	const isSizeLimitReached = totalFileSize >= MAX_TOTAL_SIZE_BYTES;
-	const remainingFiles = MAX_FILES - files.length;
-	const remainingSizeMB = Math.max(
-		0,
-		(MAX_TOTAL_SIZE_BYTES - totalFileSize) / (1024 * 1024)
-	).toFixed(1);
-
 	// Track accordion state changes
 	const handleAccordionChange = useCallback(
 		(value: string) => {
@@ -257,11 +273,21 @@ export function DocumentUploadTab({
 			<Alert className="border border-border bg-slate-400/5 dark:bg-white/5">
 				<Info className="h-4 w-4 shrink-0 mt-0.5" />
 				<AlertDescription className="text-xs sm:text-sm leading-relaxed pt-0.5">
-					{t("file_size_limit")}{" "}
-					{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}
+					{t("file_size_limit", { maxMB: MAX_FILE_SIZE_MB })}{" "}
+					{t("upload_limits")}
 				</AlertDescription>
 			</Alert>
 
+			{/* Hidden folder input */}
+			<input
+				ref={folderInputRef}
+				type="file"
+				className="hidden"
+				onChange={handleFolderChange}
+				multiple
+				{...({ webkitdirectory: "", directory: "" } as React.InputHTMLAttributes<HTMLInputElement>)}
+			/>
+
 			<Card className={`relative overflow-hidden ${cardClass}`}>
 				<div className="absolute inset-0 [mask-image:radial-gradient(ellipse_at_center,white,transparent)] opacity-30">
 					<GridPattern />
@@ -269,11 +295,7 @@ export function DocumentUploadTab({
 				<CardContent className="p-4 sm:p-10 relative z-10">
 					<div
 						{...getRootProps()}
-						className={`flex flex-col items-center justify-center min-h-[200px] sm:min-h-[300px] border-2 border-dashed rounded-lg transition-colors ${
-							isFileCountLimitReached || isSizeLimitReached
-								? "border-destructive/50 bg-destructive/5 cursor-not-allowed"
-								: "border-border hover:border-primary/50 cursor-pointer"
-						}`}
+						className="flex flex-col items-center justify-center min-h-[200px] sm:min-h-[300px] border-2 border-dashed rounded-lg transition-colors border-border hover:border-primary/50 cursor-pointer"
 					>
 						<input
 							{...getInputProps()}
@@ -281,19 +303,7 @@ export function DocumentUploadTab({
 							className="hidden"
 							onClick={handleFileInputClick}
 						/>
-						{isFileCountLimitReached ? (
-							<div className="flex flex-col items-center gap-2 sm:gap-4 text-center px-4">
-								<Upload className="h-8 w-8 sm:h-12 sm:w-12 text-destructive/70" />
-								<div>
-									<p className="text-sm sm:text-lg font-medium text-destructive">
-										{t("file_limit_reached")}
-									</p>
-									<p className="text-xs sm:text-sm text-muted-foreground mt-1">
-										{t("file_limit_reached_desc", { max: MAX_FILES })}
-									</p>
-								</div>
-							</div>
-						) : isDragActive ? (
+						{isDragActive ? (
 							<div className="flex flex-col items-center gap-2 sm:gap-4">
 								<Upload className="h-8 w-8 sm:h-12 sm:w-12 text-primary" />
 								<p className="text-sm sm:text-lg font-medium text-primary">{t("drop_files")}</p>
@@ -305,29 +315,35 @@ export function DocumentUploadTab({
 									<p className="text-sm sm:text-lg font-medium">{t("drag_drop")}</p>
 									<p className="text-xs sm:text-sm text-muted-foreground mt-1">{t("or_browse")}</p>
 								</div>
-								{files.length > 0 && (
-									<p className="text-xs text-muted-foreground">
-										{t("remaining_capacity", { files: remainingFiles, sizeMB: remainingSizeMB })}
-									</p>
-								)}
-							</div>
-						)}
-						{!isFileCountLimitReached && (
-							<div className="mt-2 sm:mt-4">
-								<Button
-									variant="secondary"
-									size="sm"
-									className="text-xs sm:text-sm"
-									onClick={(e) => {
-										e.stopPropagation();
-										e.preventDefault();
-										fileInputRef.current?.click();
-									}}
-								>
-									{t("browse_files")}
-								</Button>
 							</div>
 						)}
+						<div className="mt-2 sm:mt-4 flex gap-2">
+							<Button
+								variant="secondary"
+								size="sm"
+								className="text-xs sm:text-sm"
+								onClick={(e) => {
+									e.stopPropagation();
+									e.preventDefault();
+									fileInputRef.current?.click();
+								}}
+							>
+								{t("browse_files")}
+							</Button>
+							<Button
+								variant="outline"
+								size="sm"
+								className="text-xs sm:text-sm"
+								onClick={(e) => {
+									e.stopPropagation();
+									e.preventDefault();
+									folderInputRef.current?.click();
+								}}
+							>
+								<FolderOpen className="h-4 w-4 mr-1.5" />
+								{t("browse_folder")}
+							</Button>
+						</div>
 					</div>
 				</CardContent>
 			</Card>
diff --git a/surfsense_web/contracts/types/document.types.ts b/surfsense_web/contracts/types/document.types.ts
index 1a3326bae..f5431aecb 100644
--- a/surfsense_web/contracts/types/document.types.ts
+++ b/surfsense_web/contracts/types/document.types.ts
@@ -39,6 +39,7 @@ export const document = z.object({
 	document_type: documentTypeEnum,
 	document_metadata: z.record(z.string(), z.any()),
 	content: z.string(),
+	content_preview: z.string().optional().default(""),
 	content_hash: z.string(),
 	unique_identifier_hash: z.string().nullable(),
 	created_at: z.string(),
@@ -69,6 +70,8 @@ export const documentWithChunks = document.extend({
 			created_at: z.string(),
 		})
 	),
+	total_chunks: z.number().optional().default(0),
+	chunk_start_index: z.number().optional().default(0),
 });
 
 /**
@@ -243,10 +246,36 @@ export const getDocumentTypeCountsResponse = z.record(z.string(), z.number());
  */
 export const getDocumentByChunkRequest = z.object({
 	chunk_id: z.number(),
+	chunk_window: z.number().optional(),
 });
 
 export const getDocumentByChunkResponse = documentWithChunks;
 
+/**
+ * Get paginated chunks for a document
+ */
+export const getDocumentChunksRequest = z.object({
+	document_id: z.number(),
+	page: z.number().optional().default(0),
+	page_size: z.number().optional().default(20),
+	start_offset: z.number().optional(),
+});
+
+export const chunkRead = z.object({
+	id: z.number(),
+	content: z.string(),
+	document_id: z.number(),
+	created_at: z.string(),
+});
+
+export const getDocumentChunksResponse = z.object({
+	items: z.array(chunkRead),
+	total: z.number(),
+	page: z.number(),
+	page_size: z.number(),
+	has_more: z.boolean(),
+});
+
 /**
  * Get Surfsense docs by chunk
  */
@@ -328,3 +357,6 @@ export type GetSurfsenseDocsByChunkRequest = z.infer<typeof getSurfsenseDocsByCh
 export type GetSurfsenseDocsByChunkResponse = z.infer<typeof getSurfsenseDocsByChunkResponse>;
 export type GetSurfsenseDocsRequest = z.infer<typeof getSurfsenseDocsRequest>;
 export type GetSurfsenseDocsResponse = z.infer<typeof getSurfsenseDocsResponse>;
+export type GetDocumentChunksRequest = z.infer<typeof getDocumentChunksRequest>;
+export type GetDocumentChunksResponse = z.infer<typeof getDocumentChunksResponse>;
+export type ChunkRead = z.infer<typeof chunkRead>;
diff --git a/surfsense_web/lib/apis/documents-api.service.ts b/surfsense_web/lib/apis/documents-api.service.ts
index 14a247032..71fa58852 100644
--- a/surfsense_web/lib/apis/documents-api.service.ts
+++ b/surfsense_web/lib/apis/documents-api.service.ts
@@ -6,6 +6,7 @@ import {
 	deleteDocumentRequest,
 	deleteDocumentResponse,
 	type GetDocumentByChunkRequest,
+	type GetDocumentChunksRequest,
 	type GetDocumentRequest,
 	type GetDocumentsRequest,
 	type GetDocumentsStatusRequest,
@@ -13,6 +14,8 @@ import {
 	type GetSurfsenseDocsRequest,
 	getDocumentByChunkRequest,
 	getDocumentByChunkResponse,
+	getDocumentChunksRequest,
+	getDocumentChunksResponse,
 	getDocumentRequest,
 	getDocumentResponse,
 	getDocumentsRequest,
@@ -295,23 +298,52 @@ class DocumentsApiService {
 	};
 
 	/**
-	 * Get document by chunk ID (includes all chunks)
+	 * Get document by chunk ID (includes a window of chunks around the cited one)
 	 */
 	getDocumentByChunk = async (request: GetDocumentByChunkRequest) => {
-		// Validate the request
 		const parsedRequest = getDocumentByChunkRequest.safeParse(request);
 
 		if (!parsedRequest.success) {
 			console.error("Invalid request:", parsedRequest.error);
 
-			// Format a user friendly error message
 			const errorMessage = parsedRequest.error.issues.map((issue) => issue.message).join(", ");
 			throw new ValidationError(`Invalid request: ${errorMessage}`);
 		}
 
+		// Build the URL from the validated payload (as getDocumentChunks does), not the raw argument.
+		const params = new URLSearchParams();
+		if (parsedRequest.data.chunk_window != null) {
+			params.set("chunk_window", String(parsedRequest.data.chunk_window));
+		}
+		const qs = params.toString();
+		const url = `/api/v1/documents/by-chunk/${parsedRequest.data.chunk_id}${qs ? `?${qs}` : ""}`;
+		return baseApiService.get(url, getDocumentByChunkResponse);
+	};
+
+	/**
+	 * Get paginated chunks for a document
+	 */
+	getDocumentChunks = async (request: GetDocumentChunksRequest) => {
+		const parsedRequest = getDocumentChunksRequest.safeParse(request);
+
+		if (!parsedRequest.success) {
+			console.error("Invalid request:", parsedRequest.error);
+
+			const errorMessage = parsedRequest.error.issues.map((issue) => issue.message).join(", ");
+			throw new ValidationError(`Invalid request: ${errorMessage}`);
+		}
+		// page and page_size are always set here: the request schema defaults them when omitted.
+		const params = new URLSearchParams({
+			page: String(parsedRequest.data.page),
+			page_size: String(parsedRequest.data.page_size),
+		});
+		if (parsedRequest.data.start_offset != null) {
+			params.set("start_offset", String(parsedRequest.data.start_offset));
+		}
+
 		return baseApiService.get(
-			`/api/v1/documents/by-chunk/${request.chunk_id}`,
-			getDocumentByChunkResponse
+			`/api/v1/documents/${parsedRequest.data.document_id}/chunks?${params}`,
+			getDocumentChunksResponse
 		);
 	};
 
diff --git a/surfsense_web/messages/en.json b/surfsense_web/messages/en.json
index 53f80ea5f..cacaec557 100644
--- a/surfsense_web/messages/en.json
+++ b/surfsense_web/messages/en.json
@@ -376,12 +376,13 @@
 	"upload_documents": {
 		"title": "Upload Documents",
 		"subtitle": "Upload your files to make them searchable and accessible through AI-powered conversations.",
-		"file_size_limit": "Maximum file size: 50MB per file.",
-		"upload_limits": "Upload limit: {maxFiles} files, {maxSizeMB}MB total.",
-		"drop_files": "Drop files here",
-		"drag_drop": "Drag & drop files here",
-		"or_browse": "or click to browse",
+		"file_size_limit": "Maximum file size: {maxMB}MB per file.",
+		"upload_limits": "Upload files or entire folders",
+		"drop_files": "Drop files or folders here",
+		"drag_drop": "Drag & drop files or folders here",
+		"or_browse": "or click to browse files and folders",
 		"browse_files": "Browse Files",
+		"browse_folder": "Browse Folder",
 		"selected_files": "Selected Files ({count})",
 		"total_size": "Total size",
 		"clear_all": "Clear all",
@@ -394,13 +395,9 @@
 		"upload_error_desc": "Error uploading files",
 		"supported_file_types": "Supported File Types",
 		"file_types_desc": "These file types are supported based on your current ETL service configuration.",
-		"max_files_exceeded": "File Limit Exceeded",
-		"max_files_exceeded_desc": "You can upload a maximum of {max} files at a time.",
-		"max_size_exceeded": "Size Limit Exceeded",
-		"max_size_exceeded_desc": "Total file size cannot exceed {max}MB.",
-		"file_limit_reached": "Maximum Files Reached",
-		"file_limit_reached_desc": "Remove some files to add more (max {max} files).",
-		"remaining_capacity": "{files} files remaining • {sizeMB}MB available"
+		"file_too_large": "File Too Large",
+		"file_too_large_desc": "\"{name}\" exceeds the {maxMB}MB per-file limit.",
+		"no_supported_files_in_folder": "No supported file types found in the selected folder."
 	},
 	"add_webpage": {
 		"title": "Add Webpages for Crawling",
diff --git a/surfsense_web/messages/es.json b/surfsense_web/messages/es.json
index 36e627295..7670e76df 100644
--- a/surfsense_web/messages/es.json
+++ b/surfsense_web/messages/es.json
@@ -376,12 +376,13 @@
 	"upload_documents": {
 		"title": "Subir documentos",
 		"subtitle": "Sube tus archivos para hacerlos buscables y accesibles a través de conversaciones con IA.",
-		"file_size_limit": "Tamaño máximo de archivo: 50 MB por archivo.",
-		"upload_limits": "Límite de subida: {maxFiles} archivos, {maxSizeMB} MB en total.",
-		"drop_files": "Suelta los archivos aquí",
-		"drag_drop": "Arrastra y suelta archivos aquí",
-		"or_browse": "o haz clic para explorar",
+		"file_size_limit": "Tamaño máximo de archivo: {maxMB} MB por archivo.",
+		"upload_limits": "Sube archivos o carpetas enteras",
+		"drop_files": "Suelta archivos o carpetas aquí",
+		"drag_drop": "Arrastra y suelta archivos o carpetas aquí",
+		"or_browse": "o haz clic para explorar archivos y carpetas",
 		"browse_files": "Explorar archivos",
+		"browse_folder": "Explorar carpeta",
 		"selected_files": "Archivos seleccionados ({count})",
 		"total_size": "Tamaño total",
 		"clear_all": "Limpiar todo",
@@ -394,13 +395,9 @@
 		"upload_error_desc": "Error al subir archivos",
 		"supported_file_types": "Tipos de archivo soportados",
 		"file_types_desc": "Estos tipos de archivo son soportados según la configuración actual de tu servicio ETL.",
-		"max_files_exceeded": "Límite de archivos excedido",
-		"max_files_exceeded_desc": "Puedes subir un máximo de {max} archivos a la vez.",
-		"max_size_exceeded": "Límite de tamaño excedido",
-		"max_size_exceeded_desc": "El tamaño total de los archivos no puede exceder {max} MB.",
-		"file_limit_reached": "Máximo de archivos alcanzado",
-		"file_limit_reached_desc": "Elimina algunos archivos para agregar más (máximo {max} archivos).",
-		"remaining_capacity": "{files} archivos restantes • {sizeMB} MB disponibles"
+		"file_too_large": "Archivo demasiado grande",
+		"file_too_large_desc": "\"{name}\" excede el límite de {maxMB} MB por archivo.",
+		"no_supported_files_in_folder": "No se encontraron tipos de archivo compatibles en la carpeta seleccionada."
 	},
 	"add_webpage": {
 		"title": "Agregar páginas web para rastreo",
diff --git a/surfsense_web/messages/hi.json b/surfsense_web/messages/hi.json
index fd51acdc2..cbcff0b30 100644
--- a/surfsense_web/messages/hi.json
+++ b/surfsense_web/messages/hi.json
@@ -376,12 +376,13 @@
 	"upload_documents": {
 		"title": "दस्तावेज़ अपलोड करें",
 		"subtitle": "AI-संचालित बातचीत के माध्यम से अपनी फ़ाइलों को खोजने योग्य और सुलभ बनाने के लिए अपलोड करें।",
-		"file_size_limit": "अधिकतम फ़ाइल आकार: प्रति फ़ाइल 50MB।",
-		"upload_limits": "अपलोड सीमा: {maxFiles} फ़ाइलें, कुल {maxSizeMB}MB।",
-		"drop_files": "फ़ाइलें यहां छोड़ें",
-		"drag_drop": "फ़ाइलें यहां खींचें और छोड़ें",
-		"or_browse": "या ब्राउज़ करने के लिए क्लिक करें",
+		"file_size_limit": "अधिकतम फ़ाइल आकार: प्रति फ़ाइल {maxMB}MB।",
+		"upload_limits": "फ़ाइलें या पूरे फ़ोल्डर अपलोड करें",
+		"drop_files": "फ़ाइलें या फ़ोल्डर यहां छोड़ें",
+		"drag_drop": "फ़ाइलें या फ़ोल्डर यहां खींचें और छोड़ें",
+		"or_browse": "या फ़ाइलें और फ़ोल्डर ब्राउज़ करने के लिए क्लिक करें",
 		"browse_files": "फ़ाइलें ब्राउज़ करें",
+		"browse_folder": "फ़ोल्डर ब्राउज़ करें",
 		"selected_files": "चयनित फ़ाइलें ({count})",
 		"total_size": "कुल आकार",
 		"clear_all": "सभी साफ करें",
@@ -394,13 +395,9 @@
 		"upload_error_desc": "फ़ाइलें अपलोड करने में त्रुटि",
 		"supported_file_types": "समर्थित फ़ाइल प्रकार",
 		"file_types_desc": "ये फ़ाइल प्रकार आपकी वर्तमान ETL सेवा कॉन्फ़िगरेशन के आधार पर समर्थित हैं।",
-		"max_files_exceeded": "फ़ाइल सीमा पार हो गई",
-		"max_files_exceeded_desc": "आप एक बार में अधिकतम {max} फ़ाइलें अपलोड कर सकते हैं।",
-		"max_size_exceeded": "आकार सीमा पार हो गई",
-		"max_size_exceeded_desc": "कुल फ़ाइल आकार {max}MB से अधिक नहीं हो सकता।",
-		"file_limit_reached": "अधिकतम फ़ाइलें पहुंच गई",
-		"file_limit_reached_desc": "और जोड़ने के लिए कुछ फ़ाइलें हटाएं (अधिकतम {max} फ़ाइलें)।",
-		"remaining_capacity": "{files} फ़ाइलें शेष • {sizeMB}MB उपलब्ध"
+		"file_too_large": "फ़ाइल बहुत बड़ी है",
+		"file_too_large_desc": "\"{name}\" प्रति फ़ाइल {maxMB}MB की सीमा से अधिक है।",
+		"no_supported_files_in_folder": "चयनित फ़ोल्डर में कोई समर्थित फ़ाइल प्रकार नहीं मिला।"
 	},
 	"add_webpage": {
 		"title": "क्रॉलिंग के लिए वेबपेज जोड़ें",
diff --git a/surfsense_web/messages/pt.json b/surfsense_web/messages/pt.json
index e26499f90..ec72ef0da 100644
--- a/surfsense_web/messages/pt.json
+++ b/surfsense_web/messages/pt.json
@@ -376,12 +376,13 @@
 	"upload_documents": {
 		"title": "Enviar documentos",
 		"subtitle": "Envie seus arquivos para torná-los pesquisáveis e acessíveis através de conversas com IA.",
-		"file_size_limit": "Tamanho máximo do arquivo: 50 MB por arquivo.",
-		"upload_limits": "Limite de envio: {maxFiles} arquivos, {maxSizeMB} MB no total.",
-		"drop_files": "Solte os arquivos aqui",
-		"drag_drop": "Arraste e solte arquivos aqui",
-		"or_browse": "ou clique para navegar",
+		"file_size_limit": "Tamanho máximo do arquivo: {maxMB} MB por arquivo.",
+		"upload_limits": "Envie arquivos ou pastas inteiras",
+		"drop_files": "Solte arquivos ou pastas aqui",
+		"drag_drop": "Arraste e solte arquivos ou pastas aqui",
+		"or_browse": "ou clique para navegar arquivos e pastas",
 		"browse_files": "Navegar arquivos",
+		"browse_folder": "Navegar pasta",
 		"selected_files": "Arquivos selecionados ({count})",
 		"total_size": "Tamanho total",
 		"clear_all": "Limpar tudo",
@@ -394,13 +395,9 @@
 		"upload_error_desc": "Erro ao enviar arquivos",
 		"supported_file_types": "Tipos de arquivo suportados",
 		"file_types_desc": "Estes tipos de arquivo são suportados com base na configuração atual do seu serviço ETL.",
-		"max_files_exceeded": "Limite de arquivos excedido",
-		"max_files_exceeded_desc": "Você pode enviar no máximo {max} arquivos de uma vez.",
-		"max_size_exceeded": "Limite de tamanho excedido",
-		"max_size_exceeded_desc": "O tamanho total dos arquivos não pode exceder {max} MB.",
-		"file_limit_reached": "Máximo de arquivos atingido",
-		"file_limit_reached_desc": "Remova alguns arquivos para adicionar mais (máximo {max} arquivos).",
-		"remaining_capacity": "{files} arquivos restantes • {sizeMB} MB disponíveis"
+		"file_too_large": "Arquivo muito grande",
+		"file_too_large_desc": "\"{name}\" excede o limite de {maxMB} MB por arquivo.",
+		"no_supported_files_in_folder": "Nenhum tipo de arquivo suportado encontrado na pasta selecionada."
 	},
 	"add_webpage": {
 		"title": "Adicionar páginas web para rastreamento",
diff --git a/surfsense_web/messages/zh.json b/surfsense_web/messages/zh.json
index 819432410..db634dfd9 100644
--- a/surfsense_web/messages/zh.json
+++ b/surfsense_web/messages/zh.json
@@ -360,12 +360,13 @@
 	"upload_documents": {
 		"title": "上传文档",
 		"subtitle": "上传您的文件，使其可通过 AI 对话进行搜索和访问。",
-		"file_size_limit": "最大文件大小：每个文件 50MB。",
-		"upload_limits": "上传限制：最多 {maxFiles} 个文件，总大小不超过 {maxSizeMB}MB。",
-		"drop_files": "放下文件到这里",
-		"drag_drop": "拖放文件到这里",
-		"or_browse": "或点击浏览",
+		"file_size_limit": "最大文件大小：每个文件 {maxMB}MB。",
+		"upload_limits": "上传文件或整个文件夹",
+		"drop_files": "将文件或文件夹拖放到此处",
+		"drag_drop": "将文件或文件夹拖放到此处",
+		"or_browse": "或点击浏览文件和文件夹",
 		"browse_files": "浏览文件",
+		"browse_folder": "浏览文件夹",
 		"selected_files": "已选择的文件 ({count})",
 		"total_size": "总大小",
 		"clear_all": "全部清除",
@@ -378,13 +379,9 @@
 		"upload_error_desc": "上传文件时出错",
 		"supported_file_types": "支持的文件类型",
 		"file_types_desc": "根据您当前的 ETL 服务配置支持这些文件类型。",
-		"max_files_exceeded": "超过文件数量限制",
-		"max_files_exceeded_desc": "一次最多只能上传 {max} 个文件。",
-		"max_size_exceeded": "超过文件大小限制",
-		"max_size_exceeded_desc": "文件总大小不能超过 {max}MB。",
-		"file_limit_reached": "已达到最大文件数量",
-		"file_limit_reached_desc": "移除一些文件以添加更多（最多 {max} 个文件）。",
-		"remaining_capacity": "剩余 {files} 个文件名额 • 可用 {sizeMB}MB"
+		"file_too_large": "文件过大",
+		"file_too_large_desc": "\"{name}\" 超过了每个文件 {maxMB}MB 的限制。",
+		"no_supported_files_in_folder": "所选文件夹中没有找到支持的文件类型。"
 	},
 	"add_webpage": {
 		"title": "添加网页爬取",

From eb1785027471dbce67a0b9e09f8ce6791c57c869 Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Thu, 2 Apr 2026 19:45:28 -0700
Subject: [PATCH 064/202] chore: linting

---
 .../components/DocumentsTableShell.tsx        |  60 ++++----
 .../new-chat/[[...chat_id]]/page.tsx          |   2 +-
 surfsense_web/app/docs/[[...slug]]/page.tsx   |   2 +-
 surfsense_web/app/error.tsx                   |   1 -
 .../comment-composer/comment-composer.tsx     |   5 +-
 .../components/editor-panel/editor-panel.tsx  |   4 +-
 .../layout/ui/tabs/DocumentTabContent.tsx     |   4 +-
 surfsense_web/components/markdown-viewer.tsx  |   3 +-
 .../new-chat/source-detail-panel.tsx          | 141 ++++++++++--------
 .../components/sources/DocumentUploadTab.tsx  |   3 +-
 surfsense_web/components/ui/checkbox.tsx      |   2 +-
 surfsense_web/components/ui/dropdown-menu.tsx |   2 +-
 surfsense_web/components/ui/toggle-group.tsx  |   2 +-
 surfsense_web/components/ui/toggle.tsx        |   2 +-
 .../query-client/query-client.provider.tsx    |   2 +-
 15 files changed, 127 insertions(+), 108 deletions(-)

diff --git a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
index 1c246ed71..ceef9f2e1 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
@@ -947,36 +947,36 @@ export function DocumentsTableShell({
 							WebkitMaskImage: `linear-gradient(to bottom, ${previewScrollPos === "top" ? "black" : "transparent"}, black 16px, black calc(100% - 16px), ${previewScrollPos === "bottom" ? "black" : "transparent"})`,
 						}}
 					>
-					{viewingLoading ? (
-						<div className="flex items-center justify-center py-12">
-							<Spinner size="lg" className="text-muted-foreground" />
-						</div>
-					) : (
-						<>
-							<MarkdownViewer content={viewingContent} maxLength={50_000} />
-							{viewingDoc && (
-								<div className="mt-4 flex justify-center">
-									<Button
-										variant="outline"
-										size="sm"
-										onClick={() => {
-											if (viewingDoc) {
-												openEditor({
-													documentId: viewingDoc.id,
-													searchSpaceId: Number(searchSpaceId),
-													title: viewingDoc.title,
-												});
-												handleCloseViewer();
-											}
-										}}
-									>
-										<Eye className="h-3.5 w-3.5 mr-1.5" />
-										View full document
-									</Button>
-								</div>
-							)}
-						</>
-					)}
+						{viewingLoading ? (
+							<div className="flex items-center justify-center py-12">
+								<Spinner size="lg" className="text-muted-foreground" />
+							</div>
+						) : (
+							<>
+								<MarkdownViewer content={viewingContent} maxLength={50_000} />
+								{viewingDoc && (
+									<div className="mt-4 flex justify-center">
+										<Button
+											variant="outline"
+											size="sm"
+											onClick={() => {
+												if (viewingDoc) {
+													openEditor({
+														documentId: viewingDoc.id,
+														searchSpaceId: Number(searchSpaceId),
+														title: viewingDoc.title,
+													});
+													handleCloseViewer();
+												}
+											}}
+										>
+											<Eye className="h-3.5 w-3.5 mr-1.5" />
+											View full document
+										</Button>
+									</div>
+								)}
+							</>
+						)}
 					</div>
 				</DrawerContent>
 			</Drawer>
diff --git a/surfsense_web/app/dashboard/[search_space_id]/new-chat/[[...chat_id]]/page.tsx b/surfsense_web/app/dashboard/[search_space_id]/new-chat/[[...chat_id]]/page.tsx
index 9e9374dd6..ac1fcdaf9 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/new-chat/[[...chat_id]]/page.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/new-chat/[[...chat_id]]/page.tsx
@@ -232,7 +232,7 @@ export default function NewChatPage() {
 				const prevById = new Map(prev.map((m) => [m.id, m]));
 
 				return syncedMessages.map((msg) => {
-					const member = msg.author_id ? memberById.get(msg.author_id) ?? null : null;
+					const member = msg.author_id ? (memberById.get(msg.author_id) ?? null) : null;
 
 					// Preserve existing author info if member lookup fails (e.g., cloned chats)
 					const existingMsg = prevById.get(`msg-${msg.id}`);
diff --git a/surfsense_web/app/docs/[[...slug]]/page.tsx b/surfsense_web/app/docs/[[...slug]]/page.tsx
index 166131f90..0905be8a0 100644
--- a/surfsense_web/app/docs/[[...slug]]/page.tsx
+++ b/surfsense_web/app/docs/[[...slug]]/page.tsx
@@ -1,8 +1,8 @@
 import { DocsBody, DocsDescription, DocsPage, DocsTitle } from "fumadocs-ui/page";
 import { notFound } from "next/navigation";
+import { cache } from "react";
 import { source } from "@/lib/source";
 import { getMDXComponents } from "@/mdx-components";
-import { cache } from "react";
 
 const getDocPage = cache((slug?: string[]) => {
 	return source.getPage(slug);
diff --git a/surfsense_web/app/error.tsx b/surfsense_web/app/error.tsx
index 3935f84d5..70c3d9632 100644
--- a/surfsense_web/app/error.tsx
+++ b/surfsense_web/app/error.tsx
@@ -1,6 +1,5 @@
 "use client";
 
-
 import { useEffect } from "react";
 
 export default function ErrorPage({
diff --git a/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx b/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx
index bee3f2da6..3d6ea384b 100644
--- a/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx
+++ b/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx
@@ -16,10 +16,7 @@ function convertDisplayToData(displayContent: string, mentions: InsertedMention[
 	const sortedMentions = [...mentions].sort((a, b) => b.displayName.length - a.displayName.length);
 
 	const mentionPatterns = sortedMentions.map((mention) => ({
-		pattern: new RegExp(
-			`@${escapeRegExp(mention.displayName)}(?=\\s|$|[.,!?;:])`,
-			"g"
-		),
+		pattern: new RegExp(`@${escapeRegExp(mention.displayName)}(?=\\s|$|[.,!?;:])`, "g"),
 		dataFormat: `@[${mention.id}]`,
 	}));
 
diff --git a/surfsense_web/components/editor-panel/editor-panel.tsx b/surfsense_web/components/editor-panel/editor-panel.tsx
index 4b7079aef..3f167dc24 100644
--- a/surfsense_web/components/editor-panel/editor-panel.tsx
+++ b/surfsense_web/components/editor-panel/editor-panel.tsx
@@ -223,7 +223,9 @@ export function EditorPanelContent({
 							<FileText className="size-4" />
 							<AlertDescription className="flex items-center justify-between gap-4">
 								<span>
-									This document is too large for the editor ({Math.round((editorDoc.content_size_bytes ?? 0) / 1024 / 1024)}MB, {editorDoc.chunk_count ?? 0} chunks). Showing a preview below.
+									This document is too large for the editor (
+									{Math.round((editorDoc.content_size_bytes ?? 0) / 1024 / 1024)}MB,{" "}
+									{editorDoc.chunk_count ?? 0} chunks). Showing a preview below.
 								</span>
 								<Button
 									variant="outline"
diff --git a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
index ad48c89de..16457404f 100644
--- a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
+++ b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
@@ -253,7 +253,9 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 								<FileText className="size-4" />
 								<AlertDescription className="flex items-center justify-between gap-4">
 									<span>
-										This document is too large for the editor ({Math.round((doc.content_size_bytes ?? 0) / 1024 / 1024)}MB, {doc.chunk_count ?? 0} chunks). Showing a preview below.
+										This document is too large for the editor (
+										{Math.round((doc.content_size_bytes ?? 0) / 1024 / 1024)}MB,{" "}
+										{doc.chunk_count ?? 0} chunks). Showing a preview below.
 									</span>
 									<Button
 										variant="outline"
diff --git a/surfsense_web/components/markdown-viewer.tsx b/surfsense_web/components/markdown-viewer.tsx
index abd999301..a568bd698 100644
--- a/surfsense_web/components/markdown-viewer.tsx
+++ b/surfsense_web/components/markdown-viewer.tsx
@@ -176,7 +176,8 @@ export function MarkdownViewer({ content, className, maxLength }: MarkdownViewer
 			</Streamdown>
 			{isTruncated && (
 				<p className="mt-4 text-sm text-muted-foreground italic">
-					Content truncated ({Math.round(content.length / 1024)}KB total). Showing first {Math.round(maxLength / 1024)}KB.
+					Content truncated ({Math.round(content.length / 1024)}KB total). Showing first{" "}
+					{Math.round(maxLength / 1024)}KB.
 				</p>
 			)}
 		</div>
diff --git a/surfsense_web/components/new-chat/source-detail-panel.tsx b/surfsense_web/components/new-chat/source-detail-panel.tsx
index c17616c53..bff088971 100644
--- a/surfsense_web/components/new-chat/source-detail-panel.tsx
+++ b/surfsense_web/components/new-chat/source-detail-panel.tsx
@@ -1,7 +1,17 @@
 "use client";
 
 import { useQuery } from "@tanstack/react-query";
-import { BookOpen, ChevronDown, ChevronUp, ExternalLink, FileText, Hash, Loader2, Sparkles, X } from "lucide-react";
+import {
+	BookOpen,
+	ChevronDown,
+	ChevronUp,
+	ExternalLink,
+	FileText,
+	Hash,
+	Loader2,
+	Sparkles,
+	X,
+} from "lucide-react";
 import { AnimatePresence, motion, useReducedMotion } from "motion/react";
 import { useTranslations } from "next-intl";
 import type React from "react";
@@ -56,48 +66,52 @@ interface ChunkCardProps {
 }
 
 const ChunkCard = memo(
-	forwardRef<HTMLDivElement, ChunkCardProps>(({ chunk, localIndex, chunkNumber, totalChunks, isCited }, ref) => {
-		return (
-			<div
-				ref={ref}
-				data-chunk-index={localIndex}
-				className={cn(
-					"group relative rounded-2xl border-2 transition-all duration-300",
-					isCited
-						? "bg-linear-to-br from-primary/5 via-primary/10 to-primary/5 border-primary shadow-lg shadow-primary/10"
-						: "bg-card border-border/50 hover:border-border hover:shadow-md"
-				)}
-			>
-				{isCited && <div className="absolute inset-0 rounded-2xl bg-primary/5 blur-xl -z-10" />}
-
-				<div className="flex items-center justify-between px-5 py-4 border-b border-border/50">
-					<div className="flex items-center gap-3">
-						<div
-							className={cn(
-								"flex items-center justify-center w-8 h-8 rounded-full text-sm font-semibold transition-colors",
-								isCited
-									? "bg-primary text-primary-foreground"
-									: "bg-muted text-muted-foreground group-hover:bg-muted/80"
-							)}
-						>
-							{chunkNumber}
-						</div>
-						<span className="text-sm text-muted-foreground">Chunk {chunkNumber} of {totalChunks}</span>
-					</div>
-					{isCited && (
-						<Badge variant="default" className="gap-1.5 px-3 py-1">
-							<Sparkles className="h-3 w-3" />
-							Cited Source
-						</Badge>
+	forwardRef<HTMLDivElement, ChunkCardProps>(
+		({ chunk, localIndex, chunkNumber, totalChunks, isCited }, ref) => {
+			return (
+				<div
+					ref={ref}
+					data-chunk-index={localIndex}
+					className={cn(
+						"group relative rounded-2xl border-2 transition-all duration-300",
+						isCited
+							? "bg-linear-to-br from-primary/5 via-primary/10 to-primary/5 border-primary shadow-lg shadow-primary/10"
+							: "bg-card border-border/50 hover:border-border hover:shadow-md"
 					)}
-				</div>
+				>
+					{isCited && <div className="absolute inset-0 rounded-2xl bg-primary/5 blur-xl -z-10" />}
 
-				<div className="p-5 overflow-hidden">
-					<MarkdownViewer content={chunk.content} maxLength={100_000} />
+					<div className="flex items-center justify-between px-5 py-4 border-b border-border/50">
+						<div className="flex items-center gap-3">
+							<div
+								className={cn(
+									"flex items-center justify-center w-8 h-8 rounded-full text-sm font-semibold transition-colors",
+									isCited
+										? "bg-primary text-primary-foreground"
+										: "bg-muted text-muted-foreground group-hover:bg-muted/80"
+								)}
+							>
+								{chunkNumber}
+							</div>
+							<span className="text-sm text-muted-foreground">
+								Chunk {chunkNumber} of {totalChunks}
+							</span>
+						</div>
+						{isCited && (
+							<Badge variant="default" className="gap-1.5 px-3 py-1">
+								<Sparkles className="h-3 w-3" />
+								Cited Source
+							</Badge>
+						)}
+					</div>
+
+					<div className="p-5 overflow-hidden">
+						<MarkdownViewer content={chunk.content} maxLength={100_000} />
+					</div>
 				</div>
-			</div>
-		);
-	})
+			);
+		}
+	)
 );
 ChunkCard.displayName = "ChunkCard";
 
@@ -142,11 +156,16 @@ export function SourceDetailPanel({
 		staleTime: 5 * 60 * 1000,
 	});
 
-	const totalChunks = (documentData && "total_chunks" in documentData)
-		? (documentData.total_chunks ?? documentData.chunks.length)
-		: (documentData?.chunks?.length ?? 0);
-	const [beforeChunks, setBeforeChunks] = useState<Array<{ id: number; content: string; created_at: string }>>([]);
-	const [afterChunks, setAfterChunks] = useState<Array<{ id: number; content: string; created_at: string }>>([]);
+	const totalChunks =
+		documentData && "total_chunks" in documentData
+			? (documentData.total_chunks ?? documentData.chunks.length)
+			: (documentData?.chunks?.length ?? 0);
+	const [beforeChunks, setBeforeChunks] = useState<
+		Array<{ id: number; content: string; created_at: string }>
+	>([]);
+	const [afterChunks, setAfterChunks] = useState<
+		Array<{ id: number; content: string; created_at: string }>
+	>([]);
 	const [loadingBefore, setLoadingBefore] = useState(false);
 	const [loadingAfter, setLoadingAfter] = useState(false);
 
@@ -155,8 +174,8 @@ export function SourceDetailPanel({
 		setAfterChunks([]);
 	}, [chunkId, open]);
 
-	const chunkStartIndex = (documentData && "chunk_start_index" in documentData)
-		? (documentData.chunk_start_index ?? 0) : 0;
+	const chunkStartIndex =
+		documentData && "chunk_start_index" in documentData ? (documentData.chunk_start_index ?? 0) : 0;
 	const initialChunks = documentData?.chunks ?? [];
 	const allChunks = [...beforeChunks, ...initialChunks, ...afterChunks];
 	const absoluteStart = chunkStartIndex - beforeChunks.length;
@@ -177,11 +196,11 @@ export function SourceDetailPanel({
 				page_size: count,
 				start_offset: absoluteStart - count,
 			});
-			const existingIds = new Set(allChunks.map(c => c.id));
+			const existingIds = new Set(allChunks.map((c) => c.id));
 			const newChunks = result.items
-				.filter(c => !existingIds.has(c.id))
-				.map(c => ({ id: c.id, content: c.content, created_at: c.created_at }));
-			setBeforeChunks(prev => [...newChunks, ...prev]);
+				.filter((c) => !existingIds.has(c.id))
+				.map((c) => ({ id: c.id, content: c.content, created_at: c.created_at }));
+			setBeforeChunks((prev) => [...newChunks, ...prev]);
 		} catch (err) {
 			console.error("Failed to load earlier chunks:", err);
 		} finally {
@@ -199,11 +218,11 @@ export function SourceDetailPanel({
 				page_size: EXPAND_SIZE,
 				start_offset: absoluteEnd,
 			});
-			const existingIds = new Set(allChunks.map(c => c.id));
+			const existingIds = new Set(allChunks.map((c) => c.id));
 			const newChunks = result.items
-				.filter(c => !existingIds.has(c.id))
-				.map(c => ({ id: c.id, content: c.content, created_at: c.created_at }));
-			setAfterChunks(prev => [...prev, ...newChunks]);
+				.filter((c) => !existingIds.has(c.id))
+				.map((c) => ({ id: c.id, content: c.content, created_at: c.created_at }));
+			setAfterChunks((prev) => [...prev, ...newChunks]);
 		} catch (err) {
 			console.error("Failed to load later chunks:", err);
 		} finally {
@@ -400,12 +419,12 @@ export function SourceDetailPanel({
 									{documentData && "document_type" in documentData
 										? formatDocumentType(documentData.document_type)
 										: sourceType && formatDocumentType(sourceType)}
-								{totalChunks > 0 && (
-									<span className="ml-2">
-										• {totalChunks} chunk{totalChunks !== 1 ? "s" : ""}
-										{allChunks.length < totalChunks && ` (showing ${allChunks.length})`}
-									</span>
-								)}
+									{totalChunks > 0 && (
+										<span className="ml-2">
+											• {totalChunks} chunk{totalChunks !== 1 ? "s" : ""}
+											{allChunks.length < totalChunks && ` (showing ${allChunks.length})`}
+										</span>
+									)}
 								</p>
 							</div>
 							<div className="flex items-center gap-3 shrink-0">
diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index faa042d8e..723a3ad36 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -273,8 +273,7 @@ export function DocumentUploadTab({
 			<Alert className="border border-border bg-slate-400/5 dark:bg-white/5">
 				<Info className="h-4 w-4 shrink-0 mt-0.5" />
 				<AlertDescription className="text-xs sm:text-sm leading-relaxed pt-0.5">
-					{t("file_size_limit", { maxMB: MAX_FILE_SIZE_MB })}{" "}
-					{t("upload_limits")}
+					{t("file_size_limit", { maxMB: MAX_FILE_SIZE_MB })} {t("upload_limits")}
 				</AlertDescription>
 			</Alert>
 
diff --git a/surfsense_web/components/ui/checkbox.tsx b/surfsense_web/components/ui/checkbox.tsx
index 586e3e602..056761547 100644
--- a/surfsense_web/components/ui/checkbox.tsx
+++ b/surfsense_web/components/ui/checkbox.tsx
@@ -1,7 +1,7 @@
 "use client";
 
-import { CheckIcon } from "lucide-react";
 import * as CheckboxPrimitive from "@radix-ui/react-checkbox";
+import { CheckIcon } from "lucide-react";
 import type * as React from "react";
 
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/components/ui/dropdown-menu.tsx b/surfsense_web/components/ui/dropdown-menu.tsx
index 2904b93dd..d387a4592 100644
--- a/surfsense_web/components/ui/dropdown-menu.tsx
+++ b/surfsense_web/components/ui/dropdown-menu.tsx
@@ -1,7 +1,7 @@
 "use client";
 
-import { CheckIcon, ChevronRightIcon, CircleIcon } from "lucide-react";
 import * as DropdownMenuPrimitive from "@radix-ui/react-dropdown-menu";
+import { CheckIcon, ChevronRightIcon, CircleIcon } from "lucide-react";
 import type * as React from "react";
 
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/components/ui/toggle-group.tsx b/surfsense_web/components/ui/toggle-group.tsx
index 33aa433b2..6740fade0 100644
--- a/surfsense_web/components/ui/toggle-group.tsx
+++ b/surfsense_web/components/ui/toggle-group.tsx
@@ -1,7 +1,7 @@
 "use client";
 
-import type { VariantProps } from "class-variance-authority";
 import * as ToggleGroupPrimitive from "@radix-ui/react-toggle-group";
+import type { VariantProps } from "class-variance-authority";
 import * as React from "react";
 import { toggleVariants } from "@/components/ui/toggle";
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/components/ui/toggle.tsx b/surfsense_web/components/ui/toggle.tsx
index f0e68cec9..6a6e24025 100644
--- a/surfsense_web/components/ui/toggle.tsx
+++ b/surfsense_web/components/ui/toggle.tsx
@@ -1,7 +1,7 @@
 "use client";
 
-import { cva, type VariantProps } from "class-variance-authority";
 import * as TogglePrimitive from "@radix-ui/react-toggle";
+import { cva, type VariantProps } from "class-variance-authority";
 import type * as React from "react";
 
 import { cn } from "@/lib/utils";
diff --git a/surfsense_web/lib/query-client/query-client.provider.tsx b/surfsense_web/lib/query-client/query-client.provider.tsx
index 6dc2a4258..30c6d9767 100644
--- a/surfsense_web/lib/query-client/query-client.provider.tsx
+++ b/surfsense_web/lib/query-client/query-client.provider.tsx
@@ -1,6 +1,6 @@
 "use client";
-import dynamic from "next/dynamic";
 import { QueryClientAtomProvider } from "jotai-tanstack-query/react";
+import dynamic from "next/dynamic";
 import { queryClient } from "./client";
 
 const ReactQueryDevtools = dynamic(

From 9a370a37d4b485ca9f25e1f7db74bab951e1ce04 Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Thu, 2 Apr 2026 20:06:02 -0700
Subject: [PATCH 065/202] docs: update README files to highlight SurfSense
 advantages over NotebookLM

- Expanded sections detailing limitations of NotebookLM.
- Added comparison table between SurfSense and Google NotebookLM.
- Enhanced descriptions of SurfSense features and capabilities.
- Updated example links and images for better clarity and relevance.
---
 README.es.md    | 64 +++++++++++++++++++++++++++++++++----------------
 README.hi.md    | 64 +++++++++++++++++++++++++++++++++----------------
 README.md       | 62 ++++++++++++++++++++++++++++++++---------------
 README.pt-BR.md | 64 +++++++++++++++++++++++++++++++++----------------
 README.zh-CN.md | 64 +++++++++++++++++++++++++++++++++----------------
 5 files changed, 219 insertions(+), 99 deletions(-)

diff --git a/README.es.md b/README.es.md
index d61504cd5..b62d2cece 100644
--- a/README.es.md
+++ b/README.es.md
@@ -21,9 +21,28 @@
 </div>
 
 # SurfSense
-Conecta cualquier LLM a tus fuentes de conocimiento internas y chatea con él en tiempo real junto a tu equipo. Alternativa de código abierto a NotebookLM, Perplexity y Glean.
 
-SurfSense es un agente de investigación de IA altamente personalizable, conectado a fuentes externas como motores de búsqueda (SearxNG, Tavily, LinkUp), Google Drive, OneDrive, Dropbox, Slack, Microsoft Teams, Linear, Jira, ClickUp, Confluence, BookStack, Gmail, Notion, YouTube, GitHub, Discord, Airtable, Google Calendar, Luma, Circleback, Elasticsearch, Obsidian y más por venir.
+NotebookLM es una de las mejores y más útiles plataformas de IA que existen, pero una vez que comienzas a usarla regularmente también notas sus limitaciones, que dejan algo que desear.
+
+1. Hay límites en la cantidad de fuentes que puedes agregar en un notebook.
+2. Hay límites en la cantidad de notebooks que puedes tener.
+3. No puedes agregar fuentes que excedan las 500,000 palabras o los 200MB.
+4. Estás bloqueado con los servicios de Google (LLMs, modelos de uso, etc.) sin opción de configurarlos.
+5. Fuentes de datos externas e integraciones de servicios limitadas.
+6. El agente de NotebookLM está específicamente optimizado solo para estudiar e investigar, pero puedes hacer mucho más con los datos de origen.
+7. Falta de soporte multijugador.
+
+...y más.
+
+**SurfSense está específicamente hecho para resolver estos problemas.** SurfSense te permite:
+
+- **Controla Tu Flujo de Datos** - Mantén tus datos privados y seguros.
+- **Sin Límites de Datos** - Agrega una cantidad ilimitada de fuentes y notebooks.
+- **Sin Dependencia de Proveedores** - Configura cualquier modelo LLM, de imagen, TTS y STT.
+- **25+ Fuentes de Datos Externas** - Agrega tus fuentes desde Google Drive, OneDrive, Dropbox, Notion y muchos otros servicios externos.
+- **Soporte Multijugador en Tiempo Real** - Trabaja fácilmente con los miembros de tu equipo en un notebook compartido.
+
+...y más por venir.
 
 
 
@@ -34,7 +53,7 @@ https://github.com/user-attachments/assets/cc0c84d3-1f2f-4f7a-b519-2ecce22310b1
 ## Ejemplo de Agente de Video
 
 
-https://github.com/user-attachments/assets/cc977e6d-8292-4ffe-abb8-3b0560ef5562
+https://github.com/user-attachments/assets/012a7ffa-6f76-4f06-9dda-7632b470057a
 
 
 
@@ -133,24 +152,29 @@ Para Docker Compose, instalación manual y otras opciones de despliegue, consult
 
    <p align="center"><img src="https://github.com/user-attachments/assets/3b04477d-8f42-4baa-be95-867c1eaeba87" alt="Comentarios en Tiempo Real" /></p>
 
-## Funcionalidades Principales
+## SurfSense vs Google NotebookLM
 
-| Funcionalidad | Descripción |
-|----------------|-------------|
-| Alternativa OSS | Reemplazo directo de NotebookLM, Perplexity y Glean con colaboración en equipo en tiempo real |
-| 50+ Formatos de Archivo | Sube documentos, imágenes, videos vía LlamaCloud, Unstructured o Docling (local) |
-| Búsqueda Híbrida | Semántica + Texto completo con Índices Jerárquicos y Reciprocal Rank Fusion |
-| Respuestas con Citas | Chatea con tu base de conocimiento y obtén respuestas citadas al estilo Perplexity |
-| Arquitectura de Agentes Profundos | Impulsado por [LangChain Deep Agents](https://docs.langchain.com/oss/python/deepagents/overview) con planificación, subagentes y acceso al sistema de archivos |
-| Soporte Universal de LLM | 100+ LLMs, 6000+ modelos de embeddings, todos los principales rerankers vía OpenAI spec y LiteLLM |
-| Privacidad Primero | Soporte completo de LLM local (vLLM, Ollama) tus datos son tuyos |
-| Colaboración en Equipo | RBAC con roles de Propietario / Admin / Editor / Visor, chat en tiempo real e hilos de comentarios |
-| Generación de Videos | Genera videos con narración y visuales |
-| Generación de Presentaciones | Crea presentaciones editables basadas en diapositivas |
-| Generación de Podcasts | Podcast de 3 min en menos de 20 segundos; múltiples proveedores TTS (OpenAI, Azure, Kokoro) |
-| Extensión de Navegador | Extensión multi-navegador para guardar cualquier página web, incluyendo páginas protegidas por autenticación |
-| 27+ Conectores | Motores de búsqueda, Google Drive, OneDrive, Dropbox, Slack, Teams, Jira, Notion, GitHub, Discord y [más](#fuentes-externas) |
-| Auto-Hospedable | Código abierto, Docker en un solo comando o Docker Compose completo para producción |
+| Característica | Google NotebookLM | SurfSense |
+|---------|-------------------|-----------|
+| **Fuentes por Notebook** | 50 (Gratis) a 600 (Ultra, $249.99/mes) | Ilimitadas |
+| **Número de Notebooks** | 100 (Gratis) a 500 (planes de pago) | Ilimitados |
+| **Límite de Tamaño de Fuente** | 500,000 palabras / 200MB por fuente | Sin límite |
+| **Precios** | Nivel gratuito disponible; Pro $19.99/mes, Ultra $249.99/mes | Gratuito y de código abierto, auto-hospedable en tu propia infra |
+| **Soporte de LLM** | Solo Google Gemini | 100+ LLMs vía OpenAI spec y LiteLLM |
+| **Modelos de Embeddings** | Solo Google | 6,000+ modelos de embeddings, todos los principales rerankers |
+| **LLMs Locales / Privados** | No disponible | Soporte completo (vLLM, Ollama) - tus datos son tuyos |
+| **Auto-Hospedable** | No | Sí - Docker en un solo comando o Docker Compose completo |
+| **Código Abierto** | No | Sí |
+| **Conectores Externos** | Google Drive, YouTube, sitios web | 27+ conectores - Motores de búsqueda, Google Drive, OneDrive, Dropbox, Slack, Teams, Jira, Notion, GitHub, Discord y [más](#fuentes-externas) |
+| **Soporte de Formatos de Archivo** | PDFs, Docs, Slides, Sheets, CSV, Word, EPUB, imágenes, URLs web, YouTube | 50+ formatos - documentos, imágenes, videos vía LlamaCloud, Unstructured o Docling (local) |
+| **Búsqueda** | Búsqueda semántica | Búsqueda Híbrida - Semántica + Texto completo con Índices Jerárquicos y Reciprocal Rank Fusion |
+| **Respuestas con Citas** | Sí | Sí - Respuestas citadas al estilo Perplexity |
+| **Arquitectura de Agentes** | No | Sí - impulsado por [LangChain Deep Agents](https://docs.langchain.com/oss/python/deepagents/overview) con planificación, subagentes y acceso al sistema de archivos |
+| **Multijugador en Tiempo Real** | Notebooks compartidos con roles de Visor/Editor (sin chat en tiempo real) | RBAC con roles de Propietario / Admin / Editor / Visor, chat en tiempo real e hilos de comentarios |
+| **Generación de Videos** | Resúmenes en video cinemáticos vía Veo 3 (solo Ultra) | Disponible (NotebookLM es mejor aquí, mejorando activamente) |
+| **Generación de Presentaciones** | Diapositivas más atractivas pero no editables | Crea presentaciones editables basadas en diapositivas |
+| **Generación de Podcasts** | Resúmenes de audio con hosts e idiomas personalizables | Disponible con múltiples proveedores TTS (NotebookLM es mejor aquí, mejorando activamente) |
+| **Extensión de Navegador** | No | Extensión multi-navegador para guardar cualquier página web, incluyendo páginas protegidas por autenticación |
 
 <details>
 <summary><b>Lista completa de Fuentes Externas</b></summary>
diff --git a/README.hi.md b/README.hi.md
index 011dbf5db..b49bddc72 100644
--- a/README.hi.md
+++ b/README.hi.md
@@ -21,9 +21,28 @@
 </div>
 
 # SurfSense
-किसी भी LLM को अपने आंतरिक ज्ञान स्रोतों से जोड़ें और अपनी टीम के साथ रीयल-टाइम में चैट करें। NotebookLM, Perplexity और Glean का ओपन सोर्स विकल्प।
 
-SurfSense एक अत्यधिक अनुकूलन योग्य AI शोध एजेंट है, जो बाहरी स्रोतों से जुड़ा है जैसे सर्च इंजन (SearxNG, Tavily, LinkUp), Google Drive, OneDrive, Dropbox, Slack, Microsoft Teams, Linear, Jira, ClickUp, Confluence, BookStack, Gmail, Notion, YouTube, GitHub, Discord, Airtable, Google Calendar, Luma, Circleback, Elasticsearch, Obsidian और भी बहुत कुछ आने वाला है।
+NotebookLM वहाँ उपलब्ध सबसे अच्छे और सबसे उपयोगी AI प्लेटफ़ॉर्म में से एक है, लेकिन जब आप इसे नियमित रूप से उपयोग करना शुरू करते हैं तो आप इसकी सीमाओं को भी महसूस करते हैं जो कुछ और की चाह छोड़ती हैं।
+
+1. एक notebook में जोड़े जा सकने वाले स्रोतों की मात्रा पर सीमाएं हैं।
+2. आपके पास कितने notebooks हो सकते हैं इस पर सीमाएं हैं।
+3. आप ऐसे स्रोत नहीं जोड़ सकते जो 500,000 शब्दों या 200MB से अधिक हों।
+4. आप Google सेवाओं (LLMs, उपयोग मॉडल, आदि) में बंद हैं और उन्हें कॉन्फ़िगर करने का कोई विकल्प नहीं है।
+5. सीमित बाहरी डेटा स्रोत और सेवा एकीकरण।
+6. NotebookLM एजेंट विशेष रूप से केवल अध्ययन और शोध के लिए अनुकूलित है, लेकिन आप स्रोत डेटा के साथ और भी बहुत कुछ कर सकते हैं।
+7. मल्टीप्लेयर सपोर्ट की कमी।
+
+...और भी बहुत कुछ।
+
+**SurfSense विशेष रूप से इन समस्याओं को हल करने के लिए बनाया गया है।** SurfSense आपको सक्षम बनाता है:
+
+- **अपने डेटा प्रवाह को नियंत्रित करें** - अपने डेटा को निजी और सुरक्षित रखें।
+- **कोई डेटा सीमा नहीं** - असीमित मात्रा में स्रोत और notebooks जोड़ें।
+- **कोई विक्रेता लॉक-इन नहीं** - किसी भी LLM, इमेज, TTS और STT मॉडल को कॉन्फ़िगर करें।
+- **25+ बाहरी डेटा स्रोत** - Google Drive, OneDrive, Dropbox, Notion और कई अन्य बाहरी सेवाओं से अपने स्रोत जोड़ें।
+- **रीयल-टाइम मल्टीप्लेयर सपोर्ट** - एक साझा notebook में अपनी टीम के सदस्यों के साथ आसानी से काम करें।
+
+...और भी बहुत कुछ आने वाला है।
 
 
 
@@ -34,7 +53,7 @@ https://github.com/user-attachments/assets/cc0c84d3-1f2f-4f7a-b519-2ecce22310b1
 ## वीडियो एजेंट नमूना
 
 
-https://github.com/user-attachments/assets/cc977e6d-8292-4ffe-abb8-3b0560ef5562
+https://github.com/user-attachments/assets/012a7ffa-6f76-4f06-9dda-7632b470057a
 
 
 
@@ -133,24 +152,29 @@ Docker Compose, मैनुअल इंस्टॉलेशन और अन
 
    <p align="center"><img src="https://github.com/user-attachments/assets/3b04477d-8f42-4baa-be95-867c1eaeba87" alt="रीयल-टाइम कमेंट्स" /></p>
 
-## प्रमुख विशेषताएं
+## SurfSense vs Google NotebookLM
 
-| विशेषता | विवरण |
-|----------|--------|
-| OSS विकल्प | रीयल-टाइम टीम सहयोग के साथ NotebookLM, Perplexity और Glean का सीधा प्रतिस्थापन |
-| 50+ फ़ाइल फ़ॉर्मेट | LlamaCloud, Unstructured या Docling (लोकल) के माध्यम से दस्तावेज़, चित्र, वीडियो अपलोड करें |
-| हाइब्रिड सर्च | हायरार्किकल इंडाइसेस और Reciprocal Rank Fusion के साथ सिमैंटिक + फुल टेक्स्ट सर्च |
-| उद्धृत उत्तर | अपने ज्ञान आधार के साथ चैट करें और Perplexity शैली के उद्धृत उत्तर पाएं |
-| डीप एजेंट आर्किटेक्चर | [LangChain Deep Agents](https://docs.langchain.com/oss/python/deepagents/overview) द्वारा संचालित, योजना, सब-एजेंट और फ़ाइल सिस्टम एक्सेस |
-| यूनिवर्सल LLM सपोर्ट | 100+ LLMs, 6000+ एम्बेडिंग मॉडल, सभी प्रमुख रीरैंकर्स OpenAI spec और LiteLLM के माध्यम से |
-| प्राइवेसी फर्स्ट | पूर्ण लोकल LLM सपोर्ट (vLLM, Ollama) आपका डेटा आपका रहता है |
-| टीम सहयोग | मालिक / एडमिन / संपादक / दर्शक भूमिकाओं के साथ RBAC, रीयल-टाइम चैट और कमेंट थ्रेड |
-| वीडियो जनरेशन | नैरेशन और विज़ुअल के साथ वीडियो बनाएं |
-| प्रेजेंटेशन जनरेशन | संपादन योग्य, स्लाइड आधारित प्रेजेंटेशन बनाएं |
-| पॉडकास्ट जनरेशन | 20 सेकंड से कम में 3 मिनट का पॉडकास्ट; कई TTS प्रदाता (OpenAI, Azure, Kokoro) |
-| ब्राउज़र एक्सटेंशन | किसी भी वेबपेज को सहेजने के लिए क्रॉस-ब्राउज़र एक्सटेंशन, प्रमाणीकरण सुरक्षित पेज सहित |
-| 27+ कनेक्टर्स | सर्च इंजन, Google Drive, OneDrive, Dropbox, Slack, Teams, Jira, Notion, GitHub, Discord और [अधिक](#बाहरी-स्रोत) |
-| सेल्फ-होस्ट करने योग्य | ओपन सोर्स, Docker एक कमांड या प्रोडक्शन के लिए पूर्ण Docker Compose |
+| विशेषता | Google NotebookLM | SurfSense |
+|---------|-------------------|-----------|
+| **प्रति Notebook स्रोत** | 50 (मुफ़्त) से 600 (Ultra, $249.99/माह) | असीमित |
+| **Notebooks की संख्या** | 100 (मुफ़्त) से 500 (सशुल्क योजनाएं) | असीमित |
+| **स्रोत आकार सीमा** | 500,000 शब्द / 200MB प्रति स्रोत | कोई सीमा नहीं |
+| **मूल्य निर्धारण** | मुफ़्त स्तर उपलब्ध; Pro $19.99/माह, Ultra $249.99/माह | मुफ़्त और ओपन सोर्स, अपनी इंफ्रा पर सेल्फ-होस्ट करें |
+| **LLM सपोर्ट** | केवल Google Gemini | 100+ LLMs OpenAI spec और LiteLLM के माध्यम से |
+| **एम्बेडिंग मॉडल** | केवल Google | 6,000+ एम्बेडिंग मॉडल, सभी प्रमुख रीरैंकर्स |
+| **लोकल / प्राइवेट LLMs** | उपलब्ध नहीं | पूर्ण सपोर्ट (vLLM, Ollama) - आपका डेटा आपका रहता है |
+| **सेल्फ-होस्ट करने योग्य** | नहीं | हाँ - Docker एक कमांड या पूर्ण Docker Compose |
+| **ओपन सोर्स** | नहीं | हाँ |
+| **बाहरी कनेक्टर्स** | Google Drive, YouTube, वेबसाइटें | 27+ कनेक्टर्स - सर्च इंजन, Google Drive, OneDrive, Dropbox, Slack, Teams, Jira, Notion, GitHub, Discord और [अधिक](#बाहरी-स्रोत) |
+| **फ़ाइल फ़ॉर्मेट सपोर्ट** | PDFs, Docs, Slides, Sheets, CSV, Word, EPUB, इमेज, वेब URLs, YouTube | 50+ फ़ॉर्मेट - दस्तावेज़, इमेज, वीडियो LlamaCloud, Unstructured या Docling (लोकल) के माध्यम से |
+| **सर्च** | सिमैंटिक सर्च | हाइब्रिड सर्च - हायरार्किकल इंडाइसेस और Reciprocal Rank Fusion के साथ सिमैंटिक + फुल टेक्स्ट |
+| **उद्धृत उत्तर** | हाँ | हाँ - Perplexity शैली के उद्धृत उत्तर |
+| **एजेंट आर्किटेक्चर** | नहीं | हाँ - [LangChain Deep Agents](https://docs.langchain.com/oss/python/deepagents/overview) द्वारा संचालित, योजना, सब-एजेंट और फ़ाइल सिस्टम एक्सेस |
+| **रीयल-टाइम मल्टीप्लेयर** | दर्शक/संपादक भूमिकाओं के साथ साझा notebooks (कोई रीयल-टाइम चैट नहीं) | मालिक / एडमिन / संपादक / दर्शक भूमिकाओं के साथ RBAC, रीयल-टाइम चैट और कमेंट थ्रेड |
+| **वीडियो जनरेशन** | Veo 3 के माध्यम से सिनेमैटिक वीडियो ओवरव्यू (केवल Ultra) | उपलब्ध (NotebookLM यहाँ बेहतर है, सक्रिय रूप से सुधार हो रहा है) |
+| **प्रेजेंटेशन जनरेशन** | बेहतर दिखने वाली स्लाइड्स लेकिन संपादन योग्य नहीं | संपादन योग्य, स्लाइड आधारित प्रेजेंटेशन बनाएं |
+| **पॉडकास्ट जनरेशन** | कस्टमाइज़ेबल होस्ट और भाषाओं के साथ ऑडियो ओवरव्यू | कई TTS प्रदाताओं के साथ उपलब्ध (NotebookLM यहाँ बेहतर है, सक्रिय रूप से सुधार हो रहा है) |
+| **ब्राउज़र एक्सटेंशन** | नहीं | किसी भी वेबपेज को सहेजने के लिए क्रॉस-ब्राउज़र एक्सटेंशन, प्रमाणीकरण सुरक्षित पेज सहित |
 
 <details>
 <summary><b>बाहरी स्रोतों की पूरी सूची</b></summary>
diff --git a/README.md b/README.md
index f007fd43c..12ea4912a 100644
--- a/README.md
+++ b/README.md
@@ -21,9 +21,28 @@
 </div>
 
 # SurfSense
-Connect any LLM to your internal knowledge sources and chat with it in real time alongside your team. OSS alternative to NotebookLM, Perplexity, and Glean.
 
-SurfSense is a highly customizable AI research agent, connected to external sources such as Search Engines (SearxNG, Tavily, LinkUp), Google Drive, OneDrive, Dropbox, Slack, Microsoft Teams, Linear, Jira, ClickUp, Confluence, BookStack, Gmail, Notion, YouTube, GitHub, Discord, Airtable, Google Calendar, Luma, Circleback, Elasticsearch, Obsidian and more to come.
+NotebookLM is one of the best and most useful AI platforms out there, but once you start using it regularly, you also run into limitations that leave something to be desired.
+
+1. There are limits on the number of sources you can add to a notebook.
+2. There are limits on the number of notebooks you can have.
+3. You cannot add sources that exceed 500,000 words or 200MB.
+4. You are locked in to Google's services (LLMs, usage models, etc.) with no option to configure them.
+5. Limited external data sources and service integrations.
+6. The NotebookLM agent is optimized only for studying and researching, but you can do so much more with the source data.
+7. Lack of multiplayer support.
+
+...and more.
+
+**SurfSense is specifically made to solve these problems.** SurfSense empowers you to:
+
+- **Control Your Data Flow** - Keep your data private and secure.
+- **No Data Limits** - Add an unlimited number of sources and notebooks.
+- **No Vendor Lock-in** - Configure any LLM, image, TTS, or STT model you want to use.
+- **25+ External Data Sources** - Add your sources from Google Drive, OneDrive, Dropbox, Notion, and many other external services.
+- **Real-Time Multiplayer Support** - Work easily with your team members in a shared notebook.
+
+...and more to come.
 
 
 
@@ -134,24 +153,29 @@ For Docker Compose, manual installation, and other deployment options, see the [
 
    <p align="center"><img src="https://github.com/user-attachments/assets/3b04477d-8f42-4baa-be95-867c1eaeba87" alt="Realtime Comments" /></p>
 
-## Key Features
+## SurfSense vs Google NotebookLM
 
-| Feature | Description |
-|---------|-------------|
-| OSS Alternative | Drop in replacement for NotebookLM, Perplexity, and Glean with real time team collaboration |
-| 50+ File Formats | Upload documents, images, videos via LlamaCloud, Unstructured, or Docling (local) |
-| Hybrid Search | Semantic + Full Text Search with Hierarchical Indices and Reciprocal Rank Fusion |
-| Cited Answers | Chat with your knowledge base and get Perplexity style cited responses |
-| Deep Agent Architecture | Powered by [LangChain Deep Agents](https://docs.langchain.com/oss/python/deepagents/overview) planning, subagents, and file system access |
-| Universal LLM Support | 100+ LLMs, 6000+ embedding models, all major rerankers via OpenAI spec & LiteLLM |
-| Privacy First | Full local LLM support (vLLM, Ollama) your data stays yours |
-| Team Collaboration | RBAC with Owner / Admin / Editor / Viewer roles, real time chat & comment threads |
-| Video Generation | Generate videos with narration and visuals |
-| Presentation Generation | Create editable, slide based presentations |
-| Podcast Generation | 3 min podcast in under 20 seconds; multiple TTS providers (OpenAI, Azure, Kokoro) |
-| Browser Extension | Cross browser extension to save any webpage, including auth protected pages |
-| 27+ Connectors | Search Engines, Google Drive, OneDrive, Dropbox, Slack, Teams, Jira, Notion, GitHub, Discord & [more](#external-sources) |
-| Self Hostable | Open source, Docker one liner or full Docker Compose for production |
+| Feature | Google NotebookLM | SurfSense |
+|---------|-------------------|-----------|
+| **Sources per Notebook** | 50 (Free) to 600 (Ultra, $249.99/mo) | Unlimited |
+| **Number of Notebooks** | 100 (Free) to 500 (paid tiers) | Unlimited |
+| **Source Size Limit** | 500,000 words / 200MB per source | No limit |
+| **Pricing** | Free tier available; Pro $19.99/mo, Ultra $249.99/mo | Free and open source, self-host on your own infra |
+| **LLM Support** | Google Gemini only | 100+ LLMs via OpenAI spec & LiteLLM |
+| **Embedding Models** | Google only | 6,000+ embedding models, all major rerankers |
+| **Local / Private LLMs** | Not available | Full support (vLLM, Ollama) - your data stays yours |
+| **Self Hostable** | No | Yes - Docker one-liner or full Docker Compose |
+| **Open Source** | No | Yes |
+| **External Connectors** | Google Drive, YouTube, websites | 27+ connectors - Search Engines, Google Drive, OneDrive, Dropbox, Slack, Teams, Jira, Notion, GitHub, Discord & [more](#external-sources) |
+| **File Format Support** | PDFs, Docs, Slides, Sheets, CSV, Word, EPUB, images, web URLs, YouTube | 50+ formats - documents, images, videos via LlamaCloud, Unstructured, or Docling (local) |
+| **Search** | Semantic search | Hybrid Search - Semantic + Full Text with Hierarchical Indices & Reciprocal Rank Fusion |
+| **Cited Answers** | Yes | Yes - Perplexity-style cited responses |
+| **Agentic Architecture** | No | Yes - powered by [LangChain Deep Agents](https://docs.langchain.com/oss/python/deepagents/overview) with planning, subagents, and file system access |
+| **Real-Time Multiplayer** | Shared notebooks with Viewer/Editor roles (no real-time chat) | RBAC with Owner / Admin / Editor / Viewer roles, real-time chat & comment threads |
+| **Video Generation** | Cinematic Video Overviews via Veo 3 (Ultra only) | Available (NotebookLM is better here, actively improving) |
+| **Presentation Generation** | Better-looking slides, but not editable | Create editable, slide-based presentations |
+| **Podcast Generation** | Audio Overviews with customizable hosts and languages | Available with multiple TTS providers (NotebookLM is better here, actively improving) |
+| **Browser Extension** | No | Cross-browser extension to save any webpage, including auth-protected pages |
 
 <details>
 <summary><b>Full list of External Sources</b></summary>
diff --git a/README.pt-BR.md b/README.pt-BR.md
index 4306b0767..50a8b739e 100644
--- a/README.pt-BR.md
+++ b/README.pt-BR.md
@@ -21,9 +21,28 @@
 </div>
 
 # SurfSense
-Conecte qualquer LLM às suas fontes de conhecimento internas e converse com ele em tempo real junto com sua equipe. Alternativa de código aberto ao NotebookLM, Perplexity e Glean.
 
-SurfSense é um agente de pesquisa de IA altamente personalizável, conectado a fontes externas como mecanismos de busca (SearxNG, Tavily, LinkUp), Google Drive, OneDrive, Dropbox, Slack, Microsoft Teams, Linear, Jira, ClickUp, Confluence, BookStack, Gmail, Notion, YouTube, GitHub, Discord, Airtable, Google Calendar, Luma, Circleback, Elasticsearch, Obsidian e mais por vir.
+O NotebookLM é uma das melhores e mais úteis plataformas de IA disponíveis, mas, quando você começa a usá-lo regularmente, também percebe que suas limitações deixam algo a desejar.
+
+1. Há limites na quantidade de fontes que você pode adicionar em um notebook.
+2. Há limites no número de notebooks que você pode ter.
+3. Você não pode ter fontes que excedam 500.000 palavras ou 200MB.
+4. Você fica preso aos serviços do Google (LLMs, modelos de uso, etc.) sem opção de configurá-los.
+5. Fontes de dados externas e integrações de serviços limitadas.
+6. O agente do NotebookLM é especificamente otimizado apenas para estudar e pesquisar, mas você pode fazer muito mais com os dados de origem.
+7. Falta de suporte multiplayer.
+
+...e mais.
+
+**O SurfSense foi feito especificamente para resolver esses problemas.** O SurfSense permite que você:
+
+- **Controle Seu Fluxo de Dados** - Mantenha seus dados privados e seguros.
+- **Sem Limites de Dados** - Adicione uma quantidade ilimitada de fontes e notebooks.
+- **Sem Dependência de Fornecedor** - Configure qualquer modelo LLM, de imagem, TTS e STT.
+- **27+ Fontes de Dados Externas** - Adicione suas fontes do Google Drive, OneDrive, Dropbox, Notion e muitos outros serviços externos.
+- **Suporte Multiplayer em Tempo Real** - Trabalhe facilmente com os membros da sua equipe em um notebook compartilhado.
+
+...e mais por vir.
 
 
 
@@ -34,7 +53,7 @@ https://github.com/user-attachments/assets/cc0c84d3-1f2f-4f7a-b519-2ecce22310b1
 ## Exemplo de Agente de Vídeo
 
 
-https://github.com/user-attachments/assets/cc977e6d-8292-4ffe-abb8-3b0560ef5562
+https://github.com/user-attachments/assets/012a7ffa-6f76-4f06-9dda-7632b470057a
 
 
 
@@ -133,24 +152,29 @@ Para Docker Compose, instalação manual e outras opções de implantação, con
 
    <p align="center"><img src="https://github.com/user-attachments/assets/3b04477d-8f42-4baa-be95-867c1eaeba87" alt="Comentários em Tempo Real" /></p>
 
-## Funcionalidades Principais
+## SurfSense vs Google NotebookLM
 
-| Funcionalidade | Descrição |
-|----------------|-----------|
-| Alternativa OSS | Substituto direto do NotebookLM, Perplexity e Glean com colaboração em equipe em tempo real |
-| 50+ Formatos de Arquivo | Faça upload de documentos, imagens, vídeos via LlamaCloud, Unstructured ou Docling (local) |
-| Busca Híbrida | Semântica + Texto completo com Índices Hierárquicos e Reciprocal Rank Fusion |
-| Respostas com Citações | Converse com sua base de conhecimento e obtenha respostas citadas no estilo Perplexity |
-| Arquitetura de Agentes Profundos | Alimentado por [LangChain Deep Agents](https://docs.langchain.com/oss/python/deepagents/overview) com planejamento, subagentes e acesso ao sistema de arquivos |
-| Suporte Universal de LLM | 100+ LLMs, 6000+ modelos de embeddings, todos os principais rerankers via OpenAI spec e LiteLLM |
-| Privacidade em Primeiro Lugar | Suporte completo a LLM local (vLLM, Ollama) seus dados ficam com você |
-| Colaboração em Equipe | RBAC com papéis de Proprietário / Admin / Editor / Visualizador, chat em tempo real e threads de comentários |
-| Geração de Vídeos | Gera vídeos com narração e visuais |
-| Geração de Apresentações | Cria apresentações editáveis baseadas em slides |
-| Geração de Podcasts | Podcast de 3 min em menos de 20 segundos; múltiplos provedores TTS (OpenAI, Azure, Kokoro) |
-| Extensão de Navegador | Extensão multi-navegador para salvar qualquer página web, incluindo páginas protegidas por autenticação |
-| 27+ Conectores | Mecanismos de busca, Google Drive, OneDrive, Dropbox, Slack, Teams, Jira, Notion, GitHub, Discord e [mais](#fontes-externas) |
-| Auto-Hospedável | Código aberto, Docker em um único comando ou Docker Compose completo para produção |
+| Recurso | Google NotebookLM | SurfSense |
+|---------|-------------------|-----------|
+| **Fontes por Notebook** | 50 (Grátis) a 600 (Ultra, $249.99/mês) | Ilimitadas |
+| **Número de Notebooks** | 100 (Grátis) a 500 (planos pagos) | Ilimitados |
+| **Limite de Tamanho da Fonte** | 500.000 palavras / 200MB por fonte | Sem limite |
+| **Preços** | Nível gratuito disponível; Pro $19.99/mês, Ultra $249.99/mês | Gratuito e de código aberto, auto-hospedável na sua própria infra |
+| **Suporte a LLM** | Apenas Google Gemini | 100+ LLMs via OpenAI spec e LiteLLM |
+| **Modelos de Embeddings** | Apenas Google | 6.000+ modelos de embeddings, todos os principais rerankers |
+| **LLMs Locais / Privados** | Não disponível | Suporte completo (vLLM, Ollama) - seus dados ficam com você |
+| **Auto-Hospedável** | Não | Sim - Docker em um único comando ou Docker Compose completo |
+| **Código Aberto** | Não | Sim |
+| **Conectores Externos** | Google Drive, YouTube, sites | 27+ conectores - Mecanismos de busca, Google Drive, OneDrive, Dropbox, Slack, Teams, Jira, Notion, GitHub, Discord e [mais](#fontes-externas) |
+| **Suporte a Formatos de Arquivo** | PDFs, Docs, Slides, Sheets, CSV, Word, EPUB, imagens, URLs web, YouTube | 50+ formatos - documentos, imagens, vídeos via LlamaCloud, Unstructured ou Docling (local) |
+| **Busca** | Busca semântica | Busca Híbrida - Semântica + Texto completo com Índices Hierárquicos e Reciprocal Rank Fusion |
+| **Respostas com Citações** | Sim | Sim - Respostas citadas no estilo Perplexity |
+| **Arquitetura de Agentes** | Não | Sim - alimentado por [LangChain Deep Agents](https://docs.langchain.com/oss/python/deepagents/overview) com planejamento, subagentes e acesso ao sistema de arquivos |
+| **Multiplayer em Tempo Real** | Notebooks compartilhados com papéis de Visualizador/Editor (sem chat em tempo real) | RBAC com papéis de Proprietário / Admin / Editor / Visualizador, chat em tempo real e threads de comentários |
+| **Geração de Vídeos** | Visões gerais cinemáticas via Veo 3 (apenas Ultra) | Disponível (o NotebookLM ainda é melhor aqui; o SurfSense está melhorando ativamente) |
+| **Geração de Apresentações** | Slides mais bonitos, mas não editáveis | Cria apresentações editáveis baseadas em slides |
+| **Geração de Podcasts** | Visões gerais em áudio com hosts e idiomas personalizáveis | Disponível com múltiplos provedores TTS (o NotebookLM ainda é melhor aqui; o SurfSense está melhorando ativamente) |
+| **Extensão de Navegador** | Não | Extensão multi-navegador para salvar qualquer página web, incluindo páginas protegidas por autenticação |
 
 <details>
 <summary><b>Lista completa de Fontes Externas</b></summary>
diff --git a/README.zh-CN.md b/README.zh-CN.md
index 96ebb25ad..419a831ae 100644
--- a/README.zh-CN.md
+++ b/README.zh-CN.md
@@ -21,9 +21,28 @@
 </div>
 
 # SurfSense
-将任何 LLM 连接到您的内部知识源，并与团队成员实时聊天。NotebookLM、Perplexity 和 Glean 的开源替代方案。
 
-SurfSense 是一个高度可定制的 AI 研究助手，可以连接外部数据源，如搜索引擎（SearxNG、Tavily、LinkUp）、Google Drive、OneDrive、Dropbox、Slack、Microsoft Teams、Linear、Jira、ClickUp、Confluence、BookStack、Gmail、Notion、YouTube、GitHub、Discord、Airtable、Google Calendar、Luma、Circleback、Elasticsearch、Obsidian 等，未来还会支持更多。
+NotebookLM 是目前最好、最实用的 AI 平台之一，但当你开始经常使用它时，你也会感受到它的局限性，总觉得还有不足之处。
+
+1. 一个笔记本中可以添加的来源数量有限制。
+2. 可以拥有的笔记本数量有限制。
+3. 单个来源不能超过 500,000 个单词或 200MB。
+4. 你被锁定在 Google 服务中（LLM、使用模型等），没有配置选项。
+5. 有限的外部数据源和服务集成。
+6. NotebookLM 代理专门针对学习和研究进行了优化，但你可以用源数据做更多事情。
+7. 缺乏多人协作支持。
+
+...还有更多。
+
+**SurfSense 正是为了解决这些问题而生。** SurfSense 赋予你：
+
+- **控制你的数据流** - 保持数据私密和安全。
+- **无数据限制** - 添加无限数量的来源和笔记本。
+- **无供应商锁定** - 配置任何 LLM、图像、TTS 和 STT 模型。
+- **27+ 外部数据源** - 从 Google Drive、OneDrive、Dropbox、Notion 和许多其他外部服务添加你的来源。
+- **实时多人协作支持** - 在共享笔记本中轻松与团队成员协作。
+
+...更多功能即将推出。
 
 
 
@@ -34,7 +53,7 @@ https://github.com/user-attachments/assets/cc0c84d3-1f2f-4f7a-b519-2ecce22310b1
 ## 视频代理示例
 
 
-https://github.com/user-attachments/assets/cc977e6d-8292-4ffe-abb8-3b0560ef5562
+https://github.com/user-attachments/assets/012a7ffa-6f76-4f06-9dda-7632b470057a
 
 
 
@@ -133,24 +152,29 @@ irm https://raw.githubusercontent.com/MODSetter/SurfSense/main/docker/scripts/in
 
    <p align="center"><img src="https://github.com/user-attachments/assets/3b04477d-8f42-4baa-be95-867c1eaeba87" alt="实时评论" /></p>
 
-## 核心功能
+## SurfSense vs Google NotebookLM
 
-| 功能 | 描述 |
-|------|------|
-| 开源替代方案 | 支持实时团队协作的 NotebookLM、Perplexity 和 Glean 替代品 |
-| 50+ 文件格式 | 通过 LlamaCloud、Unstructured 或 Docling（本地）上传文档、图像、视频 |
-| 混合搜索 | 语义搜索 + 全文搜索，结合层次化索引和倒数排名融合 |
-| 引用回答 | 与知识库对话，获得 Perplexity 风格的引用回答 |
-| 深度代理架构 | 基于 [LangChain Deep Agents](https://docs.langchain.com/oss/python/deepagents/overview) 构建，支持规划、子代理和文件系统访问 |
-| 通用 LLM 支持 | 100+ LLM、6000+ 嵌入模型、所有主流重排序器，通过 OpenAI spec 和 LiteLLM |
-| 隐私优先 | 完整本地 LLM 支持（vLLM、Ollama），您的数据由您掌控 |
-| 团队协作 | RBAC 角色控制（所有者/管理员/编辑者/查看者），实时聊天和评论线程 |
-| 视频生成 | 生成带有旁白和视觉效果的视频 |
-| 演示文稿生成 | 创建可编辑的幻灯片式演示文稿 |
-| 播客生成 | 20 秒内生成 3 分钟播客；多种 TTS 提供商（OpenAI、Azure、Kokoro） |
-| 浏览器扩展 | 跨浏览器扩展，保存任何网页，包括需要身份验证的页面 |
-| 27+ 连接器 | 搜索引擎、Google Drive、OneDrive、Dropbox、Slack、Teams、Jira、Notion、GitHub、Discord 等[更多](#外部数据源) |
-| 可自托管 | 开源，Docker 一行命令或完整 Docker Compose 用于生产环境 |
+| 功能 | Google NotebookLM | SurfSense |
+|---------|-------------------|-----------|
+| **每个笔记本的来源数** | 50（免费）到 600（Ultra，$249.99/月） | 无限制 |
+| **笔记本数量** | 100（免费）到 500（付费方案） | 无限制 |
+| **来源大小限制** | 500,000 词 / 200MB 每个来源 | 无限制 |
+| **定价** | 免费版可用；Pro $19.99/月，Ultra $249.99/月 | 免费开源，在自己的基础设施上自托管 |
+| **LLM 支持** | 仅 Google Gemini | 100+ LLM，通过 OpenAI spec 和 LiteLLM |
+| **嵌入模型** | 仅 Google | 6,000+ 嵌入模型，所有主流重排序器 |
+| **本地 / 私有 LLM** | 不可用 | 完整支持（vLLM、Ollama）- 您的数据由您掌控 |
+| **可自托管** | 否 | 是 - Docker 一行命令或完整 Docker Compose |
+| **开源** | 否 | 是 |
+| **外部连接器** | Google Drive、YouTube、网站 | 27+ 连接器 - 搜索引擎、Google Drive、OneDrive、Dropbox、Slack、Teams、Jira、Notion、GitHub、Discord 等[更多](#外部数据源) |
+| **文件格式支持** | PDF、Docs、Slides、Sheets、CSV、Word、EPUB、图像、网页 URL、YouTube | 50+ 格式 - 文档、图像、视频，通过 LlamaCloud、Unstructured 或 Docling（本地） |
+| **搜索** | 语义搜索 | 混合搜索 - 语义 + 全文搜索，结合层次化索引和倒数排名融合 |
+| **引用回答** | 是 | 是 - Perplexity 风格的引用回答 |
+| **代理架构** | 否 | 是 - 基于 [LangChain Deep Agents](https://docs.langchain.com/oss/python/deepagents/overview) 构建，支持规划、子代理和文件系统访问 |
+| **实时多人协作** | 共享笔记本，支持查看者/编辑者角色（无实时聊天） | RBAC 角色控制（所有者/管理员/编辑者/查看者），实时聊天和评论线程 |
+| **视频生成** | 通过 Veo 3 的电影级视频概览（仅 Ultra） | 可用（NotebookLM 目前在此方面更好，SurfSense 正在积极改进） |
+| **演示文稿生成** | 更美观的幻灯片但不可编辑 | 创建可编辑的幻灯片式演示文稿 |
+| **播客生成** | 可自定义主持人和语言的音频概览 | 可用，支持多种 TTS 提供商（NotebookLM 目前在此方面更好，SurfSense 正在积极改进） |
+| **浏览器扩展** | 否 | 跨浏览器扩展，保存任何网页，包括需要身份验证的页面 |
 
 <details>
 <summary><b>外部数据源完整列表</b></summary>

From e13ca675d97c7308ed77b754fdcc97afc393dd59 Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Thu, 2 Apr 2026 20:26:34 -0700
Subject: [PATCH 066/202] chore: optimize zero publication column migration
 process

- Updated migration instructions: stop zero-cache before running the migration, then reset its data volume and restart it afterwards.
- Added a function to terminate backends holding locks that would block the migration.
- Set a lock timeout so lock waits abort after 10s instead of hanging indefinitely.
---
 ..._optimize_zero_publication_column_lists.py | 29 ++++++++++++++++---
 1 file changed, 25 insertions(+), 4 deletions(-)

diff --git a/surfsense_backend/alembic/versions/117_optimize_zero_publication_column_lists.py b/surfsense_backend/alembic/versions/117_optimize_zero_publication_column_lists.py
index 3c2d34c76..78a26a381 100644
--- a/surfsense_backend/alembic/versions/117_optimize_zero_publication_column_lists.py
+++ b/surfsense_backend/alembic/versions/117_optimize_zero_publication_column_lists.py
@@ -11,10 +11,11 @@ to FULL for the old Electric SQL setup (migration 66/75/76).
 With DEFAULT (primary-key) identity, column-list publications
 only need to include the PK — not every column.
 
-After running this migration you MUST:
-  1. Stop zero-cache
-  2. Delete / reset the zero-cache data volume
-  3. Restart zero-cache  (it will do a fresh initial sync)
+IMPORTANT — follow these steps in order (zero-cache must be stopped BEFORE migrating):
+  1. Stop zero-cache  (it holds replication locks that will deadlock DDL)
+  2. Run:  alembic upgrade head
+  3. Delete / reset the zero-cache data volume
+  4. Restart zero-cache  (it will do a fresh initial sync)
 
 Revision ID: 117
 Revises: 116
@@ -62,9 +63,29 @@ CREATE PUBLICATION {PUBLICATION_NAME} FOR TABLE
 """
 
 
+def _terminate_blocked_pids(conn, table: str) -> None:
+    """Kill backends whose locks on *table* would block our AccessExclusiveLock."""
+    conn.execute(
+        sa.text(
+            "SELECT pg_terminate_backend(l.pid) "
+            "FROM pg_locks l "
+            "JOIN pg_class c ON c.oid = l.relation "
+            "WHERE c.relname = :tbl "
+            "  AND l.pid != pg_backend_pid()"
+        ),
+        {"tbl": table},
+    )
+
+
 def upgrade() -> None:
     conn = op.get_bind()
 
+    conn.execute(sa.text("SET lock_timeout = '10s'"))
+
+    for tbl in sorted(TABLES_WITH_FULL_IDENTITY):
+        _terminate_blocked_pids(conn, tbl)
+        conn.execute(sa.text(f'LOCK TABLE "{tbl}" IN ACCESS EXCLUSIVE MODE'))
+
     for tbl in TABLES_WITH_FULL_IDENTITY:
         conn.execute(sa.text(f'ALTER TABLE "{tbl}" REPLICA IDENTITY DEFAULT'))
 

From 6b06d3abb1ce5674339db4d18d52a49f5cc9eb76 Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Thu, 2 Apr 2026 20:38:10 -0700
Subject: [PATCH 067/202] chore: optimize zero publication column migration
 process

- Updated migration instructions: stop zero-cache before running the migration, then reset its data volume and restart it afterwards.
- Added a function to terminate backends holding locks that would block the migration.
- Set a lock timeout so lock waits abort after 10s instead of hanging indefinitely.
---
 ..._optimize_zero_publication_column_lists.py | 29 ++++++++++++++++---
 1 file changed, 25 insertions(+), 4 deletions(-)

diff --git a/surfsense_backend/alembic/versions/117_optimize_zero_publication_column_lists.py b/surfsense_backend/alembic/versions/117_optimize_zero_publication_column_lists.py
index 3c2d34c76..78a26a381 100644
--- a/surfsense_backend/alembic/versions/117_optimize_zero_publication_column_lists.py
+++ b/surfsense_backend/alembic/versions/117_optimize_zero_publication_column_lists.py
@@ -11,10 +11,11 @@ to FULL for the old Electric SQL setup (migration 66/75/76).
 With DEFAULT (primary-key) identity, column-list publications
 only need to include the PK — not every column.
 
-After running this migration you MUST:
-  1. Stop zero-cache
-  2. Delete / reset the zero-cache data volume
-  3. Restart zero-cache  (it will do a fresh initial sync)
+IMPORTANT — follow these steps in order (zero-cache must be stopped BEFORE migrating):
+  1. Stop zero-cache  (it holds replication locks that will deadlock DDL)
+  2. Run:  alembic upgrade head
+  3. Delete / reset the zero-cache data volume
+  4. Restart zero-cache  (it will do a fresh initial sync)
 
 Revision ID: 117
 Revises: 116
@@ -62,9 +63,29 @@ CREATE PUBLICATION {PUBLICATION_NAME} FOR TABLE
 """
 
 
+def _terminate_blocked_pids(conn, table: str) -> None:
+    """Kill backends whose locks on *table* would block our AccessExclusiveLock."""
+    conn.execute(
+        sa.text(
+            "SELECT pg_terminate_backend(l.pid) "
+            "FROM pg_locks l "
+            "JOIN pg_class c ON c.oid = l.relation "
+            "WHERE c.relname = :tbl "
+            "  AND l.pid != pg_backend_pid()"
+        ),
+        {"tbl": table},
+    )
+
+
 def upgrade() -> None:
     conn = op.get_bind()
 
+    conn.execute(sa.text("SET lock_timeout = '10s'"))
+
+    for tbl in sorted(TABLES_WITH_FULL_IDENTITY):
+        _terminate_blocked_pids(conn, tbl)
+        conn.execute(sa.text(f'LOCK TABLE "{tbl}" IN ACCESS EXCLUSIVE MODE'))
+
     for tbl in TABLES_WITH_FULL_IDENTITY:
         conn.execute(sa.text(f'ALTER TABLE "{tbl}" REPLICA IDENTITY DEFAULT'))
 

From 9a65163fe4d89d35e6891015c1b46b555f11f321 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 09:20:44 +0530
Subject: [PATCH 068/202] feat: improve DocumentUploadTab UI with updated
 styles, enhanced file size limit messages

---
 .../components/sources/DocumentUploadTab.tsx  | 89 ++++++++++---------
 surfsense_web/messages/en.json                |  4 +-
 surfsense_web/messages/es.json                |  4 +-
 surfsense_web/messages/hi.json                |  4 +-
 surfsense_web/messages/pt.json                |  4 +-
 surfsense_web/messages/zh.json                |  4 +-
 6 files changed, 55 insertions(+), 54 deletions(-)

diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index 7176afae5..9a32e5a59 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { useAtom } from "jotai";
-import { CheckCircle2, ChevronDown, File as FileIcon, FileType, FolderOpen, Plus, Upload, X } from "lucide-react";
+import { ChevronDown, Dot, File as FileIcon, FolderOpen, Upload, X } from "lucide-react";
 
 import { useTranslations } from "next-intl";
 import { useCallback, useMemo, useRef, useState } from "react";
@@ -22,7 +22,6 @@ import {
 	DropdownMenuItem,
 	DropdownMenuTrigger,
 } from "@/components/ui/dropdown-menu";
-import { Label } from "@/components/ui/label";
 import { Progress } from "@/components/ui/progress";
 import { Spinner } from "@/components/ui/spinner";
 import { Switch } from "@/components/ui/switch";
@@ -362,12 +361,12 @@ export function DocumentUploadTab({
 			return (
 				<DropdownMenu>
 					<DropdownMenuTrigger asChild onClick={(e) => e.stopPropagation()}>
-						<Button variant="secondary" size="sm" className={`text-xs gap-1 ${sizeClass} ${widthClass}`}>
+						<Button variant="ghost" size="sm" className={`text-xs gap-1 bg-neutral-700/50 hover:bg-neutral-600/50 ${sizeClass} ${widthClass}`}>
 							Browse
 							<ChevronDown className="h-3 w-3 opacity-60" />
 						</Button>
 					</DropdownMenuTrigger>
-					<DropdownMenuContent align="center" onClick={(e) => e.stopPropagation()}>
+					<DropdownMenuContent align="center" className="dark:bg-neutral-800" onClick={(e) => e.stopPropagation()}>
 						<DropdownMenuItem onClick={handleBrowseFiles}>
 							<FileIcon className="h-4 w-4 mr-2" />
 							Files
@@ -416,32 +415,31 @@ export function DocumentUploadTab({
 								{renderBrowseButton({ compact: true, fullWidth: true })}
 							</div>
 						) : (
-							<Button
-								variant="outline"
-								size="sm"
-								className="w-full text-xs h-8 gap-1.5 border-dashed border-muted-foreground/30"
+							<button
+								type="button"
+								className="w-full text-xs h-8 flex items-center justify-center gap-1.5 rounded-md border border-dashed border-muted-foreground/30 text-muted-foreground hover:text-foreground hover:border-foreground/50 transition-colors"
 								onClick={() => fileInputRef.current?.click()}
 							>
-								<Plus className="h-3.5 w-3.5" />
 								Add more files
-							</Button>
+							</button>
 						)
 					)
 				) : (
 					<div
-						className="flex flex-col items-center gap-3 py-6 px-4 cursor-pointer"
+						className="flex flex-col items-center gap-4 py-12 px-4 cursor-pointer"
 						onClick={() => {
 							if (!isElectron) fileInputRef.current?.click();
 						}}
 					>
-						<Upload className="h-7 w-7 text-muted-foreground" />
-						<div className="text-center space-y-1">
-							<p className="text-sm font-medium">
+						<Upload className="h-10 w-10 text-muted-foreground" />
+						<div className="text-center space-y-1.5">
+							<p className="text-base font-medium">
 								{isElectron ? "Select files or folder" : "Tap to select files"}
 							</p>
-							<p className="text-xs text-muted-foreground">
-								{t("file_size_limit")}{" "}
-								{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}
+							<p className="text-sm text-muted-foreground inline-flex items-center flex-wrap justify-center">
+								<span>{t("file_size_limit")}</span>
+								<Dot className="h-4 w-4 shrink-0" />
+								<span>{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}</span>
 							</p>
 						</div>
 						{isElectron && (
@@ -491,9 +489,10 @@ export function DocumentUploadTab({
 					<div className="flex flex-col items-center gap-2">
 						<Upload className="h-8 w-8 text-muted-foreground" />
 						<p className="text-sm font-medium">{t("drag_drop")}</p>
-						<p className="text-xs text-muted-foreground text-center">
-							{t("file_size_limit")}{" "}
-							{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}
+						<p className="text-xs text-muted-foreground text-center inline-flex items-center flex-wrap justify-center">
+							<span>{t("file_size_limit")}</span>
+							<Dot className="h-4 w-4 shrink-0" />
+							<span>{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}</span>
 						</p>
 						<div className="mt-1">{renderBrowseButton()}</div>
 					</div>
@@ -520,28 +519,29 @@ export function DocumentUploadTab({
 						</Button>
 					</div>
 
-					<div className={toggleRowClass}>
-						<Label htmlFor="watch-folder-toggle" className="flex flex-col gap-0.5 cursor-pointer">
-							<span className="text-sm font-medium">Watch folder</span>
-							<span className="text-xs text-muted-foreground font-normal">
-								Auto-sync when files change
-							</span>
-						</Label>
-						<Switch
-							id="watch-folder-toggle"
-							checked={watchFolder}
-							onCheckedChange={setWatchFolder}
-						/>
-					</div>
-
-					<div className={toggleRowClass}>
-						<div className="space-y-0.5">
-							<p className="font-medium text-sm">Enable AI Summary</p>
-							<p className="text-xs text-muted-foreground">
-								Improves search quality but adds latency
-							</p>
+					<div className="rounded-lg bg-slate-400/5 dark:bg-white/5 divide-y divide-border">
+						<div className="flex items-center justify-between p-3">
+							<div className="space-y-0.5">
+								<p className="font-medium text-sm">Watch folder</p>
+								<p className="text-xs text-muted-foreground">
+									Auto-sync when files change
+								</p>
+							</div>
+							<Switch
+								id="watch-folder-toggle"
+								checked={watchFolder}
+								onCheckedChange={setWatchFolder}
+							/>
+						</div>
+						<div className="flex items-center justify-between p-3">
+							<div className="space-y-0.5">
+								<p className="font-medium text-sm">Enable AI Summary</p>
+								<p className="text-xs text-muted-foreground">
+									Improves search quality but adds latency
+								</p>
+							</div>
+							<Switch checked={shouldSummarize} onCheckedChange={setShouldSummarize} />
 						</div>
-						<Switch checked={shouldSummarize} onCheckedChange={setShouldSummarize} />
 					</div>
 
 					<Button
@@ -585,7 +585,9 @@ export function DocumentUploadTab({
 								key={entry.id}
 								className="flex items-center gap-2 py-1.5 px-2 rounded-md hover:bg-slate-400/5 dark:hover:bg-white/5 group"
 							>
-								<FileType className="h-4 w-4 text-muted-foreground shrink-0" />
+								<span className="text-[10px] font-medium uppercase leading-none bg-muted px-1.5 py-0.5 rounded text-muted-foreground shrink-0">
+									{entry.file.name.split(".").pop() || "?"}
+								</span>
 								<span className="text-sm truncate flex-1 min-w-0">{entry.file.name}</span>
 								<span className="text-xs text-muted-foreground shrink-0">
 									{formatFileSize(entry.file.size)}
@@ -635,7 +637,6 @@ export function DocumentUploadTab({
 							</span>
 						) : (
 							<span className="flex items-center gap-2">
-								<CheckCircle2 className="h-4 w-4" />
 								{t("upload_button", { count: files.length })}
 							</span>
 						)}
@@ -649,7 +650,7 @@ export function DocumentUploadTab({
 				collapsible
 				value={accordionValue}
 				onValueChange={handleAccordionChange}
-				className="w-full"
+				className="w-full mt-5"
 			>
 				<AccordionItem value="supported-file-types" className="border border-border rounded-lg">
 					<AccordionTrigger className="px-3 py-2.5 hover:no-underline !items-center [&>svg]:!translate-y-0">
diff --git a/surfsense_web/messages/en.json b/surfsense_web/messages/en.json
index 4310bc707..3cafebfdd 100644
--- a/surfsense_web/messages/en.json
+++ b/surfsense_web/messages/en.json
@@ -376,8 +376,8 @@
 	"upload_documents": {
 		"title": "Upload Documents",
 		"subtitle": "Upload your files to make them searchable and accessible through AI-powered conversations.",
-		"file_size_limit": "Maximum file size: 50MB per file.",
-		"upload_limits": "Upload limit: {maxFiles} files, {maxSizeMB}MB total.",
+		"file_size_limit": "Maximum file size: 50MB per file",
+		"upload_limits": "Upload limit: {maxFiles} files, {maxSizeMB}MB total",
 		"drop_files": "Drop files here",
 		"drag_drop": "Drag & drop files here",
 		"or_browse": "or click to browse",
diff --git a/surfsense_web/messages/es.json b/surfsense_web/messages/es.json
index 36e627295..99314ee7d 100644
--- a/surfsense_web/messages/es.json
+++ b/surfsense_web/messages/es.json
@@ -376,8 +376,8 @@
 	"upload_documents": {
 		"title": "Subir documentos",
 		"subtitle": "Sube tus archivos para hacerlos buscables y accesibles a través de conversaciones con IA.",
-		"file_size_limit": "Tamaño máximo de archivo: 50 MB por archivo.",
-		"upload_limits": "Límite de subida: {maxFiles} archivos, {maxSizeMB} MB en total.",
+		"file_size_limit": "Tamaño máximo de archivo: 50 MB por archivo",
+		"upload_limits": "Límite de subida: {maxFiles} archivos, {maxSizeMB} MB en total",
 		"drop_files": "Suelta los archivos aquí",
 		"drag_drop": "Arrastra y suelta archivos aquí",
 		"or_browse": "o haz clic para explorar",
diff --git a/surfsense_web/messages/hi.json b/surfsense_web/messages/hi.json
index fd51acdc2..c11f43815 100644
--- a/surfsense_web/messages/hi.json
+++ b/surfsense_web/messages/hi.json
@@ -376,8 +376,8 @@
 	"upload_documents": {
 		"title": "दस्तावेज़ अपलोड करें",
 		"subtitle": "AI-संचालित बातचीत के माध्यम से अपनी फ़ाइलों को खोजने योग्य और सुलभ बनाने के लिए अपलोड करें।",
-		"file_size_limit": "अधिकतम फ़ाइल आकार: प्रति फ़ाइल 50MB।",
-		"upload_limits": "अपलोड सीमा: {maxFiles} फ़ाइलें, कुल {maxSizeMB}MB।",
+		"file_size_limit": "अधिकतम फ़ाइल आकार: प्रति फ़ाइल 50MB",
+		"upload_limits": "अपलोड सीमा: {maxFiles} फ़ाइलें, कुल {maxSizeMB}MB",
 		"drop_files": "फ़ाइलें यहां छोड़ें",
 		"drag_drop": "फ़ाइलें यहां खींचें और छोड़ें",
 		"or_browse": "या ब्राउज़ करने के लिए क्लिक करें",
diff --git a/surfsense_web/messages/pt.json b/surfsense_web/messages/pt.json
index e26499f90..d77aa0c22 100644
--- a/surfsense_web/messages/pt.json
+++ b/surfsense_web/messages/pt.json
@@ -376,8 +376,8 @@
 	"upload_documents": {
 		"title": "Enviar documentos",
 		"subtitle": "Envie seus arquivos para torná-los pesquisáveis e acessíveis através de conversas com IA.",
-		"file_size_limit": "Tamanho máximo do arquivo: 50 MB por arquivo.",
-		"upload_limits": "Limite de envio: {maxFiles} arquivos, {maxSizeMB} MB no total.",
+		"file_size_limit": "Tamanho máximo do arquivo: 50 MB por arquivo",
+		"upload_limits": "Limite de envio: {maxFiles} arquivos, {maxSizeMB} MB no total",
 		"drop_files": "Solte os arquivos aqui",
 		"drag_drop": "Arraste e solte arquivos aqui",
 		"or_browse": "ou clique para navegar",
diff --git a/surfsense_web/messages/zh.json b/surfsense_web/messages/zh.json
index 819432410..b72a44dbb 100644
--- a/surfsense_web/messages/zh.json
+++ b/surfsense_web/messages/zh.json
@@ -360,8 +360,8 @@
 	"upload_documents": {
 		"title": "上传文档",
 		"subtitle": "上传您的文件，使其可通过 AI 对话进行搜索和访问。",
-		"file_size_limit": "最大文件大小：每个文件 50MB。",
-		"upload_limits": "上传限制：最多 {maxFiles} 个文件，总大小不超过 {maxSizeMB}MB。",
+		"file_size_limit": "最大文件大小：每个文件 50MB",
+		"upload_limits": "上传限制：最多 {maxFiles} 个文件，总大小不超过 {maxSizeMB}MB",
 		"drop_files": "放下文件到这里",
 		"drag_drop": "拖放文件到这里",
 		"or_browse": "或点击浏览",

From e2ba5093140a30b93056e376baa082df7a5324cf Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 09:29:59 +0530
Subject: [PATCH 069/202] feat: enhance error handling in local folder indexing
 by adding rollback and refresh on IntegrityError

---
 .../local_folder_indexer.py                   | 21 +++++++++++++------
 .../components/documents/DocumentNode.tsx     |  4 ++--
 .../layout/ui/sidebar/DocumentsSidebar.tsx    |  8 +++++++
 surfsense_web/components/ui/context-menu.tsx  |  2 +-
 surfsense_web/components/ui/dropdown-menu.tsx |  2 +-
 5 files changed, 27 insertions(+), 10 deletions(-)

diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
index 041df71fc..7f6a35d7f 100644
--- a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -19,7 +19,7 @@ from datetime import UTC, datetime
 from pathlib import Path
 
 from sqlalchemy import select
-from sqlalchemy.exc import SQLAlchemyError
+from sqlalchemy.exc import IntegrityError, SQLAlchemyError
 from sqlalchemy.ext.asyncio import AsyncSession
 
 from app.config import config
@@ -732,7 +732,12 @@ async def index_local_folder(
                 document.folder_id = folder_mapping.get(
                     parent_dir, folder_mapping.get("")
                 )
-            await session.commit()
+            try:
+                await session.commit()
+            except IntegrityError:
+                await session.rollback()
+                for document in documents:
+                    await session.refresh(document)
 
             llm = await get_user_long_context_llm(session, user_id, search_space_id)
 
@@ -905,10 +910,14 @@ async def _index_single_file(
         # Assign folder_id before indexing so the doc appears in the
         # correct folder while still pending/processing.
         if root_folder_id:
-            db_doc.folder_id = await _resolve_folder_for_file(
-                session, rel_path, root_folder_id, search_space_id, user_id
-            )
-            await session.commit()
+            try:
+                db_doc.folder_id = await _resolve_folder_for_file(
+                    session, rel_path, root_folder_id, search_space_id, user_id
+                )
+                await session.commit()
+            except IntegrityError:
+                await session.rollback()
+                await session.refresh(db_doc)
 
         await pipeline.index(db_doc, connector_doc, llm)
 
diff --git a/surfsense_web/components/documents/DocumentNode.tsx b/surfsense_web/components/documents/DocumentNode.tsx
index 7a3b3e0ca..dc92109b1 100644
--- a/surfsense_web/components/documents/DocumentNode.tsx
+++ b/surfsense_web/components/documents/DocumentNode.tsx
@@ -237,7 +237,7 @@ export const DocumentNode = React.memo(function DocumentNode({
 							</DropdownMenuItem>
 							{onExport && (
 								<DropdownMenuSub>
-									<DropdownMenuSubTrigger>
+									<DropdownMenuSubTrigger disabled={isProcessing}>
 										<Download className="mr-2 h-4 w-4" />
 										Export
 									</DropdownMenuSubTrigger>
@@ -277,7 +277,7 @@ export const DocumentNode = React.memo(function DocumentNode({
 					</ContextMenuItem>
 					{onExport && (
 						<ContextMenuSub>
-							<ContextMenuSubTrigger>
+							<ContextMenuSubTrigger disabled={isProcessing}>
 								<Download className="mr-2 h-4 w-4" />
 								Export
 							</ContextMenuSubTrigger>
diff --git a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
index 8dce68eeb..7aa518361 100644
--- a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
@@ -358,6 +358,14 @@ export function DocumentsSidebar({
 	const handleDeleteFolder = useCallback(async (folder: FolderDisplay) => {
 		if (!confirm(`Delete folder "${folder.name}" and all its contents?`)) return;
 		try {
+			const api = window.electronAPI;
+			if (api) {
+				const watchedFolders = await api.getWatchedFolders();
+				const matched = watchedFolders.find((wf) => wf.rootFolderId === folder.id);
+				if (matched) {
+					await api.removeWatchedFolder(matched.path);
+				}
+			}
 			await foldersApiService.deleteFolder(folder.id);
 			toast.success("Folder deleted");
 		} catch (e: unknown) {
diff --git a/surfsense_web/components/ui/context-menu.tsx b/surfsense_web/components/ui/context-menu.tsx
index 0d3c27a6b..f3d4063e2 100644
--- a/surfsense_web/components/ui/context-menu.tsx
+++ b/surfsense_web/components/ui/context-menu.tsx
@@ -47,7 +47,7 @@ function ContextMenuSubTrigger({
 			data-slot="context-menu-sub-trigger"
 			data-inset={inset}
 			className={cn(
-				"focus:bg-accent focus:text-accent-foreground data-[state=open]:bg-accent data-[state=open]:text-accent-foreground flex cursor-default items-center rounded-sm px-2 py-1.5 text-sm outline-hidden select-none data-[inset]:pl-8",
+				"focus:bg-accent focus:text-accent-foreground data-[state=open]:bg-accent data-[state=open]:text-accent-foreground flex cursor-default items-center rounded-sm px-2 py-1.5 text-sm outline-hidden select-none data-[disabled]:pointer-events-none data-[disabled]:opacity-50 data-[inset]:pl-8",
 				className
 			)}
 			{...props}
diff --git a/surfsense_web/components/ui/dropdown-menu.tsx b/surfsense_web/components/ui/dropdown-menu.tsx
index 24b99467e..1584e0ea4 100644
--- a/surfsense_web/components/ui/dropdown-menu.tsx
+++ b/surfsense_web/components/ui/dropdown-menu.tsx
@@ -182,7 +182,7 @@ function DropdownMenuSubTrigger({
 			data-slot="dropdown-menu-sub-trigger"
 			data-inset={inset}
 			className={cn(
-				"focus:bg-neutral-200 focus:text-accent-foreground dark:focus:bg-neutral-700 data-[state=open]:bg-neutral-200 data-[state=open]:text-accent-foreground dark:data-[state=open]:bg-neutral-700 [&_svg:not([class*='text-'])]:text-muted-foreground flex cursor-default items-center gap-2 rounded-sm px-2 py-1.5 text-sm outline-hidden select-none data-[inset]:pl-8 [&_svg]:pointer-events-none [&_svg]:shrink-0 [&_svg:not([class*='size-'])]:size-4",
+				"focus:bg-neutral-200 focus:text-accent-foreground dark:focus:bg-neutral-700 data-[state=open]:bg-neutral-200 data-[state=open]:text-accent-foreground dark:data-[state=open]:bg-neutral-700 [&_svg:not([class*='text-'])]:text-muted-foreground flex cursor-default items-center gap-2 rounded-sm px-2 py-1.5 text-sm outline-hidden select-none data-[disabled]:pointer-events-none data-[disabled]:opacity-50 data-[inset]:pl-8 [&_svg]:pointer-events-none [&_svg]:shrink-0 [&_svg:not([class*='size-'])]:size-4",
 				className
 			)}
 			{...props}

From 1fa8e1cc836564ba71b64d51f4b253f5b10ef919 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 10:02:36 +0530
Subject: [PATCH 070/202] feat: refactor folder indexing to support batch
 processing of multiple files, enhancing performance and error handling

---
 .../app/routes/documents_routes.py            |  38 ++---
 .../app/tasks/celery_tasks/document_tasks.py  | 116 ++++++++++++---
 .../local_folder_indexer.py                   | 132 ++++++++++++++++--
 .../test_local_folder_pipeline.py             |  10 +-
 surfsense_web/hooks/use-folder-sync.ts        |  73 ++++++----
 .../lib/apis/documents-api.service.ts         |   4 +-
 6 files changed, 293 insertions(+), 80 deletions(-)

diff --git a/surfsense_backend/app/routes/documents_routes.py b/surfsense_backend/app/routes/documents_routes.py
index edb01d4cc..e6eed7836 100644
--- a/surfsense_backend/app/routes/documents_routes.py
+++ b/surfsense_backend/app/routes/documents_routes.py
@@ -1305,11 +1305,11 @@ class FolderIndexRequest(PydanticBaseModel):
     enable_summary: bool = False
 
 
-class FolderIndexFileRequest(PydanticBaseModel):
+class FolderIndexFilesRequest(PydanticBaseModel):
     folder_path: str
     folder_name: str
     search_space_id: int
-    target_file_path: str
+    target_file_paths: list[str]
     root_folder_id: int | None = None
     enable_summary: bool = False
 
@@ -1393,14 +1393,15 @@ async def folder_index(
     }
 
 
-@router.post("/documents/folder-index-file")
-async def folder_index_file(
-    request: FolderIndexFileRequest,
+@router.post("/documents/folder-index-files")
+async def folder_index_files(
+    request: FolderIndexFilesRequest,
     session: AsyncSession = Depends(get_async_session),
     user: User = Depends(current_active_user),
 ):
-    """Index a single file within a watched folder (chokidar trigger).
-    Validates that target_file_path is under folder_path.
+    """Index multiple files within a watched folder (batched chokidar trigger).
+    Validates that all target_file_paths are under folder_path.
+    Dispatches a single Celery task that processes them in parallel.
     """
     from app.config import config as app_config
 
@@ -1410,6 +1411,9 @@ async def folder_index_file(
             detail="Local folder indexing is only available in self-hosted mode",
         )
 
+    if not request.target_file_paths:
+        raise HTTPException(status_code=400, detail="target_file_paths must not be empty")
+
     await check_permission(
         session,
         user,
@@ -1420,13 +1424,14 @@ async def folder_index_file(
 
     from pathlib import Path
 
-    try:
-        Path(request.target_file_path).relative_to(request.folder_path)
-    except ValueError:
-        raise HTTPException(
-            status_code=400,
-            detail="target_file_path must be inside folder_path",
-        )
+    for fp in request.target_file_paths:
+        try:
+            Path(fp).relative_to(request.folder_path)
+        except ValueError:
+            raise HTTPException(
+                status_code=400,
+                detail=f"target_file_path {fp} must be inside folder_path",
+            )
 
     from app.tasks.celery_tasks.document_tasks import index_local_folder_task
 
@@ -1435,14 +1440,15 @@ async def folder_index_file(
         user_id=str(user.id),
         folder_path=request.folder_path,
         folder_name=request.folder_name,
-        target_file_path=request.target_file_path,
+        target_file_paths=request.target_file_paths,
         root_folder_id=request.root_folder_id,
         enable_summary=request.enable_summary,
     )
 
     return {
-        "message": "File indexing started",
+        "message": f"Batch indexing started for {len(request.target_file_paths)} file(s)",
         "status": "processing",
+        "file_count": len(request.target_file_paths),
     }
 
 
diff --git a/surfsense_backend/app/tasks/celery_tasks/document_tasks.py b/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
index 4701d9911..16ac50967 100644
--- a/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
+++ b/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
@@ -1275,7 +1275,7 @@ def index_local_folder_task(
     file_extensions: list[str] | None = None,
     root_folder_id: int | None = None,
     enable_summary: bool = False,
-    target_file_path: str | None = None,
+    target_file_paths: list[str] | None = None,
 ):
     """Celery task to index a local folder. Config is passed directly — no connector row."""
     loop = asyncio.new_event_loop()
@@ -1292,7 +1292,7 @@ def index_local_folder_task(
                 file_extensions=file_extensions,
                 root_folder_id=root_folder_id,
                 enable_summary=enable_summary,
-                target_file_path=target_file_path,
+                target_file_paths=target_file_paths,
             )
         )
     finally:
@@ -1308,19 +1308,103 @@ async def _index_local_folder_async(
     file_extensions: list[str] | None = None,
     root_folder_id: int | None = None,
     enable_summary: bool = False,
-    target_file_path: str | None = None,
+    target_file_paths: list[str] | None = None,
 ):
-    """Run local folder indexing with a fresh DB session."""
+    """Run local folder indexing with notification + heartbeat."""
+    is_batch = bool(target_file_paths)
+    is_full_scan = not target_file_paths
+    file_count = len(target_file_paths) if target_file_paths else None
+
+    if is_batch:
+        doc_name = f"{folder_name} ({file_count} file{'s' if file_count != 1 else ''})"
+    else:
+        doc_name = folder_name
+
+    notification = None
+    heartbeat_task = None
+
     async with get_celery_session_maker()() as session:
-        await index_local_folder(
-            session=session,
-            search_space_id=search_space_id,
-            user_id=user_id,
-            folder_path=folder_path,
-            folder_name=folder_name,
-            exclude_patterns=exclude_patterns,
-            file_extensions=file_extensions,
-            root_folder_id=root_folder_id,
-            enable_summary=enable_summary,
-            target_file_path=target_file_path,
-        )
+        try:
+            notification = (
+                await NotificationService.document_processing.notify_processing_started(
+                    session=session,
+                    user_id=UUID(user_id),
+                    document_type="LOCAL_FOLDER_FILE",
+                    document_name=doc_name,
+                    search_space_id=search_space_id,
+                )
+            )
+            _start_heartbeat(notification.id)
+            heartbeat_task = asyncio.create_task(
+                _run_heartbeat_loop(notification.id)
+            )
+        except Exception:
+            logger.warning(
+                "Failed to create notification for local folder indexing",
+                exc_info=True,
+            )
+
+        async def _heartbeat_progress(completed_count: int) -> None:
+            """Refresh heartbeat and optionally update notification progress."""
+            if notification:
+                try:
+                    await NotificationService.document_processing.notify_processing_progress(
+                        session=session,
+                        notification=notification,
+                        stage="indexing",
+                        stage_message=f"Syncing files ({completed_count}/{file_count or '?'})",
+                    )
+                except Exception:
+                    pass
+
+        try:
+            indexed, skipped_or_failed, _rfid, err = await index_local_folder(
+                session=session,
+                search_space_id=search_space_id,
+                user_id=user_id,
+                folder_path=folder_path,
+                folder_name=folder_name,
+                exclude_patterns=exclude_patterns,
+                file_extensions=file_extensions,
+                root_folder_id=root_folder_id,
+                enable_summary=enable_summary,
+                target_file_paths=target_file_paths,
+                on_heartbeat_callback=_heartbeat_progress if (is_batch or is_full_scan) else None,
+            )
+
+            if notification:
+                try:
+                    if err:
+                        await NotificationService.document_processing.notify_processing_completed(
+                            session=session,
+                            notification=notification,
+                            error_message=err,
+                        )
+                    else:
+                        await NotificationService.document_processing.notify_processing_completed(
+                            session=session,
+                            notification=notification,
+                        )
+                except Exception:
+                    logger.warning(
+                        "Failed to update notification after local folder indexing",
+                        exc_info=True,
+                    )
+
+        except Exception as e:
+            logger.exception(f"Local folder indexing failed: {e}")
+            if notification:
+                try:
+                    await NotificationService.document_processing.notify_processing_completed(
+                        session=session,
+                        notification=notification,
+                        error_message=str(e)[:200],
+                    )
+                except Exception:
+                    pass
+            raise
+        finally:
+            if heartbeat_task:
+                heartbeat_task.cancel()
+            if notification:
+                _stop_heartbeat(notification.id)
diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
index 7f6a35d7f..4ac8cc594 100644
--- a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -3,7 +3,7 @@ Local folder indexer.
 
 Indexes files from a local folder on disk. Supports:
 - Full-scan mode (startup reconciliation / manual trigger)
-- Single-file mode (chokidar real-time trigger)
+- Batch mode (chokidar real-time trigger, 1..N files)
 - Filesystem folder structure mirroring into DB Folder rows
 - Document versioning via create_version_snapshot
 - ETL-based file parsing for binary formats (PDF, DOCX, images, audio, etc.)
@@ -13,6 +13,7 @@ Config (folder_path, exclude_patterns, etc.) is passed in from the caller —
 no connector row is read.
 """
 
+import asyncio
 import os
 from collections.abc import Awaitable, Callable
 from datetime import UTC, datetime
@@ -34,6 +35,7 @@ from app.indexing_pipeline.document_hashing import compute_identifier_hash
 from app.indexing_pipeline.indexing_pipeline_service import IndexingPipelineService
 from app.services.llm_service import get_user_long_context_llm
 from app.services.task_logging_service import TaskLoggingService
+from app.tasks.celery_tasks import get_celery_session_maker
 from app.utils.document_versioning import create_version_snapshot
 
 from .base import (
@@ -497,14 +499,15 @@ async def index_local_folder(
     file_extensions: list[str] | None = None,
     root_folder_id: int | None = None,
     enable_summary: bool = False,
-    target_file_path: str | None = None,
+    target_file_paths: list[str] | None = None,
     on_heartbeat_callback: HeartbeatCallbackType | None = None,
 ) -> tuple[int, int, int | None, str | None]:
     """Index files from a local folder.
 
     Supports two modes:
-    - Full scan (target_file_path=None): walks entire folder, handles new/changed/deleted files.
-    - Single-file (target_file_path set): processes only that file.
+    - Batch (target_file_paths set): processes 1..N files.
+      Single-file uses the caller's session; multi-file fans out with per-file sessions.
+    - Full scan (no target paths): walks entire folder, handles new/changed/deleted files.
 
     Returns (indexed_count, skipped_count, root_folder_id, error_or_warning_message).
     """
@@ -517,7 +520,7 @@ async def index_local_folder(
         metadata={
             "folder_path": folder_path,
             "user_id": str(user_id),
-            "target_file_path": target_file_path,
+            "target_file_paths_count": len(target_file_paths) if target_file_paths else None,
         },
     )
 
@@ -535,22 +538,47 @@ async def index_local_folder(
             exclude_patterns = DEFAULT_EXCLUDE_PATTERNS
 
         # ====================================================================
-        # SINGLE-FILE MODE
+        # BATCH MODE (1..N files)
         # ====================================================================
-        if target_file_path:
-            indexed, skipped, err = await _index_single_file(
-                session=session,
+        if target_file_paths:
+            if len(target_file_paths) == 1:
+                indexed, skipped, err = await _index_single_file(
+                    session=session,
+                    search_space_id=search_space_id,
+                    user_id=user_id,
+                    folder_path=folder_path,
+                    folder_name=folder_name,
+                    target_file_path=target_file_paths[0],
+                    enable_summary=enable_summary,
+                    root_folder_id=root_folder_id,
+                    task_logger=task_logger,
+                    log_entry=log_entry,
+                )
+                return indexed, skipped, root_folder_id, err
+
+            indexed, failed, err = await _index_batch_files(
                 search_space_id=search_space_id,
                 user_id=user_id,
                 folder_path=folder_path,
                 folder_name=folder_name,
-                target_file_path=target_file_path,
+                target_file_paths=target_file_paths,
                 enable_summary=enable_summary,
                 root_folder_id=root_folder_id,
-                task_logger=task_logger,
-                log_entry=log_entry,
+                on_progress_callback=on_heartbeat_callback,
             )
-            return indexed, skipped, root_folder_id, err
+            if err:
+                await task_logger.log_task_success(
+                    log_entry,
+                    f"Batch indexing: {indexed} indexed, {failed} failed",
+                    {"indexed": indexed, "failed": failed},
+                )
+            else:
+                await task_logger.log_task_success(
+                    log_entry,
+                    f"Batch indexing complete: {indexed} indexed",
+                    {"indexed": indexed, "failed": failed},
+                )
+            return indexed, failed, root_folder_id, err
 
         # ====================================================================
         # FULL-SCAN MODE
@@ -822,6 +850,84 @@ async def index_local_folder(
         return 0, 0, root_folder_id, str(e)
 
 
+BATCH_CONCURRENCY = 5
+
+
+async def _index_batch_files(
+    search_space_id: int,
+    user_id: str,
+    folder_path: str,
+    folder_name: str,
+    target_file_paths: list[str],
+    enable_summary: bool,
+    root_folder_id: int | None,
+    on_progress_callback: HeartbeatCallbackType | None = None,
+) -> tuple[int, int, str | None]:
+    """Process multiple files in parallel with bounded concurrency.
+
+    Each file gets its own DB session so they can run concurrently.
+    Returns (indexed_count, failed_count, error_summary_or_none).
+    """
+    semaphore = asyncio.Semaphore(BATCH_CONCURRENCY)
+    indexed = 0
+    failed = 0
+    errors: list[str] = []
+    lock = asyncio.Lock()
+    completed = 0
+
+    async def process_one(file_path: str) -> None:
+        nonlocal indexed, failed, completed
+        async with semaphore:
+            try:
+                async with get_celery_session_maker()() as file_session:
+                    task_logger = TaskLoggingService(file_session, search_space_id)
+                    log_entry = await task_logger.log_task_start(
+                        task_name="local_folder_indexing",
+                        source="local_folder_batch_indexing",
+                        message=f"Batch: indexing {Path(file_path).name}",
+                        metadata={"file_path": file_path},
+                    )
+                    ix, _sk, err = await _index_single_file(
+                        session=file_session,
+                        search_space_id=search_space_id,
+                        user_id=user_id,
+                        folder_path=folder_path,
+                        folder_name=folder_name,
+                        target_file_path=file_path,
+                        enable_summary=enable_summary,
+                        root_folder_id=root_folder_id,
+                        task_logger=task_logger,
+                        log_entry=log_entry,
+                    )
+                    async with lock:
+                        indexed += ix
+                        if err:
+                            failed += 1
+                            errors.append(f"{Path(file_path).name}: {err}")
+                        completed += 1
+                        if on_progress_callback and completed % BATCH_CONCURRENCY == 0:
+                            await on_progress_callback(completed)
+            except Exception as exc:
+                logger.exception(f"Batch: error processing {file_path}: {exc}")
+                async with lock:
+                    failed += 1
+                    completed += 1
+                    errors.append(f"{Path(file_path).name}: {exc}")
+
+    await asyncio.gather(*[process_one(fp) for fp in target_file_paths])
+
+    if on_progress_callback:
+        await on_progress_callback(completed)
+
+    error_summary = None
+    if errors:
+        error_summary = f"{failed} file(s) failed: " + "; ".join(errors[:5])
+        if len(errors) > 5:
+            error_summary += f" ... and {len(errors) - 5} more"
+
+    return indexed, failed, error_summary
+
+
 async def _index_single_file(
     session: AsyncSession,
     search_space_id: int,
diff --git a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
index 154cc6e0e..6cc5655c4 100644
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
@@ -215,7 +215,7 @@ class TestFullIndexer:
         db_search_space: SearchSpace,
         tmp_path: Path,
     ):
-        """I5: Single-file mode only processes the specified file."""
+        """I5: Batch mode with a single file only processes that file."""
         from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
 
         (tmp_path / "a.md").write_text("File A")
@@ -228,7 +228,7 @@ class TestFullIndexer:
             user_id=str(db_user.id),
             folder_path=str(tmp_path),
             folder_name="test-folder",
-            target_file_path=str(tmp_path / "b.md"),
+            target_file_paths=[str(tmp_path / "b.md")],
         )
         assert count == 1
 
@@ -507,7 +507,7 @@ class TestFolderMirroring:
             user_id=str(db_user.id),
             folder_path=str(tmp_path),
             folder_name="test-folder",
-            target_file_path=str(sub / "new.md"),
+            target_file_paths=[str(sub / "new.md")],
             root_folder_id=root_folder_id,
         )
         assert count == 1
@@ -546,7 +546,7 @@ class TestFolderMirroring:
         db_search_space: SearchSpace,
         tmp_path: Path,
     ):
-        """F7: Deleting the only file in a subfolder via single-file mode removes empty Folder rows."""
+        """F7: Deleting the only file in a subfolder via batch mode removes empty Folder rows."""
         from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
 
         sub = tmp_path / "notes" / "ephemeral"
@@ -578,7 +578,7 @@ class TestFolderMirroring:
             user_id=str(db_user.id),
             folder_path=str(tmp_path),
             folder_name="test-folder",
-            target_file_path=str(target),
+            target_file_paths=[str(target)],
             root_folder_id=root_folder_id,
         )
 
diff --git a/surfsense_web/hooks/use-folder-sync.ts b/surfsense_web/hooks/use-folder-sync.ts
index 59c061afb..a64add593 100644
--- a/surfsense_web/hooks/use-folder-sync.ts
+++ b/surfsense_web/hooks/use-folder-sync.ts
@@ -16,65 +16,82 @@ interface FileChangedEvent {
 }
 
 const DEBOUNCE_MS = 2000;
-interface QueueItem {
-	event: FileChangedEvent;
+
+interface BatchItem {
+	folderPath: string;
+	folderName: string;
+	searchSpaceId: number;
+	rootFolderId: number | null;
+	filePaths: string[];
 	ackIds: string[];
 }
 
 export function useFolderSync() {
-	const queueRef = useRef<QueueItem[]>([]);
+	const queueRef = useRef<BatchItem[]>([]);
 	const processingRef = useRef(false);
 	const debounceTimers = useRef<Map<string, ReturnType<typeof setTimeout>>>(new Map());
-	const pendingByKey = useRef<Map<string, QueueItem>>(new Map());
+	const pendingByFolder = useRef<Map<string, BatchItem>>(new Map());
 	const isMountedRef = useRef(false);
 
 	async function processQueue() {
 		if (processingRef.current) return;
 		processingRef.current = true;
 		while (queueRef.current.length > 0) {
-			const item = queueRef.current.shift()!;
+			const batch = queueRef.current.shift()!;
 			try {
-				await documentsApiService.folderIndexFile(item.event.searchSpaceId, {
-					folder_path: item.event.folderPath,
-					folder_name: item.event.folderName,
-					search_space_id: item.event.searchSpaceId,
-					target_file_path: item.event.fullPath,
-					root_folder_id: item.event.rootFolderId,
+				await documentsApiService.folderIndexFiles(batch.searchSpaceId, {
+					folder_path: batch.folderPath,
+					folder_name: batch.folderName,
+					search_space_id: batch.searchSpaceId,
+					target_file_paths: batch.filePaths,
+					root_folder_id: batch.rootFolderId,
 				});
 				const api = typeof window !== "undefined" ? window.electronAPI : null;
-				if (api?.acknowledgeFileEvents && item.ackIds.length > 0) {
-					await api.acknowledgeFileEvents(item.ackIds);
+				if (api?.acknowledgeFileEvents && batch.ackIds.length > 0) {
+					await api.acknowledgeFileEvents(batch.ackIds);
 				}
 			} catch (err) {
-				console.error("[FolderSync] Failed to trigger re-index:", err);
+				console.error("[FolderSync] Failed to trigger batch re-index:", err);
 			}
 		}
 		processingRef.current = false;
 	}
 
 	function enqueueWithDebounce(event: FileChangedEvent) {
-		const key = `${event.folderPath}:${event.relativePath}`;
-		const existing = pendingByKey.current.get(key);
-		const ackSet = new Set(existing?.ackIds ?? []);
-		ackSet.add(event.id);
-		pendingByKey.current.set(key, {
-			event,
-			ackIds: Array.from(ackSet),
-		});
+		const folderKey = event.folderPath;
+		const existing = pendingByFolder.current.get(folderKey);
 
-		const existingTimeout = debounceTimers.current.get(key);
+		if (existing) {
+			const pathSet = new Set(existing.filePaths);
+			pathSet.add(event.fullPath);
+			existing.filePaths = Array.from(pathSet);
+			if (!existing.ackIds.includes(event.id)) {
+				existing.ackIds.push(event.id);
+			}
+		} else {
+			pendingByFolder.current.set(folderKey, {
+				folderPath: event.folderPath,
+				folderName: event.folderName,
+				searchSpaceId: event.searchSpaceId,
+				rootFolderId: event.rootFolderId,
+				filePaths: [event.fullPath],
+				ackIds: [event.id],
+			});
+		}
+
+		const existingTimeout = debounceTimers.current.get(folderKey);
 		if (existingTimeout) clearTimeout(existingTimeout);
 
 		const timeout = setTimeout(() => {
-			debounceTimers.current.delete(key);
-			const pending = pendingByKey.current.get(key);
+			debounceTimers.current.delete(folderKey);
+			const pending = pendingByFolder.current.get(folderKey);
 			if (!pending) return;
-			pendingByKey.current.delete(key);
+			pendingByFolder.current.delete(folderKey);
 			queueRef.current.push(pending);
 			processQueue();
 		}, DEBOUNCE_MS);
 
-		debounceTimers.current.set(key, timeout);
+		debounceTimers.current.set(folderKey, timeout);
 	}
 
 	useEffect(() => {
@@ -108,7 +125,7 @@ export function useFolderSync() {
 				clearTimeout(timeout);
 			}
 			debounceTimers.current.clear();
-			pendingByKey.current.clear();
+			pendingByFolder.current.clear();
 		};
 	}, []);
 }
diff --git a/surfsense_web/lib/apis/documents-api.service.ts b/surfsense_web/lib/apis/documents-api.service.ts
index e8b228d03..45d9f6dc8 100644
--- a/surfsense_web/lib/apis/documents-api.service.ts
+++ b/surfsense_web/lib/apis/documents-api.service.ts
@@ -400,8 +400,8 @@ class DocumentsApiService {
 		return baseApiService.post(`/api/v1/documents/folder-index`, undefined, { body });
 	};
 
-	folderIndexFile = async (searchSpaceId: number, body: { folder_path: string; folder_name: string; search_space_id: number; target_file_path: string; root_folder_id?: number | null; enable_summary?: boolean }) => {
-		return baseApiService.post(`/api/v1/documents/folder-index-file`, undefined, { body });
+	folderIndexFiles = async (searchSpaceId: number, body: { folder_path: string; folder_name: string; search_space_id: number; target_file_paths: string[]; root_folder_id?: number | null; enable_summary?: boolean }) => {
+		return baseApiService.post(`/api/v1/documents/folder-index-files`, undefined, { body });
 	};
 
 	getWatchedFolders = async (searchSpaceId: number) => {

From 2b9d79d44c00699253cbcab934e549c6c64b94cb Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 10:04:14 +0530
Subject: [PATCH 071/202] feat: add integration tests for batch processing of
 local folder indexing, covering multiple file scenarios and error handling

---
 .../test_local_folder_pipeline.py             | 130 +++++++++++++++++-
 1 file changed, 129 insertions(+), 1 deletion(-)

diff --git a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
index 6cc5655c4..67254ec93 100644
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
@@ -1,6 +1,7 @@
-"""Integration tests for local folder indexer — Tier 3 (I1-I5), Tier 4 (F1-F7), Tier 5 (P1)."""
+"""Integration tests for local folder indexer — Tier 3 (I1-I5), Tier 4 (F1-F7), Tier 5 (P1), Tier 6 (B1-B2)."""
 
 import os
+from contextlib import asynccontextmanager
 from pathlib import Path
 
 import pytest
@@ -24,6 +25,34 @@ UNIFIED_FIXTURES = (
 )
 
 
+class _FakeSessionMaker:
+    """Wraps an existing AsyncSession so ``async with factory()`` yields it
+    without closing it. Used to route batch-mode DB operations through the
+    test's savepoint-wrapped session."""
+
+    def __init__(self, session: AsyncSession):
+        self._session = session
+
+    def __call__(self):
+        @asynccontextmanager
+        async def _ctx():
+            yield self._session
+        return _ctx()
+
+
+@pytest.fixture
+def patched_batch_sessions(monkeypatch, db_session):
+    """Make ``_index_batch_files`` use the test session and run sequentially."""
+    monkeypatch.setattr(
+        "app.tasks.connector_indexers.local_folder_indexer.get_celery_session_maker",
+        lambda: _FakeSessionMaker(db_session),
+    )
+    monkeypatch.setattr(
+        "app.tasks.connector_indexers.local_folder_indexer.BATCH_CONCURRENCY",
+        1,
+    )
+
+
 # ====================================================================
 # Tier 3: Full Indexer Integration (I1-I5)
 # ====================================================================
@@ -597,6 +626,105 @@ class TestFolderMirroring:
         assert notes_after is None
 
 
+# ====================================================================
+# Tier 6: Batch Mode (B1-B2)
+# ====================================================================
+
+
+class TestBatchMode:
+    """Tier 6: ``index_local_folder`` called with explicit ``target_file_paths`` (B1-B2)."""
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
+    async def test_b1_batch_indexes_multiple_files(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+        patched_batch_sessions,
+    ):
+        """B1: Batch with 3 files indexes all of them."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        (tmp_path / "a.md").write_text("File A content")
+        (tmp_path / "b.md").write_text("File B content")
+        (tmp_path / "c.md").write_text("File C content")
+
+        count, failed, _, err = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            target_file_paths=[
+                str(tmp_path / "a.md"),
+                str(tmp_path / "b.md"),
+                str(tmp_path / "c.md"),
+            ],
+        )
+
+        assert count == 3
+        assert failed == 0
+        assert err is None
+
+        docs = (
+            await db_session.execute(
+                select(Document).where(
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
+                )
+            )
+        ).scalars().all()
+        assert len(docs) == 3
+        assert {d.title for d in docs} == {"a.md", "b.md", "c.md"}
+        assert all(
+            DocumentStatus.is_state(d.status, DocumentStatus.READY) for d in docs
+        )
+
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
+    async def test_b2_partial_failure(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+        patched_batch_sessions,
+    ):
+        """B2: One unreadable file fails gracefully; the other two still get indexed."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        (tmp_path / "good1.md").write_text("Good file one")
+        (tmp_path / "good2.md").write_text("Good file two")
+        (tmp_path / "bad.md").write_bytes(b"\x00binary garbage")
+
+        count, failed, _, err = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            target_file_paths=[
+                str(tmp_path / "good1.md"),
+                str(tmp_path / "bad.md"),
+                str(tmp_path / "good2.md"),
+            ],
+        )
+
+        assert count == 2
+        assert failed == 1
+        assert err is not None
+
+        docs = (
+            await db_session.execute(
+                select(Document).where(
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
+                )
+            )
+        ).scalars().all()
+        assert len(docs) == 2
+        assert {d.title for d in docs} == {"good1.md", "good2.md"}
+
+
 # ====================================================================
 # Tier 5: Pipeline Integration (P1)
 # ====================================================================

From 19dfd9f90765d4021ac71c68b7bfd47e26e0ac61 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 10:13:46 +0530
Subject: [PATCH 072/202] feat: enhance folder synchronization by adding max
 wait time and batch size limits for processing file events

---
 surfsense_web/hooks/use-folder-sync.ts | 40 ++++++++++++++++++++------
 1 file changed, 31 insertions(+), 9 deletions(-)

diff --git a/surfsense_web/hooks/use-folder-sync.ts b/surfsense_web/hooks/use-folder-sync.ts
index a64add593..ef3326556 100644
--- a/surfsense_web/hooks/use-folder-sync.ts
+++ b/surfsense_web/hooks/use-folder-sync.ts
@@ -16,6 +16,8 @@ interface FileChangedEvent {
 }
 
 const DEBOUNCE_MS = 2000;
+const MAX_WAIT_MS = 10_000;
+const MAX_BATCH_SIZE = 50;
 
 interface BatchItem {
 	folderPath: string;
@@ -31,6 +33,7 @@ export function useFolderSync() {
 	const processingRef = useRef(false);
 	const debounceTimers = useRef<Map<string, ReturnType<typeof setTimeout>>>(new Map());
 	const pendingByFolder = useRef<Map<string, BatchItem>>(new Map());
+	const firstEventTime = useRef<Map<string, number>>(new Map());
 	const isMountedRef = useRef(false);
 
 	async function processQueue() {
@@ -57,6 +60,23 @@ export function useFolderSync() {
 		processingRef.current = false;
 	}
 
+	/** Moves a folder's pending batch onto the queue in MAX_BATCH_SIZE slices, then starts processing. */
+	function flushFolder(folderKey: string) {
+		// Drop the timer handle and the first-event timestamp for this folder up front.
+		debounceTimers.current.delete(folderKey);
+		firstEventTime.current.delete(folderKey);
+		const batch = pendingByFolder.current.get(folderKey);
+		if (!batch) return;
+		pendingByFolder.current.delete(folderKey);
+		const { filePaths, ackIds } = batch;
+		// Only the first slice carries the ack ids; later slices get an empty list.
+		for (let start = 0; start < filePaths.length; start += MAX_BATCH_SIZE) {
+			const chunk = filePaths.slice(start, start + MAX_BATCH_SIZE);
+			queueRef.current.push({ ...batch, filePaths: chunk, ackIds: start === 0 ? ackIds : [] });
+		}
+		processQueue();
+	}
+
 	function enqueueWithDebounce(event: FileChangedEvent) {
 		const folderKey = event.folderPath;
 		const existing = pendingByFolder.current.get(folderKey);
@@ -77,20 +97,21 @@ export function useFolderSync() {
 				filePaths: [event.fullPath],
 				ackIds: [event.id],
 			});
+			firstEventTime.current.set(folderKey, Date.now());
+		}
+
+		const elapsed = Date.now() - (firstEventTime.current.get(folderKey) ?? Date.now());
+		if (elapsed >= MAX_WAIT_MS) {
+			const existingTimeout = debounceTimers.current.get(folderKey);
+			if (existingTimeout) clearTimeout(existingTimeout);
+			flushFolder(folderKey);
+			return;
 		}
 
 		const existingTimeout = debounceTimers.current.get(folderKey);
 		if (existingTimeout) clearTimeout(existingTimeout);
 
-		const timeout = setTimeout(() => {
-			debounceTimers.current.delete(folderKey);
-			const pending = pendingByFolder.current.get(folderKey);
-			if (!pending) return;
-			pendingByFolder.current.delete(folderKey);
-			queueRef.current.push(pending);
-			processQueue();
-		}, DEBOUNCE_MS);
-
+		const timeout = setTimeout(() => flushFolder(folderKey), DEBOUNCE_MS);
 		debounceTimers.current.set(folderKey, timeout);
 	}
 
@@ -126,6 +147,7 @@ export function useFolderSync() {
 			}
 			debounceTimers.current.clear();
 			pendingByFolder.current.clear();
+			firstEventTime.current.clear();
 		};
 	}, []);
 }

From 4ca0787ab7bb8365b36c785ecd41366af32a6874 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 10:42:21 +0530
Subject: [PATCH 073/202] feat: add version history functionality to document
 management, enabling users to view and manage document versions through UI
 updates and backend integration

---
 .../app/tasks/celery_tasks/document_tasks.py  |  12 +-
 .../components/documents/DocumentNode.tsx     |  22 ++
 .../components/documents/FolderTreeView.tsx   |   3 +
 .../components/documents/version-history.tsx  | 251 ++++++++++++------
 .../layout/ui/sidebar/DocumentsSidebar.tsx    |  11 +
 5 files changed, 214 insertions(+), 85 deletions(-)

diff --git a/surfsense_backend/app/tasks/celery_tasks/document_tasks.py b/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
index 16ac50967..506f8118c 100644
--- a/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
+++ b/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
@@ -1321,6 +1321,7 @@ async def _index_local_folder_async(
         doc_name = folder_name
 
     notification = None
+    notification_id: int | None = None
     heartbeat_task = None
 
     async with get_celery_session_maker()() as session:
@@ -1334,9 +1335,10 @@ async def _index_local_folder_async(
                     search_space_id=search_space_id,
                 )
             )
-            _start_heartbeat(notification.id)
+            notification_id = notification.id
+            _start_heartbeat(notification_id)
             heartbeat_task = asyncio.create_task(
-                _run_heartbeat_loop(notification.id)
+                _run_heartbeat_loop(notification_id)
             )
         except Exception:
             logger.warning(
@@ -1374,6 +1376,7 @@ async def _index_local_folder_async(
 
             if notification:
                 try:
+                    await session.refresh(notification)
                     if err:
                         await NotificationService.document_processing.notify_processing_completed(
                             session=session,
@@ -1395,6 +1398,7 @@ async def _index_local_folder_async(
             logger.exception(f"Local folder indexing failed: {e}")
             if notification:
                 try:
+                    await session.refresh(notification)
                     await NotificationService.document_processing.notify_processing_completed(
                         session=session,
                         notification=notification,
@@ -1406,5 +1410,5 @@ async def _index_local_folder_async(
         finally:
             if heartbeat_task:
                 heartbeat_task.cancel()
-            if notification:
-                _stop_heartbeat(notification.id)
+            if notification_id is not None:
+                _stop_heartbeat(notification_id)
diff --git a/surfsense_web/components/documents/DocumentNode.tsx b/surfsense_web/components/documents/DocumentNode.tsx
index dc92109b1..31d1bc7ca 100644
--- a/surfsense_web/components/documents/DocumentNode.tsx
+++ b/surfsense_web/components/documents/DocumentNode.tsx
@@ -5,6 +5,7 @@ import {
 	Clock,
 	Download,
 	Eye,
+	History,
 	MoreHorizontal,
 	Move,
 	PenLine,
@@ -38,6 +39,7 @@ import { Spinner } from "@/components/ui/spinner";
 import { Tooltip, TooltipContent, TooltipTrigger } from "@/components/ui/tooltip";
 import type { DocumentTypeEnum } from "@/contracts/types/document.types";
 import { cn } from "@/lib/utils";
+import { isVersionableType } from "./version-history";
 import { DND_TYPES } from "./FolderNode";
 
 const EDITABLE_DOCUMENT_TYPES = new Set(["FILE", "NOTE"]);
@@ -60,6 +62,7 @@ interface DocumentNodeProps {
 	onDelete: (doc: DocumentNodeDoc) => void;
 	onMove: (doc: DocumentNodeDoc) => void;
 	onExport?: (doc: DocumentNodeDoc, format: string) => void;
+	onVersionHistory?: (doc: DocumentNodeDoc) => void;
 	contextMenuOpen?: boolean;
 	onContextMenuOpenChange?: (open: boolean) => void;
 }
@@ -74,6 +77,7 @@ export const DocumentNode = React.memo(function DocumentNode({
 	onDelete,
 	onMove,
 	onExport,
+	onVersionHistory,
 	contextMenuOpen,
 	onContextMenuOpenChange,
 }: DocumentNodeProps) {
@@ -246,6 +250,15 @@ export const DocumentNode = React.memo(function DocumentNode({
 									</DropdownMenuSubContent>
 								</DropdownMenuSub>
 							)}
+							{onVersionHistory && isVersionableType(doc.document_type) && (
+								<DropdownMenuItem
+									disabled={isProcessing}
+									onClick={() => onVersionHistory(doc)}
+								>
+									<History className="mr-2 h-4 w-4" />
+									Versions
+								</DropdownMenuItem>
+							)}
 							<DropdownMenuItem
 								className="text-destructive focus:text-destructive"
 								disabled={isProcessing}
@@ -286,6 +299,15 @@ export const DocumentNode = React.memo(function DocumentNode({
 							</ContextMenuSubContent>
 						</ContextMenuSub>
 					)}
+					{onVersionHistory && isVersionableType(doc.document_type) && (
+						<ContextMenuItem
+							disabled={isProcessing}
+							onClick={() => onVersionHistory(doc)}
+						>
+							<History className="mr-2 h-4 w-4" />
+							Versions
+						</ContextMenuItem>
+					)}
 					<ContextMenuItem
 						className="text-destructive focus:text-destructive"
 						disabled={isProcessing}
diff --git a/surfsense_web/components/documents/FolderTreeView.tsx b/surfsense_web/components/documents/FolderTreeView.tsx
index 01af73edc..6f64d6258 100644
--- a/surfsense_web/components/documents/FolderTreeView.tsx
+++ b/surfsense_web/components/documents/FolderTreeView.tsx
@@ -32,6 +32,7 @@ interface FolderTreeViewProps {
 	onDeleteDocument: (doc: DocumentNodeDoc) => void;
 	onMoveDocument: (doc: DocumentNodeDoc) => void;
 	onExportDocument?: (doc: DocumentNodeDoc, format: string) => void;
+	onVersionHistory?: (doc: DocumentNodeDoc) => void;
 	activeTypes: DocumentTypeEnum[];
 	searchQuery?: string;
 	onDropIntoFolder?: (
@@ -73,6 +74,7 @@ export function FolderTreeView({
 	onDeleteDocument,
 	onMoveDocument,
 	onExportDocument,
+	onVersionHistory,
 	activeTypes,
 	searchQuery,
 	onDropIntoFolder,
@@ -267,6 +269,7 @@ export function FolderTreeView({
 					onDelete={onDeleteDocument}
 					onMove={onMoveDocument}
 					onExport={onExportDocument}
+					onVersionHistory={onVersionHistory}
 					contextMenuOpen={openContextMenuId === `doc-${d.id}`}
 					onContextMenuOpenChange={(open) => setOpenContextMenuId(open ? `doc-${d.id}` : null)}
 				/>
diff --git a/surfsense_web/components/documents/version-history.tsx b/surfsense_web/components/documents/version-history.tsx
index 29740e079..f438a7190 100644
--- a/surfsense_web/components/documents/version-history.tsx
+++ b/surfsense_web/components/documents/version-history.tsx
@@ -1,16 +1,17 @@
 "use client";
 
 import { useCallback, useEffect, useState } from "react";
-import { Clock, RotateCcw } from "lucide-react";
+import { Check, ChevronRight, Clock, Copy, RotateCcw } from "lucide-react";
 import { Button } from "@/components/ui/button";
 import {
-	Sheet,
-	SheetContent,
-	SheetHeader,
-	SheetTitle,
-	SheetTrigger,
-} from "@/components/ui/sheet";
+	Dialog,
+	DialogContent,
+	DialogTitle,
+	DialogTrigger,
+} from "@/components/ui/dialog";
+import { Separator } from "@/components/ui/separator";
 import { Spinner } from "@/components/ui/spinner";
+import { cn } from "@/lib/utils";
 import { documentsApiService } from "@/lib/apis/documents-api.service";
 import { toast } from "sonner";
 
@@ -26,28 +27,72 @@ interface VersionHistoryProps {
 	documentType: string;
 }
 
+const VERSION_DOCUMENT_TYPES = new Set(["LOCAL_FOLDER_FILE", "OBSIDIAN_CONNECTOR"]);
+/** Returns true when `documentType` is one of the entries in VERSION_DOCUMENT_TYPES. */
+export function isVersionableType(documentType: string) {
+	return VERSION_DOCUMENT_TYPES.has(documentType);
+}
+
+const DIALOG_CLASSES =
+	"select-none max-w-[900px] w-[95vw] md:w-[90vw] h-[90vh] md:h-[80vh] max-h-[640px] flex flex-col md:flex-row p-0 gap-0 overflow-hidden [--card:var(--background)] dark:[--card:oklch(0.205_0_0)] dark:[--background:oklch(0.205_0_0)]";
+
 export function VersionHistoryButton({ documentId, documentType }: VersionHistoryProps) {
-	const showVersionHistory = documentType === "LOCAL_FOLDER_FILE" || documentType === "OBSIDIAN_CONNECTOR";
-	if (!showVersionHistory) return null;
+	if (!isVersionableType(documentType)) return null;
 
 	return (
-		<Sheet>
-			<SheetTrigger asChild>
+		<Dialog>
+			<DialogTrigger asChild>
 				<Button variant="ghost" size="sm" className="gap-1.5 text-xs">
 					<Clock className="h-3.5 w-3.5" />
 					Versions
 				</Button>
-			</SheetTrigger>
-			<SheetContent className="w-[400px] sm:w-[540px]">
-				<SheetHeader>
-					<SheetTitle>Version History</SheetTitle>
-				</SheetHeader>
+			</DialogTrigger>
+			<DialogContent className={DIALOG_CLASSES}>
+				<DialogTitle className="sr-only">Version History</DialogTitle>
 				<VersionHistoryPanel documentId={documentId} />
-			</SheetContent>
-		</Sheet>
+			</DialogContent>
+		</Dialog>
 	);
 }
 
+/** Controlled version-history dialog: the caller owns `open` and is notified through `onOpenChange`. */
+export function VersionHistoryDialog(props: {
+	open: boolean;
+	onOpenChange: (open: boolean) => void;
+	documentId: number;
+}) {
+	const { open, onOpenChange, documentId } = props;
+	// The panel is rendered only while the dialog is open, so nothing is mounted when it is closed.
+	const panel = open ? <VersionHistoryPanel documentId={documentId} /> : null;
+	return (
+		<Dialog open={open} onOpenChange={onOpenChange}>
+			<DialogContent className={DIALOG_CLASSES}>
+				<DialogTitle className="sr-only">Version History</DialogTitle>
+				{panel}
+			</DialogContent>
+		</Dialog>
+	);
+}
+
+function formatRelativeTime(dateStr: string): string {
+	const then = new Date(dateStr);
+	// An unparseable timestamp would otherwise fall through and render as "Invalid Date"; show the raw value.
+	if (Number.isNaN(then.getTime())) return dateStr;
+	const diffMin = Math.floor((Date.now() - then.getTime()) / 60_000);
+	if (diffMin < 1) return "Just now";
+	if (diffMin < 60) return `${diffMin} minute${diffMin !== 1 ? "s" : ""} ago`;
+	const diffHr = Math.floor(diffMin / 60);
+	if (diffHr < 24) return `${diffHr} hour${diffHr !== 1 ? "s" : ""} ago`;
+	return then.toLocaleDateString(undefined, {
+		weekday: "short",
+		month: "short",
+		day: "numeric",
+		year: "numeric",
+		hour: "numeric",
+		minute: "2-digit",
+	});
+}
+
 function VersionHistoryPanel({ documentId }: { documentId: number }) {
 	const [versions, setVersions] = useState<DocumentVersionSummary[]>([]);
 	const [loading, setLoading] = useState(true);
@@ -55,6 +100,7 @@ function VersionHistoryPanel({ documentId }: { documentId: number }) {
 	const [versionContent, setVersionContent] = useState<string>("");
 	const [contentLoading, setContentLoading] = useState(false);
 	const [restoring, setRestoring] = useState(false);
+	const [copied, setCopied] = useState(false);
 
 	const loadVersions = useCallback(async () => {
 		setLoading(true);
@@ -73,6 +119,7 @@ function VersionHistoryPanel({ documentId }: { documentId: number }) {
 	}, [loadVersions]);
 
 	const handleSelectVersion = async (versionNumber: number) => {
+		if (selectedVersion === versionNumber) return;
 		setSelectedVersion(versionNumber);
 		setContentLoading(true);
 		try {
@@ -101,9 +148,15 @@ function VersionHistoryPanel({ documentId }: { documentId: number }) {
 		}
 	};
 
+	const handleCopy = () =>
+		navigator.clipboard.writeText(versionContent).then(() => {
+			setCopied(true); // confirm only once the clipboard write has actually resolved
+			setTimeout(() => setCopied(false), 2000);
+		}, () => void toast.error("Failed to copy to clipboard")); // rejected write: report it instead of showing "Copied"
+
 	if (loading) {
 		return (
-			<div className="flex items-center justify-center py-12">
+			<div className="flex flex-1 items-center justify-center">
 				<Spinner size="lg" className="text-muted-foreground" />
 			</div>
 		);
@@ -111,75 +164,111 @@ function VersionHistoryPanel({ documentId }: { documentId: number }) {
 
 	if (versions.length === 0) {
 		return (
-			<div className="flex flex-col items-center justify-center py-12 text-muted-foreground">
-				<Clock className="h-8 w-8 mb-2 opacity-50" />
+			<div className="flex flex-1 flex-col items-center justify-center text-muted-foreground">
 				<p className="text-sm">No version history available yet.</p>
 				<p className="text-xs mt-1">Versions are created when file content changes.</p>
 			</div>
 		);
 	}
 
-	return (
-		<div className="flex flex-col gap-4 pt-4 h-full">
-			<div className="flex-1 overflow-y-auto space-y-2">
-				{versions.map((v) => (
-					<div
-						key={v.version_number}
-						className={`rounded-lg border p-3 cursor-pointer transition-colors ${
-							selectedVersion === v.version_number
-								? "border-primary bg-primary/5"
-								: "border-border hover:border-primary/50"
-						}`}
-						onClick={() => handleSelectVersion(v.version_number)}
-					>
-						<div className="flex items-center justify-between">
-							<div className="space-y-1">
-								<p className="text-sm font-medium">Version {v.version_number}</p>
-								{v.created_at && (
-									<p className="text-xs text-muted-foreground">
-										{new Date(v.created_at).toLocaleString()}
-									</p>
-								)}
-								{v.title && (
-									<p className="text-xs text-muted-foreground truncate max-w-[200px]">
-										{v.title}
-									</p>
-								)}
-							</div>
-							<Button
-								variant="outline"
-								size="sm"
-								className="shrink-0 gap-1"
-								disabled={restoring}
-								onClick={(e) => {
-									e.stopPropagation();
-									handleRestore(v.version_number);
-								}}
-							>
-								<RotateCcw className="h-3 w-3" />
-								Restore
-							</Button>
-						</div>
-					</div>
-				))}
-			</div>
+	const selectedVersionData = versions.find((v) => v.version_number === selectedVersion);
 
-			{selectedVersion !== null && (
-				<div className="border-t pt-4 max-h-[40vh] overflow-y-auto">
-					<h4 className="text-sm font-medium mb-2">
-						Preview — Version {selectedVersion}
-					</h4>
-					{contentLoading ? (
-						<div className="flex items-center justify-center py-6">
-							<Spinner size="sm" />
-						</div>
-					) : (
-						<pre className="text-xs whitespace-pre-wrap font-mono bg-muted/50 rounded-lg p-3 max-h-[30vh] overflow-y-auto">
-							{versionContent || "(empty)"}
-						</pre>
-					)}
+	return (
+		<>
+			{/* Left panel — version list */}
+			<nav className="w-full md:w-[260px] shrink-0 flex flex-col border-b md:border-b-0 md:border-r border-border">
+				<div className="px-4 pr-12 md:pr-4 pt-5 pb-2">
+					<h2 className="text-sm font-semibold text-foreground">Version History</h2>
 				</div>
-			)}
-		</div>
+				<div className="flex-1 overflow-y-auto p-2">
+					<div className="flex flex-col gap-0.5">
+						{versions.map((v) => (
+							<button
+								key={v.version_number}
+								type="button"
+								onClick={() => handleSelectVersion(v.version_number)}
+								className={cn(
+									"flex items-center gap-2 rounded-lg px-3 py-2.5 text-left transition-colors focus:outline-none focus-visible:outline-none w-full",
+									selectedVersion === v.version_number
+										? "bg-accent text-accent-foreground"
+										: "text-muted-foreground hover:bg-accent/50 hover:text-foreground"
+								)}
+							>
+								<div className="flex-1 min-w-0 space-y-0.5">
+									<p className="text-sm font-medium truncate">
+										{v.created_at ? formatRelativeTime(v.created_at) : `Version ${v.version_number}`}
+									</p>
+									{v.title && (
+										<p className="text-xs text-muted-foreground truncate">
+											{v.title}
+										</p>
+									)}
+								</div>
+								<ChevronRight className="h-3.5 w-3.5 shrink-0 opacity-50" />
+							</button>
+						))}
+					</div>
+				</div>
+			</nav>
+
+			{/* Right panel — content preview */}
+			<div className="flex flex-1 flex-col overflow-hidden min-w-0">
+				{selectedVersion !== null && selectedVersionData ? (
+					<>
+						<div className="flex items-center justify-between pl-6 pr-14 pt-5 pb-2">
+							<h2 className="text-sm font-semibold truncate">
+								{selectedVersionData.title || `Version ${selectedVersion}`}
+							</h2>
+							<div className="flex items-center gap-1.5 shrink-0">
+								<Button
+									variant="outline"
+									size="sm"
+									className="gap-1.5 text-xs"
+									onClick={handleCopy}
+									disabled={contentLoading || copied}
+								>
+									{copied ? (
+										<Check className="h-3 w-3" />
+									) : (
+										<Copy className="h-3 w-3" />
+									)}
+									{copied ? "Copied" : "Copy"}
+								</Button>
+								<Button
+									variant="outline"
+									size="sm"
+									className="gap-1.5 text-xs"
+									disabled={restoring || contentLoading}
+									onClick={() => handleRestore(selectedVersion)}
+								>
+									{restoring ? (
+										<Spinner size="xs" />
+									) : (
+										<RotateCcw className="h-3 w-3" />
+									)}
+									Restore
+								</Button>
+							</div>
+						</div>
+						<Separator />
+						<div className="flex-1 overflow-y-auto px-6 py-4">
+							{contentLoading ? (
+								<div className="flex items-center justify-center py-12">
+									<Spinner size="sm" className="text-muted-foreground" />
+								</div>
+							) : (
+								<pre className="text-sm whitespace-pre-wrap font-mono leading-relaxed text-foreground/90">
+									{versionContent || "(empty)"}
+								</pre>
+							)}
+						</div>
+					</>
+				) : (
+					<div className="flex flex-1 items-center justify-center text-muted-foreground">
+						<p className="text-sm">Select a version to preview</p>
+					</div>
+				)}
+			</div>
+		</>
 	);
 }
diff --git a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
index 7aa518361..031390c9e 100644
--- a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
@@ -21,6 +21,7 @@ import type { DocumentNodeDoc } from "@/components/documents/DocumentNode";
 import type { FolderDisplay } from "@/components/documents/FolderNode";
 import { FolderPickerDialog } from "@/components/documents/FolderPickerDialog";
 import { FolderTreeView } from "@/components/documents/FolderTreeView";
+import { VersionHistoryDialog } from "@/components/documents/version-history";
 import { JsonMetadataViewer } from "@/components/json-metadata-viewer";
 import { EXPORT_FILE_EXTENSIONS } from "@/components/shared/ExportMenuItems";
 import {
@@ -579,6 +580,7 @@ export function DocumentsSidebar({
 
 	const [bulkDeleteConfirmOpen, setBulkDeleteConfirmOpen] = useState(false);
 	const [isBulkDeleting, setIsBulkDeleting] = useState(false);
+	const [versionDocId, setVersionDocId] = useState<number | null>(null);
 
 	const handleBulkDeleteSelected = useCallback(async () => {
 		if (deletableSelectedIds.length === 0) return;
@@ -826,6 +828,7 @@ export function DocumentsSidebar({
 				onDeleteDocument={(doc) => handleDeleteDocument(doc.id)}
 				onMoveDocument={handleMoveDocument}
 				onExportDocument={handleExportDocument}
+				onVersionHistory={(doc) => setVersionDocId(doc.id)}
 				activeTypes={activeTypes}
 				onDropIntoFolder={handleDropIntoFolder}
 				onReorderFolder={handleReorderFolder}
@@ -850,6 +853,14 @@ export function DocumentsSidebar({
 			}}
 		/>
 
+		{versionDocId !== null && (
+			<VersionHistoryDialog
+				open
+				onOpenChange={(open) => { if (!open) setVersionDocId(null); }}
+				documentId={versionDocId}
+			/>
+		)}
+
 		<FolderPickerDialog
 				open={folderPickerOpen}
 				onOpenChange={setFolderPickerOpen}

From ca250910c09a2d9aaa3c553aba350b749a7ecdc5 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 10:56:43 +0530
Subject: [PATCH 074/202] fix: update version history messages for clarity by
 removing unnecessary punctuation

---
 surfsense_web/components/documents/version-history.tsx | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/surfsense_web/components/documents/version-history.tsx b/surfsense_web/components/documents/version-history.tsx
index f438a7190..7aba92b47 100644
--- a/surfsense_web/components/documents/version-history.tsx
+++ b/surfsense_web/components/documents/version-history.tsx
@@ -165,8 +165,8 @@ function VersionHistoryPanel({ documentId }: { documentId: number }) {
 	if (versions.length === 0) {
 		return (
 			<div className="flex flex-1 flex-col items-center justify-center text-muted-foreground">
-				<p className="text-sm">No version history available yet.</p>
-				<p className="text-xs mt-1">Versions are created when file content changes.</p>
+				<p className="text-sm">No version history available yet</p>
+				<p className="text-xs mt-1">Versions are created when file content changes</p>
 			</div>
 		);
 	}

From 79f19b9bc637d13bf89a8c08ae2e815123093491 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 11:10:46 +0530
Subject: [PATCH 075/202] fix: adjust layout in DocumentsSidebar for improved
 UI responsiveness and interaction, including changes to button styles and
 positioning

---
 .../components/layout/ui/sidebar/DocumentsSidebar.tsx     | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
index 031390c9e..24f6666c9 100644
--- a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
@@ -784,12 +784,13 @@ export function DocumentsSidebar({
 			/>
 				</div>
 
+			<div className="relative flex-1 min-h-0 overflow-auto">
 				{deletableSelectedIds.length > 0 && (
-					<div className="shrink-0 flex items-center justify-center px-4 py-1.5 animate-in fade-in duration-150">
+					<div className="absolute inset-x-0 top-0 z-10 flex items-center justify-center px-4 py-1.5 animate-in fade-in duration-150 pointer-events-none">
 						<button
 							type="button"
 							onClick={() => setBulkDeleteConfirmOpen(true)}
-							className="flex items-center gap-1.5 px-3 py-1 rounded-md bg-destructive text-destructive-foreground shadow-sm text-xs font-medium hover:bg-destructive/90 transition-colors"
+							className="pointer-events-auto flex items-center gap-1.5 px-3 py-1 rounded-md bg-destructive text-destructive-foreground shadow-lg text-xs font-medium hover:bg-destructive/90 transition-colors"
 						>
 							<Trash2 size={12} />
 							Delete {deletableSelectedIds.length}{" "}
@@ -798,7 +799,7 @@ export function DocumentsSidebar({
 					</div>
 				)}
 
-				<FolderTreeView
+			<FolderTreeView
 				folders={treeFolders}
 				documents={searchFilteredDocuments}
 				expandedIds={expandedIds}
@@ -837,6 +838,7 @@ export function DocumentsSidebar({
 			onStopWatchingFolder={handleStopWatching}
 			onViewFolderMetadata={handleViewFolderMetadata}
 		/>
+			</div>
 		</div>
 
 		<JsonMetadataViewer

From 525fae5abf3796cfe5bc5ecd3b39c207878a7894 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 11:19:54 +0530
Subject: [PATCH 076/202] feat: trigger document reindexing after restoring a
 document version to ensure content is up-to-date

---
 surfsense_backend/app/routes/documents_routes.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/surfsense_backend/app/routes/documents_routes.py b/surfsense_backend/app/routes/documents_routes.py
index e6eed7836..083ed2b89 100644
--- a/surfsense_backend/app/routes/documents_routes.py
+++ b/surfsense_backend/app/routes/documents_routes.py
@@ -1285,6 +1285,9 @@ async def restore_document_version(
     document.content_needs_reindexing = True
     await session.commit()
 
+    from app.tasks.celery_tasks.document_reindex_tasks import reindex_document_task
+    reindex_document_task.delay(document_id, str(user.id))
+
     return {
         "message": f"Restored version {version_number}",
         "document_id": document_id,

From 3833084dad3444d7bf534a7b39dc62ebf24a89fd Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 11:45:53 +0530
Subject: [PATCH 077/202] feat: changed the revision number of folder alembic
 migration

---
 ...ing.py => 118_add_local_folder_sync_and_versioning.py} | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)
 rename surfsense_backend/alembic/versions/{117_add_local_folder_sync_and_versioning.py => 118_add_local_folder_sync_and_versioning.py} (98%)

diff --git a/surfsense_backend/alembic/versions/117_add_local_folder_sync_and_versioning.py b/surfsense_backend/alembic/versions/118_add_local_folder_sync_and_versioning.py
similarity index 98%
rename from surfsense_backend/alembic/versions/117_add_local_folder_sync_and_versioning.py
rename to surfsense_backend/alembic/versions/118_add_local_folder_sync_and_versioning.py
index e322a608d..1fef9fbcb 100644
--- a/surfsense_backend/alembic/versions/117_add_local_folder_sync_and_versioning.py
+++ b/surfsense_backend/alembic/versions/118_add_local_folder_sync_and_versioning.py
@@ -1,7 +1,7 @@
 """Add LOCAL_FOLDER_FILE document type, folder metadata, and document_versions table
 
-Revision ID: 117
-Revises: 116
+Revision ID: 118
+Revises: 117
 """
 
 from collections.abc import Sequence
@@ -10,8 +10,8 @@ import sqlalchemy as sa
 
 from alembic import op
 
-revision: str = "117"
-down_revision: str | None = "116"
+revision: str = "118"
+down_revision: str | None = "117"
 branch_labels: str | Sequence[str] | None = None
 depends_on: str | Sequence[str] | None = None
 

From 3621951f2aeceebaff70328ffe8a6c91e9bad83d Mon Sep 17 00:00:00 2001
From: Matt Van Horn <455140+mvanhorn@users.noreply.github.com>
Date: Thu, 2 Apr 2026 23:21:57 -0700
Subject: [PATCH 078/202] perf: throttle scroll handlers with
 requestAnimationFrame

Wrap scroll handlers in thread.tsx, InboxSidebar.tsx, and
DocumentsTableShell.tsx with requestAnimationFrame batching so scroll
position state updates fire at most once per animation frame instead of
on every scroll event (up to 60/sec at 60fps). Add cleanup useEffect to
cancel pending frames on unmount.

Fixes #1103
---
 .../(manage)/components/DocumentsTableShell.tsx      | 12 +++++++++---
 surfsense_web/components/assistant-ui/thread.tsx     | 12 +++++++++---
 .../components/layout/ui/sidebar/InboxSidebar.tsx    | 12 +++++++++---
 3 files changed, 27 insertions(+), 9 deletions(-)

diff --git a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
index ceef9f2e1..dc8966571 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
@@ -267,12 +267,18 @@ export function DocumentsTableShell({
 	const [metadataJson, setMetadataJson] = useState<Record<string, unknown> | null>(null);
 	const [metadataLoading, setMetadataLoading] = useState(false);
 	const [previewScrollPos, setPreviewScrollPos] = useState<"top" | "middle" | "bottom">("top");
+	const previewRafRef = useRef<number>();
 	const handlePreviewScroll = useCallback((e: React.UIEvent<HTMLDivElement>) => {
 		const el = e.currentTarget;
-		const atTop = el.scrollTop <= 2;
-		const atBottom = el.scrollHeight - el.scrollTop - el.clientHeight <= 2;
-		setPreviewScrollPos(atTop ? "top" : atBottom ? "bottom" : "middle");
+		if (previewRafRef.current) return;
+		previewRafRef.current = requestAnimationFrame(() => {
+			const atTop = el.scrollTop <= 2;
+			const atBottom = el.scrollHeight - el.scrollTop - el.clientHeight <= 2;
+			setPreviewScrollPos(atTop ? "top" : atBottom ? "bottom" : "middle");
+			previewRafRef.current = undefined;
+		});
 	}, []);
+	useEffect(() => () => { if (previewRafRef.current) cancelAnimationFrame(previewRafRef.current); }, []);
 
 	const [deleteDoc, setDeleteDoc] = useState<Document | null>(null);
 	const [isDeleting, setIsDeleting] = useState(false);
diff --git a/surfsense_web/components/assistant-ui/thread.tsx b/surfsense_web/components/assistant-ui/thread.tsx
index 0d0163d8a..0f230cec3 100644
--- a/surfsense_web/components/assistant-ui/thread.tsx
+++ b/surfsense_web/components/assistant-ui/thread.tsx
@@ -816,12 +816,18 @@ const ComposerAction: FC<ComposerActionProps> = ({ isBlockedByOtherUser = false
 	const isDesktop = useMediaQuery("(min-width: 640px)");
 	const { openDialog: openUploadDialog } = useDocumentUploadDialog();
 	const [toolsScrollPos, setToolsScrollPos] = useState<"top" | "middle" | "bottom">("top");
+	const toolsRafRef = useRef<number>();
 	const handleToolsScroll = useCallback((e: React.UIEvent<HTMLDivElement>) => {
 		const el = e.currentTarget;
-		const atTop = el.scrollTop <= 2;
-		const atBottom = el.scrollHeight - el.scrollTop - el.clientHeight <= 2;
-		setToolsScrollPos(atTop ? "top" : atBottom ? "bottom" : "middle");
+		if (toolsRafRef.current) return;
+		toolsRafRef.current = requestAnimationFrame(() => {
+			const atTop = el.scrollTop <= 2;
+			const atBottom = el.scrollHeight - el.scrollTop - el.clientHeight <= 2;
+			setToolsScrollPos(atTop ? "top" : atBottom ? "bottom" : "middle");
+			toolsRafRef.current = undefined;
+		});
 	}, []);
+	useEffect(() => () => { if (toolsRafRef.current) cancelAnimationFrame(toolsRafRef.current); }, []);
 	const isComposerTextEmpty = useAuiState(({ composer }) => {
 		const text = composer.text?.trim() || "";
 		return text.length === 0;
diff --git a/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
index 72400a589..4aa8d4c60 100644
--- a/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
@@ -178,12 +178,18 @@ export function InboxSidebarContent({
 	const [mounted, setMounted] = useState(false);
 	const [openDropdown, setOpenDropdown] = useState<"filter" | null>(null);
 	const [connectorScrollPos, setConnectorScrollPos] = useState<"top" | "middle" | "bottom">("top");
+	const connectorRafRef = useRef<number>();
 	const handleConnectorScroll = useCallback((e: React.UIEvent<HTMLDivElement>) => {
 		const el = e.currentTarget;
-		const atTop = el.scrollTop <= 2;
-		const atBottom = el.scrollHeight - el.scrollTop - el.clientHeight <= 2;
-		setConnectorScrollPos(atTop ? "top" : atBottom ? "bottom" : "middle");
+		if (connectorRafRef.current) return;
+		connectorRafRef.current = requestAnimationFrame(() => {
+			const atTop = el.scrollTop <= 2;
+			const atBottom = el.scrollHeight - el.scrollTop - el.clientHeight <= 2;
+			setConnectorScrollPos(atTop ? "top" : atBottom ? "bottom" : "middle");
+			connectorRafRef.current = undefined;
+		});
 	}, []);
+	useEffect(() => () => { if (connectorRafRef.current) cancelAnimationFrame(connectorRafRef.current); }, []);
 	const [filterDrawerOpen, setFilterDrawerOpen] = useState(false);
 	const [markingAsReadId, setMarkingAsReadId] = useState<number | null>(null);
 

From e38a0ff7c345cb83121f7983eec838cfdf579f66 Mon Sep 17 00:00:00 2001
From: Matt Van Horn <455140+mvanhorn@users.noreply.github.com>
Date: Thu, 2 Apr 2026 23:43:19 -0700
Subject: [PATCH 079/202] style: format useEffect cleanup to satisfy biome

---
 .../documents/(manage)/components/DocumentsTableShell.tsx  | 7 ++++++-
 surfsense_web/components/assistant-ui/thread.tsx           | 7 ++++++-
 .../components/layout/ui/sidebar/InboxSidebar.tsx          | 7 ++++++-
 3 files changed, 18 insertions(+), 3 deletions(-)

diff --git a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
index dc8966571..748fb1911 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsTableShell.tsx
@@ -278,7 +278,12 @@ export function DocumentsTableShell({
 			previewRafRef.current = undefined;
 		});
 	}, []);
-	useEffect(() => () => { if (previewRafRef.current) cancelAnimationFrame(previewRafRef.current); }, []);
+	useEffect(
+		() => () => {
+			if (previewRafRef.current) cancelAnimationFrame(previewRafRef.current);
+		},
+		[]
+	);
 
 	const [deleteDoc, setDeleteDoc] = useState<Document | null>(null);
 	const [isDeleting, setIsDeleting] = useState(false);
diff --git a/surfsense_web/components/assistant-ui/thread.tsx b/surfsense_web/components/assistant-ui/thread.tsx
index 0f230cec3..718bf3961 100644
--- a/surfsense_web/components/assistant-ui/thread.tsx
+++ b/surfsense_web/components/assistant-ui/thread.tsx
@@ -827,7 +827,12 @@ const ComposerAction: FC<ComposerActionProps> = ({ isBlockedByOtherUser = false
 			toolsRafRef.current = undefined;
 		});
 	}, []);
-	useEffect(() => () => { if (toolsRafRef.current) cancelAnimationFrame(toolsRafRef.current); }, []);
+	useEffect(
+		() => () => {
+			if (toolsRafRef.current) cancelAnimationFrame(toolsRafRef.current);
+		},
+		[]
+	);
 	const isComposerTextEmpty = useAuiState(({ composer }) => {
 		const text = composer.text?.trim() || "";
 		return text.length === 0;
diff --git a/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
index 4aa8d4c60..525b7cf74 100644
--- a/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
@@ -189,7 +189,12 @@ export function InboxSidebarContent({
 			connectorRafRef.current = undefined;
 		});
 	}, []);
-	useEffect(() => () => { if (connectorRafRef.current) cancelAnimationFrame(connectorRafRef.current); }, []);
+	useEffect(
+		() => () => {
+			if (connectorRafRef.current) cancelAnimationFrame(connectorRafRef.current);
+		},
+		[]
+	);
 	const [filterDrawerOpen, setFilterDrawerOpen] = useState(false);
 	const [markingAsReadId, setMarkingAsReadId] = useState<number | null>(null);
 

From b9b2bac16f89203e16b637ab12e3edb5ef3b4589 Mon Sep 17 00:00:00 2001
From: Matt Van Horn <455140+mvanhorn@users.noreply.github.com>
Date: Thu, 2 Apr 2026 23:59:15 -0700
Subject: [PATCH 080/202] fix: clean up onboarding tour timer leaks

Fix two timer cleanup bugs in onboarding-tour.tsx:

1. Remove the cleanup function returned from the updateTarget
   useCallback; a returned cleanup is only honoured by React when it
   comes from a useEffect callback. Clear retryTimerRef at the start
   of updateTarget and in a dedicated useEffect cleanup instead.

2. Track recursive setTimeout calls via startCheckTimerRef so they
   are properly cancelled on unmount instead of leaking.

Fixes #1091
---
 surfsense_web/components/onboarding-tour.tsx | 12 ++++++++----
 1 file changed, 8 insertions(+), 4 deletions(-)

diff --git a/surfsense_web/components/onboarding-tour.tsx b/surfsense_web/components/onboarding-tour.tsx
index 1c52169cb..d762d9c15 100644
--- a/surfsense_web/components/onboarding-tour.tsx
+++ b/surfsense_web/components/onboarding-tour.tsx
@@ -429,6 +429,7 @@ export function OnboardingTour() {
 	const pathname = usePathname();
 	const retryCountRef = useRef(0);
 	const retryTimerRef = useRef<ReturnType<typeof setTimeout> | null>(null);
+	const startCheckTimerRef = useRef<ReturnType<typeof setTimeout> | null>(null);
 	const maxRetries = 10;
 	// Track previous user ID to detect user changes
 	const previousUserIdRef = useRef<string | null>(null);
@@ -460,6 +461,7 @@ export function OnboardingTour() {
 
 	// Find and track target element with retry logic
 	const updateTarget = useCallback(() => {
+		if (retryTimerRef.current) clearTimeout(retryTimerRef.current);
 		if (!currentStep) return;
 
 		const el = document.querySelector(currentStep.target);
@@ -480,11 +482,13 @@ export function OnboardingTour() {
 				}
 			}, 200);
 		}
+	}, [currentStep]);
 
+	useEffect(() => {
 		return () => {
 			if (retryTimerRef.current) clearTimeout(retryTimerRef.current);
 		};
-	}, [currentStep]);
+	}, []);
 
 	// Check if tour should run: localStorage + data validation with user ID tracking
 	useEffect(() => {
@@ -573,15 +577,15 @@ export function OnboardingTour() {
 				setPosition(calculatePosition(connectorEl, TOUR_STEPS[0].placement));
 			} else {
 				// Retry after delay
-				setTimeout(checkAndStartTour, 200);
+				startCheckTimerRef.current = setTimeout(checkAndStartTour, 200);
 			}
 		};
 
 		// Start checking after initial delay
-		const timer = setTimeout(checkAndStartTour, 500);
+		startCheckTimerRef.current = setTimeout(checkAndStartTour, 500);
 		return () => {
 			cancelled = true;
-			clearTimeout(timer);
+			if (startCheckTimerRef.current) clearTimeout(startCheckTimerRef.current);
 		};
 	}, [mounted, user?.id, searchSpaceId, pathname, threadsData, documentTypeCounts, connectors]);
 

From 388811194e720a28dce7a92e47757d01f9f2820f Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 12:33:47 +0530
Subject: [PATCH 081/202] feat: update DocumentUploadTab to use a dropdown for
 file and folder selection, enhancing user experience; also update upload
 limits and file size messages in multiple languages

---
 .../components/sources/DocumentUploadTab.tsx  | 73 ++++++-------------
 surfsense_web/messages/en.json                | 15 +++-
 surfsense_web/messages/es.json                | 15 +++-
 surfsense_web/messages/hi.json                | 15 +++-
 surfsense_web/messages/pt.json                | 15 +++-
 surfsense_web/messages/zh.json                | 17 +++--
 6 files changed, 80 insertions(+), 70 deletions(-)

diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index f3b9166dc..9733bd2e6 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -413,18 +413,24 @@ export function DocumentUploadTab({
 		}
 
 		return (
-			<Button
-				variant="secondary"
-				size="sm"
-				className={`text-xs ${sizeClass} ${widthClass}`}
-				onClick={(e) => {
-					e.stopPropagation();
-					e.preventDefault();
-					fileInputRef.current?.click();
-				}}
-			>
-				{t("browse_files")}
-			</Button>
+			<DropdownMenu>
+				<DropdownMenuTrigger asChild onClick={(e) => e.stopPropagation()}>
+					<Button variant="secondary" size="sm" className={`text-xs gap-1 ${sizeClass} ${widthClass}`}>
+						Browse
+						<ChevronDown className="h-3 w-3 opacity-60" />
+					</Button>
+				</DropdownMenuTrigger>
+				<DropdownMenuContent align="center" onClick={(e) => e.stopPropagation()}>
+					<DropdownMenuItem onClick={() => fileInputRef.current?.click()}>
+						<FileIcon className="h-4 w-4 mr-2" />
+						{t("browse_files")}
+					</DropdownMenuItem>
+					<DropdownMenuItem onClick={() => folderInputRef.current?.click()}>
+						<FolderOpen className="h-4 w-4 mr-2" />
+						{t("browse_folder")}
+					</DropdownMenuItem>
+				</DropdownMenuContent>
+			</DropdownMenu>
 		);
 	};
 
@@ -476,7 +482,7 @@ export function DocumentUploadTab({
 						<Upload className="h-10 w-10 text-muted-foreground" />
 						<div className="text-center space-y-1.5">
 							<p className="text-base font-medium">
-								{isElectron ? "Select files or folder" : "Tap to select files"}
+								{isElectron ? "Select files or folder" : "Tap to select files or folder"}
 							</p>
 							<p className="text-sm text-muted-foreground inline-flex items-center flex-wrap justify-center">
 								<span>{t("file_size_limit")}</span>
@@ -484,40 +490,9 @@ export function DocumentUploadTab({
 								<span>{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}</span>
 							</p>
 						</div>
-						{isElectron && (
-							<div className="w-full mt-1" onClick={(e) => e.stopPropagation()}>
-								{renderBrowseButton({ fullWidth: true })}
-							</div>
-						)}
-						{!isElectron && (
-							<div className="mt-2 flex gap-2">
-								<Button
-									variant="secondary"
-									size="sm"
-									className="text-xs"
-									onClick={(e) => {
-										e.stopPropagation();
-										e.preventDefault();
-										fileInputRef.current?.click();
-									}}
-								>
-									{t("browse_files")}
-								</Button>
-								<Button
-									variant="outline"
-									size="sm"
-									className="text-xs"
-									onClick={(e) => {
-										e.stopPropagation();
-										e.preventDefault();
-										folderInputRef.current?.click();
-									}}
-								>
-									<FolderOpen className="h-4 w-4 mr-1.5" />
-									{t("browse_folder")}
-								</Button>
-							</div>
-						)}
+						<div className="w-full mt-1" onClick={(e) => e.stopPropagation()}>
+							{renderBrowseButton({ fullWidth: true })}
+						</div>
 					</div>
 				)}
 			</div>
@@ -570,8 +545,8 @@ export function DocumentUploadTab({
 				)}
 			</div>
 
-			{/* FOLDER SELECTED */}
-			{selectedFolder && (
+			{/* FOLDER SELECTED (Electron only — web flattens folder contents into file list) */}
+			{isElectron && selectedFolder && (
 				<div className="rounded-lg border border-border p-3 space-y-2">
 					<div className="flex items-center gap-2">
 						<FolderOpen className="h-4 w-4 text-primary shrink-0" />
diff --git a/surfsense_web/messages/en.json b/surfsense_web/messages/en.json
index 47d08e921..3a8c0c632 100644
--- a/surfsense_web/messages/en.json
+++ b/surfsense_web/messages/en.json
@@ -376,11 +376,11 @@
 	"upload_documents": {
 		"title": "Upload Documents",
 		"subtitle": "Upload your files to make them searchable and accessible through AI-powered conversations.",
-		"file_size_limit": "Maximum file size: {maxMB}MB per file",
-		"upload_limits": "Upload files or entire folders",
+		"file_size_limit": "Maximum file size: 50MB per file",
+		"upload_limits": "Upload limit: {maxFiles} files, {maxSizeMB}MB total",
 		"drop_files": "Drop files or folders here",
 		"drag_drop": "Drag & drop files or folders here",
-		"or_browse": "or click to browse files and folders",
+		"or_browse": "or click to browse",
 		"browse_files": "Browse Files",
 		"browse_folder": "Browse Folder",
 		"selected_files": "Selected Files ({count})",
@@ -397,7 +397,14 @@
 		"file_types_desc": "These file types are supported based on your current ETL service configuration.",
 		"file_too_large": "File Too Large",
 		"file_too_large_desc": "\"{name}\" exceeds the {maxMB}MB per-file limit.",
-		"no_supported_files_in_folder": "No supported file types found in the selected folder."
+		"no_supported_files_in_folder": "No supported file types found in the selected folder.",
+		"remaining_capacity": "{files} files, {sizeMB}MB remaining",
+		"file_limit_reached": "File limit reached",
+		"file_limit_reached_desc": "Maximum of {max} files allowed",
+		"max_files_exceeded": "Too many files",
+		"max_files_exceeded_desc": "You can upload a maximum of {max} files at once",
+		"max_size_exceeded": "Total size exceeded",
+		"max_size_exceeded_desc": "Total upload size cannot exceed {max}MB"
 	},
 	"add_webpage": {
 		"title": "Add Webpages for Crawling",
diff --git a/surfsense_web/messages/es.json b/surfsense_web/messages/es.json
index e7761ba25..2de30d29d 100644
--- a/surfsense_web/messages/es.json
+++ b/surfsense_web/messages/es.json
@@ -376,11 +376,11 @@
 	"upload_documents": {
 		"title": "Subir documentos",
 		"subtitle": "Sube tus archivos para hacerlos buscables y accesibles a través de conversaciones con IA.",
-		"file_size_limit": "Tamaño máximo de archivo: {maxMB} MB por archivo",
-		"upload_limits": "Sube archivos o carpetas enteras",
+		"file_size_limit": "Tamaño máximo de archivo: 50 MB por archivo",
+		"upload_limits": "Límite de subida: {maxFiles} archivos, {maxSizeMB} MB en total",
 		"drop_files": "Suelta archivos o carpetas aquí",
 		"drag_drop": "Arrastra y suelta archivos o carpetas aquí",
-		"or_browse": "o haz clic para explorar archivos y carpetas",
+		"or_browse": "o haz clic para explorar",
 		"browse_files": "Explorar archivos",
 		"browse_folder": "Explorar carpeta",
 		"selected_files": "Archivos seleccionados ({count})",
@@ -397,7 +397,14 @@
 		"file_types_desc": "Estos tipos de archivo son soportados según la configuración actual de tu servicio ETL.",
 		"file_too_large": "Archivo demasiado grande",
 		"file_too_large_desc": "\"{name}\" excede el límite de {maxMB} MB por archivo.",
-		"no_supported_files_in_folder": "No se encontraron tipos de archivo compatibles en la carpeta seleccionada."
+		"no_supported_files_in_folder": "No se encontraron tipos de archivo compatibles en la carpeta seleccionada.",
+		"remaining_capacity": "{files} archivos, {sizeMB}MB restante",
+		"file_limit_reached": "Límite de archivos alcanzado",
+		"file_limit_reached_desc": "Máximo de {max} archivos permitidos",
+		"max_files_exceeded": "Demasiados archivos",
+		"max_files_exceeded_desc": "Puedes subir un máximo de {max} archivos a la vez",
+		"max_size_exceeded": "Tamaño total excedido",
+		"max_size_exceeded_desc": "El tamaño total de subida no puede exceder {max}MB"
 	},
 	"add_webpage": {
 		"title": "Agregar páginas web para rastreo",
diff --git a/surfsense_web/messages/hi.json b/surfsense_web/messages/hi.json
index 957533206..c27291e3b 100644
--- a/surfsense_web/messages/hi.json
+++ b/surfsense_web/messages/hi.json
@@ -376,11 +376,11 @@
 	"upload_documents": {
 		"title": "दस्तावेज़ अपलोड करें",
 		"subtitle": "AI-संचालित बातचीत के माध्यम से अपनी फ़ाइलों को खोजने योग्य और सुलभ बनाने के लिए अपलोड करें।",
-		"file_size_limit": "अधिकतम फ़ाइल आकार: प्रति फ़ाइल {maxMB}MB",
-		"upload_limits": "फ़ाइलें या पूरे फ़ोल्डर अपलोड करें",
+		"file_size_limit": "अधिकतम फ़ाइल आकार: प्रति फ़ाइल 50MB",
+		"upload_limits": "अपलोड सीमा: {maxFiles} फ़ाइलें, कुल {maxSizeMB}MB",
 		"drop_files": "फ़ाइलें या फ़ोल्डर यहां छोड़ें",
 		"drag_drop": "फ़ाइलें या फ़ोल्डर यहां खींचें और छोड़ें",
-		"or_browse": "या फ़ाइलें और फ़ोल्डर ब्राउज़ करने के लिए क्लिक करें",
+		"or_browse": "या ब्राउज़ करने के लिए क्लिक करें",
 		"browse_files": "फ़ाइलें ब्राउज़ करें",
 		"browse_folder": "फ़ोल्डर ब्राउज़ करें",
 		"selected_files": "चयनित फ़ाइलें ({count})",
@@ -397,7 +397,14 @@
 		"file_types_desc": "ये फ़ाइल प्रकार आपकी वर्तमान ETL सेवा कॉन्फ़िगरेशन के आधार पर समर्थित हैं।",
 		"file_too_large": "फ़ाइल बहुत बड़ी है",
 		"file_too_large_desc": "\"{name}\" प्रति फ़ाइल {maxMB}MB की सीमा से अधिक है।",
-		"no_supported_files_in_folder": "चयनित फ़ोल्डर में कोई समर्थित फ़ाइल प्रकार नहीं मिला।"
+		"no_supported_files_in_folder": "चयनित फ़ोल्डर में कोई समर्थित फ़ाइल प्रकार नहीं मिला।",
+		"remaining_capacity": "{files} फ़ाइलें, {sizeMB}MB शेष",
+		"file_limit_reached": "फ़ाइल सीमा पूरी हो गई",
+		"file_limit_reached_desc": "अधिकतम {max} फ़ाइलें अनुमत हैं",
+		"max_files_exceeded": "बहुत सारी फ़ाइलें",
+		"max_files_exceeded_desc": "आप एक बार में अधिकतम {max} फ़ाइलें अपलोड कर सकते हैं",
+		"max_size_exceeded": "कुल आकार सीमा पार",
+		"max_size_exceeded_desc": "कुल अपलोड आकार {max}MB से अधिक नहीं हो सकता"
 	},
 	"add_webpage": {
 		"title": "क्रॉलिंग के लिए वेबपेज जोड़ें",
diff --git a/surfsense_web/messages/pt.json b/surfsense_web/messages/pt.json
index 9aec7af48..eeb417a27 100644
--- a/surfsense_web/messages/pt.json
+++ b/surfsense_web/messages/pt.json
@@ -376,11 +376,11 @@
 	"upload_documents": {
 		"title": "Enviar documentos",
 		"subtitle": "Envie seus arquivos para torná-los pesquisáveis e acessíveis através de conversas com IA.",
-		"file_size_limit": "Tamanho máximo do arquivo: {maxMB} MB por arquivo",
-		"upload_limits": "Envie arquivos ou pastas inteiras",
+		"file_size_limit": "Tamanho máximo do arquivo: 50 MB por arquivo",
+		"upload_limits": "Limite de envio: {maxFiles} arquivos, {maxSizeMB} MB no total",
 		"drop_files": "Solte arquivos ou pastas aqui",
 		"drag_drop": "Arraste e solte arquivos ou pastas aqui",
-		"or_browse": "ou clique para navegar arquivos e pastas",
+		"or_browse": "ou clique para navegar",
 		"browse_files": "Navegar arquivos",
 		"browse_folder": "Navegar pasta",
 		"selected_files": "Arquivos selecionados ({count})",
@@ -397,7 +397,14 @@
 		"file_types_desc": "Estes tipos de arquivo são suportados com base na configuração atual do seu serviço ETL.",
 		"file_too_large": "Arquivo muito grande",
 		"file_too_large_desc": "\"{name}\" excede o limite de {maxMB} MB por arquivo.",
-		"no_supported_files_in_folder": "Nenhum tipo de arquivo suportado encontrado na pasta selecionada."
+		"no_supported_files_in_folder": "Nenhum tipo de arquivo suportado encontrado na pasta selecionada.",
+		"remaining_capacity": "{files} arquivos, {sizeMB}MB restante",
+		"file_limit_reached": "Limite de arquivos atingido",
+		"file_limit_reached_desc": "Máximo de {max} arquivos permitidos",
+		"max_files_exceeded": "Muitos arquivos",
+		"max_files_exceeded_desc": "Você pode enviar no máximo {max} arquivos de uma vez",
+		"max_size_exceeded": "Tamanho total excedido",
+		"max_size_exceeded_desc": "O tamanho total do envio não pode exceder {max}MB"
 	},
 	"add_webpage": {
 		"title": "Adicionar páginas web para rastreamento",
diff --git a/surfsense_web/messages/zh.json b/surfsense_web/messages/zh.json
index 3ceab2443..2ee18a346 100644
--- a/surfsense_web/messages/zh.json
+++ b/surfsense_web/messages/zh.json
@@ -360,11 +360,11 @@
 	"upload_documents": {
 		"title": "上传文档",
 		"subtitle": "上传您的文件，使其可通过 AI 对话进行搜索和访问。",
-		"file_size_limit": "最大文件大小：每个文件 {maxMB}MB",
-		"upload_limits": "上传文件或整个文件夹",
+		"file_size_limit": "最大文件大小：每个文件 50MB",
+		"upload_limits": "上传限制：最多 {maxFiles} 个文件，总大小不超过 {maxSizeMB}MB",
 		"drop_files": "将文件或文件夹拖放到此处",
-		"drag_drop": "将文件或文件夹拖放到此处",
-		"or_browse": "或点击浏览文件和文件夹",
+		"drag_drop": "拖放文件或文件夹到这里",
+		"or_browse": "或点击浏览",
 		"browse_files": "浏览文件",
 		"browse_folder": "浏览文件夹",
 		"selected_files": "已选择的文件 ({count})",
@@ -381,7 +381,14 @@
 		"file_types_desc": "根据您当前的 ETL 服务配置支持这些文件类型。",
 		"file_too_large": "文件过大",
 		"file_too_large_desc": "\"{name}\" 超过了每个文件 {maxMB}MB 的限制。",
-		"no_supported_files_in_folder": "所选文件夹中没有找到支持的文件类型。"
+		"no_supported_files_in_folder": "所选文件夹中没有找到支持的文件类型。",
+		"remaining_capacity": "剩余 {files} 个文件，{sizeMB}MB",
+		"file_limit_reached": "已达文件数量上限",
+		"file_limit_reached_desc": "最多允许 {max} 个文件",
+		"max_files_exceeded": "文件数量过多",
+		"max_files_exceeded_desc": "一次最多上传 {max} 个文件",
+		"max_size_exceeded": "总大小超出限制",
+		"max_size_exceeded_desc": "总上传大小不能超过 {max}MB"
 	},
 	"add_webpage": {
 		"title": "添加网页爬取",

From 134beec3920c9c2cc2c84e3588828b8294d856c9 Mon Sep 17 00:00:00 2001
From: Matt Van Horn <455140+mvanhorn@users.noreply.github.com>
Date: Fri, 3 Apr 2026 00:05:06 -0700
Subject: [PATCH 082/202] fix: clear upload progress interval on unmount

Store the progress setInterval ID in a ref and clear it in a
useEffect cleanup. Previously the interval was stored in a local
variable and only cleared in onSuccess/onError callbacks, leaking
if the component unmounted mid-upload.

Fixes #1090
---
 .../components/sources/DocumentUploadTab.tsx    | 17 +++++++++++++----
 1 file changed, 13 insertions(+), 4 deletions(-)

diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index 723a3ad36..5c8ec83a5 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -4,7 +4,7 @@ import { useAtom } from "jotai";
 import { CheckCircle2, FileType, FolderOpen, Info, Upload, X } from "lucide-react";
 
 import { useTranslations } from "next-intl";
-import { type ChangeEvent, useCallback, useMemo, useRef, useState } from "react";
+import { type ChangeEvent, useCallback, useEffect, useMemo, useRef, useState } from "react";
 import { useDropzone } from "react-dropzone";
 import { toast } from "sonner";
 import { uploadDocumentMutationAtom } from "@/atoms/documents/document-mutation.atoms";
@@ -132,6 +132,15 @@ export function DocumentUploadTab({
 	const { mutate: uploadDocuments, isPending: isUploading } = uploadDocumentMutation;
 	const fileInputRef = useRef<HTMLInputElement>(null);
 	const folderInputRef = useRef<HTMLInputElement>(null);
+	const progressIntervalRef = useRef<ReturnType<typeof setInterval> | null>(null);
+
+	useEffect(() => {
+		return () => {
+			if (progressIntervalRef.current) {
+				clearInterval(progressIntervalRef.current);
+			}
+		};
+	}, []);
 
 	const acceptedFileTypes = useMemo(() => {
 		const etlService = process.env.NEXT_PUBLIC_ETL_SERVICE;
@@ -236,7 +245,7 @@ export function DocumentUploadTab({
 		setUploadProgress(0);
 		trackDocumentUploadStarted(Number(searchSpaceId), files.length, totalFileSize);
 
-		const progressInterval = setInterval(() => {
+		progressIntervalRef.current = setInterval(() => {
 			setUploadProgress((prev) => (prev >= 90 ? prev : prev + Math.random() * 10));
 		}, 200);
 
@@ -249,14 +258,14 @@ export function DocumentUploadTab({
 			},
 			{
 				onSuccess: () => {
-					clearInterval(progressInterval);
+					if (progressIntervalRef.current) clearInterval(progressIntervalRef.current);
 					setUploadProgress(100);
 					trackDocumentUploadSuccess(Number(searchSpaceId), files.length);
 					toast(t("upload_initiated"), { description: t("upload_initiated_desc") });
 					onSuccess?.();
 				},
 				onError: (error: unknown) => {
-					clearInterval(progressInterval);
+					if (progressIntervalRef.current) clearInterval(progressIntervalRef.current);
 					setUploadProgress(0);
 					const message = error instanceof Error ? error.message : "Upload failed";
 					trackDocumentUploadFailure(Number(searchSpaceId), message);

From 8171605fae6737b4e95cc07d05fe5467493265dd Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 13:05:42 +0530
Subject: [PATCH 083/202] refactor: remove metadata viewing functionality from
 FolderNode, FolderTreeView, and DocumentsSidebar components

---
 .../components/documents/FolderNode.tsx       | 10 +-----
 .../components/documents/FolderTreeView.tsx   |  3 --
 .../layout/ui/sidebar/DocumentsSidebar.tsx    | 34 -------------------
 3 files changed, 1 insertion(+), 46 deletions(-)

diff --git a/surfsense_web/components/documents/FolderNode.tsx b/surfsense_web/components/documents/FolderNode.tsx
index 41c1d8f73..909f965f9 100644
--- a/surfsense_web/components/documents/FolderNode.tsx
+++ b/surfsense_web/components/documents/FolderNode.tsx
@@ -80,7 +80,6 @@ interface FolderNodeProps {
 	isWatched?: boolean;
 	onRescan?: (folder: FolderDisplay) => void;
 	onStopWatching?: (folder: FolderDisplay) => void;
-	onViewMetadata?: (folder: FolderDisplay) => void;
 }
 
 function getDropZone(
@@ -122,7 +121,6 @@ export const FolderNode = React.memo(function FolderNode({
 	isWatched,
 	onRescan,
 	onStopWatching,
-	onViewMetadata,
 }: FolderNodeProps) {
 	const [renameValue, setRenameValue] = useState(folder.name);
 	const inputRef = useRef<HTMLInputElement>(null);
@@ -258,13 +256,7 @@ export const FolderNode = React.memo(function FolderNode({
 						isOver && !canDrop && "cursor-not-allowed"
 					)}
 					style={{ paddingLeft: `${depth * 16 + 4}px` }}
-				onClick={(e) => {
-					if ((e.ctrlKey || e.metaKey) && onViewMetadata) {
-						e.preventDefault();
-						e.stopPropagation();
-						onViewMetadata(folder);
-						return;
-					}
+				onClick={() => {
 					onToggleExpand(folder.id);
 				}}
 				onKeyDown={(e) => {
diff --git a/surfsense_web/components/documents/FolderTreeView.tsx b/surfsense_web/components/documents/FolderTreeView.tsx
index 6f64d6258..3aa8ce9d8 100644
--- a/surfsense_web/components/documents/FolderTreeView.tsx
+++ b/surfsense_web/components/documents/FolderTreeView.tsx
@@ -44,7 +44,6 @@ interface FolderTreeViewProps {
 	watchedFolderIds?: Set<number>;
 	onRescanFolder?: (folder: FolderDisplay) => void;
 	onStopWatchingFolder?: (folder: FolderDisplay) => void;
-	onViewFolderMetadata?: (folder: FolderDisplay) => void;
 }
 
 function groupBy<T>(items: T[], keyFn: (item: T) => string | number): Record<string | number, T[]> {
@@ -82,7 +81,6 @@ export function FolderTreeView({
 	watchedFolderIds,
 	onRescanFolder,
 	onStopWatchingFolder,
-	onViewFolderMetadata,
 }: FolderTreeViewProps) {
 	const foldersByParent = useMemo(() => groupBy(folders, (f) => f.parentId ?? "root"), [folders]);
 
@@ -247,7 +245,6 @@ export function FolderTreeView({
 				isWatched={watchedFolderIds?.has(f.id)}
 				onRescan={onRescanFolder}
 				onStopWatching={onStopWatchingFolder}
-				onViewMetadata={onViewFolderMetadata}
 			/>
 			);
 
diff --git a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
index 24f6666c9..c10c5dc82 100644
--- a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
@@ -22,7 +22,6 @@ import type { FolderDisplay } from "@/components/documents/FolderNode";
 import { FolderPickerDialog } from "@/components/documents/FolderPickerDialog";
 import { FolderTreeView } from "@/components/documents/FolderTreeView";
 import { VersionHistoryDialog } from "@/components/documents/version-history";
-import { JsonMetadataViewer } from "@/components/json-metadata-viewer";
 import { EXPORT_FILE_EXTENSIONS } from "@/components/shared/ExportMenuItems";
 import {
 	AlertDialog,
@@ -97,10 +96,6 @@ export function DocumentsSidebar({
 	const [activeTypes, setActiveTypes] = useState<DocumentTypeEnum[]>([]);
 	const [watchedFolderIds, setWatchedFolderIds] = useState<Set<number>>(new Set());
 
-	const [metadataFolder, setMetadataFolder] = useState<FolderDisplay | null>(null);
-	const [metadataJson, setMetadataJson] = useState<Record<string, unknown> | null>(null);
-	const [metadataLoading, setMetadataLoading] = useState(false);
-
 	useEffect(() => {
 		const api = typeof window !== "undefined" ? window.electronAPI : null;
 		if (!api?.getWatchedFolders) return;
@@ -333,20 +328,6 @@ export function DocumentsSidebar({
 		[]
 	);
 
-	const handleViewFolderMetadata = useCallback(async (folder: FolderDisplay) => {
-		setMetadataFolder(folder);
-		setMetadataLoading(true);
-		try {
-			const fullFolder = await foldersApiService.getFolder(folder.id);
-			setMetadataJson((fullFolder.metadata as Record<string, unknown>) ?? {});
-		} catch (err) {
-			console.error("[DocumentsSidebar] Failed to fetch folder metadata:", err);
-			setMetadataJson({ error: "Failed to load folder metadata" });
-		} finally {
-			setMetadataLoading(false);
-		}
-	}, []);
-
 	const handleRenameFolder = useCallback(async (folder: FolderDisplay, newName: string) => {
 		try {
 			await foldersApiService.updateFolder(folder.id, { name: newName });
@@ -836,25 +817,10 @@ export function DocumentsSidebar({
 				watchedFolderIds={watchedFolderIds}
 				onRescanFolder={handleRescanFolder}
 			onStopWatchingFolder={handleStopWatching}
-			onViewFolderMetadata={handleViewFolderMetadata}
 		/>
 			</div>
 		</div>
 
-		<JsonMetadataViewer
-			title={metadataFolder?.name ?? "Folder"}
-			metadata={metadataJson}
-			loading={metadataLoading}
-			open={!!metadataFolder}
-			onOpenChange={(open) => {
-				if (!open) {
-					setMetadataFolder(null);
-					setMetadataJson(null);
-					setMetadataLoading(false);
-				}
-			}}
-		/>
-
 		{versionDocId !== null && (
 			<VersionHistoryDialog
 				open

From 6ace8850bb5ef433372f42c0129bafe92bdca6d6 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 13:10:25 +0530
Subject: [PATCH 084/202] fix: update button alignment in InlineCitation
 component for consistent styling

---
 surfsense_web/components/assistant-ui/inline-citation.tsx | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/inline-citation.tsx b/surfsense_web/components/assistant-ui/inline-citation.tsx
index 15ad11d94..42144f1d6 100644
--- a/surfsense_web/components/assistant-ui/inline-citation.tsx
+++ b/surfsense_web/components/assistant-ui/inline-citation.tsx
@@ -32,8 +32,7 @@ export const InlineCitation: FC<InlineCitationProps> = ({ chunkId, isDocsChunk =
 			<button
 				type="button"
 				onClick={() => setIsOpen(true)}
-				className="ml-0.5 inline-flex h-5 min-w-5 cursor-pointer items-center justify-center rounded-md bg-muted/60 px-1.5 text-[11px] font-medium text-muted-foreground align-super shadow-sm transition-colors hover:bg-muted hover:text-foreground focus-visible:ring-ring focus-visible:ring-2 focus-visible:outline-none"
-				title={`View source chunk #${chunkId}`}
+				className="ml-0.5 inline-flex h-5 min-w-5 cursor-pointer items-center justify-center rounded-md bg-muted/60 px-1.5 text-[11px] font-medium text-muted-foreground align-baseline shadow-sm transition-colors hover:bg-muted hover:text-foreground focus-visible:ring-ring focus-visible:ring-2 focus-visible:outline-none"				title={`View source chunk #${chunkId}`}
 			>
 				{chunkId}
 			</button>

From 746c730b2e03ae23a718d53023bf473fa673d3f7 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 13:14:40 +0530
Subject: [PATCH 085/202] chore: ran linting

---
 .../app/routes/documents_routes.py            |  63 ++---
 surfsense_backend/app/routes/editor_routes.py |   6 +-
 .../routes/search_source_connectors_routes.py |   1 -
 surfsense_backend/app/schemas/folders.py      |   7 +-
 .../app/tasks/celery_tasks/document_tasks.py  |  15 +-
 .../local_folder_indexer.py                   | 215 +++++++++++++-----
 .../app/utils/document_versioning.py          |   6 +-
 .../tests/integration/conftest.py             |   2 -
 .../test_local_folder_pipeline.py             | 198 +++++++++-------
 .../integration/test_document_versioning.py   |  55 ++---
 .../test_local_folder_scan.py                 |   4 +-
 .../app/(home)/login/LocalLoginForm.tsx       |  20 +-
 surfsense_web/app/(home)/register/page.tsx    | 131 +++++------
 .../(manage)/components/DocumentsFilters.tsx  |  22 +-
 .../components/PromptsContent.tsx             |   7 +-
 .../assistant-ui/connector-popup.tsx          |   5 +-
 .../views/connector-edit-view.tsx             |  58 ++---
 .../assistant-ui/document-upload-popup.tsx    |   5 +-
 .../assistant-ui/inline-citation.tsx          |   3 +-
 .../components/documents/DocumentNode.tsx     |  17 +-
 .../components/documents/FolderNode.tsx       | 186 +++++++--------
 .../components/documents/FolderTreeView.tsx   |   8 +-
 .../components/documents/version-history.tsx  |  42 ++--
 .../components/editor-panel/editor-panel.tsx  |  39 ++--
 .../layout/ui/sidebar/DocumentsSidebar.tsx    | 185 ++++++++-------
 .../layout/ui/tabs/DocumentTabContent.tsx     |   4 +-
 .../new-chat/source-detail-panel.tsx          |   4 +-
 .../components/settings/llm-role-manager.tsx  |  41 ++--
 .../components/sources/DocumentUploadTab.tsx  |  73 +++---
 .../lib/apis/connectors-api.service.ts        |   1 -
 .../lib/apis/documents-api.service.ts         |  38 +++-
 31 files changed, 801 insertions(+), 660 deletions(-)

diff --git a/surfsense_backend/app/routes/documents_routes.py b/surfsense_backend/app/routes/documents_routes.py
index c86cdab3f..5008b1a10 100644
--- a/surfsense_backend/app/routes/documents_routes.py
+++ b/surfsense_backend/app/routes/documents_routes.py
@@ -977,15 +977,19 @@ async def get_watched_folders(
     )
 
     folders = (
-        await session.execute(
-            select(Folder).where(
-                Folder.search_space_id == search_space_id,
-                Folder.parent_id.is_(None),
-                Folder.folder_metadata.isnot(None),
-                Folder.folder_metadata["watched"].astext == "true",
+        (
+            await session.execute(
+                select(Folder).where(
+                    Folder.search_space_id == search_space_id,
+                    Folder.parent_id.is_(None),
+                    Folder.folder_metadata.isnot(None),
+                    Folder.folder_metadata["watched"].astext == "true",
+                )
             )
         )
-    ).scalars().all()
+        .scalars()
+        .all()
+    )
 
     return folders
 
@@ -1265,15 +1269,21 @@ async def list_document_versions(
     if not document:
         raise HTTPException(status_code=404, detail="Document not found")
 
-    await check_permission(session, user, document.search_space_id, Permission.DOCUMENTS_READ.value)
+    await check_permission(
+        session, user, document.search_space_id, Permission.DOCUMENTS_READ.value
+    )
 
     versions = (
-        await session.execute(
-            select(DocumentVersion)
-            .where(DocumentVersion.document_id == document_id)
-            .order_by(DocumentVersion.version_number.desc())
+        (
+            await session.execute(
+                select(DocumentVersion)
+                .where(DocumentVersion.document_id == document_id)
+                .order_by(DocumentVersion.version_number.desc())
+            )
         )
-    ).scalars().all()
+        .scalars()
+        .all()
+    )
 
     return [
         {
@@ -1300,7 +1310,9 @@ async def get_document_version(
     if not document:
         raise HTTPException(status_code=404, detail="Document not found")
 
-    await check_permission(session, user, document.search_space_id, Permission.DOCUMENTS_READ.value)
+    await check_permission(
+        session, user, document.search_space_id, Permission.DOCUMENTS_READ.value
+    )
 
     version = (
         await session.execute(
@@ -1331,14 +1343,14 @@ async def restore_document_version(
 ):
     """Restore a previous version: snapshot current state, then overwrite document content."""
     document = (
-        await session.execute(
-            select(Document).where(Document.id == document_id)
-        )
+        await session.execute(select(Document).where(Document.id == document_id))
     ).scalar_one_or_none()
     if not document:
         raise HTTPException(status_code=404, detail="Document not found")
 
-    await check_permission(session, user, document.search_space_id, Permission.DOCUMENTS_UPDATE.value)
+    await check_permission(
+        session, user, document.search_space_id, Permission.DOCUMENTS_UPDATE.value
+    )
 
     version = (
         await session.execute(
@@ -1363,6 +1375,7 @@ async def restore_document_version(
     await session.commit()
 
     from app.tasks.celery_tasks.document_reindex_tasks import reindex_document_task
+
     reindex_document_task.delay(document_id, str(user.id))
 
     return {
@@ -1430,9 +1443,7 @@ async def folder_index(
     root_folder_id = request.root_folder_id
     if root_folder_id:
         existing = (
-            await session.execute(
-                select(Folder).where(Folder.id == root_folder_id)
-            )
+            await session.execute(select(Folder).where(Folder.id == root_folder_id))
         ).scalar_one_or_none()
         if not existing:
             root_folder_id = None
@@ -1492,7 +1503,9 @@ async def folder_index_files(
         )
 
     if not request.target_file_paths:
-        raise HTTPException(status_code=400, detail="target_file_paths must not be empty")
+        raise HTTPException(
+            status_code=400, detail="target_file_paths must not be empty"
+        )
 
     await check_permission(
         session,
@@ -1507,11 +1520,11 @@ async def folder_index_files(
     for fp in request.target_file_paths:
         try:
             Path(fp).relative_to(request.folder_path)
-        except ValueError:
+        except ValueError as err:
             raise HTTPException(
                 status_code=400,
                 detail=f"target_file_path {fp} must be inside folder_path",
-            )
+            ) from err
 
     from app.tasks.celery_tasks.document_tasks import index_local_folder_task
 
@@ -1530,5 +1543,3 @@ async def folder_index_files(
         "status": "processing",
         "file_count": len(request.target_file_paths),
     }
-
-
diff --git a/surfsense_backend/app/routes/editor_routes.py b/surfsense_backend/app/routes/editor_routes.py
index a0505f62f..829b2cf69 100644
--- a/surfsense_backend/app/routes/editor_routes.py
+++ b/surfsense_backend/app/routes/editor_routes.py
@@ -129,7 +129,11 @@ async def get_editor_content(
 
     if not chunk_contents:
         doc_status = document.status or {}
-        state = doc_status.get("state", "ready") if isinstance(doc_status, dict) else "ready"
+        state = (
+            doc_status.get("state", "ready")
+            if isinstance(doc_status, dict)
+            else "ready"
+        )
         if state in ("pending", "processing"):
             raise HTTPException(
                 status_code=409,
diff --git a/surfsense_backend/app/routes/search_source_connectors_routes.py b/surfsense_backend/app/routes/search_source_connectors_routes.py
index f49ba2d5d..d208ff910 100644
--- a/surfsense_backend/app/routes/search_source_connectors_routes.py
+++ b/surfsense_backend/app/routes/search_source_connectors_routes.py
@@ -20,7 +20,6 @@ Non-OAuth connectors (BookStack, GitHub, etc.) are limited to one per search spa
 
 import asyncio
 import logging
-import os
 from contextlib import suppress
 from datetime import UTC, datetime, timedelta
 from typing import Any
diff --git a/surfsense_backend/app/schemas/folders.py b/surfsense_backend/app/schemas/folders.py
index e8bdf3821..a7e065144 100644
--- a/surfsense_backend/app/schemas/folders.py
+++ b/surfsense_backend/app/schemas/folders.py
@@ -1,9 +1,8 @@
 """Pydantic schemas for folder CRUD, move, and reorder operations."""
 
 from datetime import datetime
-from uuid import UUID
-
 from typing import Any
+from uuid import UUID
 
 from pydantic import BaseModel, ConfigDict, Field
 
@@ -36,7 +35,9 @@ class FolderRead(BaseModel):
     created_by_id: UUID | None
     created_at: datetime
     updated_at: datetime
-    metadata: dict[str, Any] | None = Field(default=None, validation_alias="folder_metadata")
+    metadata: dict[str, Any] | None = Field(
+        default=None, validation_alias="folder_metadata"
+    )
 
     model_config = ConfigDict(from_attributes=True)
 
diff --git a/surfsense_backend/app/tasks/celery_tasks/document_tasks.py b/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
index 506f8118c..4e9249d34 100644
--- a/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
+++ b/surfsense_backend/app/tasks/celery_tasks/document_tasks.py
@@ -1,6 +1,7 @@
 """Celery tasks for document processing."""
 
 import asyncio
+import contextlib
 import logging
 import os
 from uuid import UUID
@@ -1337,9 +1338,7 @@ async def _index_local_folder_async(
             )
             notification_id = notification.id
             _start_heartbeat(notification_id)
-            heartbeat_task = asyncio.create_task(
-                _run_heartbeat_loop(notification_id)
-            )
+            heartbeat_task = asyncio.create_task(_run_heartbeat_loop(notification_id))
         except Exception:
             logger.warning(
                 "Failed to create notification for local folder indexing",
@@ -1349,18 +1348,16 @@ async def _index_local_folder_async(
         async def _heartbeat_progress(completed_count: int) -> None:
             """Refresh heartbeat and optionally update notification progress."""
             if notification:
-                try:
+                with contextlib.suppress(Exception):
                     await NotificationService.document_processing.notify_processing_progress(
                         session=session,
                         notification=notification,
                         stage="indexing",
                         stage_message=f"Syncing files ({completed_count}/{file_count or '?'})",
                     )
-                except Exception:
-                    pass
 
         try:
-            indexed, skipped_or_failed, _rfid, err = await index_local_folder(
+            _indexed, _skipped_or_failed, _rfid, err = await index_local_folder(
                 session=session,
                 search_space_id=search_space_id,
                 user_id=user_id,
@@ -1371,7 +1368,9 @@ async def _index_local_folder_async(
                 root_folder_id=root_folder_id,
                 enable_summary=enable_summary,
                 target_file_paths=target_file_paths,
-                on_heartbeat_callback=_heartbeat_progress if (is_batch or is_full_scan) else None,
+                on_heartbeat_callback=_heartbeat_progress
+                if (is_batch or is_full_scan)
+                else None,
             )
 
             if notification:
diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
index 4ac8cc594..539cfdd32 100644
--- a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -43,30 +43,110 @@ from .base import (
     logger,
 )
 
-PLAINTEXT_EXTENSIONS = frozenset({
-    ".md", ".markdown", ".txt", ".text", ".csv", ".tsv",
-    ".json", ".jsonl", ".yaml", ".yml", ".toml", ".ini", ".cfg", ".conf",
-    ".xml", ".html", ".htm", ".css", ".scss", ".less", ".sass",
-    ".py", ".pyw", ".pyi", ".pyx",
-    ".js", ".jsx", ".ts", ".tsx", ".mjs", ".cjs",
-    ".java", ".kt", ".kts", ".scala", ".groovy",
-    ".c", ".h", ".cpp", ".cxx", ".cc", ".hpp", ".hxx",
-    ".cs", ".fs", ".fsx",
-    ".go", ".rs", ".rb", ".php", ".pl", ".pm", ".lua",
-    ".swift", ".m", ".mm",
-    ".r", ".R", ".jl",
-    ".sh", ".bash", ".zsh", ".fish", ".bat", ".cmd", ".ps1",
-    ".sql", ".graphql", ".gql",
-    ".env", ".gitignore", ".dockerignore", ".editorconfig",
-    ".makefile", ".cmake",
-    ".log", ".rst", ".tex", ".bib", ".org", ".adoc", ".asciidoc",
-    ".vue", ".svelte", ".astro",
-    ".tf", ".hcl", ".proto",
-})
+PLAINTEXT_EXTENSIONS = frozenset(
+    {
+        ".md",
+        ".markdown",
+        ".txt",
+        ".text",
+        ".csv",
+        ".tsv",
+        ".json",
+        ".jsonl",
+        ".yaml",
+        ".yml",
+        ".toml",
+        ".ini",
+        ".cfg",
+        ".conf",
+        ".xml",
+        ".html",
+        ".htm",
+        ".css",
+        ".scss",
+        ".less",
+        ".sass",
+        ".py",
+        ".pyw",
+        ".pyi",
+        ".pyx",
+        ".js",
+        ".jsx",
+        ".ts",
+        ".tsx",
+        ".mjs",
+        ".cjs",
+        ".java",
+        ".kt",
+        ".kts",
+        ".scala",
+        ".groovy",
+        ".c",
+        ".h",
+        ".cpp",
+        ".cxx",
+        ".cc",
+        ".hpp",
+        ".hxx",
+        ".cs",
+        ".fs",
+        ".fsx",
+        ".go",
+        ".rs",
+        ".rb",
+        ".php",
+        ".pl",
+        ".pm",
+        ".lua",
+        ".swift",
+        ".m",
+        ".mm",
+        ".r",
+        ".R",
+        ".jl",
+        ".sh",
+        ".bash",
+        ".zsh",
+        ".fish",
+        ".bat",
+        ".cmd",
+        ".ps1",
+        ".sql",
+        ".graphql",
+        ".gql",
+        ".env",
+        ".gitignore",
+        ".dockerignore",
+        ".editorconfig",
+        ".makefile",
+        ".cmake",
+        ".log",
+        ".rst",
+        ".tex",
+        ".bib",
+        ".org",
+        ".adoc",
+        ".asciidoc",
+        ".vue",
+        ".svelte",
+        ".astro",
+        ".tf",
+        ".hcl",
+        ".proto",
+    }
+)
 
-AUDIO_EXTENSIONS = frozenset({
-    ".mp3", ".mp4", ".mpeg", ".mpga", ".m4a", ".wav", ".webm",
-})
+AUDIO_EXTENSIONS = frozenset(
+    {
+        ".mp3",
+        ".mp4",
+        ".mpeg",
+        ".mpga",
+        ".m4a",
+        ".wav",
+        ".webm",
+    }
+)
 
 
 def _is_plaintext_file(filename: str) -> bool:
@@ -81,6 +161,7 @@ def _needs_etl(filename: str) -> bool:
     """File is not plaintext and not audio — requires ETL service to parse."""
     return not _is_plaintext_file(filename) and not _is_audio_file(filename)
 
+
 HeartbeatCallbackType = Callable[[int], Awaitable[None]]
 
 DEFAULT_EXCLUDE_PATTERNS = [
@@ -121,9 +202,7 @@ def scan_folder(
     for dirpath, dirnames, filenames in os.walk(root):
         rel_dir = Path(dirpath).relative_to(root)
 
-        dirnames[:] = [
-            d for d in dirnames if d not in exclude_patterns
-        ]
+        dirnames[:] = [d for d in dirnames if d not in exclude_patterns]
 
         if any(part in exclude_patterns for part in rel_dir.parts):
             continue
@@ -134,9 +213,11 @@ def scan_folder(
 
             full = Path(dirpath) / fname
 
-            if file_extensions is not None:
-                if full.suffix.lower() not in file_extensions:
-                    continue
+            if (
+                file_extensions is not None
+                and full.suffix.lower() not in file_extensions
+            ):
+                continue
 
             try:
                 stat = full.stat()
@@ -209,11 +290,14 @@ def _content_hash(content: str, search_space_id: int) -> str:
     pipeline so that dedup checks are consistent.
     """
     import hashlib
-    return hashlib.sha256(f"{search_space_id}:{content}".encode("utf-8")).hexdigest()
+
+    return hashlib.sha256(f"{search_space_id}:{content}".encode()).hexdigest()
 
 
 async def _compute_file_content_hash(
-    file_path: str, filename: str, search_space_id: int,
+    file_path: str,
+    filename: str,
+    search_space_id: int,
 ) -> tuple[str, str]:
     """Read a file (via ETL if needed) and compute its content hash.
 
@@ -257,9 +341,7 @@ async def _mirror_folder_structure(
 
     if root_folder_id:
         existing = (
-            await session.execute(
-                select(Folder).where(Folder.id == root_folder_id)
-            )
+            await session.execute(select(Folder).where(Folder.id == root_folder_id))
         ).scalar_one_or_none()
         if existing:
             mapping[""] = existing.id
@@ -412,13 +494,17 @@ async def _cleanup_empty_folders(
     id_to_rel: dict[int, str] = {fid: rel for rel, fid in folder_mapping.items() if rel}
 
     all_folders = (
-        await session.execute(
-            select(Folder).where(
-                Folder.search_space_id == search_space_id,
-                Folder.id != root_folder_id,
+        (
+            await session.execute(
+                select(Folder).where(
+                    Folder.search_space_id == search_space_id,
+                    Folder.id != root_folder_id,
+                )
             )
         )
-    ).scalars().all()
+        .scalars()
+        .all()
+    )
 
     candidates: list[Folder] = []
     for folder in all_folders:
@@ -520,7 +606,9 @@ async def index_local_folder(
         metadata={
             "folder_path": folder_path,
             "user_id": str(user_id),
-            "target_file_paths_count": len(target_file_paths) if target_file_paths else None,
+            "target_file_paths_count": len(target_file_paths)
+            if target_file_paths
+            else None,
         },
     )
 
@@ -532,7 +620,12 @@ async def index_local_folder(
                 "Folder not found",
                 {},
             )
-            return 0, 0, root_folder_id, f"Folder path missing or does not exist: {folder_path}"
+            return (
+                0,
+                0,
+                root_folder_id,
+                f"Folder path missing or does not exist: {folder_path}",
+            )
 
         if exclude_patterns is None:
             exclude_patterns = DEFAULT_EXCLUDE_PATTERNS
@@ -639,7 +732,9 @@ async def index_local_folder(
                 )
 
                 if existing_document:
-                    stored_mtime = (existing_document.document_metadata or {}).get("mtime")
+                    stored_mtime = (existing_document.document_metadata or {}).get(
+                        "mtime"
+                    )
                     current_mtime = file_info["modified_at"].timestamp()
 
                     if stored_mtime and abs(current_mtime - stored_mtime) < 1.0:
@@ -709,23 +804,31 @@ async def index_local_folder(
         # ================================================================
         all_root_folder_ids = set(folder_mapping.values())
         all_db_folders = (
-            await session.execute(
-                select(Folder.id).where(
-                    Folder.search_space_id == search_space_id,
+            (
+                await session.execute(
+                    select(Folder.id).where(
+                        Folder.search_space_id == search_space_id,
+                    )
                 )
             )
-        ).scalars().all()
+            .scalars()
+            .all()
+        )
         all_root_folder_ids.update(all_db_folders)
 
         all_folder_docs = (
-            await session.execute(
-                select(Document).where(
-                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
-                    Document.search_space_id == search_space_id,
-                    Document.folder_id.in_(list(all_root_folder_ids)),
+            (
+                await session.execute(
+                    select(Document).where(
+                        Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                        Document.search_space_id == search_space_id,
+                        Document.folder_id.in_(list(all_root_folder_ids)),
+                    )
                 )
             )
-        ).scalars().all()
+            .scalars()
+            .all()
+        )
 
         for doc in all_folder_docs:
             if doc.unique_identifier_hash not in seen_unique_hashes:
@@ -742,9 +845,7 @@ async def index_local_folder(
             )
 
             pipeline = IndexingPipelineService(session)
-            doc_map = {
-                compute_unique_identifier_hash(cd): cd for cd in connector_docs
-            }
+            doc_map = {compute_unique_identifier_hash(cd): cd for cd in connector_docs}
             documents = await pipeline.prepare_for_indexing(connector_docs)
 
             # Assign folder_id immediately so docs appear in the correct
@@ -1033,7 +1134,9 @@ async def _index_single_file(
         db_doc.document_metadata = doc_meta
         await session.commit()
 
-        indexed = 1 if DocumentStatus.is_state(db_doc.status, DocumentStatus.READY) else 0
+        indexed = (
+            1 if DocumentStatus.is_state(db_doc.status, DocumentStatus.READY) else 0
+        )
         failed_msg = None if indexed else "Indexing failed"
 
         if indexed:
diff --git a/surfsense_backend/app/utils/document_versioning.py b/surfsense_backend/app/utils/document_versioning.py
index 889bc4a3a..e6ad1fb06 100644
--- a/surfsense_backend/app/utils/document_versioning.py
+++ b/surfsense_backend/app/utils/document_versioning.py
@@ -83,9 +83,9 @@ async def create_version_snapshot(
     # Cleanup: cap at MAX_VERSIONS_PER_DOCUMENT
     count = (
         await session.execute(
-            select(func.count()).select_from(DocumentVersion).where(
-                DocumentVersion.document_id == document.id
-            )
+            select(func.count())
+            .select_from(DocumentVersion)
+            .where(DocumentVersion.document_id == document.id)
         )
     ).scalar_one()
 
diff --git a/surfsense_backend/tests/integration/conftest.py b/surfsense_backend/tests/integration/conftest.py
index 9c91011ae..d9d7cacae 100644
--- a/surfsense_backend/tests/integration/conftest.py
+++ b/surfsense_backend/tests/integration/conftest.py
@@ -166,5 +166,3 @@ def make_connector_document(db_connector, db_user):
         return ConnectorDocument(**defaults)
 
     return _make
-
-
diff --git a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
index 67254ec93..4062c3a3b 100644
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
@@ -21,7 +21,9 @@ from app.db import (
 pytestmark = pytest.mark.integration
 
 UNIFIED_FIXTURES = (
-    "patched_summarize", "patched_embed_texts", "patched_chunk_text",
+    "patched_summarize",
+    "patched_embed_texts",
+    "patched_chunk_text",
 )
 
 
@@ -37,6 +39,7 @@ class _FakeSessionMaker:
         @asynccontextmanager
         async def _ctx():
             yield self._session
+
         return _ctx()
 
 
@@ -59,7 +62,6 @@ def patched_batch_sessions(monkeypatch, db_session):
 
 
 class TestFullIndexer:
-
     @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_i1_new_file_indexed(
         self,
@@ -73,7 +75,7 @@ class TestFullIndexer:
 
         (tmp_path / "note.md").write_text("# Hello World\n\nContent here.")
 
-        count, skipped, root_folder_id, err = await index_local_folder(
+        count, _skipped, _root_folder_id, err = await index_local_folder(
             session=db_session,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
@@ -85,13 +87,17 @@ class TestFullIndexer:
         assert count == 1
 
         docs = (
-            await db_session.execute(
-                select(Document).where(
-                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
-                    Document.search_space_id == db_search_space.id,
+            (
+                await db_session.execute(
+                    select(Document).where(
+                        Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                        Document.search_space_id == db_search_space.id,
+                    )
                 )
             )
-        ).scalars().all()
+            .scalars()
+            .all()
+        )
         assert len(docs) == 1
         assert docs[0].document_type == DocumentType.LOCAL_FOLDER_FILE
         assert DocumentStatus.is_state(docs[0].status, DocumentStatus.READY)
@@ -130,7 +136,9 @@ class TestFullIndexer:
 
         total = (
             await db_session.execute(
-                select(func.count()).select_from(Document).where(
+                select(func.count())
+                .select_from(Document)
+                .where(
                     Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
                     Document.search_space_id == db_search_space.id,
                 )
@@ -174,13 +182,19 @@ class TestFullIndexer:
         assert count == 1
 
         versions = (
-            await db_session.execute(
-                select(DocumentVersion).join(Document).where(
-                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
-                    Document.search_space_id == db_search_space.id,
+            (
+                await db_session.execute(
+                    select(DocumentVersion)
+                    .join(Document)
+                    .where(
+                        Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                        Document.search_space_id == db_search_space.id,
+                    )
                 )
             )
-        ).scalars().all()
+            .scalars()
+            .all()
+        )
         assert len(versions) >= 1
 
     @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
@@ -207,7 +221,9 @@ class TestFullIndexer:
 
         docs_before = (
             await db_session.execute(
-                select(func.count()).select_from(Document).where(
+                select(func.count())
+                .select_from(Document)
+                .where(
                     Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
                     Document.search_space_id == db_search_space.id,
                 )
@@ -228,7 +244,9 @@ class TestFullIndexer:
 
         docs_after = (
             await db_session.execute(
-                select(func.count()).select_from(Document).where(
+                select(func.count())
+                .select_from(Document)
+                .where(
                     Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
                     Document.search_space_id == db_search_space.id,
                 )
@@ -262,13 +280,17 @@ class TestFullIndexer:
         assert count == 1
 
         docs = (
-            await db_session.execute(
-                select(Document).where(
-                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
-                    Document.search_space_id == db_search_space.id,
+            (
+                await db_session.execute(
+                    select(Document).where(
+                        Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                        Document.search_space_id == db_search_space.id,
+                    )
                 )
             )
-        ).scalars().all()
+            .scalars()
+            .all()
+        )
         assert len(docs) == 1
         assert docs[0].title == "b.md"
 
@@ -279,7 +301,6 @@ class TestFullIndexer:
 
 
 class TestFolderMirroring:
-
     @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_f1_root_folder_created(
         self,
@@ -335,10 +356,14 @@ class TestFolderMirroring:
         )
 
         folders = (
-            await db_session.execute(
-                select(Folder).where(Folder.search_space_id == db_search_space.id)
+            (
+                await db_session.execute(
+                    select(Folder).where(Folder.search_space_id == db_search_space.id)
+                )
             )
-        ).scalars().all()
+            .scalars()
+            .all()
+        )
 
         folder_names = {f.name for f in folders}
         assert "notes" in folder_names
@@ -376,10 +401,14 @@ class TestFolderMirroring:
         )
 
         folders_before = (
-            await db_session.execute(
-                select(Folder).where(Folder.search_space_id == db_search_space.id)
+            (
+                await db_session.execute(
+                    select(Folder).where(Folder.search_space_id == db_search_space.id)
+                )
             )
-        ).scalars().all()
+            .scalars()
+            .all()
+        )
         ids_before = {f.id for f in folders_before}
 
         await index_local_folder(
@@ -392,10 +421,14 @@ class TestFolderMirroring:
         )
 
         folders_after = (
-            await db_session.execute(
-                select(Folder).where(Folder.search_space_id == db_search_space.id)
+            (
+                await db_session.execute(
+                    select(Folder).where(Folder.search_space_id == db_search_space.id)
+                )
             )
-        ).scalars().all()
+            .scalars()
+            .all()
+        )
         ids_after = {f.id for f in folders_after}
 
         assert ids_before == ids_after
@@ -425,21 +458,23 @@ class TestFolderMirroring:
         )
 
         docs = (
-            await db_session.execute(
-                select(Document).where(
-                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
-                    Document.search_space_id == db_search_space.id,
+            (
+                await db_session.execute(
+                    select(Document).where(
+                        Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                        Document.search_space_id == db_search_space.id,
+                    )
                 )
             )
-        ).scalars().all()
+            .scalars()
+            .all()
+        )
 
         today_doc = next(d for d in docs if d.title == "today.md")
         root_doc = next(d for d in docs if d.title == "root.md")
 
         daily_folder = (
-            await db_session.execute(
-                select(Folder).where(Folder.name == "daily")
-            )
+            await db_session.execute(select(Folder).where(Folder.name == "daily"))
         ).scalar_one()
 
         assert today_doc.folder_id == daily_folder.id
@@ -455,9 +490,10 @@ class TestFolderMirroring:
         tmp_path: Path,
     ):
         """F5: Deleted dir's empty Folder row is cleaned up on re-sync."""
-        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
         import shutil
 
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
         daily = tmp_path / "notes" / "daily"
         daily.mkdir(parents=True)
         weekly = tmp_path / "notes" / "weekly"
@@ -474,9 +510,7 @@ class TestFolderMirroring:
         )
 
         weekly_folder = (
-            await db_session.execute(
-                select(Folder).where(Folder.name == "weekly")
-            )
+            await db_session.execute(select(Folder).where(Folder.name == "weekly"))
         ).scalar_one_or_none()
         assert weekly_folder is not None
 
@@ -492,16 +526,12 @@ class TestFolderMirroring:
         )
 
         weekly_after = (
-            await db_session.execute(
-                select(Folder).where(Folder.name == "weekly")
-            )
+            await db_session.execute(select(Folder).where(Folder.name == "weekly"))
         ).scalar_one_or_none()
         assert weekly_after is None
 
         daily_after = (
-            await db_session.execute(
-                select(Folder).where(Folder.name == "daily")
-            )
+            await db_session.execute(select(Folder).where(Folder.name == "daily"))
         ).scalar_one_or_none()
         assert daily_after is not None
 
@@ -551,18 +581,14 @@ class TestFolderMirroring:
         ).scalar_one()
 
         daily_folder = (
-            await db_session.execute(
-                select(Folder).where(Folder.name == "daily")
-            )
+            await db_session.execute(select(Folder).where(Folder.name == "daily"))
         ).scalar_one()
 
         assert doc.folder_id == daily_folder.id
         assert daily_folder.parent_id is not None
 
         notes_folder = (
-            await db_session.execute(
-                select(Folder).where(Folder.name == "notes")
-            )
+            await db_session.execute(select(Folder).where(Folder.name == "notes"))
         ).scalar_one()
         assert daily_folder.parent_id == notes_folder.id
         assert notes_folder.parent_id == root_folder_id
@@ -592,9 +618,7 @@ class TestFolderMirroring:
         )
 
         eph_folder = (
-            await db_session.execute(
-                select(Folder).where(Folder.name == "ephemeral")
-            )
+            await db_session.execute(select(Folder).where(Folder.name == "ephemeral"))
         ).scalar_one_or_none()
         assert eph_folder is not None
 
@@ -612,16 +636,12 @@ class TestFolderMirroring:
         )
 
         eph_after = (
-            await db_session.execute(
-                select(Folder).where(Folder.name == "ephemeral")
-            )
+            await db_session.execute(select(Folder).where(Folder.name == "ephemeral"))
         ).scalar_one_or_none()
         assert eph_after is None
 
         notes_after = (
-            await db_session.execute(
-                select(Folder).where(Folder.name == "notes")
-            )
+            await db_session.execute(select(Folder).where(Folder.name == "notes"))
         ).scalar_one_or_none()
         assert notes_after is None
 
@@ -632,7 +652,6 @@ class TestFolderMirroring:
 
 
 class TestBatchMode:
-
     @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_b1_batch_indexes_multiple_files(
         self,
@@ -649,7 +668,7 @@ class TestBatchMode:
         (tmp_path / "b.md").write_text("File B content")
         (tmp_path / "c.md").write_text("File C content")
 
-        count, failed, root_folder_id, err = await index_local_folder(
+        count, failed, _root_folder_id, err = await index_local_folder(
             session=db_session,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
@@ -667,13 +686,17 @@ class TestBatchMode:
         assert err is None
 
         docs = (
-            await db_session.execute(
-                select(Document).where(
-                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
-                    Document.search_space_id == db_search_space.id,
+            (
+                await db_session.execute(
+                    select(Document).where(
+                        Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                        Document.search_space_id == db_search_space.id,
+                    )
                 )
             )
-        ).scalars().all()
+            .scalars()
+            .all()
+        )
         assert len(docs) == 3
         assert {d.title for d in docs} == {"a.md", "b.md", "c.md"}
         assert all(
@@ -714,13 +737,17 @@ class TestBatchMode:
         assert err is not None
 
         docs = (
-            await db_session.execute(
-                select(Document).where(
-                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
-                    Document.search_space_id == db_search_space.id,
+            (
+                await db_session.execute(
+                    select(Document).where(
+                        Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                        Document.search_space_id == db_search_space.id,
+                    )
                 )
             )
-        ).scalars().all()
+            .scalars()
+            .all()
+        )
         assert len(docs) == 2
         assert {d.title for d in docs} == {"good1.md", "good2.md"}
 
@@ -731,7 +758,6 @@ class TestBatchMode:
 
 
 class TestPipelineIntegration:
-
     @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
     async def test_p1_local_folder_file_through_pipeline(
         self,
@@ -742,7 +768,9 @@ class TestPipelineIntegration:
     ):
         """P1: LOCAL_FOLDER_FILE ConnectorDocument through prepare+index to READY."""
         from app.indexing_pipeline.connector_document import ConnectorDocument
-        from app.indexing_pipeline.indexing_pipeline_service import IndexingPipelineService
+        from app.indexing_pipeline.indexing_pipeline_service import (
+            IndexingPipelineService,
+        )
 
         doc = ConnectorDocument(
             title="Test Local File",
@@ -763,12 +791,16 @@ class TestPipelineIntegration:
         assert result is not None
 
         docs = (
-            await db_session.execute(
-                select(Document).where(
-                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
-                    Document.search_space_id == db_search_space.id,
+            (
+                await db_session.execute(
+                    select(Document).where(
+                        Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                        Document.search_space_id == db_search_space.id,
+                    )
                 )
             )
-        ).scalars().all()
+            .scalars()
+            .all()
+        )
         assert len(docs) == 1
         assert DocumentStatus.is_state(docs[0].status, DocumentStatus.READY)
diff --git a/surfsense_backend/tests/integration/test_document_versioning.py b/surfsense_backend/tests/integration/test_document_versioning.py
index 87e3c490c..9bd03d219 100644
--- a/surfsense_backend/tests/integration/test_document_versioning.py
+++ b/surfsense_backend/tests/integration/test_document_versioning.py
@@ -34,14 +34,16 @@ async def db_document(
 
 async def _version_count(session: AsyncSession, document_id: int) -> int:
     result = await session.execute(
-        select(func.count()).select_from(DocumentVersion).where(
-            DocumentVersion.document_id == document_id
-        )
+        select(func.count())
+        .select_from(DocumentVersion)
+        .where(DocumentVersion.document_id == document_id)
     )
     return result.scalar_one()
 
 
-async def _get_versions(session: AsyncSession, document_id: int) -> list[DocumentVersion]:
+async def _get_versions(
+    session: AsyncSession, document_id: int
+) -> list[DocumentVersion]:
     result = await session.execute(
         select(DocumentVersion)
         .where(DocumentVersion.document_id == document_id)
@@ -74,18 +76,14 @@ class TestCreateVersionSnapshot:
         from app.utils.document_versioning import create_version_snapshot
 
         t0 = datetime(2025, 1, 1, 12, 0, 0, tzinfo=UTC)
-        monkeypatch.setattr(
-            "app.utils.document_versioning._now", lambda: t0
-        )
+        monkeypatch.setattr("app.utils.document_versioning._now", lambda: t0)
         await create_version_snapshot(db_session, db_document)
 
         # Simulate content change and time passing
         db_document.source_markdown = "# Test\n\nUpdated content."
         db_document.content_hash = "def456"
         t1 = t0 + timedelta(minutes=31)
-        monkeypatch.setattr(
-            "app.utils.document_versioning._now", lambda: t1
-        )
+        monkeypatch.setattr("app.utils.document_versioning._now", lambda: t1)
         await create_version_snapshot(db_session, db_document)
 
         versions = await _get_versions(db_session, db_document.id)
@@ -101,9 +99,7 @@ class TestCreateVersionSnapshot:
         from app.utils.document_versioning import create_version_snapshot
 
         t0 = datetime(2025, 1, 1, 12, 0, 0, tzinfo=UTC)
-        monkeypatch.setattr(
-            "app.utils.document_versioning._now", lambda: t0
-        )
+        monkeypatch.setattr("app.utils.document_versioning._now", lambda: t0)
         await create_version_snapshot(db_session, db_document)
         count_after_first = await _version_count(db_session, db_document.id)
         assert count_after_first == 1
@@ -112,9 +108,7 @@ class TestCreateVersionSnapshot:
         db_document.source_markdown = "# Test\n\nQuick edit."
         db_document.content_hash = "quick123"
         t1 = t0 + timedelta(minutes=10)
-        monkeypatch.setattr(
-            "app.utils.document_versioning._now", lambda: t1
-        )
+        monkeypatch.setattr("app.utils.document_versioning._now", lambda: t1)
         await create_version_snapshot(db_session, db_document)
 
         count_after_second = await _version_count(db_session, db_document.id)
@@ -134,22 +128,15 @@ class TestCreateVersionSnapshot:
 
         # Create 5 versions spread across time: 3 older than 90 days, 2 recent
         for i in range(5):
-            db_document.source_markdown = f"Content v{i+1}"
-            db_document.content_hash = f"hash_{i+1}"
-            if i < 3:
-                t = base + timedelta(days=i)  # old
-            else:
-                t = base + timedelta(days=100 + i)  # recent
-            monkeypatch.setattr(
-                "app.utils.document_versioning._now", lambda _t=t: _t
-            )
+            db_document.source_markdown = f"Content v{i + 1}"
+            db_document.content_hash = f"hash_{i + 1}"
+            t = base + timedelta(days=i) if i < 3 else base + timedelta(days=100 + i)
+            monkeypatch.setattr("app.utils.document_versioning._now", lambda _t=t: _t)
             await create_version_snapshot(db_session, db_document)
 
         # Now trigger cleanup from a "current" time that makes the first 3 versions > 90 days old
         now = base + timedelta(days=200)
-        monkeypatch.setattr(
-            "app.utils.document_versioning._now", lambda: now
-        )
+        monkeypatch.setattr("app.utils.document_versioning._now", lambda: now)
         db_document.source_markdown = "Content v6"
         db_document.content_hash = "hash_6"
         await create_version_snapshot(db_session, db_document)
@@ -160,9 +147,7 @@ class TestCreateVersionSnapshot:
             age = now - v.created_at.replace(tzinfo=UTC)
             assert age <= timedelta(days=90), f"Version {v.version_number} is too old"
 
-    async def test_v5_cap_at_20_versions(
-        self, db_session, db_document, monkeypatch
-    ):
+    async def test_v5_cap_at_20_versions(self, db_session, db_document, monkeypatch):
         """V5: More than 20 versions triggers cap — oldest gets deleted."""
         from app.utils.document_versioning import create_version_snapshot
 
@@ -170,12 +155,10 @@ class TestCreateVersionSnapshot:
 
         # Create 21 versions (all within 90 days, each 31 min apart)
         for i in range(21):
-            db_document.source_markdown = f"Content v{i+1}"
-            db_document.content_hash = f"hash_{i+1}"
+            db_document.source_markdown = f"Content v{i + 1}"
+            db_document.content_hash = f"hash_{i + 1}"
             t = base + timedelta(minutes=31 * i)
-            monkeypatch.setattr(
-                "app.utils.document_versioning._now", lambda _t=t: _t
-            )
+            monkeypatch.setattr("app.utils.document_versioning._now", lambda _t=t: _t)
             await create_version_snapshot(db_session, db_document)
 
         versions = await _get_versions(db_session, db_document.id)
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_local_folder_scan.py b/surfsense_backend/tests/unit/connector_indexers/test_local_folder_scan.py
index 9b4c73f25..c6e7b160c 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_local_folder_scan.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_local_folder_scan.py
@@ -51,9 +51,7 @@ class TestScanFolder:
         git.mkdir()
         (git / "config").write_text("gitconfig")
 
-        results = scan_folder(
-            str(tmp_path), exclude_patterns=["node_modules", ".git"]
-        )
+        results = scan_folder(str(tmp_path), exclude_patterns=["node_modules", ".git"])
         names = {r["relative_path"] for r in results}
 
         assert "good.md" in names
diff --git a/surfsense_web/app/(home)/login/LocalLoginForm.tsx b/surfsense_web/app/(home)/login/LocalLoginForm.tsx
index 1ebbf46b6..e94857334 100644
--- a/surfsense_web/app/(home)/login/LocalLoginForm.tsx
+++ b/surfsense_web/app/(home)/login/LocalLoginForm.tsx
@@ -160,11 +160,11 @@ export function LocalLoginForm() {
 						placeholder="you@example.com"
 						value={username}
 						onChange={(e) => setUsername(e.target.value)}
-					className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
-						error.title
-							? "border-destructive focus:border-destructive focus:ring-destructive/40"
-							: "border-border focus:border-primary focus:ring-primary/40"
-					}`}
+						className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
+							error.title
+								? "border-destructive focus:border-destructive focus:ring-destructive/40"
+								: "border-border focus:border-primary focus:ring-primary/40"
+						}`}
 						disabled={isLoggingIn}
 					/>
 				</div>
@@ -181,11 +181,11 @@ export function LocalLoginForm() {
 							placeholder="Enter your password"
 							value={password}
 							onChange={(e) => setPassword(e.target.value)}
-						className={`mt-1 block w-full rounded-md border pr-10 px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
-							error.title
-								? "border-destructive focus:border-destructive focus:ring-destructive/40"
-								: "border-border focus:border-primary focus:ring-primary/40"
-						}`}
+							className={`mt-1 block w-full rounded-md border pr-10 px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
+								error.title
+									? "border-destructive focus:border-destructive focus:ring-destructive/40"
+									: "border-border focus:border-primary focus:ring-primary/40"
+							}`}
 							disabled={isLoggingIn}
 						/>
 						<button
diff --git a/surfsense_web/app/(home)/register/page.tsx b/surfsense_web/app/(home)/register/page.tsx
index 3161da4a7..a6926dc5c 100644
--- a/surfsense_web/app/(home)/register/page.tsx
+++ b/surfsense_web/app/(home)/register/page.tsx
@@ -229,72 +229,66 @@ export default function RegisterPage() {
 						</AnimatePresence>
 
 						<div>
-						<label
-							htmlFor="email"
-							className="block text-sm font-medium text-foreground"
-						>
-							{t("email")}
-						</label>
-						<input
-							id="email"
-							type="email"
-							required
-							placeholder="you@example.com"
-							value={email}
-							onChange={(e) => setEmail(e.target.value)}
-						className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
-							error.title
-								? "border-destructive focus:border-destructive focus:ring-destructive/40"
-								: "border-border focus:border-primary focus:ring-primary/40"
-						}`}
-						disabled={isRegistering}
-					/>
-					</div>
+							<label htmlFor="email" className="block text-sm font-medium text-foreground">
+								{t("email")}
+							</label>
+							<input
+								id="email"
+								type="email"
+								required
+								placeholder="you@example.com"
+								value={email}
+								onChange={(e) => setEmail(e.target.value)}
+								className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
+									error.title
+										? "border-destructive focus:border-destructive focus:ring-destructive/40"
+										: "border-border focus:border-primary focus:ring-primary/40"
+								}`}
+								disabled={isRegistering}
+							/>
+						</div>
 
-					<div>
-						<label
-							htmlFor="password"
-							className="block text-sm font-medium text-foreground"
-						>
-							{t("password")}
-						</label>
-						<input
-							id="password"
-							type="password"
-							required
-							placeholder="Enter your password"
-							value={password}
-							onChange={(e) => setPassword(e.target.value)}
-							className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
-								error.title
-									? "border-destructive focus:border-destructive focus:ring-destructive/40"
-									: "border-border focus:border-primary focus:ring-primary/40"
-							}`}
-							disabled={isRegistering}
-						/>
-					</div>
+						<div>
+							<label htmlFor="password" className="block text-sm font-medium text-foreground">
+								{t("password")}
+							</label>
+							<input
+								id="password"
+								type="password"
+								required
+								placeholder="Enter your password"
+								value={password}
+								onChange={(e) => setPassword(e.target.value)}
+								className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
+									error.title
+										? "border-destructive focus:border-destructive focus:ring-destructive/40"
+										: "border-border focus:border-primary focus:ring-primary/40"
+								}`}
+								disabled={isRegistering}
+							/>
+						</div>
 
-					<div>
-						<label
-							htmlFor="confirmPassword"
-							className="block text-sm font-medium text-foreground"
-						>
-							{t("confirm_password")}
-						</label>
-						<input
-							id="confirmPassword"
-							type="password"
-							required
-							placeholder="Confirm your password"
-							value={confirmPassword}
-							onChange={(e) => setConfirmPassword(e.target.value)}
-							className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
-								error.title
-									? "border-destructive focus:border-destructive focus:ring-destructive/40"
-									: "border-border focus:border-primary focus:ring-primary/40"
-							}`}
-							disabled={isRegistering}
-						/>
+						<div>
+							<label
+								htmlFor="confirmPassword"
+								className="block text-sm font-medium text-foreground"
+							>
+								{t("confirm_password")}
+							</label>
+							<input
+								id="confirmPassword"
+								type="password"
+								required
+								placeholder="Confirm your password"
+								value={confirmPassword}
+								onChange={(e) => setConfirmPassword(e.target.value)}
+								className={`mt-1 block w-full rounded-md border px-3 py-1.5 md:py-2 shadow-sm focus:outline-none focus:ring-1 bg-background text-foreground transition-all ${
+									error.title
+										? "border-destructive focus:border-destructive focus:ring-destructive/40"
+										: "border-border focus:border-primary focus:ring-primary/40"
+								}`}
+								disabled={isRegistering}
+							/>
 						</div>
 
 						<button
@@ -312,12 +306,9 @@ export default function RegisterPage() {
 					</form>
 
 					<div className="mt-4 text-center text-sm">
-					<p className="text-muted-foreground">
-						{t("already_have_account")}{" "}
-						<Link
-							href="/login"
-							className="font-medium text-primary hover:text-primary/90"
-						>
+						<p className="text-muted-foreground">
+							{t("already_have_account")}{" "}
+							<Link href="/login" className="font-medium text-primary hover:text-primary/90">
 								{t("sign_in")}
 							</Link>
 						</p>
diff --git a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
index 150c119de..b85af13b7 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
@@ -214,17 +214,17 @@ export function DocumentsFilters({
 					</Tooltip>
 				)}
 
-		{/* Upload Button */}
-			<Button
-				data-joyride="upload-button"
-				onClick={openUploadDialog}
-				variant="outline"
-				size="sm"
-				className="h-9 shrink-0 gap-1.5 bg-white text-gray-700 border-white hover:bg-gray-50 dark:bg-white dark:text-gray-800 dark:hover:bg-gray-100"
-			>
-				<Upload size={14} />
-				<span>Upload</span>
-			</Button>
+				{/* Upload Button */}
+				<Button
+					data-joyride="upload-button"
+					onClick={openUploadDialog}
+					variant="outline"
+					size="sm"
+					className="h-9 shrink-0 gap-1.5 bg-white text-gray-700 border-white hover:bg-gray-50 dark:bg-white dark:text-gray-800 dark:hover:bg-gray-100"
+				>
+					<Upload size={14} />
+					<span>Upload</span>
+				</Button>
 			</div>
 		</div>
 	);
diff --git a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/PromptsContent.tsx b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/PromptsContent.tsx
index 39362d244..1e7087afc 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/PromptsContent.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/PromptsContent.tsx
@@ -2,7 +2,6 @@
 
 import { useAtomValue } from "jotai";
 import { AlertTriangle, Globe, Lock, PenLine, Sparkles, Trash2 } from "lucide-react";
-import { ShortcutKbd } from "@/components/ui/shortcut-kbd";
 import { useCallback, useState } from "react";
 import { toast } from "sonner";
 import {
@@ -24,6 +23,7 @@ import {
 import { Button } from "@/components/ui/button";
 import { Input } from "@/components/ui/input";
 import { Label } from "@/components/ui/label";
+import { ShortcutKbd } from "@/components/ui/shortcut-kbd";
 import { Spinner } from "@/components/ui/spinner";
 import { Switch } from "@/components/ui/switch";
 import type { PromptRead } from "@/contracts/types/prompts.types";
@@ -145,9 +145,8 @@ export function PromptsContent() {
 		<div className="space-y-6 min-w-0 overflow-hidden">
 			<div className="flex items-center justify-between">
 				<p className="text-sm text-muted-foreground">
-					Create prompt templates triggered with{" "}
-					<ShortcutKbd keys={["/"]} className="ml-0" /> in the
-					chat composer.
+					Create prompt templates triggered with <ShortcutKbd keys={["/"]} className="ml-0" /> in
+					the chat composer.
 				</p>
 				{!showForm && (
 					<Button
diff --git a/surfsense_web/components/assistant-ui/connector-popup.tsx b/surfsense_web/components/assistant-ui/connector-popup.tsx
index abe623c82..fe7b29f28 100644
--- a/surfsense_web/components/assistant-ui/connector-popup.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup.tsx
@@ -374,7 +374,10 @@ export const ConnectorIndicator = forwardRef<ConnectorIndicatorHandle, Connector
 									<div className="px-4 sm:px-12 py-4 sm:py-8 pb-12 sm:pb-16">
 										{/* LLM Configuration Warning */}
 										{!llmConfigLoading && !hasDocumentSummaryLLM && (
-											<Alert variant="destructive" className="mb-6 bg-muted/50 rounded-xl border-destructive/30">
+											<Alert
+												variant="destructive"
+												className="mb-6 bg-muted/50 rounded-xl border-destructive/30"
+											>
 												<AlertTriangle className="h-4 w-4" />
 												<AlertTitle>LLM Configuration Required</AlertTitle>
 												<AlertDescription className="mt-2">
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
index 05d42adcb..1e71b0a25 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
@@ -294,36 +294,36 @@ export const ConnectorEditView: FC<ConnectorEditViewProps> = ({
 									)}
 
 								{(() => {
-										const isGoogleDrive = connector.connector_type === "GOOGLE_DRIVE_CONNECTOR";
-										const isComposioGoogleDrive =
-											connector.connector_type === "COMPOSIO_GOOGLE_DRIVE_CONNECTOR";
-										const requiresFolderSelection = isGoogleDrive || isComposioGoogleDrive;
-										const selectedFolders =
-											(connector.config?.selected_folders as
-												| Array<{ id: string; name: string }>
-												| undefined) || [];
-										const selectedFiles =
-											(connector.config?.selected_files as
-												| Array<{ id: string; name: string }>
-												| undefined) || [];
-										const hasItemsSelected = selectedFolders.length > 0 || selectedFiles.length > 0;
-										const isDisabled = requiresFolderSelection && !hasItemsSelected;
+									const isGoogleDrive = connector.connector_type === "GOOGLE_DRIVE_CONNECTOR";
+									const isComposioGoogleDrive =
+										connector.connector_type === "COMPOSIO_GOOGLE_DRIVE_CONNECTOR";
+									const requiresFolderSelection = isGoogleDrive || isComposioGoogleDrive;
+									const selectedFolders =
+										(connector.config?.selected_folders as
+											| Array<{ id: string; name: string }>
+											| undefined) || [];
+									const selectedFiles =
+										(connector.config?.selected_files as
+											| Array<{ id: string; name: string }>
+											| undefined) || [];
+									const hasItemsSelected = selectedFolders.length > 0 || selectedFiles.length > 0;
+									const isDisabled = requiresFolderSelection && !hasItemsSelected;
 
-										return (
-											<PeriodicSyncConfig
-												enabled={periodicEnabled}
-												frequencyMinutes={frequencyMinutes}
-												onEnabledChange={onPeriodicEnabledChange}
-												onFrequencyChange={onFrequencyChange}
-												disabled={isDisabled}
-												disabledMessage={
-													isDisabled
-														? "Select at least one folder or file above to enable periodic sync"
-														: undefined
-												}
-											/>
-										);
-									})()}
+									return (
+										<PeriodicSyncConfig
+											enabled={periodicEnabled}
+											frequencyMinutes={frequencyMinutes}
+											onEnabledChange={onPeriodicEnabledChange}
+											onFrequencyChange={onFrequencyChange}
+											disabled={isDisabled}
+											disabledMessage={
+												isDisabled
+													? "Select at least one folder or file above to enable periodic sync"
+													: undefined
+											}
+										/>
+									);
+								})()}
 							</>
 						)}
 
diff --git a/surfsense_web/components/assistant-ui/document-upload-popup.tsx b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
index 78600be47..4f06588c1 100644
--- a/surfsense_web/components/assistant-ui/document-upload-popup.tsx
+++ b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
@@ -143,7 +143,10 @@ const DocumentUploadPopupContent: FC<{
 
 					<div className="px-4 sm:px-6 pb-4 sm:pb-6">
 						{!isLoading && !hasDocumentSummaryLLM ? (
-							<Alert variant="destructive" className="mb-4 bg-muted/50 rounded-xl border-destructive/30">
+							<Alert
+								variant="destructive"
+								className="mb-4 bg-muted/50 rounded-xl border-destructive/30"
+							>
 								<AlertTriangle className="h-4 w-4" />
 								<AlertTitle>LLM Configuration Required</AlertTitle>
 								<AlertDescription className="mt-2">
diff --git a/surfsense_web/components/assistant-ui/inline-citation.tsx b/surfsense_web/components/assistant-ui/inline-citation.tsx
index 42144f1d6..0c99090e6 100644
--- a/surfsense_web/components/assistant-ui/inline-citation.tsx
+++ b/surfsense_web/components/assistant-ui/inline-citation.tsx
@@ -32,7 +32,8 @@ export const InlineCitation: FC<InlineCitationProps> = ({ chunkId, isDocsChunk =
 			<button
 				type="button"
 				onClick={() => setIsOpen(true)}
-				className="ml-0.5 inline-flex h-5 min-w-5 cursor-pointer items-center justify-center rounded-md bg-muted/60 px-1.5 text-[11px] font-medium text-muted-foreground align-baseline shadow-sm transition-colors hover:bg-muted hover:text-foreground focus-visible:ring-ring focus-visible:ring-2 focus-visible:outline-none"				title={`View source chunk #${chunkId}`}
+				className="ml-0.5 inline-flex h-5 min-w-5 cursor-pointer items-center justify-center rounded-md bg-muted/60 px-1.5 text-[11px] font-medium text-muted-foreground align-baseline shadow-sm transition-colors hover:bg-muted hover:text-foreground focus-visible:ring-ring focus-visible:ring-2 focus-visible:outline-none"
+				title={`View source chunk #${chunkId}`}
 			>
 				{chunkId}
 			</button>
diff --git a/surfsense_web/components/documents/DocumentNode.tsx b/surfsense_web/components/documents/DocumentNode.tsx
index 31d1bc7ca..919f904d4 100644
--- a/surfsense_web/components/documents/DocumentNode.tsx
+++ b/surfsense_web/components/documents/DocumentNode.tsx
@@ -39,8 +39,8 @@ import { Spinner } from "@/components/ui/spinner";
 import { Tooltip, TooltipContent, TooltipTrigger } from "@/components/ui/tooltip";
 import type { DocumentTypeEnum } from "@/contracts/types/document.types";
 import { cn } from "@/lib/utils";
-import { isVersionableType } from "./version-history";
 import { DND_TYPES } from "./FolderNode";
+import { isVersionableType } from "./version-history";
 
 const EDITABLE_DOCUMENT_TYPES = new Set(["FILE", "NOTE"]);
 
@@ -199,7 +199,10 @@ export const DocumentNode = React.memo(function DocumentNode({
 
 					<span className="flex-1 min-w-0 truncate">{doc.title}</span>
 
-					{getDocumentTypeIcon(doc.document_type as DocumentTypeEnum, "h-3.5 w-3.5 text-muted-foreground") && (
+					{getDocumentTypeIcon(
+						doc.document_type as DocumentTypeEnum,
+						"h-3.5 w-3.5 text-muted-foreground"
+					) && (
 						<span className="shrink-0">
 							{getDocumentTypeIcon(
 								doc.document_type as DocumentTypeEnum,
@@ -251,10 +254,7 @@ export const DocumentNode = React.memo(function DocumentNode({
 								</DropdownMenuSub>
 							)}
 							{onVersionHistory && isVersionableType(doc.document_type) && (
-								<DropdownMenuItem
-									disabled={isProcessing}
-									onClick={() => onVersionHistory(doc)}
-								>
+								<DropdownMenuItem disabled={isProcessing} onClick={() => onVersionHistory(doc)}>
 									<History className="mr-2 h-4 w-4" />
 									Versions
 								</DropdownMenuItem>
@@ -300,10 +300,7 @@ export const DocumentNode = React.memo(function DocumentNode({
 						</ContextMenuSub>
 					)}
 					{onVersionHistory && isVersionableType(doc.document_type) && (
-						<ContextMenuItem
-							disabled={isProcessing}
-							onClick={() => onVersionHistory(doc)}
-						>
+						<ContextMenuItem disabled={isProcessing} onClick={() => onVersionHistory(doc)}>
 							<History className="mr-2 h-4 w-4" />
 							Versions
 						</ContextMenuItem>
diff --git a/surfsense_web/components/documents/FolderNode.tsx b/surfsense_web/components/documents/FolderNode.tsx
index 909f965f9..88cc76c69 100644
--- a/surfsense_web/components/documents/FolderNode.tsx
+++ b/surfsense_web/components/documents/FolderNode.tsx
@@ -256,15 +256,15 @@ export const FolderNode = React.memo(function FolderNode({
 						isOver && !canDrop && "cursor-not-allowed"
 					)}
 					style={{ paddingLeft: `${depth * 16 + 4}px` }}
-				onClick={() => {
-					onToggleExpand(folder.id);
-				}}
-				onKeyDown={(e) => {
-					if (e.key === "Enter" || e.key === " ") {
-						e.preventDefault();
+					onClick={() => {
 						onToggleExpand(folder.id);
-					}
-				}}
+					}}
+					onKeyDown={(e) => {
+						if (e.key === "Enter" || e.key === " ") {
+							e.preventDefault();
+							onToggleExpand(folder.id);
+						}
+					}}
 					onDoubleClick={(e) => {
 						e.stopPropagation();
 						startRename();
@@ -306,7 +306,11 @@ export const FolderNode = React.memo(function FolderNode({
 					) : (
 						<Checkbox
 							checked={
-								selectionState === "all" ? true : selectionState === "some" ? "indeterminate" : false
+								selectionState === "all"
+									? true
+									: selectionState === "some"
+										? "indeterminate"
+										: false
 							}
 							onCheckedChange={handleCheckChange}
 							onClick={(e) => e.stopPropagation()}
@@ -350,107 +354,107 @@ export const FolderNode = React.memo(function FolderNode({
 									<MoreHorizontal className="h-3.5 w-3.5" />
 								</Button>
 							</DropdownMenuTrigger>
-						<DropdownMenuContent align="end" className="w-40">
-							{isWatched && onRescan && (
+							<DropdownMenuContent align="end" className="w-40">
+								{isWatched && onRescan && (
+									<DropdownMenuItem
+										onClick={(e) => {
+											e.stopPropagation();
+											onRescan(folder);
+										}}
+									>
+										<RefreshCw className="mr-2 h-4 w-4" />
+										Re-scan
+									</DropdownMenuItem>
+								)}
+								{isWatched && onStopWatching && (
+									<DropdownMenuItem
+										onClick={(e) => {
+											e.stopPropagation();
+											onStopWatching(folder);
+										}}
+									>
+										<EyeOff className="mr-2 h-4 w-4" />
+										Stop watching
+									</DropdownMenuItem>
+								)}
 								<DropdownMenuItem
 									onClick={(e) => {
 										e.stopPropagation();
-										onRescan(folder);
+										onCreateSubfolder(folder.id);
 									}}
 								>
-									<RefreshCw className="mr-2 h-4 w-4" />
-									Re-scan
+									<FolderPlus className="mr-2 h-4 w-4" />
+									New subfolder
 								</DropdownMenuItem>
-							)}
-							{isWatched && onStopWatching && (
 								<DropdownMenuItem
 									onClick={(e) => {
 										e.stopPropagation();
-										onStopWatching(folder);
+										startRename();
 									}}
 								>
-									<EyeOff className="mr-2 h-4 w-4" />
-									Stop watching
+									<PenLine className="mr-2 h-4 w-4" />
+									Rename
 								</DropdownMenuItem>
-							)}
-							<DropdownMenuItem
-								onClick={(e) => {
-									e.stopPropagation();
-									onCreateSubfolder(folder.id);
-								}}
-							>
-								<FolderPlus className="mr-2 h-4 w-4" />
-								New subfolder
-							</DropdownMenuItem>
-							<DropdownMenuItem
-								onClick={(e) => {
-									e.stopPropagation();
-									startRename();
-								}}
-							>
-								<PenLine className="mr-2 h-4 w-4" />
-								Rename
-							</DropdownMenuItem>
-							<DropdownMenuItem
-								onClick={(e) => {
-									e.stopPropagation();
-									onMove(folder);
-								}}
-							>
-								<Move className="mr-2 h-4 w-4" />
-								Move to...
-							</DropdownMenuItem>
-							<DropdownMenuItem
-								className="text-destructive focus:text-destructive"
-								onClick={(e) => {
-									e.stopPropagation();
-									onDelete(folder);
-								}}
-							>
-								<Trash2 className="mr-2 h-4 w-4" />
-								Delete
-							</DropdownMenuItem>
-						</DropdownMenuContent>
+								<DropdownMenuItem
+									onClick={(e) => {
+										e.stopPropagation();
+										onMove(folder);
+									}}
+								>
+									<Move className="mr-2 h-4 w-4" />
+									Move to...
+								</DropdownMenuItem>
+								<DropdownMenuItem
+									className="text-destructive focus:text-destructive"
+									onClick={(e) => {
+										e.stopPropagation();
+										onDelete(folder);
+									}}
+								>
+									<Trash2 className="mr-2 h-4 w-4" />
+									Delete
+								</DropdownMenuItem>
+							</DropdownMenuContent>
 						</DropdownMenu>
 					)}
 				</div>
 			</ContextMenuTrigger>
 
-		{!isRenaming && contextMenuOpen && (
-			<ContextMenuContent className="w-40">
-				{isWatched && onRescan && (
-					<ContextMenuItem onClick={() => onRescan(folder)}>
-						<RefreshCw className="mr-2 h-4 w-4" />
-						Re-scan
+			{!isRenaming && contextMenuOpen && (
+				<ContextMenuContent className="w-40">
+					{isWatched && onRescan && (
+						<ContextMenuItem onClick={() => onRescan(folder)}>
+							<RefreshCw className="mr-2 h-4 w-4" />
+							Re-scan
+						</ContextMenuItem>
+					)}
+					{isWatched && onStopWatching && (
+						<ContextMenuItem onClick={() => onStopWatching(folder)}>
+							<EyeOff className="mr-2 h-4 w-4" />
+							Stop watching
+						</ContextMenuItem>
+					)}
+					<ContextMenuItem onClick={() => onCreateSubfolder(folder.id)}>
+						<FolderPlus className="mr-2 h-4 w-4" />
+						New subfolder
 					</ContextMenuItem>
-				)}
-				{isWatched && onStopWatching && (
-					<ContextMenuItem onClick={() => onStopWatching(folder)}>
-						<EyeOff className="mr-2 h-4 w-4" />
-						Stop watching
+					<ContextMenuItem onClick={() => startRename()}>
+						<PenLine className="mr-2 h-4 w-4" />
+						Rename
 					</ContextMenuItem>
-				)}
-				<ContextMenuItem onClick={() => onCreateSubfolder(folder.id)}>
-					<FolderPlus className="mr-2 h-4 w-4" />
-					New subfolder
-				</ContextMenuItem>
-				<ContextMenuItem onClick={() => startRename()}>
-					<PenLine className="mr-2 h-4 w-4" />
-					Rename
-				</ContextMenuItem>
-				<ContextMenuItem onClick={() => onMove(folder)}>
-					<Move className="mr-2 h-4 w-4" />
-					Move to...
-				</ContextMenuItem>
-				<ContextMenuItem
-					className="text-destructive focus:text-destructive"
-					onClick={() => onDelete(folder)}
-				>
-					<Trash2 className="mr-2 h-4 w-4" />
-					Delete
-				</ContextMenuItem>
-			</ContextMenuContent>
-		)}
+					<ContextMenuItem onClick={() => onMove(folder)}>
+						<Move className="mr-2 h-4 w-4" />
+						Move to...
+					</ContextMenuItem>
+					<ContextMenuItem
+						className="text-destructive focus:text-destructive"
+						onClick={() => onDelete(folder)}
+					>
+						<Trash2 className="mr-2 h-4 w-4" />
+						Delete
+					</ContextMenuItem>
+				</ContextMenuContent>
+			)}
 		</ContextMenu>
 	);
 });
diff --git a/surfsense_web/components/documents/FolderTreeView.tsx b/surfsense_web/components/documents/FolderTreeView.tsx
index 3aa8ce9d8..1df007c0b 100644
--- a/surfsense_web/components/documents/FolderTreeView.tsx
+++ b/surfsense_web/components/documents/FolderTreeView.tsx
@@ -242,10 +242,10 @@ export function FolderTreeView({
 					siblingPositions={siblingPositions}
 					contextMenuOpen={openContextMenuId === `folder-${f.id}`}
 					onContextMenuOpenChange={(open) => setOpenContextMenuId(open ? `folder-${f.id}` : null)}
-				isWatched={watchedFolderIds?.has(f.id)}
-				onRescan={onRescanFolder}
-				onStopWatching={onStopWatchingFolder}
-			/>
+					isWatched={watchedFolderIds?.has(f.id)}
+					onRescan={onRescanFolder}
+					onStopWatching={onStopWatchingFolder}
+				/>
 			);
 
 			if (isExpanded) {
diff --git a/surfsense_web/components/documents/version-history.tsx b/surfsense_web/components/documents/version-history.tsx
index 7aba92b47..27343dc6a 100644
--- a/surfsense_web/components/documents/version-history.tsx
+++ b/surfsense_web/components/documents/version-history.tsx
@@ -1,19 +1,14 @@
 "use client";
 
-import { useCallback, useEffect, useState } from "react";
 import { Check, ChevronRight, Clock, Copy, RotateCcw } from "lucide-react";
+import { useCallback, useEffect, useState } from "react";
+import { toast } from "sonner";
 import { Button } from "@/components/ui/button";
-import {
-	Dialog,
-	DialogContent,
-	DialogTitle,
-	DialogTrigger,
-} from "@/components/ui/dialog";
+import { Dialog, DialogContent, DialogTitle, DialogTrigger } from "@/components/ui/dialog";
 import { Separator } from "@/components/ui/separator";
 import { Spinner } from "@/components/ui/spinner";
-import { cn } from "@/lib/utils";
 import { documentsApiService } from "@/lib/apis/documents-api.service";
-import { toast } from "sonner";
+import { cn } from "@/lib/utils";
 
 interface DocumentVersionSummary {
 	version_number: number;
@@ -123,10 +118,9 @@ function VersionHistoryPanel({ documentId }: { documentId: number }) {
 		setSelectedVersion(versionNumber);
 		setContentLoading(true);
 		try {
-			const data = (await documentsApiService.getDocumentVersion(
-				documentId,
-				versionNumber
-			)) as { source_markdown: string };
+			const data = (await documentsApiService.getDocumentVersion(documentId, versionNumber)) as {
+				source_markdown: string;
+			};
 			setVersionContent(data.source_markdown || "");
 		} catch {
 			toast.error("Failed to load version content");
@@ -196,13 +190,11 @@ function VersionHistoryPanel({ documentId }: { documentId: number }) {
 							>
 								<div className="flex-1 min-w-0 space-y-0.5">
 									<p className="text-sm font-medium truncate">
-										{v.created_at ? formatRelativeTime(v.created_at) : `Version ${v.version_number}`}
+										{v.created_at
+											? formatRelativeTime(v.created_at)
+											: `Version ${v.version_number}`}
 									</p>
-									{v.title && (
-										<p className="text-xs text-muted-foreground truncate">
-											{v.title}
-										</p>
-									)}
+									{v.title && <p className="text-xs text-muted-foreground truncate">{v.title}</p>}
 								</div>
 								<ChevronRight className="h-3.5 w-3.5 shrink-0 opacity-50" />
 							</button>
@@ -227,11 +219,7 @@ function VersionHistoryPanel({ documentId }: { documentId: number }) {
 									onClick={handleCopy}
 									disabled={contentLoading || copied}
 								>
-									{copied ? (
-										<Check className="h-3 w-3" />
-									) : (
-										<Copy className="h-3 w-3" />
-									)}
+									{copied ? <Check className="h-3 w-3" /> : <Copy className="h-3 w-3" />}
 									{copied ? "Copied" : "Copy"}
 								</Button>
 								<Button
@@ -241,11 +229,7 @@ function VersionHistoryPanel({ documentId }: { documentId: number }) {
 									disabled={restoring || contentLoading}
 									onClick={() => handleRestore(selectedVersion)}
 								>
-									{restoring ? (
-										<Spinner size="xs" />
-									) : (
-										<RotateCcw className="h-3 w-3" />
-									)}
+									{restoring ? <Spinner size="xs" /> : <RotateCcw className="h-3 w-3" />}
 									Restore
 								</Button>
 							</div>
diff --git a/surfsense_web/components/editor-panel/editor-panel.tsx b/surfsense_web/components/editor-panel/editor-panel.tsx
index 59af0ee8d..05bcd2dc0 100644
--- a/surfsense_web/components/editor-panel/editor-panel.tsx
+++ b/surfsense_web/components/editor-panel/editor-panel.tsx
@@ -54,7 +54,6 @@ function EditorPanelSkeleton() {
 	);
 }
 
-
 export function EditorPanelContent({
 	documentId,
 	searchSpaceId,
@@ -194,24 +193,24 @@ export function EditorPanelContent({
 	return (
 		<>
 			<div className="flex items-center justify-between px-4 py-2 shrink-0 border-b">
-			<div className="flex-1 min-w-0">
-				<h2 className="text-sm font-semibold truncate">{displayTitle}</h2>
-				{isEditableType && editedMarkdown !== null && (
-					<p className="text-[10px] text-muted-foreground">Unsaved changes</p>
-				)}
+				<div className="flex-1 min-w-0">
+					<h2 className="text-sm font-semibold truncate">{displayTitle}</h2>
+					{isEditableType && editedMarkdown !== null && (
+						<p className="text-[10px] text-muted-foreground">Unsaved changes</p>
+					)}
+				</div>
+				<div className="flex items-center gap-1 shrink-0">
+					{editorDoc?.document_type && (
+						<VersionHistoryButton documentId={documentId} documentType={editorDoc.document_type} />
+					)}
+					{onClose && (
+						<Button variant="ghost" size="icon" onClick={onClose} className="size-7 shrink-0">
+							<XIcon className="size-4" />
+							<span className="sr-only">Close editor panel</span>
+						</Button>
+					)}
+				</div>
 			</div>
-			<div className="flex items-center gap-1 shrink-0">
-				{editorDoc?.document_type && (
-					<VersionHistoryButton documentId={documentId} documentType={editorDoc.document_type} />
-				)}
-				{onClose && (
-					<Button variant="ghost" size="icon" onClick={onClose} className="size-7 shrink-0">
-						<XIcon className="size-4" />
-						<span className="sr-only">Close editor panel</span>
-					</Button>
-				)}
-			</div>
-		</div>
 
 			<div className="flex-1 overflow-hidden">
 				{isLoading ? (
@@ -233,7 +232,9 @@ export function EditorPanelContent({
 									? "Document is processing"
 									: "Document unavailable"}
 							</p>
-							<p className="text-sm text-muted-foreground">{error || "An unknown error occurred"}</p>
+							<p className="text-sm text-muted-foreground">
+								{error || "An unknown error occurred"}
+							</p>
 						</div>
 					</div>
 				) : isLargeDocument ? (
diff --git a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
index c10c5dc82..aa409e179 100644
--- a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
@@ -121,9 +121,7 @@ export function DocumentsSidebar({
 					}
 					const recovered = await api!.getWatchedFolders();
 					const ids = new Set(
-						recovered
-							.filter((f) => f.rootFolderId != null)
-							.map((f) => f.rootFolderId as number)
+						recovered.filter((f) => f.rootFolderId != null).map((f) => f.rootFolderId as number)
 					);
 					setWatchedFolderIds(ids);
 					return;
@@ -133,9 +131,7 @@ export function DocumentsSidebar({
 			}
 
 			const ids = new Set(
-				folders
-					.filter((f) => f.rootFolderId != null)
-					.map((f) => f.rootFolderId as number)
+				folders.filter((f) => f.rootFolderId != null).map((f) => f.rootFolderId as number)
 			);
 			setWatchedFolderIds(ids);
 		}
@@ -305,28 +301,25 @@ export function DocumentsSidebar({
 		[searchSpaceId]
 	);
 
-	const handleStopWatching = useCallback(
-		async (folder: FolderDisplay) => {
-			const api = window.electronAPI;
-			if (!api) return;
+	const handleStopWatching = useCallback(async (folder: FolderDisplay) => { // Unwatch `folder`: calls electronAPI.removeWatchedFolder, then foldersApiService.stopWatching.
+		const api = window.electronAPI;
+		if (!api) return; // no-op when window.electronAPI is not available
 
-			const watchedFolders = await api.getWatchedFolders();
-			const matched = watchedFolders.find((wf) => wf.rootFolderId === folder.id);
-			if (!matched) {
-				toast.error("This folder is not being watched");
-				return;
-			}
+		const watchedFolders = await api.getWatchedFolders();
+		const matched = watchedFolders.find((wf) => wf.rootFolderId === folder.id); // match the watched entry by rootFolderId
+		if (!matched) {
+			toast.error("This folder is not being watched");
+			return;
+		}
 
-			await api.removeWatchedFolder(matched.path);
-			try {
-				await foldersApiService.stopWatching(folder.id);
-			} catch (err) {
-				console.error("[DocumentsSidebar] Failed to clear watched metadata:", err);
-			}
-			toast.success(`Stopped watching: ${matched.name}`);
-		},
-		[]
-	);
+		await api.removeWatchedFolder(matched.path); // not wrapped in try/catch: a rejection here propagates to the caller
+		try {
+			await foldersApiService.stopWatching(folder.id);
+		} catch (err) { // best-effort: a failure is only logged and the success toast below still fires
+			console.error("[DocumentsSidebar] Failed to clear watched metadata:", err);
+		}
+		toast.success(`Stopped watching: ${matched.name}`);
+	}, []);
 
 	const handleRenameFolder = useCallback(async (folder: FolderDisplay, newName: string) => {
 		try {
@@ -755,81 +748,83 @@ export function DocumentsSidebar({
 
 			<div className="flex-1 min-h-0 overflow-x-hidden pt-0 flex flex-col">
 				<div className="px-4 pb-2">
-			<DocumentsFilters
-				typeCounts={typeCounts}
-				onSearch={setSearch}
-				searchValue={search}
-				onToggleType={onToggleType}
-				activeTypes={activeTypes}
-				onCreateFolder={() => handleCreateFolder(null)}
-			/>
+					<DocumentsFilters
+						typeCounts={typeCounts}
+						onSearch={setSearch}
+						searchValue={search}
+						onToggleType={onToggleType}
+						activeTypes={activeTypes}
+						onCreateFolder={() => handleCreateFolder(null)}
+					/>
 				</div>
 
-			<div className="relative flex-1 min-h-0 overflow-auto">
-				{deletableSelectedIds.length > 0 && (
-					<div className="absolute inset-x-0 top-0 z-10 flex items-center justify-center px-4 py-1.5 animate-in fade-in duration-150 pointer-events-none">
-						<button
-							type="button"
-							onClick={() => setBulkDeleteConfirmOpen(true)}
-							className="pointer-events-auto flex items-center gap-1.5 px-3 py-1 rounded-md bg-destructive text-destructive-foreground shadow-lg text-xs font-medium hover:bg-destructive/90 transition-colors"
-						>
-							<Trash2 size={12} />
-							Delete {deletableSelectedIds.length}{" "}
-							{deletableSelectedIds.length === 1 ? "item" : "items"}
-						</button>
-					</div>
-				)}
+				<div className="relative flex-1 min-h-0 overflow-auto">
+					{deletableSelectedIds.length > 0 && (
+						<div className="absolute inset-x-0 top-0 z-10 flex items-center justify-center px-4 py-1.5 animate-in fade-in duration-150 pointer-events-none">
+							<button
+								type="button"
+								onClick={() => setBulkDeleteConfirmOpen(true)}
+								className="pointer-events-auto flex items-center gap-1.5 px-3 py-1 rounded-md bg-destructive text-destructive-foreground shadow-lg text-xs font-medium hover:bg-destructive/90 transition-colors"
+							>
+								<Trash2 size={12} />
+								Delete {deletableSelectedIds.length}{" "}
+								{deletableSelectedIds.length === 1 ? "item" : "items"}
+							</button>
+						</div>
+					)}
 
-			<FolderTreeView
-				folders={treeFolders}
-				documents={searchFilteredDocuments}
-				expandedIds={expandedIds}
-				onToggleExpand={toggleFolderExpand}
-				mentionedDocIds={mentionedDocIds}
-				onToggleChatMention={handleToggleChatMention}
-				onToggleFolderSelect={handleToggleFolderSelect}
-				onRenameFolder={handleRenameFolder}
-				onDeleteFolder={handleDeleteFolder}
-				onMoveFolder={handleMoveFolder}
-				onCreateFolder={handleCreateFolder}
-				searchQuery={debouncedSearch.trim() || undefined}
-				onPreviewDocument={(doc) => {
-					openEditorPanel({
-						documentId: doc.id,
-						searchSpaceId,
-						title: doc.title,
-					});
-				}}
-				onEditDocument={(doc) => {
-					openEditorPanel({
-						documentId: doc.id,
-						searchSpaceId,
-						title: doc.title,
-					});
-				}}
-				onDeleteDocument={(doc) => handleDeleteDocument(doc.id)}
-				onMoveDocument={handleMoveDocument}
-				onExportDocument={handleExportDocument}
-				onVersionHistory={(doc) => setVersionDocId(doc.id)}
-				activeTypes={activeTypes}
-				onDropIntoFolder={handleDropIntoFolder}
-				onReorderFolder={handleReorderFolder}
-				watchedFolderIds={watchedFolderIds}
-				onRescanFolder={handleRescanFolder}
-			onStopWatchingFolder={handleStopWatching}
-		/>
+					<FolderTreeView
+						folders={treeFolders}
+						documents={searchFilteredDocuments}
+						expandedIds={expandedIds}
+						onToggleExpand={toggleFolderExpand}
+						mentionedDocIds={mentionedDocIds}
+						onToggleChatMention={handleToggleChatMention}
+						onToggleFolderSelect={handleToggleFolderSelect}
+						onRenameFolder={handleRenameFolder}
+						onDeleteFolder={handleDeleteFolder}
+						onMoveFolder={handleMoveFolder}
+						onCreateFolder={handleCreateFolder}
+						searchQuery={debouncedSearch.trim() || undefined}
+						onPreviewDocument={(doc) => {
+							openEditorPanel({
+								documentId: doc.id,
+								searchSpaceId,
+								title: doc.title,
+							});
+						}}
+						onEditDocument={(doc) => {
+							openEditorPanel({
+								documentId: doc.id,
+								searchSpaceId,
+								title: doc.title,
+							});
+						}}
+						onDeleteDocument={(doc) => handleDeleteDocument(doc.id)}
+						onMoveDocument={handleMoveDocument}
+						onExportDocument={handleExportDocument}
+						onVersionHistory={(doc) => setVersionDocId(doc.id)}
+						activeTypes={activeTypes}
+						onDropIntoFolder={handleDropIntoFolder}
+						onReorderFolder={handleReorderFolder}
+						watchedFolderIds={watchedFolderIds}
+						onRescanFolder={handleRescanFolder}
+						onStopWatchingFolder={handleStopWatching}
+					/>
+				</div>
 			</div>
-		</div>
 
-		{versionDocId !== null && (
-			<VersionHistoryDialog
-				open
-				onOpenChange={(open) => { if (!open) setVersionDocId(null); }}
-				documentId={versionDocId}
-			/>
-		)}
+			{versionDocId !== null && (
+				<VersionHistoryDialog
+					open
+					onOpenChange={(open) => {
+						if (!open) setVersionDocId(null);
+					}}
+					documentId={versionDocId}
+				/>
+			)}
 
-		<FolderPickerDialog
+			<FolderPickerDialog
 				open={folderPickerOpen}
 				onOpenChange={setFolderPickerOpen}
 				folders={treeFolders}
diff --git a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
index 2e7269c57..c781bd731 100644
--- a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
+++ b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
@@ -185,9 +185,7 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 					<p className="font-semibold text-foreground text-lg">
 						{isProcessing ? "Document is processing" : "Document unavailable"}
 					</p>
-					<p className="text-sm text-muted-foreground">
-						{error || "An unknown error occurred"}
-					</p>
+					<p className="text-sm text-muted-foreground">{error || "An unknown error occurred"}</p>
 				</div>
 				{!isProcessing && (
 					<Button
diff --git a/surfsense_web/components/new-chat/source-detail-panel.tsx b/surfsense_web/components/new-chat/source-detail-panel.tsx
index 8593f96db..ed6c7e4ac 100644
--- a/surfsense_web/components/new-chat/source-detail-panel.tsx
+++ b/surfsense_web/components/new-chat/source-detail-panel.tsx
@@ -480,9 +480,7 @@ export function SourceDetailPanel({
 										<FileQuestionMark className="h-10 w-10 text-muted-foreground" />
 									</div>
 									<div>
-										<p className="font-semibold text-foreground text-lg">
-											Document unavailable
-										</p>
+										<p className="font-semibold text-foreground text-lg">Document unavailable</p>
 										<p className="text-sm text-muted-foreground mt-2 max-w-md">
 											{documentByChunkFetchingError.message ||
 												"An unexpected error occurred. Please try again."}
diff --git a/surfsense_web/components/settings/llm-role-manager.tsx b/surfsense_web/components/settings/llm-role-manager.tsx
index d1651b7f0..718503318 100644
--- a/surfsense_web/components/settings/llm-role-manager.tsx
+++ b/surfsense_web/components/settings/llm-role-manager.tsx
@@ -134,24 +134,27 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 		preferences?.image_generation_config_id,
 	]);
 
-	const handleRoleAssignment = useCallback(async (prefKey: string, configId: string) => {
-		const value = configId === "unassigned" ? "" : parseInt(configId);
+	const handleRoleAssignment = useCallback( // Assign `configId` to the role stored under `prefKey`: update local state first, then persist via updatePreferences.
+		async (prefKey: string, configId: string) => {
+			const value = configId === "unassigned" ? "" : parseInt(configId); // "" for "unassigned"; otherwise the parsed integer (no radix is passed)
 
-		setAssignments((prev) => ({ ...prev, [prefKey]: value }));
-		setSavingRole(prefKey);
-		savingRef.current = true;
+			setAssignments((prev) => ({ ...prev, [prefKey]: value })); // local state is updated before the request below resolves
+			setSavingRole(prefKey);
+			savingRef.current = true;
 
-		try {
-			await updatePreferences({
-				search_space_id: searchSpaceId,
-				data: { [prefKey]: value || undefined },
-			});
-			toast.success("Role assignment updated");
-		} finally {
-			setSavingRole(null);
-			savingRef.current = false;
-		}
-	}, [updatePreferences, searchSpaceId]);
+			try {
+				await updatePreferences({
+					search_space_id: searchSpaceId,
+					data: { [prefKey]: value || undefined }, // "" (and any other falsy value, e.g. 0 or NaN) is sent as undefined
+				});
+				toast.success("Role assignment updated"); // reached only when updatePreferences resolves
+			} finally { // no catch: the saving flags are reset, then any rejection propagates to the caller
+				setSavingRole(null);
+				savingRef.current = false;
+			}
+		},
+		[updatePreferences, searchSpaceId]
+	);
 
 	// Combine global and custom LLM configs
 	const allLLMConfigs = [
@@ -199,10 +202,7 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 					Refresh
 				</Button>
 				{isAssignmentComplete && !isLoading && !hasError && (
-					<Badge
-						variant="outline"
-						className="text-xs gap-1.5 text-muted-foreground"
-					>
+					<Badge variant="outline" className="text-xs gap-1.5 text-muted-foreground">
 						<CircleCheck className="h-3 w-3" />
 						All roles assigned
 					</Badge>
@@ -483,7 +483,6 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 					})}
 				</div>
 			)}
-
 		</div>
 	);
 }
diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index 9733bd2e6..f1162f57c 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -128,7 +128,8 @@ const MAX_TOTAL_SIZE_BYTES = MAX_TOTAL_SIZE_MB * 1024 * 1024;
 const MAX_FILE_SIZE_MB = 500;
 const MAX_FILE_SIZE_BYTES = MAX_FILE_SIZE_MB * 1024 * 1024;
 
-const toggleRowClass = "flex items-center justify-between rounded-lg bg-slate-400/5 dark:bg-white/5 p-3";
+const toggleRowClass =
+	"flex items-center justify-between rounded-lg bg-slate-400/5 dark:bg-white/5 p-3";
 
 export function DocumentUploadTab({
 	searchSpaceId,
@@ -326,7 +327,14 @@ export function DocumentUploadTab({
 				await api.addWatchedFolder({
 					path: selectedFolder.path,
 					name: selectedFolder.name,
-					excludePatterns: [".git", "node_modules", "__pycache__", ".DS_Store", ".obsidian", ".trash"],
+					excludePatterns: [
+						".git",
+						"node_modules",
+						"__pycache__",
+						".DS_Store",
+						".obsidian",
+						".trash",
+					],
 					fileExtensions: null,
 					rootFolderId,
 					searchSpaceId: Number(searchSpaceId),
@@ -393,12 +401,20 @@ export function DocumentUploadTab({
 			return (
 				<DropdownMenu>
 					<DropdownMenuTrigger asChild onClick={(e) => e.stopPropagation()}>
-						<Button variant="ghost" size="sm" className={`text-xs gap-1 bg-neutral-700/50 hover:bg-neutral-600/50 ${sizeClass} ${widthClass}`}>
+						<Button
+							variant="ghost"
+							size="sm"
+							className={`text-xs gap-1 bg-neutral-700/50 hover:bg-neutral-600/50 ${sizeClass} ${widthClass}`}
+						>
 							Browse
 							<ChevronDown className="h-3 w-3 opacity-60" />
 						</Button>
 					</DropdownMenuTrigger>
-					<DropdownMenuContent align="center" className="dark:bg-neutral-800" onClick={(e) => e.stopPropagation()}>
+					<DropdownMenuContent
+						align="center"
+						className="dark:bg-neutral-800"
+						onClick={(e) => e.stopPropagation()}
+					>
 						<DropdownMenuItem onClick={handleBrowseFiles}>
 							<FileIcon className="h-4 w-4 mr-2" />
 							Files
@@ -415,7 +431,11 @@ export function DocumentUploadTab({
 		return (
 			<DropdownMenu>
 				<DropdownMenuTrigger asChild onClick={(e) => e.stopPropagation()}>
-					<Button variant="secondary" size="sm" className={`text-xs gap-1 ${sizeClass} ${widthClass}`}>
+					<Button
+						variant="secondary"
+						size="sm"
+						className={`text-xs gap-1 ${sizeClass} ${widthClass}`}
+					>
 						Browse
 						<ChevronDown className="h-3 w-3 opacity-60" />
 					</Button>
@@ -457,21 +477,19 @@ export function DocumentUploadTab({
 			{/* MOBILE DROP ZONE */}
 			<div className="sm:hidden">
 				{hasContent ? (
-					!selectedFolder && !isFileCountLimitReached && (
-						isElectron ? (
-							<div className="w-full">
-								{renderBrowseButton({ compact: true, fullWidth: true })}
-							</div>
-						) : (
-							<button
-								type="button"
-								className="w-full text-xs h-8 flex items-center justify-center gap-1.5 rounded-md border border-dashed border-muted-foreground/30 text-muted-foreground hover:text-foreground hover:border-foreground/50 transition-colors"
-								onClick={() => fileInputRef.current?.click()}
-							>
-								Add more files
-							</button>
-						)
-					)
+					!selectedFolder &&
+					!isFileCountLimitReached &&
+					(isElectron ? (
+						<div className="w-full">{renderBrowseButton({ compact: true, fullWidth: true })}</div>
+					) : (
+						<button
+							type="button"
+							className="w-full text-xs h-8 flex items-center justify-center gap-1.5 rounded-md border border-dashed border-muted-foreground/30 text-muted-foreground hover:text-foreground hover:border-foreground/50 transition-colors"
+							onClick={() => fileInputRef.current?.click()}
+						>
+							Add more files
+						</button>
+					))
 				) : (
 					<div
 						className="flex flex-col items-center gap-4 py-12 px-4 cursor-pointer"
@@ -487,7 +505,9 @@ export function DocumentUploadTab({
 							<p className="text-sm text-muted-foreground inline-flex items-center flex-wrap justify-center">
 								<span>{t("file_size_limit")}</span>
 								<Dot className="h-4 w-4 shrink-0" />
-								<span>{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}</span>
+								<span>
+									{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}
+								</span>
 							</p>
 						</div>
 						<div className="w-full mt-1" onClick={(e) => e.stopPropagation()}>
@@ -538,7 +558,9 @@ export function DocumentUploadTab({
 						<p className="text-xs text-muted-foreground text-center inline-flex items-center flex-wrap justify-center">
 							<span>{t("file_size_limit")}</span>
 							<Dot className="h-4 w-4 shrink-0" />
-							<span>{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}</span>
+							<span>
+								{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}
+							</span>
 						</p>
 						<div className="mt-1">{renderBrowseButton()}</div>
 					</div>
@@ -569,9 +591,7 @@ export function DocumentUploadTab({
 						<div className="flex items-center justify-between p-3">
 							<div className="space-y-0.5">
 								<p className="font-medium text-sm">Watch folder</p>
-								<p className="text-xs text-muted-foreground">
-									Auto-sync when files change
-								</p>
+								<p className="text-xs text-muted-foreground">Auto-sync when files change</p>
 							</div>
 							<Switch
 								id="watch-folder-toggle"
@@ -612,7 +632,8 @@ export function DocumentUploadTab({
 				<div className="rounded-lg border border-border p-3 space-y-2">
 					<div className="flex items-center justify-between">
 						<p className="text-sm font-medium">
-							{t("selected_files", { count: files.length })} &middot; {formatFileSize(totalFileSize)}
+							{t("selected_files", { count: files.length })} &middot;{" "}
+							{formatFileSize(totalFileSize)}
 						</p>
 						<Button
 							variant="ghost"
diff --git a/surfsense_web/lib/apis/connectors-api.service.ts b/surfsense_web/lib/apis/connectors-api.service.ts
index 7b94b3746..abd16c7a7 100644
--- a/surfsense_web/lib/apis/connectors-api.service.ts
+++ b/surfsense_web/lib/apis/connectors-api.service.ts
@@ -404,7 +404,6 @@ class ConnectorsApiService {
 			listDiscordChannelsResponse
 		);
 	};
-
 }
 
 export type { SlackChannel, DiscordChannel };
diff --git a/surfsense_web/lib/apis/documents-api.service.ts b/surfsense_web/lib/apis/documents-api.service.ts
index f72e1dbcc..5961522ec 100644
--- a/surfsense_web/lib/apis/documents-api.service.ts
+++ b/surfsense_web/lib/apis/documents-api.service.ts
@@ -417,27 +417,47 @@ class DocumentsApiService {
 	};
 
 	getDocumentVersion = async (documentId: number, versionNumber: number) => {
-		return baseApiService.get(
-			`/api/v1/documents/${documentId}/versions/${versionNumber}`
-		);
+		return baseApiService.get(`/api/v1/documents/${documentId}/versions/${versionNumber}`);
 	};
 
 	restoreDocumentVersion = async (documentId: number, versionNumber: number) => {
-		return baseApiService.post(
-			`/api/v1/documents/${documentId}/versions/${versionNumber}/restore`
-		);
+		return baseApiService.post(`/api/v1/documents/${documentId}/versions/${versionNumber}/restore`);
 	};
 
-	folderIndex = async (searchSpaceId: number, body: { folder_path: string; folder_name: string; search_space_id: number; exclude_patterns?: string[]; file_extensions?: string[]; root_folder_id?: number; enable_summary?: boolean }) => {
+	folderIndex = async (
+		searchSpaceId: number,
+		body: {
+			folder_path: string;
+			folder_name: string;
+			search_space_id: number;
+			exclude_patterns?: string[];
+			file_extensions?: string[];
+			root_folder_id?: number;
+			enable_summary?: boolean;
+		}
+	) => {
 		return baseApiService.post(`/api/v1/documents/folder-index`, undefined, { body });
 	};
 
-	folderIndexFiles = async (searchSpaceId: number, body: { folder_path: string; folder_name: string; search_space_id: number; target_file_paths: string[]; root_folder_id?: number | null; enable_summary?: boolean }) => {
+	folderIndexFiles = async (
+		searchSpaceId: number,
+		body: {
+			folder_path: string;
+			folder_name: string;
+			search_space_id: number;
+			target_file_paths: string[];
+			root_folder_id?: number | null;
+			enable_summary?: boolean;
+		}
+	) => {
 		return baseApiService.post(`/api/v1/documents/folder-index-files`, undefined, { body });
 	};
 
 	getWatchedFolders = async (searchSpaceId: number) => {
-		return baseApiService.get(`/api/v1/documents/watched-folders?search_space_id=${searchSpaceId}`, folderListResponse);
+		return baseApiService.get(
+			`/api/v1/documents/watched-folders?search_space_id=${searchSpaceId}`,
+			folderListResponse
+		);
 	};
 
 	/**

From fc84dcffb05f794ca19641253ad8cab68b85d43f Mon Sep 17 00:00:00 2001
From: okxint <cashmein.eth@gmail.com>
Date: Fri, 3 Apr 2026 13:59:14 +0530
Subject: [PATCH 086/202] fix: memoize formatRelativeTime in thread list to
 prevent unnecessary re-renders

---
 surfsense_web/components/assistant-ui/thread-list.tsx | 9 +++++++--
 1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/thread-list.tsx b/surfsense_web/components/assistant-ui/thread-list.tsx
index f1d10ca16..e8b8db6fe 100644
--- a/surfsense_web/components/assistant-ui/thread-list.tsx
+++ b/surfsense_web/components/assistant-ui/thread-list.tsx
@@ -9,7 +9,7 @@ import {
 	TrashIcon,
 } from "lucide-react";
 import { useRouter } from "next/navigation";
-import { memo, useCallback, useEffect, useState } from "react";
+import { memo, useCallback, useEffect, useMemo, useState } from "react";
 import { Button } from "@/components/ui/button";
 import {
 	DropdownMenu,
@@ -224,6 +224,11 @@ const ThreadListItemComponent = memo(function ThreadListItemComponent({
 	onUnarchive,
 	onDelete,
 }: ThreadListItemComponentProps) {
+	const relativeTime = useMemo(
+		() => formatRelativeTime(new Date(thread.updatedAt)),
+		[thread.updatedAt]
+	);
+
 	return (
 		<button
 			type="button"
@@ -237,7 +242,7 @@ const ThreadListItemComponent = memo(function ThreadListItemComponent({
 			<div className="flex-1 min-w-0">
 				<p className="truncate text-sm font-medium">{thread.title || "New Chat"}</p>
 				<p className="truncate text-xs text-muted-foreground">
-					{formatRelativeTime(new Date(thread.updatedAt))}
+					{relativeTime}
 				</p>
 			</div>
 			<DropdownMenu>

From c964b47f99a53cef556342061d42f8c1f4c78a91 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 13:59:33 +0530
Subject: [PATCH 087/202] style: enhance folder selection UI in
 DocumentUploadTab

---
 surfsense_web/components/sources/DocumentUploadTab.tsx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index f1162f57c..940d1560a 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -570,7 +570,7 @@ export function DocumentUploadTab({
 			{/* FOLDER SELECTED (Electron only — web flattens folder contents into file list) */}
 			{isElectron && selectedFolder && (
 				<div className="rounded-lg border border-border p-3 space-y-2">
-					<div className="flex items-center gap-2">
+					<div className="flex items-center gap-2 py-1.5 px-2 -mx-1 rounded-md hover:bg-slate-400/5 dark:hover:bg-white/5 group">
 						<FolderOpen className="h-4 w-4 text-primary shrink-0" />
 						<div className="min-w-0 flex-1">
 							<p className="text-sm font-medium truncate">{selectedFolder.name}</p>

From 8a8e5fcd76c5dcebb6fbc2142212408553ee7d6d Mon Sep 17 00:00:00 2001
From: SohamBhattacharjee2003
 <125297948+SohamBhattacharjee2003@users.noreply.github.com>
Date: Fri, 3 Apr 2026 14:29:41 +0530
Subject: [PATCH 088/202] fix(hooks): add AbortController to properly cancel
 fetch requests on unmount

---
 package-lock.json                              |  6 ++++++
 .../components/circleback-config.tsx           | 16 ++++++++++++----
 .../components/editor-panel/editor-panel.tsx   | 18 ++++++++----------
 .../layout/ui/tabs/DocumentTabContent.tsx      | 18 ++++++++----------
 4 files changed, 34 insertions(+), 24 deletions(-)
 create mode 100644 package-lock.json

diff --git a/package-lock.json b/package-lock.json
new file mode 100644
index 000000000..9703ac09f
--- /dev/null
+++ b/package-lock.json
@@ -0,0 +1,6 @@
+{
+  "name": "SurfSense",
+  "lockfileVersion": 3,
+  "requires": true,
+  "packages": {}
+}
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/components/circleback-config.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/components/circleback-config.tsx
index 99e26c542..268ab0f98 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/components/circleback-config.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/components/circleback-config.tsx
@@ -34,9 +34,12 @@ export const CirclebackConfig: FC<CirclebackConfigProps> = ({ connector, onNameC
 	const [isLoading, setIsLoading] = useState(true);
 	const [copied, setCopied] = useState(false);
 
+	// Fetch webhook info
 	// Fetch webhook info
 	useEffect(() => {
-		const fetchWebhookInfo = async () => {
+		const controller = new AbortController();
+
+		const doFetch = async () => {
 			if (!connector.search_space_id) return;
 
 			const baseUrl = process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL;
@@ -49,8 +52,11 @@ export const CirclebackConfig: FC<CirclebackConfigProps> = ({ connector, onNameC
 			setIsLoading(true);
 			try {
 				const response = await authenticatedFetch(
-					`${baseUrl}/api/v1/webhooks/circleback/${connector.search_space_id}/info`
+					`${baseUrl}/api/v1/webhooks/circleback/${connector.search_space_id}/info`,
+					{ signal: controller.signal }
 				);
+				if (controller.signal.aborted) return;
+
 				if (response.ok) {
 					const data: unknown = await response.json();
 					// Runtime validation with zod schema
@@ -59,16 +65,18 @@ export const CirclebackConfig: FC<CirclebackConfigProps> = ({ connector, onNameC
 					setWebhookUrl(validatedData.webhook_url);
 				}
 			} catch (error) {
+				if (controller.signal.aborted) return;
 				console.error("Failed to fetch webhook info:", error);
 				// Reset state on error
 				setWebhookInfo(null);
 				setWebhookUrl("");
 			} finally {
-				setIsLoading(false);
+				if (!controller.signal.aborted) setIsLoading(false);
 			}
 		};
 
-		fetchWebhookInfo();
+		doFetch().catch(() => {});
+		return () => controller.abort();
 	}, [connector.search_space_id]);
 
 	const handleNameChange = (value: string) => {
diff --git a/surfsense_web/components/editor-panel/editor-panel.tsx b/surfsense_web/components/editor-panel/editor-panel.tsx
index 3ea36f800..3c204f1bb 100644
--- a/surfsense_web/components/editor-panel/editor-panel.tsx
+++ b/surfsense_web/components/editor-panel/editor-panel.tsx
@@ -70,7 +70,7 @@ export function EditorPanelContent({
 	const [displayTitle, setDisplayTitle] = useState(title || "Untitled");
 
 	useEffect(() => {
-		let cancelled = false;
+		const controller = new AbortController();
 		setIsLoading(true);
 		setError(null);
 		setEditorDoc(null);
@@ -78,7 +78,7 @@ export function EditorPanelContent({
 		initialLoadDone.current = false;
 		changeCountRef.current = 0;
 
-		const fetchContent = async () => {
+		const doFetch = async () => {
 			const token = getBearerToken();
 			if (!token) {
 				redirectToLogin();
@@ -88,10 +88,10 @@ export function EditorPanelContent({
 			try {
 				const response = await authenticatedFetch(
 					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`,
-					{ method: "GET" }
+					{ method: "GET", signal: controller.signal }
 				);
 
-				if (cancelled) return;
+				if (controller.signal.aborted) return;
 
 				if (!response.ok) {
 					const errorData = await response
@@ -115,18 +115,16 @@ export function EditorPanelContent({
 				setEditorDoc(data);
 				initialLoadDone.current = true;
 			} catch (err) {
-				if (cancelled) return;
+				if (controller.signal.aborted) return;
 				console.error("Error fetching document:", err);
 				setError(err instanceof Error ? err.message : "Failed to fetch document");
 			} finally {
-				if (!cancelled) setIsLoading(false);
+				if (!controller.signal.aborted) setIsLoading(false);
 			}
 		};
 
-		fetchContent();
-		return () => {
-			cancelled = true;
-		};
+		doFetch().catch(() => {});
+		return () => controller.abort();
 	}, [documentId, searchSpaceId, title]);
 
 	const handleMarkdownChange = useCallback((md: string) => {
diff --git a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
index ac279cd4d..a645bfbd5 100644
--- a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
+++ b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
@@ -55,7 +55,7 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 	const changeCountRef = useRef(0);
 
 	useEffect(() => {
-		let cancelled = false;
+		const controller = new AbortController();
 		setIsLoading(true);
 		setError(null);
 		setDoc(null);
@@ -64,7 +64,7 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 		initialLoadDone.current = false;
 		changeCountRef.current = 0;
 
-		const fetchContent = async () => {
+		const doFetch = async () => {
 			const token = getBearerToken();
 			if (!token) {
 				redirectToLogin();
@@ -74,10 +74,10 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 			try {
 				const response = await authenticatedFetch(
 					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`,
-					{ method: "GET" }
+					{ method: "GET", signal: controller.signal }
 				);
 
-				if (cancelled) return;
+				if (controller.signal.aborted) return;
 
 				if (!response.ok) {
 					const errorData = await response
@@ -98,18 +98,16 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 				setDoc(data);
 				initialLoadDone.current = true;
 			} catch (err) {
-				if (cancelled) return;
+				if (controller.signal.aborted) return;
 				console.error("Error fetching document:", err);
 				setError(err instanceof Error ? err.message : "Failed to fetch document");
 			} finally {
-				if (!cancelled) setIsLoading(false);
+				if (!controller.signal.aborted) setIsLoading(false);
 			}
 		};
 
-		fetchContent();
-		return () => {
-			cancelled = true;
-		};
+		doFetch().catch(() => {});
+		return () => controller.abort();
 	}, [documentId, searchSpaceId]);
 
 	const handleMarkdownChange = useCallback((md: string) => {

From 416b3635bf90d9c5618745f9069d2cab816839c0 Mon Sep 17 00:00:00 2001
From: sukarxn <thecodersmailbox@gmail.com>
Date: Fri, 3 Apr 2026 17:09:35 +0530
Subject: [PATCH 089/202] fix: optimize image components with next/image

- Replace raw <img> with Next.js Image in markdown-viewer.tsx
- Use next/image with fill + sizes in assistant-ui image.tsx
- Optimize favicons with explicit dimensions in citation components
- Set unoptimized=true for data/blob URLs and external favicons
---
 .../components/assistant-ui/image.tsx         | 121 +++++++++++++-----
 .../components/homepage/use-cases-grid.tsx    |  10 ++
 surfsense_web/components/markdown-viewer.tsx  |  37 ++++--
 .../tool-ui/citation/citation-list.tsx        |  42 +++---
 .../components/tool-ui/citation/citation.tsx  |  25 ++--
 5 files changed, 160 insertions(+), 75 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/image.tsx b/surfsense_web/components/assistant-ui/image.tsx
index 65059bcdc..c147eede4 100644
--- a/surfsense_web/components/assistant-ui/image.tsx
+++ b/surfsense_web/components/assistant-ui/image.tsx
@@ -6,6 +6,7 @@ import { ImageIcon, ImageOffIcon } from "lucide-react";
 import { memo, type PropsWithChildren, useEffect, useRef, useState } from "react";
 import { createPortal } from "react-dom";
 import { cn } from "@/lib/utils";
+import NextImage from 'next/image';
 
 const imageVariants = cva("aui-image-root relative overflow-hidden rounded-lg", {
 	variants: {
@@ -86,23 +87,57 @@ function ImagePreview({
 				>
 					<ImageOffIcon className="size-8 text-muted-foreground" />
 				</div>
-			) : (
+			) : isDataOrBlobUrl(src) ? (
+                // biome-ignore lint/performance/noImgElement: data/blob URLs need plain img
+                <img
+                    ref={imgRef}
+                    src={src}
+                    alt={alt}
+                    className={cn("block h-auto w-full object-contain", !loaded && "invisible", className)}
+                    onLoad={(e) => {
+                        if (typeof src === "string") setLoadedSrc(src);
+                        onLoad?.(e);
+                    }}
+                    onError={(e) => {
+                        if (typeof src === "string") setErrorSrc(src);
+                        onError?.(e);
+                    }}
+                    {...props}
+                />
+            ) : (
 				// biome-ignore lint/performance/noImgElement: intentional for dynamic external URLs
-				<img
-					ref={imgRef}
-					src={src}
-					alt={alt}
-					className={cn("block h-auto w-full object-contain", !loaded && "invisible", className)}
-					onLoad={(e) => {
-						if (typeof src === "string") setLoadedSrc(src);
-						onLoad?.(e);
-					}}
-					onError={(e) => {
-						if (typeof src === "string") setErrorSrc(src);
-						onError?.(e);
-					}}
-					{...props}
-				/>
+				// <img
+				// 	ref={imgRef}
+				// 	src={src}
+				// 	alt={alt}
+				// 	className={cn("block h-auto w-full object-contain", !loaded && "invisible", className)}
+				// 	onLoad={(e) => {
+				// 		if (typeof src === "string") setLoadedSrc(src);
+				// 		onLoad?.(e);
+				// 	}}
+				// 	onError={(e) => {
+				// 		if (typeof src === "string") setErrorSrc(src);
+				// 		onError?.(e);
+				// 	}}
+				// 	{...props}
+				// />
+				<NextImage
+				fill
+				src={src || ""}
+				alt={alt}
+				sizes="(max-width: 768px) 100vw, (max-width: 1200px) 80vw, 60vw"
+				className={cn("block object-contain", !loaded && "invisible", className)}
+				onLoad={() => {
+					if (typeof src === "string") setLoadedSrc(src);
+					onLoad?.();
+				}}
+				onError={() => {
+					if (typeof src === "string") setErrorSrc(src);
+					onError?.();
+				}}
+				unoptimized={false}
+				{...props}
+			/>
 			)}
 		</div>
 	);
@@ -126,7 +161,10 @@ type ImageZoomProps = PropsWithChildren<{
 	src: string;
 	alt?: string;
 }>;
-
+function isDataOrBlobUrl(src: string | undefined): boolean {
+    if (!src || typeof src !== "string") return false;
+    return src.startsWith("data:") || src.startsWith("blob:");
+}
 function ImageZoom({ src, alt = "Image preview", children }: ImageZoomProps) {
 	const [isMounted, setIsMounted] = useState(false);
 	const [isOpen, setIsOpen] = useState(false);
@@ -177,22 +215,39 @@ function ImageZoom({ src, alt = "Image preview", children }: ImageZoomProps) {
 						aria-label="Close zoomed image"
 					>
 						{/** biome-ignore lint/performance/noImgElement: <explanation> */}
-						<img
-							data-slot="image-zoom-content"
-							src={src}
-							alt={alt}
-							className="aui-image-zoom-content fade-in zoom-in-95 max-h-[90vh] max-w-[90vw] animate-in object-contain duration-200"
-							onClick={(e) => {
-								e.stopPropagation();
-								handleClose();
-							}}
-							onKeyDown={(e) => {
-								if (e.key === "Enter") {
-									e.stopPropagation();
-									handleClose();
-								}
-							}}
-						/>
+						{isDataOrBlobUrl(src) ? (
+                            // biome-ignore lint/performance/noImgElement: data/blob URLs need plain img
+                            <img
+                                data-slot="image-zoom-content"
+                                src={src}
+                                alt={alt}
+                                className="aui-image-zoom-content fade-in zoom-in-95 max-h-[90vh] max-w-[90vw] animate-in object-contain duration-200"
+                                onClick={(e) => {
+                                    e.stopPropagation();
+                                    handleClose();
+                                }}
+                                onKeyDown={(e) => {
+                                    if (e.key === "Enter") {
+                                        e.stopPropagation();
+                                        handleClose();
+                                    }
+                                }}
+                            />
+                        ) : (
+							<NextImage
+                                data-slot="image-zoom-content"
+                                fill
+                                src={src}
+                                alt={alt}
+                                sizes="90vw"
+                                className="aui-image-zoom-content fade-in zoom-in-95 object-contain duration-200"
+                                onClick={(e) => {
+                                    e.stopPropagation();
+                                    handleClose();
+                                }}
+                                unoptimized={false}
+                            />
+                        )}
 					</button>,
 					document.body
 				)}
diff --git a/surfsense_web/components/homepage/use-cases-grid.tsx b/surfsense_web/components/homepage/use-cases-grid.tsx
index 2f8c2d537..f9d315b49 100644
--- a/surfsense_web/components/homepage/use-cases-grid.tsx
+++ b/surfsense_web/components/homepage/use-cases-grid.tsx
@@ -1,4 +1,5 @@
 "use client";
+import Image from 'next/image';
 
 import { AnimatePresence, motion } from "motion/react";
 import { ExpandedGifOverlay, useExpandedGif } from "@/components/ui/expanded-gif-overlay";
@@ -81,6 +82,15 @@ function UseCaseCard({
 						alt={title}
 						className="w-full rounded-xl object-cover transition-transform duration-500 group-hover:scale-[1.02]"
 					/>
+					<div className="relative w-full h-48">
+					<Image
+						src={src}
+						alt={title}
+						fill
+						className="rounded-xl object-cover transition-transform duration-500 group-hover:scale-[1.02]"
+						unoptimized={src.endsWith('.gif')}
+					/>
+					</div>
 				</div>
 				<div className="px-5 py-4">
 					<h3 className="text-base font-semibold text-neutral-900 dark:text-white">{title}</h3>
diff --git a/surfsense_web/components/markdown-viewer.tsx b/surfsense_web/components/markdown-viewer.tsx
index a568bd698..1c39f03a0 100644
--- a/surfsense_web/components/markdown-viewer.tsx
+++ b/surfsense_web/components/markdown-viewer.tsx
@@ -3,6 +3,8 @@ import { createMathPlugin } from "@streamdown/math";
 import { Streamdown, type StreamdownProps } from "streamdown";
 import "katex/dist/katex.min.css";
 import { cn } from "@/lib/utils";
+import Image from 'next/image';
+import { is } from "drizzle-orm";
 
 const code = createCodePlugin({
 	themes: ["nord", "nord"],
@@ -127,16 +129,31 @@ export function MarkdownViewer({ content, className, maxLength }: MarkdownViewer
 			<blockquote className="border-l-4 border-muted pl-4 italic my-2" {...props} />
 		),
 		hr: ({ ...props }) => <hr className="my-4 border-muted" {...props} />,
-		img: ({ src, alt, width: _w, height: _h, ...props }) => (
-			// eslint-disable-next-line @next/next/no-img-element
-			<img
-				className="max-w-full h-auto my-4 rounded"
-				alt={alt || "markdown image"}
-				src={typeof src === "string" ? src : ""}
-				loading="lazy"
-				{...props}
-			/>
-		),
+		img: ({ src, alt, width: _w, height: _h, ...props }) => {
+    	const isDataOrUnknownUrl = typeof src === "string" && (src.startsWith("data:") || !src.startsWith("http"));
+
+    return isDataOrUnknownUrl ? (
+        // eslint-disable-next-line @next/next/no-img-element
+        <img
+            className="max-w-full h-auto my-4 rounded"
+            alt={alt || "markdown image"}
+            src={src}
+            loading="lazy"
+            {...props}
+        />
+    ) : (
+        <Image
+            className="max-w-full h-auto my-4 rounded"
+            alt={alt || "markdown image"}
+            src={typeof src === "string" ? src : ""}
+            width={_w || 800}
+            height={_h || 600}
+            sizes="(max-width: 768px) 100vw, (max-width: 1200px) 75vw, 60vw"
+            unoptimized={isDataOrUnknownUrl}
+            {...props}
+        />
+    );
+},
 		table: ({ ...props }) => (
 			<div className="overflow-x-auto my-4 rounded-lg border border-border w-full">
 				<table className="w-full divide-y divide-border" {...props} />
diff --git a/surfsense_web/components/tool-ui/citation/citation-list.tsx b/surfsense_web/components/tool-ui/citation/citation-list.tsx
index 3151917b6..75b02bf3d 100644
--- a/surfsense_web/components/tool-ui/citation/citation-list.tsx
+++ b/surfsense_web/components/tool-ui/citation/citation-list.tsx
@@ -7,6 +7,8 @@ import { openSafeNavigationHref, resolveSafeNavigationHref } from "../shared/med
 import { cn, Popover, PopoverContent, PopoverTrigger } from "./_adapter";
 import { Citation } from "./citation";
 import type { CitationType, CitationVariant, SerializableCitation } from "./schema";
+import NextImage from 'next/image';
+
 
 const TYPE_ICONS: Record<CitationType, LucideIcon> = {
 	webpage: Globe,
@@ -253,18 +255,18 @@ function OverflowItem({ citation, onClick }: OverflowItemProps) {
 			className="group hover:bg-muted focus-visible:bg-muted flex w-full cursor-pointer items-center gap-2.5 rounded-md px-2 py-2 text-left transition-colors focus-visible:outline-none"
 		>
 			{citation.favicon ? (
-				// biome-ignore lint/performance/noImgElement: external favicon from arbitrary domain — next/image requires remotePatterns config
-				<img
+				<NextImage
 					src={citation.favicon}
 					alt=""
 					aria-hidden="true"
-					width={16}
-					height={16}
-					className="bg-muted size-4 shrink-0 rounded object-cover"
+					width={18}
+					height={18}
+					className="size-4.5 rounded-full object-cover"
+					unoptimized={true}
 				/>
-			) : (
-				<TypeIcon className="text-muted-foreground size-4 shrink-0" aria-hidden="true" />
-			)}
+				) : (
+				<TypeIcon className="text-muted-foreground size-3" aria-hidden="true" />
+				)}
 			<div className="min-w-0 flex-1">
 				<p className="group-hover:decoration-foreground/30 truncate text-sm font-medium group-hover:underline group-hover:underline-offset-2">
 					{citation.title}
@@ -339,18 +341,18 @@ function StackedCitations({ id, citations, className, onNavigate }: StackedCitat
 										style={{ zIndex: maxIcons - index }}
 									>
 										{citation.favicon ? (
-											// biome-ignore lint/performance/noImgElement: external favicon from arbitrary domain — next/image requires remotePatterns config
-											<img
-												src={citation.favicon}
-												alt=""
-												aria-hidden="true"
-												width={18}
-												height={18}
-												className="size-4.5 rounded-full object-cover"
-											/>
-										) : (
-											<TypeIcon className="text-muted-foreground size-3" aria-hidden="true" />
-										)}
+										<NextImage
+											src={citation.favicon}
+											alt=""
+											aria-hidden="true"
+											width={18}
+											height={18}
+											className="size-4.5 rounded-full object-cover"
+											unoptimized={true}
+										/>
+									) : (
+										<TypeIcon className="text-muted-foreground size-3" aria-hidden="true" />
+									)}	
 									</div>
 								);
 							})}
diff --git a/surfsense_web/components/tool-ui/citation/citation.tsx b/surfsense_web/components/tool-ui/citation/citation.tsx
index 523169f49..fa5d4d165 100644
--- a/surfsense_web/components/tool-ui/citation/citation.tsx
+++ b/surfsense_web/components/tool-ui/citation/citation.tsx
@@ -6,6 +6,7 @@ import * as React from "react";
 import { openSafeNavigationHref, sanitizeHref } from "../shared/media";
 import { cn, Popover, PopoverContent, PopoverTrigger } from "./_adapter";
 import type { CitationType, CitationVariant, SerializableCitation } from "./schema";
+import NextImage from 'next/image';
 
 const FALLBACK_LOCALE = "en-US";
 
@@ -114,18 +115,18 @@ export function Citation(props: CitationProps) {
 	};
 
 	const iconElement = favicon ? (
-		// biome-ignore lint/performance/noImgElement: external favicon from arbitrary domain — next/image requires remotePatterns config
-		<img
-			src={favicon}
-			alt=""
-			aria-hidden="true"
-			width={14}
-			height={14}
-			className="bg-muted size-3.5 shrink-0 rounded object-cover"
-		/>
-	) : (
-		<TypeIcon className="size-3.5 shrink-0 opacity-60" aria-hidden="true" />
-	);
+    <NextImage
+        src={favicon}
+        alt=""
+        aria-hidden="true"
+        width={16}
+        height={16}
+        className="bg-muted size-3.5 shrink-0 rounded object-cover"
+        unoptimized={true}
+    />
+) : (
+    <TypeIcon className="size-3.5 shrink-0 opacity-60" aria-hidden="true" />
+);
 
 	const { open, handleMouseEnter, handleMouseLeave } = useHoverPopover();
 

From 1c50106c819fd6adceb6a78b7a5cb0e6c7eb0309 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 17:24:06 +0530
Subject: [PATCH 090/202] refactor: simplify file upload logic in
 DocumentUploadTab by removing file count and size limits; update file size
 limit messages in multiple languages

---
 .../assistant-ui/document-upload-popup.tsx    |  2 +-
 .../components/sources/DocumentUploadTab.tsx  | 73 +++----------------
 surfsense_web/messages/en.json                | 15 +---
 surfsense_web/messages/es.json                | 15 +---
 surfsense_web/messages/hi.json                | 15 +---
 surfsense_web/messages/pt.json                | 15 +---
 surfsense_web/messages/zh.json                | 15 +---
 7 files changed, 30 insertions(+), 120 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/document-upload-popup.tsx b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
index 4f06588c1..59d73e651 100644
--- a/surfsense_web/components/assistant-ui/document-upload-popup.tsx
+++ b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
@@ -125,7 +125,7 @@ const DocumentUploadPopupContent: FC<{
 				onPointerDownOutside={(e) => e.preventDefault()}
 				onInteractOutside={(e) => e.preventDefault()}
 				onEscapeKeyDown={(e) => e.preventDefault()}
-				className="select-none max-w-2xl w-[95vw] sm:w-[640px] h-[min(460px,75dvh)] sm:h-[min(520px,80vh)] flex flex-col p-0 gap-0 overflow-hidden border border-border ring-0 bg-muted dark:bg-muted text-foreground [&>button]:right-3 sm:[&>button]:right-6 [&>button]:top-3 sm:[&>button]:top-5 [&>button]:opacity-80 hover:[&>button]:opacity-100 [&>button]:z-[100] [&>button_svg]:size-4 sm:[&>button_svg]:size-5"
+				className="select-none max-w-2xl w-[95vw] sm:w-[640px] h-[min(440px,75dvh)] sm:h-[min(500px,80vh)] flex flex-col p-0 gap-0 overflow-hidden border border-border ring-0 bg-muted dark:bg-muted text-foreground [&>button]:right-3 sm:[&>button]:right-6 [&>button]:top-3 sm:[&>button]:top-5 [&>button]:opacity-80 hover:[&>button]:opacity-100 [&>button]:z-[100] [&>button_svg]:size-4 sm:[&>button_svg]:size-5"
 			>
 				<DialogTitle className="sr-only">Upload Document</DialogTitle>
 
diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index 940d1560a..dcafe62ba 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -121,10 +121,6 @@ interface FileWithId {
 	file: File;
 }
 
-const MAX_FILES = 50;
-const MAX_TOTAL_SIZE_MB = 200;
-const MAX_TOTAL_SIZE_BYTES = MAX_TOTAL_SIZE_MB * 1024 * 1024;
-
 const MAX_FILE_SIZE_MB = 500;
 const MAX_FILE_SIZE_BYTES = MAX_FILE_SIZE_MB * 1024 * 1024;
 
@@ -204,7 +200,6 @@ export function DocumentUploadTab({
 		accept: acceptedFileTypes,
 		maxSize: MAX_FILE_SIZE_BYTES,
 		noClick: isElectron,
-		disabled: files.length >= MAX_FILES,
 	});
 
 	const handleFileInputClick = useCallback((e: React.MouseEvent<HTMLInputElement>) => {
@@ -224,24 +219,8 @@ export function DocumentUploadTab({
 			id: crypto.randomUUID?.() ?? `file-${Date.now()}-${Math.random().toString(36)}`,
 			file: new File([fd.data], fd.name, { type: fd.mimeType }),
 		}));
-		setFiles((prev) => {
-			const merged = [...prev, ...newFiles];
-			if (merged.length > MAX_FILES) {
-				toast.error(t("max_files_exceeded"), {
-					description: t("max_files_exceeded_desc", { max: MAX_FILES }),
-				});
-				return prev;
-			}
-			const totalSize = merged.reduce((sum, e) => sum + e.file.size, 0);
-			if (totalSize > MAX_TOTAL_SIZE_BYTES) {
-				toast.error(t("max_size_exceeded"), {
-					description: t("max_size_exceeded_desc", { max: MAX_TOTAL_SIZE_MB }),
-				});
-				return prev;
-			}
-			return merged;
-		});
-	}, [t]);
+		setFiles((prev) => [...prev, ...newFiles]);
+	}, []);
 
 	const handleBrowseFolder = useCallback(async () => {
 		const api = window.electronAPI;
@@ -288,14 +267,6 @@ export function DocumentUploadTab({
 
 	const totalFileSize = files.reduce((total, entry) => total + entry.file.size, 0);
 
-	const isFileCountLimitReached = files.length >= MAX_FILES;
-	const isSizeLimitReached = totalFileSize >= MAX_TOTAL_SIZE_BYTES;
-	const remainingFiles = MAX_FILES - files.length;
-	const remainingSizeMB = Math.max(
-		0,
-		(MAX_TOTAL_SIZE_BYTES - totalFileSize) / (1024 * 1024)
-	).toFixed(1);
-
 	const hasContent = files.length > 0 || selectedFolder !== null;
 
 	const handleAccordionChange = useCallback(
@@ -392,8 +363,6 @@ export function DocumentUploadTab({
 
 	const renderBrowseButton = (options?: { compact?: boolean; fullWidth?: boolean }) => {
 		const { compact, fullWidth } = options ?? {};
-		if (isFileCountLimitReached) return null;
-
 		const sizeClass = compact ? "h-7" : "h-8";
 		const widthClass = fullWidth ? "w-full" : "";
 
@@ -478,7 +447,6 @@ export function DocumentUploadTab({
 			<div className="sm:hidden">
 				{hasContent ? (
 					!selectedFolder &&
-					!isFileCountLimitReached &&
 					(isElectron ? (
 						<div className="w-full">{renderBrowseButton({ compact: true, fullWidth: true })}</div>
 					) : (
@@ -502,12 +470,8 @@ export function DocumentUploadTab({
 							<p className="text-base font-medium">
 								{isElectron ? "Select files or folder" : "Tap to select files or folder"}
 							</p>
-							<p className="text-sm text-muted-foreground inline-flex items-center flex-wrap justify-center">
-								<span>{t("file_size_limit")}</span>
-								<Dot className="h-4 w-4 shrink-0" />
-								<span>
-									{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}
-								</span>
+							<p className="text-sm text-muted-foreground">
+								{t("file_size_limit")}
 							</p>
 						</div>
 						<div className="w-full mt-1" onClick={(e) => e.stopPropagation()}>
@@ -520,11 +484,7 @@ export function DocumentUploadTab({
 			{/* DESKTOP DROP ZONE */}
 			<div
 				{...getRootProps()}
-				className={`hidden sm:block border-2 border-dashed rounded-lg transition-colors ${
-					isFileCountLimitReached || isSizeLimitReached
-						? "border-destructive/50 bg-destructive/5 cursor-not-allowed"
-						: "border-muted-foreground/30 hover:border-foreground/70 cursor-pointer"
-				} ${hasContent ? "p-3" : "py-20 px-4"}`}
+				className={`hidden sm:block border-2 border-dashed rounded-lg transition-colors border-muted-foreground/30 hover:border-foreground/70 cursor-pointer ${hasContent ? "p-3" : "py-20 px-4"}`}
 			>
 				{hasContent ? (
 					<div className="flex items-center gap-3">
@@ -532,20 +492,10 @@ export function DocumentUploadTab({
 						<span className="text-xs text-muted-foreground flex-1 truncate">
 							{isDragActive
 								? t("drop_files")
-								: isFileCountLimitReached
-									? t("file_limit_reached")
-									: t("remaining_capacity", { files: remainingFiles, sizeMB: remainingSizeMB })}
+								: t("drag_drop_more")}
 						</span>
 						{renderBrowseButton({ compact: true })}
 					</div>
-				) : isFileCountLimitReached ? (
-					<div className="flex flex-col items-center gap-2 text-center">
-						<Upload className="h-8 w-8 text-destructive/70" />
-						<p className="text-sm font-medium text-destructive">{t("file_limit_reached")}</p>
-						<p className="text-xs text-muted-foreground">
-							{t("file_limit_reached_desc", { max: MAX_FILES })}
-						</p>
-					</div>
 				) : isDragActive ? (
 					<div className="flex flex-col items-center gap-2">
 						<Upload className="h-8 w-8 text-primary" />
@@ -555,12 +505,8 @@ export function DocumentUploadTab({
 					<div className="flex flex-col items-center gap-2">
 						<Upload className="h-8 w-8 text-muted-foreground" />
 						<p className="text-sm font-medium">{t("drag_drop")}</p>
-						<p className="text-xs text-muted-foreground text-center inline-flex items-center flex-wrap justify-center">
-							<span>{t("file_size_limit")}</span>
-							<Dot className="h-4 w-4 shrink-0" />
-							<span>
-								{t("upload_limits", { maxFiles: MAX_FILES, maxSizeMB: MAX_TOTAL_SIZE_MB })}
-							</span>
+						<p className="text-xs text-muted-foreground">
+							{t("file_size_limit")}
 						</p>
 						<div className="mt-1">{renderBrowseButton()}</div>
 					</div>
@@ -632,8 +578,7 @@ export function DocumentUploadTab({
 				<div className="rounded-lg border border-border p-3 space-y-2">
 					<div className="flex items-center justify-between">
 						<p className="text-sm font-medium">
-							{t("selected_files", { count: files.length })} &middot;{" "}
-							{formatFileSize(totalFileSize)}
+							{t("selected_files", { count: files.length })}<Dot className="inline h-4 w-4" />{formatFileSize(totalFileSize)}
 						</p>
 						<Button
 							variant="ghost"
diff --git a/surfsense_web/messages/en.json b/surfsense_web/messages/en.json
index 3a8c0c632..2e6e79976 100644
--- a/surfsense_web/messages/en.json
+++ b/surfsense_web/messages/en.json
@@ -376,14 +376,14 @@
 	"upload_documents": {
 		"title": "Upload Documents",
 		"subtitle": "Upload your files to make them searchable and accessible through AI-powered conversations.",
-		"file_size_limit": "Maximum file size: 50MB per file",
-		"upload_limits": "Upload limit: {maxFiles} files, {maxSizeMB}MB total",
+		"file_size_limit": "Maximum file size: 500MB per file",
 		"drop_files": "Drop files or folders here",
 		"drag_drop": "Drag & drop files or folders here",
+		"drag_drop_more": "Drop or browse to add more files",
 		"or_browse": "or click to browse",
 		"browse_files": "Browse Files",
 		"browse_folder": "Browse Folder",
-		"selected_files": "Selected Files ({count})",
+		"selected_files": "{count} selected {count, plural, one {file} other {files}}",
 		"total_size": "Total size",
 		"clear_all": "Clear all",
 		"uploading_files": "Uploading files",
@@ -397,14 +397,7 @@
 		"file_types_desc": "These file types are supported based on your current ETL service configuration.",
 		"file_too_large": "File Too Large",
 		"file_too_large_desc": "\"{name}\" exceeds the {maxMB}MB per-file limit.",
-		"no_supported_files_in_folder": "No supported file types found in the selected folder.",
-		"remaining_capacity": "{files} files, {sizeMB}MB remaining",
-		"file_limit_reached": "File limit reached",
-		"file_limit_reached_desc": "Maximum of {max} files allowed",
-		"max_files_exceeded": "Too many files",
-		"max_files_exceeded_desc": "You can upload a maximum of {max} files at once",
-		"max_size_exceeded": "Total size exceeded",
-		"max_size_exceeded_desc": "Total upload size cannot exceed {max}MB"
+		"no_supported_files_in_folder": "No supported file types found in the selected folder."
 	},
 	"add_webpage": {
 		"title": "Add Webpages for Crawling",
diff --git a/surfsense_web/messages/es.json b/surfsense_web/messages/es.json
index 2de30d29d..e282a52e1 100644
--- a/surfsense_web/messages/es.json
+++ b/surfsense_web/messages/es.json
@@ -376,14 +376,14 @@
 	"upload_documents": {
 		"title": "Subir documentos",
 		"subtitle": "Sube tus archivos para hacerlos buscables y accesibles a través de conversaciones con IA.",
-		"file_size_limit": "Tamaño máximo de archivo: 50 MB por archivo",
-		"upload_limits": "Límite de subida: {maxFiles} archivos, {maxSizeMB} MB en total",
+		"file_size_limit": "Tamaño máximo de archivo: 500 MB por archivo",
 		"drop_files": "Suelta archivos o carpetas aquí",
 		"drag_drop": "Arrastra y suelta archivos o carpetas aquí",
+		"drag_drop_more": "Suelta o explora para agregar más archivos",
 		"or_browse": "o haz clic para explorar",
 		"browse_files": "Explorar archivos",
 		"browse_folder": "Explorar carpeta",
-		"selected_files": "Archivos seleccionados ({count})",
+		"selected_files": "{count} {count, plural, one {archivo seleccionado} other {archivos seleccionados}}",
 		"total_size": "Tamaño total",
 		"clear_all": "Limpiar todo",
 		"uploading_files": "Subiendo archivos",
@@ -397,14 +397,7 @@
 		"file_types_desc": "Estos tipos de archivo son soportados según la configuración actual de tu servicio ETL.",
 		"file_too_large": "Archivo demasiado grande",
 		"file_too_large_desc": "\"{name}\" excede el límite de {maxMB} MB por archivo.",
-		"no_supported_files_in_folder": "No se encontraron tipos de archivo compatibles en la carpeta seleccionada.",
-		"remaining_capacity": "{files} archivos, {sizeMB}MB restante",
-		"file_limit_reached": "Límite de archivos alcanzado",
-		"file_limit_reached_desc": "Máximo de {max} archivos permitidos",
-		"max_files_exceeded": "Demasiados archivos",
-		"max_files_exceeded_desc": "Puedes subir un máximo de {max} archivos a la vez",
-		"max_size_exceeded": "Tamaño total excedido",
-		"max_size_exceeded_desc": "El tamaño total de subida no puede exceder {max}MB"
+		"no_supported_files_in_folder": "No se encontraron tipos de archivo compatibles en la carpeta seleccionada."
 	},
 	"add_webpage": {
 		"title": "Agregar páginas web para rastreo",
diff --git a/surfsense_web/messages/hi.json b/surfsense_web/messages/hi.json
index c27291e3b..9d4d982ad 100644
--- a/surfsense_web/messages/hi.json
+++ b/surfsense_web/messages/hi.json
@@ -376,14 +376,14 @@
 	"upload_documents": {
 		"title": "दस्तावेज़ अपलोड करें",
 		"subtitle": "AI-संचालित बातचीत के माध्यम से अपनी फ़ाइलों को खोजने योग्य और सुलभ बनाने के लिए अपलोड करें।",
-		"file_size_limit": "अधिकतम फ़ाइल आकार: प्रति फ़ाइल 50MB",
-		"upload_limits": "अपलोड सीमा: {maxFiles} फ़ाइलें, कुल {maxSizeMB}MB",
+		"file_size_limit": "अधिकतम फ़ाइल आकार: प्रति फ़ाइल 500MB",
 		"drop_files": "फ़ाइलें या फ़ोल्डर यहां छोड़ें",
 		"drag_drop": "फ़ाइलें या फ़ोल्डर यहां खींचें और छोड़ें",
+		"drag_drop_more": "और फ़ाइलें जोड़ने के लिए छोड़ें या ब्राउज़ करें",
 		"or_browse": "या ब्राउज़ करने के लिए क्लिक करें",
 		"browse_files": "फ़ाइलें ब्राउज़ करें",
 		"browse_folder": "फ़ोल्डर ब्राउज़ करें",
-		"selected_files": "चयनित फ़ाइलें ({count})",
+		"selected_files": "{count} चयनित {count, plural, one {फ़ाइल} other {फ़ाइलें}}",
 		"total_size": "कुल आकार",
 		"clear_all": "सभी साफ करें",
 		"uploading_files": "फ़ाइलें अपलोड हो रही हैं",
@@ -397,14 +397,7 @@
 		"file_types_desc": "ये फ़ाइल प्रकार आपकी वर्तमान ETL सेवा कॉन्फ़िगरेशन के आधार पर समर्थित हैं।",
 		"file_too_large": "फ़ाइल बहुत बड़ी है",
 		"file_too_large_desc": "\"{name}\" प्रति फ़ाइल {maxMB}MB की सीमा से अधिक है।",
-		"no_supported_files_in_folder": "चयनित फ़ोल्डर में कोई समर्थित फ़ाइल प्रकार नहीं मिला।",
-		"remaining_capacity": "{files} फ़ाइलें, {sizeMB}MB शेष",
-		"file_limit_reached": "फ़ाइल सीमा पूरी हो गई",
-		"file_limit_reached_desc": "अधिकतम {max} फ़ाइलें अनुमत हैं",
-		"max_files_exceeded": "बहुत सारी फ़ाइलें",
-		"max_files_exceeded_desc": "आप एक बार में अधिकतम {max} फ़ाइलें अपलोड कर सकते हैं",
-		"max_size_exceeded": "कुल आकार सीमा पार",
-		"max_size_exceeded_desc": "कुल अपलोड आकार {max}MB से अधिक नहीं हो सकता"
+		"no_supported_files_in_folder": "चयनित फ़ोल्डर में कोई समर्थित फ़ाइल प्रकार नहीं मिला।"
 	},
 	"add_webpage": {
 		"title": "क्रॉलिंग के लिए वेबपेज जोड़ें",
diff --git a/surfsense_web/messages/pt.json b/surfsense_web/messages/pt.json
index eeb417a27..7cb28d12f 100644
--- a/surfsense_web/messages/pt.json
+++ b/surfsense_web/messages/pt.json
@@ -376,14 +376,14 @@
 	"upload_documents": {
 		"title": "Enviar documentos",
 		"subtitle": "Envie seus arquivos para torná-los pesquisáveis e acessíveis através de conversas com IA.",
-		"file_size_limit": "Tamanho máximo do arquivo: 50 MB por arquivo",
-		"upload_limits": "Limite de envio: {maxFiles} arquivos, {maxSizeMB} MB no total",
+		"file_size_limit": "Tamanho máximo do arquivo: 500 MB por arquivo",
 		"drop_files": "Solte arquivos ou pastas aqui",
 		"drag_drop": "Arraste e solte arquivos ou pastas aqui",
+		"drag_drop_more": "Solte ou navegue para adicionar mais arquivos",
 		"or_browse": "ou clique para navegar",
 		"browse_files": "Navegar arquivos",
 		"browse_folder": "Navegar pasta",
-		"selected_files": "Arquivos selecionados ({count})",
+		"selected_files": "{count} {count, plural, one {arquivo selecionado} other {arquivos selecionados}}",
 		"total_size": "Tamanho total",
 		"clear_all": "Limpar tudo",
 		"uploading_files": "Enviando arquivos",
@@ -397,14 +397,7 @@
 		"file_types_desc": "Estes tipos de arquivo são suportados com base na configuração atual do seu serviço ETL.",
 		"file_too_large": "Arquivo muito grande",
 		"file_too_large_desc": "\"{name}\" excede o limite de {maxMB} MB por arquivo.",
-		"no_supported_files_in_folder": "Nenhum tipo de arquivo suportado encontrado na pasta selecionada.",
-		"remaining_capacity": "{files} arquivos, {sizeMB}MB restante",
-		"file_limit_reached": "Limite de arquivos atingido",
-		"file_limit_reached_desc": "Máximo de {max} arquivos permitidos",
-		"max_files_exceeded": "Muitos arquivos",
-		"max_files_exceeded_desc": "Você pode enviar no máximo {max} arquivos de uma vez",
-		"max_size_exceeded": "Tamanho total excedido",
-		"max_size_exceeded_desc": "O tamanho total do envio não pode exceder {max}MB"
+		"no_supported_files_in_folder": "Nenhum tipo de arquivo suportado encontrado na pasta selecionada."
 	},
 	"add_webpage": {
 		"title": "Adicionar páginas web para rastreamento",
diff --git a/surfsense_web/messages/zh.json b/surfsense_web/messages/zh.json
index 2ee18a346..9d0108ebc 100644
--- a/surfsense_web/messages/zh.json
+++ b/surfsense_web/messages/zh.json
@@ -360,14 +360,14 @@
 	"upload_documents": {
 		"title": "上传文档",
 		"subtitle": "上传您的文件，使其可通过 AI 对话进行搜索和访问。",
-		"file_size_limit": "最大文件大小：每个文件 50MB",
-		"upload_limits": "上传限制：最多 {maxFiles} 个文件，总大小不超过 {maxSizeMB}MB",
+		"file_size_limit": "最大文件大小：每个文件 500MB",
 		"drop_files": "将文件或文件夹拖放到此处",
 		"drag_drop": "拖放文件或文件夹到这里",
+		"drag_drop_more": "拖放或浏览以添加更多文件",
 		"or_browse": "或点击浏览",
 		"browse_files": "浏览文件",
 		"browse_folder": "浏览文件夹",
-		"selected_files": "已选择的文件 ({count})",
+		"selected_files": "已选择 {count} 个文件",
 		"total_size": "总大小",
 		"clear_all": "全部清除",
 		"uploading_files": "正在上传文件...",
@@ -381,14 +381,7 @@
 		"file_types_desc": "根据您当前的 ETL 服务配置支持这些文件类型。",
 		"file_too_large": "文件过大",
 		"file_too_large_desc": "\"{name}\" 超过了每个文件 {maxMB}MB 的限制。",
-		"no_supported_files_in_folder": "所选文件夹中没有找到支持的文件类型。",
-		"remaining_capacity": "剩余 {files} 个文件，{sizeMB}MB",
-		"file_limit_reached": "已达文件数量上限",
-		"file_limit_reached_desc": "最多允许 {max} 个文件",
-		"max_files_exceeded": "文件数量过多",
-		"max_files_exceeded_desc": "一次最多上传 {max} 个文件",
-		"max_size_exceeded": "总大小超出限制",
-		"max_size_exceeded_desc": "总上传大小不能超过 {max}MB"
+		"no_supported_files_in_folder": "所选文件夹中没有找到支持的文件类型。"
 	},
 	"add_webpage": {
 		"title": "添加网页爬取",

From b7f916c4dfcc55d3cb84ab4d8a82a432ab6f6b8b Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 17:24:34 +0530
Subject: [PATCH 091/202] chore: ran linting

---
 .../components/sources/DocumentUploadTab.tsx     | 16 ++++++----------
 1 file changed, 6 insertions(+), 10 deletions(-)

diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index dcafe62ba..2d70a4e1a 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -470,9 +470,7 @@ export function DocumentUploadTab({
 							<p className="text-base font-medium">
 								{isElectron ? "Select files or folder" : "Tap to select files or folder"}
 							</p>
-							<p className="text-sm text-muted-foreground">
-								{t("file_size_limit")}
-							</p>
+							<p className="text-sm text-muted-foreground">{t("file_size_limit")}</p>
 						</div>
 						<div className="w-full mt-1" onClick={(e) => e.stopPropagation()}>
 							{renderBrowseButton({ fullWidth: true })}
@@ -490,9 +488,7 @@ export function DocumentUploadTab({
 					<div className="flex items-center gap-3">
 						<Upload className="h-4 w-4 text-muted-foreground shrink-0" />
 						<span className="text-xs text-muted-foreground flex-1 truncate">
-							{isDragActive
-								? t("drop_files")
-								: t("drag_drop_more")}
+							{isDragActive ? t("drop_files") : t("drag_drop_more")}
 						</span>
 						{renderBrowseButton({ compact: true })}
 					</div>
@@ -505,9 +501,7 @@ export function DocumentUploadTab({
 					<div className="flex flex-col items-center gap-2">
 						<Upload className="h-8 w-8 text-muted-foreground" />
 						<p className="text-sm font-medium">{t("drag_drop")}</p>
-						<p className="text-xs text-muted-foreground">
-							{t("file_size_limit")}
-						</p>
+						<p className="text-xs text-muted-foreground">{t("file_size_limit")}</p>
 						<div className="mt-1">{renderBrowseButton()}</div>
 					</div>
 				)}
@@ -578,7 +572,9 @@ export function DocumentUploadTab({
 				<div className="rounded-lg border border-border p-3 space-y-2">
 					<div className="flex items-center justify-between">
 						<p className="text-sm font-medium">
-							{t("selected_files", { count: files.length })}<Dot className="inline h-4 w-4" />{formatFileSize(totalFileSize)}
+							{t("selected_files", { count: files.length })}
+							<Dot className="inline h-4 w-4" />
+							{formatFileSize(totalFileSize)}
 						</p>
 						<Button
 							variant="ghost"

From 9d4c2f5b984442b89ebfe27b7173b83164470bfa Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 17:28:12 +0530
Subject: [PATCH 092/202] refactor: replace span with Dot component in public
 chat snapshots, model configuration and thread managers

---
 surfsense_web/components/assistant-ui/thread.tsx           | 7 ++++++-
 .../public-chat-snapshots/public-chat-snapshot-row.tsx     | 4 ++--
 surfsense_web/components/settings/image-model-manager.tsx  | 4 ++--
 surfsense_web/components/settings/model-config-manager.tsx | 3 ++-
 4 files changed, 12 insertions(+), 6 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/thread.tsx b/surfsense_web/components/assistant-ui/thread.tsx
index 818644a47..9e2869d4e 100644
--- a/surfsense_web/components/assistant-ui/thread.tsx
+++ b/surfsense_web/components/assistant-ui/thread.tsx
@@ -15,6 +15,7 @@ import {
 	ChevronDown,
 	ChevronUp,
 	Clipboard,
+	Dot,
 	Globe,
 	Plus,
 	Settings2,
@@ -1147,7 +1148,11 @@ const ComposerAction: FC<ComposerActionProps> = ({ isBlockedByOtherUser = false
 														<TooltipTrigger asChild>{row}</TooltipTrigger>
 														<TooltipContent side="right" className="max-w-72 text-xs">
 															{groupDef?.tooltip ??
-																group.tools.map((t) => t.description).join(" · ")}
+																group.tools.flatMap((t, i) =>
+																	i === 0
+																		? [t.description]
+																		: [<Dot key={i} className="inline h-4 w-4" />, t.description]
+																)}
 														</TooltipContent>
 													</Tooltip>
 												);
diff --git a/surfsense_web/components/public-chat-snapshots/public-chat-snapshot-row.tsx b/surfsense_web/components/public-chat-snapshots/public-chat-snapshot-row.tsx
index ddf4746aa..4bb49c48d 100644
--- a/surfsense_web/components/public-chat-snapshots/public-chat-snapshot-row.tsx
+++ b/surfsense_web/components/public-chat-snapshots/public-chat-snapshot-row.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { Check, Copy, ExternalLink, MessageSquare, Trash2 } from "lucide-react";
+import { Check, Copy, Dot, ExternalLink, MessageSquare, Trash2 } from "lucide-react";
 import { useCallback, useRef, useState } from "react";
 import { Avatar, AvatarFallback, AvatarImage } from "@/components/ui/avatar";
 import { Badge } from "@/components/ui/badge";
@@ -153,7 +153,7 @@ export function PublicChatSnapshotRow({
 					<span className="text-[11px] text-muted-foreground/60">{formattedDate}</span>
 					{member && (
 						<>
-							<span className="text-muted-foreground/30">·</span>
+							<Dot className="h-4 w-4 text-muted-foreground/30" />
 							<TooltipProvider>
 								<Tooltip open={isDesktop ? undefined : false}>
 									<TooltipTrigger asChild>
diff --git a/surfsense_web/components/settings/image-model-manager.tsx b/surfsense_web/components/settings/image-model-manager.tsx
index 55128dc59..23162b629 100644
--- a/surfsense_web/components/settings/image-model-manager.tsx
+++ b/surfsense_web/components/settings/image-model-manager.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { useAtomValue } from "jotai";
-import { AlertCircle, Edit3, Info, RefreshCw, Trash2, Wand2 } from "lucide-react";
+import { AlertCircle, Dot, Edit3, Info, RefreshCw, Trash2, Wand2 } from "lucide-react";
 import { useMemo, useState } from "react";
 import { deleteImageGenConfigMutationAtom } from "@/atoms/image-gen-config/image-gen-config-mutation.atoms";
 import {
@@ -330,7 +330,7 @@ export function ImageModelManager({ searchSpaceId }: ImageModelManagerProps) {
 													</span>
 													{member && (
 														<>
-															<span className="text-muted-foreground/30">·</span>
+															<Dot className="h-4 w-4 text-muted-foreground/30" />
 															<TooltipProvider>
 																<Tooltip open={isDesktop ? undefined : false}>
 																	<TooltipTrigger asChild>
diff --git a/surfsense_web/components/settings/model-config-manager.tsx b/surfsense_web/components/settings/model-config-manager.tsx
index 79504451a..db4f169f8 100644
--- a/surfsense_web/components/settings/model-config-manager.tsx
+++ b/surfsense_web/components/settings/model-config-manager.tsx
@@ -3,6 +3,7 @@
 import { useAtomValue } from "jotai";
 import {
 	AlertCircle,
+	Dot,
 	Edit3,
 	FileText,
 	Info,
@@ -364,7 +365,7 @@ export function ModelConfigManager({ searchSpaceId }: ModelConfigManagerProps) {
 													</span>
 													{member && (
 														<>
-															<span className="text-muted-foreground/30">·</span>
+															<Dot className="h-4 w-4 text-muted-foreground/30" />
 															<TooltipProvider>
 																<Tooltip open={isDesktop ? undefined : false}>
 																	<TooltipTrigger asChild>

From 6f4c0d5e6c882c2aa6e73f8f2f29624418982e85 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 17:29:12 +0530
Subject: [PATCH 093/202] chore: remove redundant file types description

---
 surfsense_web/messages/en.json | 1 -
 surfsense_web/messages/es.json | 1 -
 surfsense_web/messages/hi.json | 1 -
 surfsense_web/messages/pt.json | 1 -
 surfsense_web/messages/zh.json | 1 -
 5 files changed, 5 deletions(-)

diff --git a/surfsense_web/messages/en.json b/surfsense_web/messages/en.json
index 2e6e79976..b67f9db22 100644
--- a/surfsense_web/messages/en.json
+++ b/surfsense_web/messages/en.json
@@ -394,7 +394,6 @@
 		"upload_error": "Upload Error",
 		"upload_error_desc": "Error uploading files",
 		"supported_file_types": "Supported File Types",
-		"file_types_desc": "These file types are supported based on your current ETL service configuration.",
 		"file_too_large": "File Too Large",
 		"file_too_large_desc": "\"{name}\" exceeds the {maxMB}MB per-file limit.",
 		"no_supported_files_in_folder": "No supported file types found in the selected folder."
diff --git a/surfsense_web/messages/es.json b/surfsense_web/messages/es.json
index e282a52e1..5cf248a3a 100644
--- a/surfsense_web/messages/es.json
+++ b/surfsense_web/messages/es.json
@@ -394,7 +394,6 @@
 		"upload_error": "Error de subida",
 		"upload_error_desc": "Error al subir archivos",
 		"supported_file_types": "Tipos de archivo soportados",
-		"file_types_desc": "Estos tipos de archivo son soportados según la configuración actual de tu servicio ETL.",
 		"file_too_large": "Archivo demasiado grande",
 		"file_too_large_desc": "\"{name}\" excede el límite de {maxMB} MB por archivo.",
 		"no_supported_files_in_folder": "No se encontraron tipos de archivo compatibles en la carpeta seleccionada."
diff --git a/surfsense_web/messages/hi.json b/surfsense_web/messages/hi.json
index 9d4d982ad..0e7194832 100644
--- a/surfsense_web/messages/hi.json
+++ b/surfsense_web/messages/hi.json
@@ -394,7 +394,6 @@
 		"upload_error": "अपलोड त्रुटि",
 		"upload_error_desc": "फ़ाइलें अपलोड करने में त्रुटि",
 		"supported_file_types": "समर्थित फ़ाइल प्रकार",
-		"file_types_desc": "ये फ़ाइल प्रकार आपकी वर्तमान ETL सेवा कॉन्फ़िगरेशन के आधार पर समर्थित हैं।",
 		"file_too_large": "फ़ाइल बहुत बड़ी है",
 		"file_too_large_desc": "\"{name}\" प्रति फ़ाइल {maxMB}MB की सीमा से अधिक है।",
 		"no_supported_files_in_folder": "चयनित फ़ोल्डर में कोई समर्थित फ़ाइल प्रकार नहीं मिला।"
diff --git a/surfsense_web/messages/pt.json b/surfsense_web/messages/pt.json
index 7cb28d12f..00ae18eae 100644
--- a/surfsense_web/messages/pt.json
+++ b/surfsense_web/messages/pt.json
@@ -394,7 +394,6 @@
 		"upload_error": "Erro no envio",
 		"upload_error_desc": "Erro ao enviar arquivos",
 		"supported_file_types": "Tipos de arquivo suportados",
-		"file_types_desc": "Estes tipos de arquivo são suportados com base na configuração atual do seu serviço ETL.",
 		"file_too_large": "Arquivo muito grande",
 		"file_too_large_desc": "\"{name}\" excede o limite de {maxMB} MB por arquivo.",
 		"no_supported_files_in_folder": "Nenhum tipo de arquivo suportado encontrado na pasta selecionada."
diff --git a/surfsense_web/messages/zh.json b/surfsense_web/messages/zh.json
index 9d0108ebc..a6f3b5b84 100644
--- a/surfsense_web/messages/zh.json
+++ b/surfsense_web/messages/zh.json
@@ -378,7 +378,6 @@
 		"upload_error": "上传错误",
 		"upload_error_desc": "上传文件时出错",
 		"supported_file_types": "支持的文件类型",
-		"file_types_desc": "根据您当前的 ETL 服务配置支持这些文件类型。",
 		"file_too_large": "文件过大",
 		"file_too_large_desc": "\"{name}\" 超过了每个文件 {maxMB}MB 的限制。",
 		"no_supported_files_in_folder": "所选文件夹中没有找到支持的文件类型。"

From b759bb36a9694a8cd0820fbc8e1a65ba77bdec96 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 17:36:48 +0530
Subject: [PATCH 094/202] feat: add direct conversion support for CSV, TSV, and
 HTML files in local folder indexing

---
 .../local_folder_indexer.py                   |  26 ++-
 .../test_local_folder_pipeline.py             | 155 ++++++++++++++++++
 2 files changed, 175 insertions(+), 6 deletions(-)

diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
index 539cfdd32..58c9f5003 100644
--- a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -49,8 +49,6 @@ PLAINTEXT_EXTENSIONS = frozenset(
         ".markdown",
         ".txt",
         ".text",
-        ".csv",
-        ".tsv",
         ".json",
         ".jsonl",
         ".yaml",
@@ -60,8 +58,6 @@ PLAINTEXT_EXTENSIONS = frozenset(
         ".cfg",
         ".conf",
         ".xml",
-        ".html",
-        ".htm",
         ".css",
         ".scss",
         ".less",
@@ -149,6 +145,9 @@ AUDIO_EXTENSIONS = frozenset(
 )
 
 
+DIRECT_CONVERT_EXTENSIONS = frozenset({".csv", ".tsv", ".html", ".htm"})
+
+
 def _is_plaintext_file(filename: str) -> bool:
     return Path(filename).suffix.lower() in PLAINTEXT_EXTENSIONS
 
@@ -157,9 +156,17 @@ def _is_audio_file(filename: str) -> bool:
     return Path(filename).suffix.lower() in AUDIO_EXTENSIONS
 
 
+def _is_direct_convert_file(filename: str) -> bool:
+    return Path(filename).suffix.lower() in DIRECT_CONVERT_EXTENSIONS
+
+
 def _needs_etl(filename: str) -> bool:
-    """File is not plaintext and not audio — requires ETL service to parse."""
-    return not _is_plaintext_file(filename) and not _is_audio_file(filename)
+    """File is not plaintext, not audio, and not direct-convert — requires ETL."""
+    return (
+        not _is_plaintext_file(filename)
+        and not _is_audio_file(filename)
+        and not _is_direct_convert_file(filename)
+    )
 
 
 HeartbeatCallbackType = Callable[[int], Awaitable[None]]
@@ -260,6 +267,13 @@ async def _read_file_content(file_path: str, filename: str) -> str:
     if _is_plaintext_file(filename):
         return _read_plaintext_file(file_path)
 
+    if _is_direct_convert_file(filename):
+        from app.tasks.document_processors._direct_converters import (
+            convert_file_directly,
+        )
+
+        return convert_file_directly(file_path, filename)
+
     if _is_audio_file(filename):
         etl_service = config.ETL_SERVICE if hasattr(config, "ETL_SERVICE") else None
         stt_service_val = config.STT_SERVICE if hasattr(config, "STT_SERVICE") else None
diff --git a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
index 4062c3a3b..4c900bf51 100644
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
@@ -804,3 +804,158 @@ class TestPipelineIntegration:
         )
         assert len(docs) == 1
         assert DocumentStatus.is_state(docs[0].status, DocumentStatus.READY)
+
+
+# ====================================================================
+# Tier 7: Direct Converters (DC1-DC4)
+# ====================================================================
+
+
+class TestDirectConvert:
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
+    async def test_dc1_csv_produces_markdown_table(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """DC1: CSV file is indexed as a markdown table, not raw comma-separated text."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        (tmp_path / "data.csv").write_text("name,age,city\nAlice,30,NYC\nBob,25,LA\n")
+
+        count, _skipped, _root_folder_id, err = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+        )
+
+        assert err is None
+        assert count == 1
+
+        doc = (
+            await db_session.execute(
+                select(Document).where(
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
+                )
+            )
+        ).scalar_one()
+
+        assert "| name" in doc.source_markdown
+        assert "| Alice" in doc.source_markdown
+        assert "name,age,city" not in doc.source_markdown
+
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
+    async def test_dc2_tsv_produces_markdown_table(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """DC2: TSV file is indexed as a markdown table."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        (tmp_path / "data.tsv").write_text("name\tage\tcity\nAlice\t30\tNYC\nBob\t25\tLA\n")
+
+        count, _skipped, _root_folder_id, err = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+        )
+
+        assert err is None
+        assert count == 1
+
+        doc = (
+            await db_session.execute(
+                select(Document).where(
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
+                )
+            )
+        ).scalar_one()
+
+        assert "| name" in doc.source_markdown
+        assert "| Alice" in doc.source_markdown
+
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
+    async def test_dc3_html_produces_clean_markdown(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """DC3: HTML file is indexed as clean markdown, not raw HTML."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        (tmp_path / "page.html").write_text(
+            "<h1>Title</h1><p>Hello world</p>"
+        )
+
+        count, _skipped, _root_folder_id, err = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+        )
+
+        assert err is None
+        assert count == 1
+
+        doc = (
+            await db_session.execute(
+                select(Document).where(
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
+                )
+            )
+        ).scalar_one()
+
+        assert "Title" in doc.source_markdown
+        assert "<h1>" not in doc.source_markdown
+
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
+    async def test_dc4_csv_single_file_mode(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """DC4: CSV via single-file batch mode also produces a markdown table."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        (tmp_path / "data.csv").write_text("name,age,city\nAlice,30,NYC\nBob,25,LA\n")
+
+        count, _skipped, _root_folder_id, err = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            target_file_paths=[str(tmp_path / "data.csv")],
+        )
+
+        assert err is None
+        assert count == 1
+
+        doc = (
+            await db_session.execute(
+                select(Document).where(
+                    Document.document_type == DocumentType.LOCAL_FOLDER_FILE,
+                    Document.search_space_id == db_search_space.id,
+                )
+            )
+        ).scalar_one()
+
+        assert "| name" in doc.source_markdown
+        assert "name,age,city" not in doc.source_markdown

From edda5b98cb837eb16be2b33d9765c9532a656c10 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 17:38:29 +0530
Subject: [PATCH 095/202] chore: ran linting

---
 .../indexing_pipeline/test_local_folder_pipeline.py       | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
index 4c900bf51..b94762ee6 100644
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
@@ -860,7 +860,9 @@ class TestDirectConvert:
         """DC2: TSV file is indexed as a markdown table."""
         from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
 
-        (tmp_path / "data.tsv").write_text("name\tage\tcity\nAlice\t30\tNYC\nBob\t25\tLA\n")
+        (tmp_path / "data.tsv").write_text(
+            "name\tage\tcity\nAlice\t30\tNYC\nBob\t25\tLA\n"
+        )
 
         count, _skipped, _root_folder_id, err = await index_local_folder(
             session=db_session,
@@ -896,9 +898,7 @@ class TestDirectConvert:
         """DC3: HTML file is indexed as clean markdown, not raw HTML."""
         from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
 
-        (tmp_path / "page.html").write_text(
-            "<h1>Title</h1><p>Hello world</p>"
-        )
+        (tmp_path / "page.html").write_text("<h1>Title</h1><p>Hello world</p>")
 
         count, _skipped, _root_folder_id, err = await index_local_folder(
             session=db_session,

From 5068a6b4f392301a728f59f8c26fdf4679c6fc0c Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 17:52:59 +0530
Subject: [PATCH 096/202] style: update button variant and improve
 drag-and-drop UI in DocumentUploadTab

---
 .../components/sources/DocumentUploadTab.tsx  | 33 +++++++++++--------
 1 file changed, 20 insertions(+), 13 deletions(-)

diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index 2d70a4e1a..0bf842b6d 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -401,15 +401,19 @@ export function DocumentUploadTab({
 			<DropdownMenu>
 				<DropdownMenuTrigger asChild onClick={(e) => e.stopPropagation()}>
 					<Button
-						variant="secondary"
+						variant="ghost"
 						size="sm"
-						className={`text-xs gap-1 ${sizeClass} ${widthClass}`}
+						className={`text-xs gap-1 bg-neutral-700/50 hover:bg-neutral-600/50 ${sizeClass} ${widthClass}`}
 					>
 						Browse
 						<ChevronDown className="h-3 w-3 opacity-60" />
 					</Button>
 				</DropdownMenuTrigger>
-				<DropdownMenuContent align="center" onClick={(e) => e.stopPropagation()}>
+				<DropdownMenuContent
+					align="center"
+					className="dark:bg-neutral-800"
+					onClick={(e) => e.stopPropagation()}
+				>
 					<DropdownMenuItem onClick={() => fileInputRef.current?.click()}>
 						<FileIcon className="h-4 w-4 mr-2" />
 						{t("browse_files")}
@@ -492,17 +496,20 @@ export function DocumentUploadTab({
 						</span>
 						{renderBrowseButton({ compact: true })}
 					</div>
-				) : isDragActive ? (
-					<div className="flex flex-col items-center gap-2">
-						<Upload className="h-8 w-8 text-primary" />
-						<p className="text-sm font-medium text-primary">{t("drop_files")}</p>
-					</div>
 				) : (
-					<div className="flex flex-col items-center gap-2">
-						<Upload className="h-8 w-8 text-muted-foreground" />
-						<p className="text-sm font-medium">{t("drag_drop")}</p>
-						<p className="text-xs text-muted-foreground">{t("file_size_limit")}</p>
-						<div className="mt-1">{renderBrowseButton()}</div>
+					<div className="relative">
+						{isDragActive && (
+							<div className="absolute inset-0 flex flex-col items-center justify-center gap-2">
+								<Upload className="h-8 w-8 text-primary" />
+								<p className="text-sm font-medium text-primary">{t("drop_files")}</p>
+							</div>
+						)}
+						<div className={`flex flex-col items-center gap-2 ${isDragActive ? "invisible" : ""}`}>
+							<Upload className="h-8 w-8 text-muted-foreground" />
+							<p className="text-sm font-medium">{t("drag_drop")}</p>
+							<p className="text-xs text-muted-foreground">{t("file_size_limit")}</p>
+							<div className="mt-1">{renderBrowseButton()}</div>
+						</div>
 					</div>
 				)}
 			</div>

From 9c0af6569d1e94744ad5361b9611efee0f57269c Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Fri, 3 Apr 2026 19:13:25 +0530
Subject: [PATCH 097/202] feat: implement page limit checks in local folder
 indexing to manage user page usage

---
 .../local_folder_indexer.py                   |  88 ++++++-
 .../test_local_folder_pipeline.py             | 219 ++++++++++++++++++
 2 files changed, 303 insertions(+), 4 deletions(-)

diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
index 58c9f5003..acfbce0bf 100644
--- a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -34,6 +34,7 @@ from app.indexing_pipeline.connector_document import ConnectorDocument
 from app.indexing_pipeline.document_hashing import compute_identifier_hash
 from app.indexing_pipeline.indexing_pipeline_service import IndexingPipelineService
 from app.services.llm_service import get_user_long_context_llm
+from app.services.page_limit_service import PageLimitExceededError, PageLimitService
 from app.services.task_logging_service import TaskLoggingService
 from app.tasks.celery_tasks import get_celery_session_maker
 from app.utils.document_versioning import create_version_snapshot
@@ -171,6 +172,39 @@ def _needs_etl(filename: str) -> bool:
 
 HeartbeatCallbackType = Callable[[int], Awaitable[None]]
 
+
+def _estimate_pages_safe(page_limit_service: PageLimitService, file_path: str) -> int:
+    """Estimate page count with a file-size fallback."""
+    try:
+        return page_limit_service.estimate_pages_before_processing(file_path)
+    except Exception:
+        file_size = os.path.getsize(file_path)
+        return max(1, file_size // (80 * 1024))
+
+
+async def _check_page_limit_or_skip(
+    page_limit_service: PageLimitService,
+    user_id: str,
+    file_path: str,
+) -> int:
+    """Estimate pages and check the limit; raises PageLimitExceededError if over quota.
+
+    Returns the estimated page count on success.
+    """
+    estimated = _estimate_pages_safe(page_limit_service, file_path)
+    await page_limit_service.check_page_limit(user_id, estimated)
+    return estimated
+
+
+def _compute_final_pages(
+    page_limit_service: PageLimitService,
+    estimated_pages: int,
+    content_length: int,
+) -> int:
+    """Return the final page count as max(estimated, actual)."""
+    actual = page_limit_service.estimate_pages_from_content_length(content_length)
+    return max(estimated_pages, actual)
+
 DEFAULT_EXCLUDE_PATTERNS = [
     ".git",
     "node_modules",
@@ -720,11 +754,12 @@ async def index_local_folder(
         skipped_count = 0
         failed_count = 0
 
+        page_limit_service = PageLimitService(session)
+
         # ================================================================
         # PHASE 1: Pre-filter files (mtime / content-hash), version changed
         # ================================================================
         connector_docs: list[ConnectorDocument] = []
-        # Maps unique_id -> (relative_path, mtime) for post-pipeline folder_id assignment
         file_meta_map: dict[str, dict] = {}
         seen_unique_hashes: set[str] = set()
 
@@ -759,6 +794,17 @@ async def index_local_folder(
                         skipped_count += 1
                         continue
 
+                    try:
+                        estimated_pages = await _check_page_limit_or_skip(
+                            page_limit_service, user_id, file_path_abs
+                        )
+                    except PageLimitExceededError:
+                        logger.warning(
+                            f"Page limit exceeded, skipping: {file_path_abs}"
+                        )
+                        failed_count += 1
+                        continue
+
                     try:
                         content, content_hash = await _compute_file_content_hash(
                             file_path_abs, file_info["relative_path"], search_space_id
@@ -781,6 +827,17 @@ async def index_local_folder(
 
                     await create_version_snapshot(session, existing_document)
                 else:
+                    try:
+                        estimated_pages = await _check_page_limit_or_skip(
+                            page_limit_service, user_id, file_path_abs
+                        )
+                    except PageLimitExceededError:
+                        logger.warning(
+                            f"Page limit exceeded, skipping: {file_path_abs}"
+                        )
+                        failed_count += 1
+                        continue
+
                     try:
                         content, content_hash = await _compute_file_content_hash(
                             file_path_abs, file_info["relative_path"], search_space_id
@@ -807,6 +864,8 @@ async def index_local_folder(
                 file_meta_map[unique_identifier] = {
                     "relative_path": relative_path,
                     "mtime": file_info["modified_at"].timestamp(),
+                    "estimated_pages": estimated_pages,
+                    "content_length": len(content),
                 }
 
             except Exception as e:
@@ -901,6 +960,15 @@ async def index_local_folder(
                     doc_meta = dict(result.document_metadata or {})
                     doc_meta["mtime"] = mtime_info.get("mtime")
                     result.document_metadata = doc_meta
+
+                    est = mtime_info.get("estimated_pages", 1)
+                    content_len = mtime_info.get("content_length", 0)
+                    final_pages = _compute_final_pages(
+                        page_limit_service, est, content_len
+                    )
+                    await page_limit_service.update_page_usage(
+                        user_id, final_pages, allow_exceed=True
+                    )
                 else:
                     failed_count += 1
 
@@ -1084,6 +1152,14 @@ async def _index_single_file(
             DocumentType.LOCAL_FOLDER_FILE.value, unique_id, search_space_id
         )
 
+        page_limit_service = PageLimitService(session)
+        try:
+            estimated_pages = await _check_page_limit_or_skip(
+                page_limit_service, user_id, str(full_path)
+            )
+        except PageLimitExceededError as e:
+            return 0, 1, f"Page limit exceeded: {e}"
+
         try:
             content, content_hash = await _compute_file_content_hash(
                 str(full_path), full_path.name, search_space_id
@@ -1128,8 +1204,6 @@ async def _index_single_file(
 
         db_doc = documents[0]
 
-        # Assign folder_id before indexing so the doc appears in the
-        # correct folder while still pending/processing.
         if root_folder_id:
             try:
                 db_doc.folder_id = await _resolve_folder_for_file(
@@ -1154,10 +1228,16 @@ async def _index_single_file(
         failed_msg = None if indexed else "Indexing failed"
 
         if indexed:
+            final_pages = _compute_final_pages(
+                page_limit_service, estimated_pages, len(content)
+            )
+            await page_limit_service.update_page_usage(
+                user_id, final_pages, allow_exceed=True
+            )
             await task_logger.log_task_success(
                 log_entry,
                 f"Single file indexed: {rel_path}",
-                {"file": rel_path},
+                {"file": rel_path, "pages_processed": final_pages},
             )
         return indexed, 0 if indexed else 1, failed_msg
 
diff --git a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
index b94762ee6..4d9bda7ee 100644
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
@@ -959,3 +959,222 @@ class TestDirectConvert:
 
         assert "| name" in doc.source_markdown
         assert "name,age,city" not in doc.source_markdown
+
+
+# ====================================================================
+# Tier 8: Page Limits (PL1-PL6)
+# ====================================================================
+
+
+class TestPageLimits:
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
+    async def test_pl1_full_scan_increments_pages_used(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """PL1: Successful full-scan sync increments user.pages_used."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        db_user.pages_used = 0
+        db_user.pages_limit = 500
+        await db_session.flush()
+
+        (tmp_path / "note.md").write_text("# Hello World\n\nContent here.")
+
+        count, _skipped, _root_folder_id, err = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+        )
+
+        assert err is None
+        assert count == 1
+
+        await db_session.refresh(db_user)
+        assert db_user.pages_used > 0, "pages_used should increase after indexing"
+
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
+    async def test_pl2_full_scan_blocked_when_limit_exhausted(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """PL2: Full-scan skips file when page limit is exhausted."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        db_user.pages_used = 100
+        db_user.pages_limit = 100
+        await db_session.flush()
+
+        (tmp_path / "note.md").write_text("# Hello World\n\nContent here.")
+
+        count, _skipped, _root_folder_id, err = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+        )
+
+        assert count == 0
+
+        await db_session.refresh(db_user)
+        assert db_user.pages_used == 100, "pages_used should not change on rejection"
+
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
+    async def test_pl3_single_file_increments_pages_used(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """PL3: Single-file mode increments user.pages_used on success."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        db_user.pages_used = 0
+        db_user.pages_limit = 500
+        await db_session.flush()
+
+        (tmp_path / "note.md").write_text("# Hello World\n\nContent here.")
+
+        count, _skipped, _root_folder_id, err = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            target_file_paths=[str(tmp_path / "note.md")],
+        )
+
+        assert err is None
+        assert count == 1
+
+        await db_session.refresh(db_user)
+        assert db_user.pages_used > 0, "pages_used should increase after indexing"
+
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
+    async def test_pl4_single_file_blocked_when_limit_exhausted(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """PL4: Single-file mode skips file when page limit is exhausted."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        db_user.pages_used = 100
+        db_user.pages_limit = 100
+        await db_session.flush()
+
+        (tmp_path / "note.md").write_text("# Hello World\n\nContent here.")
+
+        count, _skipped, _root_folder_id, err = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            target_file_paths=[str(tmp_path / "note.md")],
+        )
+
+        assert count == 0
+        assert err is not None
+        assert "page limit" in err.lower()
+
+        await db_session.refresh(db_user)
+        assert db_user.pages_used == 100, "pages_used should not change on rejection"
+
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
+    async def test_pl5_unchanged_resync_no_extra_pages(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+    ):
+        """PL5: Re-syncing an unchanged file does not consume additional pages."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        db_user.pages_used = 0
+        db_user.pages_limit = 500
+        await db_session.flush()
+
+        (tmp_path / "note.md").write_text("# Hello\n\nSame content.")
+
+        count1, _, root_folder_id, _ = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+        )
+        assert count1 == 1
+
+        await db_session.refresh(db_user)
+        pages_after_first = db_user.pages_used
+        assert pages_after_first > 0
+
+        count2, _, _, _ = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            root_folder_id=root_folder_id,
+        )
+        assert count2 == 0
+
+        await db_session.refresh(db_user)
+        assert db_user.pages_used == pages_after_first, (
+            "pages_used should not increase for unchanged files"
+        )
+
+    @pytest.mark.usefixtures(*UNIFIED_FIXTURES)
+    async def test_pl6_batch_partial_page_limit_exhaustion(
+        self,
+        db_session: AsyncSession,
+        db_user: User,
+        db_search_space: SearchSpace,
+        tmp_path: Path,
+        patched_batch_sessions,
+    ):
+        """PL6: Batch mode with a very low page limit: some files succeed, rest fail."""
+        from app.tasks.connector_indexers.local_folder_indexer import index_local_folder
+
+        db_user.pages_used = 0
+        db_user.pages_limit = 1
+        await db_session.flush()
+
+        (tmp_path / "a.md").write_text("File A content")
+        (tmp_path / "b.md").write_text("File B content")
+        (tmp_path / "c.md").write_text("File C content")
+
+        count, failed, _root_folder_id, _err = await index_local_folder(
+            session=db_session,
+            search_space_id=db_search_space.id,
+            user_id=str(db_user.id),
+            folder_path=str(tmp_path),
+            folder_name="test-folder",
+            target_file_paths=[
+                str(tmp_path / "a.md"),
+                str(tmp_path / "b.md"),
+                str(tmp_path / "c.md"),
+            ],
+        )
+
+        assert count >= 1, "at least one file should succeed"
+        assert failed >= 1, "at least one file should fail due to page limit"
+        assert count + failed == 3
+
+        await db_session.refresh(db_user)
+        assert db_user.pages_used > 0
+        assert db_user.pages_used <= db_user.pages_limit + 1

From 8ba571566d2e1c3c296934c52e28a4202ede1dda Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Fri, 3 Apr 2026 16:10:52 +0200
Subject: [PATCH 098/202] remove uiohook-napi and keystroke monitoring

---
 surfsense_desktop/electron-builder.yml        |  10 +-
 surfsense_desktop/package.json                |   3 +-
 surfsense_desktop/pnpm-lock.yaml              |  17 --
 surfsense_desktop/scripts/build-electron.mjs  |   2 +-
 surfsense_desktop/src/ipc/channels.ts         |   1 -
 surfsense_desktop/src/ipc/handlers.ts         |   5 -
 .../src/modules/autocomplete/index.ts         | 156 +-----------------
 .../modules/autocomplete/keystroke-buffer.ts  |  76 ---------
 surfsense_desktop/src/modules/permissions.ts  |  12 +-
 surfsense_desktop/src/preload.ts              |   1 -
 .../app/desktop/permissions/page.tsx          | 122 ++++++--------
 surfsense_web/types/window.d.ts               |   2 -
 12 files changed, 57 insertions(+), 350 deletions(-)
 delete mode 100644 surfsense_desktop/src/modules/autocomplete/keystroke-buffer.ts

diff --git a/surfsense_desktop/electron-builder.yml b/surfsense_desktop/electron-builder.yml
index 115b69c8e..3de0f266d 100644
--- a/surfsense_desktop/electron-builder.yml
+++ b/surfsense_desktop/electron-builder.yml
@@ -9,10 +9,6 @@ directories:
 files:
   - dist/**/*
   - "!node_modules"
-  - node_modules/uiohook-napi/**/*
-  - "!node_modules/uiohook-napi/src"
-  - "!node_modules/uiohook-napi/libuiohook"
-  - "!node_modules/uiohook-napi/binding.gyp"
   - node_modules/node-gyp-build/**/*
   - node_modules/bindings/**/*
   - node_modules/file-uri-to-path/**/*
@@ -39,7 +35,6 @@ extraResources:
     filter: ["**/*"]
 asarUnpack:
   - "**/*.node"
-  - "node_modules/uiohook-napi/**/*"
   - "node_modules/node-gyp-build/**/*"
   - "node_modules/bindings/**/*"
   - "node_modules/file-uri-to-path/**/*"
@@ -51,9 +46,8 @@ mac:
   hardenedRuntime: false
   gatekeeperAssess: false
   extendInfo:
-    NSInputMonitoringUsageDescription: "SurfSense uses input monitoring to provide system-wide autocomplete suggestions as you type."
-    NSAccessibilityUsageDescription: "SurfSense uses accessibility features to read text fields and insert suggestions."
-    NSAppleEventsUsageDescription: "SurfSense uses Apple Events to read text from the active application and insert autocomplete suggestions."
+    NSAccessibilityUsageDescription: "SurfSense uses accessibility features to insert suggestions into the active application."
+    NSAppleEventsUsageDescription: "SurfSense uses Apple Events to interact with the active application."
   target:
     - target: dmg
       arch: [x64, arm64]
diff --git a/surfsense_desktop/package.json b/surfsense_desktop/package.json
index 01a63b265..ab4fa0b8f 100644
--- a/surfsense_desktop/package.json
+++ b/surfsense_desktop/package.json
@@ -32,7 +32,6 @@
     "bindings": "^1.5.0",
     "electron-updater": "^6.8.3",
     "get-port-please": "^3.2.0",
-    "node-mac-permissions": "^2.5.0",
-    "uiohook-napi": "^1.5.5"
+    "node-mac-permissions": "^2.5.0"
   }
 }
diff --git a/surfsense_desktop/pnpm-lock.yaml b/surfsense_desktop/pnpm-lock.yaml
index d0b453d31..96541c579 100644
--- a/surfsense_desktop/pnpm-lock.yaml
+++ b/surfsense_desktop/pnpm-lock.yaml
@@ -20,9 +20,6 @@ importers:
       node-mac-permissions:
         specifier: ^2.5.0
         version: 2.5.0
-      uiohook-napi:
-        specifier: ^1.5.5
-        version: 1.5.5
     devDependencies:
       '@electron/rebuild':
         specifier: ^4.0.3
@@ -1128,10 +1125,6 @@ packages:
   node-api-version@0.2.1:
     resolution: {integrity: sha512-2xP/IGGMmmSQpI1+O/k72jF/ykvZ89JeuKX3TLJAYPDVLUalrshrLHkeVcCCZqG/eEa635cr8IBYzgnDvM2O8Q==}
 
-  node-gyp-build@4.8.4:
-    resolution: {integrity: sha512-LA4ZjwlnUblHVgq0oBF3Jl/6h/Nvs5fzBLwdEF4nuxnFdsfajde4WfxtJr3CaiH+F6ewcIB/q4jQ4UzPyid+CQ==}
-    hasBin: true
-
   node-gyp@11.5.0:
     resolution: {integrity: sha512-ra7Kvlhxn5V9Slyus0ygMa2h+UqExPqUIkfk7Pc8QTLT956JLSy51uWFwHtIYy0vI8cB4BDhc/S03+880My/LQ==}
     engines: {node: ^18.17.0 || >=20.5.0}
@@ -1454,10 +1447,6 @@ packages:
     engines: {node: '>=14.17'}
     hasBin: true
 
-  uiohook-napi@1.5.5:
-    resolution: {integrity: sha512-oSlTdnECw2GBfsJPTbBQBeE4v/EXP0EZmX6BJq5nzH/JgFaBE8JpFwEA/kLhiEP7HxQw28FViWiYgdIZzWuuJQ==}
-    engines: {node: '>= 16'}
-
   undici-types@7.16.0:
     resolution: {integrity: sha512-Zz+aZWSj8LE6zoxD+xrjh4VfkIG8Ya6LvYkZqtUQGJPZjYl53ypCaUwWqo7eI0x66KBGeRo+mlBEkMSeSZ38Nw==}
 
@@ -2785,8 +2774,6 @@ snapshots:
     dependencies:
       semver: 7.7.4
 
-  node-gyp-build@4.8.4: {}
-
   node-gyp@11.5.0:
     dependencies:
       env-paths: 2.2.1
@@ -3113,10 +3100,6 @@ snapshots:
 
   typescript@5.9.3: {}
 
-  uiohook-napi@1.5.5:
-    dependencies:
-      node-gyp-build: 4.8.4
-
   undici-types@7.16.0: {}
 
   undici-types@7.18.2: {}
diff --git a/surfsense_desktop/scripts/build-electron.mjs b/surfsense_desktop/scripts/build-electron.mjs
index c2869ec46..9f507ea37 100644
--- a/surfsense_desktop/scripts/build-electron.mjs
+++ b/surfsense_desktop/scripts/build-electron.mjs
@@ -104,7 +104,7 @@ async function buildElectron() {
     bundle: true,
     platform: 'node',
     target: 'node18',
-    external: ['electron', 'uiohook-napi', 'node-mac-permissions', 'bindings', 'file-uri-to-path'],
+    external: ['electron', 'node-mac-permissions', 'bindings', 'file-uri-to-path'],
     sourcemap: true,
     minify: false,
     define: {
diff --git a/surfsense_desktop/src/ipc/channels.ts b/surfsense_desktop/src/ipc/channels.ts
index 2965f516f..905a84bc3 100644
--- a/surfsense_desktop/src/ipc/channels.ts
+++ b/surfsense_desktop/src/ipc/channels.ts
@@ -9,7 +9,6 @@ export const IPC_CHANNELS = {
   // Permissions
   GET_PERMISSIONS_STATUS: 'get-permissions-status',
   REQUEST_ACCESSIBILITY: 'request-accessibility',
-  REQUEST_INPUT_MONITORING: 'request-input-monitoring',
   RESTART_APP: 'restart-app',
   // Autocomplete
   AUTOCOMPLETE_CONTEXT: 'autocomplete-context',
diff --git a/surfsense_desktop/src/ipc/handlers.ts b/surfsense_desktop/src/ipc/handlers.ts
index a6d82be4b..8597a39e8 100644
--- a/surfsense_desktop/src/ipc/handlers.ts
+++ b/surfsense_desktop/src/ipc/handlers.ts
@@ -3,7 +3,6 @@ import { IPC_CHANNELS } from './channels';
 import {
   getPermissionsStatus,
   requestAccessibility,
-  requestInputMonitoring,
   restartApp,
 } from '../modules/permissions';
 
@@ -31,10 +30,6 @@ export function registerIpcHandlers(): void {
     requestAccessibility();
   });
 
-  ipcMain.handle(IPC_CHANNELS.REQUEST_INPUT_MONITORING, async () => {
-    return await requestInputMonitoring();
-  });
-
   ipcMain.handle(IPC_CHANNELS.RESTART_APP, () => {
     restartApp();
   });
diff --git a/surfsense_desktop/src/modules/autocomplete/index.ts b/surfsense_desktop/src/modules/autocomplete/index.ts
index 2ea37d051..3d9d67eef 100644
--- a/surfsense_desktop/src/modules/autocomplete/index.ts
+++ b/surfsense_desktop/src/modules/autocomplete/index.ts
@@ -1,152 +1,23 @@
-import { clipboard, ipcMain, screen } from 'electron';
+import { clipboard, globalShortcut, ipcMain, screen } from 'electron';
 import { IPC_CHANNELS } from '../../ipc/channels';
 import { getFrontmostApp, hasAccessibilityPermission, simulatePaste } from '../platform';
 import { getMainWindow } from '../window';
-import {
-  appendToBuffer, buildKeycodeMap, getBuffer, getBufferTrimmed,
-  getLastTrackedApp, removeLastChar, resetBuffer, resolveChar, setLastTrackedApp,
-} from './keystroke-buffer';
 import { createSuggestionWindow, destroySuggestion, getSuggestionWindow } from './suggestion-window';
 
-const DEBOUNCE_MS = 600;
-
-let uIOhook: any = null;
-let UiohookKey: any = {};
-let IGNORED_KEYCODES: Set<number> = new Set();
-
-let debounceTimer: ReturnType<typeof setTimeout> | null = null;
-let hookStarted = false;
 let autocompleteEnabled = true;
 let savedClipboard = '';
 let sourceApp = '';
 let pendingSuggestionText = '';
 
-function loadUiohook(): boolean {
-  if (uIOhook) return true;
-  try {
-    const mod = require('uiohook-napi');
-    uIOhook = mod.uIOhook;
-    UiohookKey = mod.UiohookKey;
-    IGNORED_KEYCODES = new Set([
-      UiohookKey.Shift, UiohookKey.ShiftRight,
-      UiohookKey.Ctrl, UiohookKey.CtrlRight,
-      UiohookKey.Alt, UiohookKey.AltRight,
-      UiohookKey.Meta, UiohookKey.MetaRight,
-      UiohookKey.CapsLock, UiohookKey.NumLock, UiohookKey.ScrollLock,
-      UiohookKey.F1, UiohookKey.F2, UiohookKey.F3, UiohookKey.F4,
-      UiohookKey.F5, UiohookKey.F6, UiohookKey.F7, UiohookKey.F8,
-      UiohookKey.F9, UiohookKey.F10, UiohookKey.F11, UiohookKey.F12,
-      UiohookKey.PrintScreen,
-    ]);
-    buildKeycodeMap();
-    console.log('[autocomplete] uiohook-napi loaded');
-    return true;
-  } catch (err) {
-    console.error('[autocomplete] Failed to load uiohook-napi:', err);
-    return false;
-  }
-}
-
-function clearDebounce(): void {
-  if (debounceTimer) {
-    clearTimeout(debounceTimer);
-    debounceTimer = null;
-  }
-}
-
 function isSurfSenseWindow(): boolean {
   const app = getFrontmostApp();
   return app === 'Electron' || app === 'SurfSense' || app === 'surfsense-desktop';
 }
 
-function onKeyDown(event: {
-  keycode: number;
-  shiftKey?: boolean;
-  ctrlKey?: boolean;
-  metaKey?: boolean;
-  altKey?: boolean;
-}): void {
-  if (!autocompleteEnabled) return;
-
-  const currentApp = getFrontmostApp();
-  if (currentApp !== getLastTrackedApp()) {
-    resetBuffer();
-    setLastTrackedApp(currentApp);
-  }
-
-  const win = getSuggestionWindow();
-
-  if (event.keycode === UiohookKey.Tab && win && !win.isDestroyed()) {
-    if (pendingSuggestionText) {
-      acceptAndInject(pendingSuggestionText);
-    }
-    return;
-  }
-
-  if (event.keycode === UiohookKey.Escape) {
-    if (win && !win.isDestroyed()) {
-      destroySuggestion();
-      pendingSuggestionText = '';
-    }
-    clearDebounce();
-    return;
-  }
-
-  if (currentApp === 'Electron' || currentApp === 'SurfSense' || currentApp === 'surfsense-desktop') {
-    return;
-  }
-
-  if (event.ctrlKey || event.metaKey || event.altKey) {
-    resetBuffer();
-    clearDebounce();
-    return;
-  }
-
-  if (event.keycode === UiohookKey.Backspace) {
-    removeLastChar();
-  } else if (event.keycode === UiohookKey.Delete) {
-    // forward delete doesn't affect our trailing buffer
-  } else if (event.keycode === UiohookKey.Enter) {
-    appendToBuffer('\n');
-  } else if (event.keycode === UiohookKey.Space) {
-    appendToBuffer(' ');
-  } else if (
-    event.keycode === UiohookKey.ArrowLeft || event.keycode === UiohookKey.ArrowRight ||
-    event.keycode === UiohookKey.ArrowUp || event.keycode === UiohookKey.ArrowDown ||
-    event.keycode === UiohookKey.Home || event.keycode === UiohookKey.End ||
-    event.keycode === UiohookKey.PageUp || event.keycode === UiohookKey.PageDown
-  ) {
-    resetBuffer();
-    clearDebounce();
-    return;
-  } else if (IGNORED_KEYCODES.has(event.keycode)) {
-    return;
-  } else {
-    const ch = resolveChar(event.keycode, !!event.shiftKey);
-    if (ch) appendToBuffer(ch);
-  }
-
-  if (win && !win.isDestroyed()) {
-    destroySuggestion();
-  }
-
-  clearDebounce();
-  debounceTimer = setTimeout(() => {
-    triggerAutocomplete();
-  }, DEBOUNCE_MS);
-}
-
-function onMouseClick(): void {
-  resetBuffer();
-}
-
 async function triggerAutocomplete(): Promise<void> {
   if (!hasAccessibilityPermission()) return;
   if (isSurfSenseWindow()) return;
 
-  const text = getBufferTrimmed();
-  if (!text || text.length < 5) return;
-
   sourceApp = getFrontmostApp();
   savedClipboard = clipboard.readText();
 
@@ -168,8 +39,8 @@ async function triggerAutocomplete(): Promise<void> {
     setTimeout(() => {
       if (sw && !sw.isDestroyed()) {
         sw.webContents.send(IPC_CHANNELS.AUTOCOMPLETE_CONTEXT, {
-          text: getBuffer(),
-          cursorPosition: getBuffer().length,
+          text: '',
+          cursorPosition: 0,
           searchSpaceId,
         });
       }
@@ -190,7 +61,6 @@ async function acceptAndInject(text: string): Promise<void> {
     simulatePaste();
     await new Promise((r) => setTimeout(r, 100));
     clipboard.writeText(savedClipboard);
-    appendToBuffer(text);
   } catch {
     clipboard.writeText(savedClipboard);
   }
@@ -210,7 +80,6 @@ function registerIpcHandlers(): void {
   ipcMain.handle(IPC_CHANNELS.SET_AUTOCOMPLETE_ENABLED, (_event, enabled: boolean) => {
     autocompleteEnabled = enabled;
     if (!enabled) {
-      clearDebounce();
       destroySuggestion();
     }
   });
@@ -220,25 +89,10 @@ function registerIpcHandlers(): void {
 export function registerAutocomplete(): void {
   registerIpcHandlers();
 
-  if (!loadUiohook()) {
-    console.error('[autocomplete] Cannot start: uiohook-napi failed to load');
-    return;
-  }
-
-  uIOhook.on('keydown', onKeyDown);
-  uIOhook.on('click', onMouseClick);
-  try {
-    uIOhook.start();
-    hookStarted = true;
-  } catch (err) {
-    console.error('[autocomplete] uIOhook.start() failed:', err);
-  }
+  // TODO: Phase 2 — replace with vision-based trigger (desktopCapturer + globalShortcut)
+  console.log('[autocomplete] IPC handlers registered');
 }
 
 export function unregisterAutocomplete(): void {
-  clearDebounce();
   destroySuggestion();
-  if (uIOhook && hookStarted) {
-    try { uIOhook.stop(); } catch { /* already stopped */ }
-  }
 }
diff --git a/surfsense_desktop/src/modules/autocomplete/keystroke-buffer.ts b/surfsense_desktop/src/modules/autocomplete/keystroke-buffer.ts
deleted file mode 100644
index ca232d307..000000000
--- a/surfsense_desktop/src/modules/autocomplete/keystroke-buffer.ts
+++ /dev/null
@@ -1,76 +0,0 @@
-const MAX_BUFFER_LENGTH = 4000;
-const KEYCODE_TO_CHAR: Record<number, [string, string]> = {};
-
-let keystrokeBuffer = '';
-let lastTrackedApp = '';
-
-export function buildKeycodeMap(): void {
-  const letters: [string, number][] = [
-    ['q', 16], ['w', 17], ['e', 18], ['r', 19], ['t', 20],
-    ['y', 21], ['u', 22], ['i', 23], ['o', 24], ['p', 25],
-    ['a', 30], ['s', 31], ['d', 32], ['f', 33], ['g', 34],
-    ['h', 35], ['j', 36], ['k', 37], ['l', 38],
-    ['z', 44], ['x', 45], ['c', 46], ['v', 47],
-    ['b', 48], ['n', 49], ['m', 50],
-  ];
-  for (const [ch, code] of letters) {
-    KEYCODE_TO_CHAR[code] = [ch, ch.toUpperCase()];
-  }
-
-  const digits: [string, string, number][] = [
-    ['1', '!', 2], ['2', '@', 3], ['3', '#', 4], ['4', '$', 5],
-    ['5', '%', 6], ['6', '^', 7], ['7', '&', 8], ['8', '*', 9],
-    ['9', '(', 10], ['0', ')', 11],
-  ];
-  for (const [norm, shifted, code] of digits) {
-    KEYCODE_TO_CHAR[code] = [norm, shifted];
-  }
-
-  const punctuation: [string, string, number][] = [
-    [';', ':', 39], ['=', '+', 13], [',', '<', 51], ['-', '_', 12],
-    ['.', '>', 52], ['/', '?', 53], ['`', '~', 41], ['[', '{', 26],
-    ['\\', '|', 43], [']', '}', 27], ["'", '"', 40],
-  ];
-  for (const [norm, shifted, code] of punctuation) {
-    KEYCODE_TO_CHAR[code] = [norm, shifted];
-  }
-}
-
-export function resetBuffer(): void {
-  keystrokeBuffer = '';
-}
-
-export function appendToBuffer(char: string): void {
-  keystrokeBuffer += char;
-  if (keystrokeBuffer.length > MAX_BUFFER_LENGTH) {
-    keystrokeBuffer = keystrokeBuffer.slice(-MAX_BUFFER_LENGTH);
-  }
-}
-
-export function removeLastChar(): void {
-  if (keystrokeBuffer.length > 0) {
-    keystrokeBuffer = keystrokeBuffer.slice(0, -1);
-  }
-}
-
-export function getBuffer(): string {
-  return keystrokeBuffer;
-}
-
-export function getBufferTrimmed(): string {
-  return keystrokeBuffer.trim();
-}
-
-export function getLastTrackedApp(): string {
-  return lastTrackedApp;
-}
-
-export function setLastTrackedApp(app: string): void {
-  lastTrackedApp = app;
-}
-
-export function resolveChar(keycode: number, shift: boolean): string | null {
-  const mapping = KEYCODE_TO_CHAR[keycode];
-  if (!mapping) return null;
-  return shift ? mapping[1] : mapping[0];
-}
diff --git a/surfsense_desktop/src/modules/permissions.ts b/surfsense_desktop/src/modules/permissions.ts
index 9a6159c9a..4ac671b7c 100644
--- a/surfsense_desktop/src/modules/permissions.ts
+++ b/surfsense_desktop/src/modules/permissions.ts
@@ -4,7 +4,6 @@ type PermissionStatus = 'authorized' | 'denied' | 'not determined' | 'restricted
 
 export interface PermissionsStatus {
   accessibility: PermissionStatus;
-  inputMonitoring: PermissionStatus;
 }
 
 function isMac(): boolean {
@@ -17,19 +16,18 @@ function getNodeMacPermissions() {
 
 export function getPermissionsStatus(): PermissionsStatus {
   if (!isMac()) {
-    return { accessibility: 'authorized', inputMonitoring: 'authorized' };
+    return { accessibility: 'authorized' };
   }
 
   const perms = getNodeMacPermissions();
   return {
     accessibility: perms.getAuthStatus('accessibility'),
-    inputMonitoring: perms.getAuthStatus('input-monitoring'),
   };
 }
 
 export function allPermissionsGranted(): boolean {
   const status = getPermissionsStatus();
-  return status.accessibility === 'authorized' && status.inputMonitoring === 'authorized';
+  return status.accessibility === 'authorized';
 }
 
 export function requestAccessibility(): void {
@@ -38,12 +36,6 @@ export function requestAccessibility(): void {
   perms.askForAccessibilityAccess();
 }
 
-export async function requestInputMonitoring(): Promise<string> {
-  if (!isMac()) return 'authorized';
-  const perms = getNodeMacPermissions();
-  return perms.askForInputMonitoringAccess('listen');
-}
-
 export function restartApp(): void {
   app.relaunch();
   app.exit(0);
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 956afcc46..157fe216b 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -24,7 +24,6 @@ contextBridge.exposeInMainWorld('electronAPI', {
   // Permissions
   getPermissionsStatus: () => ipcRenderer.invoke(IPC_CHANNELS.GET_PERMISSIONS_STATUS),
   requestAccessibility: () => ipcRenderer.invoke(IPC_CHANNELS.REQUEST_ACCESSIBILITY),
-  requestInputMonitoring: () => ipcRenderer.invoke(IPC_CHANNELS.REQUEST_INPUT_MONITORING),
   restartApp: () => ipcRenderer.invoke(IPC_CHANNELS.RESTART_APP),
   // Autocomplete
   onAutocompleteContext: (callback: (data: { text: string; cursorPosition: number; searchSpaceId?: string }) => void) => {
diff --git a/surfsense_web/app/desktop/permissions/page.tsx b/surfsense_web/app/desktop/permissions/page.tsx
index 8bde63357..e0d3131e0 100644
--- a/surfsense_web/app/desktop/permissions/page.tsx
+++ b/surfsense_web/app/desktop/permissions/page.tsx
@@ -10,26 +10,8 @@ type PermissionStatus = "authorized" | "denied" | "not determined" | "restricted
 
 interface PermissionsStatus {
 	accessibility: PermissionStatus;
-	inputMonitoring: PermissionStatus;
 }
 
-const STEPS = [
-	{
-		id: "input-monitoring",
-		title: "Input Monitoring",
-		description: "Helps you write faster by enriching your text with suggestions from your knowledge base.",
-		action: "requestInputMonitoring",
-		field: "inputMonitoring" as const,
-	},
-	{
-		id: "accessibility",
-		title: "Accessibility",
-		description: "Lets you accept suggestions seamlessly, right where you're typing.",
-		action: "requestAccessibility",
-		field: "accessibility" as const,
-	},
-];
-
 function StatusBadge({ status }: { status: PermissionStatus }) {
 	if (status === "authorized") {
 		return (
@@ -66,13 +48,11 @@ export default function DesktopPermissionsPage() {
 
 		let interval: ReturnType<typeof setInterval> | null = null;
 
-		const isResolved = (s: string) => s === "authorized" || s === "restricted";
-
 		const poll = async () => {
 			const status = await window.electronAPI!.getPermissionsStatus();
 			setPermissions(status);
 
-			if (isResolved(status.accessibility) && isResolved(status.inputMonitoring)) {
+			if (status.accessibility === "authorized" || status.accessibility === "restricted") {
 				if (interval) clearInterval(interval);
 			}
 		};
@@ -98,14 +78,10 @@ export default function DesktopPermissionsPage() {
 		);
 	}
 
-	const allGranted = permissions.accessibility === "authorized" && permissions.inputMonitoring === "authorized";
+	const allGranted = permissions.accessibility === "authorized";
 
-	const handleRequest = async (action: string) => {
-		if (action === "requestInputMonitoring") {
-			await window.electronAPI!.requestInputMonitoring();
-		} else if (action === "requestAccessibility") {
-			await window.electronAPI!.requestAccessibility();
-		}
+	const handleRequest = async () => {
+		await window.electronAPI!.requestAccessibility();
 	};
 
 	const handleContinue = () => {
@@ -127,61 +103,55 @@ export default function DesktopPermissionsPage() {
 					<div className="space-y-1">
 						<h1 className="text-2xl font-semibold tracking-tight">System Permissions</h1>
 						<p className="text-sm text-muted-foreground">
-							SurfSense needs two macOS permissions to provide system-wide autocomplete.
+							SurfSense needs Accessibility permission to insert suggestions into the active application.
 						</p>
 					</div>
 				</div>
 
-				{/* Steps */}
+				{/* Permission card */}
 				<div className="rounded-xl border bg-background dark:bg-neutral-900 flex-1 min-h-0 overflow-y-auto px-6 py-6 space-y-6">
-					{STEPS.map((step, index) => {
-						const status = permissions[step.field];
-						const isGranted = status === "authorized";
-
-						return (
-							<div
-								key={step.id}
-								className={`rounded-lg border p-4 transition-colors ${
-									isGranted
-										? "border-green-200 bg-green-50/50 dark:border-green-900 dark:bg-green-950/20"
-										: "border-border"
-								}`}
-							>
-								<div className="flex items-start justify-between gap-3">
-									<div className="flex items-start gap-3">
-										<span className="flex h-7 w-7 shrink-0 items-center justify-center rounded-full bg-primary/10 text-sm font-medium text-primary">
-											{isGranted ? "✓" : index + 1}
-										</span>
-										<div className="space-y-1">
-											<h3 className="text-sm font-medium">{step.title}</h3>
-											<p className="text-xs text-muted-foreground">{step.description}</p>
-										</div>
-									</div>
-									<StatusBadge status={status} />
-								</div>
-								{!isGranted && (
-									<div className="mt-3 pl-10 space-y-2">
-										<Button
-											size="sm"
-											variant="outline"
-											onClick={() => handleRequest(step.action)}
-											className="text-xs"
-										>
-											Open System Settings
-										</Button>
-									{status === "denied" && (
-										<p className="text-xs text-amber-700 dark:text-amber-400">
-											Toggle SurfSense on in System Settings to continue.
-										</p>
-									)}
+					<div
+						className={`rounded-lg border p-4 transition-colors ${
+							allGranted
+								? "border-green-200 bg-green-50/50 dark:border-green-900 dark:bg-green-950/20"
+								: "border-border"
+						}`}
+					>
+						<div className="flex items-start justify-between gap-3">
+							<div className="flex items-start gap-3">
+								<span className="flex h-7 w-7 shrink-0 items-center justify-center rounded-full bg-primary/10 text-sm font-medium text-primary">
+									{allGranted ? "\u2713" : "1"}
+								</span>
+								<div className="space-y-1">
+									<h3 className="text-sm font-medium">Accessibility</h3>
 									<p className="text-xs text-muted-foreground">
-										If SurfSense doesn&apos;t appear in the list, click <strong>+</strong> and select it from Applications.
+										Lets SurfSense insert suggestions seamlessly, right where you&apos;re typing.
 									</p>
-									</div>
-								)}
+								</div>
 							</div>
-						);
-					})}
+							<StatusBadge status={permissions.accessibility} />
+						</div>
+						{!allGranted && (
+							<div className="mt-3 pl-10 space-y-2">
+								<Button
+									size="sm"
+									variant="outline"
+									onClick={handleRequest}
+									className="text-xs"
+								>
+									Open System Settings
+								</Button>
+								{permissions.accessibility === "denied" && (
+									<p className="text-xs text-amber-700 dark:text-amber-400">
+										Toggle SurfSense on in System Settings to continue.
+									</p>
+								)}
+								<p className="text-xs text-muted-foreground">
+									If SurfSense doesn&apos;t appear in the list, click <strong>+</strong> and select it from Applications.
+								</p>
+							</div>
+						)}
+					</div>
 				</div>
 
 				{/* Footer */}
@@ -198,7 +168,7 @@ export default function DesktopPermissionsPage() {
 					) : (
 						<>
 							<Button disabled className="text-sm h-9 min-w-[180px]">
-								Grant permissions to continue
+								Grant permission to continue
 							</Button>
 							<button
 								onClick={handleSkip}
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 8cf331b42..0b312b5ec 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -17,10 +17,8 @@ interface ElectronAPI {
 	// Permissions
 	getPermissionsStatus: () => Promise<{
 		accessibility: 'authorized' | 'denied' | 'not determined' | 'restricted' | 'limited';
-		inputMonitoring: 'authorized' | 'denied' | 'not determined' | 'restricted' | 'limited';
 	}>;
 	requestAccessibility: () => Promise<void>;
-	requestInputMonitoring: () => Promise<void>;
 	restartApp: () => Promise<void>;
 	// Autocomplete
 	onAutocompleteContext: (callback: (data: { text: string; cursorPosition: number; searchSpaceId?: string }) => void) => () => void;

From fb20b0444f5058cc57a3edbd77e2fd6bffe76409 Mon Sep 17 00:00:00 2001
From: ArvinFarrelP <farel877629@gmail.com>
Date: Fri, 3 Apr 2026 21:51:08 +0700
Subject: [PATCH 099/202] fix(navbar): remove key prop causing unnecessary
 remount in mobile navbar

---
 surfsense_web/components/homepage/navbar.tsx | 1 -
 1 file changed, 1 deletion(-)

diff --git a/surfsense_web/components/homepage/navbar.tsx b/surfsense_web/components/homepage/navbar.tsx
index 6ed5265bc..5dfacafb6 100644
--- a/surfsense_web/components/homepage/navbar.tsx
+++ b/surfsense_web/components/homepage/navbar.tsx
@@ -143,7 +143,6 @@ const MobileNav = ({ navItems, isScrolled, scrolledBgClassName }: any) => {
 		<motion.div
 			ref={navRef}
 			animate={{ borderRadius: open ? "4px" : "2rem" }}
-			key={String(open)}
 			className={cn(
 				"relative mx-auto flex w-full max-w-[calc(100vw-2rem)] flex-col items-center justify-between px-4 py-2 lg:hidden transition-all duration-300",
 				isScrolled

From bb84bb25a313be2397947a1b6a9bb9ac7e2db1d4 Mon Sep 17 00:00:00 2001
From: ArvinFarrelP <farel877629@gmail.com>
Date: Fri, 3 Apr 2026 22:11:21 +0700
Subject: [PATCH 100/202] perf(images): add sizes prop to improve Next.js image
 loading

---
 surfsense_web/components/homepage/features-bento-grid.tsx | 1 +
 surfsense_web/components/tool-ui/image/index.tsx          | 1 +
 surfsense_web/mdx-components.tsx                          | 3 ++-
 3 files changed, 4 insertions(+), 1 deletion(-)

diff --git a/surfsense_web/components/homepage/features-bento-grid.tsx b/surfsense_web/components/homepage/features-bento-grid.tsx
index 07fe4fc22..32cbe2582 100644
--- a/surfsense_web/components/homepage/features-bento-grid.tsx
+++ b/surfsense_web/components/homepage/features-bento-grid.tsx
@@ -408,6 +408,7 @@ const AudioCommentIllustration = () => (
 			src="/homepage/comments-audio.webp"
 			alt="Audio Comment Illustration"
 			fill
+			sizes="(max-width: 768px) 100vw, (max-width: 1024px) 50vw, 33vw"
 			className="object-cover"
 		/>
 	</div>
diff --git a/surfsense_web/components/tool-ui/image/index.tsx b/surfsense_web/components/tool-ui/image/index.tsx
index 81c55d10a..9c39f4928 100644
--- a/surfsense_web/components/tool-ui/image/index.tsx
+++ b/surfsense_web/components/tool-ui/image/index.tsx
@@ -307,6 +307,7 @@ export function Image({
 							src={src}
 							alt={alt}
 							fill
+							sizes="(max-width: 512px) 100vw, 512px"
 							className={cn(
 								"transition-transform duration-300",
 								fit === "cover" ? "object-cover" : "object-contain",
diff --git a/surfsense_web/mdx-components.tsx b/surfsense_web/mdx-components.tsx
index 9dedbd20f..8297f732d 100644
--- a/surfsense_web/mdx-components.tsx
+++ b/surfsense_web/mdx-components.tsx
@@ -15,8 +15,9 @@ export function getMDXComponents(components?: MDXComponents): MDXComponents {
 		img: ({ className, alt, ...props }: React.ComponentProps<"img">) => (
 			<Image
 				{...(props as ImageProps)}
-				className={cn("rounded-md border", className)}
 				alt={alt ?? ""}
+				sizes="(max-width: 768px) 100vw, 896px"
+				className={cn("rounded-md border", className)}
 			/>
 		),
 		Video: ({ className, ...props }: React.ComponentProps<"video">) => (

From 482238e5d4f53b71dba757e5a93c2821d814b2b4 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Fri, 3 Apr 2026 17:40:27 +0200
Subject: [PATCH 101/202] add vision LLM role for screenshot analysis

---
 .../117_add_vision_llm_id_to_search_spaces.py | 39 +++++++++++++++++++
 surfsense_backend/app/db.py                   |  3 ++
 .../app/routes/search_spaces_routes.py        |  6 +++
 .../app/schemas/new_llm_config.py             |  9 +++++
 surfsense_backend/app/services/llm_service.py | 12 +++++-
 .../components/settings/llm-role-manager.tsx  | 21 +++++++++-
 .../contracts/types/new-llm-config.types.ts   |  3 ++
 7 files changed, 91 insertions(+), 2 deletions(-)
 create mode 100644 surfsense_backend/alembic/versions/117_add_vision_llm_id_to_search_spaces.py

diff --git a/surfsense_backend/alembic/versions/117_add_vision_llm_id_to_search_spaces.py b/surfsense_backend/alembic/versions/117_add_vision_llm_id_to_search_spaces.py
new file mode 100644
index 000000000..254642c88
--- /dev/null
+++ b/surfsense_backend/alembic/versions/117_add_vision_llm_id_to_search_spaces.py
@@ -0,0 +1,39 @@
+"""117_add_vision_llm_id_to_search_spaces
+
+Revision ID: 117
+Revises: 116
+
+Adds vision_llm_id column to search_spaces for vision/screenshot analysis
+LLM role assignment. Defaults to 0 (Auto mode), same convention as
+agent_llm_id and document_summary_llm_id.
+"""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+
+import sqlalchemy as sa
+
+from alembic import op
+
+revision: str = "117"
+down_revision: str | None = "116"
+branch_labels: str | Sequence[str] | None = None
+depends_on: str | Sequence[str] | None = None
+
+
+def upgrade() -> None:
+    conn = op.get_bind()
+    existing_columns = [
+        col["name"] for col in sa.inspect(conn).get_columns("search_spaces")
+    ]
+
+    if "vision_llm_id" not in existing_columns:
+        op.add_column(
+            "search_spaces",
+            sa.Column("vision_llm_id", sa.Integer(), nullable=True, server_default="0"),
+        )
+
+
+def downgrade() -> None:
+    op.drop_column("search_spaces", "vision_llm_id")
diff --git a/surfsense_backend/app/db.py b/surfsense_backend/app/db.py
index 90630cc83..2dfbdd97f 100644
--- a/surfsense_backend/app/db.py
+++ b/surfsense_backend/app/db.py
@@ -1329,6 +1329,9 @@ class SearchSpace(BaseModel, TimestampMixin):
     image_generation_config_id = Column(
         Integer, nullable=True, default=0
     )  # For image generation, defaults to Auto mode
+    vision_llm_id = Column(
+        Integer, nullable=True, default=0
+    )  # For vision/screenshot analysis, defaults to Auto mode
 
     user_id = Column(
         UUID(as_uuid=True), ForeignKey("user.id", ondelete="CASCADE"), nullable=False
diff --git a/surfsense_backend/app/routes/search_spaces_routes.py b/surfsense_backend/app/routes/search_spaces_routes.py
index 7f6638e2c..c4f1ab035 100644
--- a/surfsense_backend/app/routes/search_spaces_routes.py
+++ b/surfsense_backend/app/routes/search_spaces_routes.py
@@ -522,14 +522,17 @@ async def get_llm_preferences(
         image_generation_config = await _get_image_gen_config_by_id(
             session, search_space.image_generation_config_id
         )
+        vision_llm = await _get_llm_config_by_id(session, search_space.vision_llm_id)
 
         return LLMPreferencesRead(
             agent_llm_id=search_space.agent_llm_id,
             document_summary_llm_id=search_space.document_summary_llm_id,
             image_generation_config_id=search_space.image_generation_config_id,
+            vision_llm_id=search_space.vision_llm_id,
             agent_llm=agent_llm,
             document_summary_llm=document_summary_llm,
             image_generation_config=image_generation_config,
+            vision_llm=vision_llm,
         )
 
     except HTTPException:
@@ -589,14 +592,17 @@ async def update_llm_preferences(
         image_generation_config = await _get_image_gen_config_by_id(
             session, search_space.image_generation_config_id
         )
+        vision_llm = await _get_llm_config_by_id(session, search_space.vision_llm_id)
 
         return LLMPreferencesRead(
             agent_llm_id=search_space.agent_llm_id,
             document_summary_llm_id=search_space.document_summary_llm_id,
             image_generation_config_id=search_space.image_generation_config_id,
+            vision_llm_id=search_space.vision_llm_id,
             agent_llm=agent_llm,
             document_summary_llm=document_summary_llm,
             image_generation_config=image_generation_config,
+            vision_llm=vision_llm,
         )
 
     except HTTPException:
diff --git a/surfsense_backend/app/schemas/new_llm_config.py b/surfsense_backend/app/schemas/new_llm_config.py
index 9863665b6..2deddd7f2 100644
--- a/surfsense_backend/app/schemas/new_llm_config.py
+++ b/surfsense_backend/app/schemas/new_llm_config.py
@@ -182,6 +182,9 @@ class LLMPreferencesRead(BaseModel):
     image_generation_config_id: int | None = Field(
         None, description="ID of the image generation config to use"
     )
+    vision_llm_id: int | None = Field(
+        None, description="ID of the LLM config to use for vision/screenshot analysis"
+    )
     agent_llm: dict[str, Any] | None = Field(
         None, description="Full config for agent LLM"
     )
@@ -191,6 +194,9 @@ class LLMPreferencesRead(BaseModel):
     image_generation_config: dict[str, Any] | None = Field(
         None, description="Full config for image generation"
     )
+    vision_llm: dict[str, Any] | None = Field(
+        None, description="Full config for vision LLM"
+    )
 
     model_config = ConfigDict(from_attributes=True)
 
@@ -207,3 +213,6 @@ class LLMPreferencesUpdate(BaseModel):
     image_generation_config_id: int | None = Field(
         None, description="ID of the image generation config to use"
     )
+    vision_llm_id: int | None = Field(
+        None, description="ID of the LLM config to use for vision/screenshot analysis"
+    )
diff --git a/surfsense_backend/app/services/llm_service.py b/surfsense_backend/app/services/llm_service.py
index 59f52a4eb..7c0f9e7e3 100644
--- a/surfsense_backend/app/services/llm_service.py
+++ b/surfsense_backend/app/services/llm_service.py
@@ -32,6 +32,7 @@ logger = logging.getLogger(__name__)
 class LLMRole:
     AGENT = "agent"  # For agent/chat operations
     DOCUMENT_SUMMARY = "document_summary"  # For document summarization
+    VISION = "vision"  # For vision/screenshot analysis
 
 
 def get_global_llm_config(llm_config_id: int) -> dict | None:
@@ -187,7 +188,7 @@ async def get_search_space_llm_instance(
     Args:
         session: Database session
         search_space_id: Search Space ID
-        role: LLM role ('agent' or 'document_summary')
+        role: LLM role ('agent', 'document_summary', or 'vision')
 
     Returns:
         ChatLiteLLM or ChatLiteLLMRouter instance, or None if not found
@@ -209,6 +210,8 @@ async def get_search_space_llm_instance(
             llm_config_id = search_space.agent_llm_id
         elif role == LLMRole.DOCUMENT_SUMMARY:
             llm_config_id = search_space.document_summary_llm_id
+        elif role == LLMRole.VISION:
+            llm_config_id = search_space.vision_llm_id
         else:
             logger.error(f"Invalid LLM role: {role}")
             return None
@@ -405,6 +408,13 @@ async def get_document_summary_llm(
     )
 
 
+async def get_vision_llm(
+    session: AsyncSession, search_space_id: int
+) -> ChatLiteLLM | ChatLiteLLMRouter | None:
+    """Get the search space's vision LLM instance for screenshot analysis."""
+    return await get_search_space_llm_instance(session, search_space_id, LLMRole.VISION)
+
+
 # Backward-compatible alias (LLM preferences are now per-search-space, not per-user)
 async def get_user_long_context_llm(
     session: AsyncSession,
diff --git a/surfsense_web/components/settings/llm-role-manager.tsx b/surfsense_web/components/settings/llm-role-manager.tsx
index 07ec492a3..eaf14d8e8 100644
--- a/surfsense_web/components/settings/llm-role-manager.tsx
+++ b/surfsense_web/components/settings/llm-role-manager.tsx
@@ -6,6 +6,7 @@ import {
 	Bot,
 	CheckCircle,
 	CircleDashed,
+	Eye,
 	FileText,
 	ImageIcon,
 	RefreshCw,
@@ -71,6 +72,15 @@ const ROLE_DESCRIPTIONS = {
 		prefKey: "image_generation_config_id" as const,
 		configType: "image" as const,
 	},
+	vision: {
+		icon: Eye,
+		title: "Vision LLM",
+		description: "Vision-capable model for screenshot analysis and context extraction",
+		color: "text-amber-600 dark:text-amber-400",
+		bgColor: "bg-amber-500/10",
+		prefKey: "vision_llm_id" as const,
+		configType: "llm" as const,
+	},
 };
 
 interface LLMRoleManagerProps {
@@ -116,6 +126,7 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 		agent_llm_id: preferences.agent_llm_id ?? "",
 		document_summary_llm_id: preferences.document_summary_llm_id ?? "",
 		image_generation_config_id: preferences.image_generation_config_id ?? "",
+		vision_llm_id: preferences.vision_llm_id ?? "",
 	}));
 
 	const [hasChanges, setHasChanges] = useState(false);
@@ -126,6 +137,7 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 			agent_llm_id: preferences.agent_llm_id ?? "",
 			document_summary_llm_id: preferences.document_summary_llm_id ?? "",
 			image_generation_config_id: preferences.image_generation_config_id ?? "",
+			vision_llm_id: preferences.vision_llm_id ?? "",
 		};
 		setAssignments(newAssignments);
 		setHasChanges(false);
@@ -133,6 +145,7 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 		preferences?.agent_llm_id,
 		preferences?.document_summary_llm_id,
 		preferences?.image_generation_config_id,
+		preferences?.vision_llm_id,
 	]);
 
 	const handleRoleAssignment = (prefKey: string, configId: string) => {
@@ -147,6 +160,7 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 			agent_llm_id: preferences.agent_llm_id ?? "",
 			document_summary_llm_id: preferences.document_summary_llm_id ?? "",
 			image_generation_config_id: preferences.image_generation_config_id ?? "",
+			vision_llm_id: preferences.vision_llm_id ?? "",
 		};
 
 		const hasChangesNow = Object.keys(newAssignments).some(
@@ -168,6 +182,7 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 			agent_llm_id: toNumericOrUndefined(assignments.agent_llm_id),
 			document_summary_llm_id: toNumericOrUndefined(assignments.document_summary_llm_id),
 			image_generation_config_id: toNumericOrUndefined(assignments.image_generation_config_id),
+			vision_llm_id: toNumericOrUndefined(assignments.vision_llm_id),
 		};
 
 		await updatePreferences({
@@ -186,6 +201,7 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 			agent_llm_id: preferences.agent_llm_id ?? "",
 			document_summary_llm_id: preferences.document_summary_llm_id ?? "",
 			image_generation_config_id: preferences.image_generation_config_id ?? "",
+			vision_llm_id: preferences.vision_llm_id ?? "",
 		});
 		setHasChanges(false);
 	};
@@ -199,7 +215,10 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 		assignments.document_summary_llm_id !== undefined &&
 		assignments.image_generation_config_id !== "" &&
 		assignments.image_generation_config_id !== null &&
-		assignments.image_generation_config_id !== undefined;
+		assignments.image_generation_config_id !== undefined &&
+		assignments.vision_llm_id !== "" &&
+		assignments.vision_llm_id !== null &&
+		assignments.vision_llm_id !== undefined;
 
 	// Combine global and custom LLM configs
 	const allLLMConfigs = [
diff --git a/surfsense_web/contracts/types/new-llm-config.types.ts b/surfsense_web/contracts/types/new-llm-config.types.ts
index 3bb43680a..3fbdb86ea 100644
--- a/surfsense_web/contracts/types/new-llm-config.types.ts
+++ b/surfsense_web/contracts/types/new-llm-config.types.ts
@@ -264,9 +264,11 @@ export const llmPreferences = z.object({
 	agent_llm_id: z.union([z.number(), z.null()]).optional(),
 	document_summary_llm_id: z.union([z.number(), z.null()]).optional(),
 	image_generation_config_id: z.union([z.number(), z.null()]).optional(),
+	vision_llm_id: z.union([z.number(), z.null()]).optional(),
 	agent_llm: z.union([z.record(z.string(), z.unknown()), z.null()]).optional(),
 	document_summary_llm: z.union([z.record(z.string(), z.unknown()), z.null()]).optional(),
 	image_generation_config: z.union([z.record(z.string(), z.unknown()), z.null()]).optional(),
+	vision_llm: z.union([z.record(z.string(), z.unknown()), z.null()]).optional(),
 });
 
 /**
@@ -287,6 +289,7 @@ export const updateLLMPreferencesRequest = z.object({
 		agent_llm_id: true,
 		document_summary_llm_id: true,
 		image_generation_config_id: true,
+		vision_llm_id: true,
 	}),
 });
 

From 339ff7fdf4f4778782193275e7f51712ec5f2cb2 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Fri, 3 Apr 2026 17:47:33 +0200
Subject: [PATCH 102/202] add screenshot capture module using desktopCapturer

---
 .../src/modules/autocomplete/screenshot.ts    | 27 +++++++++++++++++++
 1 file changed, 27 insertions(+)
 create mode 100644 surfsense_desktop/src/modules/autocomplete/screenshot.ts

diff --git a/surfsense_desktop/src/modules/autocomplete/screenshot.ts b/surfsense_desktop/src/modules/autocomplete/screenshot.ts
new file mode 100644
index 000000000..22b7c1b14
--- /dev/null
+++ b/surfsense_desktop/src/modules/autocomplete/screenshot.ts
@@ -0,0 +1,27 @@
+import { desktopCapturer, screen } from 'electron';
+
+/**
+ * Captures the primary display as a base64-encoded PNG data URL at the display's size.
+ * @returns The data URL, or `null` if no screen source is found or capture throws.
+ */
+export async function captureScreen(): Promise<string | null> {
+  try {
+    const primaryDisplay = screen.getPrimaryDisplay();
+    const { width, height } = primaryDisplay.size;
+    const sources = await desktopCapturer.getSources({
+      types: ['screen'],
+      thumbnailSize: { width, height },
+    });
+    if (!sources.length) {
+      console.error('[screenshot] No screen sources found');
+      return null;
+    }
+    // Match the primary display by display_id (may be ''), else use the first source.
+    const primaryId = String(primaryDisplay.id);
+    const source = sources.find((s) => s.display_id === primaryId) ?? sources[0];
+    return source.thumbnail.toDataURL();
+  } catch (err) {
+    console.error('[screenshot] Failed to capture screen:', err);
+    return null;
+  }
+}

From ced7f7562a88275e1c778fe7650b12e1742f094a Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Fri, 3 Apr 2026 18:09:54 +0200
Subject: [PATCH 103/202] wire global shortcut and screenshot into autocomplete
 trigger

---
 .../src/modules/autocomplete/index.ts         | 31 ++++++++++++++++---
 1 file changed, 27 insertions(+), 4 deletions(-)

diff --git a/surfsense_desktop/src/modules/autocomplete/index.ts b/surfsense_desktop/src/modules/autocomplete/index.ts
index 3d9d67eef..6763b2cae 100644
--- a/surfsense_desktop/src/modules/autocomplete/index.ts
+++ b/surfsense_desktop/src/modules/autocomplete/index.ts
@@ -2,8 +2,11 @@ import { clipboard, globalShortcut, ipcMain, screen } from 'electron';
 import { IPC_CHANNELS } from '../../ipc/channels';
 import { getFrontmostApp, hasAccessibilityPermission, simulatePaste } from '../platform';
 import { getMainWindow } from '../window';
+import { captureScreen } from './screenshot';
 import { createSuggestionWindow, destroySuggestion, getSuggestionWindow } from './suggestion-window';
 
+const SHORTCUT = 'CommandOrControl+Shift+Space';
+
 let autocompleteEnabled = true;
 let savedClipboard = '';
 let sourceApp = '';
@@ -15,12 +18,19 @@ function isSurfSenseWindow(): boolean {
 }
 
 async function triggerAutocomplete(): Promise<void> {
+  if (!autocompleteEnabled) return;
   if (!hasAccessibilityPermission()) return;
   if (isSurfSenseWindow()) return;
 
   sourceApp = getFrontmostApp();
   savedClipboard = clipboard.readText();
 
+  const screenshot = await captureScreen();
+  if (!screenshot) {
+    console.error('[autocomplete] Screenshot capture failed');
+    return;
+  }
+
   const cursor = screen.getCursorScreenPoint();
   const win = createSuggestionWindow(cursor.x, cursor.y);
 
@@ -39,8 +49,7 @@ async function triggerAutocomplete(): Promise<void> {
     setTimeout(() => {
       if (sw && !sw.isDestroyed()) {
         sw.webContents.send(IPC_CHANNELS.AUTOCOMPLETE_CONTEXT, {
-          text: '',
-          cursorPosition: 0,
+          screenshot,
           searchSpaceId,
         });
       }
@@ -89,10 +98,24 @@ function registerIpcHandlers(): void {
 export function registerAutocomplete(): void {
   registerIpcHandlers();
 
-  // TODO: Phase 2 — replace with vision-based trigger (desktopCapturer + globalShortcut)
-  console.log('[autocomplete] IPC handlers registered');
+  const ok = globalShortcut.register(SHORTCUT, () => {
+    const sw = getSuggestionWindow();
+    if (sw && !sw.isDestroyed()) {
+      destroySuggestion();
+      pendingSuggestionText = '';
+      return;
+    }
+    triggerAutocomplete();
+  });
+
+  if (!ok) {
+    console.error(`[autocomplete] Failed to register shortcut ${SHORTCUT}`);
+  } else {
+    console.log(`[autocomplete] Registered shortcut ${SHORTCUT}`);
+  }
 }
 
 export function unregisterAutocomplete(): void {
+  globalShortcut.unregister(SHORTCUT);
   destroySuggestion();
 }

From aeb3f13f9113d9f53d507c88c8bfc0f4e4bd1484 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Fri, 3 Apr 2026 18:17:50 +0200
Subject: [PATCH 104/202] replace text-based autocomplete with vision-based
 endpoint

---
 .../app/routes/autocomplete_routes.py         |  23 ++--
 .../app/services/autocomplete_service.py      | 110 ------------------
 .../services/vision_autocomplete_service.py   |  78 +++++++++++++
 surfsense_desktop/src/preload.ts              |   4 +-
 surfsense_web/app/desktop/suggestion/page.tsx |  18 +--
 surfsense_web/types/window.d.ts               |   2 +-
 6 files changed, 102 insertions(+), 133 deletions(-)
 delete mode 100644 surfsense_backend/app/services/autocomplete_service.py
 create mode 100644 surfsense_backend/app/services/vision_autocomplete_service.py

diff --git a/surfsense_backend/app/routes/autocomplete_routes.py b/surfsense_backend/app/routes/autocomplete_routes.py
index 68c56d0e0..329476ca1 100644
--- a/surfsense_backend/app/routes/autocomplete_routes.py
+++ b/surfsense_backend/app/routes/autocomplete_routes.py
@@ -1,28 +1,29 @@
-from fastapi import APIRouter, Depends, Query
+from fastapi import APIRouter, Depends
 from fastapi.responses import StreamingResponse
+from pydantic import BaseModel
 from sqlalchemy.ext.asyncio import AsyncSession
 
 from app.db import User, get_async_session
-from app.services.autocomplete_service import stream_autocomplete
 from app.services.new_streaming_service import VercelStreamingService
+from app.services.vision_autocomplete_service import stream_vision_autocomplete
 from app.users import current_active_user
 
 router = APIRouter(prefix="/autocomplete", tags=["autocomplete"])
 
 
-@router.post("/stream")
-async def autocomplete_stream(
-    text: str = Query(..., description="Current text in the input field"),
-    cursor_position: int = Query(-1, description="Cursor position in the text (-1 for end)"),
-    search_space_id: int = Query(..., description="Search space ID for KB context and LLM config"),
+class VisionAutocompleteRequest(BaseModel):
+    screenshot: str
+    search_space_id: int
+
+
+@router.post("/vision/stream")
+async def vision_autocomplete_stream(
+    body: VisionAutocompleteRequest,
     user: User = Depends(current_active_user),
     session: AsyncSession = Depends(get_async_session),
 ):
-    if cursor_position < 0:
-        cursor_position = len(text)
-
     return StreamingResponse(
-        stream_autocomplete(text, cursor_position, search_space_id, session),
+        stream_vision_autocomplete(body.screenshot, body.search_space_id, session),
         media_type="text/event-stream",
         headers={
             **VercelStreamingService.get_response_headers(),
diff --git a/surfsense_backend/app/services/autocomplete_service.py b/surfsense_backend/app/services/autocomplete_service.py
deleted file mode 100644
index 7c172275d..000000000
--- a/surfsense_backend/app/services/autocomplete_service.py
+++ /dev/null
@@ -1,110 +0,0 @@
-import logging
-from typing import AsyncGenerator
-
-from langchain_core.messages import HumanMessage, SystemMessage
-from sqlalchemy.ext.asyncio import AsyncSession
-
-from app.retriever.chunks_hybrid_search import ChucksHybridSearchRetriever
-from app.services.llm_service import get_agent_llm
-from app.services.new_streaming_service import VercelStreamingService
-
-logger = logging.getLogger(__name__)
-
-SYSTEM_PROMPT = """You are an inline text autocomplete engine. Your job is to complete the user's text naturally.
-
-Rules:
-- Output ONLY the continuation text. Do NOT repeat what the user already typed.
-- Keep completions concise: 1-3 sentences maximum.
-- Match the user's tone, style, and language.
-- If knowledge base context is provided, use it to make the completion factually accurate and personalized.
-- Do NOT add quotes, explanations, or meta-commentary.
-- Do NOT start with a space unless grammatically required.
-- If you cannot produce a useful completion, output nothing."""
-
-KB_CONTEXT_TEMPLATE = """
-Relevant knowledge base context (use this to personalize the completion):
----
-{kb_context}
----
-"""
-
-
-async def _retrieve_kb_context(
-    session: AsyncSession,
-    text: str,
-    search_space_id: int,
-) -> str:
-    try:
-        retriever = ChucksHybridSearchRetriever(session)
-        chunks = await retriever.vector_search(
-            query_text=text[-200:],
-            top_k=3,
-            search_space_id=search_space_id,
-        )
-        if not chunks:
-            return ""
-        snippets = []
-        for chunk in chunks:
-            content = getattr(chunk, "content", None) or getattr(chunk, "chunk_text", "")
-            if content:
-                snippets.append(content[:300])
-        if not snippets:
-            return ""
-        return KB_CONTEXT_TEMPLATE.format(kb_context="\n\n".join(snippets))
-    except Exception as e:
-        logger.warning(f"KB search failed for autocomplete, proceeding without context: {e}")
-        return ""
-
-
-async def stream_autocomplete(
-    text: str,
-    cursor_position: int,
-    search_space_id: int,
-    session: AsyncSession,
-) -> AsyncGenerator[str, None]:
-    """Build context, call the LLM, and yield SSE-formatted tokens."""
-    streaming = VercelStreamingService()
-    text_before_cursor = text[:cursor_position] if cursor_position >= 0 else text
-
-    if not text_before_cursor.strip():
-        yield streaming.format_message_start()
-        yield streaming.format_finish()
-        yield streaming.format_done()
-        return
-
-    kb_context = await _retrieve_kb_context(session, text_before_cursor, search_space_id)
-
-    llm = await get_agent_llm(session, search_space_id)
-    if not llm:
-        yield streaming.format_message_start()
-        yield streaming.format_error("No LLM configured for this search space")
-        yield streaming.format_done()
-        return
-
-    system_prompt = SYSTEM_PROMPT
-    if kb_context:
-        system_prompt += kb_context
-
-    messages = [
-        SystemMessage(content=system_prompt),
-        HumanMessage(content=f"Complete this text:\n{text_before_cursor}"),
-    ]
-
-    try:
-        yield streaming.format_message_start()
-        text_id = streaming.generate_text_id()
-        yield streaming.format_text_start(text_id)
-
-        async for chunk in llm.astream(messages):
-            token = chunk.content if hasattr(chunk, "content") else str(chunk)
-            if token:
-                yield streaming.format_text_delta(text_id, token)
-
-        yield streaming.format_text_end(text_id)
-        yield streaming.format_finish()
-        yield streaming.format_done()
-
-    except Exception as e:
-        logger.error(f"Autocomplete streaming error: {e}")
-        yield streaming.format_error(str(e))
-        yield streaming.format_done()
diff --git a/surfsense_backend/app/services/vision_autocomplete_service.py b/surfsense_backend/app/services/vision_autocomplete_service.py
new file mode 100644
index 000000000..526b0d35c
--- /dev/null
+++ b/surfsense_backend/app/services/vision_autocomplete_service.py
@@ -0,0 +1,78 @@
+import logging
+from typing import AsyncGenerator
+
+from langchain_core.messages import HumanMessage, SystemMessage
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from app.services.llm_service import get_vision_llm
+from app.services.new_streaming_service import VercelStreamingService
+
+logger = logging.getLogger(__name__)
+
+VISION_SYSTEM_PROMPT = """You are a smart writing assistant that analyzes the user's screen to draft or complete text.
+
+You will receive a screenshot of the user's screen. Your job:
+1. Analyze the ENTIRE screenshot to understand what the user is working on (email thread, chat conversation, document, code editor, form, etc.).
+2. Identify the text area where the user will type.
+3. Based on the full visual context, generate the text the user most likely wants to write.
+
+Key behavior:
+- If the text area is EMPTY, draft a full response or message based on what you see on screen (e.g., reply to an email, respond to a chat message, continue a document).
+- If the text area already has text, continue it naturally.
+
+Rules:
+- Output ONLY the text to be inserted. No quotes, no explanations, no meta-commentary.
+- Be concise but complete — a full thought, not a fragment.
+- Match the tone and formality of the surrounding context.
+- If the screen shows code, write code. If it shows a casual chat, be casual. If it shows a formal email, be formal.
+- Do NOT describe the screenshot or explain your reasoning.
+- If you cannot determine what to write, output nothing."""
+
+
+async def stream_vision_autocomplete(
+    screenshot_data_url: str,
+    search_space_id: int,
+    session: AsyncSession,
+) -> AsyncGenerator[str, None]:
+    """Stream the vision LLM's completion for a screenshot as formatted stream events.
+
+    Yields an error event instead when ``screenshot_data_url`` is not an inline
+    ``data:image/`` URL, no Vision LLM is configured, or the LLM call raises.
+    """
+    streaming = VercelStreamingService()
+    # Enforce the data-URL contract: never forward a client-supplied remote URL.
+    if not screenshot_data_url.startswith("data:image/"):
+        yield streaming.format_message_start()
+        yield streaming.format_error("Screenshot must be a data:image URL")
+        yield streaming.format_done()
+        return
+
+    llm = await get_vision_llm(session, search_space_id)
+    if not llm:
+        yield streaming.format_message_start()
+        yield streaming.format_error("No Vision LLM configured for this search space")
+        yield streaming.format_done()
+        return
+
+    messages = [
+        SystemMessage(content=VISION_SYSTEM_PROMPT),
+        HumanMessage(content=[
+            {"type": "text", "text": "Analyze this screenshot. Understand the full context of what the user is working on, then generate the text they most likely want to write in the active text area."},
+            {"type": "image_url", "image_url": {"url": screenshot_data_url}},
+        ]),
+    ]
+    try:
+        yield streaming.format_message_start()
+        text_id = streaming.generate_text_id()
+        yield streaming.format_text_start(text_id)
+        async for chunk in llm.astream(messages):
+            token = chunk.content if hasattr(chunk, "content") else str(chunk)
+            if token:
+                yield streaming.format_text_delta(text_id, token)
+        yield streaming.format_text_end(text_id)
+        yield streaming.format_finish()
+        yield streaming.format_done()
+    except Exception as e:
+        logger.exception("Vision autocomplete streaming error: %s", e)
+        yield streaming.format_error(str(e))
+        yield streaming.format_done()
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 157fe216b..891d9b029 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -26,8 +26,8 @@ contextBridge.exposeInMainWorld('electronAPI', {
   requestAccessibility: () => ipcRenderer.invoke(IPC_CHANNELS.REQUEST_ACCESSIBILITY),
   restartApp: () => ipcRenderer.invoke(IPC_CHANNELS.RESTART_APP),
   // Autocomplete
-  onAutocompleteContext: (callback: (data: { text: string; cursorPosition: number; searchSpaceId?: string }) => void) => {
-    const listener = (_event: unknown, data: { text: string; cursorPosition: number; searchSpaceId?: string }) => callback(data);
+  onAutocompleteContext: (callback: (data: { screenshot: string; searchSpaceId?: string }) => void) => {
+    const listener = (_event: unknown, data: { screenshot: string; searchSpaceId?: string }) => callback(data);
     ipcRenderer.on(IPC_CHANNELS.AUTOCOMPLETE_CONTEXT, listener);
     return () => {
       ipcRenderer.removeListener(IPC_CHANNELS.AUTOCOMPLETE_CONTEXT, listener);
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index 69a19e3f1..2c147eb25 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -18,7 +18,7 @@ export default function SuggestionPage() {
 	const abortRef = useRef<AbortController | null>(null);
 
 	const fetchSuggestion = useCallback(
-		async (text: string, cursorPosition: number, searchSpaceId: string) => {
+		async (screenshot: string, searchSpaceId: string) => {
 			abortRef.current?.abort();
 			const controller = new AbortController();
 			abortRef.current = controller;
@@ -37,21 +37,19 @@ export default function SuggestionPage() {
 			const backendUrl =
 				process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL || "http://localhost:8000";
 
-			const params = new URLSearchParams({
-				text,
-				cursor_position: String(cursorPosition),
-				search_space_id: searchSpaceId,
-			});
-
 			try {
 				const response = await fetch(
-					`${backendUrl}/api/v1/autocomplete/stream?${params}`,
+					`${backendUrl}/api/v1/autocomplete/vision/stream`,
 					{
 						method: "POST",
 						headers: {
 							Authorization: `Bearer ${token}`,
 							"Content-Type": "application/json",
 						},
+						body: JSON.stringify({
+							screenshot,
+							search_space_id: parseInt(searchSpaceId, 10),
+						}),
 						signal: controller.signal,
 					},
 				);
@@ -119,7 +117,9 @@ export default function SuggestionPage() {
 
 		const cleanup = window.electronAPI.onAutocompleteContext((data) => {
 			const searchSpaceId = data.searchSpaceId || "1";
-			fetchSuggestion(data.text, data.cursorPosition, searchSpaceId);
+			if (data.screenshot) {
+				fetchSuggestion(data.screenshot, searchSpaceId);
+			}
 		});
 
 		return cleanup;
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 0b312b5ec..a5b8566f9 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -21,7 +21,7 @@ interface ElectronAPI {
 	requestAccessibility: () => Promise<void>;
 	restartApp: () => Promise<void>;
 	// Autocomplete
-	onAutocompleteContext: (callback: (data: { text: string; cursorPosition: number; searchSpaceId?: string }) => void) => () => void;
+	onAutocompleteContext: (callback: (data: { screenshot: string; searchSpaceId?: string }) => void) => () => void;
 	acceptSuggestion: (text: string) => Promise<void>;
 	dismissSuggestion: () => Promise<void>;
 	updateSuggestionText: (text: string) => Promise<void>;

From af5977691b399f315b1ea1b6f380bb7fea42bc35 Mon Sep 17 00:00:00 2001
From: sukarxn <thecodersmailbox@gmail.com>
Date: Fri, 3 Apr 2026 23:23:54 +0530
Subject: [PATCH 105/202] perf: optimize ui components with react hooks
 memoization

- toggle-group.tsx: Wrap contextValue in useMemo to prevent unnecessary re-renders
- animated-tabs.tsx: Hoist constants and memoize handlers with useCallback/useMemo
- LocaleContext.tsx: Wrap setLocale in useCallback and contextValue in useMemo
- plate-editor.tsx: Memoize SaveShortcutPlugin and contextProviderValue, use useRef for stable references
---
 surfsense_web/components/editor/plate-editor.tsx | 14 ++++++++------
 surfsense_web/components/ui/animated-tabs.tsx    |  5 +++--
 surfsense_web/components/ui/toggle-group.tsx     |  5 ++++-
 surfsense_web/contexts/LocaleContext.tsx         | 11 +++++++----
 4 files changed, 22 insertions(+), 13 deletions(-)

diff --git a/surfsense_web/components/editor/plate-editor.tsx b/surfsense_web/components/editor/plate-editor.tsx
index 870ded55f..ed239ffa3 100644
--- a/surfsense_web/components/editor/plate-editor.tsx
+++ b/surfsense_web/components/editor/plate-editor.tsx
@@ -158,14 +158,16 @@ export function PlateEditor({
 	// When not forced read-only, the user can toggle between editing/viewing.
 	const canToggleMode = !readOnly;
 
+	const contextProviderValue = useMemo(()=> ({
+		onSave,
+		hasUnsavedChanges,
+		isSaving,
+		canToggleMode,
+	}), [onSave, hasUnsavedChanges, isSaving, canToggleMode]);
+
 	return (
 		<EditorSaveContext.Provider
-			value={{
-				onSave,
-				hasUnsavedChanges,
-				isSaving,
-				canToggleMode,
-			}}
+			value={contextProviderValue}
 		>
 			<Plate
 				editor={editor}
diff --git a/surfsense_web/components/ui/animated-tabs.tsx b/surfsense_web/components/ui/animated-tabs.tsx
index 43ae82121..0cd8dd54c 100644
--- a/surfsense_web/components/ui/animated-tabs.tsx
+++ b/surfsense_web/components/ui/animated-tabs.tsx
@@ -7,6 +7,7 @@ import React, {
 	useCallback,
 	useContext,
 	useEffect,
+	useMemo,
 	useRef,
 	useState,
 } from "react";
@@ -201,9 +202,9 @@ const Tabs = forwardRef<
 		},
 		[onValueChange, value]
 	);
-
+	const contextValue = useMemo(() => ({ activeValue, onValueChange: handleValueChange }), [activeValue, handleValueChange]);
 	return (
-		<TabsContext.Provider value={{ activeValue, onValueChange: handleValueChange }}>
+		<TabsContext.Provider value={contextValue}>
 			<div ref={ref} className={cn("tabs-container", className)} {...props}>
 				{children}
 			</div>
diff --git a/surfsense_web/components/ui/toggle-group.tsx b/surfsense_web/components/ui/toggle-group.tsx
index 6740fade0..860fa7a52 100644
--- a/surfsense_web/components/ui/toggle-group.tsx
+++ b/surfsense_web/components/ui/toggle-group.tsx
@@ -5,6 +5,7 @@ import type { VariantProps } from "class-variance-authority";
 import * as React from "react";
 import { toggleVariants } from "@/components/ui/toggle";
 import { cn } from "@/lib/utils";
+import { useMemo } from "react";
 
 const ToggleGroupContext = React.createContext<
 	VariantProps<typeof toggleVariants> & {
@@ -27,6 +28,8 @@ function ToggleGroup({
 	VariantProps<typeof toggleVariants> & {
 		spacing?: number;
 	}) {
+	const contextValue = useMemo(() => ({variant, size, spacing }), [variant, size, spacing]);
+	
 	return (
 		<ToggleGroupPrimitive.Root
 			data-slot="toggle-group"
@@ -40,7 +43,7 @@ function ToggleGroup({
 			)}
 			{...props}
 		>
-			<ToggleGroupContext.Provider value={{ variant, size, spacing }}>
+			<ToggleGroupContext.Provider value={contextValue}>
 				{children}
 			</ToggleGroupContext.Provider>
 		</ToggleGroupPrimitive.Root>
diff --git a/surfsense_web/contexts/LocaleContext.tsx b/surfsense_web/contexts/LocaleContext.tsx
index 405fa4a50..e67e9c2a5 100644
--- a/surfsense_web/contexts/LocaleContext.tsx
+++ b/surfsense_web/contexts/LocaleContext.tsx
@@ -1,12 +1,13 @@
 "use client";
 
 import type React from "react";
-import { createContext, useContext, useEffect, useState } from "react";
+import { createContext, useCallback, useContext, useEffect, useMemo, useState } from "react";
 import enMessages from "../messages/en.json";
 import esMessages from "../messages/es.json";
 import hiMessages from "../messages/hi.json";
 import ptMessages from "../messages/pt.json";
 import zhMessages from "../messages/zh.json";
+import { set } from "zod";
 
 type Locale = "en" | "es" | "pt" | "hi" | "zh";
 
@@ -49,14 +50,14 @@ export function LocaleProvider({ children }: { children: React.ReactNode }) {
 	}, []);
 
 	// Update locale and persist to localStorage
-	const setLocale = (newLocale: Locale) => {
+	const setLocale = useCallback((newLocale: Locale) => {
 		setLocaleState(newLocale);
 		if (typeof window !== "undefined") {
 			localStorage.setItem(LOCALE_STORAGE_KEY, newLocale);
 			// Update HTML lang attribute
 			document.documentElement.lang = newLocale;
 		}
-	};
+	}, []);
 
 	// Set HTML lang attribute when locale changes
 	useEffect(() => {
@@ -65,8 +66,10 @@ export function LocaleProvider({ children }: { children: React.ReactNode }) {
 		}
 	}, [locale, mounted]);
 
+	const contextValue = useMemo(() => ({ locale, messages, setLocale }), [locale, messages, setLocale]);
+
 	return (
-		<LocaleContext.Provider value={{ locale, messages, setLocale }}>
+		<LocaleContext.Provider value={contextValue}>
 			{children}
 		</LocaleContext.Provider>
 	);

From c5aa869adb9a2e4b88b7a2ab140fb3fc4b9cad96 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Fri, 3 Apr 2026 19:57:48 +0200
Subject: [PATCH 106/202] switch to on-demand permission requests and improve
 suggestion UX

---
 .../117_add_vision_llm_id_to_search_spaces.py |   6 +-
 surfsense_desktop/electron-builder.yml        |   1 +
 surfsense_desktop/src/ipc/channels.ts         |   1 +
 surfsense_desktop/src/ipc/handlers.ts         |   5 +
 surfsense_desktop/src/main.ts                 |  14 +-
 .../src/modules/autocomplete/index.ts         |  13 +-
 surfsense_desktop/src/modules/permissions.ts  |  18 ++-
 surfsense_desktop/src/preload.ts              |   1 +
 .../app/desktop/permissions/page.tsx          | 122 +++++++++++-------
 surfsense_web/app/desktop/suggestion/page.tsx |  59 +++++++--
 .../app/desktop/suggestion/suggestion.css     |  42 +++---
 surfsense_web/types/window.d.ts               |   2 +
 12 files changed, 195 insertions(+), 89 deletions(-)

diff --git a/surfsense_backend/alembic/versions/117_add_vision_llm_id_to_search_spaces.py b/surfsense_backend/alembic/versions/117_add_vision_llm_id_to_search_spaces.py
index 254642c88..2bec374c6 100644
--- a/surfsense_backend/alembic/versions/117_add_vision_llm_id_to_search_spaces.py
+++ b/surfsense_backend/alembic/versions/117_add_vision_llm_id_to_search_spaces.py
@@ -25,15 +25,15 @@ depends_on: str | Sequence[str] | None = None
 def upgrade() -> None:
     conn = op.get_bind()
     existing_columns = [
-        col["name"] for col in sa.inspect(conn).get_columns("search_spaces")
+        col["name"] for col in sa.inspect(conn).get_columns("searchspaces")
     ]
 
     if "vision_llm_id" not in existing_columns:
         op.add_column(
-            "search_spaces",
+            "searchspaces",
             sa.Column("vision_llm_id", sa.Integer(), nullable=True, server_default="0"),
         )
 
 
 def downgrade() -> None:
-    op.drop_column("search_spaces", "vision_llm_id")
+    op.drop_column("searchspaces", "vision_llm_id")
diff --git a/surfsense_desktop/electron-builder.yml b/surfsense_desktop/electron-builder.yml
index 3de0f266d..be5e07c63 100644
--- a/surfsense_desktop/electron-builder.yml
+++ b/surfsense_desktop/electron-builder.yml
@@ -47,6 +47,7 @@ mac:
   gatekeeperAssess: false
   extendInfo:
     NSAccessibilityUsageDescription: "SurfSense uses accessibility features to insert suggestions into the active application."
+    NSScreenCaptureUsageDescription: "SurfSense uses screen capture to analyze your screen and provide context-aware writing suggestions."
     NSAppleEventsUsageDescription: "SurfSense uses Apple Events to interact with the active application."
   target:
     - target: dmg
diff --git a/surfsense_desktop/src/ipc/channels.ts b/surfsense_desktop/src/ipc/channels.ts
index 905a84bc3..e41355eaf 100644
--- a/surfsense_desktop/src/ipc/channels.ts
+++ b/surfsense_desktop/src/ipc/channels.ts
@@ -9,6 +9,7 @@ export const IPC_CHANNELS = {
   // Permissions
   GET_PERMISSIONS_STATUS: 'get-permissions-status',
   REQUEST_ACCESSIBILITY: 'request-accessibility',
+  REQUEST_SCREEN_RECORDING: 'request-screen-recording',
   RESTART_APP: 'restart-app',
   // Autocomplete
   AUTOCOMPLETE_CONTEXT: 'autocomplete-context',
diff --git a/surfsense_desktop/src/ipc/handlers.ts b/surfsense_desktop/src/ipc/handlers.ts
index 8597a39e8..11cbfee05 100644
--- a/surfsense_desktop/src/ipc/handlers.ts
+++ b/surfsense_desktop/src/ipc/handlers.ts
@@ -3,6 +3,7 @@ import { IPC_CHANNELS } from './channels';
 import {
   getPermissionsStatus,
   requestAccessibility,
+  requestScreenRecording,
   restartApp,
 } from '../modules/permissions';
 
@@ -30,6 +31,10 @@ export function registerIpcHandlers(): void {
     requestAccessibility();
   });
 
+  ipcMain.handle(IPC_CHANNELS.REQUEST_SCREEN_RECORDING, () => {
+    requestScreenRecording();
+  });
+
   ipcMain.handle(IPC_CHANNELS.RESTART_APP, () => {
     restartApp();
   });
diff --git a/surfsense_desktop/src/main.ts b/surfsense_desktop/src/main.ts
index c96453c6d..584e930fe 100644
--- a/surfsense_desktop/src/main.ts
+++ b/surfsense_desktop/src/main.ts
@@ -8,7 +8,6 @@ import { setupMenu } from './modules/menu';
 import { registerQuickAsk, unregisterQuickAsk } from './modules/quick-ask';
 import { registerAutocomplete, unregisterAutocomplete } from './modules/autocomplete';
 import { registerIpcHandlers } from './ipc/handlers';
-import { allPermissionsGranted } from './modules/permissions';
 
 registerGlobalErrorHandlers();
 
@@ -18,14 +17,6 @@ if (!setupDeepLinks()) {
 
 registerIpcHandlers();
 
-function getInitialPath(): string {
-  const granted = allPermissionsGranted();
-  if (process.platform === 'darwin' && !granted) {
-    return '/desktop/permissions';
-  }
-  return '/dashboard';
-}
-
 app.whenReady().then(async () => {
   setupMenu();
   try {
@@ -36,8 +27,7 @@ app.whenReady().then(async () => {
     return;
   }
 
-  const initialPath = getInitialPath();
-  createMainWindow(initialPath);
+  createMainWindow('/dashboard');
   registerQuickAsk();
   registerAutocomplete();
   setupAutoUpdater();
@@ -46,7 +36,7 @@ app.whenReady().then(async () => {
 
   app.on('activate', () => {
     if (BrowserWindow.getAllWindows().length === 0) {
-      createMainWindow(getInitialPath());
+      createMainWindow('/dashboard');
     }
   });
 });
diff --git a/surfsense_desktop/src/modules/autocomplete/index.ts b/surfsense_desktop/src/modules/autocomplete/index.ts
index 6763b2cae..958886b63 100644
--- a/surfsense_desktop/src/modules/autocomplete/index.ts
+++ b/surfsense_desktop/src/modules/autocomplete/index.ts
@@ -1,6 +1,7 @@
 import { clipboard, globalShortcut, ipcMain, screen } from 'electron';
 import { IPC_CHANNELS } from '../../ipc/channels';
 import { getFrontmostApp, hasAccessibilityPermission, simulatePaste } from '../platform';
+import { hasScreenRecordingPermission, requestAccessibility, requestScreenRecording } from '../permissions';
 import { getMainWindow } from '../window';
 import { captureScreen } from './screenshot';
 import { createSuggestionWindow, destroySuggestion, getSuggestionWindow } from './suggestion-window';
@@ -19,9 +20,13 @@ function isSurfSenseWindow(): boolean {
 
 async function triggerAutocomplete(): Promise<void> {
   if (!autocompleteEnabled) return;
-  if (!hasAccessibilityPermission()) return;
   if (isSurfSenseWindow()) return;
 
+  if (!hasScreenRecordingPermission()) {
+    requestScreenRecording();
+    return;
+  }
+
   sourceApp = getFrontmostApp();
   savedClipboard = clipboard.readText();
 
@@ -59,7 +64,11 @@ async function triggerAutocomplete(): Promise<void> {
 
 async function acceptAndInject(text: string): Promise<void> {
   if (!sourceApp) return;
-  if (!hasAccessibilityPermission()) return;
+
+  if (!hasAccessibilityPermission()) {
+    requestAccessibility();
+    return;
+  }
 
   clipboard.writeText(text);
   destroySuggestion();
diff --git a/surfsense_desktop/src/modules/permissions.ts b/surfsense_desktop/src/modules/permissions.ts
index 4ac671b7c..a2f057795 100644
--- a/surfsense_desktop/src/modules/permissions.ts
+++ b/surfsense_desktop/src/modules/permissions.ts
@@ -4,6 +4,7 @@ type PermissionStatus = 'authorized' | 'denied' | 'not determined' | 'restricted
 
 export interface PermissionsStatus {
   accessibility: PermissionStatus;
+  screenRecording: PermissionStatus;
 }
 
 function isMac(): boolean {
@@ -16,18 +17,19 @@ function getNodeMacPermissions() {
 
 export function getPermissionsStatus(): PermissionsStatus {
   if (!isMac()) {
-    return { accessibility: 'authorized' };
+    return { accessibility: 'authorized', screenRecording: 'authorized' };
   }
 
   const perms = getNodeMacPermissions();
   return {
     accessibility: perms.getAuthStatus('accessibility'),
+    screenRecording: perms.getAuthStatus('screen'),
   };
 }
 
 export function allPermissionsGranted(): boolean {
   const status = getPermissionsStatus();
-  return status.accessibility === 'authorized';
+  return status.accessibility === 'authorized' && status.screenRecording === 'authorized';
 }
 
 export function requestAccessibility(): void {
@@ -36,6 +38,18 @@ export function requestAccessibility(): void {
   perms.askForAccessibilityAccess();
 }
 
+export function hasScreenRecordingPermission(): boolean {
+  if (!isMac()) return true;
+  const perms = getNodeMacPermissions();
+  return perms.getAuthStatus('screen') === 'authorized';
+}
+
+export function requestScreenRecording(): void {
+  if (!isMac()) return;
+  const perms = getNodeMacPermissions();
+  perms.askForScreenCaptureAccess();
+}
+
 export function restartApp(): void {
   app.relaunch();
   app.exit(0);
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 891d9b029..5c8b64f6f 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -24,6 +24,7 @@ contextBridge.exposeInMainWorld('electronAPI', {
   // Permissions
   getPermissionsStatus: () => ipcRenderer.invoke(IPC_CHANNELS.GET_PERMISSIONS_STATUS),
   requestAccessibility: () => ipcRenderer.invoke(IPC_CHANNELS.REQUEST_ACCESSIBILITY),
+  requestScreenRecording: () => ipcRenderer.invoke(IPC_CHANNELS.REQUEST_SCREEN_RECORDING),
   restartApp: () => ipcRenderer.invoke(IPC_CHANNELS.RESTART_APP),
   // Autocomplete
   onAutocompleteContext: (callback: (data: { screenshot: string; searchSpaceId?: string }) => void) => {
diff --git a/surfsense_web/app/desktop/permissions/page.tsx b/surfsense_web/app/desktop/permissions/page.tsx
index e0d3131e0..6c08e35b5 100644
--- a/surfsense_web/app/desktop/permissions/page.tsx
+++ b/surfsense_web/app/desktop/permissions/page.tsx
@@ -10,8 +10,26 @@ type PermissionStatus = "authorized" | "denied" | "not determined" | "restricted
 
 interface PermissionsStatus {
 	accessibility: PermissionStatus;
+	screenRecording: PermissionStatus;
 }
 
+const STEPS = [
+	{
+		id: "screen-recording",
+		title: "Screen Recording",
+		description: "Lets SurfSense capture your screen to understand context and provide smart writing suggestions.",
+		action: "requestScreenRecording",
+		field: "screenRecording" as const,
+	},
+	{
+		id: "accessibility",
+		title: "Accessibility",
+		description: "Lets SurfSense insert suggestions seamlessly, right where you\u2019re typing.",
+		action: "requestAccessibility",
+		field: "accessibility" as const,
+	},
+];
+
 function StatusBadge({ status }: { status: PermissionStatus }) {
 	if (status === "authorized") {
 		return (
@@ -48,11 +66,13 @@ export default function DesktopPermissionsPage() {
 
 		let interval: ReturnType<typeof setInterval> | null = null;
 
+		const isResolved = (s: string) => s === "authorized" || s === "restricted";
+
 		const poll = async () => {
 			const status = await window.electronAPI!.getPermissionsStatus();
 			setPermissions(status);
 
-			if (status.accessibility === "authorized" || status.accessibility === "restricted") {
+			if (isResolved(status.accessibility) && isResolved(status.screenRecording)) {
 				if (interval) clearInterval(interval);
 			}
 		};
@@ -78,10 +98,14 @@ export default function DesktopPermissionsPage() {
 		);
 	}
 
-	const allGranted = permissions.accessibility === "authorized";
+	const allGranted = permissions.accessibility === "authorized" && permissions.screenRecording === "authorized";
 
-	const handleRequest = async () => {
-		await window.electronAPI!.requestAccessibility();
+	const handleRequest = async (action: string) => {
+		if (action === "requestScreenRecording") {
+			await window.electronAPI!.requestScreenRecording();
+		} else if (action === "requestAccessibility") {
+			await window.electronAPI!.requestAccessibility();
+		}
 	};
 
 	const handleContinue = () => {
@@ -103,55 +127,61 @@ export default function DesktopPermissionsPage() {
 					<div className="space-y-1">
 						<h1 className="text-2xl font-semibold tracking-tight">System Permissions</h1>
 						<p className="text-sm text-muted-foreground">
-							SurfSense needs Accessibility permission to insert suggestions into the active application.
+							SurfSense needs two macOS permissions to provide context-aware writing suggestions.
 						</p>
 					</div>
 				</div>
 
-				{/* Permission card */}
+				{/* Steps */}
 				<div className="rounded-xl border bg-background dark:bg-neutral-900 flex-1 min-h-0 overflow-y-auto px-6 py-6 space-y-6">
-					<div
-						className={`rounded-lg border p-4 transition-colors ${
-							allGranted
-								? "border-green-200 bg-green-50/50 dark:border-green-900 dark:bg-green-950/20"
-								: "border-border"
-						}`}
-					>
-						<div className="flex items-start justify-between gap-3">
-							<div className="flex items-start gap-3">
-								<span className="flex h-7 w-7 shrink-0 items-center justify-center rounded-full bg-primary/10 text-sm font-medium text-primary">
-									{allGranted ? "\u2713" : "1"}
-								</span>
-								<div className="space-y-1">
-									<h3 className="text-sm font-medium">Accessibility</h3>
-									<p className="text-xs text-muted-foreground">
-										Lets SurfSense insert suggestions seamlessly, right where you&apos;re typing.
-									</p>
+					{STEPS.map((step, index) => {
+						const status = permissions[step.field];
+						const isGranted = status === "authorized";
+
+						return (
+							<div
+								key={step.id}
+								className={`rounded-lg border p-4 transition-colors ${
+									isGranted
+										? "border-green-200 bg-green-50/50 dark:border-green-900 dark:bg-green-950/20"
+										: "border-border"
+								}`}
+							>
+								<div className="flex items-start justify-between gap-3">
+									<div className="flex items-start gap-3">
+										<span className="flex h-7 w-7 shrink-0 items-center justify-center rounded-full bg-primary/10 text-sm font-medium text-primary">
+											{isGranted ? "\u2713" : index + 1}
+										</span>
+										<div className="space-y-1">
+											<h3 className="text-sm font-medium">{step.title}</h3>
+											<p className="text-xs text-muted-foreground">{step.description}</p>
+										</div>
+									</div>
+									<StatusBadge status={status} />
 								</div>
-							</div>
-							<StatusBadge status={permissions.accessibility} />
-						</div>
-						{!allGranted && (
-							<div className="mt-3 pl-10 space-y-2">
-								<Button
-									size="sm"
-									variant="outline"
-									onClick={handleRequest}
-									className="text-xs"
-								>
-									Open System Settings
-								</Button>
-								{permissions.accessibility === "denied" && (
-									<p className="text-xs text-amber-700 dark:text-amber-400">
-										Toggle SurfSense on in System Settings to continue.
-									</p>
+								{!isGranted && (
+									<div className="mt-3 pl-10 space-y-2">
+										<Button
+											size="sm"
+											variant="outline"
+											onClick={() => handleRequest(step.action)}
+											className="text-xs"
+										>
+											Open System Settings
+										</Button>
+										{status === "denied" && (
+											<p className="text-xs text-amber-700 dark:text-amber-400">
+												Toggle SurfSense on in System Settings to continue.
+											</p>
+										)}
+										<p className="text-xs text-muted-foreground">
+											If SurfSense doesn&apos;t appear in the list, click <strong>+</strong> and select it from Applications.
+										</p>
+									</div>
 								)}
-								<p className="text-xs text-muted-foreground">
-									If SurfSense doesn&apos;t appear in the list, click <strong>+</strong> and select it from Applications.
-								</p>
 							</div>
-						)}
-					</div>
+						);
+					})}
 				</div>
 
 				{/* Footer */}
@@ -168,7 +198,7 @@ export default function DesktopPermissionsPage() {
 					) : (
 						<>
 							<Button disabled className="text-sm h-9 min-w-[180px]">
-								Grant permission to continue
+								Grant permissions to continue
 							</Button>
 							<button
 								onClick={handleSkip}
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index 2c147eb25..4de90e03c 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -11,12 +11,40 @@ type SSEEvent =
 	| { type: "finish" }
 	| { type: "error"; errorText: string };
 
+function friendlyError(raw: string | number): string {
+	if (typeof raw === "number") {
+		if (raw === 401) return "Please sign in to use suggestions.";
+		if (raw === 403) return "You don\u2019t have permission for this.";
+		if (raw === 404) return "Suggestion service not found. Is the backend running?";
+		if (raw >= 500) return "Something went wrong on the server. Try again.";
+		return "Something went wrong. Try again.";
+	}
+	const lower = raw.toLowerCase();
+	if (lower.includes("not authenticated") || lower.includes("unauthorized"))
+		return "Please sign in to use suggestions.";
+	if (lower.includes("no vision llm configured") || lower.includes("no llm configured"))
+		return "No Vision LLM configured. Set one in search space settings.";
+	if (lower.includes("fetch") || lower.includes("network") || lower.includes("econnrefused"))
+		return "Can\u2019t reach the server. Check your connection.";
+	return "Something went wrong. Try again.";
+}
+
+const AUTO_DISMISS_MS = 3000;
+
 export default function SuggestionPage() {
 	const [suggestion, setSuggestion] = useState("");
 	const [isLoading, setIsLoading] = useState(true);
 	const [error, setError] = useState<string | null>(null);
 	const abortRef = useRef<AbortController | null>(null);
 
+	useEffect(() => {
+		if (!error) return;
+		const timer = setTimeout(() => {
+			window.electronAPI?.dismissSuggestion?.();
+		}, AUTO_DISMISS_MS);
+		return () => clearTimeout(timer);
+	}, [error]);
+
 	const fetchSuggestion = useCallback(
 		async (screenshot: string, searchSpaceId: string) => {
 			abortRef.current?.abort();
@@ -29,7 +57,7 @@ export default function SuggestionPage() {
 
 			const token = getBearerToken();
 			if (!token) {
-				setError("Not authenticated");
+				setError(friendlyError("not authenticated"));
 				setIsLoading(false);
 				return;
 			}
@@ -55,13 +83,13 @@ export default function SuggestionPage() {
 				);
 
 				if (!response.ok) {
-					setError(`Error: ${response.status}`);
+					setError(friendlyError(response.status));
 					setIsLoading(false);
 					return;
 				}
 
 				if (!response.body) {
-					setError("No response body");
+					setError(friendlyError("network error"));
 					setIsLoading(false);
 					return;
 				}
@@ -94,7 +122,7 @@ export default function SuggestionPage() {
 										return updated;
 									});
 								} else if (parsed.type === "error") {
-									setError(parsed.errorText);
+									setError(friendlyError(parsed.errorText));
 								}
 							} catch {
 								continue;
@@ -104,7 +132,7 @@ export default function SuggestionPage() {
 				}
 			} catch (err) {
 				if (err instanceof DOMException && err.name === "AbortError") return;
-				setError("Failed to get suggestion");
+				setError(friendlyError("network error"));
 			} finally {
 				setIsLoading(false);
 			}
@@ -145,15 +173,28 @@ export default function SuggestionPage() {
 		);
 	}
 
+	const handleAccept = () => {
+		if (suggestion) {
+			window.electronAPI?.acceptSuggestion?.(suggestion);
+		}
+	};
+
+	const handleDismiss = () => {
+		window.electronAPI?.dismissSuggestion?.();
+	};
+
 	if (!suggestion) return null;
 
 	return (
 		<div className="suggestion-tooltip">
 			<p className="suggestion-text">{suggestion}</p>
-			<div className="suggestion-hint">
-				<kbd>Tab</kbd> accept
-				<span className="suggestion-separator" />
-				<kbd>Esc</kbd> dismiss
+			<div className="suggestion-actions">
+				<button className="suggestion-btn suggestion-btn-accept" onClick={handleAccept}>
+					Accept
+				</button>
+				<button className="suggestion-btn suggestion-btn-dismiss" onClick={handleDismiss}>
+					Dismiss
+				</button>
 			</div>
 		</div>
 	);
diff --git a/surfsense_web/app/desktop/suggestion/suggestion.css b/surfsense_web/app/desktop/suggestion/suggestion.css
index 0d3332103..712d12618 100644
--- a/surfsense_web/app/desktop/suggestion/suggestion.css
+++ b/surfsense_web/app/desktop/suggestion/suggestion.css
@@ -36,32 +36,44 @@ html, body {
   white-space: pre-wrap;
 }
 
-.suggestion-hint {
-  color: #666;
-  font-size: 11px;
+.suggestion-actions {
   display: flex;
-  align-items: center;
-  gap: 6px;
+  justify-content: flex-end;
+  gap: 4px;
   border-top: 1px solid #2a2a2a;
   padding-top: 6px;
 }
 
-.suggestion-hint kbd {
-  background: #2a2a2a;
-  border: 1px solid #3c3c3c;
+.suggestion-btn {
+  padding: 2px 8px;
   border-radius: 3px;
-  padding: 0 4px;
+  border: 1px solid #3c3c3c;
   font-family: inherit;
   font-size: 10px;
-  font-weight: 600;
-  color: #999;
-  line-height: 18px;
+  font-weight: 500;
+  cursor: pointer;
+  line-height: 16px;
+  transition: background 0.15s, border-color 0.15s;
 }
 
-.suggestion-separator {
-  width: 1px;
-  height: 10px;
+.suggestion-btn-accept {
+  background: #2563eb;
+  border-color: #3b82f6;
+  color: #fff;
+}
+
+.suggestion-btn-accept:hover {
+  background: #1d4ed8;
+}
+
+.suggestion-btn-dismiss {
+  background: #2a2a2a;
+  color: #999;
+}
+
+.suggestion-btn-dismiss:hover {
   background: #333;
+  color: #ccc;
 }
 
 .suggestion-error {
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index a5b8566f9..dc3a6465e 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -17,8 +17,10 @@ interface ElectronAPI {
 	// Permissions
 	getPermissionsStatus: () => Promise<{
 		accessibility: 'authorized' | 'denied' | 'not determined' | 'restricted' | 'limited';
+		screenRecording: 'authorized' | 'denied' | 'not determined' | 'restricted' | 'limited';
 	}>;
 	requestAccessibility: () => Promise<void>;
+	requestScreenRecording: () => Promise<void>;
 	restartApp: () => Promise<void>;
 	// Autocomplete
 	onAutocompleteContext: (callback: (data: { screenshot: string; searchSpaceId?: string }) => void) => () => void;

From 080acf5e0a18b62953cffcf19806633cc9122c98 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Fri, 3 Apr 2026 20:16:23 +0200
Subject: [PATCH 107/202] remove dead code: allPermissionsGranted,
 simulateCopy, pendingSuggestionText, updateSuggestionText

---
 surfsense_desktop/src/ipc/channels.ts               | 1 -
 surfsense_desktop/src/modules/autocomplete/index.ts | 7 -------
 surfsense_desktop/src/modules/permissions.ts        | 5 -----
 surfsense_desktop/src/modules/platform.ts           | 8 --------
 surfsense_desktop/src/preload.ts                    | 1 -
 surfsense_web/app/desktop/suggestion/page.tsx       | 6 +-----
 surfsense_web/types/window.d.ts                     | 1 -
 7 files changed, 1 insertion(+), 28 deletions(-)

diff --git a/surfsense_desktop/src/ipc/channels.ts b/surfsense_desktop/src/ipc/channels.ts
index e41355eaf..d0e2b9ab4 100644
--- a/surfsense_desktop/src/ipc/channels.ts
+++ b/surfsense_desktop/src/ipc/channels.ts
@@ -15,7 +15,6 @@ export const IPC_CHANNELS = {
   AUTOCOMPLETE_CONTEXT: 'autocomplete-context',
   ACCEPT_SUGGESTION: 'accept-suggestion',
   DISMISS_SUGGESTION: 'dismiss-suggestion',
-  UPDATE_SUGGESTION_TEXT: 'update-suggestion-text',
   SET_AUTOCOMPLETE_ENABLED: 'set-autocomplete-enabled',
   GET_AUTOCOMPLETE_ENABLED: 'get-autocomplete-enabled',
 } as const;
diff --git a/surfsense_desktop/src/modules/autocomplete/index.ts b/surfsense_desktop/src/modules/autocomplete/index.ts
index 958886b63..3ed9c4a00 100644
--- a/surfsense_desktop/src/modules/autocomplete/index.ts
+++ b/surfsense_desktop/src/modules/autocomplete/index.ts
@@ -11,7 +11,6 @@ const SHORTCUT = 'CommandOrControl+Shift+Space';
 let autocompleteEnabled = true;
 let savedClipboard = '';
 let sourceApp = '';
-let pendingSuggestionText = '';
 
 function isSurfSenseWindow(): boolean {
   const app = getFrontmostApp();
@@ -72,7 +71,6 @@ async function acceptAndInject(text: string): Promise<void> {
 
   clipboard.writeText(text);
   destroySuggestion();
-  pendingSuggestionText = '';
 
   try {
     await new Promise((r) => setTimeout(r, 50));
@@ -90,10 +88,6 @@ function registerIpcHandlers(): void {
   });
   ipcMain.handle(IPC_CHANNELS.DISMISS_SUGGESTION, () => {
     destroySuggestion();
-    pendingSuggestionText = '';
-  });
-  ipcMain.handle(IPC_CHANNELS.UPDATE_SUGGESTION_TEXT, (_event, text: string) => {
-    pendingSuggestionText = text;
   });
   ipcMain.handle(IPC_CHANNELS.SET_AUTOCOMPLETE_ENABLED, (_event, enabled: boolean) => {
     autocompleteEnabled = enabled;
@@ -111,7 +105,6 @@ export function registerAutocomplete(): void {
     const sw = getSuggestionWindow();
     if (sw && !sw.isDestroyed()) {
       destroySuggestion();
-      pendingSuggestionText = '';
       return;
     }
     triggerAutocomplete();
diff --git a/surfsense_desktop/src/modules/permissions.ts b/surfsense_desktop/src/modules/permissions.ts
index a2f057795..02786113e 100644
--- a/surfsense_desktop/src/modules/permissions.ts
+++ b/surfsense_desktop/src/modules/permissions.ts
@@ -27,11 +27,6 @@ export function getPermissionsStatus(): PermissionsStatus {
   };
 }
 
-export function allPermissionsGranted(): boolean {
-  const status = getPermissionsStatus();
-  return status.accessibility === 'authorized' && status.screenRecording === 'authorized';
-}
-
 export function requestAccessibility(): void {
   if (!isMac()) return;
   const perms = getNodeMacPermissions();
diff --git a/surfsense_desktop/src/modules/platform.ts b/surfsense_desktop/src/modules/platform.ts
index 1ab0c38fb..1e6ac74e4 100644
--- a/surfsense_desktop/src/modules/platform.ts
+++ b/surfsense_desktop/src/modules/platform.ts
@@ -19,14 +19,6 @@ export function getFrontmostApp(): string {
   return '';
 }
 
-export function simulateCopy(): void {
-  if (process.platform === 'darwin') {
-    execSync('osascript -e \'tell application "System Events" to keystroke "c" using command down\'');
-  } else if (process.platform === 'win32') {
-    execSync('powershell -command "Add-Type -AssemblyName System.Windows.Forms; [System.Windows.Forms.SendKeys]::SendWait(\'^c\')"');
-  }
-}
-
 export function simulatePaste(): void {
   if (process.platform === 'darwin') {
     execSync('osascript -e \'tell application "System Events" to keystroke "v" using command down\'');
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 5c8b64f6f..31c5ca865 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -36,7 +36,6 @@ contextBridge.exposeInMainWorld('electronAPI', {
   },
   acceptSuggestion: (text: string) => ipcRenderer.invoke(IPC_CHANNELS.ACCEPT_SUGGESTION, text),
   dismissSuggestion: () => ipcRenderer.invoke(IPC_CHANNELS.DISMISS_SUGGESTION),
-  updateSuggestionText: (text: string) => ipcRenderer.invoke(IPC_CHANNELS.UPDATE_SUGGESTION_TEXT, text),
   setAutocompleteEnabled: (enabled: boolean) => ipcRenderer.invoke(IPC_CHANNELS.SET_AUTOCOMPLETE_ENABLED, enabled),
   getAutocompleteEnabled: () => ipcRenderer.invoke(IPC_CHANNELS.GET_AUTOCOMPLETE_ENABLED),
 });
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index 4de90e03c..b68fe450d 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -116,11 +116,7 @@ export default function SuggestionPage() {
 							try {
 								const parsed: SSEEvent = JSON.parse(data);
 								if (parsed.type === "text-delta") {
-									setSuggestion((prev) => {
-										const updated = prev + parsed.delta;
-										window.electronAPI?.updateSuggestionText?.(updated);
-										return updated;
-									});
+									setSuggestion((prev) => prev + parsed.delta);
 								} else if (parsed.type === "error") {
 									setError(friendlyError(parsed.errorText));
 								}
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index dc3a6465e..2fc550306 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -26,7 +26,6 @@ interface ElectronAPI {
 	onAutocompleteContext: (callback: (data: { screenshot: string; searchSpaceId?: string }) => void) => () => void;
 	acceptSuggestion: (text: string) => Promise<void>;
 	dismissSuggestion: () => Promise<void>;
-	updateSuggestionText: (text: string) => Promise<void>;
 	setAutocompleteEnabled: (enabled: boolean) => Promise<void>;
 	getAutocompleteEnabled: () => Promise<boolean>;
 }

From 960b8fc01273795407398fe8b108ebbd6009ef58 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Fri, 3 Apr 2026 21:34:01 +0200
Subject: [PATCH 108/202] add app context and KB grounding to autocomplete
 suggestions

---
 .../app/routes/autocomplete_routes.py         |   7 +-
 .../services/vision_autocomplete_service.py   | 117 +++++++++++++++++-
 .../src/modules/autocomplete/index.ts         |   5 +-
 surfsense_desktop/src/modules/platform.ts     |  18 +++
 surfsense_desktop/src/preload.ts              |   4 +-
 surfsense_web/app/desktop/suggestion/page.tsx |   6 +-
 surfsense_web/types/window.d.ts               |   2 +-
 7 files changed, 150 insertions(+), 9 deletions(-)

diff --git a/surfsense_backend/app/routes/autocomplete_routes.py b/surfsense_backend/app/routes/autocomplete_routes.py
index 329476ca1..a6f66f408 100644
--- a/surfsense_backend/app/routes/autocomplete_routes.py
+++ b/surfsense_backend/app/routes/autocomplete_routes.py
@@ -14,6 +14,8 @@ router = APIRouter(prefix="/autocomplete", tags=["autocomplete"])
 class VisionAutocompleteRequest(BaseModel):
     screenshot: str
     search_space_id: int
+    app_name: str = ""
+    window_title: str = ""
 
 
 @router.post("/vision/stream")
@@ -23,7 +25,10 @@ async def vision_autocomplete_stream(
     session: AsyncSession = Depends(get_async_session),
 ):
     return StreamingResponse(
-        stream_vision_autocomplete(body.screenshot, body.search_space_id, session),
+        stream_vision_autocomplete(
+            body.screenshot, body.search_space_id, session,
+            app_name=body.app_name, window_title=body.window_title,
+        ),
         media_type="text/event-stream",
         headers={
             **VercelStreamingService.get_response_headers(),
diff --git a/surfsense_backend/app/services/vision_autocomplete_service.py b/surfsense_backend/app/services/vision_autocomplete_service.py
index 526b0d35c..0804df7fb 100644
--- a/surfsense_backend/app/services/vision_autocomplete_service.py
+++ b/surfsense_backend/app/services/vision_autocomplete_service.py
@@ -4,11 +4,21 @@ from typing import AsyncGenerator
 from langchain_core.messages import HumanMessage, SystemMessage
 from sqlalchemy.ext.asyncio import AsyncSession
 
+from app.retriever.chunks_hybrid_search import ChucksHybridSearchRetriever
 from app.services.llm_service import get_vision_llm
 from app.services.new_streaming_service import VercelStreamingService
 
 logger = logging.getLogger(__name__)
 
+KB_TOP_K = 5
+KB_MAX_CHARS = 4000
+
+EXTRACT_QUERY_PROMPT = """Look at this screenshot and describe in 1-2 short sentences what the user is working on and what topic they need to write about. Be specific about the subject matter. Output ONLY the description, nothing else."""
+
+EXTRACT_QUERY_PROMPT_WITH_APP = """The user is currently in the application "{app_name}" with the window titled "{window_title}".
+
+Look at this screenshot and describe in 1-2 short sentences what the user is working on and what topic they need to write about. Be specific about the subject matter. Output ONLY the description, nothing else."""
+
 VISION_SYSTEM_PROMPT = """You are a smart writing assistant that analyzes the user's screen to draft or complete text.
 
 You will receive a screenshot of the user's screen. Your job:
@@ -28,13 +38,107 @@ Rules:
 - Do NOT describe the screenshot or explain your reasoning.
 - If you cannot determine what to write, output nothing."""
 
+APP_CONTEXT_BLOCK = """
+
+The user is currently working in "{app_name}" (window: "{window_title}"). Use this to understand the type of application and adapt your tone and format accordingly."""
+
+KB_CONTEXT_BLOCK = """
+
+You also have access to the user's knowledge base documents below. Use them to write more accurate, informed, and contextually relevant text. Do NOT cite or reference the documents explicitly — just let the knowledge inform your writing naturally.
+
+<knowledge_base>
+{kb_context}
+</knowledge_base>"""
+
+
+def _build_system_prompt(app_name: str, window_title: str, kb_context: str) -> str:
+    """Assemble the system prompt from optional context blocks."""
+    prompt = VISION_SYSTEM_PROMPT
+    if app_name:
+        prompt += APP_CONTEXT_BLOCK.format(app_name=app_name, window_title=window_title)
+    if kb_context:
+        prompt += KB_CONTEXT_BLOCK.format(kb_context=kb_context)
+    return prompt
+
+
+async def _extract_query_from_screenshot(
+    llm, screenshot_data_url: str,
+    app_name: str = "", window_title: str = "",
+) -> str | None:
+    """Ask the Vision LLM to describe what the user is working on."""
+    if app_name:
+        prompt_text = EXTRACT_QUERY_PROMPT_WITH_APP.format(
+            app_name=app_name, window_title=window_title,
+        )
+    else:
+        prompt_text = EXTRACT_QUERY_PROMPT
+
+    try:
+        response = await llm.ainvoke([
+            HumanMessage(content=[
+                {"type": "text", "text": prompt_text},
+                {"type": "image_url", "image_url": {"url": screenshot_data_url}},
+            ]),
+        ])
+        query = response.content.strip() if hasattr(response, "content") else ""
+        return query if query else None
+    except Exception as e:
+        logger.warning(f"Failed to extract query from screenshot: {e}")
+        return None
+
+
+async def _search_knowledge_base(
+    session: AsyncSession, search_space_id: int, query: str
+) -> str:
+    """Search the KB and return formatted context string."""
+    try:
+        retriever = ChucksHybridSearchRetriever(session)
+        results = await retriever.hybrid_search(
+            query_text=query,
+            top_k=KB_TOP_K,
+            search_space_id=search_space_id,
+        )
+
+        if not results:
+            return ""
+
+        parts: list[str] = []
+        char_count = 0
+        for doc in results:
+            title = doc.get("document", {}).get("title", "Untitled")
+            for chunk in doc.get("chunks", []):
+                content = chunk.get("content", "").strip()
+                if not content:
+                    continue
+                entry = f"[{title}]\n{content}"
+                if char_count + len(entry) > KB_MAX_CHARS:
+                    break
+                parts.append(entry)
+                char_count += len(entry)
+            if char_count >= KB_MAX_CHARS:
+                break
+
+        return "\n\n---\n\n".join(parts)
+    except Exception as e:
+        logger.warning(f"KB search failed, proceeding without context: {e}")
+        return ""
+
 
 async def stream_vision_autocomplete(
     screenshot_data_url: str,
     search_space_id: int,
     session: AsyncSession,
+    *,
+    app_name: str = "",
+    window_title: str = "",
 ) -> AsyncGenerator[str, None]:
-    """Analyze a screenshot with the vision LLM and stream a text completion."""
+    """Analyze a screenshot with the vision LLM and stream a text completion.
+
+    Pipeline:
+    1. Extract a search query from the screenshot (non-streaming)
+    2. Search the knowledge base for relevant context
+    3. Stream the final completion with screenshot + KB + app context
+    """
     streaming = VercelStreamingService()
 
     llm = await get_vision_llm(session, search_space_id)
@@ -44,8 +148,17 @@ async def stream_vision_autocomplete(
         yield streaming.format_done()
         return
 
+    kb_context = ""
+    query = await _extract_query_from_screenshot(
+        llm, screenshot_data_url, app_name=app_name, window_title=window_title,
+    )
+    if query:
+        kb_context = await _search_knowledge_base(session, search_space_id, query)
+
+    system_prompt = _build_system_prompt(app_name, window_title, kb_context)
+
     messages = [
-        SystemMessage(content=VISION_SYSTEM_PROMPT),
+        SystemMessage(content=system_prompt),
         HumanMessage(content=[
             {
                 "type": "text",
diff --git a/surfsense_desktop/src/modules/autocomplete/index.ts b/surfsense_desktop/src/modules/autocomplete/index.ts
index 3ed9c4a00..0d5073de4 100644
--- a/surfsense_desktop/src/modules/autocomplete/index.ts
+++ b/surfsense_desktop/src/modules/autocomplete/index.ts
@@ -1,6 +1,6 @@
 import { clipboard, globalShortcut, ipcMain, screen } from 'electron';
 import { IPC_CHANNELS } from '../../ipc/channels';
-import { getFrontmostApp, hasAccessibilityPermission, simulatePaste } from '../platform';
+import { getFrontmostApp, getWindowTitle, hasAccessibilityPermission, simulatePaste } from '../platform';
 import { hasScreenRecordingPermission, requestAccessibility, requestScreenRecording } from '../permissions';
 import { getMainWindow } from '../window';
 import { captureScreen } from './screenshot';
@@ -27,6 +27,7 @@ async function triggerAutocomplete(): Promise<void> {
   }
 
   sourceApp = getFrontmostApp();
+  const windowTitle = getWindowTitle();
   savedClipboard = clipboard.readText();
 
   const screenshot = await captureScreen();
@@ -55,6 +56,8 @@ async function triggerAutocomplete(): Promise<void> {
         sw.webContents.send(IPC_CHANNELS.AUTOCOMPLETE_CONTEXT, {
           screenshot,
           searchSpaceId,
+          appName: sourceApp,
+          windowTitle,
         });
       }
     }, 300);
diff --git a/surfsense_desktop/src/modules/platform.ts b/surfsense_desktop/src/modules/platform.ts
index 1e6ac74e4..122e2efed 100644
--- a/surfsense_desktop/src/modules/platform.ts
+++ b/surfsense_desktop/src/modules/platform.ts
@@ -32,6 +32,24 @@ export function checkAccessibilityPermission(): boolean {
   return systemPreferences.isTrustedAccessibilityClient(true);
 }
 
+export function getWindowTitle(): string {
+  try {
+    if (process.platform === 'darwin') {
+      return execSync(
+        'osascript -e \'tell application "System Events" to get title of front window of first application process whose frontmost is true\''
+      ).toString().trim();
+    }
+    if (process.platform === 'win32') {
+      return execSync(
+        'powershell -command "(Get-Process | Where-Object { $_.MainWindowHandle -eq (Add-Type -MemberDefinition \'[DllImport(\\\"user32.dll\\\")] public static extern IntPtr GetForegroundWindow();\' -Name W -PassThru)::GetForegroundWindow() }).MainWindowTitle"'
+      ).toString().trim();
+    }
+  } catch {
+    return '';
+  }
+  return '';
+}
+
 export function hasAccessibilityPermission(): boolean {
   if (process.platform !== 'darwin') return true;
   return systemPreferences.isTrustedAccessibilityClient(false);
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 31c5ca865..2bd09f13c 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -27,8 +27,8 @@ contextBridge.exposeInMainWorld('electronAPI', {
   requestScreenRecording: () => ipcRenderer.invoke(IPC_CHANNELS.REQUEST_SCREEN_RECORDING),
   restartApp: () => ipcRenderer.invoke(IPC_CHANNELS.RESTART_APP),
   // Autocomplete
-  onAutocompleteContext: (callback: (data: { screenshot: string; searchSpaceId?: string }) => void) => {
-    const listener = (_event: unknown, data: { screenshot: string; searchSpaceId?: string }) => callback(data);
+  onAutocompleteContext: (callback: (data: { screenshot: string; searchSpaceId?: string; appName?: string; windowTitle?: string }) => void) => {
+    const listener = (_event: unknown, data: { screenshot: string; searchSpaceId?: string; appName?: string; windowTitle?: string }) => callback(data);
     ipcRenderer.on(IPC_CHANNELS.AUTOCOMPLETE_CONTEXT, listener);
     return () => {
       ipcRenderer.removeListener(IPC_CHANNELS.AUTOCOMPLETE_CONTEXT, listener);
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index b68fe450d..b7d9b97bd 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -46,7 +46,7 @@ export default function SuggestionPage() {
 	}, [error]);
 
 	const fetchSuggestion = useCallback(
-		async (screenshot: string, searchSpaceId: string) => {
+		async (screenshot: string, searchSpaceId: string, appName?: string, windowTitle?: string) => {
 			abortRef.current?.abort();
 			const controller = new AbortController();
 			abortRef.current = controller;
@@ -77,6 +77,8 @@ export default function SuggestionPage() {
 						body: JSON.stringify({
 							screenshot,
 							search_space_id: parseInt(searchSpaceId, 10),
+							app_name: appName || "",
+							window_title: windowTitle || "",
 						}),
 						signal: controller.signal,
 					},
@@ -142,7 +144,7 @@ export default function SuggestionPage() {
 		const cleanup = window.electronAPI.onAutocompleteContext((data) => {
 			const searchSpaceId = data.searchSpaceId || "1";
 			if (data.screenshot) {
-				fetchSuggestion(data.screenshot, searchSpaceId);
+				fetchSuggestion(data.screenshot, searchSpaceId, data.appName, data.windowTitle);
 			}
 		});
 
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 2fc550306..85b6bdf51 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -23,7 +23,7 @@ interface ElectronAPI {
 	requestScreenRecording: () => Promise<void>;
 	restartApp: () => Promise<void>;
 	// Autocomplete
-	onAutocompleteContext: (callback: (data: { screenshot: string; searchSpaceId?: string }) => void) => () => void;
+	onAutocompleteContext: (callback: (data: { screenshot: string; searchSpaceId?: string; appName?: string; windowTitle?: string }) => void) => () => void;
 	acceptSuggestion: (text: string) => Promise<void>;
 	dismissSuggestion: () => Promise<void>;
 	setAutocompleteEnabled: (enabled: boolean) => Promise<void>;

From ce40da80ea9f2a2afd02bd44aeb5390ac565fcff Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sat, 4 Apr 2026 02:51:28 +0530
Subject: [PATCH 109/202] feat: implement page limit estimation and enforcement
 in file-based connector indexers

- Added a static method `estimate_pages_from_metadata` to `PageLimitService` for estimating page counts based on file metadata.
- Integrated page limit checks in Google Drive, Dropbox, and OneDrive indexers to prevent exceeding user quotas during file indexing.
- Updated relevant indexing methods to utilize the new page estimation logic and enforce limits accordingly.
- Enhanced tests for page limit functionality, ensuring accurate estimation and enforcement across different file types.
---
 .../app/services/page_limit_service.py        | 239 +++----
 .../app/tasks/connector_indexers/base.py      |   1 -
 .../connector_indexers/dropbox_indexer.py     |  52 ++
 .../google_drive_indexer.py                   |  88 +++
 .../connector_indexers/onedrive_indexer.py    |  80 +++
 .../integration/document_upload/conftest.py   |  63 ++
 .../test_google_drive_parallel.py             |  27 +-
 .../connector_indexers/test_page_limits.py    | 648 ++++++++++++++++++
 8 files changed, 1041 insertions(+), 157 deletions(-)
 create mode 100644 surfsense_backend/tests/unit/connector_indexers/test_page_limits.py

diff --git a/surfsense_backend/app/services/page_limit_service.py b/surfsense_backend/app/services/page_limit_service.py
index 080d05b5d..ea22067be 100644
--- a/surfsense_backend/app/services/page_limit_service.py
+++ b/surfsense_backend/app/services/page_limit_service.py
@@ -3,7 +3,7 @@ Service for managing user page limits for ETL services.
 """
 
 import os
-from pathlib import Path
+from pathlib import Path, PurePosixPath
 
 from sqlalchemy import select
 from sqlalchemy.ext.asyncio import AsyncSession
@@ -223,10 +223,91 @@ class PageLimitService:
         # Estimate ~2000 characters per page
         return max(1, content_length // 2000)
 
+    @staticmethod
+    def estimate_pages_from_metadata(
+        file_name_or_ext: str, file_size: int | str | None = None
+    ) -> int:
+        """Size-based page estimation from file name/extension and byte size.
+
+        Pure function — no file I/O, no database access.  Used by cloud
+        connectors (which only have API metadata) and as the internal
+        fallback for :meth:`estimate_pages_before_processing`.
+
+        ``file_name_or_ext`` can be a full filename (``"report.pdf"``) or
+        a bare extension (``".pdf"``).  ``file_size`` may be an int, a
+        stringified int from a cloud API, or *None*.
+        """
+        if file_size is not None:
+            try:
+                file_size = int(file_size)
+            except (ValueError, TypeError):
+                file_size = 0
+        else:
+            file_size = 0
+
+        if file_size <= 0:
+            return 1
+
+        ext = PurePosixPath(file_name_or_ext).suffix.lower() if file_name_or_ext else ""
+        if not ext and file_name_or_ext.startswith("."):
+            ext = file_name_or_ext.lower()
+        file_ext = ext
+
+        if file_ext == ".pdf":
+            return max(1, file_size // (100 * 1024))
+
+        if file_ext in {
+            ".doc", ".docx", ".docm", ".dot", ".dotm",
+            ".odt", ".ott", ".sxw", ".stw", ".uot",
+            ".rtf", ".pages", ".wpd", ".wps",
+            ".abw", ".zabw", ".cwk", ".hwp", ".lwp",
+            ".mcw", ".mw", ".sdw", ".vor",
+        }:
+            return max(1, file_size // (50 * 1024))
+
+        if file_ext in {
+            ".ppt", ".pptx", ".pptm", ".pot", ".potx",
+            ".odp", ".otp", ".sxi", ".sti", ".uop",
+            ".key", ".sda", ".sdd", ".sdp",
+        }:
+            return max(1, file_size // (200 * 1024))
+
+        if file_ext in {
+            ".xls", ".xlsx", ".xlsm", ".xlsb", ".xlw", ".xlr",
+            ".ods", ".ots", ".fods", ".numbers",
+            ".123", ".wk1", ".wk2", ".wk3", ".wk4", ".wks",
+            ".wb1", ".wb2", ".wb3", ".wq1", ".wq2",
+            ".csv", ".tsv", ".slk", ".sylk", ".dif", ".dbf",
+            ".prn", ".qpw", ".602", ".et", ".eth",
+        }:
+            return max(1, file_size // (100 * 1024))
+
+        if file_ext in {".epub"}:
+            return max(1, file_size // (50 * 1024))
+
+        if file_ext in {".txt", ".log", ".md", ".markdown", ".htm", ".html", ".xml"}:
+            return max(1, file_size // 3000)
+
+        if file_ext in {
+            ".jpg", ".jpeg", ".png", ".gif", ".bmp", ".tiff",
+            ".webp", ".svg", ".cgm", ".odg", ".pbd",
+        }:
+            return 1
+
+        if file_ext in {".mp3", ".m4a", ".wav", ".mpga"}:
+            return max(1, file_size // (1024 * 1024))
+
+        if file_ext in {".mp4", ".mpeg", ".webm"}:
+            return max(1, file_size // (5 * 1024 * 1024))
+
+        return max(1, file_size // (80 * 1024))
+
     def estimate_pages_before_processing(self, file_path: str) -> int:
         """
-        Estimate page count from file before processing (to avoid unnecessary API calls).
-        This is called BEFORE sending to ETL services to prevent cost on rejected files.
+        Estimate page count from a local file before processing.
+
+        For PDFs, attempts to read the actual page count via pypdf.
+        For everything else, delegates to :meth:`estimate_pages_from_metadata`.
 
         Args:
             file_path: Path to the file
@@ -240,7 +321,6 @@ class PageLimitService:
         file_ext = Path(file_path).suffix.lower()
         file_size = os.path.getsize(file_path)
 
-        # PDF files - try to get actual page count
         if file_ext == ".pdf":
             try:
                 import pypdf
@@ -249,153 +329,6 @@ class PageLimitService:
                     pdf_reader = pypdf.PdfReader(f)
                     return len(pdf_reader.pages)
             except Exception:
-                # If PDF reading fails, fall back to size estimation
-                # Typical PDF: ~100KB per page (conservative estimate)
-                return max(1, file_size // (100 * 1024))
+                pass  # fall through to size-based estimation
 
-        # Word Processing Documents
-        # Microsoft Word, LibreOffice Writer, WordPerfect, Pages, etc.
-        elif file_ext in [
-            ".doc",
-            ".docx",
-            ".docm",
-            ".dot",
-            ".dotm",  # Microsoft Word
-            ".odt",
-            ".ott",
-            ".sxw",
-            ".stw",
-            ".uot",  # OpenDocument/StarOffice Writer
-            ".rtf",  # Rich Text Format
-            ".pages",  # Apple Pages
-            ".wpd",
-            ".wps",  # WordPerfect, Microsoft Works
-            ".abw",
-            ".zabw",  # AbiWord
-            ".cwk",
-            ".hwp",
-            ".lwp",
-            ".mcw",
-            ".mw",
-            ".sdw",
-            ".vor",  # Other word processors
-        ]:
-            # Typical word document: ~50KB per page (conservative)
-            return max(1, file_size // (50 * 1024))
-
-        # Presentation Documents
-        # PowerPoint, Impress, Keynote, etc.
-        elif file_ext in [
-            ".ppt",
-            ".pptx",
-            ".pptm",
-            ".pot",
-            ".potx",  # Microsoft PowerPoint
-            ".odp",
-            ".otp",
-            ".sxi",
-            ".sti",
-            ".uop",  # OpenDocument/StarOffice Impress
-            ".key",  # Apple Keynote
-            ".sda",
-            ".sdd",
-            ".sdp",  # StarOffice Draw/Impress
-        ]:
-            # Typical presentation: ~200KB per slide (conservative)
-            return max(1, file_size // (200 * 1024))
-
-        # Spreadsheet Documents
-        # Excel, Calc, Numbers, Lotus, etc.
-        elif file_ext in [
-            ".xls",
-            ".xlsx",
-            ".xlsm",
-            ".xlsb",
-            ".xlw",
-            ".xlr",  # Microsoft Excel
-            ".ods",
-            ".ots",
-            ".fods",  # OpenDocument Spreadsheet
-            ".numbers",  # Apple Numbers
-            ".123",
-            ".wk1",
-            ".wk2",
-            ".wk3",
-            ".wk4",
-            ".wks",  # Lotus 1-2-3
-            ".wb1",
-            ".wb2",
-            ".wb3",
-            ".wq1",
-            ".wq2",  # Quattro Pro
-            ".csv",
-            ".tsv",
-            ".slk",
-            ".sylk",
-            ".dif",
-            ".dbf",
-            ".prn",
-            ".qpw",  # Data formats
-            ".602",
-            ".et",
-            ".eth",  # Other spreadsheets
-        ]:
-            # Spreadsheets typically have 1 sheet = 1 page for ETL
-            # Conservative: ~100KB per sheet
-            return max(1, file_size // (100 * 1024))
-
-        # E-books
-        elif file_ext in [".epub"]:
-            # E-books vary widely, estimate by size
-            # Typical e-book: ~50KB per page
-            return max(1, file_size // (50 * 1024))
-
-        # Plain Text and Markup Files
-        elif file_ext in [
-            ".txt",
-            ".log",  # Plain text
-            ".md",
-            ".markdown",  # Markdown
-            ".htm",
-            ".html",
-            ".xml",  # Markup
-        ]:
-            # Plain text: ~3000 bytes per page
-            return max(1, file_size // 3000)
-
-        # Image Files
-        # Each image is typically processed as 1 page
-        elif file_ext in [
-            ".jpg",
-            ".jpeg",  # JPEG
-            ".png",  # PNG
-            ".gif",  # GIF
-            ".bmp",  # Bitmap
-            ".tiff",  # TIFF
-            ".webp",  # WebP
-            ".svg",  # SVG
-            ".cgm",  # Computer Graphics Metafile
-            ".odg",
-            ".pbd",  # OpenDocument Graphics
-        ]:
-            # Each image = 1 page
-            return 1
-
-        # Audio Files (transcription = typically 1 page per minute)
-        # Note: These should be handled by audio transcription flow, not ETL
-        elif file_ext in [".mp3", ".m4a", ".wav", ".mpga"]:
-            # Audio files: estimate based on duration
-            # Fallback: ~1MB per minute of audio, 1 page per minute transcript
-            return max(1, file_size // (1024 * 1024))
-
-        # Video Files (typically not processed for pages, but just in case)
-        elif file_ext in [".mp4", ".mpeg", ".webm"]:
-            # Video files: very rough estimate
-            # Typically wouldn't be page-based, but use conservative estimate
-            return max(1, file_size // (5 * 1024 * 1024))
-
-        # Other/Unknown Document Types
-        else:
-            # Conservative estimate: ~80KB per page
-            # This catches: .sgl, .sxg, .uof, .uos1, .uos2, .web, and any future formats
-            return max(1, file_size // (80 * 1024))
+        return self.estimate_pages_from_metadata(file_ext, file_size)
diff --git a/surfsense_backend/app/tasks/connector_indexers/base.py b/surfsense_backend/app/tasks/connector_indexers/base.py
index ffc8ab72e..6b4bed4b5 100644
--- a/surfsense_backend/app/tasks/connector_indexers/base.py
+++ b/surfsense_backend/app/tasks/connector_indexers/base.py
@@ -4,7 +4,6 @@ Base functionality and shared imports for connector indexers.
 
 import logging
 from datetime import UTC, datetime, timedelta
-
 from sqlalchemy.ext.asyncio import AsyncSession
 from sqlalchemy.future import select
 
diff --git a/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py b/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
index 1b039add7..87b3c55df 100644
--- a/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
@@ -28,6 +28,7 @@ from app.indexing_pipeline.connector_document import ConnectorDocument
 from app.indexing_pipeline.document_hashing import compute_identifier_hash
 from app.indexing_pipeline.indexing_pipeline_service import IndexingPipelineService
 from app.services.llm_service import get_user_long_context_llm
+from app.services.page_limit_service import PageLimitService
 from app.services.task_logging_service import TaskLoggingService
 from app.tasks.connector_indexers.base import (
     check_document_by_unique_identifier,
@@ -278,6 +279,12 @@ async def _index_full_scan(
         },
     )
 
+    page_limit_service = PageLimitService(session)
+    pages_used, pages_limit = await page_limit_service.get_page_usage(user_id)
+    remaining_quota = pages_limit - pages_used
+    batch_estimated_pages = 0
+    page_limit_reached = False
+
     renamed_count = 0
     skipped = 0
     files_to_download: list[dict] = []
@@ -307,6 +314,21 @@ async def _index_full_scan(
         elif skip_item(file):
             skipped += 1
             continue
+
+        file_pages = PageLimitService.estimate_pages_from_metadata(
+            file.get("name", ""), file.get("size")
+        )
+        if batch_estimated_pages + file_pages > remaining_quota:
+            if not page_limit_reached:
+                logger.warning(
+                    "Page limit reached during Dropbox full scan, "
+                    "skipping remaining files"
+                )
+                page_limit_reached = True
+            skipped += 1
+            continue
+
+        batch_estimated_pages += file_pages
         files_to_download.append(file)
 
     batch_indexed, failed = await _download_and_index(
@@ -320,6 +342,14 @@ async def _index_full_scan(
         on_heartbeat=on_heartbeat_callback,
     )
 
+    if batch_indexed > 0 and files_to_download and batch_estimated_pages > 0:
+        pages_to_deduct = max(
+            1, batch_estimated_pages * batch_indexed // len(files_to_download)
+        )
+        await page_limit_service.update_page_usage(
+            user_id, pages_to_deduct, allow_exceed=True
+        )
+
     indexed = renamed_count + batch_indexed
     logger.info(
         f"Full scan complete: {indexed} indexed, {skipped} skipped, {failed} failed"
@@ -340,6 +370,11 @@ async def _index_selected_files(
     on_heartbeat: HeartbeatCallbackType | None = None,
 ) -> tuple[int, int, list[str]]:
     """Index user-selected files using the parallel pipeline."""
+    page_limit_service = PageLimitService(session)
+    pages_used, pages_limit = await page_limit_service.get_page_usage(user_id)
+    remaining_quota = pages_limit - pages_used
+    batch_estimated_pages = 0
+
     files_to_download: list[dict] = []
     errors: list[str] = []
     renamed_count = 0
@@ -364,6 +399,15 @@ async def _index_selected_files(
             skipped += 1
             continue
 
+        file_pages = PageLimitService.estimate_pages_from_metadata(
+            file.get("name", ""), file.get("size")
+        )
+        if batch_estimated_pages + file_pages > remaining_quota:
+            display = file_name or file_path
+            errors.append(f"File '{display}': page limit would be exceeded")
+            continue
+
+        batch_estimated_pages += file_pages
         files_to_download.append(file)
 
     batch_indexed, _failed = await _download_and_index(
@@ -377,6 +421,14 @@ async def _index_selected_files(
         on_heartbeat=on_heartbeat,
     )
 
+    if batch_indexed > 0 and files_to_download and batch_estimated_pages > 0:
+        pages_to_deduct = max(
+            1, batch_estimated_pages * batch_indexed // len(files_to_download)
+        )
+        await page_limit_service.update_page_usage(
+            user_id, pages_to_deduct, allow_exceed=True
+        )
+
     return renamed_count + batch_indexed, skipped, errors
 
 
diff --git a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
index b03d305f7..5e9e0f62f 100644
--- a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
@@ -34,6 +34,7 @@ from app.indexing_pipeline.indexing_pipeline_service import (
     PlaceholderInfo,
 )
 from app.services.llm_service import get_user_long_context_llm
+from app.services.page_limit_service import PageLimitService
 from app.services.task_logging_service import TaskLoggingService
 from app.tasks.connector_indexers.base import (
     check_document_by_unique_identifier,
@@ -327,6 +328,12 @@ async def _process_single_file(
                 return 1, 0, 0
             return 0, 1, 0
 
+        page_limit_service = PageLimitService(session)
+        estimated_pages = PageLimitService.estimate_pages_from_metadata(
+            file_name, file.get("size")
+        )
+        await page_limit_service.check_page_limit(user_id, estimated_pages)
+
         markdown, drive_metadata, error = await download_and_extract_content(
             drive_client, file
         )
@@ -363,6 +370,9 @@ async def _process_single_file(
             )
             await pipeline.index(document, connector_doc, user_llm)
 
+        await page_limit_service.update_page_usage(
+            user_id, estimated_pages, allow_exceed=True
+        )
         logger.info(f"Successfully indexed Google Drive file: {file_name}")
         return 1, 0, 0
 
@@ -466,6 +476,11 @@ async def _index_selected_files(
 
     Returns (indexed_count, skipped_count, errors).
     """
+    page_limit_service = PageLimitService(session)
+    pages_used, pages_limit = await page_limit_service.get_page_usage(user_id)
+    remaining_quota = pages_limit - pages_used
+    batch_estimated_pages = 0
+
     files_to_download: list[dict] = []
     errors: list[str] = []
     renamed_count = 0
@@ -486,6 +501,15 @@ async def _index_selected_files(
                 skipped += 1
             continue
 
+        file_pages = PageLimitService.estimate_pages_from_metadata(
+            file.get("name", ""), file.get("size")
+        )
+        if batch_estimated_pages + file_pages > remaining_quota:
+            display = file_name or file_id
+            errors.append(f"File '{display}': page limit would be exceeded")
+            continue
+
+        batch_estimated_pages += file_pages
         files_to_download.append(file)
 
     await _create_drive_placeholders(
@@ -507,6 +531,14 @@ async def _index_selected_files(
         on_heartbeat=on_heartbeat,
     )
 
+    if batch_indexed > 0 and files_to_download and batch_estimated_pages > 0:
+        pages_to_deduct = max(
+            1, batch_estimated_pages * batch_indexed // len(files_to_download)
+        )
+        await page_limit_service.update_page_usage(
+            user_id, pages_to_deduct, allow_exceed=True
+        )
+
     return renamed_count + batch_indexed, skipped, errors
 
 
@@ -545,6 +577,12 @@ async def _index_full_scan(
     # ------------------------------------------------------------------
     # Phase 1 (serial): collect files, run skip checks, track renames
     # ------------------------------------------------------------------
+    page_limit_service = PageLimitService(session)
+    pages_used, pages_limit = await page_limit_service.get_page_usage(user_id)
+    remaining_quota = pages_limit - pages_used
+    batch_estimated_pages = 0
+    page_limit_reached = False
+
     renamed_count = 0
     skipped = 0
     files_processed = 0
@@ -593,6 +631,20 @@ async def _index_full_scan(
                         skipped += 1
                     continue
 
+                file_pages = PageLimitService.estimate_pages_from_metadata(
+                    file.get("name", ""), file.get("size")
+                )
+                if batch_estimated_pages + file_pages > remaining_quota:
+                    if not page_limit_reached:
+                        logger.warning(
+                            "Page limit reached during Google Drive full scan, "
+                            "skipping remaining files"
+                        )
+                        page_limit_reached = True
+                    skipped += 1
+                    continue
+
+                batch_estimated_pages += file_pages
                 files_to_download.append(file)
 
             page_token = next_token
@@ -636,6 +688,14 @@ async def _index_full_scan(
         on_heartbeat=on_heartbeat_callback,
     )
 
+    if batch_indexed > 0 and files_to_download and batch_estimated_pages > 0:
+        pages_to_deduct = max(
+            1, batch_estimated_pages * batch_indexed // len(files_to_download)
+        )
+        await page_limit_service.update_page_usage(
+            user_id, pages_to_deduct, allow_exceed=True
+        )
+
     indexed = renamed_count + batch_indexed
     logger.info(
         f"Full scan complete: {indexed} indexed, {skipped} skipped, {failed} failed"
@@ -686,6 +746,12 @@ async def _index_with_delta_sync(
     # ------------------------------------------------------------------
     # Phase 1 (serial): handle removals, collect files for download
     # ------------------------------------------------------------------
+    page_limit_service = PageLimitService(session)
+    pages_used, pages_limit = await page_limit_service.get_page_usage(user_id)
+    remaining_quota = pages_limit - pages_used
+    batch_estimated_pages = 0
+    page_limit_reached = False
+
     renamed_count = 0
     skipped = 0
     files_to_download: list[dict] = []
@@ -715,6 +781,20 @@ async def _index_with_delta_sync(
                 skipped += 1
             continue
 
+        file_pages = PageLimitService.estimate_pages_from_metadata(
+            file.get("name", ""), file.get("size")
+        )
+        if batch_estimated_pages + file_pages > remaining_quota:
+            if not page_limit_reached:
+                logger.warning(
+                    "Page limit reached during Google Drive delta sync, "
+                    "skipping remaining files"
+                )
+                page_limit_reached = True
+            skipped += 1
+            continue
+
+        batch_estimated_pages += file_pages
         files_to_download.append(file)
 
     # ------------------------------------------------------------------
@@ -742,6 +822,14 @@ async def _index_with_delta_sync(
         on_heartbeat=on_heartbeat_callback,
     )
 
+    if batch_indexed > 0 and files_to_download and batch_estimated_pages > 0:
+        pages_to_deduct = max(
+            1, batch_estimated_pages * batch_indexed // len(files_to_download)
+        )
+        await page_limit_service.update_page_usage(
+            user_id, pages_to_deduct, allow_exceed=True
+        )
+
     indexed = renamed_count + batch_indexed
     logger.info(
         f"Delta sync complete: {indexed} indexed, {skipped} skipped, {failed} failed"
diff --git a/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py b/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py
index 748cb0988..2301b6260 100644
--- a/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py
@@ -28,6 +28,7 @@ from app.indexing_pipeline.connector_document import ConnectorDocument
 from app.indexing_pipeline.document_hashing import compute_identifier_hash
 from app.indexing_pipeline.indexing_pipeline_service import IndexingPipelineService
 from app.services.llm_service import get_user_long_context_llm
+from app.services.page_limit_service import PageLimitService
 from app.services.task_logging_service import TaskLoggingService
 from app.tasks.connector_indexers.base import (
     check_document_by_unique_identifier,
@@ -291,6 +292,11 @@ async def _index_selected_files(
     on_heartbeat: HeartbeatCallbackType | None = None,
 ) -> tuple[int, int, list[str]]:
     """Index user-selected files using the parallel pipeline."""
+    page_limit_service = PageLimitService(session)
+    pages_used, pages_limit = await page_limit_service.get_page_usage(user_id)
+    remaining_quota = pages_limit - pages_used
+    batch_estimated_pages = 0
+
     files_to_download: list[dict] = []
     errors: list[str] = []
     renamed_count = 0
@@ -311,6 +317,15 @@ async def _index_selected_files(
                 skipped += 1
             continue
 
+        file_pages = PageLimitService.estimate_pages_from_metadata(
+            file.get("name", ""), file.get("size")
+        )
+        if batch_estimated_pages + file_pages > remaining_quota:
+            display = file_name or file_id
+            errors.append(f"File '{display}': page limit would be exceeded")
+            continue
+
+        batch_estimated_pages += file_pages
         files_to_download.append(file)
 
     batch_indexed, _failed = await _download_and_index(
@@ -324,6 +339,14 @@ async def _index_selected_files(
         on_heartbeat=on_heartbeat,
     )
 
+    if batch_indexed > 0 and files_to_download and batch_estimated_pages > 0:
+        pages_to_deduct = max(
+            1, batch_estimated_pages * batch_indexed // len(files_to_download)
+        )
+        await page_limit_service.update_page_usage(
+            user_id, pages_to_deduct, allow_exceed=True
+        )
+
     return renamed_count + batch_indexed, skipped, errors
 
 
@@ -358,6 +381,12 @@ async def _index_full_scan(
         },
     )
 
+    page_limit_service = PageLimitService(session)
+    pages_used, pages_limit = await page_limit_service.get_page_usage(user_id)
+    remaining_quota = pages_limit - pages_used
+    batch_estimated_pages = 0
+    page_limit_reached = False
+
     renamed_count = 0
     skipped = 0
     files_to_download: list[dict] = []
@@ -383,6 +412,21 @@ async def _index_full_scan(
             else:
                 skipped += 1
             continue
+
+        file_pages = PageLimitService.estimate_pages_from_metadata(
+            file.get("name", ""), file.get("size")
+        )
+        if batch_estimated_pages + file_pages > remaining_quota:
+            if not page_limit_reached:
+                logger.warning(
+                    "Page limit reached during OneDrive full scan, "
+                    "skipping remaining files"
+                )
+                page_limit_reached = True
+            skipped += 1
+            continue
+
+        batch_estimated_pages += file_pages
         files_to_download.append(file)
 
     batch_indexed, failed = await _download_and_index(
@@ -396,6 +440,14 @@ async def _index_full_scan(
         on_heartbeat=on_heartbeat_callback,
     )
 
+    if batch_indexed > 0 and files_to_download and batch_estimated_pages > 0:
+        pages_to_deduct = max(
+            1, batch_estimated_pages * batch_indexed // len(files_to_download)
+        )
+        await page_limit_service.update_page_usage(
+            user_id, pages_to_deduct, allow_exceed=True
+        )
+
     indexed = renamed_count + batch_indexed
     logger.info(
         f"Full scan complete: {indexed} indexed, {skipped} skipped, {failed} failed"
@@ -441,6 +493,12 @@ async def _index_with_delta_sync(
 
     logger.info(f"Processing {len(changes)} delta changes")
 
+    page_limit_service = PageLimitService(session)
+    pages_used, pages_limit = await page_limit_service.get_page_usage(user_id)
+    remaining_quota = pages_limit - pages_used
+    batch_estimated_pages = 0
+    page_limit_reached = False
+
     renamed_count = 0
     skipped = 0
     files_to_download: list[dict] = []
@@ -471,6 +529,20 @@ async def _index_with_delta_sync(
                 skipped += 1
             continue
 
+        file_pages = PageLimitService.estimate_pages_from_metadata(
+            change.get("name", ""), change.get("size")
+        )
+        if batch_estimated_pages + file_pages > remaining_quota:
+            if not page_limit_reached:
+                logger.warning(
+                    "Page limit reached during OneDrive delta sync, "
+                    "skipping remaining files"
+                )
+                page_limit_reached = True
+            skipped += 1
+            continue
+
+        batch_estimated_pages += file_pages
         files_to_download.append(change)
 
     batch_indexed, failed = await _download_and_index(
@@ -484,6 +556,14 @@ async def _index_with_delta_sync(
         on_heartbeat=on_heartbeat_callback,
     )
 
+    if batch_indexed > 0 and files_to_download and batch_estimated_pages > 0:
+        pages_to_deduct = max(
+            1, batch_estimated_pages * batch_indexed // len(files_to_download)
+        )
+        await page_limit_service.update_page_usage(
+            user_id, pages_to_deduct, allow_exceed=True
+        )
+
     indexed = renamed_count + batch_indexed
     logger.info(
         f"Delta sync complete: {indexed} indexed, {skipped} skipped, {failed} failed"
diff --git a/surfsense_backend/tests/integration/document_upload/conftest.py b/surfsense_backend/tests/integration/document_upload/conftest.py
index 1f1c7df59..6640fefdf 100644
--- a/surfsense_backend/tests/integration/document_upload/conftest.py
+++ b/surfsense_backend/tests/integration/document_upload/conftest.py
@@ -3,6 +3,7 @@
 Prerequisites: PostgreSQL + pgvector only.
 
 External system boundaries are mocked:
+  - ETL parsing — LlamaParse (external API) and Docling (heavy library)
   - LLM summarization, text embedding, text chunking (external APIs)
   - Redis heartbeat (external infrastructure)
   - Task dispatch is swapped via DI (InlineTaskDispatcher)
@@ -11,6 +12,7 @@ External system boundaries are mocked:
 from __future__ import annotations
 
 import contextlib
+import os
 from collections.abc import AsyncGenerator
 from unittest.mock import AsyncMock, MagicMock
 
@@ -298,3 +300,64 @@ def _mock_redis_heartbeat(monkeypatch):
         "app.tasks.celery_tasks.document_tasks._run_heartbeat_loop",
         AsyncMock(),
     )
+
+
+@pytest.fixture(autouse=True)
+def _mock_etl_parsing(monkeypatch):
+    """Mock ETL parsing services — LlamaParse and Docling are external boundaries.
+
+    Preserves the real contract: empty/corrupt files raise an error just like
+    the actual services would, so tests covering failure paths keep working.
+    """
+
+    _MOCK_MARKDOWN = "# Mocked Document\n\nThis is mocked ETL content."
+
+    def _reject_empty(file_path: str) -> None:
+        if os.path.getsize(file_path) == 0:
+            raise RuntimeError(f"Cannot parse empty file: {file_path}")
+
+    # -- LlamaParse mock (external API) --------------------------------
+
+    class _FakeMarkdownDoc:
+        def __init__(self, text: str):
+            self.text = text
+
+    class _FakeLlamaParseResult:
+        async def aget_markdown_documents(self, *, split_by_page=False):
+            return [_FakeMarkdownDoc(_MOCK_MARKDOWN)]
+
+    async def _fake_llamacloud_parse(**kwargs):
+        _reject_empty(kwargs["file_path"])
+        return _FakeLlamaParseResult()
+
+    monkeypatch.setattr(
+        "app.tasks.document_processors.file_processors.parse_with_llamacloud_retry",
+        _fake_llamacloud_parse,
+    )
+
+    # -- Docling mock (heavy library boundary) -------------------------
+
+    async def _fake_docling_parse(file_path: str, filename: str):
+        _reject_empty(file_path)
+        return _MOCK_MARKDOWN
+
+    monkeypatch.setattr(
+        "app.tasks.document_processors.file_processors.parse_with_docling",
+        _fake_docling_parse,
+    )
+
+    class _FakeDoclingResult:
+        class document:
+            @staticmethod
+            def export_to_markdown():
+                return _MOCK_MARKDOWN
+
+    class _FakeDocumentConverter:
+        def convert(self, file_path):
+            _reject_empty(file_path)
+            return _FakeDoclingResult()
+
+    monkeypatch.setattr(
+        "docling.document_converter.DocumentConverter",
+        _FakeDocumentConverter,
+    )
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py b/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
index 3fe8a183d..20bd3f3d6 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
@@ -248,12 +248,33 @@ def _folder_dict(file_id: str, name: str) -> dict:
     }
 
 
+def _make_page_limit_session(pages_used=0, pages_limit=999_999):
+    """Build a mock DB session that real PageLimitService can operate against."""
+
+    class _FakeUser:
+        def __init__(self, pu, pl):
+            self.pages_used = pu
+            self.pages_limit = pl
+
+    fake_user = _FakeUser(pages_used, pages_limit)
+    session = AsyncMock()
+
+    def _make_result(*_a, **_kw):
+        r = MagicMock()
+        r.first.return_value = (fake_user.pages_used, fake_user.pages_limit)
+        r.unique.return_value.scalar_one_or_none.return_value = fake_user
+        return r
+
+    session.execute = AsyncMock(side_effect=_make_result)
+    return session, fake_user
+
+
 @pytest.fixture
 def full_scan_mocks(mock_drive_client, monkeypatch):
     """Wire up all mocks needed to call _index_full_scan in isolation."""
     import app.tasks.connector_indexers.google_drive_indexer as _mod
 
-    mock_session = AsyncMock()
+    mock_session, _ = _make_page_limit_session()
     mock_connector = MagicMock()
     mock_task_logger = MagicMock()
     mock_task_logger.log_task_progress = AsyncMock()
@@ -472,7 +493,7 @@ async def test_delta_sync_removals_serial_rest_parallel(monkeypatch):
         AsyncMock(return_value=MagicMock()),
     )
 
-    mock_session = AsyncMock()
+    mock_session, _ = _make_page_limit_session()
     mock_task_logger = MagicMock()
     mock_task_logger.log_task_progress = AsyncMock()
 
@@ -512,7 +533,7 @@ def selected_files_mocks(mock_drive_client, monkeypatch):
     """Wire up mocks for _index_selected_files tests."""
     import app.tasks.connector_indexers.google_drive_indexer as _mod
 
-    mock_session = AsyncMock()
+    mock_session, _ = _make_page_limit_session()
 
     get_file_results: dict[str, tuple[dict | None, str | None]] = {}
 
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py b/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
new file mode 100644
index 000000000..1c93965f3
--- /dev/null
+++ b/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
@@ -0,0 +1,648 @@
+"""Tests for page limit enforcement in connector indexers.
+
+Covers:
+  A) PageLimitService.estimate_pages_from_metadata — pure function (no mocks)
+  B) Page-limit quota gating in _index_selected_files, _index_full_scan and
+     _index_with_delta_sync, run against the real PageLimitService with a mock
+     DB session. Google Drive is covered in depth; OneDrive/Dropbox are smoke-tested.
+"""
+
+from unittest.mock import AsyncMock, MagicMock
+
+import pytest
+
+from app.services.page_limit_service import PageLimitService
+
+pytestmark = pytest.mark.unit
+
+_USER_ID = "00000000-0000-0000-0000-000000000001"
+_CONNECTOR_ID = 42
+_SEARCH_SPACE_ID = 1
+
+
+# ===================================================================
+# A) PageLimitService.estimate_pages_from_metadata — pure function
+#    No mocks: it's a staticmethod with no I/O.
+# ===================================================================
+
+
+class TestEstimatePagesFromMetadata:
+    """Vertical slices for the page estimation staticmethod."""
+
+    def test_pdf_100kb_returns_1(self):
+        assert PageLimitService.estimate_pages_from_metadata(".pdf", 100 * 1024) == 1
+
+    def test_pdf_500kb_returns_5(self):
+        assert PageLimitService.estimate_pages_from_metadata(".pdf", 500 * 1024) == 5
+
+    def test_pdf_1mb(self):
+        assert PageLimitService.estimate_pages_from_metadata(".pdf", 1024 * 1024) == 10
+
+    def test_docx_50kb_returns_1(self):
+        assert PageLimitService.estimate_pages_from_metadata(".docx", 50 * 1024) == 1
+
+    def test_docx_200kb(self):
+        assert PageLimitService.estimate_pages_from_metadata(".docx", 200 * 1024) == 4
+
+    def test_pptx_uses_200kb_per_page(self):
+        assert PageLimitService.estimate_pages_from_metadata(".pptx", 600 * 1024) == 3
+
+    def test_xlsx_uses_100kb_per_page(self):
+        assert PageLimitService.estimate_pages_from_metadata(".xlsx", 300 * 1024) == 3
+
+    def test_txt_uses_3000_bytes_per_page(self):
+        assert PageLimitService.estimate_pages_from_metadata(".txt", 9000) == 3
+
+    def test_image_always_returns_1(self):
+        for ext in (".jpg", ".png", ".gif", ".webp"):
+            assert PageLimitService.estimate_pages_from_metadata(ext, 5_000_000) == 1
+
+    def test_audio_uses_1mb_per_page(self):
+        assert PageLimitService.estimate_pages_from_metadata(".mp3", 3 * 1024 * 1024) == 3
+
+    def test_video_uses_5mb_per_page(self):
+        assert PageLimitService.estimate_pages_from_metadata(".mp4", 15 * 1024 * 1024) == 3
+
+    def test_unknown_ext_uses_80kb_per_page(self):
+        assert PageLimitService.estimate_pages_from_metadata(".xyz", 160 * 1024) == 2
+
+    def test_zero_size_returns_1(self):
+        assert PageLimitService.estimate_pages_from_metadata(".pdf", 0) == 1
+
+    def test_negative_size_returns_1(self):
+        assert PageLimitService.estimate_pages_from_metadata(".pdf", -500) == 1
+
+    def test_minimum_is_always_1(self):
+        assert PageLimitService.estimate_pages_from_metadata(".pdf", 50) == 1
+
+    def test_epub_uses_50kb_per_page(self):
+        assert PageLimitService.estimate_pages_from_metadata(".epub", 250 * 1024) == 5
+
+
+# ===================================================================
+# B) Page-limit enforcement in connector indexers
+#    System boundary mocked: DB session (for PageLimitService)
+#    System boundary mocked: external API clients, download/ETL
+#    NOT mocked: PageLimitService itself (our own code)
+# ===================================================================
+
+
+class _FakeUser:
+    """Stands in for the User ORM model at the DB boundary."""
+
+    def __init__(self, pages_used: int = 0, pages_limit: int = 100):
+        self.pages_used = pages_used
+        self.pages_limit = pages_limit
+
+
+def _make_page_limit_session(pages_used: int = 0, pages_limit: int = 100):
+    """Build a mock DB session that real PageLimitService can operate against.
+
+    Every ``session.execute()`` returns a result compatible with both
+    ``get_page_usage`` (.first() → tuple) and ``update_page_usage``
+    (.unique().scalar_one_or_none() → User-like).
+    """
+    fake_user = _FakeUser(pages_used, pages_limit)
+    session = AsyncMock()
+
+    def _make_result(*_args, **_kwargs):
+        result = MagicMock()
+        result.first.return_value = (fake_user.pages_used, fake_user.pages_limit)
+        result.unique.return_value.scalar_one_or_none.return_value = fake_user
+        return result
+
+    session.execute = AsyncMock(side_effect=_make_result)
+    return session, fake_user
+
+
+def _make_gdrive_file(file_id: str, name: str, size: int = 80 * 1024) -> dict:
+    return {
+        "id": file_id,
+        "name": name,
+        "mimeType": "application/octet-stream",
+        "size": str(size),
+    }
+
+
+# ---------------------------------------------------------------------------
+# Google Drive: _index_selected_files
+# ---------------------------------------------------------------------------
+
+
+@pytest.fixture
+def gdrive_selected_mocks(monkeypatch):
+    """Mocks for Google Drive _index_selected_files — only system boundaries."""
+    import app.tasks.connector_indexers.google_drive_indexer as _mod
+
+    session, fake_user = _make_page_limit_session(0, 100)
+
+    get_file_results: dict[str, tuple[dict | None, str | None]] = {}
+
+    async def _fake_get_file(client, file_id):
+        return get_file_results.get(file_id, (None, f"Not configured: {file_id}"))
+
+    monkeypatch.setattr(_mod, "get_file_by_id", _fake_get_file)
+    monkeypatch.setattr(
+        _mod, "_should_skip_file", AsyncMock(return_value=(False, None))
+    )
+
+    download_and_index_mock = AsyncMock(return_value=(0, 0))
+    monkeypatch.setattr(_mod, "_download_and_index", download_and_index_mock)
+
+    pipeline_mock = MagicMock()
+    pipeline_mock.create_placeholder_documents = AsyncMock(return_value=0)
+    monkeypatch.setattr(
+        _mod, "IndexingPipelineService", MagicMock(return_value=pipeline_mock)
+    )
+
+    return {
+        "mod": _mod,
+        "session": session,
+        "fake_user": fake_user,
+        "get_file_results": get_file_results,
+        "download_and_index_mock": download_and_index_mock,
+    }
+
+
+async def _run_gdrive_selected(mocks, file_ids):
+    from app.tasks.connector_indexers.google_drive_indexer import (
+        _index_selected_files,
+    )
+
+    return await _index_selected_files(
+        MagicMock(),
+        mocks["session"],
+        file_ids,
+        connector_id=_CONNECTOR_ID,
+        search_space_id=_SEARCH_SPACE_ID,
+        user_id=_USER_ID,
+        enable_summary=True,
+    )
+
+
+async def test_gdrive_files_within_quota_are_downloaded(gdrive_selected_mocks):
+    """Files whose cumulative estimated pages fit within remaining quota
+    are sent to _download_and_index."""
+    m = gdrive_selected_mocks
+    m["fake_user"].pages_used = 0
+    m["fake_user"].pages_limit = 100
+
+    for fid in ("f1", "f2", "f3"):
+        m["get_file_results"][fid] = (
+            _make_gdrive_file(fid, f"{fid}.xyz", size=80 * 1024), None,
+        )
+    m["download_and_index_mock"].return_value = (3, 0)
+
+    indexed, _skipped, errors = await _run_gdrive_selected(
+        m, [("f1", "f1.xyz"), ("f2", "f2.xyz"), ("f3", "f3.xyz")]
+    )
+
+    assert indexed == 3
+    assert errors == []
+    call_files = m["download_and_index_mock"].call_args[0][2]
+    assert len(call_files) == 3
+
+
+async def test_gdrive_files_exceeding_quota_rejected(gdrive_selected_mocks):
+    """Files whose pages would exceed remaining quota are rejected."""
+    m = gdrive_selected_mocks
+    m["fake_user"].pages_used = 98
+    m["fake_user"].pages_limit = 100
+
+    m["get_file_results"]["big"] = (
+        _make_gdrive_file("big", "huge.pdf", size=500 * 1024), None,
+    )
+
+    indexed, _skipped, errors = await _run_gdrive_selected(m, [("big", "huge.pdf")])
+
+    assert indexed == 0
+    assert len(errors) == 1
+    assert "page limit" in errors[0].lower()
+
+
+async def test_gdrive_quota_mix_partial_indexing(gdrive_selected_mocks):
+    """3rd file pushes over quota → only first two indexed."""
+    m = gdrive_selected_mocks
+    m["fake_user"].pages_used = 0
+    m["fake_user"].pages_limit = 2
+
+    for fid in ("f1", "f2", "f3"):
+        m["get_file_results"][fid] = (
+            _make_gdrive_file(fid, f"{fid}.xyz", size=80 * 1024), None,
+        )
+    m["download_and_index_mock"].return_value = (2, 0)
+
+    indexed, _skipped, errors = await _run_gdrive_selected(
+        m, [("f1", "f1.xyz"), ("f2", "f2.xyz"), ("f3", "f3.xyz")]
+    )
+
+    assert indexed == 2
+    assert len(errors) == 1
+    call_files = m["download_and_index_mock"].call_args[0][2]
+    assert {f["id"] for f in call_files} == {"f1", "f2"}
+
+
+async def test_gdrive_proportional_page_deduction(gdrive_selected_mocks):
+    """Pages deducted are proportional to successfully indexed files."""
+    m = gdrive_selected_mocks
+    m["fake_user"].pages_used = 0
+    m["fake_user"].pages_limit = 100
+
+    for fid in ("f1", "f2", "f3", "f4"):
+        m["get_file_results"][fid] = (
+            _make_gdrive_file(fid, f"{fid}.xyz", size=80 * 1024), None,
+        )
+    m["download_and_index_mock"].return_value = (2, 2)
+
+    await _run_gdrive_selected(
+        m,
+        [("f1", "f1.xyz"), ("f2", "f2.xyz"), ("f3", "f3.xyz"), ("f4", "f4.xyz")],
+    )
+
+    assert m["fake_user"].pages_used == 2
+
+
+async def test_gdrive_no_deduction_when_nothing_indexed(gdrive_selected_mocks):
+    """If batch_indexed == 0, user's pages_used stays unchanged."""
+    m = gdrive_selected_mocks
+    m["fake_user"].pages_used = 5
+    m["fake_user"].pages_limit = 100
+
+    m["get_file_results"]["f1"] = (
+        _make_gdrive_file("f1", "f1.xyz", size=80 * 1024), None,
+    )
+    m["download_and_index_mock"].return_value = (0, 1)
+
+    await _run_gdrive_selected(m, [("f1", "f1.xyz")])
+
+    assert m["fake_user"].pages_used == 5
+
+
+async def test_gdrive_zero_quota_rejects_all(gdrive_selected_mocks):
+    """When pages_used == pages_limit, every file is rejected."""
+    m = gdrive_selected_mocks
+    m["fake_user"].pages_used = 100
+    m["fake_user"].pages_limit = 100
+
+    for fid in ("f1", "f2"):
+        m["get_file_results"][fid] = (
+            _make_gdrive_file(fid, f"{fid}.xyz", size=80 * 1024), None,
+        )
+
+    indexed, _skipped, errors = await _run_gdrive_selected(
+        m, [("f1", "f1.xyz"), ("f2", "f2.xyz")]
+    )
+
+    assert indexed == 0
+    assert len(errors) == 2
+
+
+# ---------------------------------------------------------------------------
+# Google Drive: _index_full_scan
+# ---------------------------------------------------------------------------
+
+
+@pytest.fixture
+def gdrive_full_scan_mocks(monkeypatch):
+    import app.tasks.connector_indexers.google_drive_indexer as _mod
+
+    session, fake_user = _make_page_limit_session(0, 100)
+    mock_task_logger = MagicMock()
+    mock_task_logger.log_task_progress = AsyncMock()
+
+    monkeypatch.setattr(
+        _mod, "_should_skip_file", AsyncMock(return_value=(False, None))
+    )
+
+    download_mock = AsyncMock(return_value=([], 0))
+    monkeypatch.setattr(_mod, "_download_files_parallel", download_mock)
+
+    batch_mock = AsyncMock(return_value=([], 0, 0))
+    pipeline_mock = MagicMock()
+    pipeline_mock.index_batch_parallel = batch_mock
+    pipeline_mock.create_placeholder_documents = AsyncMock(return_value=0)
+    monkeypatch.setattr(
+        _mod, "IndexingPipelineService", MagicMock(return_value=pipeline_mock)
+    )
+    monkeypatch.setattr(
+        _mod, "get_user_long_context_llm", AsyncMock(return_value=MagicMock())
+    )
+
+    return {
+        "mod": _mod,
+        "session": session,
+        "fake_user": fake_user,
+        "task_logger": mock_task_logger,
+        "download_mock": download_mock,
+        "batch_mock": batch_mock,
+    }
+
+
+async def _run_gdrive_full_scan(mocks, max_files=500):
+    from app.tasks.connector_indexers.google_drive_indexer import _index_full_scan
+
+    return await _index_full_scan(
+        MagicMock(),
+        mocks["session"],
+        MagicMock(),
+        _CONNECTOR_ID,
+        _SEARCH_SPACE_ID,
+        _USER_ID,
+        "folder-root",
+        "My Folder",
+        mocks["task_logger"],
+        MagicMock(),
+        max_files,
+        include_subfolders=False,
+        enable_summary=True,
+    )
+
+
+async def test_gdrive_full_scan_skips_over_quota(gdrive_full_scan_mocks, monkeypatch):
+    m = gdrive_full_scan_mocks
+    m["fake_user"].pages_used = 0
+    m["fake_user"].pages_limit = 2
+
+    page_files = [
+        _make_gdrive_file(f"f{i}", f"file{i}.xyz", size=80 * 1024) for i in range(5)
+    ]
+    monkeypatch.setattr(
+        m["mod"], "get_files_in_folder",
+        AsyncMock(return_value=(page_files, None, None)),
+    )
+    m["download_mock"].return_value = ([], 0)
+    m["batch_mock"].return_value = ([], 2, 0)
+
+    _indexed, skipped = await _run_gdrive_full_scan(m)
+
+    call_files = m["download_mock"].call_args[0][1]
+    assert len(call_files) == 2
+    assert skipped == 3
+
+
+async def test_gdrive_full_scan_deducts_after_indexing(
+    gdrive_full_scan_mocks, monkeypatch
+):
+    m = gdrive_full_scan_mocks
+    m["fake_user"].pages_used = 0
+    m["fake_user"].pages_limit = 100
+
+    page_files = [
+        _make_gdrive_file(f"f{i}", f"file{i}.xyz", size=80 * 1024) for i in range(3)
+    ]
+    monkeypatch.setattr(
+        m["mod"], "get_files_in_folder",
+        AsyncMock(return_value=(page_files, None, None)),
+    )
+    mock_docs = [MagicMock() for _ in range(3)]
+    m["download_mock"].return_value = (mock_docs, 0)
+    m["batch_mock"].return_value = ([], 3, 0)
+
+    await _run_gdrive_full_scan(m)
+
+    assert m["fake_user"].pages_used == 3
+
+
+# ---------------------------------------------------------------------------
+# Google Drive: _index_with_delta_sync
+# ---------------------------------------------------------------------------
+
+
+async def test_gdrive_delta_sync_skips_over_quota(monkeypatch):
+    import app.tasks.connector_indexers.google_drive_indexer as _mod
+
+    session, _ = _make_page_limit_session(0, 2)
+
+    changes = [
+        {
+            "fileId": f"mod{i}",
+            "file": _make_gdrive_file(f"mod{i}", f"mod{i}.xyz", size=80 * 1024),
+        }
+        for i in range(5)
+    ]
+    monkeypatch.setattr(
+        _mod, "fetch_all_changes",
+        AsyncMock(return_value=(changes, "new-token", None)),
+    )
+    monkeypatch.setattr(_mod, "categorize_change", lambda change: "modified")
+    monkeypatch.setattr(
+        _mod, "_should_skip_file", AsyncMock(return_value=(False, None))
+    )
+
+    download_mock = AsyncMock(return_value=([], 0))
+    monkeypatch.setattr(_mod, "_download_files_parallel", download_mock)
+
+    batch_mock = AsyncMock(return_value=([], 2, 0))
+    pipeline_mock = MagicMock()
+    pipeline_mock.index_batch_parallel = batch_mock
+    pipeline_mock.create_placeholder_documents = AsyncMock(return_value=0)
+    monkeypatch.setattr(
+        _mod, "IndexingPipelineService", MagicMock(return_value=pipeline_mock)
+    )
+    monkeypatch.setattr(
+        _mod, "get_user_long_context_llm", AsyncMock(return_value=MagicMock())
+    )
+
+    mock_task_logger = MagicMock()
+    mock_task_logger.log_task_progress = AsyncMock()
+
+    _indexed, skipped = await _mod._index_with_delta_sync(
+        MagicMock(), session, MagicMock(),
+        _CONNECTOR_ID, _SEARCH_SPACE_ID, _USER_ID,
+        "folder-root", "start-token",
+        mock_task_logger, MagicMock(),
+        max_files=500, enable_summary=True,
+    )
+
+    call_files = download_mock.call_args[0][1]
+    assert len(call_files) == 2
+    assert skipped == 3
+
+
+# ===================================================================
+# C) OneDrive smoke tests — verify page limit wiring
+# ===================================================================
+
+
+def _make_onedrive_file(file_id: str, name: str, size: int = 80 * 1024) -> dict:
+    return {
+        "id": file_id,
+        "name": name,
+        "file": {"mimeType": "application/octet-stream"},
+        "size": str(size),
+        "lastModifiedDateTime": "2026-01-01T00:00:00Z",
+    }
+
+
+@pytest.fixture
+def onedrive_selected_mocks(monkeypatch):
+    import app.tasks.connector_indexers.onedrive_indexer as _mod
+
+    session, fake_user = _make_page_limit_session(0, 100)
+
+    get_file_results: dict[str, tuple[dict | None, str | None]] = {}
+
+    async def _fake_get_file(client, file_id):
+        return get_file_results.get(file_id, (None, f"Not found: {file_id}"))
+
+    monkeypatch.setattr(_mod, "get_file_by_id", _fake_get_file)
+    monkeypatch.setattr(
+        _mod, "_should_skip_file", AsyncMock(return_value=(False, None))
+    )
+
+    download_and_index_mock = AsyncMock(return_value=(0, 0))
+    monkeypatch.setattr(_mod, "_download_and_index", download_and_index_mock)
+
+    pipeline_mock = MagicMock()
+    pipeline_mock.create_placeholder_documents = AsyncMock(return_value=0)
+    monkeypatch.setattr(
+        _mod, "IndexingPipelineService", MagicMock(return_value=pipeline_mock)
+    )
+
+    return {
+        "session": session,
+        "fake_user": fake_user,
+        "get_file_results": get_file_results,
+        "download_and_index_mock": download_and_index_mock,
+    }
+
+
+async def _run_onedrive_selected(mocks, file_ids):
+    from app.tasks.connector_indexers.onedrive_indexer import _index_selected_files
+
+    return await _index_selected_files(
+        MagicMock(), mocks["session"], file_ids,
+        connector_id=_CONNECTOR_ID, search_space_id=_SEARCH_SPACE_ID,
+        user_id=_USER_ID, enable_summary=True,
+    )
+
+
+async def test_onedrive_over_quota_rejected(onedrive_selected_mocks):
+    """OneDrive: files exceeding quota produce errors, not downloads."""
+    m = onedrive_selected_mocks
+    m["fake_user"].pages_used = 99
+    m["fake_user"].pages_limit = 100
+
+    m["get_file_results"]["big"] = (
+        _make_onedrive_file("big", "huge.pdf", size=500 * 1024), None,
+    )
+
+    indexed, _skipped, errors = await _run_onedrive_selected(m, [("big", "huge.pdf")])
+
+    assert indexed == 0
+    assert len(errors) == 1
+    assert "page limit" in errors[0].lower()
+
+
+async def test_onedrive_deducts_after_success(onedrive_selected_mocks):
+    """OneDrive: pages_used increases after successful indexing."""
+    m = onedrive_selected_mocks
+    m["fake_user"].pages_used = 0
+    m["fake_user"].pages_limit = 100
+
+    for fid in ("f1", "f2"):
+        m["get_file_results"][fid] = (
+            _make_onedrive_file(fid, f"{fid}.xyz", size=80 * 1024), None,
+        )
+    m["download_and_index_mock"].return_value = (2, 0)
+
+    await _run_onedrive_selected(m, [("f1", "f1.xyz"), ("f2", "f2.xyz")])
+
+    assert m["fake_user"].pages_used == 2
+
+
+# ===================================================================
+# D) Dropbox smoke tests — verify page limit wiring
+# ===================================================================
+
+
+def _make_dropbox_file(file_path: str, name: str, size: int = 80 * 1024) -> dict:
+    return {
+        "id": f"id:{file_path}",
+        "name": name,
+        ".tag": "file",
+        "path_lower": file_path,
+        "size": str(size),
+        "server_modified": "2026-01-01T00:00:00Z",
+        "content_hash": f"hash_{name}",
+    }
+
+
+@pytest.fixture
+def dropbox_selected_mocks(monkeypatch):
+    import app.tasks.connector_indexers.dropbox_indexer as _mod
+
+    session, fake_user = _make_page_limit_session(0, 100)
+
+    get_file_results: dict[str, tuple[dict | None, str | None]] = {}
+
+    async def _fake_get_file(client, file_path):
+        return get_file_results.get(file_path, (None, f"Not found: {file_path}"))
+
+    monkeypatch.setattr(_mod, "get_file_by_path", _fake_get_file)
+    monkeypatch.setattr(
+        _mod, "_should_skip_file", AsyncMock(return_value=(False, None))
+    )
+
+    download_and_index_mock = AsyncMock(return_value=(0, 0))
+    monkeypatch.setattr(_mod, "_download_and_index", download_and_index_mock)
+
+    pipeline_mock = MagicMock()
+    pipeline_mock.create_placeholder_documents = AsyncMock(return_value=0)
+    monkeypatch.setattr(
+        _mod, "IndexingPipelineService", MagicMock(return_value=pipeline_mock)
+    )
+
+    return {
+        "session": session,
+        "fake_user": fake_user,
+        "get_file_results": get_file_results,
+        "download_and_index_mock": download_and_index_mock,
+    }
+
+
+async def _run_dropbox_selected(mocks, file_paths):
+    from app.tasks.connector_indexers.dropbox_indexer import _index_selected_files
+
+    return await _index_selected_files(
+        MagicMock(), mocks["session"], file_paths,
+        connector_id=_CONNECTOR_ID, search_space_id=_SEARCH_SPACE_ID,
+        user_id=_USER_ID, enable_summary=True,
+    )
+
+
+async def test_dropbox_over_quota_rejected(dropbox_selected_mocks):
+    """Dropbox: files exceeding quota produce errors, not downloads."""
+    m = dropbox_selected_mocks
+    m["fake_user"].pages_used = 99
+    m["fake_user"].pages_limit = 100
+
+    m["get_file_results"]["/huge.pdf"] = (
+        _make_dropbox_file("/huge.pdf", "huge.pdf", size=500 * 1024), None,
+    )
+
+    indexed, _skipped, errors = await _run_dropbox_selected(
+        m, [("/huge.pdf", "huge.pdf")]
+    )
+
+    assert indexed == 0
+    assert len(errors) == 1
+    assert "page limit" in errors[0].lower()
+
+
+async def test_dropbox_deducts_after_success(dropbox_selected_mocks):
+    """Dropbox: pages_used increases after successful indexing."""
+    m = dropbox_selected_mocks
+    m["fake_user"].pages_used = 0
+    m["fake_user"].pages_limit = 100
+
+    for name in ("f1.xyz", "f2.xyz"):
+        path = f"/{name}"
+        m["get_file_results"][path] = (
+            _make_dropbox_file(path, name, size=80 * 1024), None,
+        )
+    m["download_and_index_mock"].return_value = (2, 0)
+
+    await _run_dropbox_selected(m, [("/f1.xyz", "f1.xyz"), ("/f2.xyz", "f2.xyz")])
+
+    assert m["fake_user"].pages_used == 2

From a2b354104631a17c5717cac53837e022843a58bf Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sat, 4 Apr 2026 03:11:56 +0530
Subject: [PATCH 110/202] chore: ran linting

---
 .../app/services/page_limit_service.py        | 96 +++++++++++++++----
 .../app/tasks/connector_indexers/base.py      |  1 +
 .../local_folder_indexer.py                   |  1 +
 .../integration/document_upload/conftest.py   | 15 +--
 .../test_local_folder_pipeline.py             |  2 +-
 .../connector_indexers/test_page_limits.py    | 84 +++++++++++-----
 6 files changed, 150 insertions(+), 49 deletions(-)

diff --git a/surfsense_backend/app/services/page_limit_service.py b/surfsense_backend/app/services/page_limit_service.py
index ea22067be..47fe07fc6 100644
--- a/surfsense_backend/app/services/page_limit_service.py
+++ b/surfsense_backend/app/services/page_limit_service.py
@@ -257,28 +257,83 @@ class PageLimitService:
             return max(1, file_size // (100 * 1024))
 
         if file_ext in {
-            ".doc", ".docx", ".docm", ".dot", ".dotm",
-            ".odt", ".ott", ".sxw", ".stw", ".uot",
-            ".rtf", ".pages", ".wpd", ".wps",
-            ".abw", ".zabw", ".cwk", ".hwp", ".lwp",
-            ".mcw", ".mw", ".sdw", ".vor",
+            ".doc",
+            ".docx",
+            ".docm",
+            ".dot",
+            ".dotm",
+            ".odt",
+            ".ott",
+            ".sxw",
+            ".stw",
+            ".uot",
+            ".rtf",
+            ".pages",
+            ".wpd",
+            ".wps",
+            ".abw",
+            ".zabw",
+            ".cwk",
+            ".hwp",
+            ".lwp",
+            ".mcw",
+            ".mw",
+            ".sdw",
+            ".vor",
         }:
             return max(1, file_size // (50 * 1024))
 
         if file_ext in {
-            ".ppt", ".pptx", ".pptm", ".pot", ".potx",
-            ".odp", ".otp", ".sxi", ".sti", ".uop",
-            ".key", ".sda", ".sdd", ".sdp",
+            ".ppt",
+            ".pptx",
+            ".pptm",
+            ".pot",
+            ".potx",
+            ".odp",
+            ".otp",
+            ".sxi",
+            ".sti",
+            ".uop",
+            ".key",
+            ".sda",
+            ".sdd",
+            ".sdp",
         }:
             return max(1, file_size // (200 * 1024))
 
         if file_ext in {
-            ".xls", ".xlsx", ".xlsm", ".xlsb", ".xlw", ".xlr",
-            ".ods", ".ots", ".fods", ".numbers",
-            ".123", ".wk1", ".wk2", ".wk3", ".wk4", ".wks",
-            ".wb1", ".wb2", ".wb3", ".wq1", ".wq2",
-            ".csv", ".tsv", ".slk", ".sylk", ".dif", ".dbf",
-            ".prn", ".qpw", ".602", ".et", ".eth",
+            ".xls",
+            ".xlsx",
+            ".xlsm",
+            ".xlsb",
+            ".xlw",
+            ".xlr",
+            ".ods",
+            ".ots",
+            ".fods",
+            ".numbers",
+            ".123",
+            ".wk1",
+            ".wk2",
+            ".wk3",
+            ".wk4",
+            ".wks",
+            ".wb1",
+            ".wb2",
+            ".wb3",
+            ".wq1",
+            ".wq2",
+            ".csv",
+            ".tsv",
+            ".slk",
+            ".sylk",
+            ".dif",
+            ".dbf",
+            ".prn",
+            ".qpw",
+            ".602",
+            ".et",
+            ".eth",
         }:
             return max(1, file_size // (100 * 1024))
 
@@ -289,8 +344,17 @@ class PageLimitService:
             return max(1, file_size // 3000)
 
         if file_ext in {
-            ".jpg", ".jpeg", ".png", ".gif", ".bmp", ".tiff",
-            ".webp", ".svg", ".cgm", ".odg", ".pbd",
+            ".jpg",
+            ".jpeg",
+            ".png",
+            ".gif",
+            ".bmp",
+            ".tiff",
+            ".webp",
+            ".svg",
+            ".cgm",
+            ".odg",
+            ".pbd",
         }:
             return 1
 
diff --git a/surfsense_backend/app/tasks/connector_indexers/base.py b/surfsense_backend/app/tasks/connector_indexers/base.py
index 6b4bed4b5..ffc8ab72e 100644
--- a/surfsense_backend/app/tasks/connector_indexers/base.py
+++ b/surfsense_backend/app/tasks/connector_indexers/base.py
@@ -4,6 +4,7 @@ Base functionality and shared imports for connector indexers.
 
 import logging
 from datetime import UTC, datetime, timedelta
+
 from sqlalchemy.ext.asyncio import AsyncSession
 from sqlalchemy.future import select
 
diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
index acfbce0bf..fa50e86d3 100644
--- a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -205,6 +205,7 @@ def _compute_final_pages(
     actual = page_limit_service.estimate_pages_from_content_length(content_length)
     return max(estimated_pages, actual)
 
+
 DEFAULT_EXCLUDE_PATTERNS = [
     ".git",
     "node_modules",
diff --git a/surfsense_backend/tests/integration/document_upload/conftest.py b/surfsense_backend/tests/integration/document_upload/conftest.py
index 6640fefdf..41c379e58 100644
--- a/surfsense_backend/tests/integration/document_upload/conftest.py
+++ b/surfsense_backend/tests/integration/document_upload/conftest.py
@@ -302,6 +302,9 @@ def _mock_redis_heartbeat(monkeypatch):
     )
 
 
+_MOCK_ETL_MARKDOWN = "# Mocked Document\n\nThis is mocked ETL content."
+
+
 @pytest.fixture(autouse=True)
 def _mock_etl_parsing(monkeypatch):
     """Mock ETL parsing services — LlamaParse and Docling are external boundaries.
@@ -310,8 +313,6 @@ def _mock_etl_parsing(monkeypatch):
     the actual services would, so tests covering failure paths keep working.
     """
 
-    _MOCK_MARKDOWN = "# Mocked Document\n\nThis is mocked ETL content."
-
     def _reject_empty(file_path: str) -> None:
         if os.path.getsize(file_path) == 0:
             raise RuntimeError(f"Cannot parse empty file: {file_path}")
@@ -324,7 +325,7 @@ def _mock_etl_parsing(monkeypatch):
 
     class _FakeLlamaParseResult:
         async def aget_markdown_documents(self, *, split_by_page=False):
-            return [_FakeMarkdownDoc(_MOCK_MARKDOWN)]
+            return [_FakeMarkdownDoc(_MOCK_ETL_MARKDOWN)]
 
     async def _fake_llamacloud_parse(**kwargs):
         _reject_empty(kwargs["file_path"])
@@ -339,7 +340,7 @@ def _mock_etl_parsing(monkeypatch):
 
     async def _fake_docling_parse(file_path: str, filename: str):
         _reject_empty(file_path)
-        return _MOCK_MARKDOWN
+        return _MOCK_ETL_MARKDOWN
 
     monkeypatch.setattr(
         "app.tasks.document_processors.file_processors.parse_with_docling",
@@ -347,10 +348,12 @@ def _mock_etl_parsing(monkeypatch):
     )
 
     class _FakeDoclingResult:
-        class document:
+        class Document:
             @staticmethod
             def export_to_markdown():
-                return _MOCK_MARKDOWN
+                return _MOCK_ETL_MARKDOWN
+
+        document = Document()
 
     class _FakeDocumentConverter:
         def convert(self, file_path):
diff --git a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
index 4d9bda7ee..000f43aa8 100644
--- a/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
+++ b/surfsense_backend/tests/integration/indexing_pipeline/test_local_folder_pipeline.py
@@ -1015,7 +1015,7 @@ class TestPageLimits:
 
         (tmp_path / "note.md").write_text("# Hello World\n\nContent here.")
 
-        count, _skipped, _root_folder_id, err = await index_local_folder(
+        count, _skipped, _root_folder_id, _err = await index_local_folder(
             session=db_session,
             search_space_id=db_search_space.id,
             user_id=str(db_user.id),
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py b/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
index 1c93965f3..b31a9557f 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
@@ -58,10 +58,14 @@ class TestEstimatePagesFromMetadata:
             assert PageLimitService.estimate_pages_from_metadata(ext, 5_000_000) == 1
 
     def test_audio_uses_1mb_per_page(self):
-        assert PageLimitService.estimate_pages_from_metadata(".mp3", 3 * 1024 * 1024) == 3
+        assert (
+            PageLimitService.estimate_pages_from_metadata(".mp3", 3 * 1024 * 1024) == 3
+        )
 
     def test_video_uses_5mb_per_page(self):
-        assert PageLimitService.estimate_pages_from_metadata(".mp4", 15 * 1024 * 1024) == 3
+        assert (
+            PageLimitService.estimate_pages_from_metadata(".mp4", 15 * 1024 * 1024) == 3
+        )
 
     def test_unknown_ext_uses_80kb_per_page(self):
         assert PageLimitService.estimate_pages_from_metadata(".xyz", 160 * 1024) == 2
@@ -189,7 +193,8 @@ async def test_gdrive_files_within_quota_are_downloaded(gdrive_selected_mocks):
 
     for fid in ("f1", "f2", "f3"):
         m["get_file_results"][fid] = (
-            _make_gdrive_file(fid, f"{fid}.xyz", size=80 * 1024), None,
+            _make_gdrive_file(fid, f"{fid}.xyz", size=80 * 1024),
+            None,
         )
     m["download_and_index_mock"].return_value = (3, 0)
 
@@ -210,7 +215,8 @@ async def test_gdrive_files_exceeding_quota_rejected(gdrive_selected_mocks):
     m["fake_user"].pages_limit = 100
 
     m["get_file_results"]["big"] = (
-        _make_gdrive_file("big", "huge.pdf", size=500 * 1024), None,
+        _make_gdrive_file("big", "huge.pdf", size=500 * 1024),
+        None,
     )
 
     indexed, _skipped, errors = await _run_gdrive_selected(m, [("big", "huge.pdf")])
@@ -228,7 +234,8 @@ async def test_gdrive_quota_mix_partial_indexing(gdrive_selected_mocks):
 
     for fid in ("f1", "f2", "f3"):
         m["get_file_results"][fid] = (
-            _make_gdrive_file(fid, f"{fid}.xyz", size=80 * 1024), None,
+            _make_gdrive_file(fid, f"{fid}.xyz", size=80 * 1024),
+            None,
         )
     m["download_and_index_mock"].return_value = (2, 0)
 
@@ -250,7 +257,8 @@ async def test_gdrive_proportional_page_deduction(gdrive_selected_mocks):
 
     for fid in ("f1", "f2", "f3", "f4"):
         m["get_file_results"][fid] = (
-            _make_gdrive_file(fid, f"{fid}.xyz", size=80 * 1024), None,
+            _make_gdrive_file(fid, f"{fid}.xyz", size=80 * 1024),
+            None,
         )
     m["download_and_index_mock"].return_value = (2, 2)
 
@@ -269,7 +277,8 @@ async def test_gdrive_no_deduction_when_nothing_indexed(gdrive_selected_mocks):
     m["fake_user"].pages_limit = 100
 
     m["get_file_results"]["f1"] = (
-        _make_gdrive_file("f1", "f1.xyz", size=80 * 1024), None,
+        _make_gdrive_file("f1", "f1.xyz", size=80 * 1024),
+        None,
     )
     m["download_and_index_mock"].return_value = (0, 1)
 
@@ -286,7 +295,8 @@ async def test_gdrive_zero_quota_rejects_all(gdrive_selected_mocks):
 
     for fid in ("f1", "f2"):
         m["get_file_results"][fid] = (
-            _make_gdrive_file(fid, f"{fid}.xyz", size=80 * 1024), None,
+            _make_gdrive_file(fid, f"{fid}.xyz", size=80 * 1024),
+            None,
         )
 
     indexed, _skipped, errors = await _run_gdrive_selected(
@@ -367,7 +377,8 @@ async def test_gdrive_full_scan_skips_over_quota(gdrive_full_scan_mocks, monkeyp
         _make_gdrive_file(f"f{i}", f"file{i}.xyz", size=80 * 1024) for i in range(5)
     ]
     monkeypatch.setattr(
-        m["mod"], "get_files_in_folder",
+        m["mod"],
+        "get_files_in_folder",
         AsyncMock(return_value=(page_files, None, None)),
     )
     m["download_mock"].return_value = ([], 0)
@@ -391,7 +402,8 @@ async def test_gdrive_full_scan_deducts_after_indexing(
         _make_gdrive_file(f"f{i}", f"file{i}.xyz", size=80 * 1024) for i in range(3)
     ]
     monkeypatch.setattr(
-        m["mod"], "get_files_in_folder",
+        m["mod"],
+        "get_files_in_folder",
         AsyncMock(return_value=(page_files, None, None)),
     )
     mock_docs = [MagicMock() for _ in range(3)]
@@ -421,7 +433,8 @@ async def test_gdrive_delta_sync_skips_over_quota(monkeypatch):
         for i in range(5)
     ]
     monkeypatch.setattr(
-        _mod, "fetch_all_changes",
+        _mod,
+        "fetch_all_changes",
         AsyncMock(return_value=(changes, "new-token", None)),
     )
     monkeypatch.setattr(_mod, "categorize_change", lambda change: "modified")
@@ -447,11 +460,18 @@ async def test_gdrive_delta_sync_skips_over_quota(monkeypatch):
     mock_task_logger.log_task_progress = AsyncMock()
 
     _indexed, skipped = await _mod._index_with_delta_sync(
-        MagicMock(), session, MagicMock(),
-        _CONNECTOR_ID, _SEARCH_SPACE_ID, _USER_ID,
-        "folder-root", "start-token",
-        mock_task_logger, MagicMock(),
-        max_files=500, enable_summary=True,
+        MagicMock(),
+        session,
+        MagicMock(),
+        _CONNECTOR_ID,
+        _SEARCH_SPACE_ID,
+        _USER_ID,
+        "folder-root",
+        "start-token",
+        mock_task_logger,
+        MagicMock(),
+        max_files=500,
+        enable_summary=True,
     )
 
     call_files = download_mock.call_args[0][1]
@@ -511,9 +531,13 @@ async def _run_onedrive_selected(mocks, file_ids):
     from app.tasks.connector_indexers.onedrive_indexer import _index_selected_files
 
     return await _index_selected_files(
-        MagicMock(), mocks["session"], file_ids,
-        connector_id=_CONNECTOR_ID, search_space_id=_SEARCH_SPACE_ID,
-        user_id=_USER_ID, enable_summary=True,
+        MagicMock(),
+        mocks["session"],
+        file_ids,
+        connector_id=_CONNECTOR_ID,
+        search_space_id=_SEARCH_SPACE_ID,
+        user_id=_USER_ID,
+        enable_summary=True,
     )
 
 
@@ -524,7 +548,8 @@ async def test_onedrive_over_quota_rejected(onedrive_selected_mocks):
     m["fake_user"].pages_limit = 100
 
     m["get_file_results"]["big"] = (
-        _make_onedrive_file("big", "huge.pdf", size=500 * 1024), None,
+        _make_onedrive_file("big", "huge.pdf", size=500 * 1024),
+        None,
     )
 
     indexed, _skipped, errors = await _run_onedrive_selected(m, [("big", "huge.pdf")])
@@ -542,7 +567,8 @@ async def test_onedrive_deducts_after_success(onedrive_selected_mocks):
 
     for fid in ("f1", "f2"):
         m["get_file_results"][fid] = (
-            _make_onedrive_file(fid, f"{fid}.xyz", size=80 * 1024), None,
+            _make_onedrive_file(fid, f"{fid}.xyz", size=80 * 1024),
+            None,
         )
     m["download_and_index_mock"].return_value = (2, 0)
 
@@ -605,9 +631,13 @@ async def _run_dropbox_selected(mocks, file_paths):
     from app.tasks.connector_indexers.dropbox_indexer import _index_selected_files
 
     return await _index_selected_files(
-        MagicMock(), mocks["session"], file_paths,
-        connector_id=_CONNECTOR_ID, search_space_id=_SEARCH_SPACE_ID,
-        user_id=_USER_ID, enable_summary=True,
+        MagicMock(),
+        mocks["session"],
+        file_paths,
+        connector_id=_CONNECTOR_ID,
+        search_space_id=_SEARCH_SPACE_ID,
+        user_id=_USER_ID,
+        enable_summary=True,
     )
 
 
@@ -618,7 +648,8 @@ async def test_dropbox_over_quota_rejected(dropbox_selected_mocks):
     m["fake_user"].pages_limit = 100
 
     m["get_file_results"]["/huge.pdf"] = (
-        _make_dropbox_file("/huge.pdf", "huge.pdf", size=500 * 1024), None,
+        _make_dropbox_file("/huge.pdf", "huge.pdf", size=500 * 1024),
+        None,
     )
 
     indexed, _skipped, errors = await _run_dropbox_selected(
@@ -639,7 +670,8 @@ async def test_dropbox_deducts_after_success(dropbox_selected_mocks):
     for name in ("f1.xyz", "f2.xyz"):
         path = f"/{name}"
         m["get_file_results"][path] = (
-            _make_dropbox_file(path, name, size=80 * 1024), None,
+            _make_dropbox_file(path, name, size=80 * 1024),
+            None,
         )
     m["download_and_index_mock"].return_value = (2, 0)
 

From 09008c8f1a6ed963bcac17957ce14c8b3bc569e3 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sat, 4 Apr 2026 03:26:22 +0530
Subject: [PATCH 111/202] refactor: remove redundant authenticatedFetch calls
 in editor panel components

---
 surfsense_web/components/editor-panel/editor-panel.tsx         | 3 ---
 surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx | 3 ---
 2 files changed, 6 deletions(-)

diff --git a/surfsense_web/components/editor-panel/editor-panel.tsx b/surfsense_web/components/editor-panel/editor-panel.tsx
index 248fe68eb..c307b3cea 100644
--- a/surfsense_web/components/editor-panel/editor-panel.tsx
+++ b/surfsense_web/components/editor-panel/editor-panel.tsx
@@ -96,9 +96,6 @@ export function EditorPanelContent({
 			}
 
 			try {
-				const response = await authenticatedFetch(
-					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`,
-					{ method: "GET", signal: controller.signal }
 				const url = new URL(
 					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`
 				);
diff --git a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
index d2ce3cc64..97c5b7cd9 100644
--- a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
+++ b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
@@ -81,9 +81,6 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 			}
 
 			try {
-				const response = await authenticatedFetch(
-					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`,
-					{ method: "GET", signal: controller.signal }
 				const url = new URL(
 					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`
 				);

From 8e6b1c77eafbbb54c69ccefaf26aa017cb8e2e50 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sat, 4 Apr 2026 03:35:34 +0530
Subject: [PATCH 112/202] feat: implement PKCE support in native Google OAuth
 flows

- Added `generate_code_verifier` function to create a PKCE code verifier for enhanced security.
- Updated Google Calendar, Drive, and Gmail connector routes to utilize the PKCE code verifier during OAuth authorization.
- Modified state management to include the code verifier for secure state generation and validation.
---
 .../google_calendar_add_connector_route.py    | 18 ++++++++++----
 .../google_drive_add_connector_route.py       | 24 +++++++++++++------
 .../google_gmail_add_connector_route.py       | 18 ++++++++++----
 surfsense_backend/app/utils/oauth_security.py | 10 ++++++++
 4 files changed, 55 insertions(+), 15 deletions(-)

diff --git a/surfsense_backend/app/routes/google_calendar_add_connector_route.py b/surfsense_backend/app/routes/google_calendar_add_connector_route.py
index 9a2308bec..725f8decc 100644
--- a/surfsense_backend/app/routes/google_calendar_add_connector_route.py
+++ b/surfsense_backend/app/routes/google_calendar_add_connector_route.py
@@ -28,7 +28,7 @@ from app.utils.connector_naming import (
     check_duplicate_connector,
     generate_unique_connector_name,
 )
-from app.utils.oauth_security import OAuthStateManager, TokenEncryption
+from app.utils.oauth_security import OAuthStateManager, TokenEncryption, generate_code_verifier
 
 logger = logging.getLogger(__name__)
 
@@ -96,9 +96,14 @@ async def connect_calendar(space_id: int, user: User = Depends(current_active_us
 
         flow = get_google_flow()
 
-        # Generate secure state parameter with HMAC signature
+        code_verifier = generate_code_verifier()
+        flow.code_verifier = code_verifier
+
+        # Generate secure state parameter with HMAC signature (includes PKCE code_verifier)
         state_manager = get_state_manager()
-        state_encoded = state_manager.generate_secure_state(space_id, user.id)
+        state_encoded = state_manager.generate_secure_state(
+            space_id, user.id, code_verifier=code_verifier
+        )
 
         auth_url, _ = flow.authorization_url(
             access_type="offline",
@@ -146,8 +151,11 @@ async def reauth_calendar(
 
         flow = get_google_flow()
 
+        code_verifier = generate_code_verifier()
+        flow.code_verifier = code_verifier
+
         state_manager = get_state_manager()
-        extra: dict = {"connector_id": connector_id}
+        extra: dict = {"connector_id": connector_id, "code_verifier": code_verifier}
         if return_url and return_url.startswith("/"):
             extra["return_url"] = return_url
         state_encoded = state_manager.generate_secure_state(space_id, user.id, **extra)
@@ -225,6 +233,7 @@ async def calendar_callback(
 
         user_id = UUID(data["user_id"])
         space_id = data["space_id"]
+        code_verifier = data.get("code_verifier")
 
         # Validate redirect URI (security: ensure it matches configured value)
         if not config.GOOGLE_CALENDAR_REDIRECT_URI:
@@ -233,6 +242,7 @@ async def calendar_callback(
             )
 
         flow = get_google_flow()
+        flow.code_verifier = code_verifier
         flow.fetch_token(code=code)
 
         creds = flow.credentials
diff --git a/surfsense_backend/app/routes/google_drive_add_connector_route.py b/surfsense_backend/app/routes/google_drive_add_connector_route.py
index 1c9391610..921f84af9 100644
--- a/surfsense_backend/app/routes/google_drive_add_connector_route.py
+++ b/surfsense_backend/app/routes/google_drive_add_connector_route.py
@@ -41,7 +41,7 @@ from app.utils.connector_naming import (
     check_duplicate_connector,
     generate_unique_connector_name,
 )
-from app.utils.oauth_security import OAuthStateManager, TokenEncryption
+from app.utils.oauth_security import OAuthStateManager, TokenEncryption, generate_code_verifier
 
 # Relax token scope validation for Google OAuth
 os.environ["OAUTHLIB_RELAX_TOKEN_SCOPE"] = "1"
@@ -127,14 +127,19 @@ async def connect_drive(space_id: int, user: User = Depends(current_active_user)
 
         flow = get_google_flow()
 
-        # Generate secure state parameter with HMAC signature
+        code_verifier = generate_code_verifier()
+        flow.code_verifier = code_verifier
+
+        # Generate secure state parameter with HMAC signature (includes PKCE code_verifier)
         state_manager = get_state_manager()
-        state_encoded = state_manager.generate_secure_state(space_id, user.id)
+        state_encoded = state_manager.generate_secure_state(
+            space_id, user.id, code_verifier=code_verifier
+        )
 
         # Generate authorization URL
         auth_url, _ = flow.authorization_url(
-            access_type="offline",  # Get refresh token
-            prompt="consent",  # Force consent screen to get refresh token
+            access_type="offline",
+            prompt="consent",
             include_granted_scopes="true",
             state=state_encoded,
         )
@@ -193,8 +198,11 @@ async def reauth_drive(
 
         flow = get_google_flow()
 
+        code_verifier = generate_code_verifier()
+        flow.code_verifier = code_verifier
+
         state_manager = get_state_manager()
-        extra: dict = {"connector_id": connector_id}
+        extra: dict = {"connector_id": connector_id, "code_verifier": code_verifier}
         if return_url and return_url.startswith("/"):
             extra["return_url"] = return_url
         state_encoded = state_manager.generate_secure_state(space_id, user.id, **extra)
@@ -285,6 +293,7 @@ async def drive_callback(
         space_id = data["space_id"]
         reauth_connector_id = data.get("connector_id")
         reauth_return_url = data.get("return_url")
+        code_verifier = data.get("code_verifier")
 
         logger.info(
             f"Processing Google Drive callback for user {user_id}, space {space_id}"
@@ -296,8 +305,9 @@ async def drive_callback(
                 status_code=500, detail="GOOGLE_DRIVE_REDIRECT_URI not configured"
             )
 
-        # Exchange authorization code for tokens
+        # Exchange authorization code for tokens (restore PKCE code_verifier from state)
         flow = get_google_flow()
+        flow.code_verifier = code_verifier
         flow.fetch_token(code=code)
 
         creds = flow.credentials
diff --git a/surfsense_backend/app/routes/google_gmail_add_connector_route.py b/surfsense_backend/app/routes/google_gmail_add_connector_route.py
index 750a64819..9fe0c0de6 100644
--- a/surfsense_backend/app/routes/google_gmail_add_connector_route.py
+++ b/surfsense_backend/app/routes/google_gmail_add_connector_route.py
@@ -28,7 +28,7 @@ from app.utils.connector_naming import (
     check_duplicate_connector,
     generate_unique_connector_name,
 )
-from app.utils.oauth_security import OAuthStateManager, TokenEncryption
+from app.utils.oauth_security import OAuthStateManager, TokenEncryption, generate_code_verifier
 
 logger = logging.getLogger(__name__)
 
@@ -109,9 +109,14 @@ async def connect_gmail(space_id: int, user: User = Depends(current_active_user)
 
         flow = get_google_flow()
 
-        # Generate secure state parameter with HMAC signature
+        code_verifier = generate_code_verifier()
+        flow.code_verifier = code_verifier
+
+        # Generate secure state parameter with HMAC signature (includes PKCE code_verifier)
         state_manager = get_state_manager()
-        state_encoded = state_manager.generate_secure_state(space_id, user.id)
+        state_encoded = state_manager.generate_secure_state(
+            space_id, user.id, code_verifier=code_verifier
+        )
 
         auth_url, _ = flow.authorization_url(
             access_type="offline",
@@ -164,8 +169,11 @@ async def reauth_gmail(
 
         flow = get_google_flow()
 
+        code_verifier = generate_code_verifier()
+        flow.code_verifier = code_verifier
+
         state_manager = get_state_manager()
-        extra: dict = {"connector_id": connector_id}
+        extra: dict = {"connector_id": connector_id, "code_verifier": code_verifier}
         if return_url and return_url.startswith("/"):
             extra["return_url"] = return_url
         state_encoded = state_manager.generate_secure_state(space_id, user.id, **extra)
@@ -256,6 +264,7 @@ async def gmail_callback(
 
         user_id = UUID(data["user_id"])
         space_id = data["space_id"]
+        code_verifier = data.get("code_verifier")
 
         # Validate redirect URI (security: ensure it matches configured value)
         if not config.GOOGLE_GMAIL_REDIRECT_URI:
@@ -264,6 +273,7 @@ async def gmail_callback(
             )
 
         flow = get_google_flow()
+        flow.code_verifier = code_verifier
         flow.fetch_token(code=code)
 
         creds = flow.credentials
diff --git a/surfsense_backend/app/utils/oauth_security.py b/surfsense_backend/app/utils/oauth_security.py
index 5135cdef4..0ad9d3bd9 100644
--- a/surfsense_backend/app/utils/oauth_security.py
+++ b/surfsense_backend/app/utils/oauth_security.py
@@ -11,6 +11,8 @@ import hmac
 import json
 import logging
 import time
+from random import SystemRandom
+from string import ascii_letters, digits
 from uuid import UUID
 
 from cryptography.fernet import Fernet
@@ -18,6 +20,14 @@ from fastapi import HTTPException
 
 logger = logging.getLogger(__name__)
 
+_PKCE_CHARS = ascii_letters + digits + "-._~"
+_PKCE_RNG = SystemRandom()
+
+
+def generate_code_verifier(length: int = 128) -> str:
+    """Generate a PKCE code_verifier (RFC 7636, 43-128 unreserved chars)."""
+    return "".join(_PKCE_RNG.choice(_PKCE_CHARS) for _ in range(length))
+
 
 class OAuthStateManager:
     """Manages secure OAuth state parameters with HMAC signatures."""

From e814540727bbc457bef59e5a6b63f3a2aec2f957 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sat, 4 Apr 2026 03:36:54 +0530
Subject: [PATCH 113/202] refactor: move PKCE pair generation for airtable

- Removed the `generate_pkce_pair` function from `airtable_add_connector_route.py` and relocated it to `oauth_security.py` for better organization.
- Updated imports in `airtable_add_connector_route.py` to reflect the new location of the PKCE generation function.
---
 .../routes/airtable_add_connector_route.py    | 26 +------------------
 surfsense_backend/app/utils/oauth_security.py | 11 ++++++++
 2 files changed, 12 insertions(+), 25 deletions(-)

diff --git a/surfsense_backend/app/routes/airtable_add_connector_route.py b/surfsense_backend/app/routes/airtable_add_connector_route.py
index fe359d2f3..d2d25d006 100644
--- a/surfsense_backend/app/routes/airtable_add_connector_route.py
+++ b/surfsense_backend/app/routes/airtable_add_connector_route.py
@@ -1,7 +1,5 @@
 import base64
-import hashlib
 import logging
-import secrets
 from datetime import UTC, datetime, timedelta
 from uuid import UUID
 
@@ -26,7 +24,7 @@ from app.utils.connector_naming import (
     check_duplicate_connector,
     generate_unique_connector_name,
 )
-from app.utils.oauth_security import OAuthStateManager, TokenEncryption
+from app.utils.oauth_security import OAuthStateManager, TokenEncryption, generate_pkce_pair
 
 logger = logging.getLogger(__name__)
 
@@ -75,28 +73,6 @@ def make_basic_auth_header(client_id: str, client_secret: str) -> str:
     return f"Basic {b64}"
 
 
-def generate_pkce_pair() -> tuple[str, str]:
-    """
-    Generate PKCE code verifier and code challenge.
-
-    Returns:
-        Tuple of (code_verifier, code_challenge)
-    """
-    # Generate code verifier (43-128 characters)
-    code_verifier = (
-        base64.urlsafe_b64encode(secrets.token_bytes(32)).decode("utf-8").rstrip("=")
-    )
-
-    # Generate code challenge (SHA256 hash of verifier, base64url encoded)
-    code_challenge = (
-        base64.urlsafe_b64encode(hashlib.sha256(code_verifier.encode("utf-8")).digest())
-        .decode("utf-8")
-        .rstrip("=")
-    )
-
-    return code_verifier, code_challenge
-
-
 @router.get("/auth/airtable/connector/add")
 async def connect_airtable(space_id: int, user: User = Depends(current_active_user)):
     """
diff --git a/surfsense_backend/app/utils/oauth_security.py b/surfsense_backend/app/utils/oauth_security.py
index 0ad9d3bd9..c39b1e9b1 100644
--- a/surfsense_backend/app/utils/oauth_security.py
+++ b/surfsense_backend/app/utils/oauth_security.py
@@ -29,6 +29,17 @@ def generate_code_verifier(length: int = 128) -> str:
     return "".join(_PKCE_RNG.choice(_PKCE_CHARS) for _ in range(length))
 
 
+def generate_pkce_pair(length: int = 128) -> tuple[str, str]:
+    """Generate a PKCE code_verifier and its S256 code_challenge."""
+    verifier = generate_code_verifier(length)
+    challenge = (
+        base64.urlsafe_b64encode(hashlib.sha256(verifier.encode()).digest())
+        .decode()
+        .rstrip("=")
+    )
+    return verifier, challenge
+
+
 class OAuthStateManager:
     """Manages secure OAuth state parameters with HMAC signatures."""
 

From 82d4d3e27234fb876701a35f22b15c99e5608b15 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sat, 4 Apr 2026 03:37:33 +0530
Subject: [PATCH 114/202] chore: ran linting

---
 .../app/routes/airtable_add_connector_route.py              | 6 +++++-
 .../app/routes/google_calendar_add_connector_route.py       | 6 +++++-
 .../app/routes/google_drive_add_connector_route.py          | 6 +++++-
 .../app/routes/google_gmail_add_connector_route.py          | 6 +++++-
 4 files changed, 20 insertions(+), 4 deletions(-)

diff --git a/surfsense_backend/app/routes/airtable_add_connector_route.py b/surfsense_backend/app/routes/airtable_add_connector_route.py
index d2d25d006..1e0b1eb5d 100644
--- a/surfsense_backend/app/routes/airtable_add_connector_route.py
+++ b/surfsense_backend/app/routes/airtable_add_connector_route.py
@@ -24,7 +24,11 @@ from app.utils.connector_naming import (
     check_duplicate_connector,
     generate_unique_connector_name,
 )
-from app.utils.oauth_security import OAuthStateManager, TokenEncryption, generate_pkce_pair
+from app.utils.oauth_security import (
+    OAuthStateManager,
+    TokenEncryption,
+    generate_pkce_pair,
+)
 
 logger = logging.getLogger(__name__)
 
diff --git a/surfsense_backend/app/routes/google_calendar_add_connector_route.py b/surfsense_backend/app/routes/google_calendar_add_connector_route.py
index 725f8decc..d7ccf62ca 100644
--- a/surfsense_backend/app/routes/google_calendar_add_connector_route.py
+++ b/surfsense_backend/app/routes/google_calendar_add_connector_route.py
@@ -28,7 +28,11 @@ from app.utils.connector_naming import (
     check_duplicate_connector,
     generate_unique_connector_name,
 )
-from app.utils.oauth_security import OAuthStateManager, TokenEncryption, generate_code_verifier
+from app.utils.oauth_security import (
+    OAuthStateManager,
+    TokenEncryption,
+    generate_code_verifier,
+)
 
 logger = logging.getLogger(__name__)
 
diff --git a/surfsense_backend/app/routes/google_drive_add_connector_route.py b/surfsense_backend/app/routes/google_drive_add_connector_route.py
index 921f84af9..8706326b7 100644
--- a/surfsense_backend/app/routes/google_drive_add_connector_route.py
+++ b/surfsense_backend/app/routes/google_drive_add_connector_route.py
@@ -41,7 +41,11 @@ from app.utils.connector_naming import (
     check_duplicate_connector,
     generate_unique_connector_name,
 )
-from app.utils.oauth_security import OAuthStateManager, TokenEncryption, generate_code_verifier
+from app.utils.oauth_security import (
+    OAuthStateManager,
+    TokenEncryption,
+    generate_code_verifier,
+)
 
 # Relax token scope validation for Google OAuth
 os.environ["OAUTHLIB_RELAX_TOKEN_SCOPE"] = "1"
diff --git a/surfsense_backend/app/routes/google_gmail_add_connector_route.py b/surfsense_backend/app/routes/google_gmail_add_connector_route.py
index 9fe0c0de6..dd8feb1c7 100644
--- a/surfsense_backend/app/routes/google_gmail_add_connector_route.py
+++ b/surfsense_backend/app/routes/google_gmail_add_connector_route.py
@@ -28,7 +28,11 @@ from app.utils.connector_naming import (
     check_duplicate_connector,
     generate_unique_connector_name,
 )
-from app.utils.oauth_security import OAuthStateManager, TokenEncryption, generate_code_verifier
+from app.utils.oauth_security import (
+    OAuthStateManager,
+    TokenEncryption,
+    generate_code_verifier,
+)
 
 logger = logging.getLogger(__name__)
 

From 46e8134b23ec5bb56dce475811437a283bcaec47 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Sat, 4 Apr 2026 08:40:55 +0200
Subject: [PATCH 115/202] catch non-vision model errors with actionable user
 message

---
 .../app/services/vision_autocomplete_service.py      | 12 ++++++++++--
 surfsense_web/app/desktop/suggestion/page.tsx        |  2 ++
 2 files changed, 12 insertions(+), 2 deletions(-)

diff --git a/surfsense_backend/app/services/vision_autocomplete_service.py b/surfsense_backend/app/services/vision_autocomplete_service.py
index 0804df7fb..e172c6522 100644
--- a/surfsense_backend/app/services/vision_autocomplete_service.py
+++ b/surfsense_backend/app/services/vision_autocomplete_service.py
@@ -186,6 +186,14 @@ async def stream_vision_autocomplete(
         yield streaming.format_done()
 
     except Exception as e:
-        logger.error(f"Vision autocomplete streaming error: {e}")
-        yield streaming.format_error(str(e))
+        error_str = str(e).lower()
+        if "content must be a string" in error_str or "does not support image" in error_str:
+            logger.warning(f"Vision autocomplete: selected model does not support vision: {e}")
+            yield streaming.format_error(
+                "The selected model does not support vision. "
+                "Please set a vision-capable model (e.g. GPT-4o, Gemini) in your search space settings."
+            )
+        else:
+            logger.error(f"Vision autocomplete streaming error: {e}")
+            yield streaming.format_error(str(e))
         yield streaming.format_done()
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index b7d9b97bd..7188b73c6 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -24,6 +24,8 @@ function friendlyError(raw: string | number): string {
 		return "Please sign in to use suggestions.";
 	if (lower.includes("no vision llm configured") || lower.includes("no llm configured"))
 		return "No Vision LLM configured. Set one in search space settings.";
+	if (lower.includes("does not support vision"))
+		return "Selected model doesn\u2019t support vision. Set a vision-capable model in settings.";
 	if (lower.includes("fetch") || lower.includes("network") || lower.includes("econnrefused"))
 		return "Can\u2019t reach the server. Check your connection.";
 	return "Something went wrong. Try again.";

From 18103417bb10751c1b55b745bcd711596191dede Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Sat, 4 Apr 2026 08:57:09 +0200
Subject: [PATCH 116/202] fix: harden autocomplete endpoint security and error
 handling

---
 .../app/routes/autocomplete_routes.py         | 11 +++--
 .../services/vision_autocomplete_service.py   | 46 +++++++++++++++----
 surfsense_web/app/desktop/suggestion/page.tsx | 18 ++++++++
 .../app/desktop/suggestion/suggestion.css     |  3 +-
 4 files changed, 64 insertions(+), 14 deletions(-)

diff --git a/surfsense_backend/app/routes/autocomplete_routes.py b/surfsense_backend/app/routes/autocomplete_routes.py
index a6f66f408..bb56709cb 100644
--- a/surfsense_backend/app/routes/autocomplete_routes.py
+++ b/surfsense_backend/app/routes/autocomplete_routes.py
@@ -1,18 +1,21 @@
-from fastapi import APIRouter, Depends
+from fastapi import APIRouter, Depends, HTTPException
 from fastapi.responses import StreamingResponse
-from pydantic import BaseModel
+from pydantic import BaseModel, Field
 from sqlalchemy.ext.asyncio import AsyncSession
 
 from app.db import User, get_async_session
 from app.services.new_streaming_service import VercelStreamingService
 from app.services.vision_autocomplete_service import stream_vision_autocomplete
 from app.users import current_active_user
+from app.utils.rbac import check_search_space_access
 
 router = APIRouter(prefix="/autocomplete", tags=["autocomplete"])
 
+MAX_SCREENSHOT_SIZE = 20 * 1024 * 1024  # 20 MB base64 ceiling
+
 
 class VisionAutocompleteRequest(BaseModel):
-    screenshot: str
+    screenshot: str = Field(..., max_length=MAX_SCREENSHOT_SIZE)
     search_space_id: int
     app_name: str = ""
     window_title: str = ""
@@ -24,6 +27,8 @@ async def vision_autocomplete_stream(
     user: User = Depends(current_active_user),
     session: AsyncSession = Depends(get_async_session),
 ):
+    await check_search_space_access(session, user, body.search_space_id)
+
     return StreamingResponse(
         stream_vision_autocomplete(
             body.screenshot, body.search_space_id, session,
diff --git a/surfsense_backend/app/services/vision_autocomplete_service.py b/surfsense_backend/app/services/vision_autocomplete_service.py
index e172c6522..2ddb56f51 100644
--- a/surfsense_backend/app/services/vision_autocomplete_service.py
+++ b/surfsense_backend/app/services/vision_autocomplete_service.py
@@ -61,11 +61,21 @@ def _build_system_prompt(app_name: str, window_title: str, kb_context: str) -> s
     return prompt
 
 
+def _is_vision_unsupported_error(e: Exception) -> bool:
+    """Check if an exception indicates the model doesn't support vision/images."""
+    msg = str(e).lower()
+    return "content must be a string" in msg or "does not support image" in msg
+
+
 async def _extract_query_from_screenshot(
     llm, screenshot_data_url: str,
     app_name: str = "", window_title: str = "",
 ) -> str | None:
-    """Ask the Vision LLM to describe what the user is working on."""
+    """Ask the Vision LLM to describe what the user is working on.
+
+    Raises vision-unsupported errors so the caller can return a
+    friendly message immediately instead of retrying with astream.
+    """
     if app_name:
         prompt_text = EXTRACT_QUERY_PROMPT_WITH_APP.format(
             app_name=app_name, window_title=window_title,
@@ -83,6 +93,8 @@ async def _extract_query_from_screenshot(
         query = response.content.strip() if hasattr(response, "content") else ""
         return query if query else None
     except Exception as e:
+        if _is_vision_unsupported_error(e):
+            raise
         logger.warning(f"Failed to extract query from screenshot: {e}")
         return None
 
@@ -140,6 +152,10 @@ async def stream_vision_autocomplete(
     3. Stream the final completion with screenshot + KB + app context
     """
     streaming = VercelStreamingService()
+    vision_error_msg = (
+        "The selected model does not support vision. "
+        "Please set a vision-capable model (e.g. GPT-4o, Gemini) in your search space settings."
+    )
 
     llm = await get_vision_llm(session, search_space_id)
     if not llm:
@@ -149,9 +165,17 @@ async def stream_vision_autocomplete(
         return
 
     kb_context = ""
-    query = await _extract_query_from_screenshot(
-        llm, screenshot_data_url, app_name=app_name, window_title=window_title,
-    )
+    try:
+        query = await _extract_query_from_screenshot(
+            llm, screenshot_data_url, app_name=app_name, window_title=window_title,
+        )
+    except Exception as e:
+        logger.warning(f"Vision autocomplete: selected model does not support vision: {e}")
+        yield streaming.format_message_start()
+        yield streaming.format_error(vision_error_msg)
+        yield streaming.format_done()
+        return
+
     if query:
         kb_context = await _search_knowledge_base(session, search_space_id, query)
 
@@ -171,10 +195,13 @@ async def stream_vision_autocomplete(
         ]),
     ]
 
+    text_started = False
+    text_id = ""
     try:
         yield streaming.format_message_start()
         text_id = streaming.generate_text_id()
         yield streaming.format_text_start(text_id)
+        text_started = True
 
         async for chunk in llm.astream(messages):
             token = chunk.content if hasattr(chunk, "content") else str(chunk)
@@ -186,13 +213,12 @@ async def stream_vision_autocomplete(
         yield streaming.format_done()
 
     except Exception as e:
-        error_str = str(e).lower()
-        if "content must be a string" in error_str or "does not support image" in error_str:
+        if text_started:
+            yield streaming.format_text_end(text_id)
+
+        if _is_vision_unsupported_error(e):
             logger.warning(f"Vision autocomplete: selected model does not support vision: {e}")
-            yield streaming.format_error(
-                "The selected model does not support vision. "
-                "Please set a vision-capable model (e.g. GPT-4o, Gemini) in your search space settings."
-            )
+            yield streaming.format_error(vision_error_msg)
         else:
             logger.error(f"Vision autocomplete streaming error: {e}")
             yield streaming.format_error(str(e))
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index 7188b73c6..03944867f 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -36,9 +36,17 @@ const AUTO_DISMISS_MS = 3000;
 export default function SuggestionPage() {
 	const [suggestion, setSuggestion] = useState("");
 	const [isLoading, setIsLoading] = useState(true);
+	const [isDesktop, setIsDesktop] = useState(true);
 	const [error, setError] = useState<string | null>(null);
 	const abortRef = useRef<AbortController | null>(null);
 
+	useEffect(() => {
+		if (!window.electronAPI?.onAutocompleteContext) {
+			setIsDesktop(false);
+			setIsLoading(false);
+		}
+	}, []);
+
 	useEffect(() => {
 		if (!error) return;
 		const timer = setTimeout(() => {
@@ -153,6 +161,16 @@ export default function SuggestionPage() {
 		return cleanup;
 	}, [fetchSuggestion]);
 
+	if (!isDesktop) {
+		return (
+			<div className="suggestion-tooltip">
+				<span className="suggestion-error-text">
+					This page is only available in the SurfSense desktop app.
+				</span>
+			</div>
+		);
+	}
+
 	if (error) {
 		return (
 			<div className="suggestion-tooltip suggestion-error">
diff --git a/surfsense_web/app/desktop/suggestion/suggestion.css b/surfsense_web/app/desktop/suggestion/suggestion.css
index 712d12618..62f4d2ea7 100644
--- a/surfsense_web/app/desktop/suggestion/suggestion.css
+++ b/surfsense_web/app/desktop/suggestion/suggestion.css
@@ -1,4 +1,5 @@
-html, body {
+html:has(.suggestion-body),
+body:has(.suggestion-body) {
   margin: 0 !important;
   padding: 0 !important;
   background: transparent !important;

From a180bf5576dc424646ea55a81e37b16c1c84743c Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Sat, 4 Apr 2026 09:39:20 +0200
Subject: [PATCH 117/202] fix merge conflicts

---
 ...=> 119_add_vision_llm_id_to_search_spaces.py} | 10 +++++-----
 .../app/services/vision_autocomplete_service.py  |  4 ++--
 .../src/modules/autocomplete/index.ts            | 16 +++++++++++-----
 .../components/editor-panel/editor-panel.tsx     |  3 ---
 .../layout/ui/tabs/DocumentTabContent.tsx        |  3 ---
 5 files changed, 18 insertions(+), 18 deletions(-)
 rename surfsense_backend/alembic/versions/{117_add_vision_llm_id_to_search_spaces.py => 119_add_vision_llm_id_to_search_spaces.py} (86%)

diff --git a/surfsense_backend/alembic/versions/117_add_vision_llm_id_to_search_spaces.py b/surfsense_backend/alembic/versions/119_add_vision_llm_id_to_search_spaces.py
similarity index 86%
rename from surfsense_backend/alembic/versions/117_add_vision_llm_id_to_search_spaces.py
rename to surfsense_backend/alembic/versions/119_add_vision_llm_id_to_search_spaces.py
index 2bec374c6..8e41d5e67 100644
--- a/surfsense_backend/alembic/versions/117_add_vision_llm_id_to_search_spaces.py
+++ b/surfsense_backend/alembic/versions/119_add_vision_llm_id_to_search_spaces.py
@@ -1,7 +1,7 @@
-"""117_add_vision_llm_id_to_search_spaces
+"""119_add_vision_llm_id_to_search_spaces
 
-Revision ID: 117
-Revises: 116
+Revision ID: 119
+Revises: 118
 
 Adds vision_llm_id column to search_spaces for vision/screenshot analysis
 LLM role assignment. Defaults to 0 (Auto mode), same convention as
@@ -16,8 +16,8 @@ import sqlalchemy as sa
 
 from alembic import op
 
-revision: str = "117"
-down_revision: str | None = "116"
+revision: str = "119"
+down_revision: str | None = "118"
 branch_labels: str | Sequence[str] | None = None
 depends_on: str | Sequence[str] | None = None
 
diff --git a/surfsense_backend/app/services/vision_autocomplete_service.py b/surfsense_backend/app/services/vision_autocomplete_service.py
index 2ddb56f51..f24a5c848 100644
--- a/surfsense_backend/app/services/vision_autocomplete_service.py
+++ b/surfsense_backend/app/services/vision_autocomplete_service.py
@@ -220,6 +220,6 @@ async def stream_vision_autocomplete(
             logger.warning(f"Vision autocomplete: selected model does not support vision: {e}")
             yield streaming.format_error(vision_error_msg)
         else:
-            logger.error(f"Vision autocomplete streaming error: {e}")
-            yield streaming.format_error(str(e))
+            logger.error(f"Vision autocomplete streaming error: {e}", exc_info=True)
+            yield streaming.format_error("Autocomplete failed. Please try again.")
         yield streaming.format_done()
diff --git a/surfsense_desktop/src/modules/autocomplete/index.ts b/surfsense_desktop/src/modules/autocomplete/index.ts
index 0d5073de4..01a4cf913 100644
--- a/surfsense_desktop/src/modules/autocomplete/index.ts
+++ b/surfsense_desktop/src/modules/autocomplete/index.ts
@@ -11,6 +11,7 @@ const SHORTCUT = 'CommandOrControl+Shift+Space';
 let autocompleteEnabled = true;
 let savedClipboard = '';
 let sourceApp = '';
+let lastSearchSpaceId: string | null = null;
 
 function isSurfSenseWindow(): boolean {
   const app = getFrontmostApp();
@@ -36,19 +37,24 @@ async function triggerAutocomplete(): Promise<void> {
     return;
   }
 
-  const cursor = screen.getCursorScreenPoint();
-  const win = createSuggestionWindow(cursor.x, cursor.y);
-
-  let searchSpaceId = '1';
   const mainWin = getMainWindow();
   if (mainWin && !mainWin.isDestroyed()) {
     const mainUrl = mainWin.webContents.getURL();
     const match = mainUrl.match(/\/dashboard\/(\d+)/);
     if (match) {
-      searchSpaceId = match[1];
+      lastSearchSpaceId = match[1];
     }
   }
 
+  if (!lastSearchSpaceId) {
+    console.warn('[autocomplete] No active search space. Open a search space first.');
+    return;
+  }
+
+  const searchSpaceId = lastSearchSpaceId;
+  const cursor = screen.getCursorScreenPoint();
+  const win = createSuggestionWindow(cursor.x, cursor.y);
+
   win.webContents.once('did-finish-load', () => {
     const sw = getSuggestionWindow();
     setTimeout(() => {
diff --git a/surfsense_web/components/editor-panel/editor-panel.tsx b/surfsense_web/components/editor-panel/editor-panel.tsx
index 248fe68eb..c307b3cea 100644
--- a/surfsense_web/components/editor-panel/editor-panel.tsx
+++ b/surfsense_web/components/editor-panel/editor-panel.tsx
@@ -96,9 +96,6 @@ export function EditorPanelContent({
 			}
 
 			try {
-				const response = await authenticatedFetch(
-					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`,
-					{ method: "GET", signal: controller.signal }
 				const url = new URL(
 					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`
 				);
diff --git a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
index d2ce3cc64..97c5b7cd9 100644
--- a/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
+++ b/surfsense_web/components/layout/ui/tabs/DocumentTabContent.tsx
@@ -81,9 +81,6 @@ export function DocumentTabContent({ documentId, searchSpaceId, title }: Documen
 			}
 
 			try {
-				const response = await authenticatedFetch(
-					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`,
-					{ method: "GET", signal: controller.signal }
 				const url = new URL(
 					`${process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL}/api/v1/search-spaces/${searchSpaceId}/documents/${documentId}/editor-content`
 				);

From 6b5b45d08d58e81c5cdadf76fd2f79f0dfe3821e Mon Sep 17 00:00:00 2001
From: Trevin Chow <trevin@trevinchow.com>
Date: Thu, 2 Apr 2026 05:05:04 -0700
Subject: [PATCH 118/202] perf: add passive option to scroll and touch event
 listeners

Browsers wait for scroll/touch listeners to finish to check if
preventDefault() is called, which delays scrolling. Since these
handlers (navbar scroll detection, click-outside detection, and
onboarding tour position updates) never call preventDefault(),
marking them as passive lets the browser scroll without waiting.

Fixes #1053
---
 surfsense_web/components/homepage/navbar.tsx | 4 ++--
 surfsense_web/components/onboarding-tour.tsx | 4 ++--
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/surfsense_web/components/homepage/navbar.tsx b/surfsense_web/components/homepage/navbar.tsx
index 6ed5265bc..ec00de47f 100644
--- a/surfsense_web/components/homepage/navbar.tsx
+++ b/surfsense_web/components/homepage/navbar.tsx
@@ -32,7 +32,7 @@ export const Navbar = ({ scrolledBgClassName }: NavbarProps = {}) => {
 		};
 
 		handleScroll();
-		window.addEventListener("scroll", handleScroll);
+		window.addEventListener("scroll", handleScroll, { passive: true });
 		return () => window.removeEventListener("scroll", handleScroll);
 	}, []);
 
@@ -132,7 +132,7 @@ const MobileNav = ({ navItems, isScrolled, scrolledBgClassName }: any) => {
 		};
 
 		document.addEventListener("mousedown", handleClickOutside);
-		document.addEventListener("touchstart", handleClickOutside);
+		document.addEventListener("touchstart", handleClickOutside, { passive: true });
 		return () => {
 			document.removeEventListener("mousedown", handleClickOutside);
 			document.removeEventListener("touchstart", handleClickOutside);
diff --git a/surfsense_web/components/onboarding-tour.tsx b/surfsense_web/components/onboarding-tour.tsx
index a7d8f108b..178b6c97e 100644
--- a/surfsense_web/components/onboarding-tour.tsx
+++ b/surfsense_web/components/onboarding-tour.tsx
@@ -602,11 +602,11 @@ export function OnboardingTour() {
 		};
 
 		window.addEventListener("resize", handleUpdate);
-		window.addEventListener("scroll", handleUpdate, true);
+		window.addEventListener("scroll", handleUpdate, { capture: true, passive: true });
 
 		return () => {
 			window.removeEventListener("resize", handleUpdate);
-			window.removeEventListener("scroll", handleUpdate, true);
+			window.removeEventListener("scroll", handleUpdate, { capture: true });
 		};
 	}, [isActive, targetEl, currentStep?.placement]);
 

From 5d22349dc102e3e87b42e20a923ad79df1ecae51 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sun, 5 Apr 2026 17:25:25 +0530
Subject: [PATCH 119/202] feat: implement ETL pipeline with file classification
 and extraction services

---
 .../app/etl_pipeline/__init__.py              |  0
 .../app/etl_pipeline/constants.py             | 39 ++++++++++
 .../app/etl_pipeline/etl_document.py          | 21 ++++++
 .../app/etl_pipeline/etl_pipeline_service.py  | 73 +++++++++++++++++++
 .../app/etl_pipeline/exceptions.py            |  6 ++
 .../app/etl_pipeline/file_classifier.py       | 49 +++++++++++++
 6 files changed, 188 insertions(+)
 create mode 100644 surfsense_backend/app/etl_pipeline/__init__.py
 create mode 100644 surfsense_backend/app/etl_pipeline/constants.py
 create mode 100644 surfsense_backend/app/etl_pipeline/etl_document.py
 create mode 100644 surfsense_backend/app/etl_pipeline/etl_pipeline_service.py
 create mode 100644 surfsense_backend/app/etl_pipeline/exceptions.py
 create mode 100644 surfsense_backend/app/etl_pipeline/file_classifier.py

diff --git a/surfsense_backend/app/etl_pipeline/__init__.py b/surfsense_backend/app/etl_pipeline/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/surfsense_backend/app/etl_pipeline/constants.py b/surfsense_backend/app/etl_pipeline/constants.py
new file mode 100644
index 000000000..f65759c13
--- /dev/null
+++ b/surfsense_backend/app/etl_pipeline/constants.py
@@ -0,0 +1,55 @@
+import ssl
+
+import httpx
+
+LLAMACLOUD_MAX_RETRIES = 5
+LLAMACLOUD_BASE_DELAY = 10
+LLAMACLOUD_MAX_DELAY = 120
+# NOTE(review): OSError is a base class of ssl.SSLError, ConnectionError,
+# ConnectionResetError and TimeoutError, so those entries are redundant, and
+# it also matches FileNotFoundError/PermissionError; confirm that retrying
+# on every OSError is intended.
+LLAMACLOUD_RETRYABLE_EXCEPTIONS = (
+    ssl.SSLError,
+    httpx.ConnectError,
+    httpx.ConnectTimeout,
+    httpx.ReadError,
+    httpx.ReadTimeout,
+    httpx.WriteError,
+    httpx.WriteTimeout,
+    httpx.RemoteProtocolError,
+    httpx.LocalProtocolError,
+    ConnectionError,
+    ConnectionResetError,
+    TimeoutError,
+    OSError,
+)
+
+# Inputs to the timeout helpers below (timeouts presumably in seconds).
+UPLOAD_BYTES_PER_SECOND_SLOW = 100 * 1024
+MIN_UPLOAD_TIMEOUT = 120
+MAX_UPLOAD_TIMEOUT = 1800
+BASE_JOB_TIMEOUT = 600
+PER_PAGE_JOB_TIMEOUT = 60
+
+
+def calculate_upload_timeout(file_size_bytes: int) -> float:
+    """Estimate an upload timeout from the file size.
+
+    Divides the size by ``UPLOAD_BYTES_PER_SECOND_SLOW``, adds a 50% margin,
+    and clamps the result to ``[MIN_UPLOAD_TIMEOUT, MAX_UPLOAD_TIMEOUT]``.
+    """
+    estimated_time = (file_size_bytes / UPLOAD_BYTES_PER_SECOND_SLOW) * 1.5
+    return max(MIN_UPLOAD_TIMEOUT, min(estimated_time, MAX_UPLOAD_TIMEOUT))
+
+
+def calculate_job_timeout(estimated_pages: int, file_size_bytes: int) -> float:
+    """Return the larger of a page-based and a size-based job timeout.
+
+    Both start at ``BASE_JOB_TIMEOUT``: the page-based value adds
+    ``PER_PAGE_JOB_TIMEOUT`` per estimated page, the size-based value adds 60
+    per 10 MiB of file size.
+    """
+    page_based_timeout = BASE_JOB_TIMEOUT + (estimated_pages * PER_PAGE_JOB_TIMEOUT)
+    size_based_timeout = BASE_JOB_TIMEOUT + (file_size_bytes / (10 * 1024 * 1024)) * 60
+    return max(page_based_timeout, size_based_timeout)
diff --git a/surfsense_backend/app/etl_pipeline/etl_document.py b/surfsense_backend/app/etl_pipeline/etl_document.py
new file mode 100644
index 000000000..350c3299f
--- /dev/null
+++ b/surfsense_backend/app/etl_pipeline/etl_document.py
@@ -0,0 +1,26 @@
+from pydantic import BaseModel, field_validator
+
+
+class EtlRequest(BaseModel):
+    """Describes one file to run through the ETL pipeline."""
+
+    file_path: str
+    filename: str
+    estimated_pages: int = 0
+
+    @field_validator("filename")
+    @classmethod
+    def filename_must_not_be_empty(cls, v: str) -> str:
+        """Reject empty or whitespace-only filenames; return the value unchanged."""
+        if not v.strip():
+            raise ValueError("filename must not be empty")
+        return v
+
+
+class EtlResult(BaseModel):
+    """Extracted markdown plus the service and content-type labels for it."""
+
+    markdown_content: str
+    etl_service: str
+    actual_pages: int = 0
+    content_type: str
diff --git a/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py b/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py
new file mode 100644
index 000000000..f382451df
--- /dev/null
+++ b/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py
@@ -0,0 +1,86 @@
+from app.config import config as app_config
+from app.etl_pipeline.etl_document import EtlRequest, EtlResult
+from app.etl_pipeline.exceptions import EtlServiceUnavailableError
+from app.etl_pipeline.file_classifier import FileCategory, classify_file
+from app.etl_pipeline.parsers.audio import transcribe_audio
+from app.etl_pipeline.parsers.direct_convert import convert_file_directly
+from app.etl_pipeline.parsers.plaintext import read_plaintext
+
+
+class EtlPipelineService:
+    """Single pipeline for extracting markdown from files. All callers use this."""
+
+    async def extract(self, request: EtlRequest) -> EtlResult:
+        """Extract markdown from the file described by ``request``.
+
+        The filename is classified first: plaintext, direct-convert and
+        audio files are handled by their dedicated parsers, and every
+        other file is passed to the configured document ETL service.
+        """
+        category = classify_file(request.filename)
+
+        if category == FileCategory.PLAINTEXT:
+            content = read_plaintext(request.file_path)
+            return EtlResult(
+                markdown_content=content,
+                etl_service="PLAINTEXT",
+                content_type="plaintext",
+            )
+
+        if category == FileCategory.DIRECT_CONVERT:
+            content = convert_file_directly(request.file_path, request.filename)
+            return EtlResult(
+                markdown_content=content,
+                etl_service="DIRECT_CONVERT",
+                content_type="direct_convert",
+            )
+
+        if category == FileCategory.AUDIO:
+            content = await transcribe_audio(request.file_path, request.filename)
+            return EtlResult(
+                markdown_content=content,
+                etl_service="AUDIO",
+                content_type="audio",
+            )
+
+        return await self._extract_document(request)
+
+    async def _extract_document(self, request: EtlRequest) -> EtlResult:
+        """Parse a document with the backend named by ``ETL_SERVICE``.
+
+        Raises:
+            EtlServiceUnavailableError: If ``ETL_SERVICE`` is unset or is not
+                one of DOCLING, UNSTRUCTURED or LLAMACLOUD.
+        """
+        etl_service = app_config.ETL_SERVICE
+        if not etl_service:
+            raise EtlServiceUnavailableError(
+                "No ETL_SERVICE configured. "
+                "Set ETL_SERVICE to UNSTRUCTURED, LLAMACLOUD, or DOCLING in your .env"
+            )
+
+        # Each parser module is imported only in the branch that uses it.
+        if etl_service == "DOCLING":
+            from app.etl_pipeline.parsers.docling import parse_with_docling
+
+            content = await parse_with_docling(request.file_path, request.filename)
+        elif etl_service == "UNSTRUCTURED":
+            from app.etl_pipeline.parsers.unstructured import parse_with_unstructured
+
+            content = await parse_with_unstructured(request.file_path)
+        elif etl_service == "LLAMACLOUD":
+            from app.etl_pipeline.parsers.llamacloud import parse_with_llamacloud
+
+            content = await parse_with_llamacloud(
+                request.file_path, request.estimated_pages
+            )
+        else:
+            raise EtlServiceUnavailableError(
+                f"Unknown ETL_SERVICE: {etl_service}"
+            )
+
+        return EtlResult(
+            markdown_content=content,
+            etl_service=etl_service,
+            content_type="document",
+        )
diff --git a/surfsense_backend/app/etl_pipeline/exceptions.py b/surfsense_backend/app/etl_pipeline/exceptions.py
new file mode 100644
index 000000000..ac8fc0172
--- /dev/null
+++ b/surfsense_backend/app/etl_pipeline/exceptions.py
@@ -0,0 +1,6 @@
+class EtlParseError(Exception):
+    """Raised when an ETL parser fails to produce content."""
+
+
+class EtlServiceUnavailableError(Exception):
+    """Raised when ETL_SERVICE is unset or is not a recognised service name."""
diff --git a/surfsense_backend/app/etl_pipeline/file_classifier.py b/surfsense_backend/app/etl_pipeline/file_classifier.py
new file mode 100644
index 000000000..40c2d5aff
--- /dev/null
+++ b/surfsense_backend/app/etl_pipeline/file_classifier.py
@@ -0,0 +1,63 @@
+from enum import Enum
+from pathlib import PurePosixPath
+
+
+PLAINTEXT_EXTENSIONS = frozenset(
+    {
+        ".md", ".markdown", ".txt", ".text",
+        ".json", ".jsonl", ".yaml", ".yml", ".toml", ".ini", ".cfg", ".conf", ".xml",
+        ".css", ".scss", ".less", ".sass",
+        ".py", ".pyw", ".pyi", ".pyx",
+        ".js", ".jsx", ".ts", ".tsx", ".mjs", ".cjs",
+        ".java", ".kt", ".kts", ".scala", ".groovy",
+        ".c", ".h", ".cpp", ".cxx", ".cc", ".hpp", ".hxx",
+        ".cs", ".fs", ".fsx",
+        ".go", ".rs", ".rb", ".php", ".pl", ".pm", ".lua", ".swift",
+        ".m", ".mm", ".r", ".jl",
+        ".sh", ".bash", ".zsh", ".fish", ".bat", ".cmd", ".ps1",
+        ".sql", ".graphql", ".gql",
+        ".env", ".gitignore", ".dockerignore", ".editorconfig",
+        ".makefile", ".cmake",
+        ".log", ".rst", ".tex", ".bib", ".org", ".adoc", ".asciidoc",
+        ".vue", ".svelte", ".astro",
+        ".tf", ".hcl", ".proto",
+    }
+)
+
+AUDIO_EXTENSIONS = frozenset(
+    {".mp3", ".mp4", ".mpeg", ".mpga", ".m4a", ".wav", ".webm"}
+)
+
+DIRECT_CONVERT_EXTENSIONS = frozenset({".csv", ".tsv", ".html", ".htm"})
+
+
+class FileCategory(Enum):
+    """Extraction route chosen for a file based on its name."""
+
+    PLAINTEXT = "plaintext"
+    AUDIO = "audio"
+    DIRECT_CONVERT = "direct_convert"
+    DOCUMENT = "document"
+
+
+def classify_file(filename: str) -> FileCategory:
+    """Map a filename to the category that decides how it is extracted.
+
+    Matching is case-insensitive and based on the final extension. A bare
+    dotfile such as ``.env`` or ``.gitignore`` has an empty
+    ``PurePosixPath.suffix``, so its whole name is used as the lookup key;
+    without that the dotfile entries in ``PLAINTEXT_EXTENSIONS`` never match
+    such files. Unrecognised names fall back to ``FileCategory.DOCUMENT``.
+    """
+    path = PurePosixPath(filename)
+    suffix = path.suffix.lower()
+    if not suffix and path.name.startswith("."):
+        # pathlib treats a leading-dot name as having no suffix.
+        suffix = path.name.lower()
+    if suffix in PLAINTEXT_EXTENSIONS:
+        return FileCategory.PLAINTEXT
+    if suffix in AUDIO_EXTENSIONS:
+        return FileCategory.AUDIO
+    if suffix in DIRECT_CONVERT_EXTENSIONS:
+        return FileCategory.DIRECT_CONVERT
+    return FileCategory.DOCUMENT

From 02fc6f1d1616de98a566d6925f96061a86a114db Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sun, 5 Apr 2026 17:26:03 +0530
Subject: [PATCH 120/202] feat: add audio transcription functionality to ETL
 pipeline

---
 .../app/etl_pipeline/parsers/__init__.py      |  0
 .../app/etl_pipeline/parsers/audio.py         | 34 +++++++++++++++++++
 2 files changed, 34 insertions(+)
 create mode 100644 surfsense_backend/app/etl_pipeline/parsers/__init__.py
 create mode 100644 surfsense_backend/app/etl_pipeline/parsers/audio.py

diff --git a/surfsense_backend/app/etl_pipeline/parsers/__init__.py b/surfsense_backend/app/etl_pipeline/parsers/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/surfsense_backend/app/etl_pipeline/parsers/audio.py b/surfsense_backend/app/etl_pipeline/parsers/audio.py
new file mode 100644
index 000000000..cd49bafde
--- /dev/null
+++ b/surfsense_backend/app/etl_pipeline/parsers/audio.py
@@ -0,0 +1,48 @@
+from litellm import atranscription
+
+from app.config import config as app_config
+
+
+async def transcribe_audio(file_path: str, filename: str) -> str:
+    """Transcribe an audio file and return the transcript as markdown.
+
+    When ``STT_SERVICE`` starts with ``"local/"`` the project's ``stt_service``
+    is used; otherwise the file is sent through ``litellm.atranscription``
+    with the configured model, API key and optional API base.
+
+    Returns:
+        A ``# Transcription of {filename}`` heading followed by the text.
+
+    Raises:
+        ValueError: If the transcription result contains no text.
+    """
+    stt_service_type = (
+        "local"
+        if app_config.STT_SERVICE and app_config.STT_SERVICE.startswith("local/")
+        else "external"
+    )
+
+    if stt_service_type == "local":
+        from app.services.stt_service import stt_service
+
+        # NOTE(review): called synchronously inside a coroutine; confirm this
+        # does not stall the event loop for long recordings.
+        result = stt_service.transcribe_file(file_path)
+        text = result.get("text", "")
+        if not text:
+            raise ValueError("Transcription returned empty text")
+    else:
+        with open(file_path, "rb") as audio_file:
+            kwargs: dict = {
+                "model": app_config.STT_SERVICE,
+                "file": audio_file,
+                "api_key": app_config.STT_SERVICE_API_KEY,
+            }
+            if app_config.STT_SERVICE_API_BASE:
+                kwargs["api_base"] = app_config.STT_SERVICE_API_BASE
+            response = await atranscription(**kwargs)
+            text = response.get("text", "")
+            if not text:
+                raise ValueError("Transcription returned empty text")
+
+    return f"# Transcription of {filename}\n\n{text}"

From 35582c9389a9bc08f11cd603d8d9ed635e5a6218 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sun, 5 Apr 2026 17:26:29 +0530
Subject: [PATCH 121/202] feat: add direct_convert module to ETL pipeline for
 file conversion

---
 surfsense_backend/app/etl_pipeline/parsers/direct_convert.py | 3 +++
 1 file changed, 3 insertions(+)
 create mode 100644 surfsense_backend/app/etl_pipeline/parsers/direct_convert.py

diff --git a/surfsense_backend/app/etl_pipeline/parsers/direct_convert.py b/surfsense_backend/app/etl_pipeline/parsers/direct_convert.py
new file mode 100644
index 000000000..c9e6e8647
--- /dev/null
+++ b/surfsense_backend/app/etl_pipeline/parsers/direct_convert.py
@@ -0,0 +1,3 @@
+from app.tasks.document_processors._direct_converters import convert_file_directly
+
+__all__ = ["convert_file_directly"]

From 2824410be225e43d5b22335776ca009c8c1ae2d1 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sun, 5 Apr 2026 17:26:42 +0530
Subject: [PATCH 122/202] feat: add plaintext parser to ETL pipeline for
 reading text files

---
 surfsense_backend/app/etl_pipeline/parsers/plaintext.py | 8 ++++++++
 1 file changed, 8 insertions(+)
 create mode 100644 surfsense_backend/app/etl_pipeline/parsers/plaintext.py

diff --git a/surfsense_backend/app/etl_pipeline/parsers/plaintext.py b/surfsense_backend/app/etl_pipeline/parsers/plaintext.py
new file mode 100644
index 000000000..24bfb71e5
--- /dev/null
+++ b/surfsense_backend/app/etl_pipeline/parsers/plaintext.py
@@ -0,0 +1,8 @@
+def read_plaintext(file_path: str) -> str:
+    """Read a file as UTF-8 (undecodable bytes replaced); reject NUL bytes."""
+    with open(file_path, encoding="utf-8", errors="replace") as handle:
+        text = handle.read()
+    if text.find("\x00") != -1:
+        msg = f"File contains null bytes — likely a binary file opened as text: {file_path}"
+        raise ValueError(msg)
+    return text

From f40de6b6954c1ca286a022eebff7e994213d6f26 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sun, 5 Apr 2026 17:27:24 +0530
Subject: [PATCH 123/202] feat: add parsers for Docling, LlamaCloud, and
 Unstructured to ETL pipeline

---
 .../app/etl_pipeline/parsers/docling.py       |  26 ++++
 .../app/etl_pipeline/parsers/llamacloud.py    | 129 ++++++++++++++++++
 .../app/etl_pipeline/parsers/unstructured.py  |  14 ++
 3 files changed, 169 insertions(+)
 create mode 100644 surfsense_backend/app/etl_pipeline/parsers/docling.py
 create mode 100644 surfsense_backend/app/etl_pipeline/parsers/llamacloud.py
 create mode 100644 surfsense_backend/app/etl_pipeline/parsers/unstructured.py

diff --git a/surfsense_backend/app/etl_pipeline/parsers/docling.py b/surfsense_backend/app/etl_pipeline/parsers/docling.py
new file mode 100644
index 000000000..df0498148
--- /dev/null
+++ b/surfsense_backend/app/etl_pipeline/parsers/docling.py
@@ -0,0 +1,26 @@
+import warnings
+from logging import ERROR, getLogger
+
+
+async def parse_with_docling(file_path: str, filename: str) -> str:
+    """Process a document through the Docling service; return its "content"."""
+    from app.services.docling_service import create_docling_service
+
+    service = create_docling_service()
+    pdf_log = getLogger("pdfminer")
+    saved_level = pdf_log.level
+
+    with warnings.catch_warnings():
+        warnings.filterwarnings("ignore", category=UserWarning, module="pdfminer")
+        warnings.filterwarnings(
+            "ignore", message=".*Cannot set gray non-stroke color.*"
+        )
+        warnings.filterwarnings("ignore", message=".*invalid float value.*")
+        pdf_log.setLevel(ERROR)
+        try:
+            parsed = await service.process_document(file_path, filename)
+        finally:
+            # Put the pdfminer logger back at its previous level even on failure.
+            pdf_log.setLevel(saved_level)
+
+    return parsed["content"]
diff --git a/surfsense_backend/app/etl_pipeline/parsers/llamacloud.py b/surfsense_backend/app/etl_pipeline/parsers/llamacloud.py
new file mode 100644
index 000000000..5115aebea
--- /dev/null
+++ b/surfsense_backend/app/etl_pipeline/parsers/llamacloud.py
@@ -0,0 +1,129 @@
+import asyncio
+import logging
+import os
+import random
+
+import httpx
+
+from app.config import config as app_config
+from app.etl_pipeline.constants import (
+    LLAMACLOUD_BASE_DELAY,
+    LLAMACLOUD_MAX_DELAY,
+    LLAMACLOUD_MAX_RETRIES,
+    LLAMACLOUD_RETRYABLE_EXCEPTIONS,
+    PER_PAGE_JOB_TIMEOUT,
+    calculate_job_timeout,
+    calculate_upload_timeout,
+)
+
+
+async def parse_with_llamacloud(file_path: str, estimated_pages: int) -> str:
+    """Parse a file with LlamaParse (markdown result type) and return its text.
+
+    Retryable errors back off (exponential, jittered); others propagate at once.
+    """
+    from llama_cloud_services import LlamaParse
+    from llama_cloud_services.parse.utils import ResultType
+
+    file_size_bytes = os.path.getsize(file_path)
+    file_size_mb = file_size_bytes / (1024 * 1024)
+    upload_timeout = calculate_upload_timeout(file_size_bytes)
+    job_timeout = calculate_job_timeout(estimated_pages, file_size_bytes)
+
+    custom_timeout = httpx.Timeout(
+        connect=120.0,
+        read=upload_timeout,
+        write=upload_timeout,
+        pool=120.0,
+    )
+
+    logging.info(
+        f"LlamaCloud upload configured: file_size={file_size_mb:.1f}MB, "
+        f"pages={estimated_pages}, upload_timeout={upload_timeout:.0f}s, "
+        f"job_timeout={job_timeout:.0f}s"
+    )
+
+    last_exception = None
+    attempt_errors: list[str] = []
+
+    for attempt in range(1, LLAMACLOUD_MAX_RETRIES + 1):
+        try:
+            async with httpx.AsyncClient(timeout=custom_timeout) as custom_client:
+                parser = LlamaParse(
+                    api_key=app_config.LLAMA_CLOUD_API_KEY,
+                    num_workers=1,
+                    verbose=True,
+                    language="en",
+                    result_type=ResultType.MD,
+                    max_timeout=int(max(2000, job_timeout + upload_timeout)),
+                    job_timeout_in_seconds=job_timeout,
+                    job_timeout_extra_time_per_page_in_seconds=PER_PAGE_JOB_TIMEOUT,
+                    custom_client=custom_client,
+                )
+                result = await parser.aparse(file_path)
+
+                if attempt > 1:
+                    logging.info(
+                        f"LlamaCloud upload succeeded on attempt {attempt} after "
+                        f"{len(attempt_errors)} failures"
+                    )
+
+                if hasattr(result, "get_markdown_documents"):
+                    markdown_docs = result.get_markdown_documents(
+                        split_by_page=False
+                    )
+                    if markdown_docs and hasattr(markdown_docs[0], "text"):
+                        return markdown_docs[0].text
+                    if hasattr(result, "pages") and result.pages:
+                        return "\n\n".join(
+                            p.md
+                            for p in result.pages
+                            if hasattr(p, "md") and p.md
+                        )
+                    return str(result)
+
+                if isinstance(result, list):
+                    if result and hasattr(result[0], "text"):
+                        return result[0].text
+                    return "\n\n".join(
+                        doc.page_content
+                        if hasattr(doc, "page_content")
+                        else str(doc)
+                        for doc in result
+                    )
+
+                return str(result)
+
+        except LLAMACLOUD_RETRYABLE_EXCEPTIONS as e:
+            last_exception = e
+            error_type = type(e).__name__
+            error_msg = str(e)[:200]
+            attempt_errors.append(f"Attempt {attempt}: {error_type} - {error_msg}")
+
+            if attempt < LLAMACLOUD_MAX_RETRIES:
+                base_delay = min(
+                    LLAMACLOUD_BASE_DELAY * (2 ** (attempt - 1)),
+                    LLAMACLOUD_MAX_DELAY,
+                )
+                jitter = base_delay * 0.25 * (2 * random.random() - 1)  # +/-25%
+                delay = base_delay + jitter
+
+                logging.warning(
+                    f"LlamaCloud upload failed "
+                    f"(attempt {attempt}/{LLAMACLOUD_MAX_RETRIES}): "
+                    f"{error_type}. File: {file_size_mb:.1f}MB. "
+                    f"Retrying in {delay:.0f}s..."
+                )
+                await asyncio.sleep(delay)
+            else:
+                logging.error(
+                    f"LlamaCloud upload failed after {LLAMACLOUD_MAX_RETRIES} "
+                    f"attempts. File size: {file_size_mb:.1f}MB, "
+                    f"Pages: {estimated_pages}. "
+                    f"Errors: {'; '.join(attempt_errors)}"
+                )
+
+    raise last_exception or RuntimeError(
+        f"LlamaCloud parsing failed after {LLAMACLOUD_MAX_RETRIES} retries. "
+        f"File size: {file_size_mb:.1f}MB"
+    )
diff --git a/surfsense_backend/app/etl_pipeline/parsers/unstructured.py b/surfsense_backend/app/etl_pipeline/parsers/unstructured.py
new file mode 100644
index 000000000..af8fb99b6
--- /dev/null
+++ b/surfsense_backend/app/etl_pipeline/parsers/unstructured.py
@@ -0,0 +1,14 @@
+async def parse_with_unstructured(file_path: str) -> str:
+    """Load a file with UnstructuredLoader and join its non-empty element texts."""
+    from langchain_unstructured import UnstructuredLoader
+
+    loader_options = {
+        "mode": "elements",
+        "post_processors": [],
+        "languages": ["eng"],
+        "include_orig_elements": False,
+        "include_metadata": False,
+        "strategy": "auto",
+    }
+    elements = await UnstructuredLoader(file_path, **loader_options).aload()
+    return "\n\n".join(el.page_content for el in elements if el.page_content)

From 1248363ca980916cd5e16df66dbcc3cd37a2e68f Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sun, 5 Apr 2026 17:29:24 +0530
Subject: [PATCH 124/202] refactor: consolidate document processing logic and
 remove unused files and ETL strategies

---
 .../app/tasks/document_processors/__init__.py |  30 +--
 .../tasks/document_processors/_constants.py   |  74 -------
 .../app/tasks/document_processors/_etl.py     | 209 ------------------
 .../app/tasks/document_processors/_helpers.py |  25 ---
 .../app/tasks/document_processors/_save.py    |  81 -------
 5 files changed, 3 insertions(+), 416 deletions(-)
 delete mode 100644 surfsense_backend/app/tasks/document_processors/_constants.py
 delete mode 100644 surfsense_backend/app/tasks/document_processors/_etl.py

diff --git a/surfsense_backend/app/tasks/document_processors/__init__.py b/surfsense_backend/app/tasks/document_processors/__init__.py
index 2b5690d02..f82c10883 100644
--- a/surfsense_backend/app/tasks/document_processors/__init__.py
+++ b/surfsense_backend/app/tasks/document_processors/__init__.py
@@ -1,41 +1,17 @@
 """
 Document processors module for background tasks.
 
-This module provides a collection of document processors for different content types
-and sources. Each processor is responsible for handling a specific type of document
-processing task in the background.
-
-Available processors:
-- Extension processor: Handle documents from browser extension
-- Markdown processor: Process markdown files
-- File processors: Handle files using different ETL services (Unstructured, LlamaCloud, Docling)
-- YouTube processor: Process YouTube videos and extract transcripts
+Content extraction is handled by ``app.etl_pipeline.EtlPipelineService``.
+This package keeps orchestration (save, notify, page-limit) and
+non-ETL processors (extension, markdown, youtube).
 """
 
-# Extension processor
-# File processors (backward-compatible re-exports from _save)
-from ._save import (
-    add_received_file_document_using_docling,
-    add_received_file_document_using_llamacloud,
-    add_received_file_document_using_unstructured,
-)
 from .extension_processor import add_extension_received_document
-
-# Markdown processor
 from .markdown_processor import add_received_markdown_file_document
-
-# YouTube processor
 from .youtube_processor import add_youtube_video_document
 
 __all__ = [
-    # Extension processing
     "add_extension_received_document",
-    # File processing with different ETL services
-    "add_received_file_document_using_docling",
-    "add_received_file_document_using_llamacloud",
-    "add_received_file_document_using_unstructured",
-    # Markdown file processing
     "add_received_markdown_file_document",
-    # YouTube video processing
     "add_youtube_video_document",
 ]
diff --git a/surfsense_backend/app/tasks/document_processors/_constants.py b/surfsense_backend/app/tasks/document_processors/_constants.py
deleted file mode 100644
index f74d7acce..000000000
--- a/surfsense_backend/app/tasks/document_processors/_constants.py
+++ /dev/null
@@ -1,74 +0,0 @@
-"""
-Constants for file document processing.
-
-Centralizes file type classification, LlamaCloud retry configuration,
-and timeout calculation parameters.
-"""
-
-import ssl
-from enum import Enum
-
-import httpx
-
-# ---------------------------------------------------------------------------
-# File type classification
-# ---------------------------------------------------------------------------
-
-MARKDOWN_EXTENSIONS = (".md", ".markdown", ".txt")
-AUDIO_EXTENSIONS = (".mp3", ".mp4", ".mpeg", ".mpga", ".m4a", ".wav", ".webm")
-DIRECT_CONVERT_EXTENSIONS = (".csv", ".tsv", ".html", ".htm")
-
-
-class FileCategory(Enum):
-    MARKDOWN = "markdown"
-    AUDIO = "audio"
-    DIRECT_CONVERT = "direct_convert"
-    DOCUMENT = "document"
-
-
-def classify_file(filename: str) -> FileCategory:
-    """Classify a file by its extension into a processing category."""
-    lower = filename.lower()
-    if lower.endswith(MARKDOWN_EXTENSIONS):
-        return FileCategory.MARKDOWN
-    if lower.endswith(AUDIO_EXTENSIONS):
-        return FileCategory.AUDIO
-    if lower.endswith(DIRECT_CONVERT_EXTENSIONS):
-        return FileCategory.DIRECT_CONVERT
-    return FileCategory.DOCUMENT
-
-
-# ---------------------------------------------------------------------------
-# LlamaCloud retry configuration
-# ---------------------------------------------------------------------------
-
-LLAMACLOUD_MAX_RETRIES = 5
-LLAMACLOUD_BASE_DELAY = 10  # seconds (exponential backoff base)
-LLAMACLOUD_MAX_DELAY = 120  # max delay between retries (2 minutes)
-LLAMACLOUD_RETRYABLE_EXCEPTIONS = (
-    ssl.SSLError,
-    httpx.ConnectError,
-    httpx.ConnectTimeout,
-    httpx.ReadError,
-    httpx.ReadTimeout,
-    httpx.WriteError,
-    httpx.WriteTimeout,
-    httpx.RemoteProtocolError,
-    httpx.LocalProtocolError,
-    ConnectionError,
-    ConnectionResetError,
-    TimeoutError,
-    OSError,
-)
-
-# ---------------------------------------------------------------------------
-# Timeout calculation constants
-# ---------------------------------------------------------------------------
-
-UPLOAD_BYTES_PER_SECOND_SLOW = (
-    100 * 1024
-)  # 100 KB/s (conservative for slow connections)
-MIN_UPLOAD_TIMEOUT = 120  # Minimum 2 minutes for any file
-MAX_UPLOAD_TIMEOUT = 1800  # Maximum 30 minutes for very large files
-BASE_JOB_TIMEOUT = 600  # 10 minutes base for job processing
-PER_PAGE_JOB_TIMEOUT = 60  # 1 minute per page for processing
diff --git a/surfsense_backend/app/tasks/document_processors/_etl.py b/surfsense_backend/app/tasks/document_processors/_etl.py
deleted file mode 100644
index cc3a8b1ac..000000000
--- a/surfsense_backend/app/tasks/document_processors/_etl.py
+++ /dev/null
@@ -1,209 +0,0 @@
-"""
-ETL parsing strategies for different document processing services.
-
-Provides parse functions for Unstructured, LlamaCloud, and Docling, along with
-LlamaCloud retry logic and dynamic timeout calculations.
-"""
-
-import asyncio
-import logging
-import os
-import random
-import warnings
-from logging import ERROR, getLogger
-
-import httpx
-
-from app.config import config as app_config
-from app.db import Log
-from app.services.task_logging_service import TaskLoggingService
-
-from ._constants import (
-    LLAMACLOUD_BASE_DELAY,
-    LLAMACLOUD_MAX_DELAY,
-    LLAMACLOUD_MAX_RETRIES,
-    LLAMACLOUD_RETRYABLE_EXCEPTIONS,
-    PER_PAGE_JOB_TIMEOUT,
-)
-from ._helpers import calculate_job_timeout, calculate_upload_timeout
-
-# ---------------------------------------------------------------------------
-# LlamaCloud parsing with retry
-# ---------------------------------------------------------------------------
-
-
-async def parse_with_llamacloud_retry(
-    file_path: str,
-    estimated_pages: int,
-    task_logger: TaskLoggingService | None = None,
-    log_entry: Log | None = None,
-):
-    """
-    Parse a file with LlamaCloud with retry logic for transient SSL/connection errors.
-
-    Uses dynamic timeout calculations based on file size and page count to handle
-    very large files reliably.
-
-    Returns:
-        LlamaParse result object
-
-    Raises:
-        Exception: If all retries fail
-    """
-    from llama_cloud_services import LlamaParse
-    from llama_cloud_services.parse.utils import ResultType
-
-    file_size_bytes = os.path.getsize(file_path)
-    file_size_mb = file_size_bytes / (1024 * 1024)
-
-    upload_timeout = calculate_upload_timeout(file_size_bytes)
-    job_timeout = calculate_job_timeout(estimated_pages, file_size_bytes)
-
-    custom_timeout = httpx.Timeout(
-        connect=120.0,
-        read=upload_timeout,
-        write=upload_timeout,
-        pool=120.0,
-    )
-
-    logging.info(
-        f"LlamaCloud upload configured: file_size={file_size_mb:.1f}MB, "
-        f"pages={estimated_pages}, upload_timeout={upload_timeout:.0f}s, "
-        f"job_timeout={job_timeout:.0f}s"
-    )
-
-    last_exception = None
-    attempt_errors: list[str] = []
-
-    for attempt in range(1, LLAMACLOUD_MAX_RETRIES + 1):
-        try:
-            async with httpx.AsyncClient(timeout=custom_timeout) as custom_client:
-                parser = LlamaParse(
-                    api_key=app_config.LLAMA_CLOUD_API_KEY,
-                    num_workers=1,
-                    verbose=True,
-                    language="en",
-                    result_type=ResultType.MD,
-                    max_timeout=int(max(2000, job_timeout + upload_timeout)),
-                    job_timeout_in_seconds=job_timeout,
-                    job_timeout_extra_time_per_page_in_seconds=PER_PAGE_JOB_TIMEOUT,
-                    custom_client=custom_client,
-                )
-                result = await parser.aparse(file_path)
-
-                if attempt > 1:
-                    logging.info(
-                        f"LlamaCloud upload succeeded on attempt {attempt} after "
-                        f"{len(attempt_errors)} failures"
-                    )
-                return result
-
-        except LLAMACLOUD_RETRYABLE_EXCEPTIONS as e:
-            last_exception = e
-            error_type = type(e).__name__
-            error_msg = str(e)[:200]
-            attempt_errors.append(f"Attempt {attempt}: {error_type} - {error_msg}")
-
-            if attempt < LLAMACLOUD_MAX_RETRIES:
-                base_delay = min(
-                    LLAMACLOUD_BASE_DELAY * (2 ** (attempt - 1)),
-                    LLAMACLOUD_MAX_DELAY,
-                )
-                jitter = base_delay * 0.25 * (2 * random.random() - 1)
-                delay = base_delay + jitter
-
-                if task_logger and log_entry:
-                    await task_logger.log_task_progress(
-                        log_entry,
-                        f"LlamaCloud upload failed "
-                        f"(attempt {attempt}/{LLAMACLOUD_MAX_RETRIES}), "
-                        f"retrying in {delay:.0f}s",
-                        {
-                            "error_type": error_type,
-                            "error_message": error_msg,
-                            "attempt": attempt,
-                            "retry_delay": delay,
-                            "file_size_mb": round(file_size_mb, 1),
-                            "upload_timeout": upload_timeout,
-                        },
-                    )
-                else:
-                    logging.warning(
-                        f"LlamaCloud upload failed "
-                        f"(attempt {attempt}/{LLAMACLOUD_MAX_RETRIES}): "
-                        f"{error_type}. File: {file_size_mb:.1f}MB. "
-                        f"Retrying in {delay:.0f}s..."
-                    )
-
-                await asyncio.sleep(delay)
-            else:
-                logging.error(
-                    f"LlamaCloud upload failed after {LLAMACLOUD_MAX_RETRIES} "
-                    f"attempts. File size: {file_size_mb:.1f}MB, "
-                    f"Pages: {estimated_pages}. "
-                    f"Errors: {'; '.join(attempt_errors)}"
-                )
-
-        except Exception:
-            raise
-
-    raise last_exception or RuntimeError(
-        f"LlamaCloud parsing failed after {LLAMACLOUD_MAX_RETRIES} retries. "
-        f"File size: {file_size_mb:.1f}MB"
-    )
-
-
-# ---------------------------------------------------------------------------
-# Per-service parse functions
-# ---------------------------------------------------------------------------
-
-
-async def parse_with_unstructured(file_path: str):
-    """
-    Parse a file using the Unstructured ETL service.
-
-    Returns:
-        List of LangChain Document elements.
-    """
-    from langchain_unstructured import UnstructuredLoader
-
-    loader = UnstructuredLoader(
-        file_path,
-        mode="elements",
-        post_processors=[],
-        languages=["eng"],
-        include_orig_elements=False,
-        include_metadata=False,
-        strategy="auto",
-    )
-    return await loader.aload()
-
-
-async def parse_with_docling(file_path: str, filename: str) -> str:
-    """
-    Parse a file using the Docling ETL service (via the Docling service wrapper).
-
-    Returns:
-        Markdown content string.
-    """
-    from app.services.docling_service import create_docling_service
-
-    docling_service = create_docling_service()
-
-    pdfminer_logger = getLogger("pdfminer")
-    original_level = pdfminer_logger.level
-
-    with warnings.catch_warnings():
-        warnings.filterwarnings("ignore", category=UserWarning, module="pdfminer")
-        warnings.filterwarnings(
-            "ignore", message=".*Cannot set gray non-stroke color.*"
-        )
-        warnings.filterwarnings("ignore", message=".*invalid float value.*")
-        pdfminer_logger.setLevel(ERROR)
-
-        try:
-            result = await docling_service.process_document(file_path, filename)
-        finally:
-            pdfminer_logger.setLevel(original_level)
-
-    return result["content"]
diff --git a/surfsense_backend/app/tasks/document_processors/_helpers.py b/surfsense_backend/app/tasks/document_processors/_helpers.py
index 7ac05932c..9cd7b87c9 100644
--- a/surfsense_backend/app/tasks/document_processors/_helpers.py
+++ b/surfsense_backend/app/tasks/document_processors/_helpers.py
@@ -11,13 +11,6 @@ from sqlalchemy.ext.asyncio import AsyncSession
 from app.db import Document, DocumentStatus, DocumentType
 from app.utils.document_converters import generate_unique_identifier_hash
 
-from ._constants import (
-    BASE_JOB_TIMEOUT,
-    MAX_UPLOAD_TIMEOUT,
-    MIN_UPLOAD_TIMEOUT,
-    PER_PAGE_JOB_TIMEOUT,
-    UPLOAD_BYTES_PER_SECOND_SLOW,
-)
 from .base import (
     check_document_by_unique_identifier,
     check_duplicate_document,
@@ -198,21 +191,3 @@ async def update_document_from_connector(
     if "connector_id" in connector:
         document.connector_id = connector["connector_id"]
     await session.commit()
-
-
-# ---------------------------------------------------------------------------
-# Timeout calculations
-# ---------------------------------------------------------------------------
-
-
-def calculate_upload_timeout(file_size_bytes: int) -> float:
-    """Calculate upload timeout based on file size (conservative for slow connections)."""
-    estimated_time = (file_size_bytes / UPLOAD_BYTES_PER_SECOND_SLOW) * 1.5
-    return max(MIN_UPLOAD_TIMEOUT, min(estimated_time, MAX_UPLOAD_TIMEOUT))
-
-
-def calculate_job_timeout(estimated_pages: int, file_size_bytes: int) -> float:
-    """Calculate job processing timeout based on page count and file size."""
-    page_based_timeout = BASE_JOB_TIMEOUT + (estimated_pages * PER_PAGE_JOB_TIMEOUT)
-    size_based_timeout = BASE_JOB_TIMEOUT + (file_size_bytes / (10 * 1024 * 1024)) * 60
-    return max(page_based_timeout, size_based_timeout)
diff --git a/surfsense_backend/app/tasks/document_processors/_save.py b/surfsense_backend/app/tasks/document_processors/_save.py
index 5088ad004..ae45f7a69 100644
--- a/surfsense_backend/app/tasks/document_processors/_save.py
+++ b/surfsense_backend/app/tasks/document_processors/_save.py
@@ -1,14 +1,9 @@
 """
 Unified document save/update logic for file processors.
-
-Replaces the three nearly-identical ``add_received_file_document_using_*``
-functions with a single ``save_file_document`` function plus thin wrappers
-for backward compatibility.
 """
 
 import logging
 
-from langchain_core.documents import Document as LangChainDocument
 from sqlalchemy.exc import SQLAlchemyError
 from sqlalchemy.ext.asyncio import AsyncSession
 
@@ -207,79 +202,3 @@ async def save_file_document(
         raise RuntimeError(
             f"Failed to process file document using {etl_service}: {e!s}"
         ) from e
-
-
-# ---------------------------------------------------------------------------
-# Backward-compatible wrapper functions
-# ---------------------------------------------------------------------------
-
-
-async def add_received_file_document_using_unstructured(
-    session: AsyncSession,
-    file_name: str,
-    unstructured_processed_elements: list[LangChainDocument],
-    search_space_id: int,
-    user_id: str,
-    connector: dict | None = None,
-    enable_summary: bool = True,
-) -> Document | None:
-    """Process and store a file document using the Unstructured service."""
-    from app.utils.document_converters import convert_document_to_markdown
-
-    markdown_content = await convert_document_to_markdown(
-        unstructured_processed_elements
-    )
-    return await save_file_document(
-        session,
-        file_name,
-        markdown_content,
-        search_space_id,
-        user_id,
-        "UNSTRUCTURED",
-        connector,
-        enable_summary,
-    )
-
-
-async def add_received_file_document_using_llamacloud(
-    session: AsyncSession,
-    file_name: str,
-    llamacloud_markdown_document: str,
-    search_space_id: int,
-    user_id: str,
-    connector: dict | None = None,
-    enable_summary: bool = True,
-) -> Document | None:
-    """Process and store document content parsed by LlamaCloud."""
-    return await save_file_document(
-        session,
-        file_name,
-        llamacloud_markdown_document,
-        search_space_id,
-        user_id,
-        "LLAMACLOUD",
-        connector,
-        enable_summary,
-    )
-
-
-async def add_received_file_document_using_docling(
-    session: AsyncSession,
-    file_name: str,
-    docling_markdown_document: str,
-    search_space_id: int,
-    user_id: str,
-    connector: dict | None = None,
-    enable_summary: bool = True,
-) -> Document | None:
-    """Process and store document content parsed by Docling."""
-    return await save_file_document(
-        session,
-        file_name,
-        docling_markdown_document,
-        search_space_id,
-        user_id,
-        "DOCLING",
-        connector,
-        enable_summary,
-    )

From 8224360afa532300ffcd3afb7f4ea2627b253e99 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sun, 5 Apr 2026 17:30:29 +0530
Subject: [PATCH 125/202] refactor: unify file parsing logic across Dropbox,
 Google Drive, and OneDrive using the ETL pipeline

---
 .../connectors/dropbox/content_extractor.py   |   8 +-
 .../google_drive/content_extractor.py         | 102 ++--------------
 .../connectors/onedrive/content_extractor.py  | 110 ++----------------
 3 files changed, 21 insertions(+), 199 deletions(-)

diff --git a/surfsense_backend/app/connectors/dropbox/content_extractor.py b/surfsense_backend/app/connectors/dropbox/content_extractor.py
index e89893b14..8e947eee7 100644
--- a/surfsense_backend/app/connectors/dropbox/content_extractor.py
+++ b/surfsense_backend/app/connectors/dropbox/content_extractor.py
@@ -87,9 +87,13 @@ async def download_and_extract_content(
         if error:
             return None, metadata, error
 
-        from app.connectors.onedrive.content_extractor import _parse_file_to_markdown
+        from app.etl_pipeline.etl_document import EtlRequest
+        from app.etl_pipeline.etl_pipeline_service import EtlPipelineService
 
-        markdown = await _parse_file_to_markdown(temp_file_path, file_name)
+        result = await EtlPipelineService().extract(
+            EtlRequest(file_path=temp_file_path, filename=file_name)
+        )
+        markdown = result.markdown_content
         return markdown, metadata, None
 
     except Exception as e:
diff --git a/surfsense_backend/app/connectors/google_drive/content_extractor.py b/surfsense_backend/app/connectors/google_drive/content_extractor.py
index 1e94133b4..0c559fee9 100644
--- a/surfsense_backend/app/connectors/google_drive/content_extractor.py
+++ b/surfsense_backend/app/connectors/google_drive/content_extractor.py
@@ -1,12 +1,9 @@
 """Content extraction for Google Drive files."""
 
-import asyncio
 import contextlib
 import logging
 import os
 import tempfile
-import threading
-import time
 from pathlib import Path
 from typing import Any
 
@@ -110,99 +107,14 @@ async def download_and_extract_content(
 
 
 async def _parse_file_to_markdown(file_path: str, filename: str) -> str:
-    """Parse a local file to markdown using the configured ETL service."""
-    lower = filename.lower()
+    """Parse a local file to markdown using the unified ETL pipeline."""
+    from app.etl_pipeline.etl_document import EtlRequest
+    from app.etl_pipeline.etl_pipeline_service import EtlPipelineService
 
-    if lower.endswith((".md", ".markdown", ".txt")):
-        with open(file_path, encoding="utf-8") as f:
-            return f.read()
-
-    if lower.endswith((".mp3", ".mp4", ".mpeg", ".mpga", ".m4a", ".wav", ".webm")):
-        from litellm import atranscription
-
-        from app.config import config as app_config
-
-        stt_service_type = (
-            "local"
-            if app_config.STT_SERVICE and app_config.STT_SERVICE.startswith("local/")
-            else "external"
-        )
-        if stt_service_type == "local":
-            from app.services.stt_service import stt_service
-
-            t0 = time.monotonic()
-            logger.info(
-                f"[local-stt] START file={filename} thread={threading.current_thread().name}"
-            )
-            result = await asyncio.to_thread(stt_service.transcribe_file, file_path)
-            logger.info(
-                f"[local-stt] END file={filename} elapsed={time.monotonic() - t0:.2f}s"
-            )
-            text = result.get("text", "")
-        else:
-            with open(file_path, "rb") as audio_file:
-                kwargs: dict[str, Any] = {
-                    "model": app_config.STT_SERVICE,
-                    "file": audio_file,
-                    "api_key": app_config.STT_SERVICE_API_KEY,
-                }
-                if app_config.STT_SERVICE_API_BASE:
-                    kwargs["api_base"] = app_config.STT_SERVICE_API_BASE
-                resp = await atranscription(**kwargs)
-                text = resp.get("text", "")
-
-        if not text:
-            raise ValueError("Transcription returned empty text")
-        return f"# Transcription of {filename}\n\n{text}"
-
-    # Document files -- use configured ETL service
-    from app.config import config as app_config
-
-    if app_config.ETL_SERVICE == "UNSTRUCTURED":
-        from langchain_unstructured import UnstructuredLoader
-
-        from app.utils.document_converters import convert_document_to_markdown
-
-        loader = UnstructuredLoader(
-            file_path,
-            mode="elements",
-            post_processors=[],
-            languages=["eng"],
-            include_orig_elements=False,
-            include_metadata=False,
-            strategy="auto",
-        )
-        docs = await loader.aload()
-        return await convert_document_to_markdown(docs)
-
-    if app_config.ETL_SERVICE == "LLAMACLOUD":
-        from app.tasks.document_processors.file_processors import (
-            parse_with_llamacloud_retry,
-        )
-
-        result = await parse_with_llamacloud_retry(
-            file_path=file_path, estimated_pages=50
-        )
-        markdown_documents = await result.aget_markdown_documents(split_by_page=False)
-        if not markdown_documents:
-            raise RuntimeError(f"LlamaCloud returned no documents for {filename}")
-        return markdown_documents[0].text
-
-    if app_config.ETL_SERVICE == "DOCLING":
-        from docling.document_converter import DocumentConverter
-
-        converter = DocumentConverter()
-        t0 = time.monotonic()
-        logger.info(
-            f"[docling] START file={filename} thread={threading.current_thread().name}"
-        )
-        result = await asyncio.to_thread(converter.convert, file_path)
-        logger.info(
-            f"[docling] END file={filename} elapsed={time.monotonic() - t0:.2f}s"
-        )
-        return result.document.export_to_markdown()
-
-    raise RuntimeError(f"Unknown ETL_SERVICE: {app_config.ETL_SERVICE}")
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=file_path, filename=filename)
+    )
+    return result.markdown_content
 
 
 async def download_and_process_file(
diff --git a/surfsense_backend/app/connectors/onedrive/content_extractor.py b/surfsense_backend/app/connectors/onedrive/content_extractor.py
index 8917ba1fd..2355993eb 100644
--- a/surfsense_backend/app/connectors/onedrive/content_extractor.py
+++ b/surfsense_backend/app/connectors/onedrive/content_extractor.py
@@ -1,16 +1,9 @@
-"""Content extraction for OneDrive files.
+"""Content extraction for OneDrive files."""
 
-Reuses the same ETL parsing logic as Google Drive since file parsing is
-extension-based, not provider-specific.
-"""
-
-import asyncio
 import contextlib
 import logging
 import os
 import tempfile
-import threading
-import time
 from pathlib import Path
 from typing import Any
 
@@ -84,98 +77,11 @@ async def download_and_extract_content(
 
 
 async def _parse_file_to_markdown(file_path: str, filename: str) -> str:
-    """Parse a local file to markdown using the configured ETL service.
+    """Parse a local file to markdown using the unified ETL pipeline."""
+    from app.etl_pipeline.etl_document import EtlRequest
+    from app.etl_pipeline.etl_pipeline_service import EtlPipelineService
 
-    Same logic as Google Drive -- file parsing is extension-based.
-    """
-    lower = filename.lower()
-
-    if lower.endswith((".md", ".markdown", ".txt")):
-        with open(file_path, encoding="utf-8") as f:
-            return f.read()
-
-    if lower.endswith((".mp3", ".mp4", ".mpeg", ".mpga", ".m4a", ".wav", ".webm")):
-        from litellm import atranscription
-
-        from app.config import config as app_config
-
-        stt_service_type = (
-            "local"
-            if app_config.STT_SERVICE and app_config.STT_SERVICE.startswith("local/")
-            else "external"
-        )
-        if stt_service_type == "local":
-            from app.services.stt_service import stt_service
-
-            t0 = time.monotonic()
-            logger.info(
-                f"[local-stt] START file={filename} thread={threading.current_thread().name}"
-            )
-            result = await asyncio.to_thread(stt_service.transcribe_file, file_path)
-            logger.info(
-                f"[local-stt] END file={filename} elapsed={time.monotonic() - t0:.2f}s"
-            )
-            text = result.get("text", "")
-        else:
-            with open(file_path, "rb") as audio_file:
-                kwargs: dict[str, Any] = {
-                    "model": app_config.STT_SERVICE,
-                    "file": audio_file,
-                    "api_key": app_config.STT_SERVICE_API_KEY,
-                }
-                if app_config.STT_SERVICE_API_BASE:
-                    kwargs["api_base"] = app_config.STT_SERVICE_API_BASE
-                resp = await atranscription(**kwargs)
-                text = resp.get("text", "")
-
-        if not text:
-            raise ValueError("Transcription returned empty text")
-        return f"# Transcription of {filename}\n\n{text}"
-
-    from app.config import config as app_config
-
-    if app_config.ETL_SERVICE == "UNSTRUCTURED":
-        from langchain_unstructured import UnstructuredLoader
-
-        from app.utils.document_converters import convert_document_to_markdown
-
-        loader = UnstructuredLoader(
-            file_path,
-            mode="elements",
-            post_processors=[],
-            languages=["eng"],
-            include_orig_elements=False,
-            include_metadata=False,
-            strategy="auto",
-        )
-        docs = await loader.aload()
-        return await convert_document_to_markdown(docs)
-
-    if app_config.ETL_SERVICE == "LLAMACLOUD":
-        from app.tasks.document_processors.file_processors import (
-            parse_with_llamacloud_retry,
-        )
-
-        result = await parse_with_llamacloud_retry(
-            file_path=file_path, estimated_pages=50
-        )
-        markdown_documents = await result.aget_markdown_documents(split_by_page=False)
-        if not markdown_documents:
-            raise RuntimeError(f"LlamaCloud returned no documents for {filename}")
-        return markdown_documents[0].text
-
-    if app_config.ETL_SERVICE == "DOCLING":
-        from docling.document_converter import DocumentConverter
-
-        converter = DocumentConverter()
-        t0 = time.monotonic()
-        logger.info(
-            f"[docling] START file={filename} thread={threading.current_thread().name}"
-        )
-        result = await asyncio.to_thread(converter.convert, file_path)
-        logger.info(
-            f"[docling] END file={filename} elapsed={time.monotonic() - t0:.2f}s"
-        )
-        return result.document.export_to_markdown()
-
-    raise RuntimeError(f"Unknown ETL_SERVICE: {app_config.ETL_SERVICE}")
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=file_path, filename=filename)
+    )
+    return result.markdown_content

From 87af012a60eee451e0af2311e3aa1547e6a6616e Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sun, 5 Apr 2026 17:45:18 +0530
Subject: [PATCH 126/202] refactor: streamline file processing by integrating
 ETL pipeline for all file types and removing redundant functions

---
 .../local_folder_indexer.py                   | 178 +---
 .../document_processors/file_processors.py    | 785 +++---------------
 2 files changed, 123 insertions(+), 840 deletions(-)

diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
index acfbce0bf..749dbf731 100644
--- a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -44,132 +44,6 @@ from .base import (
     logger,
 )
 
-PLAINTEXT_EXTENSIONS = frozenset(
-    {
-        ".md",
-        ".markdown",
-        ".txt",
-        ".text",
-        ".json",
-        ".jsonl",
-        ".yaml",
-        ".yml",
-        ".toml",
-        ".ini",
-        ".cfg",
-        ".conf",
-        ".xml",
-        ".css",
-        ".scss",
-        ".less",
-        ".sass",
-        ".py",
-        ".pyw",
-        ".pyi",
-        ".pyx",
-        ".js",
-        ".jsx",
-        ".ts",
-        ".tsx",
-        ".mjs",
-        ".cjs",
-        ".java",
-        ".kt",
-        ".kts",
-        ".scala",
-        ".groovy",
-        ".c",
-        ".h",
-        ".cpp",
-        ".cxx",
-        ".cc",
-        ".hpp",
-        ".hxx",
-        ".cs",
-        ".fs",
-        ".fsx",
-        ".go",
-        ".rs",
-        ".rb",
-        ".php",
-        ".pl",
-        ".pm",
-        ".lua",
-        ".swift",
-        ".m",
-        ".mm",
-        ".r",
-        ".R",
-        ".jl",
-        ".sh",
-        ".bash",
-        ".zsh",
-        ".fish",
-        ".bat",
-        ".cmd",
-        ".ps1",
-        ".sql",
-        ".graphql",
-        ".gql",
-        ".env",
-        ".gitignore",
-        ".dockerignore",
-        ".editorconfig",
-        ".makefile",
-        ".cmake",
-        ".log",
-        ".rst",
-        ".tex",
-        ".bib",
-        ".org",
-        ".adoc",
-        ".asciidoc",
-        ".vue",
-        ".svelte",
-        ".astro",
-        ".tf",
-        ".hcl",
-        ".proto",
-    }
-)
-
-AUDIO_EXTENSIONS = frozenset(
-    {
-        ".mp3",
-        ".mp4",
-        ".mpeg",
-        ".mpga",
-        ".m4a",
-        ".wav",
-        ".webm",
-    }
-)
-
-
-DIRECT_CONVERT_EXTENSIONS = frozenset({".csv", ".tsv", ".html", ".htm"})
-
-
-def _is_plaintext_file(filename: str) -> bool:
-    return Path(filename).suffix.lower() in PLAINTEXT_EXTENSIONS
-
-
-def _is_audio_file(filename: str) -> bool:
-    return Path(filename).suffix.lower() in AUDIO_EXTENSIONS
-
-
-def _is_direct_convert_file(filename: str) -> bool:
-    return Path(filename).suffix.lower() in DIRECT_CONVERT_EXTENSIONS
-
-
-def _needs_etl(filename: str) -> bool:
-    """File is not plaintext, not audio, and not direct-convert — requires ETL."""
-    return (
-        not _is_plaintext_file(filename)
-        and not _is_audio_file(filename)
-        and not _is_direct_convert_file(filename)
-    )
-
-
 HeartbeatCallbackType = Callable[[int], Awaitable[None]]
 
 
@@ -278,57 +152,21 @@ def scan_folder(
     return files
 
 
-def _read_plaintext_file(file_path: str) -> str:
-    """Read a plaintext/text-based file as UTF-8."""
-    with open(file_path, encoding="utf-8", errors="replace") as f:
-        content = f.read()
-    if "\x00" in content:
-        raise ValueError(
-            f"File contains null bytes — likely a binary file opened as text: {file_path}"
-        )
-    return content
 
 
 async def _read_file_content(file_path: str, filename: str) -> str:
-    """Read file content, using ETL for binary formats.
+    """Read file content via the unified ETL pipeline.
 
-    Plaintext files are read directly. Audio and document files (PDF, DOCX, etc.)
-    are routed through the configured ETL service (same as Google Drive / OneDrive).
-
-    Raises ValueError if the file cannot be parsed (e.g. no ETL service configured
-    for a binary file).
+    All file types (plaintext, audio, direct-convert, document) are handled
+    by ``EtlPipelineService``.
     """
-    if _is_plaintext_file(filename):
-        return _read_plaintext_file(file_path)
+    from app.etl_pipeline.etl_document import EtlRequest
+    from app.etl_pipeline.etl_pipeline_service import EtlPipelineService
 
-    if _is_direct_convert_file(filename):
-        from app.tasks.document_processors._direct_converters import (
-            convert_file_directly,
-        )
-
-        return convert_file_directly(file_path, filename)
-
-    if _is_audio_file(filename):
-        etl_service = config.ETL_SERVICE if hasattr(config, "ETL_SERVICE") else None
-        stt_service_val = config.STT_SERVICE if hasattr(config, "STT_SERVICE") else None
-        if not stt_service_val and not etl_service:
-            raise ValueError(
-                f"No STT_SERVICE configured — cannot transcribe audio file: {filename}"
-            )
-
-    if _needs_etl(filename):
-        etl_service = getattr(config, "ETL_SERVICE", None)
-        if not etl_service:
-            raise ValueError(
-                f"No ETL_SERVICE configured — cannot parse binary file: {filename}. "
-                f"Set ETL_SERVICE to UNSTRUCTURED, LLAMACLOUD, or DOCLING in your .env"
-            )
-
-    from app.connectors.onedrive.content_extractor import (
-        _parse_file_to_markdown,
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=file_path, filename=filename)
     )
-
-    return await _parse_file_to_markdown(file_path, filename)
+    return result.markdown_content
 
 
 def _content_hash(content: str, search_space_id: int) -> str:
diff --git a/surfsense_backend/app/tasks/document_processors/file_processors.py b/surfsense_backend/app/tasks/document_processors/file_processors.py
index 0c1cad52d..f54a963ad 100644
--- a/surfsense_backend/app/tasks/document_processors/file_processors.py
+++ b/surfsense_backend/app/tasks/document_processors/file_processors.py
@@ -1,14 +1,8 @@
 """
 File document processors orchestrating content extraction and indexing.
 
-This module is the public entry point for file processing.  It delegates to
-specialised sub-modules that each own a single concern:
-
-- ``_constants``          — file type classification and configuration constants
-- ``_helpers``            — document deduplication, migration, connector helpers
-- ``_direct_converters``  — lossless file-to-markdown for csv/tsv/html
-- ``_etl``               — ETL parsing strategies (Unstructured, LlamaCloud, Docling)
-- ``_save``              — unified document creation / update logic
+Delegates content extraction to ``app.etl_pipeline.EtlPipelineService`` and
+keeps only orchestration concerns (notifications, logging, page limits, saving).
 """
 
 from __future__ import annotations
@@ -17,38 +11,19 @@ import contextlib
 import logging
 import os
 from dataclasses import dataclass, field
-from logging import ERROR, getLogger
 
 from fastapi import HTTPException
 from sqlalchemy.ext.asyncio import AsyncSession
 
-from app.config import config as app_config
 from app.db import Document, Log, Notification
 from app.services.notification_service import NotificationService
 from app.services.task_logging_service import TaskLoggingService
 
-from ._constants import FileCategory, classify_file
-from ._direct_converters import convert_file_directly
-from ._etl import (
-    parse_with_docling,
-    parse_with_llamacloud_retry,
-    parse_with_unstructured,
-)
 from ._helpers import update_document_from_connector
-from ._save import (
-    add_received_file_document_using_docling,
-    add_received_file_document_using_llamacloud,
-    add_received_file_document_using_unstructured,
-    save_file_document,
-)
+from ._save import save_file_document
 from .markdown_processor import add_received_markdown_file_document
 
-# Re-export public API so existing ``from file_processors import …`` keeps working.
 __all__ = [
-    "add_received_file_document_using_docling",
-    "add_received_file_document_using_llamacloud",
-    "add_received_file_document_using_unstructured",
-    "parse_with_llamacloud_retry",
     "process_file_in_background",
     "process_file_in_background_with_document",
     "save_file_document",
@@ -142,35 +117,31 @@ async def _log_page_divergence(
 # ===================================================================
 
 
-async def _process_markdown_upload(ctx: _ProcessingContext) -> Document | None:
-    """Read a markdown / text file and create or update a document."""
-    await _notify(ctx, "parsing", "Reading file")
+async def _process_non_document_upload(ctx: _ProcessingContext) -> Document | None:
+    """Extract content from a non-document file (plaintext/direct_convert/audio) via the unified ETL pipeline."""
+    from app.etl_pipeline.etl_document import EtlRequest
+    from app.etl_pipeline.etl_pipeline_service import EtlPipelineService
+
+    await _notify(ctx, "parsing", "Processing file")
     await ctx.task_logger.log_task_progress(
         ctx.log_entry,
-        f"Processing markdown/text file: {ctx.filename}",
-        {"file_type": "markdown", "processing_stage": "reading_file"},
+        f"Processing file: {ctx.filename}",
+        {"processing_stage": "extracting"},
     )
 
-    with open(ctx.file_path, encoding="utf-8") as f:
-        markdown_content = f.read()
+    etl_result = await EtlPipelineService().extract(
+        EtlRequest(file_path=ctx.file_path, filename=ctx.filename)
+    )
 
     with contextlib.suppress(Exception):
         os.unlink(ctx.file_path)
 
     await _notify(ctx, "chunking")
-    await ctx.task_logger.log_task_progress(
-        ctx.log_entry,
-        f"Creating document from markdown content: {ctx.filename}",
-        {
-            "processing_stage": "creating_document",
-            "content_length": len(markdown_content),
-        },
-    )
 
     result = await add_received_markdown_file_document(
         ctx.session,
         ctx.filename,
-        markdown_content,
+        etl_result.markdown_content,
         ctx.search_space_id,
         ctx.user_id,
         ctx.connector,
@@ -181,179 +152,19 @@ async def _process_markdown_upload(ctx: _ProcessingContext) -> Document | None:
     if result:
         await ctx.task_logger.log_task_success(
             ctx.log_entry,
-            f"Successfully processed markdown file: {ctx.filename}",
+            f"Successfully processed file: {ctx.filename}",
             {
                 "document_id": result.id,
                 "content_hash": result.content_hash,
-                "file_type": "markdown",
+                "file_type": etl_result.content_type,
+                "etl_service": etl_result.etl_service,
             },
         )
     else:
         await ctx.task_logger.log_task_success(
             ctx.log_entry,
-            f"Markdown file already exists (duplicate): {ctx.filename}",
-            {"duplicate_detected": True, "file_type": "markdown"},
-        )
-    return result
-
-
-async def _process_direct_convert_upload(ctx: _ProcessingContext) -> Document | None:
-    """Convert a text-based file (csv/tsv/html) to markdown without ETL."""
-    await _notify(ctx, "parsing", "Converting file")
-    await ctx.task_logger.log_task_progress(
-        ctx.log_entry,
-        f"Direct-converting file to markdown: {ctx.filename}",
-        {"file_type": "direct_convert", "processing_stage": "converting"},
-    )
-
-    markdown_content = convert_file_directly(ctx.file_path, ctx.filename)
-
-    with contextlib.suppress(Exception):
-        os.unlink(ctx.file_path)
-
-    await _notify(ctx, "chunking")
-    await ctx.task_logger.log_task_progress(
-        ctx.log_entry,
-        f"Creating document from converted content: {ctx.filename}",
-        {
-            "processing_stage": "creating_document",
-            "content_length": len(markdown_content),
-        },
-    )
-
-    result = await add_received_markdown_file_document(
-        ctx.session,
-        ctx.filename,
-        markdown_content,
-        ctx.search_space_id,
-        ctx.user_id,
-        ctx.connector,
-    )
-    if ctx.connector:
-        await update_document_from_connector(result, ctx.connector, ctx.session)
-
-    if result:
-        await ctx.task_logger.log_task_success(
-            ctx.log_entry,
-            f"Successfully direct-converted file: {ctx.filename}",
-            {
-                "document_id": result.id,
-                "content_hash": result.content_hash,
-                "file_type": "direct_convert",
-            },
-        )
-    else:
-        await ctx.task_logger.log_task_success(
-            ctx.log_entry,
-            f"Direct-converted file already exists (duplicate): {ctx.filename}",
-            {"duplicate_detected": True, "file_type": "direct_convert"},
-        )
-    return result
-
-
-async def _process_audio_upload(ctx: _ProcessingContext) -> Document | None:
-    """Transcribe an audio file and create or update a document."""
-    await _notify(ctx, "parsing", "Transcribing audio")
-    await ctx.task_logger.log_task_progress(
-        ctx.log_entry,
-        f"Processing audio file for transcription: {ctx.filename}",
-        {"file_type": "audio", "processing_stage": "starting_transcription"},
-    )
-
-    stt_service_type = (
-        "local"
-        if app_config.STT_SERVICE and app_config.STT_SERVICE.startswith("local/")
-        else "external"
-    )
-
-    if stt_service_type == "local":
-        from app.services.stt_service import stt_service
-
-        try:
-            stt_result = stt_service.transcribe_file(ctx.file_path)
-            transcribed_text = stt_result.get("text", "")
-            if not transcribed_text:
-                raise ValueError("Transcription returned empty text")
-            transcribed_text = (
-                f"# Transcription of {ctx.filename}\n\n{transcribed_text}"
-            )
-        except Exception as e:
-            raise HTTPException(
-                status_code=422,
-                detail=f"Failed to transcribe audio file {ctx.filename}: {e!s}",
-            ) from e
-
-        await ctx.task_logger.log_task_progress(
-            ctx.log_entry,
-            f"Local STT transcription completed: {ctx.filename}",
-            {
-                "processing_stage": "local_transcription_complete",
-                "language": stt_result.get("language"),
-                "confidence": stt_result.get("language_probability"),
-                "duration": stt_result.get("duration"),
-            },
-        )
-    else:
-        from litellm import atranscription
-
-        with open(ctx.file_path, "rb") as audio_file:
-            transcription_kwargs: dict = {
-                "model": app_config.STT_SERVICE,
-                "file": audio_file,
-                "api_key": app_config.STT_SERVICE_API_KEY,
-            }
-            if app_config.STT_SERVICE_API_BASE:
-                transcription_kwargs["api_base"] = app_config.STT_SERVICE_API_BASE
-
-            transcription_response = await atranscription(**transcription_kwargs)
-            transcribed_text = transcription_response.get("text", "")
-            if not transcribed_text:
-                raise ValueError("Transcription returned empty text")
-
-        transcribed_text = f"# Transcription of {ctx.filename}\n\n{transcribed_text}"
-
-    await ctx.task_logger.log_task_progress(
-        ctx.log_entry,
-        f"Transcription completed, creating document: {ctx.filename}",
-        {
-            "processing_stage": "transcription_complete",
-            "transcript_length": len(transcribed_text),
-        },
-    )
-
-    await _notify(ctx, "chunking")
-
-    with contextlib.suppress(Exception):
-        os.unlink(ctx.file_path)
-
-    result = await add_received_markdown_file_document(
-        ctx.session,
-        ctx.filename,
-        transcribed_text,
-        ctx.search_space_id,
-        ctx.user_id,
-        ctx.connector,
-    )
-    if ctx.connector:
-        await update_document_from_connector(result, ctx.connector, ctx.session)
-
-    if result:
-        await ctx.task_logger.log_task_success(
-            ctx.log_entry,
-            f"Successfully transcribed and processed audio file: {ctx.filename}",
-            {
-                "document_id": result.id,
-                "content_hash": result.content_hash,
-                "file_type": "audio",
-                "transcript_length": len(transcribed_text),
-                "stt_service": stt_service_type,
-            },
-        )
-    else:
-        await ctx.task_logger.log_task_success(
-            ctx.log_entry,
-            f"Audio file transcript already exists (duplicate): {ctx.filename}",
-            {"duplicate_detected": True, "file_type": "audio"},
+            f"File already exists (duplicate): {ctx.filename}",
+            {"duplicate_detected": True, "file_type": etl_result.content_type},
         )
     return result
 
@@ -363,279 +174,10 @@ async def _process_audio_upload(ctx: _ProcessingContext) -> Document | None:
 # ---------------------------------------------------------------------------
 
 
-async def _etl_unstructured(
-    ctx: _ProcessingContext,
-    page_limit_service,
-    estimated_pages: int,
-) -> Document | None:
-    """Parse and save via the Unstructured ETL service."""
-    await _notify(ctx, "parsing", "Extracting content")
-    await ctx.task_logger.log_task_progress(
-        ctx.log_entry,
-        f"Processing file with Unstructured ETL: {ctx.filename}",
-        {
-            "file_type": "document",
-            "etl_service": "UNSTRUCTURED",
-            "processing_stage": "loading",
-        },
-    )
-
-    docs = await parse_with_unstructured(ctx.file_path)
-
-    await _notify(ctx, "chunking", chunks_count=len(docs))
-    await ctx.task_logger.log_task_progress(
-        ctx.log_entry,
-        f"Unstructured ETL completed, creating document: {ctx.filename}",
-        {"processing_stage": "etl_complete", "elements_count": len(docs)},
-    )
-
-    actual_pages = page_limit_service.estimate_pages_from_elements(docs)
-    final_pages = max(estimated_pages, actual_pages)
-    await _log_page_divergence(
-        ctx.task_logger,
-        ctx.log_entry,
-        ctx.filename,
-        estimated_pages,
-        actual_pages,
-        final_pages,
-    )
-
-    with contextlib.suppress(Exception):
-        os.unlink(ctx.file_path)
-
-    result = await add_received_file_document_using_unstructured(
-        ctx.session,
-        ctx.filename,
-        docs,
-        ctx.search_space_id,
-        ctx.user_id,
-        ctx.connector,
-        enable_summary=ctx.enable_summary,
-    )
-    if ctx.connector:
-        await update_document_from_connector(result, ctx.connector, ctx.session)
-
-    if result:
-        await page_limit_service.update_page_usage(
-            ctx.user_id, final_pages, allow_exceed=True
-        )
-        await ctx.task_logger.log_task_success(
-            ctx.log_entry,
-            f"Successfully processed file with Unstructured: {ctx.filename}",
-            {
-                "document_id": result.id,
-                "content_hash": result.content_hash,
-                "file_type": "document",
-                "etl_service": "UNSTRUCTURED",
-                "pages_processed": final_pages,
-            },
-        )
-    else:
-        await ctx.task_logger.log_task_success(
-            ctx.log_entry,
-            f"Document already exists (duplicate): {ctx.filename}",
-            {
-                "duplicate_detected": True,
-                "file_type": "document",
-                "etl_service": "UNSTRUCTURED",
-            },
-        )
-    return result
-
-
-async def _etl_llamacloud(
-    ctx: _ProcessingContext,
-    page_limit_service,
-    estimated_pages: int,
-) -> Document | None:
-    """Parse and save via the LlamaCloud ETL service."""
-    await _notify(ctx, "parsing", "Extracting content")
-    await ctx.task_logger.log_task_progress(
-        ctx.log_entry,
-        f"Processing file with LlamaCloud ETL: {ctx.filename}",
-        {
-            "file_type": "document",
-            "etl_service": "LLAMACLOUD",
-            "processing_stage": "parsing",
-            "estimated_pages": estimated_pages,
-        },
-    )
-
-    raw_result = await parse_with_llamacloud_retry(
-        file_path=ctx.file_path,
-        estimated_pages=estimated_pages,
-        task_logger=ctx.task_logger,
-        log_entry=ctx.log_entry,
-    )
-
-    with contextlib.suppress(Exception):
-        os.unlink(ctx.file_path)
-
-    markdown_documents = await raw_result.aget_markdown_documents(split_by_page=False)
-
-    await _notify(ctx, "chunking", chunks_count=len(markdown_documents))
-    await ctx.task_logger.log_task_progress(
-        ctx.log_entry,
-        f"LlamaCloud parsing completed, creating documents: {ctx.filename}",
-        {
-            "processing_stage": "parsing_complete",
-            "documents_count": len(markdown_documents),
-        },
-    )
-
-    if not markdown_documents:
-        await ctx.task_logger.log_task_failure(
-            ctx.log_entry,
-            f"LlamaCloud parsing returned no documents: {ctx.filename}",
-            "ETL service returned empty document list",
-            {"error_type": "EmptyDocumentList", "etl_service": "LLAMACLOUD"},
-        )
-        raise ValueError(f"LlamaCloud parsing returned no documents for {ctx.filename}")
-
-    actual_pages = page_limit_service.estimate_pages_from_markdown(markdown_documents)
-    final_pages = max(estimated_pages, actual_pages)
-    await _log_page_divergence(
-        ctx.task_logger,
-        ctx.log_entry,
-        ctx.filename,
-        estimated_pages,
-        actual_pages,
-        final_pages,
-    )
-
-    any_created = False
-    last_doc: Document | None = None
-
-    for doc in markdown_documents:
-        doc_result = await add_received_file_document_using_llamacloud(
-            ctx.session,
-            ctx.filename,
-            llamacloud_markdown_document=doc.text,
-            search_space_id=ctx.search_space_id,
-            user_id=ctx.user_id,
-            connector=ctx.connector,
-            enable_summary=ctx.enable_summary,
-        )
-        if doc_result:
-            any_created = True
-            last_doc = doc_result
-
-    if any_created:
-        await page_limit_service.update_page_usage(
-            ctx.user_id, final_pages, allow_exceed=True
-        )
-        if ctx.connector:
-            await update_document_from_connector(last_doc, ctx.connector, ctx.session)
-        await ctx.task_logger.log_task_success(
-            ctx.log_entry,
-            f"Successfully processed file with LlamaCloud: {ctx.filename}",
-            {
-                "document_id": last_doc.id,
-                "content_hash": last_doc.content_hash,
-                "file_type": "document",
-                "etl_service": "LLAMACLOUD",
-                "pages_processed": final_pages,
-                "documents_count": len(markdown_documents),
-            },
-        )
-        return last_doc
-
-    await ctx.task_logger.log_task_success(
-        ctx.log_entry,
-        f"Document already exists (duplicate): {ctx.filename}",
-        {
-            "duplicate_detected": True,
-            "file_type": "document",
-            "etl_service": "LLAMACLOUD",
-            "documents_count": len(markdown_documents),
-        },
-    )
-    return None
-
-
-async def _etl_docling(
-    ctx: _ProcessingContext,
-    page_limit_service,
-    estimated_pages: int,
-) -> Document | None:
-    """Parse and save via the Docling ETL service."""
-    await _notify(ctx, "parsing", "Extracting content")
-    await ctx.task_logger.log_task_progress(
-        ctx.log_entry,
-        f"Processing file with Docling ETL: {ctx.filename}",
-        {
-            "file_type": "document",
-            "etl_service": "DOCLING",
-            "processing_stage": "parsing",
-        },
-    )
-
-    content = await parse_with_docling(ctx.file_path, ctx.filename)
-
-    with contextlib.suppress(Exception):
-        os.unlink(ctx.file_path)
-
-    await ctx.task_logger.log_task_progress(
-        ctx.log_entry,
-        f"Docling parsing completed, creating document: {ctx.filename}",
-        {"processing_stage": "parsing_complete", "content_length": len(content)},
-    )
-
-    actual_pages = page_limit_service.estimate_pages_from_content_length(len(content))
-    final_pages = max(estimated_pages, actual_pages)
-    await _log_page_divergence(
-        ctx.task_logger,
-        ctx.log_entry,
-        ctx.filename,
-        estimated_pages,
-        actual_pages,
-        final_pages,
-    )
-
-    await _notify(ctx, "chunking")
-
-    result = await add_received_file_document_using_docling(
-        ctx.session,
-        ctx.filename,
-        docling_markdown_document=content,
-        search_space_id=ctx.search_space_id,
-        user_id=ctx.user_id,
-        connector=ctx.connector,
-        enable_summary=ctx.enable_summary,
-    )
-
-    if result:
-        await page_limit_service.update_page_usage(
-            ctx.user_id, final_pages, allow_exceed=True
-        )
-        if ctx.connector:
-            await update_document_from_connector(result, ctx.connector, ctx.session)
-        await ctx.task_logger.log_task_success(
-            ctx.log_entry,
-            f"Successfully processed file with Docling: {ctx.filename}",
-            {
-                "document_id": result.id,
-                "content_hash": result.content_hash,
-                "file_type": "document",
-                "etl_service": "DOCLING",
-                "pages_processed": final_pages,
-            },
-        )
-    else:
-        await ctx.task_logger.log_task_success(
-            ctx.log_entry,
-            f"Document already exists (duplicate): {ctx.filename}",
-            {
-                "duplicate_detected": True,
-                "file_type": "document",
-                "etl_service": "DOCLING",
-            },
-        )
-    return result
-
-
 async def _process_document_upload(ctx: _ProcessingContext) -> Document | None:
-    """Route a document file to the configured ETL service."""
+    """Route a document file to the configured ETL service via the unified pipeline."""
+    from app.etl_pipeline.etl_document import EtlRequest
+    from app.etl_pipeline.etl_pipeline_service import EtlPipelineService
     from app.services.page_limit_service import PageLimitExceededError, PageLimitService
 
     page_limit_service = PageLimitService(ctx.session)
@@ -665,16 +207,60 @@ async def _process_document_upload(ctx: _ProcessingContext) -> Document | None:
             os.unlink(ctx.file_path)
         raise HTTPException(status_code=403, detail=str(e)) from e
 
-    etl_dispatch = {
-        "UNSTRUCTURED": _etl_unstructured,
-        "LLAMACLOUD": _etl_llamacloud,
-        "DOCLING": _etl_docling,
-    }
-    handler = etl_dispatch.get(app_config.ETL_SERVICE)
-    if handler is None:
-        raise RuntimeError(f"Unknown ETL_SERVICE: {app_config.ETL_SERVICE}")
+    await _notify(ctx, "parsing", "Extracting content")
 
-    return await handler(ctx, page_limit_service, estimated_pages)
+    etl_result = await EtlPipelineService().extract(
+        EtlRequest(
+            file_path=ctx.file_path,
+            filename=ctx.filename,
+            estimated_pages=estimated_pages,
+        )
+    )
+
+    with contextlib.suppress(Exception):
+        os.unlink(ctx.file_path)
+
+    await _notify(ctx, "chunking")
+
+    result = await save_file_document(
+        ctx.session,
+        ctx.filename,
+        etl_result.markdown_content,
+        ctx.search_space_id,
+        ctx.user_id,
+        etl_result.etl_service,
+        ctx.connector,
+        enable_summary=ctx.enable_summary,
+    )
+
+    if result:
+        await page_limit_service.update_page_usage(
+            ctx.user_id, estimated_pages, allow_exceed=True
+        )
+        if ctx.connector:
+            await update_document_from_connector(result, ctx.connector, ctx.session)
+        await ctx.task_logger.log_task_success(
+            ctx.log_entry,
+            f"Successfully processed file: {ctx.filename}",
+            {
+                "document_id": result.id,
+                "content_hash": result.content_hash,
+                "file_type": "document",
+                "etl_service": etl_result.etl_service,
+                "pages_processed": estimated_pages,
+            },
+        )
+    else:
+        await ctx.task_logger.log_task_success(
+            ctx.log_entry,
+            f"Document already exists (duplicate): {ctx.filename}",
+            {
+                "duplicate_detected": True,
+                "file_type": "document",
+                "etl_service": etl_result.etl_service,
+            },
+        )
+    return result
 
 
 # ===================================================================
@@ -706,15 +292,14 @@ async def process_file_in_background(
     )
 
     try:
-        category = classify_file(filename)
+        from app.etl_pipeline.file_classifier import FileCategory as EtlFileCategory
+        from app.etl_pipeline.file_classifier import classify_file as etl_classify
 
-        if category == FileCategory.MARKDOWN:
-            return await _process_markdown_upload(ctx)
-        if category == FileCategory.DIRECT_CONVERT:
-            return await _process_direct_convert_upload(ctx)
-        if category == FileCategory.AUDIO:
-            return await _process_audio_upload(ctx)
-        return await _process_document_upload(ctx)
+        category = etl_classify(filename)
+
+        if category == EtlFileCategory.DOCUMENT:
+            return await _process_document_upload(ctx)
+        return await _process_non_document_upload(ctx)
 
     except Exception as e:
         await session.rollback()
@@ -758,201 +343,61 @@ async def _extract_file_content(
     Returns:
         Tuple of (markdown_content, etl_service_name).
     """
-    category = classify_file(filename)
+    from app.etl_pipeline.etl_document import EtlRequest
+    from app.etl_pipeline.etl_pipeline_service import EtlPipelineService
+    from app.etl_pipeline.file_classifier import FileCategory
+    from app.etl_pipeline.file_classifier import classify_file as etl_classify
 
-    if category == FileCategory.MARKDOWN:
-        if notification:
-            await NotificationService.document_processing.notify_processing_progress(
-                session,
-                notification,
-                stage="parsing",
-                stage_message="Reading file",
-            )
-        await task_logger.log_task_progress(
-            log_entry,
-            f"Processing markdown/text file: {filename}",
-            {"file_type": "markdown", "processing_stage": "reading_file"},
-        )
-        with open(file_path, encoding="utf-8") as f:
-            content = f.read()
-        with contextlib.suppress(Exception):
-            os.unlink(file_path)
-        return content, "MARKDOWN"
-
-    if category == FileCategory.DIRECT_CONVERT:
-        if notification:
-            await NotificationService.document_processing.notify_processing_progress(
-                session,
-                notification,
-                stage="parsing",
-                stage_message="Converting file",
-            )
-        await task_logger.log_task_progress(
-            log_entry,
-            f"Direct-converting file to markdown: {filename}",
-            {"file_type": "direct_convert", "processing_stage": "converting"},
-        )
-        content = convert_file_directly(file_path, filename)
-        with contextlib.suppress(Exception):
-            os.unlink(file_path)
-        return content, "DIRECT_CONVERT"
-
-    if category == FileCategory.AUDIO:
-        if notification:
-            await NotificationService.document_processing.notify_processing_progress(
-                session,
-                notification,
-                stage="parsing",
-                stage_message="Transcribing audio",
-            )
-        await task_logger.log_task_progress(
-            log_entry,
-            f"Processing audio file for transcription: {filename}",
-            {"file_type": "audio", "processing_stage": "starting_transcription"},
-        )
-        transcribed_text = await _transcribe_audio(file_path, filename)
-        with contextlib.suppress(Exception):
-            os.unlink(file_path)
-        return transcribed_text, "AUDIO_TRANSCRIPTION"
-
-    # Document file — use ETL service
-    return await _extract_document_content(
-        file_path,
-        filename,
-        session,
-        user_id,
-        task_logger,
-        log_entry,
-        notification,
-    )
-
-
-async def _transcribe_audio(file_path: str, filename: str) -> str:
-    """Transcribe an audio file and return formatted markdown text."""
-    stt_service_type = (
-        "local"
-        if app_config.STT_SERVICE and app_config.STT_SERVICE.startswith("local/")
-        else "external"
-    )
-
-    if stt_service_type == "local":
-        from app.services.stt_service import stt_service
-
-        result = stt_service.transcribe_file(file_path)
-        text = result.get("text", "")
-        if not text:
-            raise ValueError("Transcription returned empty text")
-    else:
-        from litellm import atranscription
-
-        with open(file_path, "rb") as audio_file:
-            kwargs: dict = {
-                "model": app_config.STT_SERVICE,
-                "file": audio_file,
-                "api_key": app_config.STT_SERVICE_API_KEY,
-            }
-            if app_config.STT_SERVICE_API_BASE:
-                kwargs["api_base"] = app_config.STT_SERVICE_API_BASE
-            response = await atranscription(**kwargs)
-            text = response.get("text", "")
-            if not text:
-                raise ValueError("Transcription returned empty text")
-
-    return f"# Transcription of {filename}\n\n{text}"
-
-
-async def _extract_document_content(
-    file_path: str,
-    filename: str,
-    session: AsyncSession,
-    user_id: str,
-    task_logger: TaskLoggingService,
-    log_entry: Log,
-    notification: Notification | None,
-) -> tuple[str, str]:
-    """
-    Parse a document file via the configured ETL service.
-
-    Returns:
-        Tuple of (markdown_content, etl_service_name).
-    """
-    from app.services.page_limit_service import PageLimitService
-
-    page_limit_service = PageLimitService(session)
-
-    try:
-        estimated_pages = page_limit_service.estimate_pages_before_processing(file_path)
-    except Exception:
-        file_size = os.path.getsize(file_path)
-        estimated_pages = max(1, file_size // (80 * 1024))
-
-    await page_limit_service.check_page_limit(user_id, estimated_pages)
-
-    etl_service = app_config.ETL_SERVICE
-    markdown_content: str | None = None
+    category = etl_classify(filename)
+    estimated_pages = 0
 
     if notification:
+        stage_messages = {
+            FileCategory.PLAINTEXT: "Reading file",
+            FileCategory.DIRECT_CONVERT: "Converting file",
+            FileCategory.AUDIO: "Transcribing audio",
+            FileCategory.DOCUMENT: "Extracting content",
+        }
         await NotificationService.document_processing.notify_processing_progress(
             session,
             notification,
             stage="parsing",
-            stage_message="Extracting content",
+            stage_message=stage_messages.get(category, "Processing"),
         )
 
-    if etl_service == "UNSTRUCTURED":
-        from app.utils.document_converters import convert_document_to_markdown
+    await task_logger.log_task_progress(
+        log_entry,
+        f"Processing {category.value} file: {filename}",
+        {"file_type": category.value, "processing_stage": "extracting"},
+    )
 
-        docs = await parse_with_unstructured(file_path)
-        markdown_content = await convert_document_to_markdown(docs)
-        actual_pages = page_limit_service.estimate_pages_from_elements(docs)
-        final_pages = max(estimated_pages, actual_pages)
-        await page_limit_service.update_page_usage(
-            user_id, final_pages, allow_exceed=True
-        )
+    if category == FileCategory.DOCUMENT:
+        from app.services.page_limit_service import PageLimitService
 
-    elif etl_service == "LLAMACLOUD":
-        raw_result = await parse_with_llamacloud_retry(
+        page_limit_service = PageLimitService(session)
+        estimated_pages = _estimate_pages_safe(page_limit_service, file_path)
+        await page_limit_service.check_page_limit(user_id, estimated_pages)
+
+    result = await EtlPipelineService().extract(
+        EtlRequest(
             file_path=file_path,
+            filename=filename,
             estimated_pages=estimated_pages,
-            task_logger=task_logger,
-            log_entry=log_entry,
         )
-        markdown_documents = await raw_result.aget_markdown_documents(
-            split_by_page=False
-        )
-        if not markdown_documents:
-            raise RuntimeError(f"LlamaCloud parsing returned no documents: {filename}")
-        markdown_content = markdown_documents[0].text
+    )
+
+    if category == FileCategory.DOCUMENT:
         await page_limit_service.update_page_usage(
             user_id, estimated_pages, allow_exceed=True
         )
 
-    elif etl_service == "DOCLING":
-        getLogger("docling.pipeline.base_pipeline").setLevel(ERROR)
-        getLogger("docling.document_converter").setLevel(ERROR)
-        getLogger("docling_core.transforms.chunker.hierarchical_chunker").setLevel(
-            ERROR
-        )
-
-        from docling.document_converter import DocumentConverter
-
-        converter = DocumentConverter()
-        result = converter.convert(file_path)
-        markdown_content = result.document.export_to_markdown()
-        await page_limit_service.update_page_usage(
-            user_id, estimated_pages, allow_exceed=True
-        )
-
-    else:
-        raise RuntimeError(f"Unknown ETL_SERVICE: {etl_service}")
-
     with contextlib.suppress(Exception):
         os.unlink(file_path)
 
-    if not markdown_content:
+    if not result.markdown_content:
         raise RuntimeError(f"Failed to extract content from file: {filename}")
 
-    return markdown_content, etl_service
+    return result.markdown_content, result.etl_service
 
 
 async def process_file_in_background_with_document(

From f8913adaa30eadd5407c8286c726bda783fe44a9 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sun, 5 Apr 2026 17:46:04 +0530
Subject: [PATCH 127/202] test: add unit tests for content extraction from
 cloud connectors and ETL pipeline functionality

---
 .../test_content_extraction.py                | 244 ++++++++++++++
 .../tests/unit/etl_pipeline/conftest.py       |  29 ++
 .../etl_pipeline/test_etl_pipeline_service.py | 309 ++++++++++++++++++
 3 files changed, 582 insertions(+)
 create mode 100644 surfsense_backend/tests/unit/connector_indexers/test_content_extraction.py
 create mode 100644 surfsense_backend/tests/unit/etl_pipeline/conftest.py
 create mode 100644 surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py

diff --git a/surfsense_backend/tests/unit/connector_indexers/test_content_extraction.py b/surfsense_backend/tests/unit/connector_indexers/test_content_extraction.py
new file mode 100644
index 000000000..49f9a217a
--- /dev/null
+++ b/surfsense_backend/tests/unit/connector_indexers/test_content_extraction.py
@@ -0,0 +1,244 @@
+"""Tests that each cloud connector's download_and_extract_content correctly
+produces markdown from a real file via the unified ETL pipeline.
+
+Only the cloud client is mocked (system boundary).  The ETL pipeline runs for
+real so we know the full path from "cloud gives us bytes" to "we get markdown
+back" actually works.
+"""
+
+import os
+from unittest.mock import AsyncMock, MagicMock
+
+import pytest
+
+pytestmark = pytest.mark.unit
+
+_TXT_CONTENT = "Hello from the cloud connector test."
+_CSV_CONTENT = "name,age\nAlice,30\nBob,25\n"
+
+
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+
+async def _write_file(dest_path: str, content: str) -> None:
+    """Simulate a cloud client writing a downloaded file's text to disk."""
+    with open(dest_path, "w", encoding="utf-8") as f:
+        f.write(content)
+
+
+def _make_download_side_effect(content: str):
+    """Return an async side-effect that writes *content* to the dest path
+    (taken as the last positional argument) and returns ``None`` (success)."""
+
+    async def _side_effect(*args):
+        dest_path = args[-1]
+        await _write_file(dest_path, content)
+        return None
+
+    return _side_effect
+
+
+# ===================================================================
+# Google Drive
+# ===================================================================
+
+class TestGoogleDriveContentExtraction:
+
+    async def test_txt_file_returns_markdown(self):
+        from app.connectors.google_drive.content_extractor import (
+            download_and_extract_content,
+        )
+
+        client = MagicMock()
+        client.download_file_to_disk = AsyncMock(
+            side_effect=_make_download_side_effect(_TXT_CONTENT),
+        )
+
+        file = {"id": "f1", "name": "notes.txt", "mimeType": "text/plain"}
+
+        markdown, metadata, error = await download_and_extract_content(client, file)
+
+        assert error is None
+        assert _TXT_CONTENT in markdown
+        assert metadata["google_drive_file_id"] == "f1"
+        assert metadata["google_drive_file_name"] == "notes.txt"
+
+    async def test_csv_file_returns_markdown_table(self):
+        from app.connectors.google_drive.content_extractor import (
+            download_and_extract_content,
+        )
+
+        client = MagicMock()
+        client.download_file_to_disk = AsyncMock(
+            side_effect=_make_download_side_effect(_CSV_CONTENT),
+        )
+
+        file = {"id": "f2", "name": "data.csv", "mimeType": "text/csv"}
+
+        markdown, metadata, error = await download_and_extract_content(client, file)
+
+        assert error is None
+        assert "Alice" in markdown
+        assert "Bob" in markdown
+        assert "|" in markdown
+
+    async def test_download_error_returns_error_message(self):
+        from app.connectors.google_drive.content_extractor import (
+            download_and_extract_content,
+        )
+
+        client = MagicMock()
+        client.download_file_to_disk = AsyncMock(return_value="Network timeout")
+
+        file = {"id": "f3", "name": "doc.txt", "mimeType": "text/plain"}
+
+        markdown, metadata, error = await download_and_extract_content(client, file)
+
+        assert markdown is None
+        assert error == "Network timeout"
+
+
+# ===================================================================
+# OneDrive
+# ===================================================================
+
+class TestOneDriveContentExtraction:
+
+    async def test_txt_file_returns_markdown(self):
+        from app.connectors.onedrive.content_extractor import (
+            download_and_extract_content,
+        )
+
+        client = MagicMock()
+        client.download_file_to_disk = AsyncMock(
+            side_effect=_make_download_side_effect(_TXT_CONTENT),
+        )
+
+        file = {
+            "id": "od-1",
+            "name": "report.txt",
+            "file": {"mimeType": "text/plain"},
+        }
+
+        markdown, metadata, error = await download_and_extract_content(client, file)
+
+        assert error is None
+        assert _TXT_CONTENT in markdown
+        assert metadata["onedrive_file_id"] == "od-1"
+        assert metadata["onedrive_file_name"] == "report.txt"
+
+    async def test_csv_file_returns_markdown_table(self):
+        from app.connectors.onedrive.content_extractor import (
+            download_and_extract_content,
+        )
+
+        client = MagicMock()
+        client.download_file_to_disk = AsyncMock(
+            side_effect=_make_download_side_effect(_CSV_CONTENT),
+        )
+
+        file = {
+            "id": "od-2",
+            "name": "data.csv",
+            "file": {"mimeType": "text/csv"},
+        }
+
+        markdown, metadata, error = await download_and_extract_content(client, file)
+
+        assert error is None
+        assert "Alice" in markdown
+        assert "|" in markdown
+
+    async def test_download_error_returns_error_message(self):
+        from app.connectors.onedrive.content_extractor import (
+            download_and_extract_content,
+        )
+
+        client = MagicMock()
+        client.download_file_to_disk = AsyncMock(return_value="403 Forbidden")
+
+        file = {
+            "id": "od-3",
+            "name": "secret.txt",
+            "file": {"mimeType": "text/plain"},
+        }
+
+        markdown, metadata, error = await download_and_extract_content(client, file)
+
+        assert markdown is None
+        assert error == "403 Forbidden"
+
+
+# ===================================================================
+# Dropbox
+# ===================================================================
+
+class TestDropboxContentExtraction:
+
+    async def test_txt_file_returns_markdown(self):
+        from app.connectors.dropbox.content_extractor import (
+            download_and_extract_content,
+        )
+
+        client = MagicMock()
+        client.download_file_to_disk = AsyncMock(
+            side_effect=_make_download_side_effect(_TXT_CONTENT),
+        )
+
+        file = {
+            "id": "dbx-1",
+            "name": "memo.txt",
+            ".tag": "file",
+            "path_lower": "/memo.txt",
+        }
+
+        markdown, metadata, error = await download_and_extract_content(client, file)
+
+        assert error is None
+        assert _TXT_CONTENT in markdown
+        assert metadata["dropbox_file_id"] == "dbx-1"
+        assert metadata["dropbox_file_name"] == "memo.txt"
+
+    async def test_csv_file_returns_markdown_table(self):
+        from app.connectors.dropbox.content_extractor import (
+            download_and_extract_content,
+        )
+
+        client = MagicMock()
+        client.download_file_to_disk = AsyncMock(
+            side_effect=_make_download_side_effect(_CSV_CONTENT),
+        )
+
+        file = {
+            "id": "dbx-2",
+            "name": "data.csv",
+            ".tag": "file",
+            "path_lower": "/data.csv",
+        }
+
+        markdown, metadata, error = await download_and_extract_content(client, file)
+
+        assert error is None
+        assert "Alice" in markdown
+        assert "|" in markdown
+
+    async def test_download_error_returns_error_message(self):
+        from app.connectors.dropbox.content_extractor import (
+            download_and_extract_content,
+        )
+
+        client = MagicMock()
+        client.download_file_to_disk = AsyncMock(return_value="Rate limited")
+
+        file = {
+            "id": "dbx-3",
+            "name": "big.txt",
+            ".tag": "file",
+            "path_lower": "/big.txt",
+        }
+
+        markdown, metadata, error = await download_and_extract_content(client, file)
+
+        assert markdown is None
+        assert error == "Rate limited"
diff --git a/surfsense_backend/tests/unit/etl_pipeline/conftest.py b/surfsense_backend/tests/unit/etl_pipeline/conftest.py
new file mode 100644
index 000000000..6059caa01
--- /dev/null
+++ b/surfsense_backend/tests/unit/etl_pipeline/conftest.py
@@ -0,0 +1,29 @@
+"""Pre-register the etl_pipeline package to avoid circular imports during unit tests."""
+
+import sys
+import types
+from pathlib import Path
+
+_BACKEND = Path(__file__).resolve().parents[3]
+
+
+def _stub_package(dotted: str, fs_dir: Path) -> None:
+    if dotted not in sys.modules:
+        mod = types.ModuleType(dotted)
+        mod.__path__ = [str(fs_dir)]
+        mod.__package__ = dotted
+        sys.modules[dotted] = mod
+
+    parts = dotted.split(".")
+    if len(parts) > 1:
+        parent_dotted = ".".join(parts[:-1])
+        parent = sys.modules.get(parent_dotted)
+        if parent is not None:
+            setattr(parent, parts[-1], sys.modules[dotted])
+
+
+_stub_package("app", _BACKEND / "app")
+_stub_package("app.etl_pipeline", _BACKEND / "app" / "etl_pipeline")
+_stub_package(
+    "app.etl_pipeline.parsers", _BACKEND / "app" / "etl_pipeline" / "parsers"
+)
diff --git a/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py b/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py
new file mode 100644
index 000000000..0d31507ca
--- /dev/null
+++ b/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py
@@ -0,0 +1,309 @@
+"""Tests for EtlPipelineService -- the unified ETL pipeline public interface."""
+
+import pytest
+
+from app.etl_pipeline.etl_document import EtlRequest
+from app.etl_pipeline.etl_pipeline_service import EtlPipelineService
+
+pytestmark = pytest.mark.unit
+
+
+async def test_extract_txt_file_returns_markdown(tmp_path):
+    """Tracer bullet: a .txt file is read and returned as-is in an EtlResult."""
+    txt_file = tmp_path / "hello.txt"
+    txt_file.write_text("Hello, world!", encoding="utf-8")
+
+    service = EtlPipelineService()
+    result = await service.extract(
+        EtlRequest(file_path=str(txt_file), filename="hello.txt")
+    )
+
+    assert result.markdown_content == "Hello, world!"
+    assert result.etl_service == "PLAINTEXT"
+    assert result.content_type == "plaintext"
+
+
+async def test_extract_md_file(tmp_path):
+    """A .md file is classified as PLAINTEXT and extracted."""
+    md_file = tmp_path / "readme.md"
+    md_file.write_text("# Title\n\nBody text.", encoding="utf-8")
+
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=str(md_file), filename="readme.md")
+    )
+
+    assert result.markdown_content == "# Title\n\nBody text."
+    assert result.etl_service == "PLAINTEXT"
+    assert result.content_type == "plaintext"
+
+
+async def test_extract_markdown_file(tmp_path):
+    """A .markdown file is classified as PLAINTEXT and extracted."""
+    md_file = tmp_path / "notes.markdown"
+    md_file.write_text("Some notes.", encoding="utf-8")
+
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=str(md_file), filename="notes.markdown")
+    )
+
+    assert result.markdown_content == "Some notes."
+    assert result.etl_service == "PLAINTEXT"
+
+
+async def test_extract_python_file(tmp_path):
+    """A .py source code file is classified as PLAINTEXT."""
+    py_file = tmp_path / "script.py"
+    py_file.write_text("print('hello')", encoding="utf-8")
+
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=str(py_file), filename="script.py")
+    )
+
+    assert result.markdown_content == "print('hello')"
+    assert result.etl_service == "PLAINTEXT"
+    assert result.content_type == "plaintext"
+
+
+async def test_extract_js_file(tmp_path):
+    """A .js source code file is classified as PLAINTEXT."""
+    js_file = tmp_path / "app.js"
+    js_file.write_text("console.log('hi');", encoding="utf-8")
+
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=str(js_file), filename="app.js")
+    )
+
+    assert result.markdown_content == "console.log('hi');"
+    assert result.etl_service == "PLAINTEXT"
+
+
+async def test_extract_csv_returns_markdown_table(tmp_path):
+    """A .csv file is converted to a markdown table."""
+    csv_file = tmp_path / "data.csv"
+    csv_file.write_text("name,age\nAlice,30\nBob,25\n", encoding="utf-8")
+
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=str(csv_file), filename="data.csv")
+    )
+
+    assert "| name | age |" in result.markdown_content
+    assert "| Alice | 30 |" in result.markdown_content
+    assert result.etl_service == "DIRECT_CONVERT"
+    assert result.content_type == "direct_convert"
+
+
+async def test_extract_tsv_returns_markdown_table(tmp_path):
+    """A .tsv file is converted to a markdown table."""
+    tsv_file = tmp_path / "data.tsv"
+    tsv_file.write_text("x\ty\n1\t2\n", encoding="utf-8")
+
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=str(tsv_file), filename="data.tsv")
+    )
+
+    assert "| x | y |" in result.markdown_content
+    assert result.etl_service == "DIRECT_CONVERT"
+
+
+async def test_extract_html_returns_markdown(tmp_path):
+    """An .html file is converted to markdown."""
+    html_file = tmp_path / "page.html"
+    html_file.write_text("<h1>Title</h1><p>Body</p>", encoding="utf-8")
+
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=str(html_file), filename="page.html")
+    )
+
+    assert "Title" in result.markdown_content
+    assert "Body" in result.markdown_content
+    assert result.etl_service == "DIRECT_CONVERT"
+
+
+async def test_extract_mp3_returns_transcription(tmp_path, mocker):
+    """An .mp3 audio file is transcribed via litellm.atranscription."""
+    audio_file = tmp_path / "recording.mp3"
+    audio_file.write_bytes(b"\x00" * 100)
+
+    mocker.patch("app.config.config.STT_SERVICE", "openai/whisper-1")
+    mocker.patch("app.config.config.STT_SERVICE_API_KEY", "fake-key")
+    mocker.patch("app.config.config.STT_SERVICE_API_BASE", None)
+
+    mock_transcription = mocker.patch(
+        "app.etl_pipeline.parsers.audio.atranscription",
+        return_value={"text": "Hello from audio"},
+    )
+
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=str(audio_file), filename="recording.mp3")
+    )
+
+    assert "Hello from audio" in result.markdown_content
+    assert result.etl_service == "AUDIO"
+    assert result.content_type == "audio"
+    mock_transcription.assert_called_once()
+
+
+# ---------------------------------------------------------------------------
+# Slice 7 – DOCLING document parsing
+# ---------------------------------------------------------------------------
+
+
+async def test_extract_pdf_with_docling(tmp_path, mocker):
+    """A .pdf file with ETL_SERVICE=DOCLING returns parsed markdown."""
+    pdf_file = tmp_path / "report.pdf"
+    pdf_file.write_bytes(b"%PDF-1.4 fake")
+
+    mocker.patch("app.config.config.ETL_SERVICE", "DOCLING")
+
+    fake_docling = mocker.AsyncMock()
+    fake_docling.process_document.return_value = {"content": "# Parsed PDF"}
+    mocker.patch(
+        "app.services.docling_service.create_docling_service",
+        return_value=fake_docling,
+    )
+
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=str(pdf_file), filename="report.pdf")
+    )
+
+    assert result.markdown_content == "# Parsed PDF"
+    assert result.etl_service == "DOCLING"
+    assert result.content_type == "document"
+
+
+# ---------------------------------------------------------------------------
+# Slice 8 – UNSTRUCTURED document parsing
+# ---------------------------------------------------------------------------
+
+
+async def test_extract_pdf_with_unstructured(tmp_path, mocker):
+    """A .pdf file with ETL_SERVICE=UNSTRUCTURED returns parsed markdown."""
+    pdf_file = tmp_path / "report.pdf"
+    pdf_file.write_bytes(b"%PDF-1.4 fake")
+
+    mocker.patch("app.config.config.ETL_SERVICE", "UNSTRUCTURED")
+
+    class FakeDoc:
+        def __init__(self, text):
+            self.page_content = text
+
+    fake_loader_instance = mocker.AsyncMock()
+    fake_loader_instance.aload.return_value = [
+        FakeDoc("Page 1 content"),
+        FakeDoc("Page 2 content"),
+    ]
+    mocker.patch(
+        "langchain_unstructured.UnstructuredLoader",
+        return_value=fake_loader_instance,
+    )
+
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=str(pdf_file), filename="report.pdf")
+    )
+
+    assert "Page 1 content" in result.markdown_content
+    assert "Page 2 content" in result.markdown_content
+    assert result.etl_service == "UNSTRUCTURED"
+    assert result.content_type == "document"
+
+
+# ---------------------------------------------------------------------------
+# Slice 9 – LLAMACLOUD document parsing
+# ---------------------------------------------------------------------------
+
+
+async def test_extract_pdf_with_llamacloud(tmp_path, mocker):
+    """A .pdf file with ETL_SERVICE=LLAMACLOUD returns parsed markdown."""
+    pdf_file = tmp_path / "report.pdf"
+    pdf_file.write_bytes(b"%PDF-1.4 fake content " * 10)
+
+    mocker.patch("app.config.config.ETL_SERVICE", "LLAMACLOUD")
+    mocker.patch("app.config.config.LLAMA_CLOUD_API_KEY", "fake-key", create=True)
+
+    class FakeDoc:
+        text = "# LlamaCloud parsed"
+
+    class FakeJobResult:
+        pages = []
+
+        def get_markdown_documents(self, split_by_page=True):
+            return [FakeDoc()]
+
+    fake_parser = mocker.AsyncMock()
+    fake_parser.aparse.return_value = FakeJobResult()
+    mocker.patch(
+        "llama_cloud_services.LlamaParse",
+        return_value=fake_parser,
+    )
+    mocker.patch(
+        "llama_cloud_services.parse.utils.ResultType",
+        mocker.MagicMock(MD="md"),
+    )
+
+    result = await EtlPipelineService().extract(
+        EtlRequest(
+            file_path=str(pdf_file), filename="report.pdf", estimated_pages=5
+        )
+    )
+
+    assert result.markdown_content == "# LlamaCloud parsed"
+    assert result.etl_service == "LLAMACLOUD"
+    assert result.content_type == "document"
+
+
+# ---------------------------------------------------------------------------
+# Slice 10 – unknown extension falls through to document ETL
+# ---------------------------------------------------------------------------
+
+
+async def test_unknown_extension_uses_document_etl(tmp_path, mocker):
+    """An unknown extension (e.g. .docx) falls through to the document ETL path."""
+    docx_file = tmp_path / "doc.docx"
+    docx_file.write_bytes(b"PK fake docx")
+
+    mocker.patch("app.config.config.ETL_SERVICE", "DOCLING")
+
+    fake_docling = mocker.AsyncMock()
+    fake_docling.process_document.return_value = {"content": "Docx content"}
+    mocker.patch(
+        "app.services.docling_service.create_docling_service",
+        return_value=fake_docling,
+    )
+
+    result = await EtlPipelineService().extract(
+        EtlRequest(file_path=str(docx_file), filename="doc.docx")
+    )
+
+    assert result.markdown_content == "Docx content"
+    assert result.content_type == "document"
+
+
+# ---------------------------------------------------------------------------
+# Slice 11 – EtlRequest validation
+# ---------------------------------------------------------------------------
+
+
+def test_etl_request_requires_filename():
+    """EtlRequest rejects an empty filename."""
+    with pytest.raises(Exception):
+        EtlRequest(file_path="/tmp/some.txt", filename="")
+
+
+# ---------------------------------------------------------------------------
+# Slice 12 – unknown ETL_SERVICE raises EtlServiceUnavailableError
+# ---------------------------------------------------------------------------
+
+
+async def test_unknown_etl_service_raises(tmp_path, mocker):
+    """An unknown ETL_SERVICE raises EtlServiceUnavailableError."""
+    from app.etl_pipeline.exceptions import EtlServiceUnavailableError
+
+    pdf_file = tmp_path / "report.pdf"
+    pdf_file.write_bytes(b"%PDF fake")
+
+    mocker.patch("app.config.config.ETL_SERVICE", "NONEXISTENT")
+
+    with pytest.raises(EtlServiceUnavailableError, match="Unknown ETL_SERVICE"):
+        await EtlPipelineService().extract(
+            EtlRequest(file_path=str(pdf_file), filename="report.pdf")
+        )

From c6e94188eb83b8b7989b393ea1fe23756273faf2 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sun, 5 Apr 2026 18:23:32 +0530
Subject: [PATCH 128/202] refactor: remove destructive text classes from
 DocumentNode and enhance CreateSearchSpaceDialog with select-none and
 select-text classes

---
 surfsense_web/components/documents/DocumentNode.tsx         | 2 --
 .../layout/ui/dialogs/CreateSearchSpaceDialog.tsx           | 6 +++---
 2 files changed, 3 insertions(+), 5 deletions(-)

diff --git a/surfsense_web/components/documents/DocumentNode.tsx b/surfsense_web/components/documents/DocumentNode.tsx
index 919f904d4..33ce2bf26 100644
--- a/surfsense_web/components/documents/DocumentNode.tsx
+++ b/surfsense_web/components/documents/DocumentNode.tsx
@@ -260,7 +260,6 @@ export const DocumentNode = React.memo(function DocumentNode({
 								</DropdownMenuItem>
 							)}
 							<DropdownMenuItem
-								className="text-destructive focus:text-destructive"
 								disabled={isProcessing}
 								onClick={() => onDelete(doc)}
 							>
@@ -306,7 +305,6 @@ export const DocumentNode = React.memo(function DocumentNode({
 						</ContextMenuItem>
 					)}
 					<ContextMenuItem
-						className="text-destructive focus:text-destructive"
 						disabled={isProcessing}
 						onClick={() => onDelete(doc)}
 					>
diff --git a/surfsense_web/components/layout/ui/dialogs/CreateSearchSpaceDialog.tsx b/surfsense_web/components/layout/ui/dialogs/CreateSearchSpaceDialog.tsx
index e39bee679..d8ec767d7 100644
--- a/surfsense_web/components/layout/ui/dialogs/CreateSearchSpaceDialog.tsx
+++ b/surfsense_web/components/layout/ui/dialogs/CreateSearchSpaceDialog.tsx
@@ -82,7 +82,7 @@ export function CreateSearchSpaceDialog({ open, onOpenChange }: CreateSearchSpac
 
 	return (
 		<Dialog open={open} onOpenChange={handleOpenChange}>
-			<DialogContent className="max-w-[90vw] sm:max-w-sm p-4 sm:p-5 data-[state=open]:animate-none data-[state=closed]:animate-none">
+			<DialogContent className="max-w-[90vw] sm:max-w-sm p-4 sm:p-5 select-none data-[state=open]:animate-none data-[state=closed]:animate-none">
 				<DialogHeader className="space-y-2 pb-2">
 					<div className="flex items-center gap-2 sm:gap-3">
 						<div className="flex-1 min-w-0">
@@ -107,7 +107,7 @@ export function CreateSearchSpaceDialog({ open, onOpenChange }: CreateSearchSpac
 											placeholder={t("name_placeholder")}
 											{...field}
 											autoFocus
-											className="text-sm h-9 sm:h-10"
+											className="text-sm h-9 sm:h-10 select-text"
 										/>
 									</FormControl>
 									<FormMessage />
@@ -130,7 +130,7 @@ export function CreateSearchSpaceDialog({ open, onOpenChange }: CreateSearchSpac
 										<Input
 											placeholder={t("description_placeholder")}
 											{...field}
-											className="text-sm h-9 sm:h-10"
+											className="text-sm h-9 sm:h-10 select-text"
 										/>
 									</FormControl>
 									<FormMessage />

From 1f162f52c3199bc336ae1a3ba3a981c2f43e66cb Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sun, 5 Apr 2026 22:50:36 +0530
Subject: [PATCH 129/202] feat: add tooltip functionality to DocumentNode for
 title overflow handling and refactor ChatShareButton by removing unnecessary
 Tooltip wrapper

---
 .../components/documents/DocumentNode.tsx     | 25 ++++++++++++++++++-
 .../components/new-chat/chat-share-button.tsx | 25 ++++++++-----------
 2 files changed, 34 insertions(+), 16 deletions(-)

diff --git a/surfsense_web/components/documents/DocumentNode.tsx b/surfsense_web/components/documents/DocumentNode.tsx
index 33ce2bf26..92a211277 100644
--- a/surfsense_web/components/documents/DocumentNode.tsx
+++ b/surfsense_web/components/documents/DocumentNode.tsx
@@ -12,6 +12,7 @@ import {
 	Trash2,
 } from "lucide-react";
 import React, { useCallback, useRef, useState } from "react";
+import { useIsMobile } from "@/hooks/use-mobile";
 import { useDrag } from "react-dnd";
 import { getDocumentTypeIcon } from "@/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentTypeIcon";
 import { ExportContextItems, ExportDropdownItems } from "@/components/shared/ExportMenuItems";
@@ -106,7 +107,10 @@ export const DocumentNode = React.memo(function DocumentNode({
 	const isProcessing = statusState === "pending" || statusState === "processing";
 	const [dropdownOpen, setDropdownOpen] = useState(false);
 	const [exporting, setExporting] = useState<string | null>(null);
+	const [titleTooltipOpen, setTitleTooltipOpen] = useState(false);
 	const rowRef = useRef<HTMLDivElement>(null);
+	const titleRef = useRef<HTMLSpanElement>(null);
+	const isMobile = useIsMobile();
 
 	const handleExport = useCallback(
 		(format: string) => {
@@ -118,6 +122,18 @@ export const DocumentNode = React.memo(function DocumentNode({
 		[doc, onExport]
 	);
 
+	const handleTitleTooltipOpenChange = useCallback(
+		(open: boolean) => {
+			if (isMobile) return;
+			if (open && titleRef.current) {
+				setTitleTooltipOpen(titleRef.current.scrollWidth > titleRef.current.clientWidth);
+			} else {
+				setTitleTooltipOpen(false);
+			}
+		},
+		[isMobile]
+	);
+
 	const attachRef = useCallback(
 		(node: HTMLDivElement | null) => {
 			(rowRef as React.MutableRefObject<HTMLDivElement | null>).current = node;
@@ -197,7 +213,14 @@ export const DocumentNode = React.memo(function DocumentNode({
 						);
 					})()}
 
-					<span className="flex-1 min-w-0 truncate">{doc.title}</span>
+					<Tooltip delayDuration={600} open={titleTooltipOpen} onOpenChange={handleTitleTooltipOpenChange}>
+						<TooltipTrigger asChild>
+							<span ref={titleRef} className="flex-1 min-w-0 truncate">{doc.title}</span>
+						</TooltipTrigger>
+						<TooltipContent side="bottom" className="max-w-xs break-words">
+							{doc.title}
+						</TooltipContent>
+					</Tooltip>
 
 					{getDocumentTypeIcon(
 						doc.document_type as DocumentTypeEnum,
diff --git a/surfsense_web/components/new-chat/chat-share-button.tsx b/surfsense_web/components/new-chat/chat-share-button.tsx
index 82e8c6a78..4fc35aba1 100644
--- a/surfsense_web/components/new-chat/chat-share-button.tsx
+++ b/surfsense_web/components/new-chat/chat-share-button.tsx
@@ -163,21 +163,16 @@ export function ChatShareButton({ thread, onVisibilityChange, className }: ChatS
 			)}
 
 			<Popover open={open} onOpenChange={setOpen}>
-				<Tooltip>
-					<TooltipTrigger asChild>
-						<PopoverTrigger asChild>
-							<Button
-								variant="outline"
-								size="icon"
-								className="h-8 w-8 md:w-auto md:px-3 md:gap-2 relative bg-muted hover:bg-muted/80 border-0 select-none"
-							>
-								<CurrentIcon className="h-4 w-4" />
-								<span className="hidden md:inline text-sm">{buttonLabel}</span>
-							</Button>
-						</PopoverTrigger>
-					</TooltipTrigger>
-					<TooltipContent>Share settings</TooltipContent>
-				</Tooltip>
+				<PopoverTrigger asChild>
+					<Button
+						variant="outline"
+						size="icon"
+						className="h-8 w-8 md:w-auto md:px-3 md:gap-2 relative bg-muted hover:bg-muted/80 border-0 select-none"
+					>
+						<CurrentIcon className="h-4 w-4" />
+						<span className="hidden md:inline text-sm">{buttonLabel}</span>
+					</Button>
+				</PopoverTrigger>
 
 				<PopoverContent
 					className="w-[280px] md:w-[320px] p-0 rounded-lg shadow-lg border-border/60 dark:bg-neutral-900 dark:border dark:border-white/5 select-none"

From c9e5fe9cdb32a456d58af0a665e86d26ffea85aa Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sun, 5 Apr 2026 23:02:17 +0530
Subject: [PATCH 130/202] refactor: update icon usage in CommentActions and
 enhance Tooltip component for mobile responsiveness

---
 .../comment-item/comment-actions.tsx          |   4 +-
 .../components/documents/DocumentNode.tsx     |  20 +--
 .../ui/sidebar/AllPrivateChatsSidebar.tsx     |  36 ++---
 .../ui/sidebar/AllSharedChatsSidebar.tsx      |  36 ++---
 .../layout/ui/sidebar/InboxSidebar.tsx        | 123 ++++++------------
 surfsense_web/components/ui/tooltip.tsx       |  32 ++++-
 6 files changed, 113 insertions(+), 138 deletions(-)

diff --git a/surfsense_web/components/chat-comments/comment-item/comment-actions.tsx b/surfsense_web/components/chat-comments/comment-item/comment-actions.tsx
index 5c0e27779..564a6ba84 100644
--- a/surfsense_web/components/chat-comments/comment-item/comment-actions.tsx
+++ b/surfsense_web/components/chat-comments/comment-item/comment-actions.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { MoreHorizontal, Pencil, Trash2 } from "lucide-react";
+import { MoreHorizontal, PenLine, Trash2 } from "lucide-react";
 import { Button } from "@/components/ui/button";
 import {
 	DropdownMenu,
@@ -29,7 +29,7 @@ export function CommentActions({ canEdit, canDelete, onEdit, onDelete }: Comment
 			<DropdownMenuContent align="end">
 				{canEdit && (
 					<DropdownMenuItem onClick={onEdit}>
-						<Pencil className="mr-2 size-4" />
+						<PenLine className="mr-2 size-4" />
 						Edit
 					</DropdownMenuItem>
 				)}
diff --git a/surfsense_web/components/documents/DocumentNode.tsx b/surfsense_web/components/documents/DocumentNode.tsx
index 92a211277..fe796b5be 100644
--- a/surfsense_web/components/documents/DocumentNode.tsx
+++ b/surfsense_web/components/documents/DocumentNode.tsx
@@ -12,7 +12,6 @@ import {
 	Trash2,
 } from "lucide-react";
 import React, { useCallback, useRef, useState } from "react";
-import { useIsMobile } from "@/hooks/use-mobile";
 import { useDrag } from "react-dnd";
 import { getDocumentTypeIcon } from "@/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentTypeIcon";
 import { ExportContextItems, ExportDropdownItems } from "@/components/shared/ExportMenuItems";
@@ -110,7 +109,6 @@ export const DocumentNode = React.memo(function DocumentNode({
 	const [titleTooltipOpen, setTitleTooltipOpen] = useState(false);
 	const rowRef = useRef<HTMLDivElement>(null);
 	const titleRef = useRef<HTMLSpanElement>(null);
-	const isMobile = useIsMobile();
 
 	const handleExport = useCallback(
 		(format: string) => {
@@ -122,17 +120,13 @@ export const DocumentNode = React.memo(function DocumentNode({
 		[doc, onExport]
 	);
 
-	const handleTitleTooltipOpenChange = useCallback(
-		(open: boolean) => {
-			if (isMobile) return;
-			if (open && titleRef.current) {
-				setTitleTooltipOpen(titleRef.current.scrollWidth > titleRef.current.clientWidth);
-			} else {
-				setTitleTooltipOpen(false);
-			}
-		},
-		[isMobile]
-	);
+	const handleTitleTooltipOpenChange = useCallback((open: boolean) => {
+		if (open && titleRef.current) {
+			setTitleTooltipOpen(titleRef.current.scrollWidth > titleRef.current.clientWidth);
+		} else {
+			setTitleTooltipOpen(false);
+		}
+	}, []);
 
 	const attachRef = useCallback(
 		(node: HTMLDivElement | null) => {
diff --git a/surfsense_web/components/layout/ui/sidebar/AllPrivateChatsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/AllPrivateChatsSidebar.tsx
index 57c011f01..46b03a172 100644
--- a/surfsense_web/components/layout/ui/sidebar/AllPrivateChatsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/AllPrivateChatsSidebar.tsx
@@ -375,24 +375,24 @@ export function AllPrivateChatsSidebarContent({
 											<span className="truncate">{thread.title || "New Chat"}</span>
 										</button>
 									) : (
-										<Tooltip>
-											<TooltipTrigger asChild>
-												<button
-													type="button"
-													onClick={() => handleThreadClick(thread.id)}
-													disabled={isBusy}
-													className="flex items-center gap-2 flex-1 min-w-0 text-left overflow-hidden"
-												>
-													<span className="truncate">{thread.title || "New Chat"}</span>
-												</button>
-											</TooltipTrigger>
-											<TooltipContent side="bottom" align="start">
-												<p>
-													{t("updated") || "Updated"}:{" "}
-													{format(new Date(thread.updatedAt), "MMM d, yyyy 'at' h:mm a")}
-												</p>
-											</TooltipContent>
-										</Tooltip>
+									<Tooltip delayDuration={600}>
+										<TooltipTrigger asChild>
+											<button
+												type="button"
+												onClick={() => handleThreadClick(thread.id)}
+												disabled={isBusy}
+												className="flex items-center gap-2 flex-1 min-w-0 text-left overflow-hidden"
+											>
+												<span className="truncate">{thread.title || "New Chat"}</span>
+											</button>
+										</TooltipTrigger>
+										<TooltipContent side="bottom" align="start">
+											<p>
+												{t("updated") || "Updated"}:{" "}
+												{format(new Date(thread.updatedAt), "MMM d, yyyy 'at' h:mm a")}
+											</p>
+										</TooltipContent>
+									</Tooltip>
 									)}
 
 									<DropdownMenu
diff --git a/surfsense_web/components/layout/ui/sidebar/AllSharedChatsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/AllSharedChatsSidebar.tsx
index 4a59df440..9cc1da1e4 100644
--- a/surfsense_web/components/layout/ui/sidebar/AllSharedChatsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/AllSharedChatsSidebar.tsx
@@ -375,24 +375,24 @@ export function AllSharedChatsSidebarContent({
 											<span className="truncate">{thread.title || "New Chat"}</span>
 										</button>
 									) : (
-										<Tooltip>
-											<TooltipTrigger asChild>
-												<button
-													type="button"
-													onClick={() => handleThreadClick(thread.id)}
-													disabled={isBusy}
-													className="flex items-center gap-2 flex-1 min-w-0 text-left overflow-hidden"
-												>
-													<span className="truncate">{thread.title || "New Chat"}</span>
-												</button>
-											</TooltipTrigger>
-											<TooltipContent side="bottom" align="start">
-												<p>
-													{t("updated") || "Updated"}:{" "}
-													{format(new Date(thread.updatedAt), "MMM d, yyyy 'at' h:mm a")}
-												</p>
-											</TooltipContent>
-										</Tooltip>
+									<Tooltip delayDuration={600}>
+										<TooltipTrigger asChild>
+											<button
+												type="button"
+												onClick={() => handleThreadClick(thread.id)}
+												disabled={isBusy}
+												className="flex items-center gap-2 flex-1 min-w-0 text-left overflow-hidden"
+											>
+												<span className="truncate">{thread.title || "New Chat"}</span>
+											</button>
+										</TooltipTrigger>
+										<TooltipContent side="bottom" align="start">
+											<p>
+												{t("updated") || "Updated"}:{" "}
+												{format(new Date(thread.updatedAt), "MMM d, yyyy 'at' h:mm a")}
+											</p>
+										</TooltipContent>
+									</Tooltip>
 									)}
 
 									<DropdownMenu
diff --git a/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
index 72400a589..51ecedd94 100644
--- a/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
@@ -779,36 +779,23 @@ export function InboxSidebarContent({
 								</DropdownMenuContent>
 							</DropdownMenu>
 						)}
-						{isMobile ? (
-							<Button
-								variant="ghost"
-								size="icon"
-								className="h-7 w-7 rounded-full"
-								onClick={handleMarkAllAsRead}
-								disabled={totalUnreadCount === 0}
-							>
-								<CheckCheck className="h-4 w-4 text-muted-foreground" />
-								<span className="sr-only">{t("mark_all_read") || "Mark all as read"}</span>
-							</Button>
-						) : (
-							<Tooltip>
-								<TooltipTrigger asChild>
-									<Button
-										variant="ghost"
-										size="icon"
-										className="h-7 w-7 rounded-full"
-										onClick={handleMarkAllAsRead}
-										disabled={totalUnreadCount === 0}
-									>
-										<CheckCheck className="h-4 w-4 text-muted-foreground" />
-										<span className="sr-only">{t("mark_all_read") || "Mark all as read"}</span>
-									</Button>
-								</TooltipTrigger>
-								<TooltipContent className="z-80">
-									{t("mark_all_read") || "Mark all as read"}
-								</TooltipContent>
-							</Tooltip>
-						)}
+						<Tooltip>
+							<TooltipTrigger asChild>
+								<Button
+									variant="ghost"
+									size="icon"
+									className="h-7 w-7 rounded-full"
+									onClick={handleMarkAllAsRead}
+									disabled={totalUnreadCount === 0}
+								>
+									<CheckCheck className="h-4 w-4 text-muted-foreground" />
+									<span className="sr-only">{t("mark_all_read") || "Mark all as read"}</span>
+								</Button>
+							</TooltipTrigger>
+							<TooltipContent className="z-80">
+								{t("mark_all_read") || "Mark all as read"}
+							</TooltipContent>
+						</Tooltip>
 					</div>
 				</div>
 
@@ -921,61 +908,27 @@ export function InboxSidebarContent({
 									)}
 									style={{ contentVisibility: "auto", containIntrinsicSize: "0 80px" }}
 								>
-									{isMobile ? (
-										<button
-											type="button"
-											onClick={() => handleItemClick(item)}
-											disabled={isMarkingAsRead}
-											className="flex items-center gap-3 flex-1 min-w-0 text-left overflow-hidden"
-										>
-											<div className="shrink-0">{getStatusIcon(item)}</div>
-											<div className="flex-1 min-w-0 overflow-hidden">
-												<p
-													className={cn(
-														"text-xs font-medium line-clamp-2",
-														!item.read && "font-semibold"
-													)}
-												>
-													{item.title}
-												</p>
-												<p className="text-[11px] text-muted-foreground line-clamp-2 mt-0.5">
-													{convertRenderedToDisplay(item.message)}
-												</p>
-											</div>
-										</button>
-									) : (
-										<Tooltip>
-											<TooltipTrigger asChild>
-												<button
-													type="button"
-													onClick={() => handleItemClick(item)}
-													disabled={isMarkingAsRead}
-													className="flex items-center gap-3 flex-1 min-w-0 text-left overflow-hidden"
-												>
-													<div className="shrink-0">{getStatusIcon(item)}</div>
-													<div className="flex-1 min-w-0 overflow-hidden">
-														<p
-															className={cn(
-																"text-xs font-medium line-clamp-2",
-																!item.read && "font-semibold"
-															)}
-														>
-															{item.title}
-														</p>
-														<p className="text-[11px] text-muted-foreground line-clamp-2 mt-0.5">
-															{convertRenderedToDisplay(item.message)}
-														</p>
-													</div>
-												</button>
-											</TooltipTrigger>
-											<TooltipContent side="bottom" align="start" className="max-w-[250px]">
-												<p className="font-medium">{item.title}</p>
-												<p className="text-muted-foreground mt-1">
-													{convertRenderedToDisplay(item.message)}
-												</p>
-											</TooltipContent>
-										</Tooltip>
-									)}
+									<button
+										type="button"
+										onClick={() => handleItemClick(item)}
+										disabled={isMarkingAsRead}
+										className="flex items-center gap-3 flex-1 min-w-0 text-left overflow-hidden"
+									>
+										<div className="shrink-0">{getStatusIcon(item)}</div>
+										<div className="flex-1 min-w-0 overflow-hidden">
+											<p
+												className={cn(
+													"text-xs font-medium line-clamp-2",
+													!item.read && "font-semibold"
+												)}
+											>
+												{item.title}
+											</p>
+											<p className="text-[11px] text-muted-foreground line-clamp-2 mt-0.5">
+												{convertRenderedToDisplay(item.message)}
+											</p>
+										</div>
+									</button>
 
 									<div className="flex items-center justify-end gap-1.5 shrink-0 w-10">
 										<span className="text-[10px] text-muted-foreground">
diff --git a/surfsense_web/components/ui/tooltip.tsx b/surfsense_web/components/ui/tooltip.tsx
index 2fc85aae4..fb6dd17e7 100644
--- a/surfsense_web/components/ui/tooltip.tsx
+++ b/surfsense_web/components/ui/tooltip.tsx
@@ -2,9 +2,26 @@
 
 import * as TooltipPrimitive from "@radix-ui/react-tooltip";
 import type * as React from "react";
+import { useEffect, useState } from "react";
 
 import { cn } from "@/lib/utils";
 
+const MOBILE_BREAKPOINT = 768;
+
+function useIsTouchDevice() {
+	const [isTouch, setIsTouch] = useState(false);
+
+	useEffect(() => {
+		const mql = window.matchMedia(`(max-width: ${MOBILE_BREAKPOINT - 1}px)`);
+		const update = () => setIsTouch(mql.matches);
+		update();
+		mql.addEventListener("change", update);
+		return () => mql.removeEventListener("change", update);
+	}, []);
+
+	return isTouch;
+}
+
 function TooltipProvider({
 	delayDuration = 0,
 	disableHoverableContent = true,
@@ -20,10 +37,21 @@ function TooltipProvider({
 	);
 }
 
-function Tooltip({ ...props }: React.ComponentProps<typeof TooltipPrimitive.Root>) {
+function Tooltip({
+	open,
+	onOpenChange,
+	...props
+}: React.ComponentProps<typeof TooltipPrimitive.Root>) {
+	const isMobile = useIsTouchDevice();
+
 	return (
 		<TooltipProvider>
-			<TooltipPrimitive.Root data-slot="tooltip" {...props} />
+			<TooltipPrimitive.Root
+				data-slot="tooltip"
+				open={isMobile ? false : open}
+				onOpenChange={isMobile ? undefined : onOpenChange}
+				{...props}
+			/>
 		</TooltipProvider>
 	);
 }

From 7fa1810d5061ef7ad5896e69c1cd4bbdbfc90c59 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Sun, 5 Apr 2026 23:14:54 +0530
Subject: [PATCH 131/202] refactor: simplify CommentComposer button layout and
 update placeholder text in CommentItem

---
 .../comment-composer/comment-composer.tsx     | 26 ++++++++-----------
 .../comment-item/comment-actions.tsx          |  4 +--
 .../comment-item/comment-item.tsx             |  2 +-
 3 files changed, 14 insertions(+), 18 deletions(-)

diff --git a/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx b/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx
index 3d6ea384b..e14022f5c 100644
--- a/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx
+++ b/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { ArrowUp, Send, X } from "lucide-react";
+import { ArrowUp } from "lucide-react";
 import { useCallback, useEffect, useRef, useState } from "react";
 import { Button } from "@/components/ui/button";
 import { Popover, PopoverAnchor, PopoverContent } from "@/components/ui/popover";
@@ -300,16 +300,15 @@ export function CommentComposer({
 
 			<div className={cn("flex items-center gap-2", !compact && "justify-end")}>
 				{onCancel && (
-					<Button
-						type="button"
-						variant="ghost"
-						size="sm"
-						onClick={onCancel}
-						disabled={isSubmitting}
-					>
-						<X className="mr-1 size-4" />
-						Cancel
-					</Button>
+				<Button
+					type="button"
+					variant="ghost"
+					size="sm"
+					onClick={onCancel}
+					disabled={isSubmitting}
+				>
+					Cancel
+				</Button>
 				)}
 				<Button
 					type="button"
@@ -321,10 +320,7 @@ export function CommentComposer({
 					{compact ? (
 						<ArrowUp className="size-4" />
 					) : (
-						<>
-							<Send className="mr-1 size-4" />
-							{submitLabel}
-						</>
+						submitLabel
 					)}
 				</Button>
 			</div>
diff --git a/surfsense_web/components/chat-comments/comment-item/comment-actions.tsx b/surfsense_web/components/chat-comments/comment-item/comment-actions.tsx
index 564a6ba84..9638ac01c 100644
--- a/surfsense_web/components/chat-comments/comment-item/comment-actions.tsx
+++ b/surfsense_web/components/chat-comments/comment-item/comment-actions.tsx
@@ -21,9 +21,9 @@ export function CommentActions({ canEdit, canDelete, onEdit, onDelete }: Comment
 				<Button
 					variant="ghost"
 					size="icon"
-					className="size-7 opacity-100 md:opacity-0 md:group-hover:opacity-100 transition-opacity"
+					className="size-7 text-muted-foreground opacity-100 md:opacity-0 md:group-hover:opacity-100 transition-opacity"
 				>
-					<MoreHorizontal className="size-4 text-muted-foreground" />
+					<MoreHorizontal className="size-4" />
 				</Button>
 			</DropdownMenuTrigger>
 			<DropdownMenuContent align="end">
diff --git a/surfsense_web/components/chat-comments/comment-item/comment-item.tsx b/surfsense_web/components/chat-comments/comment-item/comment-item.tsx
index 4996fe01b..eb374ba49 100644
--- a/surfsense_web/components/chat-comments/comment-item/comment-item.tsx
+++ b/surfsense_web/components/chat-comments/comment-item/comment-item.tsx
@@ -198,7 +198,7 @@ export function CommentItem({
 						<CommentComposer
 							members={members}
 							membersLoading={membersLoading}
-							placeholder="Edit your comment..."
+							placeholder="Edit your comment"
 							submitLabel="Save"
 							isSubmitting={isSubmitting}
 							onSubmit={handleEditSubmit}

From 742548847a520204ec9dcdaa95b25c26336501f5 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Mon, 6 Apr 2026 12:14:17 +0530
Subject: [PATCH 132/202] refactor: optimize navigation items in
 LayoutDataProvider, enhance button layout in InboxSidebar with tooltip
 support, full width in PageUsageDisplay

---
 .../assistant-ui/connector-popup.tsx          |  2 +-
 .../assistant-ui/document-upload-popup.tsx    |  2 +-
 .../layout/providers/LayoutDataProvider.tsx   | 52 +++++++------
 .../layout/ui/right-panel/RightPanel.tsx      |  2 +-
 .../layout/ui/sidebar/InboxSidebar.tsx        | 76 ++++++++++++++-----
 .../layout/ui/sidebar/PageUsageDisplay.tsx    |  4 +-
 6 files changed, 87 insertions(+), 51 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/connector-popup.tsx b/surfsense_web/components/assistant-ui/connector-popup.tsx
index fe7b29f28..c41e986d4 100644
--- a/surfsense_web/components/assistant-ui/connector-popup.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup.tsx
@@ -216,7 +216,7 @@ export const ConnectorIndicator = forwardRef<ConnectorIndicatorHandle, Connector
 					onPointerDownOutside={(e) => {
 						if (pickerOpen) e.preventDefault();
 					}}
-					className="max-w-3xl w-[95vw] sm:w-full h-[75vh] sm:h-[85vh] flex flex-col p-0 gap-0 overflow-hidden border border-border ring-0 dark:ring-0 bg-muted dark:bg-muted text-foreground [&>button]:right-4 sm:[&>button]:right-12 [&>button]:top-6 sm:[&>button]:top-10 [&>button]:opacity-80 hover:[&>button]:opacity-100 [&>button_svg]:size-5 select-none"
+					className="max-w-3xl w-[95vw] sm:w-full h-[75vh] sm:h-[85vh] flex flex-col p-0 gap-0 overflow-hidden border border-border ring-0 dark:ring-0 bg-muted dark:bg-muted text-foreground [&>button]:right-4 sm:[&>button]:right-12 [&>button]:top-6 sm:[&>button]:top-10 [&>button]:opacity-80 [&>button]:hover:opacity-100 [&>button]:hover:bg-foreground/10 [&>button>svg]:size-5 select-none"
 				>
 					<DialogTitle className="sr-only">Manage Connectors</DialogTitle>
 					{/* YouTube Crawler View - shown when adding YouTube videos */}
diff --git a/surfsense_web/components/assistant-ui/document-upload-popup.tsx b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
index 59d73e651..fdd4131e5 100644
--- a/surfsense_web/components/assistant-ui/document-upload-popup.tsx
+++ b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
@@ -125,7 +125,7 @@ const DocumentUploadPopupContent: FC<{
 				onPointerDownOutside={(e) => e.preventDefault()}
 				onInteractOutside={(e) => e.preventDefault()}
 				onEscapeKeyDown={(e) => e.preventDefault()}
-				className="select-none max-w-2xl w-[95vw] sm:w-[640px] h-[min(440px,75dvh)] sm:h-[min(500px,80vh)] flex flex-col p-0 gap-0 overflow-hidden border border-border ring-0 bg-muted dark:bg-muted text-foreground [&>button]:right-3 sm:[&>button]:right-6 [&>button]:top-3 sm:[&>button]:top-5 [&>button]:opacity-80 hover:[&>button]:opacity-100 [&>button]:z-[100] [&>button_svg]:size-4 sm:[&>button_svg]:size-5"
+				className="select-none max-w-2xl w-[95vw] sm:w-[640px] h-[min(440px,75dvh)] sm:h-[min(500px,80vh)] flex flex-col p-0 gap-0 overflow-hidden border border-border ring-0 bg-muted dark:bg-muted text-foreground [&>button]:right-3 sm:[&>button]:right-6 [&>button]:top-3 sm:[&>button]:top-5 [&>button]:opacity-80 [&>button]:hover:opacity-100 [&>button]:hover:bg-foreground/10 [&>button]:z-[100] [&>button>svg]:size-4 sm:[&>button>svg]:size-5"
 			>
 				<DialogTitle className="sr-only">Upload Document</DialogTitle>
 
diff --git a/surfsense_web/components/layout/providers/LayoutDataProvider.tsx b/surfsense_web/components/layout/providers/LayoutDataProvider.tsx
index 6138b67fb..74c3c64de 100644
--- a/surfsense_web/components/layout/providers/LayoutDataProvider.tsx
+++ b/surfsense_web/components/layout/providers/LayoutDataProvider.tsx
@@ -347,35 +347,37 @@ export function LayoutDataProvider({ searchSpaceId, children }: LayoutDataProvid
 
 	// Navigation items
 	const navItems: NavItem[] = useMemo(
-		() => [
-			{
-				title: "Inbox",
-				url: "#inbox",
-				icon: Inbox,
-				isActive: isInboxSidebarOpen,
-				badge: totalUnreadCount > 0 ? formatInboxCount(totalUnreadCount) : undefined,
-			},
-			{
-				title: "Documents",
-				url: "#documents",
-				icon: SquareLibrary,
-				isActive: isMobile
-					? isDocumentsSidebarOpen
-					: isDocumentsSidebarOpen && !isRightPanelCollapsed,
-			},
-			{
-				title: "Announcements",
-				url: "#announcements",
-				icon: Megaphone,
-				isActive: isAnnouncementsSidebarOpen,
-				badge: announcementUnreadCount > 0 ? formatInboxCount(announcementUnreadCount) : undefined,
-			},
-		],
+		() =>
+			(
+				[
+					{
+						title: "Inbox",
+						url: "#inbox",
+						icon: Inbox,
+						isActive: isInboxSidebarOpen,
+						badge: totalUnreadCount > 0 ? formatInboxCount(totalUnreadCount) : undefined,
+					},
+					isMobile
+						? {
+								title: "Documents",
+								url: "#documents",
+								icon: SquareLibrary,
+								isActive: isDocumentsSidebarOpen,
+							}
+						: null,
+					{
+						title: "Announcements",
+						url: "#announcements",
+						icon: Megaphone,
+						isActive: isAnnouncementsSidebarOpen,
+						badge: announcementUnreadCount > 0 ? formatInboxCount(announcementUnreadCount) : undefined,
+					},
+				] as (NavItem | null)[]
+			).filter((item): item is NavItem => item !== null),
 		[
 			isMobile,
 			isInboxSidebarOpen,
 			isDocumentsSidebarOpen,
-			isRightPanelCollapsed,
 			totalUnreadCount,
 			isAnnouncementsSidebarOpen,
 			announcementUnreadCount,
diff --git a/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx b/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx
index 717f5a459..59683b6dc 100644
--- a/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx
+++ b/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx
@@ -78,7 +78,7 @@ export function RightPanelExpandButton() {
 	if (!collapsed || !hasContent) return null;
 
 	return (
-		<div className="flex shrink-0 items-center px-1">
+		<div className="flex shrink-0 items-center px-0.5">
 			<Tooltip>
 				<TooltipTrigger asChild>
 					<Button
diff --git a/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
index 51ecedd94..0b8953ae0 100644
--- a/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/InboxSidebar.tsx
@@ -908,27 +908,61 @@ export function InboxSidebarContent({
 									)}
 									style={{ contentVisibility: "auto", containIntrinsicSize: "0 80px" }}
 								>
-									<button
-										type="button"
-										onClick={() => handleItemClick(item)}
-										disabled={isMarkingAsRead}
-										className="flex items-center gap-3 flex-1 min-w-0 text-left overflow-hidden"
-									>
-										<div className="shrink-0">{getStatusIcon(item)}</div>
-										<div className="flex-1 min-w-0 overflow-hidden">
-											<p
-												className={cn(
-													"text-xs font-medium line-clamp-2",
-													!item.read && "font-semibold"
-												)}
-											>
-												{item.title}
-											</p>
-											<p className="text-[11px] text-muted-foreground line-clamp-2 mt-0.5">
-												{convertRenderedToDisplay(item.message)}
-											</p>
-										</div>
-									</button>
+									{activeTab === "status" ? (
+										<Tooltip delayDuration={600}>
+											<TooltipTrigger asChild>
+												<button
+													type="button"
+													onClick={() => handleItemClick(item)}
+													disabled={isMarkingAsRead}
+													className="flex items-center gap-3 flex-1 min-w-0 text-left overflow-hidden"
+												>
+													<div className="shrink-0">{getStatusIcon(item)}</div>
+													<div className="flex-1 min-w-0 overflow-hidden">
+														<p
+															className={cn(
+																"text-xs font-medium line-clamp-2",
+																!item.read && "font-semibold"
+															)}
+														>
+															{item.title}
+														</p>
+														<p className="text-[11px] text-muted-foreground line-clamp-2 mt-0.5">
+															{convertRenderedToDisplay(item.message)}
+														</p>
+													</div>
+												</button>
+											</TooltipTrigger>
+											<TooltipContent side="bottom" align="start" className="max-w-[250px]">
+												<p className="font-medium">{item.title}</p>
+												<p className="text-muted-foreground mt-1">
+													{convertRenderedToDisplay(item.message)}
+												</p>
+											</TooltipContent>
+										</Tooltip>
+									) : (
+										<button
+											type="button"
+											onClick={() => handleItemClick(item)}
+											disabled={isMarkingAsRead}
+											className="flex items-center gap-3 flex-1 min-w-0 text-left overflow-hidden"
+										>
+											<div className="shrink-0">{getStatusIcon(item)}</div>
+											<div className="flex-1 min-w-0 overflow-hidden">
+												<p
+													className={cn(
+														"text-xs font-medium line-clamp-2",
+														!item.read && "font-semibold"
+													)}
+												>
+													{item.title}
+												</p>
+												<p className="text-[11px] text-muted-foreground line-clamp-2 mt-0.5">
+													{convertRenderedToDisplay(item.message)}
+												</p>
+											</div>
+										</button>
+									)}
 
 									<div className="flex items-center justify-end gap-1.5 shrink-0 w-10">
 										<span className="text-[10px] text-muted-foreground">
diff --git a/surfsense_web/components/layout/ui/sidebar/PageUsageDisplay.tsx b/surfsense_web/components/layout/ui/sidebar/PageUsageDisplay.tsx
index 73347e304..7dd46e484 100644
--- a/surfsense_web/components/layout/ui/sidebar/PageUsageDisplay.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/PageUsageDisplay.tsx
@@ -35,7 +35,7 @@ export function PageUsageDisplay({ pagesUsed, pagesLimit }: PageUsageDisplayProp
 				<Progress value={usagePercentage} className="h-1.5" />
 				<Link
 					href={`/dashboard/${searchSpaceId}/more-pages`}
-					className="group flex w-full items-center justify-between rounded-md px-1.5 py-1 -mx-1.5 transition-colors hover:bg-accent"
+					className="group flex w-[calc(100%+0.75rem)] items-center justify-between rounded-md px-1.5 py-1 -mx-1.5 transition-colors hover:bg-accent"
 				>
 					<span className="flex items-center gap-1.5 text-xs text-muted-foreground group-hover:text-accent-foreground">
 						<Zap className="h-3 w-3 shrink-0" />
@@ -48,7 +48,7 @@ export function PageUsageDisplay({ pagesUsed, pagesLimit }: PageUsageDisplayProp
 				{pageBuyingEnabled && (
 					<Link
 						href={`/dashboard/${searchSpaceId}/buy-pages`}
-						className="group flex w-full items-center justify-between rounded-md px-1.5 py-1 -mx-1.5 transition-colors hover:bg-accent"
+						className="group flex w-[calc(100%+0.75rem)] items-center justify-between rounded-md px-1.5 py-1 -mx-1.5 transition-colors hover:bg-accent"
 					>
 						<span className="flex items-center gap-1.5 text-xs text-muted-foreground group-hover:text-accent-foreground">
 							<CreditCard className="h-3 w-3 shrink-0" />

From 46c15c11dadfced3759f3c04afeb4eef41dc482a Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Mon, 6 Apr 2026 12:29:55 +0530
Subject: [PATCH 133/202] refactor: update layout and styling in
 DocumentUploadPopup for improved visual hierarchy and spacing

---
 .../components/assistant-ui/document-upload-popup.tsx     | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/document-upload-popup.tsx b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
index fdd4131e5..7b0409345 100644
--- a/surfsense_web/components/assistant-ui/document-upload-popup.tsx
+++ b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
@@ -125,18 +125,18 @@ const DocumentUploadPopupContent: FC<{
 				onPointerDownOutside={(e) => e.preventDefault()}
 				onInteractOutside={(e) => e.preventDefault()}
 				onEscapeKeyDown={(e) => e.preventDefault()}
-				className="select-none max-w-2xl w-[95vw] sm:w-[640px] h-[min(440px,75dvh)] sm:h-[min(500px,80vh)] flex flex-col p-0 gap-0 overflow-hidden border border-border ring-0 bg-muted dark:bg-muted text-foreground [&>button]:right-3 sm:[&>button]:right-6 [&>button]:top-3 sm:[&>button]:top-5 [&>button]:opacity-80 [&>button]:hover:opacity-100 [&>button]:hover:bg-foreground/10 [&>button]:z-[100] [&>button>svg]:size-4 sm:[&>button>svg]:size-5"
+				className="select-none max-w-2xl w-[95vw] sm:w-[640px] h-[min(440px,75dvh)] sm:h-[min(520px,80vh)] flex flex-col p-0 gap-0 overflow-hidden border border-border ring-0 bg-muted dark:bg-muted text-foreground [&>button]:right-3 sm:[&>button]:right-6 [&>button]:top-5 sm:[&>button]:top-8 [&>button]:opacity-80 [&>button]:hover:opacity-100 [&>button]:hover:bg-foreground/10 [&>button]:z-[100] [&>button>svg]:size-4 sm:[&>button>svg]:size-5"
 			>
 				<DialogTitle className="sr-only">Upload Document</DialogTitle>
 
 				<div className="flex-1 min-h-0 overflow-y-auto overscroll-contain">
-					<div className="sticky top-0 z-20 bg-muted px-4 sm:px-6 pt-4 sm:pt-5 pb-10">
+					<div className="sticky top-0 z-20 bg-muted px-4 sm:px-6 pt-6 sm:pt-8 pb-10">
 						<div className="flex items-center gap-2 mb-1 pr-8 sm:pr-0">
-							<h2 className="text-base sm:text-lg font-semibold tracking-tight">
+							<h2 className="text-xl sm:text-3xl font-semibold tracking-tight">
 								Upload Documents
 							</h2>
 						</div>
-						<p className="text-xs sm:text-sm text-muted-foreground line-clamp-1">
+						<p className="text-xs sm:text-base text-muted-foreground/80 line-clamp-1">
 							Upload and sync your documents to your search space
 						</p>
 					</div>

From 02323e7b55da78c3de0ec71dd20904f6bed49c16 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Mon, 6 Apr 2026 12:56:29 +0530
Subject: [PATCH 134/202] refactor: enhance DocumentsFilters component with
 ToggleGroup for folder creation and improve search functionality

---
 .../(manage)/components/DocumentsFilters.tsx  | 232 +++++++++---------
 .../components/new-chat/model-selector.tsx    |   7 +-
 .../components/shared/image-config-dialog.tsx |   2 +-
 .../components/shared/model-config-dialog.tsx |   2 +-
 4 files changed, 124 insertions(+), 119 deletions(-)

diff --git a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
index b85af13b7..b043c61e9 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
@@ -8,6 +8,7 @@ import { Button } from "@/components/ui/button";
 import { Checkbox } from "@/components/ui/checkbox";
 import { Input } from "@/components/ui/input";
 import { Popover, PopoverContent, PopoverTrigger } from "@/components/ui/popover";
+import { ToggleGroup, ToggleGroupItem } from "@/components/ui/toggle-group";
 import { Tooltip, TooltipContent, TooltipTrigger } from "@/components/ui/tooltip";
 import type { DocumentTypeEnum } from "@/contracts/types/document.types";
 import { getDocumentTypeIcon, getDocumentTypeLabel } from "./DocumentTypeIcon";
@@ -63,109 +64,129 @@ export function DocumentsFilters({
 	return (
 		<div className="flex select-none">
 			<div className="flex items-center gap-2 w-full">
-				{/* Type Filter */}
-				<Popover>
-					<PopoverTrigger asChild>
-						<Button
-							variant="outline"
-							size="icon"
-							className="h-9 w-9 shrink-0 border-dashed border-sidebar-border text-sidebar-foreground/60 hover:text-sidebar-foreground hover:border-sidebar-border bg-sidebar"
-						>
-							<ListFilter size={14} />
-							{activeTypes.length > 0 && (
-								<span className="absolute -top-1 -right-1 flex h-4 w-4 items-center justify-center rounded-full bg-primary text-[9px] font-medium text-primary-foreground">
-									{activeTypes.length}
-								</span>
-							)}
-						</Button>
-					</PopoverTrigger>
-					<PopoverContent className="w-56 md:w-52 !p-0 overflow-hidden" align="end">
-						<div>
-							{/* Search input */}
-							<div className="p-2">
-								<div className="relative">
-									<Search className="absolute left-0.5 top-1/2 -translate-y-1/2 h-4 w-4 text-muted-foreground" />
-									<Input
-										placeholder="Search types"
-										value={typeSearchQuery}
-										onChange={(e) => setTypeSearchQuery(e.target.value)}
-										className="h-6 pl-6 text-sm bg-transparent border-0 shadow-none"
-									/>
-								</div>
-							</div>
+				{/* Filter + New Folder Toggle Group */}
+				<ToggleGroup type="multiple" variant="outline" value={[]}>
+					{onCreateFolder && (
+						<Tooltip>
+							<TooltipTrigger asChild>
+								<ToggleGroupItem
+									value="folder"
+									className="h-9 w-9 shrink-0 border-sidebar-border text-sidebar-foreground/60 hover:text-sidebar-foreground hover:border-sidebar-border bg-sidebar"
+									onClick={(e) => {
+										e.preventDefault();
+										onCreateFolder();
+									}}
+								>
+									<FolderPlus size={14} />
+								</ToggleGroupItem>
+							</TooltipTrigger>
+							<TooltipContent>New folder</TooltipContent>
+						</Tooltip>
+					)}
 
-							<div
-								className="max-h-[300px] overflow-y-auto overflow-x-hidden py-1.5 px-1.5"
-								onScroll={handleScroll}
-								style={{
-									maskImage: `linear-gradient(to bottom, ${scrollPos === "top" ? "black" : "transparent"}, black 16px, black calc(100% - 16px), ${scrollPos === "bottom" ? "black" : "transparent"})`,
-									WebkitMaskImage: `linear-gradient(to bottom, ${scrollPos === "top" ? "black" : "transparent"}, black 16px, black calc(100% - 16px), ${scrollPos === "bottom" ? "black" : "transparent"})`,
-								}}
-							>
-								{filteredTypes.length === 0 ? (
-									<div className="py-6 text-center text-sm text-muted-foreground">
-										No types found
+					<Popover>
+						<Tooltip>
+							<TooltipTrigger asChild>
+								<PopoverTrigger asChild>
+									<ToggleGroupItem
+										value="filter"
+										className="relative h-9 w-9 shrink-0 border-sidebar-border text-sidebar-foreground/60 hover:text-sidebar-foreground hover:border-sidebar-border bg-sidebar"
+									>
+										<ListFilter size={14} />
+										{activeTypes.length > 0 && (
+											<span className="absolute -top-1 -right-1 flex h-4 w-4 items-center justify-center rounded-full bg-primary text-[9px] font-medium text-primary-foreground">
+												{activeTypes.length}
+											</span>
+										)}
+									</ToggleGroupItem>
+								</PopoverTrigger>
+							</TooltipTrigger>
+							<TooltipContent>Filter by type</TooltipContent>
+						</Tooltip>
+						<PopoverContent className="w-56 md:w-52 !p-0 overflow-hidden" align="start">
+							<div>
+								<div className="p-2">
+									<div className="relative">
+										<Search className="absolute left-0.5 top-1/2 -translate-y-1/2 h-4 w-4 text-muted-foreground" />
+										<Input
+											placeholder="Search types"
+											value={typeSearchQuery}
+											onChange={(e) => setTypeSearchQuery(e.target.value)}
+											className="h-6 pl-6 text-sm bg-transparent border-0 shadow-none"
+										/>
 									</div>
-								) : (
-									filteredTypes.map((value: DocumentTypeEnum, i) => (
-										<div
-											role="option"
-											aria-selected={activeTypes.includes(value)}
-											tabIndex={0}
-											key={value}
-											className="flex w-full items-center gap-2.5 py-2 px-3 rounded-md hover:bg-neutral-200 dark:hover:bg-neutral-700 transition-colors cursor-pointer text-left"
-											onClick={() => onToggleType(value, !activeTypes.includes(value))}
-											onKeyDown={(e) => {
-												if (e.key === "Enter" || e.key === " ") {
-													e.preventDefault();
-													onToggleType(value, !activeTypes.includes(value));
-												}
+								</div>
+
+								<div
+									className="max-h-[300px] overflow-y-auto overflow-x-hidden py-1.5 px-1.5"
+									onScroll={handleScroll}
+									style={{
+										maskImage: `linear-gradient(to bottom, ${scrollPos === "top" ? "black" : "transparent"}, black 16px, black calc(100% - 16px), ${scrollPos === "bottom" ? "black" : "transparent"})`,
+										WebkitMaskImage: `linear-gradient(to bottom, ${scrollPos === "top" ? "black" : "transparent"}, black 16px, black calc(100% - 16px), ${scrollPos === "bottom" ? "black" : "transparent"})`,
+									}}
+								>
+									{filteredTypes.length === 0 ? (
+										<div className="py-6 text-center text-sm text-muted-foreground">
+											No types found
+										</div>
+									) : (
+										filteredTypes.map((value: DocumentTypeEnum, i) => (
+											<div
+												role="option"
+												aria-selected={activeTypes.includes(value)}
+												tabIndex={0}
+												key={value}
+												className="flex w-full items-center gap-2.5 py-2 px-3 rounded-md hover:bg-neutral-200 dark:hover:bg-neutral-700 transition-colors cursor-pointer text-left"
+												onClick={() => onToggleType(value, !activeTypes.includes(value))}
+												onKeyDown={(e) => {
+													if (e.key === "Enter" || e.key === " ") {
+														e.preventDefault();
+														onToggleType(value, !activeTypes.includes(value));
+													}
+												}}
+											>
+												<div className="flex h-7 w-7 shrink-0 items-center justify-center rounded-md bg-muted/50 text-foreground/80">
+													{getDocumentTypeIcon(value, "h-4 w-4")}
+												</div>
+												<div className="flex flex-col min-w-0 flex-1 gap-0.5">
+													<span className="text-[13px] font-medium text-foreground truncate leading-tight">
+														{getDocumentTypeLabel(value)}
+													</span>
+													<span className="text-[11px] text-muted-foreground leading-tight">
+														{typeCounts.get(value)} document
+														{(typeCounts.get(value) ?? 0) !== 1 ? "s" : ""}
+													</span>
+												</div>
+												<Checkbox
+													id={`${id}-${i}`}
+													checked={activeTypes.includes(value)}
+													onCheckedChange={(checked: boolean) => onToggleType(value, !!checked)}
+													className="h-4 w-4 shrink-0 rounded border-muted-foreground/30 data-[state=checked]:bg-primary data-[state=checked]:border-primary"
+												/>
+											</div>
+										))
+									)}
+								</div>
+								{activeTypes.length > 0 && (
+									<div className="px-3 pt-1.5 pb-1.5 border-t border-border dark:border-neutral-700">
+										<Button
+											variant="ghost"
+											size="sm"
+											className="w-full h-7 text-[11px] text-muted-foreground hover:text-foreground hover:bg-neutral-200 dark:hover:bg-neutral-700"
+											onClick={() => {
+												activeTypes.forEach((t) => {
+													onToggleType(t, false);
+												});
 											}}
 										>
-											{/* Icon */}
-											<div className="flex h-7 w-7 shrink-0 items-center justify-center rounded-md bg-muted/50 text-foreground/80">
-												{getDocumentTypeIcon(value, "h-4 w-4")}
-											</div>
-											{/* Text content */}
-											<div className="flex flex-col min-w-0 flex-1 gap-0.5">
-												<span className="text-[13px] font-medium text-foreground truncate leading-tight">
-													{getDocumentTypeLabel(value)}
-												</span>
-												<span className="text-[11px] text-muted-foreground leading-tight">
-													{typeCounts.get(value)} document
-													{(typeCounts.get(value) ?? 0) !== 1 ? "s" : ""}
-												</span>
-											</div>
-											{/* Checkbox */}
-											<Checkbox
-												id={`${id}-${i}`}
-												checked={activeTypes.includes(value)}
-												onCheckedChange={(checked: boolean) => onToggleType(value, !!checked)}
-												className="h-4 w-4 shrink-0 rounded border-muted-foreground/30 data-[state=checked]:bg-primary data-[state=checked]:border-primary"
-											/>
-										</div>
-									))
+											Clear filters
+										</Button>
+									</div>
 								)}
 							</div>
-							{activeTypes.length > 0 && (
-								<div className="px-3 pt-1.5 pb-1.5 border-t border-border dark:border-neutral-700">
-									<Button
-										variant="ghost"
-										size="sm"
-										className="w-full h-7 text-[11px] text-muted-foreground hover:text-foreground hover:bg-neutral-200 dark:hover:bg-neutral-700"
-										onClick={() => {
-											activeTypes.forEach((t) => {
-												onToggleType(t, false);
-											});
-										}}
-									>
-										Clear filters
-									</Button>
-								</div>
-							)}
-						</div>
-					</PopoverContent>
-				</Popover>
+						</PopoverContent>
+					</Popover>
+				</ToggleGroup>
 
 				{/* Search Input */}
 				<div className="relative flex-1 min-w-0">
@@ -197,23 +218,6 @@ export function DocumentsFilters({
 					)}
 				</div>
 
-				{/* New Folder Button */}
-				{onCreateFolder && (
-					<Tooltip>
-						<TooltipTrigger asChild>
-							<Button
-								variant="outline"
-								size="icon"
-								className="h-9 w-9 shrink-0 border-dashed border-sidebar-border text-sidebar-foreground/60 hover:text-sidebar-foreground hover:border-sidebar-border bg-sidebar"
-								onClick={onCreateFolder}
-							>
-								<FolderPlus size={14} />
-							</Button>
-						</TooltipTrigger>
-						<TooltipContent>New folder</TooltipContent>
-					</Tooltip>
-				)}
-
 				{/* Upload Button */}
 				<Button
 					data-joyride="upload-button"
diff --git a/surfsense_web/components/new-chat/model-selector.tsx b/surfsense_web/components/new-chat/model-selector.tsx
index b207d82b4..39f88f794 100644
--- a/surfsense_web/components/new-chat/model-selector.tsx
+++ b/surfsense_web/components/new-chat/model-selector.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { useAtomValue } from "jotai";
-import { Bot, Check, ChevronDown, Edit3, ImageIcon, Plus, Zap } from "lucide-react";
+import { Bot, Check, ChevronDown, Edit3, ImageIcon, Plus, Search, Zap } from "lucide-react";
 import { type UIEvent, useCallback, useMemo, useState } from "react";
 import { toast } from "sonner";
 import {
@@ -344,7 +344,7 @@ export function ModelSelector({
 							>
 								<CommandEmpty className="py-8 text-center">
 									<div className="flex flex-col items-center gap-2">
-										<Bot className="size-8 text-muted-foreground" />
+										<Search className="size-8 text-muted-foreground" />
 										<p className="text-sm text-muted-foreground">No models found</p>
 										<p className="text-xs text-muted-foreground/60">Try a different search term</p>
 									</div>
@@ -531,8 +531,9 @@ export function ModelSelector({
 							>
 								<CommandEmpty className="py-8 text-center">
 									<div className="flex flex-col items-center gap-2">
-										<ImageIcon className="size-8 text-muted-foreground" />
+										<Search className="size-8 text-muted-foreground" />
 										<p className="text-sm text-muted-foreground">No image models found</p>
+										<p className="text-xs text-muted-foreground/60">Try a different search term</p>
 									</div>
 								</CommandEmpty>
 
diff --git a/surfsense_web/components/shared/image-config-dialog.tsx b/surfsense_web/components/shared/image-config-dialog.tsx
index 1cfbf8842..2ae53ccca 100644
--- a/surfsense_web/components/shared/image-config-dialog.tsx
+++ b/surfsense_web/components/shared/image-config-dialog.tsx
@@ -433,7 +433,7 @@ export function ImageConfigDialog({
 							className="relative text-sm h-9 min-w-[120px]"
 						>
 							<span className={isSubmitting ? "opacity-0" : ""}>
-								{mode === "edit" ? "Save Changes" : "Create & Use"}
+								{mode === "edit" ? "Save Changes" : "Add Model"}
 							</span>
 							{isSubmitting && <Spinner size="sm" className="absolute" />}
 						</Button>
diff --git a/surfsense_web/components/shared/model-config-dialog.tsx b/surfsense_web/components/shared/model-config-dialog.tsx
index 84ba821fc..4d2373b49 100644
--- a/surfsense_web/components/shared/model-config-dialog.tsx
+++ b/surfsense_web/components/shared/model-config-dialog.tsx
@@ -312,7 +312,7 @@ export function ModelConfigDialog({
 							className="relative text-sm h-9 min-w-[120px]"
 						>
 							<span className={isSubmitting ? "opacity-0" : ""}>
-								{mode === "edit" ? "Save Changes" : "Create & Use"}
+								{mode === "edit" ? "Save Changes" : "Add Model"}
 							</span>
 							{isSubmitting && <Spinner size="sm" className="absolute" />}
 						</Button>

From 8259fab254871b064e37239562fdd1104eb10bd9 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Mon, 6 Apr 2026 13:27:49 +0530
Subject: [PATCH 135/202] refactor: update connector tabs to include search
 feedback and improve icon usage for better user experience

---
 .../connector-popup/tabs/active-connectors-tab.tsx | 14 +++++++++++---
 .../connector-popup/tabs/all-connectors-tab.tsx    | 13 +++++++++++++
 2 files changed, 24 insertions(+), 3 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/connector-popup/tabs/active-connectors-tab.tsx b/surfsense_web/components/assistant-ui/connector-popup/tabs/active-connectors-tab.tsx
index ccf1476dd..55fc99150 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/tabs/active-connectors-tab.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/tabs/active-connectors-tab.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { Cable } from "lucide-react";
+import { Search, Unplug } from "lucide-react";
 import type { FC } from "react";
 import { getDocumentTypeLabel } from "@/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentTypeIcon";
 import { Button } from "@/components/ui/button";
@@ -134,9 +134,17 @@ export const ActiveConnectorsTab: FC<ActiveConnectorsTabProps> = ({
 	const hasActiveConnectors =
 		filteredOAuthConnectorTypes.length > 0 || filteredNonOAuthConnectors.length > 0;
 
+	const hasFilteredResults = hasActiveConnectors || standaloneDocuments.length > 0;
+
 	return (
 		<TabsContent value="active" className="m-0">
-			{hasSources ? (
+			{hasSources && !hasFilteredResults && searchQuery ? (
+				<div className="flex flex-col items-center justify-center py-20 text-center">
+					<Search className="size-8 text-muted-foreground mb-3" />
+					<p className="text-sm text-muted-foreground">No connectors found</p>
+					<p className="text-xs text-muted-foreground/60 mt-1">Try a different search term</p>
+				</div>
+			) : hasSources ? (
 				<div className="space-y-6">
 					{/* Active Connectors Section */}
 					{hasActiveConnectors && (
@@ -302,7 +310,7 @@ export const ActiveConnectorsTab: FC<ActiveConnectorsTabProps> = ({
 			) : (
 				<div className="flex flex-col items-center justify-center py-20 text-center">
 					<div className="flex h-16 w-16 items-center justify-center rounded-full bg-muted mb-4">
-						<Cable className="size-8 text-muted-foreground" />
+						<Unplug className="size-8 text-muted-foreground" />
 					</div>
 					<h4 className="text-lg font-semibold">No active sources</h4>
 					<p className="text-sm text-muted-foreground mt-1 max-w-[280px]">
diff --git a/surfsense_web/components/assistant-ui/connector-popup/tabs/all-connectors-tab.tsx b/surfsense_web/components/assistant-ui/connector-popup/tabs/all-connectors-tab.tsx
index 3e8aad620..0afc192da 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/tabs/all-connectors-tab.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/tabs/all-connectors-tab.tsx
@@ -1,5 +1,6 @@
 "use client";
 
+import { Search } from "lucide-react";
 import type { FC } from "react";
 import { EnumConnectorName } from "@/contracts/enums/connector";
 import type { SearchSourceConnector } from "@/contracts/types/connector.types";
@@ -287,6 +288,18 @@ export const AllConnectorsTab: FC<AllConnectorsTabProps> = ({
 		moreIntegrationsOther.length > 0 ||
 		moreIntegrationsCrawlers.length > 0;
 
+	const hasAnyResults = hasDocumentFileConnectors || hasMoreIntegrations;
+
+	if (!hasAnyResults && searchQuery) {
+		return (
+			<div className="flex flex-col items-center justify-center py-20 text-center">
+				<Search className="size-8 text-muted-foreground mb-3" />
+				<p className="text-sm text-muted-foreground">No connectors found</p>
+				<p className="text-xs text-muted-foreground/60 mt-1">Try a different search term</p>
+			</div>
+		);
+	}
+
 	return (
 		<div className="space-y-8">
 			{/* Document/Files Connectors */}

From 3251f0e98d700373cdefe3eeb03220916ec1d28c Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Mon, 6 Apr 2026 13:56:28 +0530
Subject: [PATCH 136/202] refactor: remove childCount prop from FolderNode and
 optimize FolderTreeView by eliminating unnecessary child count calculations

---
 surfsense_web/components/documents/FolderNode.tsx   |  8 --------
 .../components/documents/FolderTreeView.tsx         | 13 +------------
 .../components/layout/ui/right-panel/RightPanel.tsx |  5 ++---
 3 files changed, 3 insertions(+), 23 deletions(-)

diff --git a/surfsense_web/components/documents/FolderNode.tsx b/surfsense_web/components/documents/FolderNode.tsx
index 88cc76c69..2ec430871 100644
--- a/surfsense_web/components/documents/FolderNode.tsx
+++ b/surfsense_web/components/documents/FolderNode.tsx
@@ -56,7 +56,6 @@ interface FolderNodeProps {
 	depth: number;
 	isExpanded: boolean;
 	isRenaming: boolean;
-	childCount: number;
 	selectionState: FolderSelectionState;
 	processingState: "idle" | "processing" | "failed";
 	onToggleSelect: (folderId: number, selectAll: boolean) => void;
@@ -101,7 +100,6 @@ export const FolderNode = React.memo(function FolderNode({
 	depth,
 	isExpanded,
 	isRenaming,
-	childCount,
 	selectionState,
 	processingState,
 	onToggleSelect,
@@ -336,12 +334,6 @@ export const FolderNode = React.memo(function FolderNode({
 						<span className="flex-1 min-w-0 truncate">{folder.name}</span>
 					)}
 
-					{!isRenaming && childCount > 0 && (
-						<span className="shrink-0 text-[10px] text-muted-foreground tabular-nums">
-							{childCount}
-						</span>
-					)}
-
 					{!isRenaming && (
 						<DropdownMenu>
 							<DropdownMenuTrigger asChild>
diff --git a/surfsense_web/components/documents/FolderTreeView.tsx b/surfsense_web/components/documents/FolderTreeView.tsx
index 1df007c0b..d9c74e0db 100644
--- a/surfsense_web/components/documents/FolderTreeView.tsx
+++ b/surfsense_web/components/documents/FolderTreeView.tsx
@@ -86,16 +86,6 @@ export function FolderTreeView({
 
 	const docsByFolder = useMemo(() => groupBy(documents, (d) => d.folderId ?? "root"), [documents]);
 
-	const folderChildCounts = useMemo(() => {
-		const counts: Record<number, number> = {};
-		for (const f of folders) {
-			const children = foldersByParent[f.id] ?? [];
-			const docs = docsByFolder[f.id] ?? [];
-			counts[f.id] = children.length + docs.length;
-		}
-		return counts;
-	}, [folders, foldersByParent, docsByFolder]);
-
 	const [openContextMenuId, setOpenContextMenuId] = useState<string | null>(null);
 
 	// Single subscription for rename state — derived boolean passed to each FolderNode
@@ -226,8 +216,7 @@ export function FolderTreeView({
 					depth={depth}
 					isExpanded={isExpanded}
 					isRenaming={renamingFolderId === f.id}
-					childCount={folderChildCounts[f.id] ?? 0}
-					selectionState={folderSelectionStates[f.id] ?? "none"}
+				selectionState={folderSelectionStates[f.id] ?? "none"}
 					processingState={folderProcessingStates[f.id] ?? "idle"}
 					onToggleSelect={onToggleFolderSelect}
 					onToggleExpand={onToggleExpand}
diff --git a/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx b/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx
index 59683b6dc..83b7d5d1f 100644
--- a/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx
+++ b/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx
@@ -10,7 +10,6 @@ import { documentsSidebarOpenAtom } from "@/atoms/documents/ui.atoms";
 import { closeEditorPanelAtom, editorPanelAtom } from "@/atoms/editor/editor-panel.atom";
 import { rightPanelCollapsedAtom, rightPanelTabAtom } from "@/atoms/layout/right-panel.atom";
 import { Button } from "@/components/ui/button";
-import { Skeleton } from "@/components/ui/skeleton";
 import { Tooltip, TooltipContent, TooltipTrigger } from "@/components/ui/tooltip";
 import { DocumentsSidebar } from "../sidebar";
 
@@ -27,7 +26,7 @@ const HitlEditPanelContent = dynamic(
 		import("@/components/hitl-edit-panel/hitl-edit-panel").then((m) => ({
 			default: m.HitlEditPanelContent,
 		})),
-	{ ssr: false, loading: () => <Skeleton className="h-96 w-full" /> }
+	{ ssr: false, loading: () => null }
 );
 
 const ReportPanelContent = dynamic(
@@ -35,7 +34,7 @@ const ReportPanelContent = dynamic(
 		import("@/components/report-panel/report-panel").then((m) => ({
 			default: m.ReportPanelContent,
 		})),
-	{ ssr: false, loading: () => <Skeleton className="h-96 w-full" /> }
+	{ ssr: false, loading: () => null }
 );
 
 interface RightPanelProps {

From be7e73e615a850e4adee13aff6d91654abefdf51 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Mon, 6 Apr 2026 14:41:53 +0530
Subject: [PATCH 137/202] refactor: enhance DocumentsFilters and FolderTreeView
 components for improved filter handling and search functionality

---
 .../(manage)/components/DocumentsFilters.tsx  | 22 +++----------------
 .../components/documents/FolderTreeView.tsx   | 17 +++++++++-----
 .../layout/ui/right-panel/RightPanel.tsx      |  2 +-
 .../layout/ui/sidebar/DocumentsSidebar.tsx    |  5 +++--
 .../contracts/enums/connectorIcons.tsx        |  2 +-
 5 files changed, 20 insertions(+), 28 deletions(-)

diff --git a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
index b043c61e9..a795b61c7 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/documents/(manage)/components/DocumentsFilters.tsx
@@ -65,7 +65,7 @@ export function DocumentsFilters({
 		<div className="flex select-none">
 			<div className="flex items-center gap-2 w-full">
 				{/* Filter + New Folder Toggle Group */}
-				<ToggleGroup type="multiple" variant="outline" value={[]}>
+				<ToggleGroup type="multiple" variant="outline" value={[]} className="overflow-visible">
 					{onCreateFolder && (
 						<Tooltip>
 							<TooltipTrigger asChild>
@@ -90,11 +90,11 @@ export function DocumentsFilters({
 								<PopoverTrigger asChild>
 									<ToggleGroupItem
 										value="filter"
-										className="relative h-9 w-9 shrink-0 border-sidebar-border text-sidebar-foreground/60 hover:text-sidebar-foreground hover:border-sidebar-border bg-sidebar"
+										className="relative h-9 w-9 shrink-0 border-sidebar-border text-sidebar-foreground/60 hover:text-sidebar-foreground hover:border-sidebar-border bg-sidebar overflow-visible"
 									>
 										<ListFilter size={14} />
 										{activeTypes.length > 0 && (
-											<span className="absolute -top-1 -right-1 flex h-4 w-4 items-center justify-center rounded-full bg-primary text-[9px] font-medium text-primary-foreground">
+											<span className="absolute -top-1 -right-1 flex h-4 w-4 items-center justify-center rounded-full bg-sidebar-border text-[9px] font-medium text-sidebar-foreground">
 												{activeTypes.length}
 											</span>
 										)}
@@ -167,22 +167,6 @@ export function DocumentsFilters({
 										))
 									)}
 								</div>
-								{activeTypes.length > 0 && (
-									<div className="px-3 pt-1.5 pb-1.5 border-t border-border dark:border-neutral-700">
-										<Button
-											variant="ghost"
-											size="sm"
-											className="w-full h-7 text-[11px] text-muted-foreground hover:text-foreground hover:bg-neutral-200 dark:hover:bg-neutral-700"
-											onClick={() => {
-												activeTypes.forEach((t) => {
-													onToggleType(t, false);
-												});
-											}}
-										>
-											Clear filters
-										</Button>
-									</div>
-								)}
 							</div>
 						</PopoverContent>
 					</Popover>
diff --git a/surfsense_web/components/documents/FolderTreeView.tsx b/surfsense_web/components/documents/FolderTreeView.tsx
index d9c74e0db..371d00f42 100644
--- a/surfsense_web/components/documents/FolderTreeView.tsx
+++ b/surfsense_web/components/documents/FolderTreeView.tsx
@@ -96,14 +96,21 @@ export function FolderTreeView({
 	);
 	const handleCancelRename = useCallback(() => setRenamingFolderId(null), [setRenamingFolderId]);
 
+	const effectiveActiveTypes = useMemo(() => {
+		if (activeTypes.includes("FILE" as DocumentTypeEnum) && !activeTypes.includes("LOCAL_FOLDER_FILE" as DocumentTypeEnum)) {
+			return [...activeTypes, "LOCAL_FOLDER_FILE" as DocumentTypeEnum];
+		}
+		return activeTypes;
+	}, [activeTypes]);
+
 	const hasDescendantMatch = useMemo(() => {
-		if (activeTypes.length === 0 && !searchQuery) return null;
+		if (effectiveActiveTypes.length === 0 && !searchQuery) return null;
 		const match: Record<number, boolean> = {};
 
 		function check(folderId: number): boolean {
 			if (match[folderId] !== undefined) return match[folderId];
 			const childDocs = (docsByFolder[folderId] ?? []).some(
-				(d) => activeTypes.length === 0 || activeTypes.includes(d.document_type as DocumentTypeEnum)
+				(d) => effectiveActiveTypes.length === 0 || effectiveActiveTypes.includes(d.document_type as DocumentTypeEnum)
 			);
 			if (childDocs) {
 				match[folderId] = true;
@@ -124,7 +131,7 @@ export function FolderTreeView({
 			check(f.id);
 		}
 		return match;
-	}, [folders, docsByFolder, foldersByParent, activeTypes, searchQuery]);
+	}, [folders, docsByFolder, foldersByParent, effectiveActiveTypes, searchQuery]);
 
 	const folderSelectionStates = useMemo(() => {
 		const states: Record<number, FolderSelectionState> = {};
@@ -194,7 +201,7 @@ export function FolderTreeView({
 			? childFolders.filter((f) => hasDescendantMatch[f.id])
 			: childFolders;
 		const childDocs = (docsByFolder[key] ?? []).filter(
-			(d) => activeTypes.length === 0 || activeTypes.includes(d.document_type as DocumentTypeEnum)
+			(d) => effectiveActiveTypes.length === 0 || effectiveActiveTypes.includes(d.document_type as DocumentTypeEnum)
 		);
 
 		const nodes: React.ReactNode[] = [];
@@ -278,7 +285,7 @@ export function FolderTreeView({
 		);
 	}
 
-	if (treeNodes.length === 0 && (activeTypes.length > 0 || searchQuery)) {
+	if (treeNodes.length === 0 && (effectiveActiveTypes.length > 0 || searchQuery)) {
 		return (
 			<div className="flex flex-1 flex-col items-center justify-center gap-3 px-4 py-12 text-muted-foreground">
 				<Search className="h-10 w-10" />
diff --git a/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx b/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx
index 83b7d5d1f..febae35d3 100644
--- a/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx
+++ b/surfsense_web/components/layout/ui/right-panel/RightPanel.tsx
@@ -84,7 +84,7 @@ export function RightPanelExpandButton() {
 						variant="ghost"
 						size="icon"
 						onClick={() => startTransition(() => setCollapsed(false))}
-						className="h-7 w-7 shrink-0"
+						className="h-8 w-8 shrink-0 -m-0.5"
 					>
 						<PanelRight className="h-4 w-4" />
 						<span className="sr-only">Expand panel</span>
diff --git a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
index aa409e179..8bd7d64ea 100644
--- a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
@@ -531,7 +531,8 @@ export function DocumentsSidebar({
 	const typeCounts = useMemo(() => {
 		const counts: Partial<Record<string, number>> = {};
 		for (const d of treeDocuments) {
-			counts[d.document_type] = (counts[d.document_type] || 0) + 1;
+			const displayType = d.document_type === "LOCAL_FOLDER_FILE" ? "FILE" : d.document_type;
+			counts[displayType] = (counts[displayType] || 0) + 1;
 		}
 		return counts;
 	}, [treeDocuments]);
@@ -746,7 +747,7 @@ export function DocumentsSidebar({
 				</button>
 			</div>
 
-			<div className="flex-1 min-h-0 overflow-x-hidden pt-0 flex flex-col">
+			<div className="flex-1 min-h-0 pt-0 flex flex-col">
 				<div className="px-4 pb-2">
 					<DocumentsFilters
 						typeCounts={typeCounts}
diff --git a/surfsense_web/contracts/enums/connectorIcons.tsx b/surfsense_web/contracts/enums/connectorIcons.tsx
index ab71d58b5..1c6745db5 100644
--- a/surfsense_web/contracts/enums/connectorIcons.tsx
+++ b/surfsense_web/contracts/enums/connectorIcons.tsx
@@ -127,7 +127,7 @@ export const getConnectorIcon = (connectorType: EnumConnectorName | string, clas
 		case "DEEPEST":
 			return <Telescope {...iconProps} />;
 		case "LOCAL_FOLDER_FILE":
-			return null;
+			return <File {...iconProps} />;
 		default:
 			return <Search {...iconProps} />;
 	}

From be622c417c8b8235c1e46dea41cc8dced53f4159 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Mon, 6 Apr 2026 17:07:26 +0530
Subject: [PATCH 138/202] refactor: update loading skeleton in PlateEditor and
 clean up dark mode styles in various components

---
 surfsense_web/components/editor-panel/editor-panel.tsx   | 3 +--
 surfsense_web/components/ui/floating-toolbar.tsx         | 2 +-
 surfsense_web/components/ui/insert-toolbar-button.tsx    | 2 +-
 surfsense_web/components/ui/slash-node.tsx               | 2 +-
 surfsense_web/components/ui/turn-into-toolbar-button.tsx | 2 +-
 5 files changed, 5 insertions(+), 6 deletions(-)

diff --git a/surfsense_web/components/editor-panel/editor-panel.tsx b/surfsense_web/components/editor-panel/editor-panel.tsx
index 05bcd2dc0..d4c64570a 100644
--- a/surfsense_web/components/editor-panel/editor-panel.tsx
+++ b/surfsense_web/components/editor-panel/editor-panel.tsx
@@ -11,13 +11,12 @@ import { MarkdownViewer } from "@/components/markdown-viewer";
 import { Alert, AlertDescription } from "@/components/ui/alert";
 import { Button } from "@/components/ui/button";
 import { Drawer, DrawerContent, DrawerHandle, DrawerTitle } from "@/components/ui/drawer";
-import { Skeleton } from "@/components/ui/skeleton";
 import { useMediaQuery } from "@/hooks/use-media-query";
 import { authenticatedFetch, getBearerToken, redirectToLogin } from "@/lib/auth-utils";
 
 const PlateEditor = dynamic(
 	() => import("@/components/editor/plate-editor").then((m) => ({ default: m.PlateEditor })),
-	{ ssr: false, loading: () => <Skeleton className="h-64 w-full" /> }
+	{ ssr: false, loading: () => <EditorPanelSkeleton /> }
 );
 
 const LARGE_DOCUMENT_THRESHOLD = 2 * 1024 * 1024; // 2MB
diff --git a/surfsense_web/components/ui/floating-toolbar.tsx b/surfsense_web/components/ui/floating-toolbar.tsx
index 843e5ecc1..634919474 100644
--- a/surfsense_web/components/ui/floating-toolbar.tsx
+++ b/surfsense_web/components/ui/floating-toolbar.tsx
@@ -65,7 +65,7 @@ export function FloatingToolbar({
 				{...rootProps}
 				ref={ref}
 				className={cn(
-					"scrollbar-hide absolute z-50 overflow-x-auto whitespace-nowrap rounded-md border bg-popover p-1 opacity-100 shadow-md print:hidden dark:bg-neutral-900 dark:border-white/5",
+					"scrollbar-hide absolute z-50 overflow-x-auto whitespace-nowrap rounded-md border bg-popover p-1 opacity-100 shadow-md print:hidden",
 					"max-w-[80vw]",
 					className
 				)}
diff --git a/surfsense_web/components/ui/insert-toolbar-button.tsx b/surfsense_web/components/ui/insert-toolbar-button.tsx
index 1a64f3759..596557aa7 100644
--- a/surfsense_web/components/ui/insert-toolbar-button.tsx
+++ b/surfsense_web/components/ui/insert-toolbar-button.tsx
@@ -189,7 +189,7 @@ export function InsertToolbarButton(props: DropdownMenuProps) {
 			</DropdownMenuTrigger>
 
 			<DropdownMenuContent
-				className="z-[100] flex max-h-[60vh] min-w-0 flex-col overflow-y-auto dark:bg-neutral-900 dark:border dark:border-white/5"
+				className="z-[100] flex max-h-[60vh] min-w-0 flex-col overflow-y-auto"
 				align="start"
 			>
 				{groups.map(({ group, items }) => (
diff --git a/surfsense_web/components/ui/slash-node.tsx b/surfsense_web/components/ui/slash-node.tsx
index d5687efcc..b3fc6f8d6 100644
--- a/surfsense_web/components/ui/slash-node.tsx
+++ b/surfsense_web/components/ui/slash-node.tsx
@@ -176,7 +176,7 @@ export function SlashInputElement({ children, ...props }: PlateElementProps) {
 			<InlineCombobox element={props.element} trigger="/">
 				<InlineComboboxInput />
 
-				<InlineComboboxContent className="dark:bg-neutral-900 dark:border dark:border-white/5">
+				<InlineComboboxContent>
 					<InlineComboboxEmpty>No results found.</InlineComboboxEmpty>
 
 					{slashCommandGroups.map(({ heading, items }) => (
diff --git a/surfsense_web/components/ui/turn-into-toolbar-button.tsx b/surfsense_web/components/ui/turn-into-toolbar-button.tsx
index 64ae5e82e..aa58eef41 100644
--- a/surfsense_web/components/ui/turn-into-toolbar-button.tsx
+++ b/surfsense_web/components/ui/turn-into-toolbar-button.tsx
@@ -150,7 +150,7 @@ export function TurnIntoToolbarButton({
 			</DropdownMenuTrigger>
 
 			<DropdownMenuContent
-				className="z-[100] ignore-click-outside/toolbar min-w-0 max-h-[60vh] overflow-y-auto dark:bg-neutral-900 dark:border dark:border-white/5"
+				className="z-[100] ignore-click-outside/toolbar min-w-0 max-h-[60vh] overflow-y-auto"
 				onCloseAutoFocus={(e) => {
 					e.preventDefault();
 					editor.tf.focus();

From b5a15b7681b05ed1d17b7a34ae2c2769caaed4c9 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Mon, 6 Apr 2026 18:36:29 +0530
Subject: [PATCH 139/202] feat: implement cursor-based delta sync for Dropbox
 integration, enhancing file indexing efficiency and preserving folder cursors
 during re-authentication

---
 .../app/connectors/dropbox/client.py          |  49 +++++
 .../app/connectors/dropbox/file_types.py      |  19 +-
 .../app/routes/dropbox_add_connector_route.py |   2 +
 .../app/services/docling_service.py           |   5 +-
 .../connector_indexers/dropbox_indexer.py     | 192 ++++++++++++++++--
 5 files changed, 249 insertions(+), 18 deletions(-)

diff --git a/surfsense_backend/app/connectors/dropbox/client.py b/surfsense_backend/app/connectors/dropbox/client.py
index dfae38f66..b177c2f8d 100644
--- a/surfsense_backend/app/connectors/dropbox/client.py
+++ b/surfsense_backend/app/connectors/dropbox/client.py
@@ -225,6 +225,55 @@ class DropboxClient:
 
         return all_items, None
 
+    async def get_latest_cursor(
+        self, path: str = ""
+    ) -> tuple[str | None, str | None]:
+        """Get a cursor representing the current state of a folder.
+
+        Uses /2/files/list_folder/get_latest_cursor so we can later call
+        get_changes to receive only incremental updates.
+        """
+        resp = await self._request(
+            "/2/files/list_folder/get_latest_cursor",
+            {"path": path, "recursive": False, "include_non_downloadable_files": True},
+        )
+        if resp.status_code != 200:
+            return None, f"Failed to get cursor: {resp.status_code} - {resp.text}"
+        return resp.json().get("cursor"), None
+
+    async def get_changes(
+        self, cursor: str
+    ) -> tuple[list[dict[str, Any]], str | None, str | None]:
+        """Fetch incremental changes since the given cursor.
+
+        Calls /2/files/list_folder/continue and handles pagination.
+        Returns (entries, new_cursor, error).
+        """
+        all_entries: list[dict[str, Any]] = []
+
+        resp = await self._request(
+            "/2/files/list_folder/continue", {"cursor": cursor}
+        )
+        if resp.status_code == 401:
+            return [], None, "Dropbox authentication expired (401)"
+        if resp.status_code != 200:
+            return [], None, f"Failed to get changes: {resp.status_code} - {resp.text}"
+
+        data = resp.json()
+        all_entries.extend(data.get("entries", []))
+
+        while data.get("has_more"):
+            cursor = data["cursor"]
+            resp = await self._request(
+                "/2/files/list_folder/continue", {"cursor": cursor}
+            )
+            if resp.status_code != 200:
+                return all_entries, data.get("cursor"), f"Pagination failed: {resp.status_code}"
+            data = resp.json()
+            all_entries.extend(data.get("entries", []))
+
+        return all_entries, data.get("cursor"), None
+
     async def get_metadata(self, path: str) -> tuple[dict[str, Any] | None, str | None]:
         resp = await self._request("/2/files/get_metadata", {"path": path})
         if resp.status_code != 200:
diff --git a/surfsense_backend/app/connectors/dropbox/file_types.py b/surfsense_backend/app/connectors/dropbox/file_types.py
index e6d772a1c..c245e039e 100644
--- a/surfsense_backend/app/connectors/dropbox/file_types.py
+++ b/surfsense_backend/app/connectors/dropbox/file_types.py
@@ -2,7 +2,24 @@
 
 PAPER_EXTENSION = ".paper"
 
-SKIP_EXTENSIONS: frozenset[str] = frozenset()
+SKIP_EXTENSIONS: frozenset[str] = frozenset({
+    # Non-universal images (not supported by all 3 ETL pipelines)
+    ".svg", ".gif", ".webp", ".heic", ".ico",
+    ".raw", ".cr2", ".nef", ".arw", ".dng",
+    ".psd", ".ai", ".sketch", ".fig",
+    # Video
+    ".mov", ".avi", ".mkv", ".wmv", ".flv",
+    # Binaries / executables
+    ".exe", ".dll", ".so", ".dylib", ".bin", ".app", ".dmg", ".iso",
+    # Archives
+    ".zip", ".tar", ".gz", ".rar", ".7z", ".bz2",
+    # Fonts
+    ".ttf", ".otf", ".woff", ".woff2",
+    # 3D / CAD
+    ".stl", ".obj", ".fbx", ".blend",
+    # Database
+    ".db", ".sqlite", ".mdb",
+})
 
 MIME_TO_EXTENSION: dict[str, str] = {
     "application/pdf": ".pdf",
diff --git a/surfsense_backend/app/routes/dropbox_add_connector_route.py b/surfsense_backend/app/routes/dropbox_add_connector_route.py
index 941e5c00f..1dba64467 100644
--- a/surfsense_backend/app/routes/dropbox_add_connector_route.py
+++ b/surfsense_backend/app/routes/dropbox_add_connector_route.py
@@ -311,9 +311,11 @@ async def dropbox_callback(
                 )
 
             existing_cursor = db_connector.config.get("cursor")
+            existing_folder_cursors = db_connector.config.get("folder_cursors")
             db_connector.config = {
                 **connector_config,
                 "cursor": existing_cursor,
+                "folder_cursors": existing_folder_cursors,
                 "auth_expired": False,
             }
             flag_modified(db_connector, "config")
diff --git a/surfsense_backend/app/services/docling_service.py b/surfsense_backend/app/services/docling_service.py
index 82eaf7f74..360c197ed 100644
--- a/surfsense_backend/app/services/docling_service.py
+++ b/surfsense_backend/app/services/docling_service.py
@@ -111,9 +111,10 @@ class DoclingService:
                 pipeline_options=pipeline_options, backend=PyPdfiumDocumentBackend
             )
 
-            # Initialize DocumentConverter
+            # Initialize DocumentConverter with PDF and IMAGE support
             self.converter = DocumentConverter(
-                format_options={InputFormat.PDF: pdf_format_option}
+                allowed_formats=[InputFormat.PDF, InputFormat.IMAGE],
+                format_options={InputFormat.PDF: pdf_format_option},
             )
 
             acceleration_type = "GPU (WSL2)" if self.use_gpu else "CPU"
diff --git a/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py b/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
index 1b039add7..7a2f82a78 100644
--- a/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
@@ -250,6 +250,124 @@ async def _download_and_index(
     return batch_indexed, download_failed + batch_failed
 
 
+async def _remove_document(
+    session: AsyncSession, file_id: str, search_space_id: int
+):
+    """Remove a document that was deleted in Dropbox."""
+    primary_hash = compute_identifier_hash(
+        DocumentType.DROPBOX_FILE.value, file_id, search_space_id
+    )
+    existing = await check_document_by_unique_identifier(session, primary_hash)
+
+    if not existing:
+        result = await session.execute(
+            select(Document).where(
+                Document.search_space_id == search_space_id,
+                Document.document_type == DocumentType.DROPBOX_FILE,
+                cast(Document.document_metadata["dropbox_file_id"], String)
+                == file_id,
+            )
+        )
+        existing = result.scalar_one_or_none()
+
+    if existing:
+        await session.delete(existing)
+
+
+async def _index_with_delta_sync(
+    dropbox_client: DropboxClient,
+    session: AsyncSession,
+    connector_id: int,
+    search_space_id: int,
+    user_id: str,
+    cursor: str,
+    task_logger: TaskLoggingService,
+    log_entry: object,
+    max_files: int,
+    on_heartbeat_callback: HeartbeatCallbackType | None = None,
+    enable_summary: bool = True,
+) -> tuple[int, int, str]:
+    """Delta sync using Dropbox cursor-based change tracking.
+
+    Returns (indexed_count, skipped_count, new_cursor).
+    """
+    await task_logger.log_task_progress(
+        log_entry,
+        f"Starting delta sync from cursor: {cursor[:20]}...",
+        {"stage": "delta_sync", "cursor_prefix": cursor[:20]},
+    )
+
+    entries, new_cursor, error = await dropbox_client.get_changes(cursor)
+    if error:
+        err_lower = error.lower()
+        if "401" in error or "authentication expired" in err_lower:
+            raise Exception(
+                f"Dropbox authentication failed. Please re-authenticate. (Error: {error})"
+            )
+        raise Exception(f"Failed to fetch Dropbox changes: {error}")
+
+    if not entries:
+        logger.info("No changes detected since last sync")
+        return 0, 0, new_cursor or cursor
+
+    logger.info(f"Processing {len(entries)} change entries")
+
+    renamed_count = 0
+    skipped = 0
+    files_to_download: list[dict] = []
+    files_processed = 0
+
+    for entry in entries:
+        if files_processed >= max_files:
+            break
+        files_processed += 1
+
+        tag = entry.get(".tag")
+
+        if tag == "deleted":
+            path_lower = entry.get("path_lower", "")
+            name = entry.get("name", "")
+            file_id = entry.get("id", "")
+            if file_id:
+                await _remove_document(session, file_id, search_space_id)
+            logger.debug(f"Processed deletion: {name or path_lower}")
+            continue
+
+        if tag != "file":
+            continue
+
+        if skip_item(entry):
+            skipped += 1
+            continue
+
+        skip, msg = await _should_skip_file(session, entry, search_space_id)
+        if skip:
+            if msg and "renamed" in msg.lower():
+                renamed_count += 1
+            else:
+                skipped += 1
+            continue
+
+        files_to_download.append(entry)
+
+    batch_indexed, failed = await _download_and_index(
+        dropbox_client,
+        session,
+        files_to_download,
+        connector_id=connector_id,
+        search_space_id=search_space_id,
+        user_id=user_id,
+        enable_summary=enable_summary,
+        on_heartbeat=on_heartbeat_callback,
+    )
+
+    indexed = renamed_count + batch_indexed
+    logger.info(
+        f"Delta sync complete: {indexed} indexed, {skipped} skipped, {failed} failed"
+    )
+    return indexed, skipped, new_cursor or cursor
+
+
 async def _index_full_scan(
     dropbox_client: DropboxClient,
     session: AsyncSession,
@@ -437,6 +555,9 @@ async def index_dropbox_files(
         max_files = indexing_options.get("max_files", 500)
         incremental_sync = indexing_options.get("incremental_sync", True)
         include_subfolders = indexing_options.get("include_subfolders", True)
+        use_delta_sync = indexing_options.get("use_delta_sync", True)
+
+        folder_cursors: dict = connector.config.get("folder_cursors", {})
 
         total_indexed = 0
         total_skipped = 0
@@ -471,25 +592,66 @@ async def index_dropbox_files(
             )
             folder_name = folder.get("name", "Root")
 
-            logger.info(f"Using full scan for folder {folder_name}")
-            indexed, skipped = await _index_full_scan(
-                dropbox_client,
-                session,
-                connector_id,
-                search_space_id,
-                user_id,
-                folder_path,
-                folder_name,
-                task_logger,
-                log_entry,
-                max_files,
-                include_subfolders,
-                incremental_sync=incremental_sync,
-                enable_summary=connector_enable_summary,
+            saved_cursor = folder_cursors.get(folder_path)
+            can_use_delta = (
+                use_delta_sync
+                and saved_cursor
+                and connector.last_indexed_at
             )
+
+            if can_use_delta:
+                logger.info(f"Using delta sync for folder {folder_name}")
+                indexed, skipped, new_cursor = await _index_with_delta_sync(
+                    dropbox_client,
+                    session,
+                    connector_id,
+                    search_space_id,
+                    user_id,
+                    saved_cursor,
+                    task_logger,
+                    log_entry,
+                    max_files,
+                    enable_summary=connector_enable_summary,
+                )
+                folder_cursors[folder_path] = new_cursor
+            else:
+                logger.info(f"Using full scan for folder {folder_name}")
+                indexed, skipped = await _index_full_scan(
+                    dropbox_client,
+                    session,
+                    connector_id,
+                    search_space_id,
+                    user_id,
+                    folder_path,
+                    folder_name,
+                    task_logger,
+                    log_entry,
+                    max_files,
+                    include_subfolders,
+                    incremental_sync=incremental_sync,
+                    enable_summary=connector_enable_summary,
+                )
+
             total_indexed += indexed
             total_skipped += skipped
 
+            # Persist latest cursor for this folder
+            try:
+                latest_cursor, cursor_err = await dropbox_client.get_latest_cursor(
+                    folder_path
+                )
+                if latest_cursor and not cursor_err:
+                    folder_cursors[folder_path] = latest_cursor
+            except Exception as e:
+                logger.warning(f"Failed to get latest cursor for {folder_path}: {e}")
+
+        # Persist folder cursors to connector config
+        if folders:
+            cfg = dict(connector.config)
+            cfg["folder_cursors"] = folder_cursors
+            connector.config = cfg
+            flag_modified(connector, "config")
+
         if total_indexed > 0 or folders:
             await update_connector_last_indexed(session, connector, True)
 

From caca49177499daa39f4c210fc903333233bafe53 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Mon, 6 Apr 2026 18:36:48 +0530
Subject: [PATCH 140/202] test: add unit tests for Dropbox integration,
 covering delta sync methods, file type filtering, and re-authentication
 behavior

---
 .../test_dropbox_parallel.py                  | 545 ++++++++++++++++++
 .../tests/unit/connectors/__init__.py         |   0
 .../unit/connectors/test_dropbox_client.py    | 115 ++++
 .../connectors/test_dropbox_file_types.py     |  73 +++
 .../unit/connectors/test_dropbox_reauth.py    |  43 ++
 .../tests/unit/services/__init__.py           |   0
 .../services/test_docling_image_support.py    |  67 +++
 7 files changed, 843 insertions(+)
 create mode 100644 surfsense_backend/tests/unit/connectors/__init__.py
 create mode 100644 surfsense_backend/tests/unit/connectors/test_dropbox_client.py
 create mode 100644 surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py
 create mode 100644 surfsense_backend/tests/unit/connectors/test_dropbox_reauth.py
 create mode 100644 surfsense_backend/tests/unit/services/__init__.py
 create mode 100644 surfsense_backend/tests/unit/services/test_docling_image_support.py

diff --git a/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py b/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
index 76f8806dc..737e2c850 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
@@ -8,6 +8,10 @@ import pytest
 from app.db import DocumentType
 from app.tasks.connector_indexers.dropbox_indexer import (
     _download_files_parallel,
+    _index_full_scan,
+    _index_selected_files,
+    _index_with_delta_sync,
+    index_dropbox_files,
 )
 
 pytestmark = pytest.mark.unit
@@ -234,3 +238,544 @@ async def test_heartbeat_fires_during_parallel_downloads(
     assert len(docs) == 3
     assert failed == 0
     assert len(heartbeat_calls) >= 1, "Heartbeat should have fired at least once"
+
+
+# ---------------------------------------------------------------------------
+# D1-D2: _index_full_scan tests
+# ---------------------------------------------------------------------------
+
+
+def _folder_dict(name: str) -> dict:
+    return {".tag": "folder", "name": name}
+
+
+@pytest.fixture
+def full_scan_mocks(mock_dropbox_client, monkeypatch):
+    """Wire up mocks for _index_full_scan in isolation."""
+    import app.tasks.connector_indexers.dropbox_indexer as _mod
+
+    mock_session = AsyncMock()
+    mock_task_logger = MagicMock()
+    mock_task_logger.log_task_progress = AsyncMock()
+    mock_log_entry = MagicMock()
+
+    skip_results: dict[str, tuple[bool, str | None]] = {}
+
+    async def _fake_skip(session, file, search_space_id):
+        from app.connectors.dropbox.file_types import should_skip_file as _skip
+        if _skip(file):
+            return True, "folder/non-downloadable"
+        return skip_results.get(file.get("id", ""), (False, None))
+
+    monkeypatch.setattr(_mod, "_should_skip_file", _fake_skip)
+
+    download_and_index_mock = AsyncMock(return_value=(0, 0))
+    monkeypatch.setattr(_mod, "_download_and_index", download_and_index_mock)
+
+    return {
+        "dropbox_client": mock_dropbox_client,
+        "session": mock_session,
+        "task_logger": mock_task_logger,
+        "log_entry": mock_log_entry,
+        "skip_results": skip_results,
+        "download_and_index_mock": download_and_index_mock,
+    }
+
+
+async def _run_full_scan(mocks, monkeypatch, page_files, *, max_files=500):
+    import app.tasks.connector_indexers.dropbox_indexer as _mod
+
+    monkeypatch.setattr(
+        _mod,
+        "get_files_in_folder",
+        AsyncMock(return_value=(page_files, None)),
+    )
+    return await _index_full_scan(
+        mocks["dropbox_client"],
+        mocks["session"],
+        _CONNECTOR_ID,
+        _SEARCH_SPACE_ID,
+        _USER_ID,
+        "",
+        "Root",
+        mocks["task_logger"],
+        mocks["log_entry"],
+        max_files,
+        enable_summary=True,
+    )
+
+
+async def test_full_scan_three_phase_counts(full_scan_mocks, monkeypatch):
+    """Skipped files excluded, renames counted as indexed, new files downloaded."""
+    page_files = [
+        _folder_dict("SubFolder"),
+        _make_file_dict("skip1", "unchanged.txt"),
+        _make_file_dict("rename1", "renamed.txt"),
+        _make_file_dict("new1", "new1.txt"),
+        _make_file_dict("new2", "new2.txt"),
+    ]
+
+    full_scan_mocks["skip_results"]["skip1"] = (True, "unchanged")
+    full_scan_mocks["skip_results"]["rename1"] = (
+        True,
+        "File renamed: 'old' -> 'renamed.txt'",
+    )
+
+    full_scan_mocks["download_and_index_mock"].return_value = (2, 0)
+
+    indexed, skipped = await _run_full_scan(
+        full_scan_mocks, monkeypatch, page_files
+    )
+
+    assert indexed == 3  # 1 renamed + 2 from batch
+    assert skipped == 2  # 1 folder + 1 unchanged
+
+    call_args = full_scan_mocks["download_and_index_mock"].call_args
+    call_files = call_args[0][2]
+    assert len(call_files) == 2
+    assert {f["id"] for f in call_files} == {"new1", "new2"}
+
+
+async def test_full_scan_respects_max_files(full_scan_mocks, monkeypatch):
+    """Only max_files non-folder items are considered."""
+    page_files = [_make_file_dict(f"f{i}", f"file{i}.txt") for i in range(10)]
+
+    full_scan_mocks["download_and_index_mock"].return_value = (3, 0)
+
+    await _run_full_scan(full_scan_mocks, monkeypatch, page_files, max_files=3)
+
+    call_files = full_scan_mocks["download_and_index_mock"].call_args[0][2]
+    assert len(call_files) == 3
+
+
+# ---------------------------------------------------------------------------
+# D3-D5: _index_selected_files tests
+# ---------------------------------------------------------------------------
+
+
+@pytest.fixture
+def selected_files_mocks(mock_dropbox_client, monkeypatch):
+    """Wire up mocks for _index_selected_files tests."""
+    import app.tasks.connector_indexers.dropbox_indexer as _mod
+
+    mock_session = AsyncMock()
+
+    get_file_results: dict[str, tuple[dict | None, str | None]] = {}
+
+    async def _fake_get_file(client, path):
+        return get_file_results.get(path, (None, f"Not configured: {path}"))
+
+    monkeypatch.setattr(_mod, "get_file_by_path", _fake_get_file)
+
+    skip_results: dict[str, tuple[bool, str | None]] = {}
+
+    async def _fake_skip(session, file, search_space_id):
+        return skip_results.get(file["id"], (False, None))
+
+    monkeypatch.setattr(_mod, "_should_skip_file", _fake_skip)
+
+    download_and_index_mock = AsyncMock(return_value=(0, 0))
+    monkeypatch.setattr(_mod, "_download_and_index", download_and_index_mock)
+
+    return {
+        "dropbox_client": mock_dropbox_client,
+        "session": mock_session,
+        "get_file_results": get_file_results,
+        "skip_results": skip_results,
+        "download_and_index_mock": download_and_index_mock,
+    }
+
+
+async def _run_selected(mocks, file_tuples):
+    return await _index_selected_files(
+        mocks["dropbox_client"],
+        mocks["session"],
+        file_tuples,
+        connector_id=_CONNECTOR_ID,
+        search_space_id=_SEARCH_SPACE_ID,
+        user_id=_USER_ID,
+        enable_summary=True,
+    )
+
+
+async def test_selected_files_single_file_indexed(selected_files_mocks):
+    selected_files_mocks["get_file_results"]["/report.pdf"] = (
+        _make_file_dict("f1", "report.pdf"),
+        None,
+    )
+    selected_files_mocks["download_and_index_mock"].return_value = (1, 0)
+
+    indexed, skipped, errors = await _run_selected(
+        selected_files_mocks,
+        [("/report.pdf", "report.pdf")],
+    )
+
+    assert indexed == 1
+    assert skipped == 0
+    assert errors == []
+
+
+async def test_selected_files_fetch_failure_isolation(selected_files_mocks):
+    selected_files_mocks["get_file_results"]["/first.txt"] = (
+        _make_file_dict("f1", "first.txt"),
+        None,
+    )
+    selected_files_mocks["get_file_results"]["/mid.txt"] = (None, "HTTP 404")
+    selected_files_mocks["get_file_results"]["/third.txt"] = (
+        _make_file_dict("f3", "third.txt"),
+        None,
+    )
+    selected_files_mocks["download_and_index_mock"].return_value = (2, 0)
+
+    indexed, skipped, errors = await _run_selected(
+        selected_files_mocks,
+        [("/first.txt", "first.txt"), ("/mid.txt", "mid.txt"), ("/third.txt", "third.txt")],
+    )
+
+    assert indexed == 2
+    assert skipped == 0
+    assert len(errors) == 1
+    assert "mid.txt" in errors[0]
+
+
+async def test_selected_files_skip_rename_counting(selected_files_mocks):
+    for path, fid, fname in [
+        ("/unchanged.txt", "s1", "unchanged.txt"),
+        ("/renamed.txt", "r1", "renamed.txt"),
+        ("/new1.txt", "n1", "new1.txt"),
+        ("/new2.txt", "n2", "new2.txt"),
+    ]:
+        selected_files_mocks["get_file_results"][path] = (
+            _make_file_dict(fid, fname),
+            None,
+        )
+
+    selected_files_mocks["skip_results"]["s1"] = (True, "unchanged")
+    selected_files_mocks["skip_results"]["r1"] = (
+        True,
+        "File renamed: 'old' -> 'renamed.txt'",
+    )
+    selected_files_mocks["download_and_index_mock"].return_value = (2, 0)
+
+    indexed, skipped, errors = await _run_selected(
+        selected_files_mocks,
+        [
+            ("/unchanged.txt", "unchanged.txt"),
+            ("/renamed.txt", "renamed.txt"),
+            ("/new1.txt", "new1.txt"),
+            ("/new2.txt", "new2.txt"),
+        ],
+    )
+
+    assert indexed == 3  # 1 renamed + 2 batch
+    assert skipped == 1
+    assert errors == []
+
+    mock = selected_files_mocks["download_and_index_mock"]
+    call_files = mock.call_args[0][2]
+    assert len(call_files) == 2
+    assert {f["id"] for f in call_files} == {"n1", "n2"}
+
+
+# ---------------------------------------------------------------------------
+# E1-E4: _index_with_delta_sync tests
+# ---------------------------------------------------------------------------
+
+
+async def test_delta_sync_deletions_call_remove_document(monkeypatch):
+    """E1: deleted entries are processed via _remove_document."""
+    import app.tasks.connector_indexers.dropbox_indexer as _mod
+
+    entries = [
+        {".tag": "deleted", "name": "gone.txt", "path_lower": "/gone.txt", "id": "id:del1"},
+        {".tag": "deleted", "name": "also_gone.pdf", "path_lower": "/also_gone.pdf", "id": "id:del2"},
+    ]
+
+    mock_client = MagicMock()
+    mock_client.get_changes = AsyncMock(return_value=(entries, "new-cursor", None))
+
+    remove_calls: list[str] = []
+
+    async def _fake_remove(session, file_id, search_space_id):
+        remove_calls.append(file_id)
+
+    monkeypatch.setattr(_mod, "_remove_document", _fake_remove)
+    monkeypatch.setattr(_mod, "_download_and_index", AsyncMock(return_value=(0, 0)))
+
+    mock_task_logger = MagicMock()
+    mock_task_logger.log_task_progress = AsyncMock()
+
+    indexed, skipped, cursor = await _index_with_delta_sync(
+        mock_client,
+        AsyncMock(),
+        _CONNECTOR_ID,
+        _SEARCH_SPACE_ID,
+        _USER_ID,
+        "old-cursor",
+        mock_task_logger,
+        MagicMock(),
+        max_files=500,
+        enable_summary=True,
+    )
+
+    assert sorted(remove_calls) == ["id:del1", "id:del2"]
+    assert cursor == "new-cursor"
+
+
+async def test_delta_sync_upserts_filtered_and_downloaded(monkeypatch):
+    """E2: modified/new file entries go through skip filter then download+index."""
+    import app.tasks.connector_indexers.dropbox_indexer as _mod
+
+    entries = [
+        _make_file_dict("mod1", "modified1.txt"),
+        _make_file_dict("mod2", "modified2.txt"),
+    ]
+
+    mock_client = MagicMock()
+    mock_client.get_changes = AsyncMock(return_value=(entries, "cursor-v2", None))
+
+    monkeypatch.setattr(_mod, "_should_skip_file", AsyncMock(return_value=(False, None)))
+
+    download_mock = AsyncMock(return_value=(2, 0))
+    monkeypatch.setattr(_mod, "_download_and_index", download_mock)
+
+    mock_task_logger = MagicMock()
+    mock_task_logger.log_task_progress = AsyncMock()
+
+    indexed, skipped, cursor = await _index_with_delta_sync(
+        mock_client,
+        AsyncMock(),
+        _CONNECTOR_ID,
+        _SEARCH_SPACE_ID,
+        _USER_ID,
+        "cursor-v1",
+        mock_task_logger,
+        MagicMock(),
+        max_files=500,
+        enable_summary=True,
+    )
+
+    assert indexed == 2
+    assert skipped == 0
+    assert cursor == "cursor-v2"
+
+    downloaded_files = download_mock.call_args[0][2]
+    assert len(downloaded_files) == 2
+    assert {f["id"] for f in downloaded_files} == {"mod1", "mod2"}
+
+
+async def test_delta_sync_mix_deletions_and_upserts(monkeypatch):
+    """E3: deletions processed, then remaining upserts filtered and indexed."""
+    import app.tasks.connector_indexers.dropbox_indexer as _mod
+
+    entries = [
+        {".tag": "deleted", "name": "removed.txt", "path_lower": "/removed.txt", "id": "id:del1"},
+        {".tag": "deleted", "name": "trashed.pdf", "path_lower": "/trashed.pdf", "id": "id:del2"},
+        _make_file_dict("mod1", "updated.txt"),
+        _make_file_dict("new1", "brandnew.docx"),
+    ]
+
+    mock_client = MagicMock()
+    mock_client.get_changes = AsyncMock(return_value=(entries, "final-cursor", None))
+
+    remove_calls: list[str] = []
+
+    async def _fake_remove(session, file_id, search_space_id):
+        remove_calls.append(file_id)
+
+    monkeypatch.setattr(_mod, "_remove_document", _fake_remove)
+    monkeypatch.setattr(_mod, "_should_skip_file", AsyncMock(return_value=(False, None)))
+
+    download_mock = AsyncMock(return_value=(2, 0))
+    monkeypatch.setattr(_mod, "_download_and_index", download_mock)
+
+    mock_task_logger = MagicMock()
+    mock_task_logger.log_task_progress = AsyncMock()
+
+    indexed, skipped, cursor = await _index_with_delta_sync(
+        mock_client,
+        AsyncMock(),
+        _CONNECTOR_ID,
+        _SEARCH_SPACE_ID,
+        _USER_ID,
+        "old-cursor",
+        mock_task_logger,
+        MagicMock(),
+        max_files=500,
+        enable_summary=True,
+    )
+
+    assert sorted(remove_calls) == ["id:del1", "id:del2"]
+    assert indexed == 2
+    assert skipped == 0
+    assert cursor == "final-cursor"
+
+    downloaded_files = download_mock.call_args[0][2]
+    assert {f["id"] for f in downloaded_files} == {"mod1", "new1"}
+
+
+async def test_delta_sync_returns_new_cursor(monkeypatch):
+    """E4: the new cursor from the API response is returned."""
+    import app.tasks.connector_indexers.dropbox_indexer as _mod
+
+    mock_client = MagicMock()
+    mock_client.get_changes = AsyncMock(return_value=([], "brand-new-cursor-xyz", None))
+
+    monkeypatch.setattr(_mod, "_download_and_index", AsyncMock(return_value=(0, 0)))
+
+    mock_task_logger = MagicMock()
+    mock_task_logger.log_task_progress = AsyncMock()
+
+    indexed, skipped, cursor = await _index_with_delta_sync(
+        mock_client,
+        AsyncMock(),
+        _CONNECTOR_ID,
+        _SEARCH_SPACE_ID,
+        _USER_ID,
+        "old-cursor",
+        mock_task_logger,
+        MagicMock(),
+        max_files=500,
+        enable_summary=True,
+    )
+
+    assert cursor == "brand-new-cursor-xyz"
+    assert indexed == 0
+    assert skipped == 0
+
+
+# ---------------------------------------------------------------------------
+# F1-F3: index_dropbox_files orchestrator tests
+# ---------------------------------------------------------------------------
+
+
+@pytest.fixture
+def orchestrator_mocks(monkeypatch):
+    """Wire up mocks for index_dropbox_files orchestrator tests."""
+    import app.tasks.connector_indexers.dropbox_indexer as _mod
+
+    mock_connector = MagicMock()
+    mock_connector.config = {"_token_encrypted": False}
+    mock_connector.last_indexed_at = None
+    mock_connector.enable_summary = True
+
+    monkeypatch.setattr(
+        _mod,
+        "get_connector_by_id",
+        AsyncMock(return_value=mock_connector),
+    )
+
+    mock_task_logger = MagicMock()
+    mock_task_logger.log_task_start = AsyncMock(return_value=MagicMock())
+    mock_task_logger.log_task_progress = AsyncMock()
+    mock_task_logger.log_task_success = AsyncMock()
+    mock_task_logger.log_task_failure = AsyncMock()
+    monkeypatch.setattr(
+        _mod, "TaskLoggingService", MagicMock(return_value=mock_task_logger)
+    )
+
+    monkeypatch.setattr(_mod, "update_connector_last_indexed", AsyncMock())
+
+    full_scan_mock = AsyncMock(return_value=(5, 2))
+    monkeypatch.setattr(_mod, "_index_full_scan", full_scan_mock)
+
+    delta_sync_mock = AsyncMock(return_value=(3, 1, "delta-cursor-new"))
+    monkeypatch.setattr(_mod, "_index_with_delta_sync", delta_sync_mock)
+
+    mock_client = MagicMock()
+    mock_client.get_latest_cursor = AsyncMock(return_value=("latest-cursor-abc", None))
+    monkeypatch.setattr(
+        _mod, "DropboxClient", MagicMock(return_value=mock_client)
+    )
+
+    return {
+        "connector": mock_connector,
+        "full_scan_mock": full_scan_mock,
+        "delta_sync_mock": delta_sync_mock,
+        "mock_client": mock_client,
+    }
+
+
+async def test_orchestrator_uses_delta_sync_when_cursor_and_last_indexed(
+    orchestrator_mocks,
+):
+    """F1: with cursor + last_indexed_at + use_delta_sync, calls delta sync."""
+    from datetime import UTC, datetime
+
+    connector = orchestrator_mocks["connector"]
+    connector.config = {
+        "_token_encrypted": False,
+        "folder_cursors": {"/docs": "saved-cursor-123"},
+    }
+    connector.last_indexed_at = datetime(2026, 1, 1, tzinfo=UTC)
+
+    mock_session = AsyncMock()
+    mock_session.commit = AsyncMock()
+
+    indexed, skipped, error = await index_dropbox_files(
+        mock_session,
+        _CONNECTOR_ID,
+        _SEARCH_SPACE_ID,
+        _USER_ID,
+        {
+            "folders": [{"path": "/docs", "name": "Docs"}],
+            "files": [],
+            "indexing_options": {"use_delta_sync": True},
+        },
+    )
+
+    assert error is None
+    orchestrator_mocks["delta_sync_mock"].assert_called_once()
+    orchestrator_mocks["full_scan_mock"].assert_not_called()
+
+
+async def test_orchestrator_falls_back_to_full_scan_without_cursor(
+    orchestrator_mocks,
+):
+    """F2: without cursor, falls back to full scan."""
+    connector = orchestrator_mocks["connector"]
+    connector.config = {"_token_encrypted": False}
+    connector.last_indexed_at = None
+
+    mock_session = AsyncMock()
+    mock_session.commit = AsyncMock()
+
+    indexed, skipped, error = await index_dropbox_files(
+        mock_session,
+        _CONNECTOR_ID,
+        _SEARCH_SPACE_ID,
+        _USER_ID,
+        {
+            "folders": [{"path": "/docs", "name": "Docs"}],
+            "files": [],
+            "indexing_options": {"use_delta_sync": True},
+        },
+    )
+
+    assert error is None
+    orchestrator_mocks["full_scan_mock"].assert_called_once()
+    orchestrator_mocks["delta_sync_mock"].assert_not_called()
+
+
+async def test_orchestrator_persists_cursor_after_sync(orchestrator_mocks):
+    """F3: after sync, persists new cursor to connector config."""
+    connector = orchestrator_mocks["connector"]
+    connector.config = {"_token_encrypted": False}
+    connector.last_indexed_at = None
+
+    mock_session = AsyncMock()
+    mock_session.commit = AsyncMock()
+
+    await index_dropbox_files(
+        mock_session,
+        _CONNECTOR_ID,
+        _SEARCH_SPACE_ID,
+        _USER_ID,
+        {
+            "folders": [{"path": "/docs", "name": "Docs"}],
+            "files": [],
+        },
+    )
+
+    assert "folder_cursors" in connector.config
+    assert connector.config["folder_cursors"]["/docs"] == "latest-cursor-abc"
diff --git a/surfsense_backend/tests/unit/connectors/__init__.py b/surfsense_backend/tests/unit/connectors/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/surfsense_backend/tests/unit/connectors/test_dropbox_client.py b/surfsense_backend/tests/unit/connectors/test_dropbox_client.py
new file mode 100644
index 000000000..efacbcf72
--- /dev/null
+++ b/surfsense_backend/tests/unit/connectors/test_dropbox_client.py
@@ -0,0 +1,115 @@
+"""Tests for DropboxClient delta-sync methods (get_latest_cursor, get_changes)."""
+
+from unittest.mock import AsyncMock, MagicMock
+
+import pytest
+
+from app.connectors.dropbox.client import DropboxClient
+
+pytestmark = pytest.mark.unit
+
+
+def _make_client() -> DropboxClient:
+    """Create a DropboxClient with a mocked DB session so no real DB needed."""
+    client = DropboxClient.__new__(DropboxClient)
+    client._session = MagicMock()
+    client._connector_id = 1
+    return client
+
+
+# ---------- C1: get_latest_cursor ----------
+
+async def test_get_latest_cursor_returns_cursor_string(monkeypatch):
+    client = _make_client()
+
+    fake_resp = MagicMock()
+    fake_resp.status_code = 200
+    fake_resp.json.return_value = {"cursor": "AAHbKxRZ9enq…"}
+
+    monkeypatch.setattr(client, "_request", AsyncMock(return_value=fake_resp))
+
+    cursor, error = await client.get_latest_cursor("/my-folder")
+
+    assert cursor == "AAHbKxRZ9enq…"
+    assert error is None
+    client._request.assert_called_once_with(
+        "/2/files/list_folder/get_latest_cursor",
+        {"path": "/my-folder", "recursive": False, "include_non_downloadable_files": True},
+    )
+
+
+# ---------- C2: get_changes returns entries and new cursor ----------
+
+async def test_get_changes_returns_entries_and_cursor(monkeypatch):
+    client = _make_client()
+
+    fake_resp = MagicMock()
+    fake_resp.status_code = 200
+    fake_resp.json.return_value = {
+        "entries": [
+            {".tag": "file", "name": "new.txt", "id": "id:abc"},
+            {".tag": "deleted", "name": "old.txt"},
+        ],
+        "cursor": "cursor-v2",
+        "has_more": False,
+    }
+    monkeypatch.setattr(client, "_request", AsyncMock(return_value=fake_resp))
+
+    entries, new_cursor, error = await client.get_changes("cursor-v1")
+
+    assert error is None
+    assert new_cursor == "cursor-v2"
+    assert len(entries) == 2
+    assert entries[0]["name"] == "new.txt"
+    assert entries[1][".tag"] == "deleted"
+
+
+# ---------- C3: get_changes handles pagination ----------
+
+async def test_get_changes_handles_pagination(monkeypatch):
+    client = _make_client()
+
+    page1 = MagicMock()
+    page1.status_code = 200
+    page1.json.return_value = {
+        "entries": [{".tag": "file", "name": "a.txt", "id": "id:a"}],
+        "cursor": "cursor-page2",
+        "has_more": True,
+    }
+    page2 = MagicMock()
+    page2.status_code = 200
+    page2.json.return_value = {
+        "entries": [{".tag": "file", "name": "b.txt", "id": "id:b"}],
+        "cursor": "cursor-final",
+        "has_more": False,
+    }
+
+    request_mock = AsyncMock(side_effect=[page1, page2])
+    monkeypatch.setattr(client, "_request", request_mock)
+
+    entries, new_cursor, error = await client.get_changes("cursor-v1")
+
+    assert error is None
+    assert new_cursor == "cursor-final"
+    assert len(entries) == 2
+    assert {e["name"] for e in entries} == {"a.txt", "b.txt"}
+    assert request_mock.call_count == 2
+
+
+# ---------- C4: get_changes returns an error on 401 ----------
+
+async def test_get_changes_returns_error_on_401(monkeypatch):
+    client = _make_client()
+
+    fake_resp = MagicMock()
+    fake_resp.status_code = 401
+    fake_resp.text = "Unauthorized"
+
+    monkeypatch.setattr(client, "_request", AsyncMock(return_value=fake_resp))
+
+    entries, new_cursor, error = await client.get_changes("old-cursor")
+
+    assert error is not None
+    assert "401" in error
+    assert entries == []
+    assert new_cursor is None
diff --git a/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py b/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py
new file mode 100644
index 000000000..5480d8c8a
--- /dev/null
+++ b/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py
@@ -0,0 +1,73 @@
+"""Tests for Dropbox file type filtering (should_skip_file)."""
+
+import pytest
+
+from app.connectors.dropbox.file_types import should_skip_file
+
+pytestmark = pytest.mark.unit
+
+
+def test_folder_item_is_skipped():
+    item = {".tag": "folder", "name": "My Folder"}
+    assert should_skip_file(item) is True
+
+
+def test_paper_file_is_not_skipped():
+    item = {".tag": "file", "name": "notes.paper", "is_downloadable": False}
+    assert should_skip_file(item) is False
+
+
+def test_non_downloadable_item_is_skipped():
+    item = {".tag": "file", "name": "locked.gdoc", "is_downloadable": False}
+    assert should_skip_file(item) is True
+
+
+@pytest.mark.parametrize(
+    "filename",
+    [
+        "archive.zip", "backup.tar", "data.gz", "stuff.rar", "pack.7z",
+        "program.exe", "lib.dll", "module.so", "image.dmg", "disk.iso",
+        "movie.mov", "clip.avi", "video.mkv", "film.wmv", "stream.flv",
+        "icon.svg", "anim.gif", "photo.webp", "shot.heic", "favicon.ico",
+        "raw.cr2", "photo.nef", "image.arw", "pic.dng",
+        "design.psd", "vector.ai", "mockup.sketch", "proto.fig",
+        "font.ttf", "font.otf", "font.woff", "font.woff2",
+        "model.stl", "scene.fbx", "mesh.blend",
+        "local.db", "data.sqlite", "access.mdb",
+    ],
+)
+def test_non_parseable_extensions_are_skipped(filename):
+    item = {".tag": "file", "name": filename}
+    assert should_skip_file(item) is True, f"{filename} should be skipped"
+
+
+@pytest.mark.parametrize(
+    "filename",
+    [
+        "report.pdf", "document.docx", "sheet.xlsx", "slides.pptx",
+        "old.doc", "legacy.xls", "deck.ppt",
+        "readme.txt", "data.csv", "page.html", "notes.md",
+        "config.json", "feed.xml",
+    ],
+)
+def test_parseable_documents_are_not_skipped(filename):
+    item = {".tag": "file", "name": filename}
+    assert should_skip_file(item) is False, f"{filename} should NOT be skipped"
+
+
+@pytest.mark.parametrize(
+    "filename",
+    ["photo.jpg", "image.jpeg", "screenshot.png", "scan.bmp", "page.tiff", "doc.tif"],
+)
+def test_universal_images_are_not_skipped(filename):
+    item = {".tag": "file", "name": filename}
+    assert should_skip_file(item) is False, f"{filename} should NOT be skipped"
+
+
+@pytest.mark.parametrize(
+    "filename",
+    ["icon.svg", "anim.gif", "photo.webp", "live.heic"],
+)
+def test_non_universal_images_are_skipped(filename):
+    item = {".tag": "file", "name": filename}
+    assert should_skip_file(item) is True, f"{filename} should be skipped"
diff --git a/surfsense_backend/tests/unit/connectors/test_dropbox_reauth.py b/surfsense_backend/tests/unit/connectors/test_dropbox_reauth.py
new file mode 100644
index 000000000..85281354c
--- /dev/null
+++ b/surfsense_backend/tests/unit/connectors/test_dropbox_reauth.py
@@ -0,0 +1,43 @@
+"""Test that Dropbox re-auth preserves folder_cursors in connector config."""
+
+import pytest
+
+pytestmark = pytest.mark.unit
+
+
+def test_reauth_preserves_folder_cursors():
+    """G1: re-authentication preserves folder_cursors alongside cursor."""
+    old_config = {
+        "access_token": "old-token-enc",
+        "refresh_token": "old-refresh-enc",
+        "cursor": "old-cursor-abc",
+        "folder_cursors": {"/docs": "cursor-docs-123", "/photos": "cursor-photos-456"},
+        "_token_encrypted": True,
+        "auth_expired": True,
+    }
+
+    new_connector_config = {
+        "access_token": "new-token-enc",
+        "refresh_token": "new-refresh-enc",
+        "token_type": "bearer",
+        "expires_in": 14400,
+        "expires_at": "2026-04-06T16:00:00+00:00",
+        "_token_encrypted": True,
+    }
+
+    existing_cursor = old_config.get("cursor")
+    existing_folder_cursors = old_config.get("folder_cursors")
+    merged_config = {
+        **new_connector_config,
+        "cursor": existing_cursor,
+        "folder_cursors": existing_folder_cursors,
+        "auth_expired": False,
+    }
+
+    assert merged_config["access_token"] == "new-token-enc"
+    assert merged_config["cursor"] == "old-cursor-abc"
+    assert merged_config["folder_cursors"] == {
+        "/docs": "cursor-docs-123",
+        "/photos": "cursor-photos-456",
+    }
+    assert merged_config["auth_expired"] is False
diff --git a/surfsense_backend/tests/unit/services/__init__.py b/surfsense_backend/tests/unit/services/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/surfsense_backend/tests/unit/services/test_docling_image_support.py b/surfsense_backend/tests/unit/services/test_docling_image_support.py
new file mode 100644
index 000000000..071d061e2
--- /dev/null
+++ b/surfsense_backend/tests/unit/services/test_docling_image_support.py
@@ -0,0 +1,67 @@
+"""Test that DoclingService registers InputFormat.IMAGE for image processing."""
+
+from enum import Enum
+from unittest.mock import MagicMock, patch
+
+import pytest
+
+pytestmark = pytest.mark.unit
+
+
+class _FakeInputFormat(Enum):
+    PDF = "pdf"
+    IMAGE = "image"
+
+
+def test_docling_service_registers_image_format():
+    """DoclingService should initialise DocumentConverter with InputFormat.IMAGE
+    in allowed_formats so that image files (jpg, png, bmp, tiff) are accepted."""
+
+    mock_converter_cls = MagicMock()
+    mock_backend = MagicMock()
+
+    fake_pipeline_options_cls = MagicMock()
+    fake_pipeline_options = MagicMock()
+    fake_pipeline_options_cls.return_value = fake_pipeline_options
+
+    fake_pdf_format_option_cls = MagicMock()
+
+    with patch.dict("sys.modules", {
+        "docling": MagicMock(),
+        "docling.backend": MagicMock(),
+        "docling.backend.pypdfium2_backend": MagicMock(
+            PyPdfiumDocumentBackend=mock_backend
+        ),
+        "docling.datamodel": MagicMock(),
+        "docling.datamodel.base_models": MagicMock(
+            InputFormat=_FakeInputFormat
+        ),
+        "docling.datamodel.pipeline_options": MagicMock(
+            PdfPipelineOptions=fake_pipeline_options_cls
+        ),
+        "docling.document_converter": MagicMock(
+            DocumentConverter=mock_converter_cls,
+            PdfFormatOption=fake_pdf_format_option_cls,
+        ),
+    }):
+        import app.services.docling_service as mod
+        from importlib import reload
+        reload(mod)
+
+        mod.DoclingService()
+
+    call_kwargs = mock_converter_cls.call_args
+    assert call_kwargs is not None, "DocumentConverter was never called"
+
+    _, kwargs = call_kwargs
+    allowed = kwargs.get("allowed_formats")
+    format_opts = kwargs.get("format_options", {})
+
+    image_registered = (
+        (allowed is not None and _FakeInputFormat.IMAGE in allowed)
+        or _FakeInputFormat.IMAGE in format_opts
+    )
+    assert image_registered, (
+        f"InputFormat.IMAGE not registered. "
+        f"allowed_formats={allowed}, format_options keys={list(format_opts.keys())}"
+    )

From 47f4be08d971fe96bce911a154d10568d724dde6 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Mon, 6 Apr 2026 19:31:42 +0530
Subject: [PATCH 141/202] refactor: remove allowed_formats from
 DocumentConverter initialization in DoclingService to allow acceptance of all
 supported formats

---
 .../app/services/docling_service.py           |  2 --
 .../services/test_docling_image_support.py    | 26 +++++++++----------
 2 files changed, 13 insertions(+), 15 deletions(-)

diff --git a/surfsense_backend/app/services/docling_service.py b/surfsense_backend/app/services/docling_service.py
index 360c197ed..af9a7d2d5 100644
--- a/surfsense_backend/app/services/docling_service.py
+++ b/surfsense_backend/app/services/docling_service.py
@@ -111,9 +111,7 @@ class DoclingService:
                 pipeline_options=pipeline_options, backend=PyPdfiumDocumentBackend
             )
 
-            # Initialize DocumentConverter with PDF and IMAGE support
             self.converter = DocumentConverter(
-                allowed_formats=[InputFormat.PDF, InputFormat.IMAGE],
                 format_options={InputFormat.PDF: pdf_format_option},
             )
 
diff --git a/surfsense_backend/tests/unit/services/test_docling_image_support.py b/surfsense_backend/tests/unit/services/test_docling_image_support.py
index 071d061e2..430adbaf2 100644
--- a/surfsense_backend/tests/unit/services/test_docling_image_support.py
+++ b/surfsense_backend/tests/unit/services/test_docling_image_support.py
@@ -1,4 +1,5 @@
-"""Test that DoclingService registers InputFormat.IMAGE for image processing."""
+"""Test that DoclingService does NOT restrict allowed_formats, letting Docling
+accept all its supported formats (PDF, DOCX, PPTX, XLSX, IMAGE, etc.)."""
 
 from enum import Enum
 from unittest.mock import MagicMock, patch
@@ -11,11 +12,14 @@ pytestmark = pytest.mark.unit
 class _FakeInputFormat(Enum):
     PDF = "pdf"
     IMAGE = "image"
+    DOCX = "docx"
+    PPTX = "pptx"
+    XLSX = "xlsx"
 
 
-def test_docling_service_registers_image_format():
-    """DoclingService should initialise DocumentConverter with InputFormat.IMAGE
-    in allowed_formats so that image files (jpg, png, bmp, tiff) are accepted."""
+def test_docling_service_does_not_restrict_allowed_formats():
+    """DoclingService should NOT pass allowed_formats to DocumentConverter,
+    so Docling defaults to accepting every InputFormat it supports."""
 
     mock_converter_cls = MagicMock()
     mock_backend = MagicMock()
@@ -54,14 +58,10 @@ def test_docling_service_registers_image_format():
     assert call_kwargs is not None, "DocumentConverter was never called"
 
     _, kwargs = call_kwargs
-    allowed = kwargs.get("allowed_formats")
-    format_opts = kwargs.get("format_options", {})
-
-    image_registered = (
-        (allowed is not None and _FakeInputFormat.IMAGE in allowed)
-        or _FakeInputFormat.IMAGE in format_opts
+    assert "allowed_formats" not in kwargs, (
+        f"allowed_formats should not be passed — let Docling accept all formats. "
+        f"Got: {kwargs.get('allowed_formats')}"
     )
-    assert image_registered, (
-        f"InputFormat.IMAGE not registered. "
-        f"allowed_formats={allowed}, format_options keys={list(format_opts.keys())}"
+    assert _FakeInputFormat.PDF in kwargs.get("format_options", {}), (
+        "format_options should still configure PDF pipeline options"
     )

From dc7047f64de916bd002fa4e0fc265b8532f92def Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Mon, 6 Apr 2026 22:03:47 +0530
Subject: [PATCH 142/202] refactor: implement file type classification for
 supported extensions across Dropbox, Google Drive, and OneDrive connectors,
 enhancing file handling and error management

---
 .../app/connectors/dropbox/file_types.py      | 24 +------
 .../google_drive/content_extractor.py         |  8 ++-
 .../app/connectors/google_drive/file_types.py |  7 ++
 .../app/connectors/onedrive/file_types.py     |  9 ++-
 .../app/etl_pipeline/etl_pipeline_service.py  |  7 +-
 .../app/etl_pipeline/exceptions.py            |  4 ++
 .../app/etl_pipeline/file_classifier.py       |  6 +-
 .../document_processors/file_processors.py    |  1 +
 .../app/utils/file_extensions.py              | 31 ++++++++
 .../test_google_drive_file_types.py           | 22 ++++++
 .../connectors/test_onedrive_file_types.py    | 44 ++++++++++++
 .../etl_pipeline/test_etl_pipeline_service.py | 72 ++++++++++++++++++-
 .../tests/unit/utils/__init__.py              |  0
 .../tests/unit/utils/test_file_extensions.py  | 42 +++++++++++
 14 files changed, 250 insertions(+), 27 deletions(-)
 create mode 100644 surfsense_backend/app/utils/file_extensions.py
 create mode 100644 surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py
 create mode 100644 surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py
 create mode 100644 surfsense_backend/tests/unit/utils/__init__.py
 create mode 100644 surfsense_backend/tests/unit/utils/test_file_extensions.py

diff --git a/surfsense_backend/app/connectors/dropbox/file_types.py b/surfsense_backend/app/connectors/dropbox/file_types.py
index c245e039e..7b72c1857 100644
--- a/surfsense_backend/app/connectors/dropbox/file_types.py
+++ b/surfsense_backend/app/connectors/dropbox/file_types.py
@@ -1,25 +1,8 @@
 """File type handlers for Dropbox."""
 
-PAPER_EXTENSION = ".paper"
+from app.etl_pipeline.file_classifier import FileCategory, classify_file
 
-SKIP_EXTENSIONS: frozenset[str] = frozenset({
-    # Non-universal images (not supported by all 3 ETL pipelines)
-    ".svg", ".gif", ".webp", ".heic", ".ico",
-    ".raw", ".cr2", ".nef", ".arw", ".dng",
-    ".psd", ".ai", ".sketch", ".fig",
-    # Video
-    ".mov", ".avi", ".mkv", ".wmv", ".flv",
-    # Binaries / executables
-    ".exe", ".dll", ".so", ".dylib", ".bin", ".app", ".dmg", ".iso",
-    # Archives
-    ".zip", ".tar", ".gz", ".rar", ".7z", ".bz2",
-    # Fonts
-    ".ttf", ".otf", ".woff", ".woff2",
-    # 3D / CAD
-    ".stl", ".obj", ".fbx", ".blend",
-    # Database
-    ".db", ".sqlite", ".mdb",
-})
+PAPER_EXTENSION = ".paper"
 
 MIME_TO_EXTENSION: dict[str, str] = {
     "application/pdf": ".pdf",
@@ -71,5 +54,4 @@ def should_skip_file(item: dict) -> bool:
     if not item.get("is_downloadable", True):
         return True
     name = item.get("name", "")
-    ext = get_extension_from_name(name).lower()
-    return ext in SKIP_EXTENSIONS
+    return classify_file(name) == FileCategory.UNSUPPORTED
diff --git a/surfsense_backend/app/connectors/google_drive/content_extractor.py b/surfsense_backend/app/connectors/google_drive/content_extractor.py
index 0c559fee9..10f008594 100644
--- a/surfsense_backend/app/connectors/google_drive/content_extractor.py
+++ b/surfsense_backend/app/connectors/google_drive/content_extractor.py
@@ -17,6 +17,7 @@ from .file_types import (
     get_export_mime_type,
     get_extension_from_mime,
     is_google_workspace_file,
+    should_skip_by_extension,
     should_skip_file,
 )
 
@@ -42,6 +43,9 @@ async def download_and_extract_content(
     if should_skip_file(mime_type):
         return None, {}, f"Skipping {mime_type}"
 
+    if should_skip_by_extension(file_name):
+        return None, {}, f"Skipping unsupported extension: {file_name}"
+
     logger.info(f"Downloading file for content extraction: {file_name} ({mime_type})")
 
     drive_metadata: dict[str, Any] = {
@@ -148,10 +152,12 @@ async def download_and_process_file(
     file_name = file.get("name", "Unknown")
     mime_type = file.get("mimeType", "")
 
-    # Skip folders and shortcuts
     if should_skip_file(mime_type):
         return None, f"Skipping {mime_type}", None
 
+    if should_skip_by_extension(file_name):
+        return None, f"Skipping unsupported extension: {file_name}", None
+
     logger.info(f"Downloading file: {file_name} ({mime_type})")
 
     temp_file_path = None
diff --git a/surfsense_backend/app/connectors/google_drive/file_types.py b/surfsense_backend/app/connectors/google_drive/file_types.py
index dd6aff4d7..e0b8f001e 100644
--- a/surfsense_backend/app/connectors/google_drive/file_types.py
+++ b/surfsense_backend/app/connectors/google_drive/file_types.py
@@ -1,5 +1,7 @@
 """File type handlers for Google Drive."""
 
+from app.etl_pipeline.file_classifier import FileCategory, classify_file
+
 GOOGLE_DOC = "application/vnd.google-apps.document"
 GOOGLE_SHEET = "application/vnd.google-apps.spreadsheet"
 GOOGLE_SLIDE = "application/vnd.google-apps.presentation"
@@ -46,6 +48,11 @@ def should_skip_file(mime_type: str) -> bool:
     return mime_type in [GOOGLE_FOLDER, GOOGLE_SHORTCUT]
 
 
+def should_skip_by_extension(filename: str) -> bool:
+    """Return True if the file extension is not parseable by any ETL pipeline."""
+    return classify_file(filename) == FileCategory.UNSUPPORTED
+
+
 def get_export_mime_type(mime_type: str) -> str | None:
     """Get export MIME type for Google Workspace files."""
     return EXPORT_FORMATS.get(mime_type)
diff --git a/surfsense_backend/app/connectors/onedrive/file_types.py b/surfsense_backend/app/connectors/onedrive/file_types.py
index 403fdc337..bcd78b711 100644
--- a/surfsense_backend/app/connectors/onedrive/file_types.py
+++ b/surfsense_backend/app/connectors/onedrive/file_types.py
@@ -1,5 +1,7 @@
 """File type handlers for Microsoft OneDrive."""
 
+from app.etl_pipeline.file_classifier import FileCategory, classify_file
+
 ONEDRIVE_FOLDER_FACET = "folder"
 ONENOTE_MIME = "application/msonenote"
 
@@ -39,7 +41,7 @@ def is_folder(item: dict) -> bool:
 
 
 def should_skip_file(item: dict) -> bool:
-    """Skip folders, OneNote files, remote items (shared links), and packages."""
+    """Skip folders, OneNote files, remote items (shared links), packages, and unsupported extensions."""
     if is_folder(item):
         return True
     if "remoteItem" in item:
@@ -47,4 +49,7 @@ def should_skip_file(item: dict) -> bool:
     if "package" in item:
         return True
     mime = item.get("file", {}).get("mimeType", "")
-    return mime in SKIP_MIME_TYPES
+    if mime in SKIP_MIME_TYPES:
+        return True
+    name = item.get("name", "")
+    return classify_file(name) == FileCategory.UNSUPPORTED
diff --git a/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py b/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py
index f382451df..7c67d2345 100644
--- a/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py
+++ b/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py
@@ -1,6 +1,6 @@
 from app.config import config as app_config
 from app.etl_pipeline.etl_document import EtlRequest, EtlResult
-from app.etl_pipeline.exceptions import EtlServiceUnavailableError
+from app.etl_pipeline.exceptions import EtlServiceUnavailableError, EtlUnsupportedFileError
 from app.etl_pipeline.file_classifier import FileCategory, classify_file
 from app.etl_pipeline.parsers.audio import transcribe_audio
 from app.etl_pipeline.parsers.direct_convert import convert_file_directly
@@ -13,6 +13,11 @@ class EtlPipelineService:
     async def extract(self, request: EtlRequest) -> EtlResult:
         category = classify_file(request.filename)
 
+        if category == FileCategory.UNSUPPORTED:
+            raise EtlUnsupportedFileError(
+                f"File type not supported for parsing: {request.filename}"
+            )
+
         if category == FileCategory.PLAINTEXT:
             content = read_plaintext(request.file_path)
             return EtlResult(
diff --git a/surfsense_backend/app/etl_pipeline/exceptions.py b/surfsense_backend/app/etl_pipeline/exceptions.py
index ac8fc0172..26eecbef4 100644
--- a/surfsense_backend/app/etl_pipeline/exceptions.py
+++ b/surfsense_backend/app/etl_pipeline/exceptions.py
@@ -4,3 +4,7 @@ class EtlParseError(Exception):
 
 class EtlServiceUnavailableError(Exception):
     """Raised when the configured ETL_SERVICE is not recognised."""
+
+
+class EtlUnsupportedFileError(Exception):
+    """Raised when a file type cannot be parsed by any ETL pipeline."""
diff --git a/surfsense_backend/app/etl_pipeline/file_classifier.py b/surfsense_backend/app/etl_pipeline/file_classifier.py
index 40c2d5aff..eea9cce22 100644
--- a/surfsense_backend/app/etl_pipeline/file_classifier.py
+++ b/surfsense_backend/app/etl_pipeline/file_classifier.py
@@ -1,6 +1,7 @@
 from enum import Enum
 from pathlib import PurePosixPath
 
+from app.utils.file_extensions import DOCUMENT_EXTENSIONS
 
 PLAINTEXT_EXTENSIONS = frozenset(
     {
@@ -35,6 +36,7 @@ class FileCategory(Enum):
     PLAINTEXT = "plaintext"
     AUDIO = "audio"
     DIRECT_CONVERT = "direct_convert"
+    UNSUPPORTED = "unsupported"
     DOCUMENT = "document"
 
 
@@ -46,4 +48,6 @@ def classify_file(filename: str) -> FileCategory:
         return FileCategory.AUDIO
     if suffix in DIRECT_CONVERT_EXTENSIONS:
         return FileCategory.DIRECT_CONVERT
-    return FileCategory.DOCUMENT
+    if suffix in DOCUMENT_EXTENSIONS:
+        return FileCategory.DOCUMENT
+    return FileCategory.UNSUPPORTED
diff --git a/surfsense_backend/app/tasks/document_processors/file_processors.py b/surfsense_backend/app/tasks/document_processors/file_processors.py
index f54a963ad..a9a6b62be 100644
--- a/surfsense_backend/app/tasks/document_processors/file_processors.py
+++ b/surfsense_backend/app/tasks/document_processors/file_processors.py
@@ -356,6 +356,7 @@ async def _extract_file_content(
             FileCategory.PLAINTEXT: "Reading file",
             FileCategory.DIRECT_CONVERT: "Converting file",
             FileCategory.AUDIO: "Transcribing audio",
+            FileCategory.UNSUPPORTED: "Unsupported file type",
             FileCategory.DOCUMENT: "Extracting content",
         }
         await NotificationService.document_processing.notify_processing_progress(
diff --git a/surfsense_backend/app/utils/file_extensions.py b/surfsense_backend/app/utils/file_extensions.py
new file mode 100644
index 000000000..5dac10842
--- /dev/null
+++ b/surfsense_backend/app/utils/file_extensions.py
@@ -0,0 +1,31 @@
+"""Allowlist of document extensions the ETL parsers can handle.
+
+Every consumer (file_classifier, connector-level skip checks) imports from
+here so there is a single source of truth.  Extensions already covered by
+PLAINTEXT_EXTENSIONS, AUDIO_EXTENSIONS, or DIRECT_CONVERT_EXTENSIONS in
+file_classifier are NOT repeated here -- this set is exclusively for the
+"document" ETL path (Docling / LlamaParse / Unstructured).
+"""
+
+from pathlib import PurePosixPath
+
+DOCUMENT_EXTENSIONS: frozenset[str] = frozenset({
+    # PDF
+    ".pdf",
+    # Microsoft Office
+    ".docx", ".doc", ".xlsx", ".xls", ".pptx", ".ppt",
+    # Images (raster -- OCR / vision parsing)
+    ".png", ".jpg", ".jpeg", ".bmp", ".tiff", ".tif",
+    # Rich text / e-book
+    ".rtf", ".epub",
+    # OpenDocument
+    ".odt", ".ods", ".odp",
+    # Other (LlamaParse / Unstructured specific)
+    ".hwpx",
+})
+
+
+def is_supported_document_extension(filename: str) -> bool:
+    """Return True if the file's extension is in the supported document set."""
+    suffix = PurePosixPath(filename).suffix.lower()
+    return suffix in DOCUMENT_EXTENSIONS
diff --git a/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py b/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py
new file mode 100644
index 000000000..adbad74c2
--- /dev/null
+++ b/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py
@@ -0,0 +1,22 @@
+"""Tests for Google Drive file type filtering."""
+
+import pytest
+
+from app.connectors.google_drive.file_types import should_skip_by_extension
+
+pytestmark = pytest.mark.unit
+
+
+@pytest.mark.parametrize("filename", [
+    "malware.exe", "archive.zip", "video.mov", "font.woff2", "model.blend",
+])
+def test_unsupported_extensions_are_skipped(filename):
+    assert should_skip_by_extension(filename) is True
+
+
+@pytest.mark.parametrize("filename", [
+    "report.pdf", "doc.docx", "sheet.xlsx", "slides.pptx",
+    "readme.txt", "data.csv", "photo.png", "notes.md",
+])
+def test_parseable_extensions_are_not_skipped(filename):
+    assert should_skip_by_extension(filename) is False
diff --git a/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py b/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py
new file mode 100644
index 000000000..a2491257d
--- /dev/null
+++ b/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py
@@ -0,0 +1,44 @@
+"""Tests for OneDrive file type filtering."""
+
+import pytest
+
+from app.connectors.onedrive.file_types import should_skip_file
+
+pytestmark = pytest.mark.unit
+
+
+def test_folder_is_skipped():
+    item = {"folder": {}, "name": "My Folder"}
+    assert should_skip_file(item) is True
+
+
+def test_remote_item_is_skipped():
+    item = {"remoteItem": {}, "name": "shared.docx"}
+    assert should_skip_file(item) is True
+
+
+def test_package_is_skipped():
+    item = {"package": {}, "name": "notebook"}
+    assert should_skip_file(item) is True
+
+
+def test_onenote_is_skipped():
+    item = {"name": "notes", "file": {"mimeType": "application/msonenote"}}
+    assert should_skip_file(item) is True
+
+
+@pytest.mark.parametrize("filename", [
+    "malware.exe", "archive.zip", "video.mov", "font.woff2", "model.blend",
+])
+def test_unsupported_extensions_are_skipped(filename):
+    item = {"name": filename, "file": {"mimeType": "application/octet-stream"}}
+    assert should_skip_file(item) is True, f"{filename} should be skipped"
+
+
+@pytest.mark.parametrize("filename", [
+    "report.pdf", "doc.docx", "sheet.xlsx", "slides.pptx",
+    "readme.txt", "data.csv", "photo.png", "notes.md",
+])
+def test_parseable_files_are_not_skipped(filename):
+    item = {"name": filename, "file": {"mimeType": "application/octet-stream"}}
+    assert should_skip_file(item) is False, f"{filename} should NOT be skipped"
diff --git a/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py b/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py
index 0d31507ca..facf15eab 100644
--- a/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py
+++ b/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py
@@ -257,7 +257,7 @@ async def test_extract_pdf_with_llamacloud(tmp_path, mocker):
 
 
 async def test_unknown_extension_uses_document_etl(tmp_path, mocker):
-    """An unknown extension (e.g. .docx) falls through to the document ETL path."""
+    """An allowlisted document extension (.docx) routes to the document ETL path."""
     docx_file = tmp_path / "doc.docx"
     docx_file.write_bytes(b"PK fake docx")
 
@@ -307,3 +307,73 @@ async def test_unknown_etl_service_raises(tmp_path, mocker):
         await EtlPipelineService().extract(
             EtlRequest(file_path=str(pdf_file), filename="report.pdf")
         )
+
+
+# ---------------------------------------------------------------------------
+# Slice 13 – unsupported file types are rejected before reaching any parser
+# ---------------------------------------------------------------------------
+
+
+def test_unknown_extension_classified_as_unsupported():
+    """An unknown extension defaults to UNSUPPORTED (allowlist behaviour)."""
+    from app.etl_pipeline.file_classifier import FileCategory, classify_file
+
+    assert classify_file("random.xyz") == FileCategory.UNSUPPORTED
+
+
+@pytest.mark.parametrize("filename", [
+    "malware.exe", "archive.zip", "video.mov", "font.woff2",
+    "model.blend", "data.parquet", "package.deb", "firmware.bin",
+])
+def test_unsupported_extensions_classified_correctly(filename):
+    """Extensions not in any allowlist are classified as UNSUPPORTED."""
+    from app.etl_pipeline.file_classifier import FileCategory, classify_file
+
+    assert classify_file(filename) == FileCategory.UNSUPPORTED
+
+
+@pytest.mark.parametrize("filename,expected", [
+    ("report.pdf", "document"),
+    ("doc.docx", "document"),
+    ("slides.pptx", "document"),
+    ("sheet.xlsx", "document"),
+    ("photo.png", "document"),
+    ("photo.jpg", "document"),
+    ("book.epub", "document"),
+    ("letter.odt", "document"),
+    ("readme.md", "plaintext"),
+    ("data.csv", "direct_convert"),
+])
+def test_parseable_extensions_classified_correctly(filename, expected):
+    """Parseable files are classified into their correct category."""
+    from app.etl_pipeline.file_classifier import FileCategory, classify_file
+
+    result = classify_file(filename)
+    assert result != FileCategory.UNSUPPORTED
+    assert result.value == expected
+
+
+async def test_extract_unsupported_file_raises_error(tmp_path):
+    """EtlPipelineService.extract() raises EtlUnsupportedFileError for .exe files."""
+    from app.etl_pipeline.exceptions import EtlUnsupportedFileError
+
+    exe_file = tmp_path / "program.exe"
+    exe_file.write_bytes(b"\x00" * 10)
+
+    with pytest.raises(EtlUnsupportedFileError, match="not supported"):
+        await EtlPipelineService().extract(
+            EtlRequest(file_path=str(exe_file), filename="program.exe")
+        )
+
+
+async def test_extract_zip_raises_unsupported_error(tmp_path):
+    """EtlPipelineService.extract() raises EtlUnsupportedFileError for .zip archives."""
+    from app.etl_pipeline.exceptions import EtlUnsupportedFileError
+
+    zip_file = tmp_path / "archive.zip"
+    zip_file.write_bytes(b"PK\x03\x04")
+
+    with pytest.raises(EtlUnsupportedFileError, match="not supported"):
+        await EtlPipelineService().extract(
+            EtlRequest(file_path=str(zip_file), filename="archive.zip")
+        )
diff --git a/surfsense_backend/tests/unit/utils/__init__.py b/surfsense_backend/tests/unit/utils/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/surfsense_backend/tests/unit/utils/test_file_extensions.py b/surfsense_backend/tests/unit/utils/test_file_extensions.py
new file mode 100644
index 000000000..a376f44bd
--- /dev/null
+++ b/surfsense_backend/tests/unit/utils/test_file_extensions.py
@@ -0,0 +1,42 @@
+"""Tests for the DOCUMENT_EXTENSIONS allowlist module."""
+
+import pytest
+
+pytestmark = pytest.mark.unit
+
+
+def test_pdf_is_supported_document():
+    from app.utils.file_extensions import is_supported_document_extension
+
+    assert is_supported_document_extension("report.pdf") is True
+
+
+def test_exe_is_not_supported_document():
+    from app.utils.file_extensions import is_supported_document_extension
+
+    assert is_supported_document_extension("malware.exe") is False
+
+
+@pytest.mark.parametrize("filename", [
+    "report.pdf", "doc.docx", "old.doc",
+    "sheet.xlsx", "legacy.xls",
+    "slides.pptx", "deck.ppt",
+    "photo.png", "photo.jpg", "photo.jpeg", "scan.bmp", "scan.tiff", "scan.tif",
+    "manual.rtf", "book.epub",
+    "letter.odt", "data.ods", "presentation.odp",
+    "korean.hwpx",
+])
+def test_document_extensions_are_supported(filename):
+    from app.utils.file_extensions import is_supported_document_extension
+
+    assert is_supported_document_extension(filename) is True, f"{filename} should be supported"
+
+
+@pytest.mark.parametrize("filename", [
+    "malware.exe", "archive.zip", "video.mov", "font.woff2",
+    "model.blend", "random.xyz", "data.parquet", "package.deb",
+])
+def test_non_document_extensions_are_not_supported(filename):
+    from app.utils.file_extensions import is_supported_document_extension
+
+    assert is_supported_document_extension(filename) is False, f"{filename} should NOT be supported"

From 0fb92b7c566cb48f95501dcf8f9a1ec6ea31b3d0 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Mon, 6 Apr 2026 22:17:50 +0530
Subject: [PATCH 143/202] refactor: streamline file skipping logic in Dropbox
 indexer by removing redundant checks, improving code clarity

---
 .../app/tasks/connector_indexers/dropbox_indexer.py           | 4 ----
 surfsense_backend/app/utils/file_extensions.py                | 2 +-
 2 files changed, 1 insertion(+), 5 deletions(-)

diff --git a/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py b/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
index ae46485cb..d116cc264 100644
--- a/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
@@ -337,10 +337,6 @@ async def _index_with_delta_sync(
         if tag != "file":
             continue
 
-        if skip_item(entry):
-            skipped += 1
-            continue
-
         skip, msg = await _should_skip_file(session, entry, search_space_id)
         if skip:
             if msg and "renamed" in msg.lower():
diff --git a/surfsense_backend/app/utils/file_extensions.py b/surfsense_backend/app/utils/file_extensions.py
index 5dac10842..b0a4c808c 100644
--- a/surfsense_backend/app/utils/file_extensions.py
+++ b/surfsense_backend/app/utils/file_extensions.py
@@ -14,7 +14,7 @@ DOCUMENT_EXTENSIONS: frozenset[str] = frozenset({
     ".pdf",
     # Microsoft Office
     ".docx", ".doc", ".xlsx", ".xls", ".pptx", ".ppt",
-    # Images (raster -- OCR / vision parsing)
+    # Images (raster: OCR / vision parsing)
     ".png", ".jpg", ".jpeg", ".bmp", ".tiff", ".tif",
     # Rich text / e-book
     ".rtf", ".epub",

From f03bf05aaa6269cbcf937f55d58c779c249b5614 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Mon, 6 Apr 2026 22:34:49 +0530
Subject: [PATCH 144/202] refactor: enhance Google Drive indexer to support
 file extension filtering, improving file handling and error reporting

---
 .../google_drive_indexer.py                   |  7 +++-
 .../integration/document_upload/conftest.py   | 20 ++++-------
 .../test_dropbox_parallel.py                  | 34 +++++++++++++++++++
 3 files changed, 46 insertions(+), 15 deletions(-)

diff --git a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
index 5e9e0f62f..9c53092f5 100644
--- a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
@@ -25,7 +25,10 @@ from app.connectors.google_drive import (
     get_files_in_folder,
     get_start_page_token,
 )
-from app.connectors.google_drive.file_types import should_skip_file as skip_mime
+from app.connectors.google_drive.file_types import (
+    should_skip_by_extension,
+    should_skip_file as skip_mime,
+)
 from app.db import Document, DocumentStatus, DocumentType, SearchSourceConnectorType
 from app.indexing_pipeline.connector_document import ConnectorDocument
 from app.indexing_pipeline.document_hashing import compute_identifier_hash
@@ -78,6 +81,8 @@ async def _should_skip_file(
 
     if skip_mime(mime_type):
         return True, "folder/shortcut"
+    if should_skip_by_extension(file_name):
+        return True, "unsupported extension"
     if not file_id:
         return True, "missing file_id"
 
diff --git a/surfsense_backend/tests/integration/document_upload/conftest.py b/surfsense_backend/tests/integration/document_upload/conftest.py
index 41c379e58..62f4f6b47 100644
--- a/surfsense_backend/tests/integration/document_upload/conftest.py
+++ b/surfsense_backend/tests/integration/document_upload/conftest.py
@@ -319,31 +319,23 @@ def _mock_etl_parsing(monkeypatch):
 
     # -- LlamaParse mock (external API) --------------------------------
 
-    class _FakeMarkdownDoc:
-        def __init__(self, text: str):
-            self.text = text
-
-    class _FakeLlamaParseResult:
-        async def aget_markdown_documents(self, *, split_by_page=False):
-            return [_FakeMarkdownDoc(_MOCK_ETL_MARKDOWN)]
-
-    async def _fake_llamacloud_parse(**kwargs):
-        _reject_empty(kwargs["file_path"])
-        return _FakeLlamaParseResult()
+    async def _fake_llamacloud_parse(file_path: str, estimated_pages: int) -> str:
+        _reject_empty(file_path)
+        return _MOCK_ETL_MARKDOWN
 
     monkeypatch.setattr(
-        "app.tasks.document_processors.file_processors.parse_with_llamacloud_retry",
+        "app.etl_pipeline.parsers.llamacloud.parse_with_llamacloud",
         _fake_llamacloud_parse,
     )
 
     # -- Docling mock (heavy library boundary) -------------------------
 
-    async def _fake_docling_parse(file_path: str, filename: str):
+    async def _fake_docling_parse(file_path: str, filename: str) -> str:
         _reject_empty(file_path)
         return _MOCK_ETL_MARKDOWN
 
     monkeypatch.setattr(
-        "app.tasks.document_processors.file_processors.parse_with_docling",
+        "app.etl_pipeline.parsers.docling.parse_with_docling",
         _fake_docling_parse,
     )
 
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py b/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
index 737e2c850..7a828b9c4 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
@@ -272,6 +272,23 @@ def full_scan_mocks(mock_dropbox_client, monkeypatch):
     download_and_index_mock = AsyncMock(return_value=(0, 0))
     monkeypatch.setattr(_mod, "_download_and_index", download_and_index_mock)
 
+    from app.services.page_limit_service import PageLimitService as _RealPLS
+
+    mock_page_limit_instance = MagicMock()
+    mock_page_limit_instance.get_page_usage = AsyncMock(return_value=(0, 999_999))
+    mock_page_limit_instance.update_page_usage = AsyncMock()
+
+    class _MockPageLimitService:
+        estimate_pages_from_metadata = staticmethod(
+            _RealPLS.estimate_pages_from_metadata
+        )
+
+        def __init__(self, session):
+            self.get_page_usage = mock_page_limit_instance.get_page_usage
+            self.update_page_usage = mock_page_limit_instance.update_page_usage
+
+    monkeypatch.setattr(_mod, "PageLimitService", _MockPageLimitService)
+
     return {
         "dropbox_client": mock_dropbox_client,
         "session": mock_session,
@@ -377,6 +394,23 @@ def selected_files_mocks(mock_dropbox_client, monkeypatch):
     download_and_index_mock = AsyncMock(return_value=(0, 0))
     monkeypatch.setattr(_mod, "_download_and_index", download_and_index_mock)
 
+    from app.services.page_limit_service import PageLimitService as _RealPLS
+
+    mock_page_limit_instance = MagicMock()
+    mock_page_limit_instance.get_page_usage = AsyncMock(return_value=(0, 999_999))
+    mock_page_limit_instance.update_page_usage = AsyncMock()
+
+    class _MockPageLimitService:
+        estimate_pages_from_metadata = staticmethod(
+            _RealPLS.estimate_pages_from_metadata
+        )
+
+        def __init__(self, session):
+            self.get_page_usage = mock_page_limit_instance.get_page_usage
+            self.update_page_usage = mock_page_limit_instance.update_page_usage
+
+    monkeypatch.setattr(_mod, "PageLimitService", _MockPageLimitService)
+
     return {
         "dropbox_client": mock_dropbox_client,
         "session": mock_session,

From e7beeb2a3600b657d9d585d6ce3be0d7bc53b224 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Tue, 7 Apr 2026 02:19:31 +0530
Subject: [PATCH 145/202] refactor: unify file skipping logic across Dropbox,
 Google Drive, and OneDrive connectors by replacing classification checks with
 a centralized service-based approach, enhancing maintainability and
 consistency in file handling

---
 .../app/connectors/dropbox/file_types.py      |  6 +-
 .../app/connectors/google_drive/file_types.py |  8 +-
 .../app/connectors/onedrive/file_types.py     |  6 +-
 .../app/etl_pipeline/etl_pipeline_service.py  | 11 +++
 .../app/etl_pipeline/file_classifier.py       | 19 ++++-
 .../app/utils/file_extensions.py              | 76 ++++++++++++++-----
 .../test_dropbox_parallel.py                  |  2 +
 .../connectors/test_dropbox_file_types.py     | 73 ++++++++++++++----
 .../test_google_drive_file_types.py           | 33 +++++++-
 .../connectors/test_onedrive_file_types.py    | 37 ++++++++-
 .../etl_pipeline/test_etl_pipeline_service.py | 69 +++++++++++++++++
 .../tests/unit/utils/test_file_extensions.py  | 76 ++++++++++++++++++-
 .../components/sources/DocumentUploadTab.tsx  | 39 +++++-----
 13 files changed, 388 insertions(+), 67 deletions(-)

diff --git a/surfsense_backend/app/connectors/dropbox/file_types.py b/surfsense_backend/app/connectors/dropbox/file_types.py
index 7b72c1857..13209ffd2 100644
--- a/surfsense_backend/app/connectors/dropbox/file_types.py
+++ b/surfsense_backend/app/connectors/dropbox/file_types.py
@@ -1,6 +1,6 @@
 """File type handlers for Dropbox."""
 
-from app.etl_pipeline.file_classifier import FileCategory, classify_file
+from app.etl_pipeline.file_classifier import should_skip_for_service
 
 PAPER_EXTENSION = ".paper"
 
@@ -53,5 +53,7 @@ def should_skip_file(item: dict) -> bool:
         return False
     if not item.get("is_downloadable", True):
         return True
+    from app.config import config as app_config
+
     name = item.get("name", "")
-    return classify_file(name) == FileCategory.UNSUPPORTED
+    return should_skip_for_service(name, app_config.ETL_SERVICE)
diff --git a/surfsense_backend/app/connectors/google_drive/file_types.py b/surfsense_backend/app/connectors/google_drive/file_types.py
index e0b8f001e..73f016ceb 100644
--- a/surfsense_backend/app/connectors/google_drive/file_types.py
+++ b/surfsense_backend/app/connectors/google_drive/file_types.py
@@ -1,6 +1,6 @@
 """File type handlers for Google Drive."""
 
-from app.etl_pipeline.file_classifier import FileCategory, classify_file
+from app.etl_pipeline.file_classifier import should_skip_for_service
 
 GOOGLE_DOC = "application/vnd.google-apps.document"
 GOOGLE_SHEET = "application/vnd.google-apps.spreadsheet"
@@ -49,8 +49,10 @@ def should_skip_file(mime_type: str) -> bool:
 
 
 def should_skip_by_extension(filename: str) -> bool:
-    """Return True if the file extension is not parseable by any ETL pipeline."""
-    return classify_file(filename) == FileCategory.UNSUPPORTED
+    """Return True if the file extension is not parseable by the configured ETL service."""
+    from app.config import config as app_config
+
+    return should_skip_for_service(filename, app_config.ETL_SERVICE)
 
 
 def get_export_mime_type(mime_type: str) -> str | None:
diff --git a/surfsense_backend/app/connectors/onedrive/file_types.py b/surfsense_backend/app/connectors/onedrive/file_types.py
index bcd78b711..f9c147da8 100644
--- a/surfsense_backend/app/connectors/onedrive/file_types.py
+++ b/surfsense_backend/app/connectors/onedrive/file_types.py
@@ -1,6 +1,6 @@
 """File type handlers for Microsoft OneDrive."""
 
-from app.etl_pipeline.file_classifier import FileCategory, classify_file
+from app.etl_pipeline.file_classifier import should_skip_for_service
 
 ONEDRIVE_FOLDER_FACET = "folder"
 ONENOTE_MIME = "application/msonenote"
@@ -51,5 +51,7 @@ def should_skip_file(item: dict) -> bool:
     mime = item.get("file", {}).get("mimeType", "")
     if mime in SKIP_MIME_TYPES:
         return True
+    from app.config import config as app_config
+
     name = item.get("name", "")
-    return classify_file(name) == FileCategory.UNSUPPORTED
+    return should_skip_for_service(name, app_config.ETL_SERVICE)
diff --git a/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py b/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py
index 7c67d2345..a0041c843 100644
--- a/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py
+++ b/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py
@@ -45,6 +45,10 @@ class EtlPipelineService:
         return await self._extract_document(request)
 
     async def _extract_document(self, request: EtlRequest) -> EtlResult:
+        from pathlib import PurePosixPath
+
+        from app.utils.file_extensions import get_document_extensions_for_service
+
         etl_service = app_config.ETL_SERVICE
         if not etl_service:
             raise EtlServiceUnavailableError(
@@ -52,6 +56,13 @@ class EtlPipelineService:
                 "Set ETL_SERVICE to UNSTRUCTURED, LLAMACLOUD, or DOCLING in your .env"
             )
 
+        ext = PurePosixPath(request.filename).suffix.lower()
+        supported = get_document_extensions_for_service(etl_service)
+        if ext not in supported:
+            raise EtlUnsupportedFileError(
+                f"File type {ext} is not supported by {etl_service}"
+            )
+
         if etl_service == "DOCLING":
             from app.etl_pipeline.parsers.docling import parse_with_docling
 
diff --git a/surfsense_backend/app/etl_pipeline/file_classifier.py b/surfsense_backend/app/etl_pipeline/file_classifier.py
index eea9cce22..bc7b4537c 100644
--- a/surfsense_backend/app/etl_pipeline/file_classifier.py
+++ b/surfsense_backend/app/etl_pipeline/file_classifier.py
@@ -1,7 +1,7 @@
 from enum import Enum
 from pathlib import PurePosixPath
 
-from app.utils.file_extensions import DOCUMENT_EXTENSIONS
+from app.utils.file_extensions import DOCUMENT_EXTENSIONS, get_document_extensions_for_service
 
 PLAINTEXT_EXTENSIONS = frozenset(
     {
@@ -29,7 +29,7 @@ AUDIO_EXTENSIONS = frozenset(
     {".mp3", ".mp4", ".mpeg", ".mpga", ".m4a", ".wav", ".webm"}
 )
 
-DIRECT_CONVERT_EXTENSIONS = frozenset({".csv", ".tsv", ".html", ".htm"})
+DIRECT_CONVERT_EXTENSIONS = frozenset({".csv", ".tsv", ".html", ".htm", ".xhtml"})
 
 
 class FileCategory(Enum):
@@ -51,3 +51,18 @@ def classify_file(filename: str) -> FileCategory:
     if suffix in DOCUMENT_EXTENSIONS:
         return FileCategory.DOCUMENT
     return FileCategory.UNSUPPORTED
+
+
+def should_skip_for_service(filename: str, etl_service: str | None) -> bool:
+    """Return True if *filename* cannot be processed by *etl_service*.
+
+    Plaintext, audio, and direct-convert files are parser-agnostic and never
+    skipped.  Document files are checked against the per-parser extension set.
+    """
+    category = classify_file(filename)
+    if category == FileCategory.UNSUPPORTED:
+        return True
+    if category == FileCategory.DOCUMENT:
+        suffix = PurePosixPath(filename).suffix.lower()
+        return suffix not in get_document_extensions_for_service(etl_service)
+    return False
diff --git a/surfsense_backend/app/utils/file_extensions.py b/surfsense_backend/app/utils/file_extensions.py
index b0a4c808c..5eed36872 100644
--- a/surfsense_backend/app/utils/file_extensions.py
+++ b/surfsense_backend/app/utils/file_extensions.py
@@ -1,29 +1,69 @@
-"""Allowlist of document extensions the ETL parsers can handle.
+"""Per-parser document extension sets for the ETL pipeline.
 
-Every consumer (file_classifier, connector-level skip checks) imports from
-here so there is a single source of truth.  Extensions already covered by
-PLAINTEXT_EXTENSIONS, AUDIO_EXTENSIONS, or DIRECT_CONVERT_EXTENSIONS in
-file_classifier are NOT repeated here -- this set is exclusively for the
-"document" ETL path (Docling / LlamaParse / Unstructured).
+Every consumer (file_classifier, connector-level skip checks, ETL pipeline
+validation) imports from here so there is a single source of truth.
+
+Extensions already covered by PLAINTEXT_EXTENSIONS, AUDIO_EXTENSIONS, or
+DIRECT_CONVERT_EXTENSIONS in file_classifier are NOT repeated here -- these
+sets are exclusively for the "document" ETL path (Docling / LlamaParse /
+Unstructured).
 """
 
 from pathlib import PurePosixPath
 
-DOCUMENT_EXTENSIONS: frozenset[str] = frozenset({
-    # PDF
+# ---------------------------------------------------------------------------
+# Per-parser document extension sets (from official documentation)
+# ---------------------------------------------------------------------------
+
+DOCLING_DOCUMENT_EXTENSIONS: frozenset[str] = frozenset({
     ".pdf",
-    # Microsoft Office
-    ".docx", ".doc", ".xlsx", ".xls", ".pptx", ".ppt",
-    # Images (raster: OCR / vision parsing)
-    ".png", ".jpg", ".jpeg", ".bmp", ".tiff", ".tif",
-    # Rich text / e-book
-    ".rtf", ".epub",
-    # OpenDocument
-    ".odt", ".ods", ".odp",
-    # Other (LlamaParse / Unstructured specific)
-    ".hwpx",
+    ".docx", ".xlsx", ".pptx",
+    ".png", ".jpg", ".jpeg", ".tiff", ".tif", ".bmp", ".webp",
 })
 
+LLAMAPARSE_DOCUMENT_EXTENSIONS: frozenset[str] = frozenset({
+    ".pdf",
+    ".docx", ".doc", ".xlsx", ".xls", ".pptx", ".ppt",
+    ".docm", ".dot", ".dotm", ".pptm", ".pot", ".potx",
+    ".xlsm", ".xlsb", ".xlw",
+    ".rtf", ".epub",
+    ".png", ".jpg", ".jpeg", ".gif", ".bmp", ".tiff", ".tif", ".webp", ".svg",
+    ".odt", ".ods", ".odp",
+    ".hwp", ".hwpx",
+})
+
+UNSTRUCTURED_DOCUMENT_EXTENSIONS: frozenset[str] = frozenset({
+    ".pdf",
+    ".docx", ".doc", ".xlsx", ".xls", ".pptx", ".ppt",
+    ".png", ".jpg", ".jpeg", ".bmp", ".tiff", ".tif", ".heic",
+    ".rtf", ".epub", ".odt",
+    ".eml", ".msg", ".p7s",
+})
+
+# ---------------------------------------------------------------------------
+# Union (used by classify_file for routing) + service lookup
+# ---------------------------------------------------------------------------
+
+DOCUMENT_EXTENSIONS: frozenset[str] = (
+    DOCLING_DOCUMENT_EXTENSIONS
+    | LLAMAPARSE_DOCUMENT_EXTENSIONS
+    | UNSTRUCTURED_DOCUMENT_EXTENSIONS
+)
+
+_SERVICE_MAP: dict[str, frozenset[str]] = {
+    "DOCLING": DOCLING_DOCUMENT_EXTENSIONS,
+    "LLAMACLOUD": LLAMAPARSE_DOCUMENT_EXTENSIONS,
+    "UNSTRUCTURED": UNSTRUCTURED_DOCUMENT_EXTENSIONS,
+}
+
+
+def get_document_extensions_for_service(etl_service: str | None) -> frozenset[str]:
+    """Return the document extensions supported by *etl_service*.
+
+    Falls back to the full union when the service is ``None`` or unknown.
+    """
+    return _SERVICE_MAP.get(etl_service or "", DOCUMENT_EXTENSIONS)
+
 
 def is_supported_document_extension(filename: str) -> bool:
     """Return True if the file's extension is in the supported document set."""
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py b/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
index 7a828b9c4..8572fa8ea 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
@@ -261,6 +261,8 @@ def full_scan_mocks(mock_dropbox_client, monkeypatch):
 
     skip_results: dict[str, tuple[bool, str | None]] = {}
 
+    monkeypatch.setattr("app.config.config.ETL_SERVICE", "LLAMACLOUD")
+
     async def _fake_skip(session, file, search_space_id):
         from app.connectors.dropbox.file_types import should_skip_file as _skip
         if _skip(file):
diff --git a/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py b/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py
index 5480d8c8a..e092872c5 100644
--- a/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py
+++ b/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py
@@ -7,6 +7,11 @@ from app.connectors.dropbox.file_types import should_skip_file
 pytestmark = pytest.mark.unit
 
 
+# ---------------------------------------------------------------------------
+# Structural skips (independent of ETL service)
+# ---------------------------------------------------------------------------
+
+
 def test_folder_item_is_skipped():
     item = {".tag": "folder", "name": "My Folder"}
     assert should_skip_file(item) is True
@@ -22,13 +27,18 @@ def test_non_downloadable_item_is_skipped():
     assert should_skip_file(item) is True
 
 
+# ---------------------------------------------------------------------------
+# Extension-based skips (require ETL service context)
+# ---------------------------------------------------------------------------
+
+
 @pytest.mark.parametrize(
     "filename",
     [
         "archive.zip", "backup.tar", "data.gz", "stuff.rar", "pack.7z",
         "program.exe", "lib.dll", "module.so", "image.dmg", "disk.iso",
         "movie.mov", "clip.avi", "video.mkv", "film.wmv", "stream.flv",
-        "icon.svg", "anim.gif", "photo.webp", "shot.heic", "favicon.ico",
+        "favicon.ico",
         "raw.cr2", "photo.nef", "image.arw", "pic.dng",
         "design.psd", "vector.ai", "mockup.sketch", "proto.fig",
         "font.ttf", "font.otf", "font.woff", "font.woff2",
@@ -36,7 +46,8 @@ def test_non_downloadable_item_is_skipped():
         "local.db", "data.sqlite", "access.mdb",
     ],
 )
-def test_non_parseable_extensions_are_skipped(filename):
+def test_non_parseable_extensions_are_skipped(filename, mocker):
+    mocker.patch("app.config.config.ETL_SERVICE", "DOCLING")
     item = {".tag": "file", "name": filename}
     assert should_skip_file(item) is True, f"{filename} should be skipped"
 
@@ -45,29 +56,61 @@ def test_non_parseable_extensions_are_skipped(filename):
     "filename",
     [
         "report.pdf", "document.docx", "sheet.xlsx", "slides.pptx",
-        "old.doc", "legacy.xls", "deck.ppt",
         "readme.txt", "data.csv", "page.html", "notes.md",
         "config.json", "feed.xml",
     ],
 )
-def test_parseable_documents_are_not_skipped(filename):
-    item = {".tag": "file", "name": filename}
-    assert should_skip_file(item) is False, f"{filename} should NOT be skipped"
+def test_parseable_documents_are_not_skipped(filename, mocker):
+    """Files in plaintext/direct_convert/universal document sets are never skipped."""
+    for service in ("DOCLING", "LLAMACLOUD", "UNSTRUCTURED"):
+        mocker.patch("app.config.config.ETL_SERVICE", service)
+        item = {".tag": "file", "name": filename}
+        assert should_skip_file(item) is False, (
+            f"{filename} should NOT be skipped with {service}"
+        )
 
 
 @pytest.mark.parametrize(
     "filename",
     ["photo.jpg", "image.jpeg", "screenshot.png", "scan.bmp", "page.tiff", "doc.tif"],
 )
-def test_universal_images_are_not_skipped(filename):
-    item = {".tag": "file", "name": filename}
-    assert should_skip_file(item) is False, f"{filename} should NOT be skipped"
+def test_universal_images_are_not_skipped(filename, mocker):
+    """Images supported by all parsers are never skipped."""
+    for service in ("DOCLING", "LLAMACLOUD", "UNSTRUCTURED"):
+        mocker.patch("app.config.config.ETL_SERVICE", service)
+        item = {".tag": "file", "name": filename}
+        assert should_skip_file(item) is False, (
+            f"{filename} should NOT be skipped with {service}"
+        )
 
 
-@pytest.mark.parametrize(
-    "filename",
-    ["icon.svg", "anim.gif", "photo.webp", "live.heic"],
-)
-def test_non_universal_images_are_skipped(filename):
+@pytest.mark.parametrize("filename,service,expected_skip", [
+    ("old.doc", "DOCLING", True),
+    ("old.doc", "LLAMACLOUD", False),
+    ("old.doc", "UNSTRUCTURED", False),
+    ("legacy.xls", "DOCLING", True),
+    ("legacy.xls", "LLAMACLOUD", False),
+    ("legacy.xls", "UNSTRUCTURED", False),
+    ("deck.ppt", "DOCLING", True),
+    ("deck.ppt", "LLAMACLOUD", False),
+    ("deck.ppt", "UNSTRUCTURED", False),
+    ("icon.svg", "DOCLING", True),
+    ("icon.svg", "LLAMACLOUD", False),
+    ("anim.gif", "DOCLING", True),
+    ("anim.gif", "LLAMACLOUD", False),
+    ("photo.webp", "DOCLING", False),
+    ("photo.webp", "LLAMACLOUD", False),
+    ("photo.webp", "UNSTRUCTURED", True),
+    ("live.heic", "DOCLING", True),
+    ("live.heic", "UNSTRUCTURED", False),
+    ("macro.docm", "DOCLING", True),
+    ("macro.docm", "LLAMACLOUD", False),
+    ("mail.eml", "DOCLING", True),
+    ("mail.eml", "UNSTRUCTURED", False),
+])
+def test_parser_specific_extensions(filename, service, expected_skip, mocker):
+    mocker.patch("app.config.config.ETL_SERVICE", service)
     item = {".tag": "file", "name": filename}
-    assert should_skip_file(item) is True, f"{filename} should be skipped"
+    assert should_skip_file(item) is expected_skip, (
+        f"{filename} with {service}: expected skip={expected_skip}"
+    )
diff --git a/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py b/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py
index adbad74c2..4ed7eb4db 100644
--- a/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py
+++ b/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py
@@ -10,13 +10,38 @@ pytestmark = pytest.mark.unit
 @pytest.mark.parametrize("filename", [
     "malware.exe", "archive.zip", "video.mov", "font.woff2", "model.blend",
 ])
-def test_unsupported_extensions_are_skipped(filename):
-    assert should_skip_by_extension(filename) is True
+def test_unsupported_extensions_are_skipped_regardless_of_service(filename, mocker):
+    """Truly unsupported files are skipped no matter which ETL service is configured."""
+    for service in ("DOCLING", "LLAMACLOUD", "UNSTRUCTURED"):
+        mocker.patch("app.config.config.ETL_SERVICE", service)
+        assert should_skip_by_extension(filename) is True
 
 
 @pytest.mark.parametrize("filename", [
     "report.pdf", "doc.docx", "sheet.xlsx", "slides.pptx",
     "readme.txt", "data.csv", "photo.png", "notes.md",
 ])
-def test_parseable_extensions_are_not_skipped(filename):
-    assert should_skip_by_extension(filename) is False
+def test_universal_extensions_are_not_skipped(filename, mocker):
+    """Files supported by all parsers (or handled by plaintext/direct_convert) are never skipped."""
+    for service in ("DOCLING", "LLAMACLOUD", "UNSTRUCTURED"):
+        mocker.patch("app.config.config.ETL_SERVICE", service)
+        assert should_skip_by_extension(filename) is False, (
+            f"{filename} should NOT be skipped with {service}"
+        )
+
+
+@pytest.mark.parametrize("filename,service,expected_skip", [
+    ("macro.docm", "DOCLING", True),
+    ("macro.docm", "LLAMACLOUD", False),
+    ("mail.eml", "DOCLING", True),
+    ("mail.eml", "UNSTRUCTURED", False),
+    ("photo.gif", "DOCLING", True),
+    ("photo.gif", "LLAMACLOUD", False),
+    ("photo.heic", "UNSTRUCTURED", False),
+    ("photo.heic", "DOCLING", True),
+])
+def test_parser_specific_extensions(filename, service, expected_skip, mocker):
+    mocker.patch("app.config.config.ETL_SERVICE", service)
+    assert should_skip_by_extension(filename) is expected_skip, (
+        f"{filename} with {service}: expected skip={expected_skip}"
+    )
diff --git a/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py b/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py
index a2491257d..e73f799e2 100644
--- a/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py
+++ b/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py
@@ -7,6 +7,11 @@ from app.connectors.onedrive.file_types import should_skip_file
 pytestmark = pytest.mark.unit
 
 
+# ---------------------------------------------------------------------------
+# Structural skips (independent of ETL service)
+# ---------------------------------------------------------------------------
+
+
 def test_folder_is_skipped():
     item = {"folder": {}, "name": "My Folder"}
     assert should_skip_file(item) is True
@@ -27,10 +32,16 @@ def test_onenote_is_skipped():
     assert should_skip_file(item) is True
 
 
+# ---------------------------------------------------------------------------
+# Extension-based skips (require ETL service context)
+# ---------------------------------------------------------------------------
+
+
 @pytest.mark.parametrize("filename", [
     "malware.exe", "archive.zip", "video.mov", "font.woff2", "model.blend",
 ])
-def test_unsupported_extensions_are_skipped(filename):
+def test_unsupported_extensions_are_skipped(filename, mocker):
+    mocker.patch("app.config.config.ETL_SERVICE", "DOCLING")
     item = {"name": filename, "file": {"mimeType": "application/octet-stream"}}
     assert should_skip_file(item) is True, f"{filename} should be skipped"
 
@@ -39,6 +50,26 @@ def test_unsupported_extensions_are_skipped(filename):
     "report.pdf", "doc.docx", "sheet.xlsx", "slides.pptx",
     "readme.txt", "data.csv", "photo.png", "notes.md",
 ])
-def test_parseable_files_are_not_skipped(filename):
+def test_universal_files_are_not_skipped(filename, mocker):
+    for service in ("DOCLING", "LLAMACLOUD", "UNSTRUCTURED"):
+        mocker.patch("app.config.config.ETL_SERVICE", service)
+        item = {"name": filename, "file": {"mimeType": "application/octet-stream"}}
+        assert should_skip_file(item) is False, (
+            f"{filename} should NOT be skipped with {service}"
+        )
+
+
+@pytest.mark.parametrize("filename,service,expected_skip", [
+    ("macro.docm", "DOCLING", True),
+    ("macro.docm", "LLAMACLOUD", False),
+    ("mail.eml", "DOCLING", True),
+    ("mail.eml", "UNSTRUCTURED", False),
+    ("photo.heic", "UNSTRUCTURED", False),
+    ("photo.heic", "DOCLING", True),
+])
+def test_parser_specific_extensions(filename, service, expected_skip, mocker):
+    mocker.patch("app.config.config.ETL_SERVICE", service)
     item = {"name": filename, "file": {"mimeType": "application/octet-stream"}}
-    assert should_skip_file(item) is False, f"{filename} should NOT be skipped"
+    assert should_skip_file(item) is expected_skip, (
+        f"{filename} with {service}: expected skip={expected_skip}"
+    )
diff --git a/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py b/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py
index facf15eab..e90847e3a 100644
--- a/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py
+++ b/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py
@@ -377,3 +377,72 @@ async def test_extract_zip_raises_unsupported_error(tmp_path):
         await EtlPipelineService().extract(
             EtlRequest(file_path=str(zip_file), filename="archive.zip")
         )
+
+
+# ---------------------------------------------------------------------------
+# Slice 14 – should_skip_for_service (per-parser document filtering)
+# ---------------------------------------------------------------------------
+
+
+@pytest.mark.parametrize("filename,etl_service,expected_skip", [
+    ("file.eml", "DOCLING", True),
+    ("file.eml", "UNSTRUCTURED", False),
+    ("file.docm", "LLAMACLOUD", False),
+    ("file.docm", "DOCLING", True),
+    ("file.txt", "DOCLING", False),
+    ("file.csv", "LLAMACLOUD", False),
+    ("file.mp3", "UNSTRUCTURED", False),
+    ("file.exe", "LLAMACLOUD", True),
+    ("file.pdf", "DOCLING", False),
+    ("file.webp", "DOCLING", False),
+    ("file.webp", "UNSTRUCTURED", True),
+    ("file.gif", "LLAMACLOUD", False),
+    ("file.gif", "DOCLING", True),
+    ("file.heic", "UNSTRUCTURED", False),
+    ("file.heic", "DOCLING", True),
+    ("file.svg", "LLAMACLOUD", False),
+    ("file.svg", "DOCLING", True),
+    ("file.p7s", "UNSTRUCTURED", False),
+    ("file.p7s", "LLAMACLOUD", True),
+])
+def test_should_skip_for_service(filename, etl_service, expected_skip):
+    from app.etl_pipeline.file_classifier import should_skip_for_service
+
+    assert should_skip_for_service(filename, etl_service) is expected_skip, (
+        f"{filename} with {etl_service}: expected skip={expected_skip}"
+    )
+
+
+# ---------------------------------------------------------------------------
+# Slice 14b – ETL pipeline rejects per-parser incompatible documents
+# ---------------------------------------------------------------------------
+
+
+async def test_extract_docm_with_docling_raises_unsupported(tmp_path, mocker):
+    """Docling cannot parse .docm -- pipeline should reject before dispatching."""
+    from app.etl_pipeline.exceptions import EtlUnsupportedFileError
+
+    mocker.patch("app.config.config.ETL_SERVICE", "DOCLING")
+
+    docm_file = tmp_path / "macro.docm"
+    docm_file.write_bytes(b"\x00" * 10)
+
+    with pytest.raises(EtlUnsupportedFileError, match="not supported by DOCLING"):
+        await EtlPipelineService().extract(
+            EtlRequest(file_path=str(docm_file), filename="macro.docm")
+        )
+
+
+async def test_extract_eml_with_docling_raises_unsupported(tmp_path, mocker):
+    """Docling cannot parse .eml -- pipeline should reject before dispatching."""
+    from app.etl_pipeline.exceptions import EtlUnsupportedFileError
+
+    mocker.patch("app.config.config.ETL_SERVICE", "DOCLING")
+
+    eml_file = tmp_path / "mail.eml"
+    eml_file.write_bytes(b"From: test@example.com")
+
+    with pytest.raises(EtlUnsupportedFileError, match="not supported by DOCLING"):
+        await EtlPipelineService().extract(
+            EtlRequest(file_path=str(eml_file), filename="mail.eml")
+        )
diff --git a/surfsense_backend/tests/unit/utils/test_file_extensions.py b/surfsense_backend/tests/unit/utils/test_file_extensions.py
index a376f44bd..acd8945ce 100644
--- a/surfsense_backend/tests/unit/utils/test_file_extensions.py
+++ b/surfsense_backend/tests/unit/utils/test_file_extensions.py
@@ -21,10 +21,17 @@ def test_exe_is_not_supported_document():
     "report.pdf", "doc.docx", "old.doc",
     "sheet.xlsx", "legacy.xls",
     "slides.pptx", "deck.ppt",
+    "macro.docm", "macro.xlsm", "macro.pptm",
     "photo.png", "photo.jpg", "photo.jpeg", "scan.bmp", "scan.tiff", "scan.tif",
+    "photo.webp", "anim.gif", "iphone.heic",
     "manual.rtf", "book.epub",
     "letter.odt", "data.ods", "presentation.odp",
-    "korean.hwpx",
+    "inbox.eml", "outlook.msg",
+    "korean.hwpx", "korean.hwp",
+    "template.dot", "template.dotm",
+    "template.pot", "template.potx",
+    "binary.xlsb", "workspace.xlw",
+    "vector.svg", "signature.p7s",
 ])
 def test_document_extensions_are_supported(filename):
     from app.utils.file_extensions import is_supported_document_extension
@@ -40,3 +47,70 @@ def test_non_document_extensions_are_not_supported(filename):
     from app.utils.file_extensions import is_supported_document_extension
 
     assert is_supported_document_extension(filename) is False, f"{filename} should NOT be supported"
+
+
+# ---------------------------------------------------------------------------
+# Per-parser extension sets
+# ---------------------------------------------------------------------------
+
+
+def test_union_equals_all_three_sets():
+    from app.utils.file_extensions import (
+        DOCLING_DOCUMENT_EXTENSIONS,
+        DOCUMENT_EXTENSIONS,
+        LLAMAPARSE_DOCUMENT_EXTENSIONS,
+        UNSTRUCTURED_DOCUMENT_EXTENSIONS,
+    )
+
+    expected = (
+        DOCLING_DOCUMENT_EXTENSIONS
+        | LLAMAPARSE_DOCUMENT_EXTENSIONS
+        | UNSTRUCTURED_DOCUMENT_EXTENSIONS
+    )
+    assert DOCUMENT_EXTENSIONS == expected
+
+
+def test_get_extensions_for_docling():
+    from app.utils.file_extensions import get_document_extensions_for_service
+
+    exts = get_document_extensions_for_service("DOCLING")
+    assert ".pdf" in exts
+    assert ".webp" in exts
+    assert ".docx" in exts
+    assert ".eml" not in exts
+    assert ".docm" not in exts
+    assert ".gif" not in exts
+    assert ".heic" not in exts
+
+
+def test_get_extensions_for_llamacloud():
+    from app.utils.file_extensions import get_document_extensions_for_service
+
+    exts = get_document_extensions_for_service("LLAMACLOUD")
+    assert ".docm" in exts
+    assert ".gif" in exts
+    assert ".svg" in exts
+    assert ".hwp" in exts
+    assert ".eml" not in exts
+    assert ".heic" not in exts
+
+
+def test_get_extensions_for_unstructured():
+    from app.utils.file_extensions import get_document_extensions_for_service
+
+    exts = get_document_extensions_for_service("UNSTRUCTURED")
+    assert ".eml" in exts
+    assert ".heic" in exts
+    assert ".p7s" in exts
+    assert ".docm" not in exts
+    assert ".gif" not in exts
+    assert ".svg" not in exts
+
+
+def test_get_extensions_for_none_returns_union():
+    from app.utils.file_extensions import (
+        DOCUMENT_EXTENSIONS,
+        get_document_extensions_for_service,
+    )
+
+    assert get_document_extensions_for_service(None) == DOCUMENT_EXTENSIONS
diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index 6b59f8ef6..c8ce195aa 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -85,7 +85,6 @@ const FILE_TYPE_CONFIG: Record<string, Record<string, string[]>> = {
 		"application/rtf": [".rtf"],
 		"application/xml": [".xml"],
 		"application/epub+zip": [".epub"],
-		"text/html": [".html", ".htm", ".web"],
 		"image/gif": [".gif"],
 		"image/svg+xml": [".svg"],
 		...audioFileTypes,
@@ -472,12 +471,13 @@ export function DocumentUploadTab({
 						</button>
 					))
 				) : (
-					<div
-						className="flex flex-col items-center gap-4 py-12 px-4 cursor-pointer"
-						onClick={() => {
-							if (!isElectron) fileInputRef.current?.click();
-						}}
-					>
+				<button
+					type="button"
+					className="flex flex-col items-center gap-4 py-12 px-4 cursor-pointer w-full bg-transparent border-none"
+					onClick={() => {
+						if (!isElectron) fileInputRef.current?.click();
+					}}
+				>
 						<Upload className="h-10 w-10 text-muted-foreground" />
 						<div className="text-center space-y-1.5">
 							<p className="text-base font-medium">
@@ -485,10 +485,11 @@ export function DocumentUploadTab({
 							</p>
 							<p className="text-sm text-muted-foreground">{t("file_size_limit")}</p>
 						</div>
-						<div className="w-full mt-1" onClick={(e) => e.stopPropagation()}>
-							{renderBrowseButton({ fullWidth: true })}
-						</div>
+					{/* biome-ignore lint/a11y/useSemanticElements: wrapper to stop click propagation to parent button */}
+					<div className="w-full mt-1" onClick={(e) => e.stopPropagation()} onKeyDown={(e) => e.stopPropagation()} role="group">
+						{renderBrowseButton({ fullWidth: true })}
 					</div>
+					</button>
 				)}
 			</div>
 
@@ -683,13 +684,17 @@ export function DocumentUploadTab({
 						</span>
 					</AccordionTrigger>
 					<AccordionContent className="px-3 pb-3">
-						<div className="flex flex-wrap gap-1">
-							{supportedExtensions.map((ext) => (
-								<Badge key={ext} variant="outline" className="text-[10px] px-1.5 py-0">
-									{ext}
-								</Badge>
-							))}
-						</div>
+					<div className="flex flex-wrap gap-1.5">
+						{supportedExtensions.map((ext) => (
+							<Badge
+								key={ext}
+								variant="secondary"
+								className="rounded border-0 bg-neutral-200/80 dark:bg-neutral-700/60 text-muted-foreground text-[10px] px-2 py-0.5 font-normal"
+							>
+								{ext}
+							</Badge>
+						))}
+					</div>
 					</AccordionContent>
 				</AccordionItem>
 			</Accordion>

From 3a1d7008174a43db3c13813a6237427587786ca8 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Tue, 7 Apr 2026 03:16:34 +0530
Subject: [PATCH 146/202] refactor: enhance file skipping logic across Dropbox,
 Google Drive, and OneDrive connectors to return unsupported extensions,
 improving error reporting and maintainability

---
 .../app/connectors/dropbox/file_types.py      | 17 +++-
 .../app/connectors/google_drive/file_types.py | 14 ++-
 .../app/connectors/onedrive/file_types.py     | 24 +++--
 .../routes/search_source_connectors_routes.py | 11 ++-
 .../app/services/notification_service.py      | 47 +++++-----
 .../connector_indexers/dropbox_indexer.py     | 93 +++++++++++++------
 .../google_drive_indexer.py                   | 90 ++++++++++++------
 .../connector_indexers/onedrive_indexer.py    | 79 ++++++++++------
 .../test_dropbox_parallel.py                  | 13 ++-
 .../test_google_drive_parallel.py             |  2 +-
 .../connector_indexers/test_page_limits.py    |  4 +-
 .../connectors/test_dropbox_file_types.py     | 44 ++++++---
 .../test_google_drive_file_types.py           | 24 ++++-
 .../connectors/test_onedrive_file_types.py    | 42 +++++++--
 14 files changed, 344 insertions(+), 160 deletions(-)

diff --git a/surfsense_backend/app/connectors/dropbox/file_types.py b/surfsense_backend/app/connectors/dropbox/file_types.py
index 13209ffd2..d26306665 100644
--- a/surfsense_backend/app/connectors/dropbox/file_types.py
+++ b/surfsense_backend/app/connectors/dropbox/file_types.py
@@ -42,18 +42,25 @@ def is_paper_file(item: dict) -> bool:
     return ext == PAPER_EXTENSION
 
 
-def should_skip_file(item: dict) -> bool:
+def should_skip_file(item: dict) -> tuple[bool, str | None]:
     """Skip folders and truly non-indexable files.
 
     Paper docs are non-downloadable but exportable, so they are NOT skipped.
+    Returns (should_skip, unsupported_extension_or_None).
     """
     if is_folder(item):
-        return True
+        return True, None
     if is_paper_file(item):
-        return False
+        return False, None
     if not item.get("is_downloadable", True):
-        return True
+        return True, None
+
+    from pathlib import PurePosixPath
+
     from app.config import config as app_config
 
     name = item.get("name", "")
-    return should_skip_for_service(name, app_config.ETL_SERVICE)
+    if should_skip_for_service(name, app_config.ETL_SERVICE):
+        ext = PurePosixPath(name).suffix.lower()
+        return True, ext
+    return False, None
diff --git a/surfsense_backend/app/connectors/google_drive/file_types.py b/surfsense_backend/app/connectors/google_drive/file_types.py
index 73f016ceb..75dc1d4b3 100644
--- a/surfsense_backend/app/connectors/google_drive/file_types.py
+++ b/surfsense_backend/app/connectors/google_drive/file_types.py
@@ -48,11 +48,19 @@ def should_skip_file(mime_type: str) -> bool:
     return mime_type in [GOOGLE_FOLDER, GOOGLE_SHORTCUT]
 
 
-def should_skip_by_extension(filename: str) -> bool:
-    """Return True if the file extension is not parseable by the configured ETL service."""
+def should_skip_by_extension(filename: str) -> tuple[bool, str | None]:
+    """Check if the file extension is not parseable by the configured ETL service.
+
+    Returns (should_skip, unsupported_extension_or_None).
+    """
+    from pathlib import PurePosixPath
+
     from app.config import config as app_config
 
-    return should_skip_for_service(filename, app_config.ETL_SERVICE)
+    if should_skip_for_service(filename, app_config.ETL_SERVICE):
+        ext = PurePosixPath(filename).suffix.lower()
+        return True, ext
+    return False, None
 
 
 def get_export_mime_type(mime_type: str) -> str | None:
diff --git a/surfsense_backend/app/connectors/onedrive/file_types.py b/surfsense_backend/app/connectors/onedrive/file_types.py
index f9c147da8..942b0be73 100644
--- a/surfsense_backend/app/connectors/onedrive/file_types.py
+++ b/surfsense_backend/app/connectors/onedrive/file_types.py
@@ -40,18 +40,28 @@ def is_folder(item: dict) -> bool:
     return ONEDRIVE_FOLDER_FACET in item
 
 
-def should_skip_file(item: dict) -> bool:
-    """Skip folders, OneNote files, remote items (shared links), packages, and unsupported extensions."""
+def should_skip_file(item: dict) -> tuple[bool, str | None]:
+    """Skip folders, OneNote files, remote items, packages, and unsupported extensions.
+
+    Returns (should_skip, unsupported_extension_or_None).
+    The second element is only set when the skip is due to an unsupported extension.
+    """
     if is_folder(item):
-        return True
+        return True, None
     if "remoteItem" in item:
-        return True
+        return True, None
     if "package" in item:
-        return True
+        return True, None
     mime = item.get("file", {}).get("mimeType", "")
     if mime in SKIP_MIME_TYPES:
-        return True
+        return True, None
+
+    from pathlib import PurePosixPath
+
     from app.config import config as app_config
 
     name = item.get("name", "")
-    return should_skip_for_service(name, app_config.ETL_SERVICE)
+    if should_skip_for_service(name, app_config.ETL_SERVICE):
+        ext = PurePosixPath(name).suffix.lower()
+        return True, ext
+    return False, None
diff --git a/surfsense_backend/app/routes/search_source_connectors_routes.py b/surfsense_backend/app/routes/search_source_connectors_routes.py
index d208ff910..a30eb7297 100644
--- a/surfsense_backend/app/routes/search_source_connectors_routes.py
+++ b/surfsense_backend/app/routes/search_source_connectors_routes.py
@@ -2477,6 +2477,8 @@ async def run_google_drive_indexing(
                 stage="fetching",
             )
 
+        total_unsupported = 0
+
         # Index each folder with indexing options
         for folder in items.folders:
             try:
@@ -2484,6 +2486,7 @@ async def run_google_drive_indexing(
                     indexed_count,
                     skipped_count,
                     error_message,
+                    unsupported_count,
                 ) = await index_google_drive_files(
                     session,
                     connector_id,
@@ -2497,6 +2500,7 @@ async def run_google_drive_indexing(
                     include_subfolders=indexing_options.include_subfolders,
                 )
                 total_skipped += skipped_count
+                total_unsupported += unsupported_count
                 if error_message:
                     errors.append(f"Folder '{folder.name}': {error_message}")
                 else:
@@ -2572,6 +2576,7 @@ async def run_google_drive_indexing(
                 indexed_count=total_indexed,
                 error_message=error_message,
                 skipped_count=total_skipped,
+                unsupported_count=total_unsupported,
             )
 
     except Exception as e:
@@ -2642,7 +2647,7 @@ async def run_onedrive_indexing(
                 stage="fetching",
             )
 
-        total_indexed, total_skipped, error_message = await index_onedrive_files(
+        total_indexed, total_skipped, error_message, total_unsupported = await index_onedrive_files(
             session,
             connector_id,
             search_space_id,
@@ -2683,6 +2688,7 @@ async def run_onedrive_indexing(
                 indexed_count=total_indexed,
                 error_message=error_message,
                 skipped_count=total_skipped,
+                unsupported_count=total_unsupported,
             )
 
     except Exception as e:
@@ -2750,7 +2756,7 @@ async def run_dropbox_indexing(
                 stage="fetching",
             )
 
-        total_indexed, total_skipped, error_message = await index_dropbox_files(
+        total_indexed, total_skipped, error_message, total_unsupported = await index_dropbox_files(
             session,
             connector_id,
             search_space_id,
@@ -2791,6 +2797,7 @@ async def run_dropbox_indexing(
                 indexed_count=total_indexed,
                 error_message=error_message,
                 skipped_count=total_skipped,
+                unsupported_count=total_unsupported,
             )
 
     except Exception as e:
diff --git a/surfsense_backend/app/services/notification_service.py b/surfsense_backend/app/services/notification_service.py
index 5e40a3b42..5ffee12d7 100644
--- a/surfsense_backend/app/services/notification_service.py
+++ b/surfsense_backend/app/services/notification_service.py
@@ -421,6 +421,7 @@ class ConnectorIndexingNotificationHandler(BaseNotificationHandler):
         error_message: str | None = None,
         is_warning: bool = False,
         skipped_count: int | None = None,
+        unsupported_count: int | None = None,
     ) -> Notification:
         """
         Update notification when connector indexing completes.
@@ -428,10 +429,11 @@ class ConnectorIndexingNotificationHandler(BaseNotificationHandler):
         Args:
             session: Database session
             notification: Notification to update
-            indexed_count: Total number of items indexed
+            indexed_count: Total number of files indexed
             error_message: Error message if indexing failed, or warning message (optional)
             is_warning: If True, treat error_message as a warning (success case) rather than an error
-            skipped_count: Number of items skipped (e.g., duplicates) - optional
+            skipped_count: Number of files skipped (e.g., unchanged) - optional
+            unsupported_count: Number of files skipped because the ETL parser doesn't support them
 
         Returns:
             Updated notification
@@ -440,52 +442,45 @@ class ConnectorIndexingNotificationHandler(BaseNotificationHandler):
             "connector_name", "Connector"
         )
 
-        # Build the skipped text if there are skipped items
-        skipped_text = ""
-        if skipped_count and skipped_count > 0:
-            skipped_item_text = "item" if skipped_count == 1 else "items"
-            skipped_text = (
-                f" ({skipped_count} {skipped_item_text} skipped - already indexed)"
-            )
+        unsupported_text = ""
+        if unsupported_count and unsupported_count > 0:
+            file_word = "file was" if unsupported_count == 1 else "files were"
+            unsupported_text = f" {unsupported_count} {file_word} not supported."
 
-        # If there's an error message but items were indexed, treat it as a warning (partial success)
-        # If is_warning is True, treat it as success even with 0 items (e.g., duplicates found)
-        # Otherwise, treat it as a failure
         if error_message:
             if indexed_count > 0:
-                # Partial success with warnings (e.g., duplicate content from other connectors)
                 title = f"Ready: {connector_name}"
-                item_text = "item" if indexed_count == 1 else "items"
-                message = f"Now searchable! {indexed_count} {item_text} synced{skipped_text}. Note: {error_message}"
+                file_text = "file" if indexed_count == 1 else "files"
+                message = f"Now searchable! {indexed_count} {file_text} synced.{unsupported_text} Note: {error_message}"
                 status = "completed"
             elif is_warning:
-                # Warning case (e.g., duplicates found) - treat as success
                 title = f"Ready: {connector_name}"
-                message = f"Sync completed{skipped_text}. {error_message}"
+                message = f"Sync complete.{unsupported_text} {error_message}"
                 status = "completed"
             else:
-                # Complete failure
                 title = f"Failed: {connector_name}"
                 message = f"Sync failed: {error_message}"
+                if unsupported_text:
+                    message += unsupported_text
                 status = "failed"
         else:
             title = f"Ready: {connector_name}"
             if indexed_count == 0:
-                if skipped_count and skipped_count > 0:
-                    skipped_item_text = "item" if skipped_count == 1 else "items"
-                    message = f"Already up to date! {skipped_count} {skipped_item_text} skipped (already indexed)."
+                if unsupported_count and unsupported_count > 0:
+                    message = f"Sync complete.{unsupported_text}"
                 else:
-                    message = "Already up to date! No new items to sync."
+                    message = "Already up to date!"
             else:
-                item_text = "item" if indexed_count == 1 else "items"
-                message = (
-                    f"Now searchable! {indexed_count} {item_text} synced{skipped_text}."
-                )
+                file_text = "file" if indexed_count == 1 else "files"
+                message = f"Now searchable! {indexed_count} {file_text} synced."
+                if unsupported_text:
+                    message += unsupported_text
             status = "completed"
 
         metadata_updates = {
             "indexed_count": indexed_count,
             "skipped_count": skipped_count or 0,
+            "unsupported_count": unsupported_count or 0,
             "sync_stage": "completed"
             if (not error_message or is_warning or indexed_count > 0)
             else "failed",
diff --git a/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py b/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
index d116cc264..9e7fe1cfb 100644
--- a/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
@@ -51,7 +51,10 @@ async def _should_skip_file(
     file_id = file.get("id", "")
     file_name = file.get("name", "Unknown")
 
-    if skip_item(file):
+    skip, unsup_ext = skip_item(file)
+    if skip:
+        if unsup_ext:
+            return True, f"unsupported:{unsup_ext}"
         return True, "folder/non-downloadable"
     if not file_id:
         return True, "missing file_id"
@@ -287,7 +290,7 @@ async def _index_with_delta_sync(
     max_files: int,
     on_heartbeat_callback: HeartbeatCallbackType | None = None,
     enable_summary: bool = True,
-) -> tuple[int, int, str]:
+) -> tuple[int, int, int, str]:
     """Delta sync using Dropbox cursor-based change tracking.
 
-    Returns (indexed_count, skipped_count, new_cursor).
+    Returns (indexed_count, skipped_count, unsupported_count, new_cursor).
@@ -309,12 +312,13 @@ async def _index_with_delta_sync(
 
     if not entries:
         logger.info("No changes detected since last sync")
-        return 0, 0, new_cursor or cursor
+        return 0, 0, 0, new_cursor or cursor
 
     logger.info(f"Processing {len(entries)} change entries")
 
     renamed_count = 0
     skipped = 0
+    unsupported_count = 0
     files_to_download: list[dict] = []
     files_processed = 0
 
@@ -339,7 +343,9 @@ async def _index_with_delta_sync(
 
         skip, msg = await _should_skip_file(session, entry, search_space_id)
         if skip:
-            if msg and "renamed" in msg.lower():
+            if msg and msg.startswith("unsupported:"):
+                unsupported_count += 1
+            elif msg and "renamed" in msg.lower():
                 renamed_count += 1
             else:
                 skipped += 1
@@ -360,9 +366,10 @@ async def _index_with_delta_sync(
 
     indexed = renamed_count + batch_indexed
     logger.info(
-        f"Delta sync complete: {indexed} indexed, {skipped} skipped, {failed} failed"
+        f"Delta sync complete: {indexed} indexed, {skipped} skipped, "
+        f"{unsupported_count} unsupported, {failed} failed"
     )
-    return indexed, skipped, new_cursor or cursor
+    return indexed, skipped, unsupported_count, new_cursor or cursor
 
 
 async def _index_full_scan(
@@ -380,8 +387,11 @@ async def _index_full_scan(
     incremental_sync: bool = True,
     on_heartbeat_callback: HeartbeatCallbackType | None = None,
     enable_summary: bool = True,
-) -> tuple[int, int]:
-    """Full scan indexing of a folder."""
+) -> tuple[int, int, int]:
+    """Full scan indexing of a folder.
+
+    Returns (indexed, skipped, unsupported_count).
+    """
     await task_logger.log_task_progress(
         log_entry,
         f"Starting full scan of folder: {folder_name}",
@@ -401,6 +411,7 @@ async def _index_full_scan(
 
     renamed_count = 0
     skipped = 0
+    unsupported_count = 0
     files_to_download: list[dict] = []
 
     all_files, error = await get_files_in_folder(
@@ -420,14 +431,21 @@ async def _index_full_scan(
         if incremental_sync:
             skip, msg = await _should_skip_file(session, file, search_space_id)
             if skip:
-                if msg and "renamed" in msg.lower():
+                if msg and msg.startswith("unsupported:"):
+                    unsupported_count += 1
+                elif msg and "renamed" in msg.lower():
                     renamed_count += 1
                 else:
                     skipped += 1
                 continue
-        elif skip_item(file):
-            skipped += 1
-            continue
+        else:
+            item_skip, item_unsup = skip_item(file)
+            if item_skip:
+                if item_unsup:
+                    unsupported_count += 1
+                else:
+                    skipped += 1
+                continue
 
         file_pages = PageLimitService.estimate_pages_from_metadata(
             file.get("name", ""), file.get("size")
@@ -466,9 +484,10 @@ async def _index_full_scan(
 
     indexed = renamed_count + batch_indexed
     logger.info(
-        f"Full scan complete: {indexed} indexed, {skipped} skipped, {failed} failed"
+        f"Full scan complete: {indexed} indexed, {skipped} skipped, "
+        f"{unsupported_count} unsupported, {failed} failed"
     )
-    return indexed, skipped
+    return indexed, skipped, unsupported_count
 
 
 async def _index_selected_files(
@@ -493,6 +512,7 @@ async def _index_selected_files(
     errors: list[str] = []
     renamed_count = 0
     skipped = 0
+    unsupported_count = 0
 
     for file_path, file_name in file_paths:
         file, error = await get_file_by_path(dropbox_client, file_path)
@@ -504,14 +524,21 @@ async def _index_selected_files(
         if incremental_sync:
             skip, msg = await _should_skip_file(session, file, search_space_id)
             if skip:
-                if msg and "renamed" in msg.lower():
+                if msg and msg.startswith("unsupported:"):
+                    unsupported_count += 1
+                elif msg and "renamed" in msg.lower():
                     renamed_count += 1
                 else:
                     skipped += 1
                 continue
-        elif skip_item(file):
-            skipped += 1
-            continue
+        else:
+            item_skip, item_unsup = skip_item(file)
+            if item_skip:
+                if item_unsup:
+                    unsupported_count += 1
+                else:
+                    skipped += 1
+                continue
 
         file_pages = PageLimitService.estimate_pages_from_metadata(
             file.get("name", ""), file.get("size")
@@ -543,7 +570,7 @@ async def _index_selected_files(
             user_id, pages_to_deduct, allow_exceed=True
         )
 
-    return renamed_count + batch_indexed, skipped, errors
+    return renamed_count + batch_indexed, skipped, unsupported_count, errors
 
 
 async def index_dropbox_files(
@@ -552,7 +579,7 @@ async def index_dropbox_files(
     search_space_id: int,
     user_id: str,
     items_dict: dict,
-) -> tuple[int, int, str | None]:
+) -> tuple[int, int, str | None, int]:
     """Index Dropbox files for a specific connector.
 
     items_dict format:
@@ -583,7 +610,7 @@ async def index_dropbox_files(
             await task_logger.log_task_failure(
                 log_entry, error_msg, None, {"error_type": "ConnectorNotFound"}
             )
-            return 0, 0, error_msg
+            return 0, 0, error_msg, 0
 
         token_encrypted = connector.config.get("_token_encrypted", False)
         if token_encrypted and not config.SECRET_KEY:
@@ -594,7 +621,7 @@ async def index_dropbox_files(
                 "Missing SECRET_KEY",
                 {"error_type": "MissingSecretKey"},
             )
-            return 0, 0, error_msg
+            return 0, 0, error_msg, 0
 
         connector_enable_summary = getattr(connector, "enable_summary", True)
         dropbox_client = DropboxClient(session, connector_id)
@@ -609,6 +636,7 @@ async def index_dropbox_files(
 
         total_indexed = 0
         total_skipped = 0
+        total_unsupported = 0
 
         selected_files = items_dict.get("files", [])
         if selected_files:
@@ -616,7 +644,7 @@ async def index_dropbox_files(
                 (f.get("path", f.get("path_lower", f.get("id", ""))), f.get("name"))
                 for f in selected_files
             ]
-            indexed, skipped, file_errors = await _index_selected_files(
+            indexed, skipped, unsupported, file_errors = await _index_selected_files(
                 dropbox_client,
                 session,
                 file_tuples,
@@ -628,6 +656,7 @@ async def index_dropbox_files(
             )
             total_indexed += indexed
             total_skipped += skipped
+            total_unsupported += unsupported
             if file_errors:
                 logger.warning(
                     f"File indexing errors for connector {connector_id}: {file_errors}"
@@ -649,7 +678,7 @@ async def index_dropbox_files(
 
             if can_use_delta:
                 logger.info(f"Using delta sync for folder {folder_name}")
-                indexed, skipped, new_cursor = await _index_with_delta_sync(
+                indexed, skipped, unsup, new_cursor = await _index_with_delta_sync(
                     dropbox_client,
                     session,
                     connector_id,
@@ -662,9 +691,10 @@ async def index_dropbox_files(
                     enable_summary=connector_enable_summary,
                 )
                 folder_cursors[folder_path] = new_cursor
+                total_unsupported += unsup
             else:
                 logger.info(f"Using full scan for folder {folder_name}")
-                indexed, skipped = await _index_full_scan(
+                indexed, skipped, unsup = await _index_full_scan(
                     dropbox_client,
                     session,
                     connector_id,
@@ -679,6 +709,7 @@ async def index_dropbox_files(
                     incremental_sync=incremental_sync,
                     enable_summary=connector_enable_summary,
                 )
+                total_unsupported += unsup
 
             total_indexed += indexed
             total_skipped += skipped
@@ -708,12 +739,14 @@ async def index_dropbox_files(
         await task_logger.log_task_success(
             log_entry,
             f"Successfully completed Dropbox indexing for connector {connector_id}",
-            {"files_processed": total_indexed, "files_skipped": total_skipped},
+            {"files_processed": total_indexed, "files_skipped": total_skipped, "files_unsupported": total_unsupported},
         )
         logger.info(
-            f"Dropbox indexing completed: {total_indexed} indexed, {total_skipped} skipped"
+            f"Dropbox indexing completed: {total_indexed} indexed, "
+            f"{total_skipped} skipped, {total_unsupported} unsupported"
         )
-        return total_indexed, total_skipped, None
+
+        return total_indexed, total_skipped, None, total_unsupported
 
     except SQLAlchemyError as db_error:
         await session.rollback()
@@ -724,7 +757,7 @@ async def index_dropbox_files(
             {"error_type": "SQLAlchemyError"},
         )
         logger.error(f"Database error: {db_error!s}", exc_info=True)
-        return 0, 0, f"Database error: {db_error!s}"
+        return 0, 0, f"Database error: {db_error!s}", 0
     except Exception as e:
         await session.rollback()
         await task_logger.log_task_failure(
@@ -734,4 +767,4 @@ async def index_dropbox_files(
             {"error_type": type(e).__name__},
         )
         logger.error(f"Failed to index Dropbox files: {e!s}", exc_info=True)
-        return 0, 0, f"Failed to index Dropbox files: {e!s}"
+        return 0, 0, f"Failed to index Dropbox files: {e!s}", 0
diff --git a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
index 9c53092f5..b2afbb9c9 100644
--- a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
@@ -81,8 +81,9 @@ async def _should_skip_file(
 
     if skip_mime(mime_type):
         return True, "folder/shortcut"
-    if should_skip_by_extension(file_name):
-        return True, "unsupported extension"
+    ext_skip, unsup_ext = should_skip_by_extension(file_name)
+    if ext_skip:
+        return True, f"unsupported:{unsup_ext}"
     if not file_id:
         return True, "missing file_id"
 
@@ -490,6 +491,7 @@ async def _index_selected_files(
     errors: list[str] = []
     renamed_count = 0
     skipped = 0
+    unsupported_count = 0
 
     for file_id, file_name in file_ids:
         file, error = await get_file_by_id(drive_client, file_id)
@@ -500,7 +502,9 @@ async def _index_selected_files(
 
         skip, msg = await _should_skip_file(session, file, search_space_id)
         if skip:
-            if msg and "renamed" in msg.lower():
+            if msg and msg.startswith("unsupported:"):
+                unsupported_count += 1
+            elif msg and "renamed" in msg.lower():
                 renamed_count += 1
             else:
                 skipped += 1
@@ -544,7 +548,7 @@ async def _index_selected_files(
             user_id, pages_to_deduct, allow_exceed=True
         )
 
-    return renamed_count + batch_indexed, skipped, errors
+    return renamed_count + batch_indexed, skipped, unsupported_count, errors
 
 
 # ---------------------------------------------------------------------------
@@ -567,8 +571,11 @@ async def _index_full_scan(
     include_subfolders: bool = False,
     on_heartbeat_callback: HeartbeatCallbackType | None = None,
     enable_summary: bool = True,
-) -> tuple[int, int]:
-    """Full scan indexing of a folder."""
+) -> tuple[int, int, int]:
+    """Full scan indexing of a folder.
+
+    Returns (indexed, skipped, unsupported_count).
+    """
     await task_logger.log_task_progress(
         log_entry,
         f"Starting full scan of folder: {folder_name} (include_subfolders={include_subfolders})",
@@ -590,6 +597,7 @@ async def _index_full_scan(
 
     renamed_count = 0
     skipped = 0
+    unsupported_count = 0
     files_processed = 0
     files_to_download: list[dict] = []
     folders_to_process = [(folder_id, folder_name)]
@@ -630,7 +638,9 @@ async def _index_full_scan(
 
                 skip, msg = await _should_skip_file(session, file, search_space_id)
                 if skip:
-                    if msg and "renamed" in msg.lower():
+                    if msg and msg.startswith("unsupported:"):
+                        unsupported_count += 1
+                    elif msg and "renamed" in msg.lower():
                         renamed_count += 1
                     else:
                         skipped += 1
@@ -703,9 +713,10 @@ async def _index_full_scan(
 
     indexed = renamed_count + batch_indexed
     logger.info(
-        f"Full scan complete: {indexed} indexed, {skipped} skipped, {failed} failed"
+        f"Full scan complete: {indexed} indexed, {skipped} skipped, "
+        f"{unsupported_count} unsupported, {failed} failed"
     )
-    return indexed, skipped
+    return indexed, skipped, unsupported_count
 
 
 async def _index_with_delta_sync(
@@ -723,8 +734,11 @@ async def _index_with_delta_sync(
     include_subfolders: bool = False,
     on_heartbeat_callback: HeartbeatCallbackType | None = None,
     enable_summary: bool = True,
-) -> tuple[int, int]:
-    """Delta sync using change tracking."""
+) -> tuple[int, int, int]:
+    """Delta sync using change tracking.
+
+    Returns (indexed, skipped, unsupported_count).
+    """
     await task_logger.log_task_progress(
         log_entry,
         f"Starting delta sync from token: {start_page_token[:20]}...",
@@ -759,6 +773,7 @@ async def _index_with_delta_sync(
 
     renamed_count = 0
     skipped = 0
+    unsupported_count = 0
     files_to_download: list[dict] = []
     files_processed = 0
 
@@ -780,7 +795,9 @@ async def _index_with_delta_sync(
 
         skip, msg = await _should_skip_file(session, file, search_space_id)
         if skip:
-            if msg and "renamed" in msg.lower():
+            if msg and msg.startswith("unsupported:"):
+                unsupported_count += 1
+            elif msg and "renamed" in msg.lower():
                 renamed_count += 1
             else:
                 skipped += 1
@@ -837,9 +854,10 @@ async def _index_with_delta_sync(
 
     indexed = renamed_count + batch_indexed
     logger.info(
-        f"Delta sync complete: {indexed} indexed, {skipped} skipped, {failed} failed"
+        f"Delta sync complete: {indexed} indexed, {skipped} skipped, "
+        f"{unsupported_count} unsupported, {failed} failed"
     )
-    return indexed, skipped
+    return indexed, skipped, unsupported_count
 
 
 # ---------------------------------------------------------------------------
@@ -859,8 +877,11 @@ async def index_google_drive_files(
     max_files: int = 500,
     include_subfolders: bool = False,
     on_heartbeat_callback: HeartbeatCallbackType | None = None,
-) -> tuple[int, int, str | None]:
-    """Index Google Drive files for a specific connector."""
+) -> tuple[int, int, str | None, int]:
+    """Index Google Drive files for a specific connector.
+
+    Returns (indexed, skipped, error_or_none, unsupported_count).
+    """
     task_logger = TaskLoggingService(session, search_space_id)
     log_entry = await task_logger.log_task_start(
         task_name="google_drive_files_indexing",
@@ -886,7 +907,7 @@ async def index_google_drive_files(
             await task_logger.log_task_failure(
                 log_entry, error_msg, None, {"error_type": "ConnectorNotFound"}
             )
-            return 0, 0, error_msg
+            return 0, 0, error_msg, 0
 
         await task_logger.log_task_progress(
             log_entry,
@@ -905,7 +926,7 @@ async def index_google_drive_files(
                     "Missing Composio account",
                     {"error_type": "MissingComposioAccount"},
                 )
-                return 0, 0, error_msg
+                return 0, 0, error_msg, 0
             pre_built_credentials = build_composio_credentials(connected_account_id)
         else:
             token_encrypted = connector.config.get("_token_encrypted", False)
@@ -920,6 +941,7 @@ async def index_google_drive_files(
                     0,
                     0,
                     "SECRET_KEY not configured but credentials are marked as encrypted",
+                    0,
                 )
 
         connector_enable_summary = getattr(connector, "enable_summary", True)
@@ -932,7 +954,7 @@ async def index_google_drive_files(
             await task_logger.log_task_failure(
                 log_entry, error_msg, {"error_type": "MissingParameter"}
             )
-            return 0, 0, error_msg
+            return 0, 0, error_msg, 0
 
         target_folder_id = folder_id
         target_folder_name = folder_name or "Selected Folder"
@@ -943,9 +965,11 @@ async def index_google_drive_files(
             use_delta_sync and start_page_token and connector.last_indexed_at
         )
 
+        documents_unsupported = 0
+
         if can_use_delta:
             logger.info(f"Using delta sync for connector {connector_id}")
-            documents_indexed, documents_skipped = await _index_with_delta_sync(
+            documents_indexed, documents_skipped, du = await _index_with_delta_sync(
                 drive_client,
                 session,
                 connector,
@@ -961,8 +985,9 @@ async def index_google_drive_files(
                 on_heartbeat_callback,
                 connector_enable_summary,
             )
+            documents_unsupported += du
             logger.info("Running reconciliation scan after delta sync")
-            ri, rs = await _index_full_scan(
+            ri, rs, ru = await _index_full_scan(
                 drive_client,
                 session,
                 connector,
@@ -980,9 +1005,10 @@ async def index_google_drive_files(
             )
             documents_indexed += ri
             documents_skipped += rs
+            documents_unsupported += ru
         else:
             logger.info(f"Using full scan for connector {connector_id}")
-            documents_indexed, documents_skipped = await _index_full_scan(
+            documents_indexed, documents_skipped, documents_unsupported = await _index_full_scan(
                 drive_client,
                 session,
                 connector,
@@ -1017,14 +1043,17 @@ async def index_google_drive_files(
             {
                 "files_processed": documents_indexed,
                 "files_skipped": documents_skipped,
+                "files_unsupported": documents_unsupported,
                 "sync_type": "delta" if can_use_delta else "full",
                 "folder": target_folder_name,
             },
         )
         logger.info(
-            f"Google Drive indexing completed: {documents_indexed} indexed, {documents_skipped} skipped"
+            f"Google Drive indexing completed: {documents_indexed} indexed, "
+            f"{documents_skipped} skipped, {documents_unsupported} unsupported"
         )
-        return documents_indexed, documents_skipped, None
+
+        return documents_indexed, documents_skipped, None, documents_unsupported
 
     except SQLAlchemyError as db_error:
         await session.rollback()
@@ -1035,7 +1064,7 @@ async def index_google_drive_files(
             {"error_type": "SQLAlchemyError"},
         )
         logger.error(f"Database error: {db_error!s}", exc_info=True)
-        return 0, 0, f"Database error: {db_error!s}"
+        return 0, 0, f"Database error: {db_error!s}", 0
     except Exception as e:
         await session.rollback()
         await task_logger.log_task_failure(
@@ -1045,7 +1074,7 @@ async def index_google_drive_files(
             {"error_type": type(e).__name__},
         )
         logger.error(f"Failed to index Google Drive files: {e!s}", exc_info=True)
-        return 0, 0, f"Failed to index Google Drive files: {e!s}"
+        return 0, 0, f"Failed to index Google Drive files: {e!s}", 0
 
 
 async def index_google_drive_single_file(
@@ -1247,7 +1276,7 @@ async def index_google_drive_selected_files(
             session, connector_id, credentials=pre_built_credentials
         )
 
-        indexed, skipped, errors = await _index_selected_files(
+        indexed, skipped, unsupported, errors = await _index_selected_files(
             drive_client,
             session,
             files,
@@ -1258,6 +1287,11 @@ async def index_google_drive_selected_files(
             on_heartbeat=on_heartbeat_callback,
         )
 
+        if unsupported > 0:
+            file_text = "file was" if unsupported == 1 else "files were"
+            unsup_msg = f"{unsupported} {file_text} not supported"
+            errors.append(unsup_msg)
+
         await session.commit()
 
         if errors:
@@ -1265,7 +1299,7 @@ async def index_google_drive_selected_files(
                 log_entry,
                 f"Batch file indexing completed with {len(errors)} error(s)",
                 "; ".join(errors),
-                {"indexed": indexed, "skipped": skipped, "error_count": len(errors)},
+                {"indexed": indexed, "skipped": skipped, "unsupported": unsupported, "error_count": len(errors)},
             )
         else:
             await task_logger.log_task_success(
diff --git a/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py b/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py
index 2301b6260..db42773fe 100644
--- a/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py
@@ -56,7 +56,10 @@ async def _should_skip_file(
     file_id = file.get("id")
     file_name = file.get("name", "Unknown")
 
-    if skip_item(file):
+    skip, unsup_ext = skip_item(file)
+    if skip:
+        if unsup_ext:
+            return True, f"unsupported:{unsup_ext}"
         return True, "folder/onenote/remote"
     if not file_id:
         return True, "missing file_id"
@@ -301,6 +304,7 @@ async def _index_selected_files(
     errors: list[str] = []
     renamed_count = 0
     skipped = 0
+    unsupported_count = 0
 
     for file_id, file_name in file_ids:
         file, error = await get_file_by_id(onedrive_client, file_id)
@@ -311,7 +315,9 @@ async def _index_selected_files(
 
         skip, msg = await _should_skip_file(session, file, search_space_id)
         if skip:
-            if msg and "renamed" in msg.lower():
+            if msg and msg.startswith("unsupported:"):
+                unsupported_count += 1
+            elif msg and "renamed" in msg.lower():
                 renamed_count += 1
             else:
                 skipped += 1
@@ -347,7 +353,7 @@ async def _index_selected_files(
             user_id, pages_to_deduct, allow_exceed=True
         )
 
-    return renamed_count + batch_indexed, skipped, errors
+    return renamed_count + batch_indexed, skipped, unsupported_count, errors
 
 
 # ---------------------------------------------------------------------------
@@ -369,8 +375,11 @@ async def _index_full_scan(
     include_subfolders: bool = True,
     on_heartbeat_callback: HeartbeatCallbackType | None = None,
     enable_summary: bool = True,
-) -> tuple[int, int]:
-    """Full scan indexing of a folder."""
+) -> tuple[int, int, int]:
+    """Full scan indexing of a folder.
+
+    Returns (indexed, skipped, unsupported_count).
+    """
     await task_logger.log_task_progress(
         log_entry,
         f"Starting full scan of folder: {folder_name}",
@@ -389,6 +398,7 @@ async def _index_full_scan(
 
     renamed_count = 0
     skipped = 0
+    unsupported_count = 0
     files_to_download: list[dict] = []
 
     all_files, error = await get_files_in_folder(
@@ -407,7 +417,9 @@ async def _index_full_scan(
     for file in all_files[:max_files]:
         skip, msg = await _should_skip_file(session, file, search_space_id)
         if skip:
-            if msg and "renamed" in msg.lower():
+            if msg and msg.startswith("unsupported:"):
+                unsupported_count += 1
+            elif msg and "renamed" in msg.lower():
                 renamed_count += 1
             else:
                 skipped += 1
@@ -450,9 +462,10 @@ async def _index_full_scan(
 
     indexed = renamed_count + batch_indexed
     logger.info(
-        f"Full scan complete: {indexed} indexed, {skipped} skipped, {failed} failed"
+        f"Full scan complete: {indexed} indexed, {skipped} skipped, "
+        f"{unsupported_count} unsupported, {failed} failed"
     )
-    return indexed, skipped
+    return indexed, skipped, unsupported_count
 
 
 async def _index_with_delta_sync(
@@ -468,8 +481,11 @@ async def _index_with_delta_sync(
     max_files: int,
     on_heartbeat_callback: HeartbeatCallbackType | None = None,
     enable_summary: bool = True,
-) -> tuple[int, int, str | None]:
-    """Delta sync using OneDrive change tracking. Returns (indexed, skipped, new_delta_link)."""
+) -> tuple[int, int, int, str | None]:
+    """Delta sync using OneDrive change tracking.
+
+    Returns (indexed, skipped, unsupported_count, new_delta_link).
+    """
     await task_logger.log_task_progress(
         log_entry,
         "Starting delta sync",
@@ -489,7 +505,7 @@ async def _index_with_delta_sync(
 
     if not changes:
         logger.info("No changes detected since last sync")
-        return 0, 0, new_delta_link
+        return 0, 0, 0, new_delta_link
 
     logger.info(f"Processing {len(changes)} delta changes")
 
@@ -501,6 +517,7 @@ async def _index_with_delta_sync(
 
     renamed_count = 0
     skipped = 0
+    unsupported_count = 0
     files_to_download: list[dict] = []
     files_processed = 0
 
@@ -523,7 +540,9 @@ async def _index_with_delta_sync(
 
         skip, msg = await _should_skip_file(session, change, search_space_id)
         if skip:
-            if msg and "renamed" in msg.lower():
+            if msg and msg.startswith("unsupported:"):
+                unsupported_count += 1
+            elif msg and "renamed" in msg.lower():
                 renamed_count += 1
             else:
                 skipped += 1
@@ -566,9 +585,10 @@ async def _index_with_delta_sync(
 
     indexed = renamed_count + batch_indexed
     logger.info(
-        f"Delta sync complete: {indexed} indexed, {skipped} skipped, {failed} failed"
+        f"Delta sync complete: {indexed} indexed, {skipped} skipped, "
+        f"{unsupported_count} unsupported, {failed} failed"
     )
-    return indexed, skipped, new_delta_link
+    return indexed, skipped, unsupported_count, new_delta_link
 
 
 # ---------------------------------------------------------------------------
@@ -582,7 +602,7 @@ async def index_onedrive_files(
     search_space_id: int,
     user_id: str,
     items_dict: dict,
-) -> tuple[int, int, str | None]:
+) -> tuple[int, int, str | None, int]:
     """Index OneDrive files for a specific connector.
 
     items_dict format:
@@ -609,7 +629,7 @@ async def index_onedrive_files(
             await task_logger.log_task_failure(
                 log_entry, error_msg, None, {"error_type": "ConnectorNotFound"}
             )
-            return 0, 0, error_msg
+            return 0, 0, error_msg, 0
 
         token_encrypted = connector.config.get("_token_encrypted", False)
         if token_encrypted and not config.SECRET_KEY:
@@ -620,7 +640,7 @@ async def index_onedrive_files(
                 "Missing SECRET_KEY",
                 {"error_type": "MissingSecretKey"},
             )
-            return 0, 0, error_msg
+            return 0, 0, error_msg, 0
 
         connector_enable_summary = getattr(connector, "enable_summary", True)
         onedrive_client = OneDriveClient(session, connector_id)
@@ -632,12 +652,13 @@ async def index_onedrive_files(
 
         total_indexed = 0
         total_skipped = 0
+        total_unsupported = 0
 
         # Index selected individual files
         selected_files = items_dict.get("files", [])
         if selected_files:
             file_tuples = [(f["id"], f.get("name")) for f in selected_files]
-            indexed, skipped, _errors = await _index_selected_files(
+            indexed, skipped, unsupported, _errors = await _index_selected_files(
                 onedrive_client,
                 session,
                 file_tuples,
@@ -648,6 +669,7 @@ async def index_onedrive_files(
             )
             total_indexed += indexed
             total_skipped += skipped
+            total_unsupported += unsupported
 
         # Index selected folders
         folders = items_dict.get("folders", [])
@@ -661,7 +683,7 @@ async def index_onedrive_files(
 
             if can_use_delta:
                 logger.info(f"Using delta sync for folder {folder_name}")
-                indexed, skipped, new_delta_link = await _index_with_delta_sync(
+                indexed, skipped, unsup, new_delta_link = await _index_with_delta_sync(
                     onedrive_client,
                     session,
                     connector_id,
@@ -676,6 +698,7 @@ async def index_onedrive_files(
                 )
                 total_indexed += indexed
                 total_skipped += skipped
+                total_unsupported += unsup
 
                 if new_delta_link:
                     await session.refresh(connector)
@@ -685,7 +708,7 @@ async def index_onedrive_files(
                     flag_modified(connector, "config")
 
                 # Reconciliation full scan
-                ri, rs = await _index_full_scan(
+                ri, rs, ru = await _index_full_scan(
                     onedrive_client,
                     session,
                     connector_id,
@@ -701,9 +724,10 @@ async def index_onedrive_files(
                 )
                 total_indexed += ri
                 total_skipped += rs
+                total_unsupported += ru
             else:
                 logger.info(f"Using full scan for folder {folder_name}")
-                indexed, skipped = await _index_full_scan(
+                indexed, skipped, unsup = await _index_full_scan(
                     onedrive_client,
                     session,
                     connector_id,
@@ -719,6 +743,7 @@ async def index_onedrive_files(
                 )
                 total_indexed += indexed
                 total_skipped += skipped
+                total_unsupported += unsup
 
             # Store new delta link for this folder
             _, new_delta_link, _ = await onedrive_client.get_delta(folder_id=folder_id)
@@ -737,12 +762,14 @@ async def index_onedrive_files(
         await task_logger.log_task_success(
             log_entry,
             f"Successfully completed OneDrive indexing for connector {connector_id}",
-            {"files_processed": total_indexed, "files_skipped": total_skipped},
+            {"files_processed": total_indexed, "files_skipped": total_skipped, "files_unsupported": total_unsupported},
         )
         logger.info(
-            f"OneDrive indexing completed: {total_indexed} indexed, {total_skipped} skipped"
+            f"OneDrive indexing completed: {total_indexed} indexed, "
+            f"{total_skipped} skipped, {total_unsupported} unsupported"
         )
-        return total_indexed, total_skipped, None
+
+        return total_indexed, total_skipped, None, total_unsupported
 
     except SQLAlchemyError as db_error:
         await session.rollback()
@@ -753,7 +780,7 @@ async def index_onedrive_files(
             {"error_type": "SQLAlchemyError"},
         )
         logger.error(f"Database error: {db_error!s}", exc_info=True)
-        return 0, 0, f"Database error: {db_error!s}"
+        return 0, 0, f"Database error: {db_error!s}", 0
     except Exception as e:
         await session.rollback()
         await task_logger.log_task_failure(
@@ -763,4 +790,4 @@ async def index_onedrive_files(
             {"error_type": type(e).__name__},
         )
         logger.error(f"Failed to index OneDrive files: {e!s}", exc_info=True)
-        return 0, 0, f"Failed to index OneDrive files: {e!s}"
+        return 0, 0, f"Failed to index OneDrive files: {e!s}", 0
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py b/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
index 8572fa8ea..14c16fce4 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
@@ -265,7 +265,10 @@ def full_scan_mocks(mock_dropbox_client, monkeypatch):
 
     async def _fake_skip(session, file, search_space_id):
         from app.connectors.dropbox.file_types import should_skip_file as _skip
-        if _skip(file):
+        item_skip, unsup_ext = _skip(file)
+        if item_skip:
+            if unsup_ext:
+                return True, f"unsupported:{unsup_ext}"
             return True, "folder/non-downloadable"
         return skip_results.get(file.get("id", ""), (False, None))
 
@@ -541,7 +544,7 @@ async def test_delta_sync_deletions_call_remove_document(monkeypatch):
     mock_task_logger = MagicMock()
     mock_task_logger.log_task_progress = AsyncMock()
 
-    indexed, skipped, cursor = await _index_with_delta_sync(
+    indexed, skipped, unsupported, cursor = await _index_with_delta_sync(
         mock_client,
         AsyncMock(),
         _CONNECTOR_ID,
@@ -578,7 +581,7 @@ async def test_delta_sync_upserts_filtered_and_downloaded(monkeypatch):
     mock_task_logger = MagicMock()
     mock_task_logger.log_task_progress = AsyncMock()
 
-    indexed, skipped, cursor = await _index_with_delta_sync(
+    indexed, skipped, unsupported, cursor = await _index_with_delta_sync(
         mock_client,
         AsyncMock(),
         _CONNECTOR_ID,
@@ -628,7 +631,7 @@ async def test_delta_sync_mix_deletions_and_upserts(monkeypatch):
     mock_task_logger = MagicMock()
     mock_task_logger.log_task_progress = AsyncMock()
 
-    indexed, skipped, cursor = await _index_with_delta_sync(
+    indexed, skipped, unsupported, cursor = await _index_with_delta_sync(
         mock_client,
         AsyncMock(),
         _CONNECTOR_ID,
@@ -662,7 +665,7 @@ async def test_delta_sync_returns_new_cursor(monkeypatch):
     mock_task_logger = MagicMock()
     mock_task_logger.log_task_progress = AsyncMock()
 
-    indexed, skipped, cursor = await _index_with_delta_sync(
+    indexed, skipped, unsupported, cursor = await _index_with_delta_sync(
         mock_client,
         AsyncMock(),
         _CONNECTOR_ID,
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py b/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
index 20bd3f3d6..b830e9773 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
@@ -497,7 +497,7 @@ async def test_delta_sync_removals_serial_rest_parallel(monkeypatch):
     mock_task_logger = MagicMock()
     mock_task_logger.log_task_progress = AsyncMock()
 
-    indexed, skipped = await _index_with_delta_sync(
+    indexed, skipped, unsupported = await _index_with_delta_sync(
         MagicMock(),
         mock_session,
         MagicMock(),
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py b/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
index b31a9557f..e2996ce9d 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
@@ -384,7 +384,7 @@ async def test_gdrive_full_scan_skips_over_quota(gdrive_full_scan_mocks, monkeyp
     m["download_mock"].return_value = ([], 0)
     m["batch_mock"].return_value = ([], 2, 0)
 
-    _indexed, skipped = await _run_gdrive_full_scan(m)
+    _indexed, skipped, _unsup = await _run_gdrive_full_scan(m)
 
     call_files = m["download_mock"].call_args[0][1]
     assert len(call_files) == 2
@@ -459,7 +459,7 @@ async def test_gdrive_delta_sync_skips_over_quota(monkeypatch):
     mock_task_logger = MagicMock()
     mock_task_logger.log_task_progress = AsyncMock()
 
-    _indexed, skipped = await _mod._index_with_delta_sync(
+    _indexed, skipped, _unsupported = await _mod._index_with_delta_sync(
         MagicMock(),
         session,
         MagicMock(),
diff --git a/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py b/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py
index e092872c5..74277d47c 100644
--- a/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py
+++ b/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py
@@ -14,17 +14,23 @@ pytestmark = pytest.mark.unit
 
 def test_folder_item_is_skipped():
     item = {".tag": "folder", "name": "My Folder"}
-    assert should_skip_file(item) is True
+    skip, ext = should_skip_file(item)
+    assert skip is True
+    assert ext is None
 
 
 def test_paper_file_is_not_skipped():
     item = {".tag": "file", "name": "notes.paper", "is_downloadable": False}
-    assert should_skip_file(item) is False
+    skip, ext = should_skip_file(item)
+    assert skip is False
+    assert ext is None
 
 
 def test_non_downloadable_item_is_skipped():
     item = {".tag": "file", "name": "locked.gdoc", "is_downloadable": False}
-    assert should_skip_file(item) is True
+    skip, ext = should_skip_file(item)
+    assert skip is True
+    assert ext is None
 
 
 # ---------------------------------------------------------------------------
@@ -49,7 +55,9 @@ def test_non_downloadable_item_is_skipped():
 def test_non_parseable_extensions_are_skipped(filename, mocker):
     mocker.patch("app.config.config.ETL_SERVICE", "DOCLING")
     item = {".tag": "file", "name": filename}
-    assert should_skip_file(item) is True, f"{filename} should be skipped"
+    skip, ext = should_skip_file(item)
+    assert skip is True, f"{filename} should be skipped"
+    assert ext is not None
 
 
 @pytest.mark.parametrize(
@@ -65,9 +73,9 @@ def test_parseable_documents_are_not_skipped(filename, mocker):
     for service in ("DOCLING", "LLAMACLOUD", "UNSTRUCTURED"):
         mocker.patch("app.config.config.ETL_SERVICE", service)
         item = {".tag": "file", "name": filename}
-        assert should_skip_file(item) is False, (
-            f"{filename} should NOT be skipped with {service}"
-        )
+        skip, ext = should_skip_file(item)
+        assert skip is False, f"{filename} should NOT be skipped with {service}"
+        assert ext is None
 
 
 @pytest.mark.parametrize(
@@ -79,9 +87,9 @@ def test_universal_images_are_not_skipped(filename, mocker):
     for service in ("DOCLING", "LLAMACLOUD", "UNSTRUCTURED"):
         mocker.patch("app.config.config.ETL_SERVICE", service)
         item = {".tag": "file", "name": filename}
-        assert should_skip_file(item) is False, (
-            f"{filename} should NOT be skipped with {service}"
-        )
+        skip, ext = should_skip_file(item)
+        assert skip is False, f"{filename} should NOT be skipped with {service}"
+        assert ext is None
 
 
 @pytest.mark.parametrize("filename,service,expected_skip", [
@@ -111,6 +119,20 @@ def test_universal_images_are_not_skipped(filename, mocker):
 def test_parser_specific_extensions(filename, service, expected_skip, mocker):
     mocker.patch("app.config.config.ETL_SERVICE", service)
     item = {".tag": "file", "name": filename}
-    assert should_skip_file(item) is expected_skip, (
+    skip, ext = should_skip_file(item)
+    assert skip is expected_skip, (
         f"{filename} with {service}: expected skip={expected_skip}"
     )
+    if expected_skip:
+        assert ext is not None
+    else:
+        assert ext is None
+
+
+def test_returns_unsupported_extension(mocker):
+    """When a file is skipped due to unsupported extension, the ext string is returned."""
+    mocker.patch("app.config.config.ETL_SERVICE", "DOCLING")
+    item = {".tag": "file", "name": "old.doc"}
+    skip, ext = should_skip_file(item)
+    assert skip is True
+    assert ext == ".doc"
diff --git a/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py b/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py
index 4ed7eb4db..5cd43736b 100644
--- a/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py
+++ b/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py
@@ -14,7 +14,8 @@ def test_unsupported_extensions_are_skipped_regardless_of_service(filename, mock
     """Truly unsupported files are skipped no matter which ETL service is configured."""
     for service in ("DOCLING", "LLAMACLOUD", "UNSTRUCTURED"):
         mocker.patch("app.config.config.ETL_SERVICE", service)
-        assert should_skip_by_extension(filename) is True
+        skip, ext = should_skip_by_extension(filename)
+        assert skip is True
 
 
 @pytest.mark.parametrize("filename", [
@@ -25,9 +26,9 @@ def test_universal_extensions_are_not_skipped(filename, mocker):
     """Files supported by all parsers (or handled by plaintext/direct_convert) are never skipped."""
     for service in ("DOCLING", "LLAMACLOUD", "UNSTRUCTURED"):
         mocker.patch("app.config.config.ETL_SERVICE", service)
-        assert should_skip_by_extension(filename) is False, (
-            f"{filename} should NOT be skipped with {service}"
-        )
+        skip, ext = should_skip_by_extension(filename)
+        assert skip is False, f"{filename} should NOT be skipped with {service}"
+        assert ext is None
 
 
 @pytest.mark.parametrize("filename,service,expected_skip", [
@@ -42,6 +43,19 @@ def test_universal_extensions_are_not_skipped(filename, mocker):
 ])
 def test_parser_specific_extensions(filename, service, expected_skip, mocker):
     mocker.patch("app.config.config.ETL_SERVICE", service)
-    assert should_skip_by_extension(filename) is expected_skip, (
+    skip, ext = should_skip_by_extension(filename)
+    assert skip is expected_skip, (
         f"{filename} with {service}: expected skip={expected_skip}"
     )
+    if expected_skip:
+        assert ext is not None, "unsupported extension should be returned"
+    else:
+        assert ext is None
+
+
+def test_returns_unsupported_extension(mocker):
+    """When a file is skipped, the unsupported extension string is returned."""
+    mocker.patch("app.config.config.ETL_SERVICE", "DOCLING")
+    skip, ext = should_skip_by_extension("macro.docm")
+    assert skip is True
+    assert ext == ".docm"
diff --git a/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py b/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py
index e73f799e2..61212b340 100644
--- a/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py
+++ b/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py
@@ -14,22 +14,30 @@ pytestmark = pytest.mark.unit
 
 def test_folder_is_skipped():
     item = {"folder": {}, "name": "My Folder"}
-    assert should_skip_file(item) is True
+    skip, ext = should_skip_file(item)
+    assert skip is True
+    assert ext is None
 
 
 def test_remote_item_is_skipped():
     item = {"remoteItem": {}, "name": "shared.docx"}
-    assert should_skip_file(item) is True
+    skip, ext = should_skip_file(item)
+    assert skip is True
+    assert ext is None
 
 
 def test_package_is_skipped():
     item = {"package": {}, "name": "notebook"}
-    assert should_skip_file(item) is True
+    skip, ext = should_skip_file(item)
+    assert skip is True
+    assert ext is None
 
 
 def test_onenote_is_skipped():
     item = {"name": "notes", "file": {"mimeType": "application/msonenote"}}
-    assert should_skip_file(item) is True
+    skip, ext = should_skip_file(item)
+    assert skip is True
+    assert ext is None
 
 
 # ---------------------------------------------------------------------------
@@ -43,7 +51,9 @@ def test_onenote_is_skipped():
 def test_unsupported_extensions_are_skipped(filename, mocker):
     mocker.patch("app.config.config.ETL_SERVICE", "DOCLING")
     item = {"name": filename, "file": {"mimeType": "application/octet-stream"}}
-    assert should_skip_file(item) is True, f"{filename} should be skipped"
+    skip, ext = should_skip_file(item)
+    assert skip is True, f"{filename} should be skipped"
+    assert ext is not None
 
 
 @pytest.mark.parametrize("filename", [
@@ -54,9 +64,9 @@ def test_universal_files_are_not_skipped(filename, mocker):
     for service in ("DOCLING", "LLAMACLOUD", "UNSTRUCTURED"):
         mocker.patch("app.config.config.ETL_SERVICE", service)
         item = {"name": filename, "file": {"mimeType": "application/octet-stream"}}
-        assert should_skip_file(item) is False, (
-            f"{filename} should NOT be skipped with {service}"
-        )
+        skip, ext = should_skip_file(item)
+        assert skip is False, f"{filename} should NOT be skipped with {service}"
+        assert ext is None
 
 
 @pytest.mark.parametrize("filename,service,expected_skip", [
@@ -70,6 +80,20 @@ def test_universal_files_are_not_skipped(filename, mocker):
 def test_parser_specific_extensions(filename, service, expected_skip, mocker):
     mocker.patch("app.config.config.ETL_SERVICE", service)
     item = {"name": filename, "file": {"mimeType": "application/octet-stream"}}
-    assert should_skip_file(item) is expected_skip, (
+    skip, ext = should_skip_file(item)
+    assert skip is expected_skip, (
         f"{filename} with {service}: expected skip={expected_skip}"
     )
+    if expected_skip:
+        assert ext is not None
+    else:
+        assert ext is None
+
+
+def test_returns_unsupported_extension(mocker):
+    """When a file is skipped due to unsupported extension, the ext string is returned."""
+    mocker.patch("app.config.config.ETL_SERVICE", "DOCLING")
+    item = {"name": "mail.eml", "file": {"mimeType": "application/octet-stream"}}
+    skip, ext = should_skip_file(item)
+    assert skip is True
+    assert ext == ".eml"

From 122be76133fbd5bfdc504464dff5f2cab69e6e5e Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Tue, 7 Apr 2026 03:16:46 +0530
Subject: [PATCH 147/202] refactor: update _index_selected_files method
 signatures in Dropbox, Google Drive, and OneDrive indexers to include
 unsupported file count, enhancing error reporting and consistency across
 connectors

---
 .../app/tasks/connector_indexers/dropbox_indexer.py  |  2 +-
 .../tasks/connector_indexers/google_drive_indexer.py |  4 ++--
 .../app/tasks/connector_indexers/onedrive_indexer.py |  2 +-
 .../connector_indexers/test_google_drive_parallel.py |  8 ++++----
 .../unit/connector_indexers/test_page_limits.py      | 12 ++++++------
 5 files changed, 14 insertions(+), 14 deletions(-)

diff --git a/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py b/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
index 9e7fe1cfb..8d2a45e03 100644
--- a/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
@@ -501,7 +501,7 @@ async def _index_selected_files(
     enable_summary: bool,
     incremental_sync: bool = True,
     on_heartbeat: HeartbeatCallbackType | None = None,
-) -> tuple[int, int, list[str]]:
+) -> tuple[int, int, int, list[str]]:
     """Index user-selected files using the parallel pipeline."""
     page_limit_service = PageLimitService(session)
     pages_used, pages_limit = await page_limit_service.get_page_usage(user_id)
diff --git a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
index b2afbb9c9..0ded89102 100644
--- a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
@@ -474,13 +474,13 @@ async def _index_selected_files(
     user_id: str,
     enable_summary: bool,
     on_heartbeat: HeartbeatCallbackType | None = None,
-) -> tuple[int, int, list[str]]:
+) -> tuple[int, int, int, list[str]]:
     """Index user-selected files using the parallel pipeline.
 
     Phase 1 (serial): fetch metadata + skip checks.
     Phase 2+3 (parallel): download, ETL, index via _download_and_index.
 
-    Returns (indexed_count, skipped_count, errors).
+    Returns (indexed_count, skipped_count, unsupported_count, errors).
     """
     page_limit_service = PageLimitService(session)
     pages_used, pages_limit = await page_limit_service.get_page_usage(user_id)
diff --git a/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py b/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py
index db42773fe..b26442490 100644
--- a/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py
@@ -293,7 +293,7 @@ async def _index_selected_files(
     user_id: str,
     enable_summary: bool,
     on_heartbeat: HeartbeatCallbackType | None = None,
-) -> tuple[int, int, list[str]]:
+) -> tuple[int, int, int, list[str]]:
     """Index user-selected files using the parallel pipeline."""
     page_limit_service = PageLimitService(session)
     pages_used, pages_limit = await page_limit_service.get_page_usage(user_id)
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py b/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
index b830e9773..7fa92ce12 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
@@ -366,7 +366,7 @@ async def test_full_scan_three_phase_counts(full_scan_mocks, monkeypatch):
     full_scan_mocks["download_mock"].return_value = (mock_docs, 0)
     full_scan_mocks["batch_mock"].return_value = ([], 2, 0)
 
-    indexed, skipped = await _run_full_scan(full_scan_mocks)
+    indexed, skipped, unsupported = await _run_full_scan(full_scan_mocks)
 
     assert indexed == 3  # 1 renamed + 2 from batch
     assert skipped == 1  # 1 unchanged
@@ -589,7 +589,7 @@ async def test_selected_files_single_file_indexed(selected_files_mocks):
     )
     selected_files_mocks["download_and_index_mock"].return_value = (1, 0)
 
-    indexed, skipped, errors = await _run_selected(
+    indexed, skipped, unsup, errors = await _run_selected(
         selected_files_mocks,
         [("f1", "report.pdf")],
     )
@@ -613,7 +613,7 @@ async def test_selected_files_fetch_failure_isolation(selected_files_mocks):
     )
     selected_files_mocks["download_and_index_mock"].return_value = (2, 0)
 
-    indexed, skipped, errors = await _run_selected(
+    indexed, skipped, unsup, errors = await _run_selected(
         selected_files_mocks,
         [("f1", "first.txt"), ("f2", "mid.txt"), ("f3", "third.txt")],
     )
@@ -647,7 +647,7 @@ async def test_selected_files_skip_rename_counting(selected_files_mocks):
 
     selected_files_mocks["download_and_index_mock"].return_value = (2, 0)
 
-    indexed, skipped, errors = await _run_selected(
+    indexed, skipped, unsup, errors = await _run_selected(
         selected_files_mocks,
         [
             ("s1", "unchanged.txt"),
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py b/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
index e2996ce9d..58737b20b 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
@@ -198,7 +198,7 @@ async def test_gdrive_files_within_quota_are_downloaded(gdrive_selected_mocks):
         )
     m["download_and_index_mock"].return_value = (3, 0)
 
-    indexed, _skipped, errors = await _run_gdrive_selected(
+    indexed, _skipped, _unsup, errors = await _run_gdrive_selected(
         m, [("f1", "f1.xyz"), ("f2", "f2.xyz"), ("f3", "f3.xyz")]
     )
 
@@ -219,7 +219,7 @@ async def test_gdrive_files_exceeding_quota_rejected(gdrive_selected_mocks):
         None,
     )
 
-    indexed, _skipped, errors = await _run_gdrive_selected(m, [("big", "huge.pdf")])
+    indexed, _skipped, _unsup, errors = await _run_gdrive_selected(m, [("big", "huge.pdf")])
 
     assert indexed == 0
     assert len(errors) == 1
@@ -239,7 +239,7 @@ async def test_gdrive_quota_mix_partial_indexing(gdrive_selected_mocks):
         )
     m["download_and_index_mock"].return_value = (2, 0)
 
-    indexed, _skipped, errors = await _run_gdrive_selected(
+    indexed, _skipped, _unsup, errors = await _run_gdrive_selected(
         m, [("f1", "f1.xyz"), ("f2", "f2.xyz"), ("f3", "f3.xyz")]
     )
 
@@ -299,7 +299,7 @@ async def test_gdrive_zero_quota_rejects_all(gdrive_selected_mocks):
             None,
         )
 
-    indexed, _skipped, errors = await _run_gdrive_selected(
+    indexed, _skipped, _unsup, errors = await _run_gdrive_selected(
         m, [("f1", "f1.xyz"), ("f2", "f2.xyz")]
     )
 
@@ -552,7 +552,7 @@ async def test_onedrive_over_quota_rejected(onedrive_selected_mocks):
         None,
     )
 
-    indexed, _skipped, errors = await _run_onedrive_selected(m, [("big", "huge.pdf")])
+    indexed, _skipped, _unsup, errors = await _run_onedrive_selected(m, [("big", "huge.pdf")])
 
     assert indexed == 0
     assert len(errors) == 1
@@ -652,7 +652,7 @@ async def test_dropbox_over_quota_rejected(dropbox_selected_mocks):
         None,
     )
 
-    indexed, _skipped, errors = await _run_dropbox_selected(
+    indexed, _skipped, _unsup, errors = await _run_dropbox_selected(
         m, [("/huge.pdf", "huge.pdf")]
     )
 

From a624c86b04ff83336ae5d37cac3cf1095d63dcea Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Tue, 7 Apr 2026 05:11:15 +0530
Subject: [PATCH 148/202] refactor: update file skipping logic in Dropbox,
 Google Drive, and OneDrive connectors to return unsupported extension
 information

---
 .../app/connectors/dropbox/content_extractor.py             | 3 ++-
 .../app/connectors/google_drive/content_extractor.py        | 6 ++++--
 .../app/connectors/onedrive/content_extractor.py            | 3 ++-
 .../google_unification/test_drive_indexer_credentials.py    | 2 +-
 4 files changed, 9 insertions(+), 5 deletions(-)

diff --git a/surfsense_backend/app/connectors/dropbox/content_extractor.py b/surfsense_backend/app/connectors/dropbox/content_extractor.py
index 8e947eee7..8cbc3e417 100644
--- a/surfsense_backend/app/connectors/dropbox/content_extractor.py
+++ b/surfsense_backend/app/connectors/dropbox/content_extractor.py
@@ -53,7 +53,8 @@ async def download_and_extract_content(
     file_name = file.get("name", "Unknown")
     file_id = file.get("id", "")
 
-    if should_skip_file(file):
+    skip, _unsup_ext = should_skip_file(file)
+    if skip:
         return None, {}, "Skipping non-indexable item"
 
     logger.info(f"Downloading file for content extraction: {file_name}")
diff --git a/surfsense_backend/app/connectors/google_drive/content_extractor.py b/surfsense_backend/app/connectors/google_drive/content_extractor.py
index 10f008594..9f49d491d 100644
--- a/surfsense_backend/app/connectors/google_drive/content_extractor.py
+++ b/surfsense_backend/app/connectors/google_drive/content_extractor.py
@@ -43,7 +43,8 @@ async def download_and_extract_content(
     if should_skip_file(mime_type):
         return None, {}, f"Skipping {mime_type}"
 
-    if should_skip_by_extension(file_name):
+    ext_skip, _unsup_ext = should_skip_by_extension(file_name)
+    if ext_skip:
         return None, {}, f"Skipping unsupported extension: {file_name}"
 
     logger.info(f"Downloading file for content extraction: {file_name} ({mime_type})")
@@ -155,7 +156,8 @@ async def download_and_process_file(
     if should_skip_file(mime_type):
         return None, f"Skipping {mime_type}", None
 
-    if should_skip_by_extension(file_name):
+    ext_skip, _unsup_ext = should_skip_by_extension(file_name)
+    if ext_skip:
         return None, f"Skipping unsupported extension: {file_name}", None
 
     logger.info(f"Downloading file: {file_name} ({mime_type})")
diff --git a/surfsense_backend/app/connectors/onedrive/content_extractor.py b/surfsense_backend/app/connectors/onedrive/content_extractor.py
index 2355993eb..2238b8603 100644
--- a/surfsense_backend/app/connectors/onedrive/content_extractor.py
+++ b/surfsense_backend/app/connectors/onedrive/content_extractor.py
@@ -24,7 +24,8 @@ async def download_and_extract_content(
     item_id = file.get("id")
     file_name = file.get("name", "Unknown")
 
-    if should_skip_file(file):
+    skip, _unsup_ext = should_skip_file(file)
+    if skip:
         return None, {}, "Skipping non-indexable item"
 
     file_info = file.get("file", {})
diff --git a/surfsense_backend/tests/integration/google_unification/test_drive_indexer_credentials.py b/surfsense_backend/tests/integration/google_unification/test_drive_indexer_credentials.py
index 5bb0b6137..e669fa143 100644
--- a/surfsense_backend/tests/integration/google_unification/test_drive_indexer_credentials.py
+++ b/surfsense_backend/tests/integration/google_unification/test_drive_indexer_credentials.py
@@ -124,7 +124,7 @@ async def test_composio_connector_without_account_id_returns_error(
 
     maker = make_session_factory(async_engine)
     async with maker() as session:
-        count, _skipped, error = await index_google_drive_files(
+        count, _skipped, error, _unsupported = await index_google_drive_files(
             session=session,
             connector_id=data["connector_id"],
             search_space_id=data["search_space_id"],

From aba5f6a124bebb75039db1482c4727aabb24360a Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Tue, 7 Apr 2026 05:19:23 +0530
Subject: [PATCH 149/202] refactor: improve file handling logic in Dropbox and
 OneDrive connectors to include unsupported file extension information

---
 .../app/connectors/dropbox/folder_manager.py     |  6 ++++--
 .../app/connectors/onedrive/folder_manager.py    |  6 ++++--
 .../connector_indexers/test_dropbox_parallel.py  | 16 ++++++++--------
 3 files changed, 16 insertions(+), 12 deletions(-)

diff --git a/surfsense_backend/app/connectors/dropbox/folder_manager.py b/surfsense_backend/app/connectors/dropbox/folder_manager.py
index 5453c8785..f9aa78873 100644
--- a/surfsense_backend/app/connectors/dropbox/folder_manager.py
+++ b/surfsense_backend/app/connectors/dropbox/folder_manager.py
@@ -64,8 +64,10 @@ async def get_files_in_folder(
                         )
                         continue
                     files.extend(sub_files)
-            elif not should_skip_file(item):
-                files.append(item)
+            else:
+                skip, _unsup_ext = should_skip_file(item)
+                if not skip:
+                    files.append(item)
 
         return files, None
 
diff --git a/surfsense_backend/app/connectors/onedrive/folder_manager.py b/surfsense_backend/app/connectors/onedrive/folder_manager.py
index 6fa725ca1..a5d7fa713 100644
--- a/surfsense_backend/app/connectors/onedrive/folder_manager.py
+++ b/surfsense_backend/app/connectors/onedrive/folder_manager.py
@@ -71,8 +71,10 @@ async def get_files_in_folder(
                         )
                         continue
                     files.extend(sub_files)
-            elif not should_skip_file(item):
-                files.append(item)
+            else:
+                skip, _unsup_ext = should_skip_file(item)
+                if not skip:
+                    files.append(item)
 
         return files, None
 
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py b/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
index 14c16fce4..adac90085 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
@@ -345,7 +345,7 @@ async def test_full_scan_three_phase_counts(full_scan_mocks, monkeypatch):
 
     full_scan_mocks["download_and_index_mock"].return_value = (2, 0)
 
-    indexed, skipped = await _run_full_scan(
+    indexed, skipped, _unsupported = await _run_full_scan(
         full_scan_mocks, monkeypatch, page_files
     )
 
@@ -444,7 +444,7 @@ async def test_selected_files_single_file_indexed(selected_files_mocks):
     )
     selected_files_mocks["download_and_index_mock"].return_value = (1, 0)
 
-    indexed, skipped, errors = await _run_selected(
+    indexed, skipped, _unsupported, errors = await _run_selected(
         selected_files_mocks,
         [("/report.pdf", "report.pdf")],
     )
@@ -466,7 +466,7 @@ async def test_selected_files_fetch_failure_isolation(selected_files_mocks):
     )
     selected_files_mocks["download_and_index_mock"].return_value = (2, 0)
 
-    indexed, skipped, errors = await _run_selected(
+    indexed, skipped, _unsupported, errors = await _run_selected(
         selected_files_mocks,
         [("/first.txt", "first.txt"), ("/mid.txt", "mid.txt"), ("/third.txt", "third.txt")],
     )
@@ -496,7 +496,7 @@ async def test_selected_files_skip_rename_counting(selected_files_mocks):
     )
     selected_files_mocks["download_and_index_mock"].return_value = (2, 0)
 
-    indexed, skipped, errors = await _run_selected(
+    indexed, skipped, _unsupported, errors = await _run_selected(
         selected_files_mocks,
         [
             ("/unchanged.txt", "unchanged.txt"),
@@ -715,10 +715,10 @@ def orchestrator_mocks(monkeypatch):
 
     monkeypatch.setattr(_mod, "update_connector_last_indexed", AsyncMock())
 
-    full_scan_mock = AsyncMock(return_value=(5, 2))
+    full_scan_mock = AsyncMock(return_value=(5, 2, 0))
     monkeypatch.setattr(_mod, "_index_full_scan", full_scan_mock)
 
-    delta_sync_mock = AsyncMock(return_value=(3, 1, "delta-cursor-new"))
+    delta_sync_mock = AsyncMock(return_value=(3, 1, 0, "delta-cursor-new"))
     monkeypatch.setattr(_mod, "_index_with_delta_sync", delta_sync_mock)
 
     mock_client = MagicMock()
@@ -751,7 +751,7 @@ async def test_orchestrator_uses_delta_sync_when_cursor_and_last_indexed(
     mock_session = AsyncMock()
     mock_session.commit = AsyncMock()
 
-    indexed, skipped, error = await index_dropbox_files(
+    indexed, skipped, error, _unsupported = await index_dropbox_files(
         mock_session,
         _CONNECTOR_ID,
         _SEARCH_SPACE_ID,
@@ -779,7 +779,7 @@ async def test_orchestrator_falls_back_to_full_scan_without_cursor(
     mock_session = AsyncMock()
     mock_session.commit = AsyncMock()
 
-    indexed, skipped, error = await index_dropbox_files(
+    indexed, skipped, error, _unsupported = await index_dropbox_files(
         mock_session,
         _CONNECTOR_ID,
         _SEARCH_SPACE_ID,

From e4462292e456d38abca0c533b925b4d8a9bee24e Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Tue, 7 Apr 2026 05:30:10 +0530
Subject: [PATCH 150/202] refactor: update Google Drive indexer to return an
 additional unsupported file count, enhancing error reporting consistency

---
 .../tasks/connector_indexers/google_drive_indexer.py   |  2 +-
 .../connector-configs/views/connector-edit-view.tsx    | 10 ++--------
 2 files changed, 3 insertions(+), 9 deletions(-)

diff --git a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
index 0ded89102..a33859af5 100644
--- a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
@@ -758,7 +758,7 @@ async def _index_with_delta_sync(
 
     if not changes:
         logger.info("No changes detected since last sync")
-        return 0, 0
+        return 0, 0, 0
 
     logger.info(f"Processing {len(changes)} changes")
 
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
index 1e71b0a25..06fc2b497 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
@@ -417,14 +417,8 @@ export const ConnectorEditView: FC<ConnectorEditViewProps> = ({
 						disabled={isSaving || isDisconnecting}
 						className="text-xs sm:text-sm flex-1 sm:flex-initial h-12 sm:h-auto py-3 sm:py-2"
 					>
-						{isSaving ? (
-							<>
-								<Spinner size="sm" className="mr-2" />
-								Saving
-							</>
-						) : (
-							"Save Changes"
-						)}
+						{isSaving && <Spinner size="sm" className="mr-2" />}
+						Save Changes
 					</Button>
 				)}
 			</div>

From 1b87719a927f5ecac96b254bdcf68d8cc2af38d1 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Tue, 7 Apr 2026 05:36:29 +0530
Subject: [PATCH 151/202] refactor: enhance file skipping logic in Google Drive
 connector to check for Google Workspace files before unsupported extensions

---
 .../connectors/google_drive/content_extractor.py   | 14 ++++++++------
 .../connector_indexers/google_drive_indexer.py     |  8 +++++---
 2 files changed, 13 insertions(+), 9 deletions(-)

diff --git a/surfsense_backend/app/connectors/google_drive/content_extractor.py b/surfsense_backend/app/connectors/google_drive/content_extractor.py
index 9f49d491d..3e0bb39e5 100644
--- a/surfsense_backend/app/connectors/google_drive/content_extractor.py
+++ b/surfsense_backend/app/connectors/google_drive/content_extractor.py
@@ -43,9 +43,10 @@ async def download_and_extract_content(
     if should_skip_file(mime_type):
         return None, {}, f"Skipping {mime_type}"
 
-    ext_skip, _unsup_ext = should_skip_by_extension(file_name)
-    if ext_skip:
-        return None, {}, f"Skipping unsupported extension: {file_name}"
+    if not is_google_workspace_file(mime_type):
+        ext_skip, _unsup_ext = should_skip_by_extension(file_name)
+        if ext_skip:
+            return None, {}, f"Skipping unsupported extension: {file_name}"
 
     logger.info(f"Downloading file for content extraction: {file_name} ({mime_type})")
 
@@ -156,9 +157,10 @@ async def download_and_process_file(
     if should_skip_file(mime_type):
         return None, f"Skipping {mime_type}", None
 
-    ext_skip, _unsup_ext = should_skip_by_extension(file_name)
-    if ext_skip:
-        return None, f"Skipping unsupported extension: {file_name}", None
+    if not is_google_workspace_file(mime_type):
+        ext_skip, _unsup_ext = should_skip_by_extension(file_name)
+        if ext_skip:
+            return None, f"Skipping unsupported extension: {file_name}", None
 
     logger.info(f"Downloading file: {file_name} ({mime_type})")
 
diff --git a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
index a33859af5..9916e70a0 100644
--- a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
@@ -26,6 +26,7 @@ from app.connectors.google_drive import (
     get_start_page_token,
 )
 from app.connectors.google_drive.file_types import (
+    is_google_workspace_file,
     should_skip_by_extension,
     should_skip_file as skip_mime,
 )
@@ -81,9 +82,10 @@ async def _should_skip_file(
 
     if skip_mime(mime_type):
         return True, "folder/shortcut"
-    ext_skip, unsup_ext = should_skip_by_extension(file_name)
-    if ext_skip:
-        return True, f"unsupported:{unsup_ext}"
+    if not is_google_workspace_file(mime_type):
+        ext_skip, unsup_ext = should_skip_by_extension(file_name)
+        if ext_skip:
+            return True, f"unsupported:{unsup_ext}"
     if not file_id:
         return True, "missing file_id"
 

From 7f32dd068f0b4d9c2f3bad651d71e7420132495d Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Tue, 7 Apr 2026 05:40:40 +0530
Subject: [PATCH 152/202] refactor: update button rendering logic in connector
 views to improve loading state handling

---
 .../views/connector-connect-view.tsx           | 18 +++++++-----------
 .../views/connector-edit-view.tsx              | 18 ++++++------------
 .../views/connector-accounts-list-view.tsx     |  2 +-
 .../views/youtube-crawler-view.tsx             | 14 +++++---------
 4 files changed, 19 insertions(+), 33 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-connect-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-connect-view.tsx
index 596b98e93..8a0ef5ae1 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-connect-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-connect-view.tsx
@@ -144,18 +144,14 @@ export const ConnectorConnectView: FC<ConnectorConnectViewProps> = ({
 					type="button"
 					onClick={handleFormSubmit}
 					disabled={isSubmitting}
-					className="text-xs sm:text-sm min-w-[140px] disabled:opacity-50 disabled:cursor-not-allowed disabled:pointer-events-none"
+					className="relative text-xs sm:text-sm min-w-[140px] disabled:opacity-50 disabled:cursor-not-allowed disabled:pointer-events-none"
 				>
-					{isSubmitting ? (
-						<>
-							<Spinner size="sm" className="mr-2" />
-							Connecting
-						</>
-					) : connectorType === "MCP_CONNECTOR" ? (
-						"Connect"
-					) : (
-						`Connect ${getConnectorTypeDisplay(connectorType)}`
-					)}
+					<span className={isSubmitting ? "opacity-0" : ""}>
+						{connectorType === "MCP_CONNECTOR"
+							? "Connect"
+							: `Connect ${getConnectorTypeDisplay(connectorType)}`}
+					</span>
+					{isSubmitting && <Spinner size="sm" className="absolute" />}
 				</Button>
 			</div>
 		</div>
diff --git a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
index 06fc2b497..7308e1e26 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/connector-configs/views/connector-edit-view.tsx
@@ -369,16 +369,10 @@ export const ConnectorEditView: FC<ConnectorEditViewProps> = ({
 								size="sm"
 								onClick={handleDisconnectConfirm}
 								disabled={isDisconnecting}
-								className="text-xs sm:text-sm flex-1 sm:flex-initial h-10 sm:h-auto py-2 sm:py-2"
+								className="relative text-xs sm:text-sm flex-1 sm:flex-initial h-10 sm:h-auto py-2 sm:py-2"
 							>
-								{isDisconnecting ? (
-									<>
-										<Spinner size="sm" className="mr-2" />
-										Disconnecting
-									</>
-								) : (
-									"Confirm Disconnect"
-								)}
+								<span className={isDisconnecting ? "opacity-0" : ""}>Confirm Disconnect</span>
+								{isDisconnecting && <Spinner size="sm" className="absolute" />}
 							</Button>
 							<Button
 								variant="ghost"
@@ -415,10 +409,10 @@ export const ConnectorEditView: FC<ConnectorEditViewProps> = ({
 					<Button
 						onClick={onSave}
 						disabled={isSaving || isDisconnecting}
-						className="text-xs sm:text-sm flex-1 sm:flex-initial h-12 sm:h-auto py-3 sm:py-2"
+						className="relative text-xs sm:text-sm flex-1 sm:flex-initial h-12 sm:h-auto py-3 sm:py-2"
 					>
-						{isSaving && <Spinner size="sm" className="mr-2" />}
-						Save Changes
+						<span className={isSaving ? "opacity-0" : ""}>Save Changes</span>
+						{isSaving && <Spinner size="sm" className="absolute" />}
 					</Button>
 				)}
 			</div>
diff --git a/surfsense_web/components/assistant-ui/connector-popup/views/connector-accounts-list-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/views/connector-accounts-list-view.tsx
index 5dfc252c2..5e2b8452b 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/views/connector-accounts-list-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/views/connector-accounts-list-view.tsx
@@ -174,7 +174,7 @@ export const ConnectorAccountsListView: FC<ConnectorAccountsListViewProps> = ({
 							)}
 						</div>
 						<span className="text-xs sm:text-sm font-medium">
-							{isConnecting ? "Connecting" : buttonText}
+							{buttonText}
 						</span>
 					</button>
 				</div>
diff --git a/surfsense_web/components/assistant-ui/connector-popup/views/youtube-crawler-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/views/youtube-crawler-view.tsx
index 7ec85f4d3..c16072bca 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/views/youtube-crawler-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/views/youtube-crawler-view.tsx
@@ -335,16 +335,12 @@ export const YouTubeCrawlerView: FC<YouTubeCrawlerViewProps> = ({ searchSpaceId,
 				<Button
 					onClick={handleSubmit}
 					disabled={isSubmitting || isFetchingPlaylist || videoTags.length === 0}
-					className="text-xs sm:text-sm min-w-[140px] disabled:opacity-50 disabled:cursor-not-allowed disabled:pointer-events-none"
+					className="relative text-xs sm:text-sm min-w-[140px] disabled:opacity-50 disabled:cursor-not-allowed disabled:pointer-events-none"
 				>
-					{isSubmitting ? (
-						<>
-							<Spinner size="sm" className="mr-2" />
-							{t("processing")}
-						</>
-					) : (
-						t("submit")
-					)}
+					<span className={isSubmitting ? "opacity-0" : ""}>
+						{t("submit")}
+					</span>
+					{isSubmitting && <Spinner size="sm" className="absolute" />}
 				</Button>
 			</div>
 		</div>

From 5803fe79dac41715be5b6a961cd978d0998a9069 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Tue, 7 Apr 2026 05:43:34 +0530
Subject: [PATCH 153/202] refactor: update filename handling in Google Drive
 connector to include Google Workspace file extensions, improving content
 extraction accuracy

---
 .../app/connectors/google_drive/content_extractor.py        | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/surfsense_backend/app/connectors/google_drive/content_extractor.py b/surfsense_backend/app/connectors/google_drive/content_extractor.py
index 3e0bb39e5..025c3831a 100644
--- a/surfsense_backend/app/connectors/google_drive/content_extractor.py
+++ b/surfsense_backend/app/connectors/google_drive/content_extractor.py
@@ -100,7 +100,8 @@ async def download_and_extract_content(
             if error:
                 return None, drive_metadata, error
 
-        markdown = await _parse_file_to_markdown(temp_file_path, file_name)
+        etl_filename = file_name + extension if is_google_workspace_file(mime_type) else file_name
+        markdown = await _parse_file_to_markdown(temp_file_path, etl_filename)
         return markdown, drive_metadata, None
 
     except Exception as e:
@@ -232,10 +233,11 @@ async def download_and_process_file(
                 "."
             )[-1]
 
+        etl_filename = file_name + extension if is_google_workspace_file(mime_type) else file_name
         logger.info(f"Processing {file_name} with Surfsense's file processor")
         await process_file_in_background(
             file_path=temp_file_path,
-            filename=file_name,
+            filename=etl_filename,
             search_space_id=search_space_id,
             user_id=user_id,
             session=session,

From 0a26a6c5bb900d5e660b09a88665242c50c31f1f Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Tue, 7 Apr 2026 05:55:39 +0530
Subject: [PATCH 154/202] chore: ran linting

---
 .../app/connectors/dropbox/client.py          |  14 +-
 .../google_drive/content_extractor.py         |   8 +-
 .../app/etl_pipeline/etl_pipeline_service.py  |   9 +-
 .../app/etl_pipeline/file_classifier.py       | 105 ++++++++++---
 .../app/etl_pipeline/parsers/llamacloud.py    |  12 +-
 .../app/routes/autocomplete_routes.py         |   9 +-
 .../routes/search_source_connectors_routes.py |  14 +-
 .../services/vision_autocomplete_service.py   |  65 +++++---
 .../connector_indexers/dropbox_indexer.py     |  17 +--
 .../google_drive_indexer.py                   |  13 +-
 .../local_folder_indexer.py                   |   3 -
 .../connector_indexers/onedrive_indexer.py    |   6 +-
 .../document_processors/file_processors.py    |  12 +-
 .../app/utils/file_extensions.py              |  97 +++++++++---
 .../test_content_extraction.py                |  20 +--
 .../test_dropbox_parallel.py                  |  59 +++++--
 .../test_google_drive_parallel.py             |  10 +-
 .../connector_indexers/test_page_limits.py    |   8 +-
 .../unit/connectors/test_dropbox_client.py    |  10 +-
 .../connectors/test_dropbox_file_types.py     | 105 ++++++++-----
 .../test_google_drive_file_types.py           |  55 ++++---
 .../connectors/test_onedrive_file_types.py    |  49 ++++--
 .../tests/unit/etl_pipeline/conftest.py       |   4 +-
 .../etl_pipeline/test_etl_pipeline_service.py | 113 ++++++++------
 .../services/test_docling_image_support.py    |  41 ++---
 .../tests/unit/utils/test_file_extensions.py  |  84 +++++++---
 .../components/DesktopContent.tsx             |   8 +-
 .../app/desktop/permissions/page.tsx          |  15 +-
 .../app/desktop/suggestion/layout.tsx         |   6 +-
 surfsense_web/app/desktop/suggestion/page.tsx |  50 +++---
 .../app/desktop/suggestion/suggestion.css     | 144 +++++++++---------
 .../views/connector-accounts-list-view.tsx    |   4 +-
 .../views/youtube-crawler-view.tsx            |   4 +-
 .../assistant-ui/document-upload-popup.tsx    |   4 +-
 .../components/assistant-ui/image.tsx         | 134 ++++++++--------
 .../components/assistant-ui/thread-list.tsx   |   4 +-
 .../components/assistant-ui/tool-fallback.tsx |   3 +-
 .../comment-composer/comment-composer.tsx     |  24 ++-
 .../components/documents/DocumentNode.tsx     |  20 +--
 .../components/documents/FolderTreeView.tsx   |  15 +-
 .../components/editor/plate-editor.tsx        |  19 +--
 .../components/homepage/use-cases-grid.tsx    |  16 +-
 .../layout/providers/LayoutDataProvider.tsx   |   3 +-
 .../ui/sidebar/AllPrivateChatsSidebar.tsx     |  36 ++---
 .../ui/sidebar/AllSharedChatsSidebar.tsx      |  36 ++---
 surfsense_web/components/markdown-viewer.tsx  |  51 ++++---
 .../settings/user-settings-dialog.tsx         |   2 +-
 .../components/sources/DocumentUploadTab.tsx  |  49 +++---
 .../tool-ui/citation/citation-list.tsx        |  31 ++--
 .../components/tool-ui/citation/citation.tsx  |  26 ++--
 surfsense_web/components/ui/animated-tabs.tsx |   5 +-
 surfsense_web/components/ui/toggle-group.tsx  |  10 +-
 surfsense_web/contexts/LocaleContext.tsx      |  13 +-
 surfsense_web/types/window.d.ts               |  13 +-
 54 files changed, 1015 insertions(+), 672 deletions(-)

diff --git a/surfsense_backend/app/connectors/dropbox/client.py b/surfsense_backend/app/connectors/dropbox/client.py
index b177c2f8d..e89800191 100644
--- a/surfsense_backend/app/connectors/dropbox/client.py
+++ b/surfsense_backend/app/connectors/dropbox/client.py
@@ -225,9 +225,7 @@ class DropboxClient:
 
         return all_items, None
 
-    async def get_latest_cursor(
-        self, path: str = ""
-    ) -> tuple[str | None, str | None]:
+    async def get_latest_cursor(self, path: str = "") -> tuple[str | None, str | None]:
         """Get a cursor representing the current state of a folder.
 
         Uses /2/files/list_folder/get_latest_cursor so we can later call
@@ -251,9 +249,7 @@ class DropboxClient:
         """
         all_entries: list[dict[str, Any]] = []
 
-        resp = await self._request(
-            "/2/files/list_folder/continue", {"cursor": cursor}
-        )
+        resp = await self._request("/2/files/list_folder/continue", {"cursor": cursor})
         if resp.status_code == 401:
             return [], None, "Dropbox authentication expired (401)"
         if resp.status_code != 200:
@@ -268,7 +264,11 @@ class DropboxClient:
                 "/2/files/list_folder/continue", {"cursor": cursor}
             )
             if resp.status_code != 200:
-                return all_entries, data.get("cursor"), f"Pagination failed: {resp.status_code}"
+                return (
+                    all_entries,
+                    data.get("cursor"),
+                    f"Pagination failed: {resp.status_code}",
+                )
             data = resp.json()
             all_entries.extend(data.get("entries", []))
 
diff --git a/surfsense_backend/app/connectors/google_drive/content_extractor.py b/surfsense_backend/app/connectors/google_drive/content_extractor.py
index 025c3831a..83ff32e82 100644
--- a/surfsense_backend/app/connectors/google_drive/content_extractor.py
+++ b/surfsense_backend/app/connectors/google_drive/content_extractor.py
@@ -100,7 +100,9 @@ async def download_and_extract_content(
             if error:
                 return None, drive_metadata, error
 
-        etl_filename = file_name + extension if is_google_workspace_file(mime_type) else file_name
+        etl_filename = (
+            file_name + extension if is_google_workspace_file(mime_type) else file_name
+        )
         markdown = await _parse_file_to_markdown(temp_file_path, etl_filename)
         return markdown, drive_metadata, None
 
@@ -233,7 +235,9 @@ async def download_and_process_file(
                 "."
             )[-1]
 
-        etl_filename = file_name + extension if is_google_workspace_file(mime_type) else file_name
+        etl_filename = (
+            file_name + extension if is_google_workspace_file(mime_type) else file_name
+        )
         logger.info(f"Processing {file_name} with Surfsense's file processor")
         await process_file_in_background(
             file_path=temp_file_path,
diff --git a/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py b/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py
index a0041c843..6e7ab3c4c 100644
--- a/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py
+++ b/surfsense_backend/app/etl_pipeline/etl_pipeline_service.py
@@ -1,6 +1,9 @@
 from app.config import config as app_config
 from app.etl_pipeline.etl_document import EtlRequest, EtlResult
-from app.etl_pipeline.exceptions import EtlServiceUnavailableError, EtlUnsupportedFileError
+from app.etl_pipeline.exceptions import (
+    EtlServiceUnavailableError,
+    EtlUnsupportedFileError,
+)
 from app.etl_pipeline.file_classifier import FileCategory, classify_file
 from app.etl_pipeline.parsers.audio import transcribe_audio
 from app.etl_pipeline.parsers.direct_convert import convert_file_directly
@@ -78,9 +81,7 @@ class EtlPipelineService:
                 request.file_path, request.estimated_pages
             )
         else:
-            raise EtlServiceUnavailableError(
-                f"Unknown ETL_SERVICE: {etl_service}"
-            )
+            raise EtlServiceUnavailableError(f"Unknown ETL_SERVICE: {etl_service}")
 
         return EtlResult(
             markdown_content=content,
diff --git a/surfsense_backend/app/etl_pipeline/file_classifier.py b/surfsense_backend/app/etl_pipeline/file_classifier.py
index bc7b4537c..4e690bcdc 100644
--- a/surfsense_backend/app/etl_pipeline/file_classifier.py
+++ b/surfsense_backend/app/etl_pipeline/file_classifier.py
@@ -1,27 +1,96 @@
 from enum import Enum
 from pathlib import PurePosixPath
 
-from app.utils.file_extensions import DOCUMENT_EXTENSIONS, get_document_extensions_for_service
+from app.utils.file_extensions import (
+    DOCUMENT_EXTENSIONS,
+    get_document_extensions_for_service,
+)
 
 PLAINTEXT_EXTENSIONS = frozenset(
     {
-        ".md", ".markdown", ".txt", ".text",
-        ".json", ".jsonl", ".yaml", ".yml", ".toml", ".ini", ".cfg", ".conf", ".xml",
-        ".css", ".scss", ".less", ".sass",
-        ".py", ".pyw", ".pyi", ".pyx",
-        ".js", ".jsx", ".ts", ".tsx", ".mjs", ".cjs",
-        ".java", ".kt", ".kts", ".scala", ".groovy",
-        ".c", ".h", ".cpp", ".cxx", ".cc", ".hpp", ".hxx",
-        ".cs", ".fs", ".fsx",
-        ".go", ".rs", ".rb", ".php", ".pl", ".pm", ".lua", ".swift",
-        ".m", ".mm", ".r", ".jl",
-        ".sh", ".bash", ".zsh", ".fish", ".bat", ".cmd", ".ps1",
-        ".sql", ".graphql", ".gql",
-        ".env", ".gitignore", ".dockerignore", ".editorconfig",
-        ".makefile", ".cmake",
-        ".log", ".rst", ".tex", ".bib", ".org", ".adoc", ".asciidoc",
-        ".vue", ".svelte", ".astro",
-        ".tf", ".hcl", ".proto",
+        ".md",
+        ".markdown",
+        ".txt",
+        ".text",
+        ".json",
+        ".jsonl",
+        ".yaml",
+        ".yml",
+        ".toml",
+        ".ini",
+        ".cfg",
+        ".conf",
+        ".xml",
+        ".css",
+        ".scss",
+        ".less",
+        ".sass",
+        ".py",
+        ".pyw",
+        ".pyi",
+        ".pyx",
+        ".js",
+        ".jsx",
+        ".ts",
+        ".tsx",
+        ".mjs",
+        ".cjs",
+        ".java",
+        ".kt",
+        ".kts",
+        ".scala",
+        ".groovy",
+        ".c",
+        ".h",
+        ".cpp",
+        ".cxx",
+        ".cc",
+        ".hpp",
+        ".hxx",
+        ".cs",
+        ".fs",
+        ".fsx",
+        ".go",
+        ".rs",
+        ".rb",
+        ".php",
+        ".pl",
+        ".pm",
+        ".lua",
+        ".swift",
+        ".m",
+        ".mm",
+        ".r",
+        ".jl",
+        ".sh",
+        ".bash",
+        ".zsh",
+        ".fish",
+        ".bat",
+        ".cmd",
+        ".ps1",
+        ".sql",
+        ".graphql",
+        ".gql",
+        ".env",
+        ".gitignore",
+        ".dockerignore",
+        ".editorconfig",
+        ".makefile",
+        ".cmake",
+        ".log",
+        ".rst",
+        ".tex",
+        ".bib",
+        ".org",
+        ".adoc",
+        ".asciidoc",
+        ".vue",
+        ".svelte",
+        ".astro",
+        ".tf",
+        ".hcl",
+        ".proto",
     }
 )
 
diff --git a/surfsense_backend/app/etl_pipeline/parsers/llamacloud.py b/surfsense_backend/app/etl_pipeline/parsers/llamacloud.py
index 5115aebea..ae2a34234 100644
--- a/surfsense_backend/app/etl_pipeline/parsers/llamacloud.py
+++ b/surfsense_backend/app/etl_pipeline/parsers/llamacloud.py
@@ -66,16 +66,12 @@ async def parse_with_llamacloud(file_path: str, estimated_pages: int) -> str:
                     )
 
                 if hasattr(result, "get_markdown_documents"):
-                    markdown_docs = result.get_markdown_documents(
-                        split_by_page=False
-                    )
+                    markdown_docs = result.get_markdown_documents(split_by_page=False)
                     if markdown_docs and hasattr(markdown_docs[0], "text"):
                         return markdown_docs[0].text
                     if hasattr(result, "pages") and result.pages:
                         return "\n\n".join(
-                            p.md
-                            for p in result.pages
-                            if hasattr(p, "md") and p.md
+                            p.md for p in result.pages if hasattr(p, "md") and p.md
                         )
                     return str(result)
 
@@ -83,9 +79,7 @@ async def parse_with_llamacloud(file_path: str, estimated_pages: int) -> str:
                     if result and hasattr(result[0], "text"):
                         return result[0].text
                     return "\n\n".join(
-                        doc.page_content
-                        if hasattr(doc, "page_content")
-                        else str(doc)
+                        doc.page_content if hasattr(doc, "page_content") else str(doc)
                         for doc in result
                     )
 
diff --git a/surfsense_backend/app/routes/autocomplete_routes.py b/surfsense_backend/app/routes/autocomplete_routes.py
index bb56709cb..a11b7dbc1 100644
--- a/surfsense_backend/app/routes/autocomplete_routes.py
+++ b/surfsense_backend/app/routes/autocomplete_routes.py
@@ -1,4 +1,4 @@
-from fastapi import APIRouter, Depends, HTTPException
+from fastapi import APIRouter, Depends
 from fastapi.responses import StreamingResponse
 from pydantic import BaseModel, Field
 from sqlalchemy.ext.asyncio import AsyncSession
@@ -31,8 +31,11 @@ async def vision_autocomplete_stream(
 
     return StreamingResponse(
         stream_vision_autocomplete(
-            body.screenshot, body.search_space_id, session,
-            app_name=body.app_name, window_title=body.window_title,
+            body.screenshot,
+            body.search_space_id,
+            session,
+            app_name=body.app_name,
+            window_title=body.window_title,
         ),
         media_type="text/event-stream",
         headers={
diff --git a/surfsense_backend/app/routes/search_source_connectors_routes.py b/surfsense_backend/app/routes/search_source_connectors_routes.py
index a30eb7297..bb20da65d 100644
--- a/surfsense_backend/app/routes/search_source_connectors_routes.py
+++ b/surfsense_backend/app/routes/search_source_connectors_routes.py
@@ -2647,7 +2647,12 @@ async def run_onedrive_indexing(
                 stage="fetching",
             )
 
-        total_indexed, total_skipped, error_message, total_unsupported = await index_onedrive_files(
+        (
+            total_indexed,
+            total_skipped,
+            error_message,
+            total_unsupported,
+        ) = await index_onedrive_files(
             session,
             connector_id,
             search_space_id,
@@ -2756,7 +2761,12 @@ async def run_dropbox_indexing(
                 stage="fetching",
             )
 
-        total_indexed, total_skipped, error_message, total_unsupported = await index_dropbox_files(
+        (
+            total_indexed,
+            total_skipped,
+            error_message,
+            total_unsupported,
+        ) = await index_dropbox_files(
             session,
             connector_id,
             search_space_id,
diff --git a/surfsense_backend/app/services/vision_autocomplete_service.py b/surfsense_backend/app/services/vision_autocomplete_service.py
index f24a5c848..7e9408be7 100644
--- a/surfsense_backend/app/services/vision_autocomplete_service.py
+++ b/surfsense_backend/app/services/vision_autocomplete_service.py
@@ -1,5 +1,5 @@
 import logging
-from typing import AsyncGenerator
+from collections.abc import AsyncGenerator
 
 from langchain_core.messages import HumanMessage, SystemMessage
 from sqlalchemy.ext.asyncio import AsyncSession
@@ -68,8 +68,10 @@ def _is_vision_unsupported_error(e: Exception) -> bool:
 
 
 async def _extract_query_from_screenshot(
-    llm, screenshot_data_url: str,
-    app_name: str = "", window_title: str = "",
+    llm,
+    screenshot_data_url: str,
+    app_name: str = "",
+    window_title: str = "",
 ) -> str | None:
     """Ask the Vision LLM to describe what the user is working on.
 
@@ -78,18 +80,26 @@ async def _extract_query_from_screenshot(
     """
     if app_name:
         prompt_text = EXTRACT_QUERY_PROMPT_WITH_APP.format(
-            app_name=app_name, window_title=window_title,
+            app_name=app_name,
+            window_title=window_title,
         )
     else:
         prompt_text = EXTRACT_QUERY_PROMPT
 
     try:
-        response = await llm.ainvoke([
-            HumanMessage(content=[
-                {"type": "text", "text": prompt_text},
-                {"type": "image_url", "image_url": {"url": screenshot_data_url}},
-            ]),
-        ])
+        response = await llm.ainvoke(
+            [
+                HumanMessage(
+                    content=[
+                        {"type": "text", "text": prompt_text},
+                        {
+                            "type": "image_url",
+                            "image_url": {"url": screenshot_data_url},
+                        },
+                    ]
+                ),
+            ]
+        )
         query = response.content.strip() if hasattr(response, "content") else ""
         return query if query else None
     except Exception as e:
@@ -167,10 +177,15 @@ async def stream_vision_autocomplete(
     kb_context = ""
     try:
         query = await _extract_query_from_screenshot(
-            llm, screenshot_data_url, app_name=app_name, window_title=window_title,
+            llm,
+            screenshot_data_url,
+            app_name=app_name,
+            window_title=window_title,
         )
     except Exception as e:
-        logger.warning(f"Vision autocomplete: selected model does not support vision: {e}")
+        logger.warning(
+            f"Vision autocomplete: selected model does not support vision: {e}"
+        )
         yield streaming.format_message_start()
         yield streaming.format_error(vision_error_msg)
         yield streaming.format_done()
@@ -183,16 +198,18 @@ async def stream_vision_autocomplete(
 
     messages = [
         SystemMessage(content=system_prompt),
-        HumanMessage(content=[
-            {
-                "type": "text",
-                "text": "Analyze this screenshot. Understand the full context of what the user is working on, then generate the text they most likely want to write in the active text area.",
-            },
-            {
-                "type": "image_url",
-                "image_url": {"url": screenshot_data_url},
-            },
-        ]),
+        HumanMessage(
+            content=[
+                {
+                    "type": "text",
+                    "text": "Analyze this screenshot. Understand the full context of what the user is working on, then generate the text they most likely want to write in the active text area.",
+                },
+                {
+                    "type": "image_url",
+                    "image_url": {"url": screenshot_data_url},
+                },
+            ]
+        ),
     ]
 
     text_started = False
@@ -217,7 +234,9 @@ async def stream_vision_autocomplete(
             yield streaming.format_text_end(text_id)
 
         if _is_vision_unsupported_error(e):
-            logger.warning(f"Vision autocomplete: selected model does not support vision: {e}")
+            logger.warning(
+                f"Vision autocomplete: selected model does not support vision: {e}"
+            )
             yield streaming.format_error(vision_error_msg)
         else:
             logger.error(f"Vision autocomplete streaming error: {e}", exc_info=True)
diff --git a/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py b/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
index 8d2a45e03..4a49944c2 100644
--- a/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/dropbox_indexer.py
@@ -254,9 +254,7 @@ async def _download_and_index(
     return batch_indexed, download_failed + batch_failed
 
 
-async def _remove_document(
-    session: AsyncSession, file_id: str, search_space_id: int
-):
+async def _remove_document(session: AsyncSession, file_id: str, search_space_id: int):
     """Remove a document that was deleted in Dropbox."""
     primary_hash = compute_identifier_hash(
         DocumentType.DROPBOX_FILE.value, file_id, search_space_id
@@ -268,8 +266,7 @@ async def _remove_document(
             select(Document).where(
                 Document.search_space_id == search_space_id,
                 Document.document_type == DocumentType.DROPBOX_FILE,
-                cast(Document.document_metadata["dropbox_file_id"], String)
-                == file_id,
+                cast(Document.document_metadata["dropbox_file_id"], String) == file_id,
             )
         )
         existing = result.scalar_one_or_none()
@@ -671,9 +668,7 @@ async def index_dropbox_files(
 
             saved_cursor = folder_cursors.get(folder_path)
             can_use_delta = (
-                use_delta_sync
-                and saved_cursor
-                and connector.last_indexed_at
+                use_delta_sync and saved_cursor and connector.last_indexed_at
             )
 
             if can_use_delta:
@@ -739,7 +734,11 @@ async def index_dropbox_files(
         await task_logger.log_task_success(
             log_entry,
             f"Successfully completed Dropbox indexing for connector {connector_id}",
-            {"files_processed": total_indexed, "files_skipped": total_skipped, "files_unsupported": total_unsupported},
+            {
+                "files_processed": total_indexed,
+                "files_skipped": total_skipped,
+                "files_unsupported": total_unsupported,
+            },
         )
         logger.info(
             f"Dropbox indexing completed: {total_indexed} indexed, "
diff --git a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
index 9916e70a0..b11087fe6 100644
--- a/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/google_drive_indexer.py
@@ -1010,7 +1010,11 @@ async def index_google_drive_files(
             documents_unsupported += ru
         else:
             logger.info(f"Using full scan for connector {connector_id}")
-            documents_indexed, documents_skipped, documents_unsupported = await _index_full_scan(
+            (
+                documents_indexed,
+                documents_skipped,
+                documents_unsupported,
+            ) = await _index_full_scan(
                 drive_client,
                 session,
                 connector,
@@ -1301,7 +1305,12 @@ async def index_google_drive_selected_files(
                 log_entry,
                 f"Batch file indexing completed with {len(errors)} error(s)",
                 "; ".join(errors),
-                {"indexed": indexed, "skipped": skipped, "unsupported": unsupported, "error_count": len(errors)},
+                {
+                    "indexed": indexed,
+                    "skipped": skipped,
+                    "unsupported": unsupported,
+                    "error_count": len(errors),
+                },
             )
         else:
             await task_logger.log_task_success(
diff --git a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
index f4366fb78..7f42f4638 100644
--- a/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/local_folder_indexer.py
@@ -23,7 +23,6 @@ from sqlalchemy import select
 from sqlalchemy.exc import IntegrityError, SQLAlchemyError
 from sqlalchemy.ext.asyncio import AsyncSession
 
-from app.config import config
 from app.db import (
     Document,
     DocumentStatus,
@@ -153,8 +152,6 @@ def scan_folder(
     return files
 
 
-
-
 async def _read_file_content(file_path: str, filename: str) -> str:
     """Read file content via the unified ETL pipeline.
 
diff --git a/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py b/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py
index b26442490..06517f542 100644
--- a/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py
+++ b/surfsense_backend/app/tasks/connector_indexers/onedrive_indexer.py
@@ -762,7 +762,11 @@ async def index_onedrive_files(
         await task_logger.log_task_success(
             log_entry,
             f"Successfully completed OneDrive indexing for connector {connector_id}",
-            {"files_processed": total_indexed, "files_skipped": total_skipped, "files_unsupported": total_unsupported},
+            {
+                "files_processed": total_indexed,
+                "files_skipped": total_skipped,
+                "files_unsupported": total_unsupported,
+            },
         )
         logger.info(
             f"OneDrive indexing completed: {total_indexed} indexed, "
diff --git a/surfsense_backend/app/tasks/document_processors/file_processors.py b/surfsense_backend/app/tasks/document_processors/file_processors.py
index a9a6b62be..c765dbd87 100644
--- a/surfsense_backend/app/tasks/document_processors/file_processors.py
+++ b/surfsense_backend/app/tasks/document_processors/file_processors.py
@@ -292,8 +292,10 @@ async def process_file_in_background(
     )
 
     try:
-        from app.etl_pipeline.file_classifier import FileCategory as EtlFileCategory
-        from app.etl_pipeline.file_classifier import classify_file as etl_classify
+        from app.etl_pipeline.file_classifier import (
+            FileCategory as EtlFileCategory,
+            classify_file as etl_classify,
+        )
 
         category = etl_classify(filename)
 
@@ -345,8 +347,10 @@ async def _extract_file_content(
     """
     from app.etl_pipeline.etl_document import EtlRequest
     from app.etl_pipeline.etl_pipeline_service import EtlPipelineService
-    from app.etl_pipeline.file_classifier import FileCategory
-    from app.etl_pipeline.file_classifier import classify_file as etl_classify
+    from app.etl_pipeline.file_classifier import (
+        FileCategory,
+        classify_file as etl_classify,
+    )
 
     category = etl_classify(filename)
     estimated_pages = 0
diff --git a/surfsense_backend/app/utils/file_extensions.py b/surfsense_backend/app/utils/file_extensions.py
index 5eed36872..8d432ce56 100644
--- a/surfsense_backend/app/utils/file_extensions.py
+++ b/surfsense_backend/app/utils/file_extensions.py
@@ -15,30 +15,83 @@ from pathlib import PurePosixPath
 # Per-parser document extension sets (from official documentation)
 # ---------------------------------------------------------------------------
 
-DOCLING_DOCUMENT_EXTENSIONS: frozenset[str] = frozenset({
-    ".pdf",
-    ".docx", ".xlsx", ".pptx",
-    ".png", ".jpg", ".jpeg", ".tiff", ".tif", ".bmp", ".webp",
-})
+DOCLING_DOCUMENT_EXTENSIONS: frozenset[str] = frozenset(
+    {
+        ".pdf",
+        ".docx",
+        ".xlsx",
+        ".pptx",
+        ".png",
+        ".jpg",
+        ".jpeg",
+        ".tiff",
+        ".tif",
+        ".bmp",
+        ".webp",
+    }
+)
 
-LLAMAPARSE_DOCUMENT_EXTENSIONS: frozenset[str] = frozenset({
-    ".pdf",
-    ".docx", ".doc", ".xlsx", ".xls", ".pptx", ".ppt",
-    ".docm", ".dot", ".dotm", ".pptm", ".pot", ".potx",
-    ".xlsm", ".xlsb", ".xlw",
-    ".rtf", ".epub",
-    ".png", ".jpg", ".jpeg", ".gif", ".bmp", ".tiff", ".tif", ".webp", ".svg",
-    ".odt", ".ods", ".odp",
-    ".hwp", ".hwpx",
-})
+LLAMAPARSE_DOCUMENT_EXTENSIONS: frozenset[str] = frozenset(
+    {
+        ".pdf",
+        ".docx",
+        ".doc",
+        ".xlsx",
+        ".xls",
+        ".pptx",
+        ".ppt",
+        ".docm",
+        ".dot",
+        ".dotm",
+        ".pptm",
+        ".pot",
+        ".potx",
+        ".xlsm",
+        ".xlsb",
+        ".xlw",
+        ".rtf",
+        ".epub",
+        ".png",
+        ".jpg",
+        ".jpeg",
+        ".gif",
+        ".bmp",
+        ".tiff",
+        ".tif",
+        ".webp",
+        ".svg",
+        ".odt",
+        ".ods",
+        ".odp",
+        ".hwp",
+        ".hwpx",
+    }
+)
 
-UNSTRUCTURED_DOCUMENT_EXTENSIONS: frozenset[str] = frozenset({
-    ".pdf",
-    ".docx", ".doc", ".xlsx", ".xls", ".pptx", ".ppt",
-    ".png", ".jpg", ".jpeg", ".bmp", ".tiff", ".tif", ".heic",
-    ".rtf", ".epub", ".odt",
-    ".eml", ".msg", ".p7s",
-})
+UNSTRUCTURED_DOCUMENT_EXTENSIONS: frozenset[str] = frozenset(
+    {
+        ".pdf",
+        ".docx",
+        ".doc",
+        ".xlsx",
+        ".xls",
+        ".pptx",
+        ".ppt",
+        ".png",
+        ".jpg",
+        ".jpeg",
+        ".bmp",
+        ".tiff",
+        ".tif",
+        ".heic",
+        ".rtf",
+        ".epub",
+        ".odt",
+        ".eml",
+        ".msg",
+        ".p7s",
+    }
+)
 
 # ---------------------------------------------------------------------------
 # Union (used by classify_file for routing) + service lookup
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_content_extraction.py b/surfsense_backend/tests/unit/connector_indexers/test_content_extraction.py
index 49f9a217a..cd112e09f 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_content_extraction.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_content_extraction.py
@@ -6,7 +6,6 @@ real so we know the full path from "cloud gives us bytes" to "we get markdown
 back" actually works.
 """
 
-import os
 from unittest.mock import AsyncMock, MagicMock
 
 import pytest
@@ -21,6 +20,7 @@ _CSV_CONTENT = "name,age\nAlice,30\nBob,25\n"
 # Helpers
 # ---------------------------------------------------------------------------
 
+
 async def _write_file(dest_path: str, content: str) -> None:
     """Simulate a cloud client writing downloaded bytes to disk."""
     with open(dest_path, "w", encoding="utf-8") as f:
@@ -43,8 +43,8 @@ def _make_download_side_effect(content: str):
 # Google Drive
 # ===================================================================
 
-class TestGoogleDriveContentExtraction:
 
+class TestGoogleDriveContentExtraction:
     async def test_txt_file_returns_markdown(self):
         from app.connectors.google_drive.content_extractor import (
             download_and_extract_content,
@@ -76,7 +76,7 @@ class TestGoogleDriveContentExtraction:
 
         file = {"id": "f2", "name": "data.csv", "mimeType": "text/csv"}
 
-        markdown, metadata, error = await download_and_extract_content(client, file)
+        markdown, _metadata, error = await download_and_extract_content(client, file)
 
         assert error is None
         assert "Alice" in markdown
@@ -93,7 +93,7 @@ class TestGoogleDriveContentExtraction:
 
         file = {"id": "f3", "name": "doc.txt", "mimeType": "text/plain"}
 
-        markdown, metadata, error = await download_and_extract_content(client, file)
+        markdown, _metadata, error = await download_and_extract_content(client, file)
 
         assert markdown is None
         assert error == "Network timeout"
@@ -103,8 +103,8 @@ class TestGoogleDriveContentExtraction:
 # OneDrive
 # ===================================================================
 
-class TestOneDriveContentExtraction:
 
+class TestOneDriveContentExtraction:
     async def test_txt_file_returns_markdown(self):
         from app.connectors.onedrive.content_extractor import (
             download_and_extract_content,
@@ -144,7 +144,7 @@ class TestOneDriveContentExtraction:
             "file": {"mimeType": "text/csv"},
         }
 
-        markdown, metadata, error = await download_and_extract_content(client, file)
+        markdown, _metadata, error = await download_and_extract_content(client, file)
 
         assert error is None
         assert "Alice" in markdown
@@ -164,7 +164,7 @@ class TestOneDriveContentExtraction:
             "file": {"mimeType": "text/plain"},
         }
 
-        markdown, metadata, error = await download_and_extract_content(client, file)
+        markdown, _metadata, error = await download_and_extract_content(client, file)
 
         assert markdown is None
         assert error == "403 Forbidden"
@@ -174,8 +174,8 @@ class TestOneDriveContentExtraction:
 # Dropbox
 # ===================================================================
 
-class TestDropboxContentExtraction:
 
+class TestDropboxContentExtraction:
     async def test_txt_file_returns_markdown(self):
         from app.connectors.dropbox.content_extractor import (
             download_and_extract_content,
@@ -217,7 +217,7 @@ class TestDropboxContentExtraction:
             "path_lower": "/data.csv",
         }
 
-        markdown, metadata, error = await download_and_extract_content(client, file)
+        markdown, _metadata, error = await download_and_extract_content(client, file)
 
         assert error is None
         assert "Alice" in markdown
@@ -238,7 +238,7 @@ class TestDropboxContentExtraction:
             "path_lower": "/big.txt",
         }
 
-        markdown, metadata, error = await download_and_extract_content(client, file)
+        markdown, _metadata, error = await download_and_extract_content(client, file)
 
         assert markdown is None
         assert error == "Rate limited"
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py b/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
index adac90085..f72135d05 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_dropbox_parallel.py
@@ -265,6 +265,7 @@ def full_scan_mocks(mock_dropbox_client, monkeypatch):
 
     async def _fake_skip(session, file, search_space_id):
         from app.connectors.dropbox.file_types import should_skip_file as _skip
+
         item_skip, unsup_ext = _skip(file)
         if item_skip:
             if unsup_ext:
@@ -468,7 +469,11 @@ async def test_selected_files_fetch_failure_isolation(selected_files_mocks):
 
     indexed, skipped, _unsupported, errors = await _run_selected(
         selected_files_mocks,
-        [("/first.txt", "first.txt"), ("/mid.txt", "mid.txt"), ("/third.txt", "third.txt")],
+        [
+            ("/first.txt", "first.txt"),
+            ("/mid.txt", "mid.txt"),
+            ("/third.txt", "third.txt"),
+        ],
     )
 
     assert indexed == 2
@@ -526,8 +531,18 @@ async def test_delta_sync_deletions_call_remove_document(monkeypatch):
     import app.tasks.connector_indexers.dropbox_indexer as _mod
 
     entries = [
-        {".tag": "deleted", "name": "gone.txt", "path_lower": "/gone.txt", "id": "id:del1"},
-        {".tag": "deleted", "name": "also_gone.pdf", "path_lower": "/also_gone.pdf", "id": "id:del2"},
+        {
+            ".tag": "deleted",
+            "name": "gone.txt",
+            "path_lower": "/gone.txt",
+            "id": "id:del1",
+        },
+        {
+            ".tag": "deleted",
+            "name": "also_gone.pdf",
+            "path_lower": "/also_gone.pdf",
+            "id": "id:del2",
+        },
     ]
 
     mock_client = MagicMock()
@@ -544,7 +559,7 @@ async def test_delta_sync_deletions_call_remove_document(monkeypatch):
     mock_task_logger = MagicMock()
     mock_task_logger.log_task_progress = AsyncMock()
 
-    indexed, skipped, unsupported, cursor = await _index_with_delta_sync(
+    _indexed, _skipped, _unsupported, cursor = await _index_with_delta_sync(
         mock_client,
         AsyncMock(),
         _CONNECTOR_ID,
@@ -573,7 +588,9 @@ async def test_delta_sync_upserts_filtered_and_downloaded(monkeypatch):
     mock_client = MagicMock()
     mock_client.get_changes = AsyncMock(return_value=(entries, "cursor-v2", None))
 
-    monkeypatch.setattr(_mod, "_should_skip_file", AsyncMock(return_value=(False, None)))
+    monkeypatch.setattr(
+        _mod, "_should_skip_file", AsyncMock(return_value=(False, None))
+    )
 
     download_mock = AsyncMock(return_value=(2, 0))
     monkeypatch.setattr(_mod, "_download_and_index", download_mock)
@@ -581,7 +598,7 @@ async def test_delta_sync_upserts_filtered_and_downloaded(monkeypatch):
     mock_task_logger = MagicMock()
     mock_task_logger.log_task_progress = AsyncMock()
 
-    indexed, skipped, unsupported, cursor = await _index_with_delta_sync(
+    indexed, skipped, _unsupported, cursor = await _index_with_delta_sync(
         mock_client,
         AsyncMock(),
         _CONNECTOR_ID,
@@ -608,8 +625,18 @@ async def test_delta_sync_mix_deletions_and_upserts(monkeypatch):
     import app.tasks.connector_indexers.dropbox_indexer as _mod
 
     entries = [
-        {".tag": "deleted", "name": "removed.txt", "path_lower": "/removed.txt", "id": "id:del1"},
-        {".tag": "deleted", "name": "trashed.pdf", "path_lower": "/trashed.pdf", "id": "id:del2"},
+        {
+            ".tag": "deleted",
+            "name": "removed.txt",
+            "path_lower": "/removed.txt",
+            "id": "id:del1",
+        },
+        {
+            ".tag": "deleted",
+            "name": "trashed.pdf",
+            "path_lower": "/trashed.pdf",
+            "id": "id:del2",
+        },
         _make_file_dict("mod1", "updated.txt"),
         _make_file_dict("new1", "brandnew.docx"),
     ]
@@ -623,7 +650,9 @@ async def test_delta_sync_mix_deletions_and_upserts(monkeypatch):
         remove_calls.append(file_id)
 
     monkeypatch.setattr(_mod, "_remove_document", _fake_remove)
-    monkeypatch.setattr(_mod, "_should_skip_file", AsyncMock(return_value=(False, None)))
+    monkeypatch.setattr(
+        _mod, "_should_skip_file", AsyncMock(return_value=(False, None))
+    )
 
     download_mock = AsyncMock(return_value=(2, 0))
     monkeypatch.setattr(_mod, "_download_and_index", download_mock)
@@ -631,7 +660,7 @@ async def test_delta_sync_mix_deletions_and_upserts(monkeypatch):
     mock_task_logger = MagicMock()
     mock_task_logger.log_task_progress = AsyncMock()
 
-    indexed, skipped, unsupported, cursor = await _index_with_delta_sync(
+    indexed, skipped, _unsupported, cursor = await _index_with_delta_sync(
         mock_client,
         AsyncMock(),
         _CONNECTOR_ID,
@@ -665,7 +694,7 @@ async def test_delta_sync_returns_new_cursor(monkeypatch):
     mock_task_logger = MagicMock()
     mock_task_logger.log_task_progress = AsyncMock()
 
-    indexed, skipped, unsupported, cursor = await _index_with_delta_sync(
+    indexed, skipped, _unsupported, cursor = await _index_with_delta_sync(
         mock_client,
         AsyncMock(),
         _CONNECTOR_ID,
@@ -723,9 +752,7 @@ def orchestrator_mocks(monkeypatch):
 
     mock_client = MagicMock()
     mock_client.get_latest_cursor = AsyncMock(return_value=("latest-cursor-abc", None))
-    monkeypatch.setattr(
-        _mod, "DropboxClient", MagicMock(return_value=mock_client)
-    )
+    monkeypatch.setattr(_mod, "DropboxClient", MagicMock(return_value=mock_client))
 
     return {
         "connector": mock_connector,
@@ -751,7 +778,7 @@ async def test_orchestrator_uses_delta_sync_when_cursor_and_last_indexed(
     mock_session = AsyncMock()
     mock_session.commit = AsyncMock()
 
-    indexed, skipped, error, _unsupported = await index_dropbox_files(
+    _indexed, _skipped, error, _unsupported = await index_dropbox_files(
         mock_session,
         _CONNECTOR_ID,
         _SEARCH_SPACE_ID,
@@ -779,7 +806,7 @@ async def test_orchestrator_falls_back_to_full_scan_without_cursor(
     mock_session = AsyncMock()
     mock_session.commit = AsyncMock()
 
-    indexed, skipped, error, _unsupported = await index_dropbox_files(
+    _indexed, _skipped, error, _unsupported = await index_dropbox_files(
         mock_session,
         _CONNECTOR_ID,
         _SEARCH_SPACE_ID,
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py b/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
index 7fa92ce12..0ae096361 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_google_drive_parallel.py
@@ -366,7 +366,7 @@ async def test_full_scan_three_phase_counts(full_scan_mocks, monkeypatch):
     full_scan_mocks["download_mock"].return_value = (mock_docs, 0)
     full_scan_mocks["batch_mock"].return_value = ([], 2, 0)
 
-    indexed, skipped, unsupported = await _run_full_scan(full_scan_mocks)
+    indexed, skipped, _unsupported = await _run_full_scan(full_scan_mocks)
 
     assert indexed == 3  # 1 renamed + 2 from batch
     assert skipped == 1  # 1 unchanged
@@ -497,7 +497,7 @@ async def test_delta_sync_removals_serial_rest_parallel(monkeypatch):
     mock_task_logger = MagicMock()
     mock_task_logger.log_task_progress = AsyncMock()
 
-    indexed, skipped, unsupported = await _index_with_delta_sync(
+    indexed, skipped, _unsupported = await _index_with_delta_sync(
         MagicMock(),
         mock_session,
         MagicMock(),
@@ -589,7 +589,7 @@ async def test_selected_files_single_file_indexed(selected_files_mocks):
     )
     selected_files_mocks["download_and_index_mock"].return_value = (1, 0)
 
-    indexed, skipped, unsup, errors = await _run_selected(
+    indexed, skipped, _unsup, errors = await _run_selected(
         selected_files_mocks,
         [("f1", "report.pdf")],
     )
@@ -613,7 +613,7 @@ async def test_selected_files_fetch_failure_isolation(selected_files_mocks):
     )
     selected_files_mocks["download_and_index_mock"].return_value = (2, 0)
 
-    indexed, skipped, unsup, errors = await _run_selected(
+    indexed, skipped, _unsup, errors = await _run_selected(
         selected_files_mocks,
         [("f1", "first.txt"), ("f2", "mid.txt"), ("f3", "third.txt")],
     )
@@ -647,7 +647,7 @@ async def test_selected_files_skip_rename_counting(selected_files_mocks):
 
     selected_files_mocks["download_and_index_mock"].return_value = (2, 0)
 
-    indexed, skipped, unsup, errors = await _run_selected(
+    indexed, skipped, _unsup, errors = await _run_selected(
         selected_files_mocks,
         [
             ("s1", "unchanged.txt"),
diff --git a/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py b/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
index 58737b20b..573ee43d8 100644
--- a/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
+++ b/surfsense_backend/tests/unit/connector_indexers/test_page_limits.py
@@ -219,7 +219,9 @@ async def test_gdrive_files_exceeding_quota_rejected(gdrive_selected_mocks):
         None,
     )
 
-    indexed, _skipped, _unsup, errors = await _run_gdrive_selected(m, [("big", "huge.pdf")])
+    indexed, _skipped, _unsup, errors = await _run_gdrive_selected(
+        m, [("big", "huge.pdf")]
+    )
 
     assert indexed == 0
     assert len(errors) == 1
@@ -552,7 +554,9 @@ async def test_onedrive_over_quota_rejected(onedrive_selected_mocks):
         None,
     )
 
-    indexed, _skipped, _unsup, errors = await _run_onedrive_selected(m, [("big", "huge.pdf")])
+    indexed, _skipped, _unsup, errors = await _run_onedrive_selected(
+        m, [("big", "huge.pdf")]
+    )
 
     assert indexed == 0
     assert len(errors) == 1
diff --git a/surfsense_backend/tests/unit/connectors/test_dropbox_client.py b/surfsense_backend/tests/unit/connectors/test_dropbox_client.py
index efacbcf72..31cafe550 100644
--- a/surfsense_backend/tests/unit/connectors/test_dropbox_client.py
+++ b/surfsense_backend/tests/unit/connectors/test_dropbox_client.py
@@ -19,6 +19,7 @@ def _make_client() -> DropboxClient:
 
 # ---------- C1: get_latest_cursor ----------
 
+
 async def test_get_latest_cursor_returns_cursor_string(monkeypatch):
     client = _make_client()
 
@@ -34,12 +35,17 @@ async def test_get_latest_cursor_returns_cursor_string(monkeypatch):
     assert error is None
     client._request.assert_called_once_with(
         "/2/files/list_folder/get_latest_cursor",
-        {"path": "/my-folder", "recursive": False, "include_non_downloadable_files": True},
+        {
+            "path": "/my-folder",
+            "recursive": False,
+            "include_non_downloadable_files": True,
+        },
     )
 
 
 # ---------- C2: get_changes returns entries and new cursor ----------
 
+
 async def test_get_changes_returns_entries_and_cursor(monkeypatch):
     client = _make_client()
 
@@ -66,6 +72,7 @@ async def test_get_changes_returns_entries_and_cursor(monkeypatch):
 
 # ---------- C3: get_changes handles pagination ----------
 
+
 async def test_get_changes_handles_pagination(monkeypatch):
     client = _make_client()
 
@@ -98,6 +105,7 @@ async def test_get_changes_handles_pagination(monkeypatch):
 
 # ---------- C4: get_changes raises on 401 ----------
 
+
 async def test_get_changes_returns_error_on_401(monkeypatch):
     client = _make_client()
 
diff --git a/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py b/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py
index 74277d47c..b4715e083 100644
--- a/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py
+++ b/surfsense_backend/tests/unit/connectors/test_dropbox_file_types.py
@@ -41,15 +41,40 @@ def test_non_downloadable_item_is_skipped():
 @pytest.mark.parametrize(
     "filename",
     [
-        "archive.zip", "backup.tar", "data.gz", "stuff.rar", "pack.7z",
-        "program.exe", "lib.dll", "module.so", "image.dmg", "disk.iso",
-        "movie.mov", "clip.avi", "video.mkv", "film.wmv", "stream.flv",
+        "archive.zip",
+        "backup.tar",
+        "data.gz",
+        "stuff.rar",
+        "pack.7z",
+        "program.exe",
+        "lib.dll",
+        "module.so",
+        "image.dmg",
+        "disk.iso",
+        "movie.mov",
+        "clip.avi",
+        "video.mkv",
+        "film.wmv",
+        "stream.flv",
         "favicon.ico",
-        "raw.cr2", "photo.nef", "image.arw", "pic.dng",
-        "design.psd", "vector.ai", "mockup.sketch", "proto.fig",
-        "font.ttf", "font.otf", "font.woff", "font.woff2",
-        "model.stl", "scene.fbx", "mesh.blend",
-        "local.db", "data.sqlite", "access.mdb",
+        "raw.cr2",
+        "photo.nef",
+        "image.arw",
+        "pic.dng",
+        "design.psd",
+        "vector.ai",
+        "mockup.sketch",
+        "proto.fig",
+        "font.ttf",
+        "font.otf",
+        "font.woff",
+        "font.woff2",
+        "model.stl",
+        "scene.fbx",
+        "mesh.blend",
+        "local.db",
+        "data.sqlite",
+        "access.mdb",
     ],
 )
 def test_non_parseable_extensions_are_skipped(filename, mocker):
@@ -63,9 +88,16 @@ def test_non_parseable_extensions_are_skipped(filename, mocker):
 @pytest.mark.parametrize(
     "filename",
     [
-        "report.pdf", "document.docx", "sheet.xlsx", "slides.pptx",
-        "readme.txt", "data.csv", "page.html", "notes.md",
-        "config.json", "feed.xml",
+        "report.pdf",
+        "document.docx",
+        "sheet.xlsx",
+        "slides.pptx",
+        "readme.txt",
+        "data.csv",
+        "page.html",
+        "notes.md",
+        "config.json",
+        "feed.xml",
     ],
 )
 def test_parseable_documents_are_not_skipped(filename, mocker):
@@ -92,30 +124,33 @@ def test_universal_images_are_not_skipped(filename, mocker):
         assert ext is None
 
 
-@pytest.mark.parametrize("filename,service,expected_skip", [
-    ("old.doc", "DOCLING", True),
-    ("old.doc", "LLAMACLOUD", False),
-    ("old.doc", "UNSTRUCTURED", False),
-    ("legacy.xls", "DOCLING", True),
-    ("legacy.xls", "LLAMACLOUD", False),
-    ("legacy.xls", "UNSTRUCTURED", False),
-    ("deck.ppt", "DOCLING", True),
-    ("deck.ppt", "LLAMACLOUD", False),
-    ("deck.ppt", "UNSTRUCTURED", False),
-    ("icon.svg", "DOCLING", True),
-    ("icon.svg", "LLAMACLOUD", False),
-    ("anim.gif", "DOCLING", True),
-    ("anim.gif", "LLAMACLOUD", False),
-    ("photo.webp", "DOCLING", False),
-    ("photo.webp", "LLAMACLOUD", False),
-    ("photo.webp", "UNSTRUCTURED", True),
-    ("live.heic", "DOCLING", True),
-    ("live.heic", "UNSTRUCTURED", False),
-    ("macro.docm", "DOCLING", True),
-    ("macro.docm", "LLAMACLOUD", False),
-    ("mail.eml", "DOCLING", True),
-    ("mail.eml", "UNSTRUCTURED", False),
-])
+@pytest.mark.parametrize(
+    "filename,service,expected_skip",
+    [
+        ("old.doc", "DOCLING", True),
+        ("old.doc", "LLAMACLOUD", False),
+        ("old.doc", "UNSTRUCTURED", False),
+        ("legacy.xls", "DOCLING", True),
+        ("legacy.xls", "LLAMACLOUD", False),
+        ("legacy.xls", "UNSTRUCTURED", False),
+        ("deck.ppt", "DOCLING", True),
+        ("deck.ppt", "LLAMACLOUD", False),
+        ("deck.ppt", "UNSTRUCTURED", False),
+        ("icon.svg", "DOCLING", True),
+        ("icon.svg", "LLAMACLOUD", False),
+        ("anim.gif", "DOCLING", True),
+        ("anim.gif", "LLAMACLOUD", False),
+        ("photo.webp", "DOCLING", False),
+        ("photo.webp", "LLAMACLOUD", False),
+        ("photo.webp", "UNSTRUCTURED", True),
+        ("live.heic", "DOCLING", True),
+        ("live.heic", "UNSTRUCTURED", False),
+        ("macro.docm", "DOCLING", True),
+        ("macro.docm", "LLAMACLOUD", False),
+        ("mail.eml", "DOCLING", True),
+        ("mail.eml", "UNSTRUCTURED", False),
+    ],
+)
 def test_parser_specific_extensions(filename, service, expected_skip, mocker):
     mocker.patch("app.config.config.ETL_SERVICE", service)
     item = {".tag": "file", "name": filename}
diff --git a/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py b/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py
index 5cd43736b..ab602468d 100644
--- a/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py
+++ b/surfsense_backend/tests/unit/connectors/test_google_drive_file_types.py
@@ -7,21 +7,37 @@ from app.connectors.google_drive.file_types import should_skip_by_extension
 pytestmark = pytest.mark.unit
 
 
-@pytest.mark.parametrize("filename", [
-    "malware.exe", "archive.zip", "video.mov", "font.woff2", "model.blend",
-])
+@pytest.mark.parametrize(
+    "filename",
+    [
+        "malware.exe",
+        "archive.zip",
+        "video.mov",
+        "font.woff2",
+        "model.blend",
+    ],
+)
 def test_unsupported_extensions_are_skipped_regardless_of_service(filename, mocker):
     """Truly unsupported files are skipped no matter which ETL service is configured."""
     for service in ("DOCLING", "LLAMACLOUD", "UNSTRUCTURED"):
         mocker.patch("app.config.config.ETL_SERVICE", service)
-        skip, ext = should_skip_by_extension(filename)
+        skip, _ext = should_skip_by_extension(filename)
         assert skip is True
 
 
-@pytest.mark.parametrize("filename", [
-    "report.pdf", "doc.docx", "sheet.xlsx", "slides.pptx",
-    "readme.txt", "data.csv", "photo.png", "notes.md",
-])
+@pytest.mark.parametrize(
+    "filename",
+    [
+        "report.pdf",
+        "doc.docx",
+        "sheet.xlsx",
+        "slides.pptx",
+        "readme.txt",
+        "data.csv",
+        "photo.png",
+        "notes.md",
+    ],
+)
 def test_universal_extensions_are_not_skipped(filename, mocker):
     """Files supported by all parsers (or handled by plaintext/direct_convert) are never skipped."""
     for service in ("DOCLING", "LLAMACLOUD", "UNSTRUCTURED"):
@@ -31,16 +47,19 @@ def test_universal_extensions_are_not_skipped(filename, mocker):
         assert ext is None
 
 
-@pytest.mark.parametrize("filename,service,expected_skip", [
-    ("macro.docm", "DOCLING", True),
-    ("macro.docm", "LLAMACLOUD", False),
-    ("mail.eml", "DOCLING", True),
-    ("mail.eml", "UNSTRUCTURED", False),
-    ("photo.gif", "DOCLING", True),
-    ("photo.gif", "LLAMACLOUD", False),
-    ("photo.heic", "UNSTRUCTURED", False),
-    ("photo.heic", "DOCLING", True),
-])
+@pytest.mark.parametrize(
+    "filename,service,expected_skip",
+    [
+        ("macro.docm", "DOCLING", True),
+        ("macro.docm", "LLAMACLOUD", False),
+        ("mail.eml", "DOCLING", True),
+        ("mail.eml", "UNSTRUCTURED", False),
+        ("photo.gif", "DOCLING", True),
+        ("photo.gif", "LLAMACLOUD", False),
+        ("photo.heic", "UNSTRUCTURED", False),
+        ("photo.heic", "DOCLING", True),
+    ],
+)
 def test_parser_specific_extensions(filename, service, expected_skip, mocker):
     mocker.patch("app.config.config.ETL_SERVICE", service)
     skip, ext = should_skip_by_extension(filename)
diff --git a/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py b/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py
index 61212b340..1d9124c47 100644
--- a/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py
+++ b/surfsense_backend/tests/unit/connectors/test_onedrive_file_types.py
@@ -45,9 +45,16 @@ def test_onenote_is_skipped():
 # ---------------------------------------------------------------------------
 
 
-@pytest.mark.parametrize("filename", [
-    "malware.exe", "archive.zip", "video.mov", "font.woff2", "model.blend",
-])
+@pytest.mark.parametrize(
+    "filename",
+    [
+        "malware.exe",
+        "archive.zip",
+        "video.mov",
+        "font.woff2",
+        "model.blend",
+    ],
+)
 def test_unsupported_extensions_are_skipped(filename, mocker):
     mocker.patch("app.config.config.ETL_SERVICE", "DOCLING")
     item = {"name": filename, "file": {"mimeType": "application/octet-stream"}}
@@ -56,10 +63,19 @@ def test_unsupported_extensions_are_skipped(filename, mocker):
     assert ext is not None
 
 
-@pytest.mark.parametrize("filename", [
-    "report.pdf", "doc.docx", "sheet.xlsx", "slides.pptx",
-    "readme.txt", "data.csv", "photo.png", "notes.md",
-])
+@pytest.mark.parametrize(
+    "filename",
+    [
+        "report.pdf",
+        "doc.docx",
+        "sheet.xlsx",
+        "slides.pptx",
+        "readme.txt",
+        "data.csv",
+        "photo.png",
+        "notes.md",
+    ],
+)
 def test_universal_files_are_not_skipped(filename, mocker):
     for service in ("DOCLING", "LLAMACLOUD", "UNSTRUCTURED"):
         mocker.patch("app.config.config.ETL_SERVICE", service)
@@ -69,14 +85,17 @@ def test_universal_files_are_not_skipped(filename, mocker):
         assert ext is None
 
 
-@pytest.mark.parametrize("filename,service,expected_skip", [
-    ("macro.docm", "DOCLING", True),
-    ("macro.docm", "LLAMACLOUD", False),
-    ("mail.eml", "DOCLING", True),
-    ("mail.eml", "UNSTRUCTURED", False),
-    ("photo.heic", "UNSTRUCTURED", False),
-    ("photo.heic", "DOCLING", True),
-])
+@pytest.mark.parametrize(
+    "filename,service,expected_skip",
+    [
+        ("macro.docm", "DOCLING", True),
+        ("macro.docm", "LLAMACLOUD", False),
+        ("mail.eml", "DOCLING", True),
+        ("mail.eml", "UNSTRUCTURED", False),
+        ("photo.heic", "UNSTRUCTURED", False),
+        ("photo.heic", "DOCLING", True),
+    ],
+)
 def test_parser_specific_extensions(filename, service, expected_skip, mocker):
     mocker.patch("app.config.config.ETL_SERVICE", service)
     item = {"name": filename, "file": {"mimeType": "application/octet-stream"}}
diff --git a/surfsense_backend/tests/unit/etl_pipeline/conftest.py b/surfsense_backend/tests/unit/etl_pipeline/conftest.py
index 6059caa01..082ab9771 100644
--- a/surfsense_backend/tests/unit/etl_pipeline/conftest.py
+++ b/surfsense_backend/tests/unit/etl_pipeline/conftest.py
@@ -24,6 +24,4 @@ def _stub_package(dotted: str, fs_dir: Path) -> None:
 
 _stub_package("app", _BACKEND / "app")
 _stub_package("app.etl_pipeline", _BACKEND / "app" / "etl_pipeline")
-_stub_package(
-    "app.etl_pipeline.parsers", _BACKEND / "app" / "etl_pipeline" / "parsers"
-)
+_stub_package("app.etl_pipeline.parsers", _BACKEND / "app" / "etl_pipeline" / "parsers")
diff --git a/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py b/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py
index e90847e3a..769b1dc53 100644
--- a/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py
+++ b/surfsense_backend/tests/unit/etl_pipeline/test_etl_pipeline_service.py
@@ -144,7 +144,7 @@ async def test_extract_mp3_returns_transcription(tmp_path, mocker):
 
 
 # ---------------------------------------------------------------------------
-# Slice 7 – DOCLING document parsing
+# Slice 7 - DOCLING document parsing
 # ---------------------------------------------------------------------------
 
 
@@ -172,7 +172,7 @@ async def test_extract_pdf_with_docling(tmp_path, mocker):
 
 
 # ---------------------------------------------------------------------------
-# Slice 8 – UNSTRUCTURED document parsing
+# Slice 8 - UNSTRUCTURED document parsing
 # ---------------------------------------------------------------------------
 
 
@@ -208,7 +208,7 @@ async def test_extract_pdf_with_unstructured(tmp_path, mocker):
 
 
 # ---------------------------------------------------------------------------
-# Slice 9 – LLAMACLOUD document parsing
+# Slice 9 - LLAMACLOUD document parsing
 # ---------------------------------------------------------------------------
 
 
@@ -241,9 +241,7 @@ async def test_extract_pdf_with_llamacloud(tmp_path, mocker):
     )
 
     result = await EtlPipelineService().extract(
-        EtlRequest(
-            file_path=str(pdf_file), filename="report.pdf", estimated_pages=5
-        )
+        EtlRequest(file_path=str(pdf_file), filename="report.pdf", estimated_pages=5)
     )
 
     assert result.markdown_content == "# LlamaCloud parsed"
@@ -252,7 +250,7 @@ async def test_extract_pdf_with_llamacloud(tmp_path, mocker):
 
 
 # ---------------------------------------------------------------------------
-# Slice 10 – unknown extension falls through to document ETL
+# Slice 10 - unknown extension falls through to document ETL
 # ---------------------------------------------------------------------------
 
 
@@ -279,18 +277,18 @@ async def test_unknown_extension_uses_document_etl(tmp_path, mocker):
 
 
 # ---------------------------------------------------------------------------
-# Slice 11 – EtlRequest validation
+# Slice 11 - EtlRequest validation
 # ---------------------------------------------------------------------------
 
 
 def test_etl_request_requires_filename():
     """EtlRequest rejects missing filename."""
-    with pytest.raises(Exception):
+    with pytest.raises(ValueError, match="filename must not be empty"):
         EtlRequest(file_path="/tmp/some.txt", filename="")
 
 
 # ---------------------------------------------------------------------------
-# Slice 12 – unknown ETL_SERVICE raises EtlServiceUnavailableError
+# Slice 12 - unknown ETL_SERVICE raises EtlServiceUnavailableError
 # ---------------------------------------------------------------------------
 
 
@@ -310,7 +308,7 @@ async def test_unknown_etl_service_raises(tmp_path, mocker):
 
 
 # ---------------------------------------------------------------------------
-# Slice 13 – unsupported file types are rejected before reaching any parser
+# Slice 13 - unsupported file types are rejected before reaching any parser
 # ---------------------------------------------------------------------------
 
 
@@ -321,10 +319,19 @@ def test_unknown_extension_classified_as_unsupported():
     assert classify_file("random.xyz") == FileCategory.UNSUPPORTED
 
 
-@pytest.mark.parametrize("filename", [
-    "malware.exe", "archive.zip", "video.mov", "font.woff2",
-    "model.blend", "data.parquet", "package.deb", "firmware.bin",
-])
+@pytest.mark.parametrize(
+    "filename",
+    [
+        "malware.exe",
+        "archive.zip",
+        "video.mov",
+        "font.woff2",
+        "model.blend",
+        "data.parquet",
+        "package.deb",
+        "firmware.bin",
+    ],
+)
 def test_unsupported_extensions_classified_correctly(filename):
     """Extensions not in any allowlist are classified as UNSUPPORTED."""
     from app.etl_pipeline.file_classifier import FileCategory, classify_file
@@ -332,18 +339,21 @@ def test_unsupported_extensions_classified_correctly(filename):
     assert classify_file(filename) == FileCategory.UNSUPPORTED
 
 
-@pytest.mark.parametrize("filename,expected", [
-    ("report.pdf", "document"),
-    ("doc.docx", "document"),
-    ("slides.pptx", "document"),
-    ("sheet.xlsx", "document"),
-    ("photo.png", "document"),
-    ("photo.jpg", "document"),
-    ("book.epub", "document"),
-    ("letter.odt", "document"),
-    ("readme.md", "plaintext"),
-    ("data.csv", "direct_convert"),
-])
+@pytest.mark.parametrize(
+    "filename,expected",
+    [
+        ("report.pdf", "document"),
+        ("doc.docx", "document"),
+        ("slides.pptx", "document"),
+        ("sheet.xlsx", "document"),
+        ("photo.png", "document"),
+        ("photo.jpg", "document"),
+        ("book.epub", "document"),
+        ("letter.odt", "document"),
+        ("readme.md", "plaintext"),
+        ("data.csv", "direct_convert"),
+    ],
+)
 def test_parseable_extensions_classified_correctly(filename, expected):
     """Parseable files are classified into their correct category."""
     from app.etl_pipeline.file_classifier import FileCategory, classify_file
@@ -380,31 +390,34 @@ async def test_extract_zip_raises_unsupported_error(tmp_path):
 
 
 # ---------------------------------------------------------------------------
-# Slice 14 – should_skip_for_service (per-parser document filtering)
+# Slice 14 - should_skip_for_service (per-parser document filtering)
 # ---------------------------------------------------------------------------
 
 
-@pytest.mark.parametrize("filename,etl_service,expected_skip", [
-    ("file.eml", "DOCLING", True),
-    ("file.eml", "UNSTRUCTURED", False),
-    ("file.docm", "LLAMACLOUD", False),
-    ("file.docm", "DOCLING", True),
-    ("file.txt", "DOCLING", False),
-    ("file.csv", "LLAMACLOUD", False),
-    ("file.mp3", "UNSTRUCTURED", False),
-    ("file.exe", "LLAMACLOUD", True),
-    ("file.pdf", "DOCLING", False),
-    ("file.webp", "DOCLING", False),
-    ("file.webp", "UNSTRUCTURED", True),
-    ("file.gif", "LLAMACLOUD", False),
-    ("file.gif", "DOCLING", True),
-    ("file.heic", "UNSTRUCTURED", False),
-    ("file.heic", "DOCLING", True),
-    ("file.svg", "LLAMACLOUD", False),
-    ("file.svg", "DOCLING", True),
-    ("file.p7s", "UNSTRUCTURED", False),
-    ("file.p7s", "LLAMACLOUD", True),
-])
+@pytest.mark.parametrize(
+    "filename,etl_service,expected_skip",
+    [
+        ("file.eml", "DOCLING", True),
+        ("file.eml", "UNSTRUCTURED", False),
+        ("file.docm", "LLAMACLOUD", False),
+        ("file.docm", "DOCLING", True),
+        ("file.txt", "DOCLING", False),
+        ("file.csv", "LLAMACLOUD", False),
+        ("file.mp3", "UNSTRUCTURED", False),
+        ("file.exe", "LLAMACLOUD", True),
+        ("file.pdf", "DOCLING", False),
+        ("file.webp", "DOCLING", False),
+        ("file.webp", "UNSTRUCTURED", True),
+        ("file.gif", "LLAMACLOUD", False),
+        ("file.gif", "DOCLING", True),
+        ("file.heic", "UNSTRUCTURED", False),
+        ("file.heic", "DOCLING", True),
+        ("file.svg", "LLAMACLOUD", False),
+        ("file.svg", "DOCLING", True),
+        ("file.p7s", "UNSTRUCTURED", False),
+        ("file.p7s", "LLAMACLOUD", True),
+    ],
+)
 def test_should_skip_for_service(filename, etl_service, expected_skip):
     from app.etl_pipeline.file_classifier import should_skip_for_service
 
@@ -414,7 +427,7 @@ def test_should_skip_for_service(filename, etl_service, expected_skip):
 
 
 # ---------------------------------------------------------------------------
-# Slice 14b – ETL pipeline rejects per-parser incompatible documents
+# Slice 14b - ETL pipeline rejects per-parser incompatible documents
 # ---------------------------------------------------------------------------
 
 
diff --git a/surfsense_backend/tests/unit/services/test_docling_image_support.py b/surfsense_backend/tests/unit/services/test_docling_image_support.py
index 430adbaf2..11ffc0ed1 100644
--- a/surfsense_backend/tests/unit/services/test_docling_image_support.py
+++ b/surfsense_backend/tests/unit/services/test_docling_image_support.py
@@ -30,26 +30,29 @@ def test_docling_service_does_not_restrict_allowed_formats():
 
     fake_pdf_format_option_cls = MagicMock()
 
-    with patch.dict("sys.modules", {
-        "docling": MagicMock(),
-        "docling.backend": MagicMock(),
-        "docling.backend.pypdfium2_backend": MagicMock(
-            PyPdfiumDocumentBackend=mock_backend
-        ),
-        "docling.datamodel": MagicMock(),
-        "docling.datamodel.base_models": MagicMock(
-            InputFormat=_FakeInputFormat
-        ),
-        "docling.datamodel.pipeline_options": MagicMock(
-            PdfPipelineOptions=fake_pipeline_options_cls
-        ),
-        "docling.document_converter": MagicMock(
-            DocumentConverter=mock_converter_cls,
-            PdfFormatOption=fake_pdf_format_option_cls,
-        ),
-    }):
-        import app.services.docling_service as mod
+    with patch.dict(
+        "sys.modules",
+        {
+            "docling": MagicMock(),
+            "docling.backend": MagicMock(),
+            "docling.backend.pypdfium2_backend": MagicMock(
+                PyPdfiumDocumentBackend=mock_backend
+            ),
+            "docling.datamodel": MagicMock(),
+            "docling.datamodel.base_models": MagicMock(InputFormat=_FakeInputFormat),
+            "docling.datamodel.pipeline_options": MagicMock(
+                PdfPipelineOptions=fake_pipeline_options_cls
+            ),
+            "docling.document_converter": MagicMock(
+                DocumentConverter=mock_converter_cls,
+                PdfFormatOption=fake_pdf_format_option_cls,
+            ),
+        },
+    ):
         from importlib import reload
+
+        import app.services.docling_service as mod
+
         reload(mod)
 
         mod.DoclingService()
diff --git a/surfsense_backend/tests/unit/utils/test_file_extensions.py b/surfsense_backend/tests/unit/utils/test_file_extensions.py
index acd8945ce..c33b39f05 100644
--- a/surfsense_backend/tests/unit/utils/test_file_extensions.py
+++ b/surfsense_backend/tests/unit/utils/test_file_extensions.py
@@ -17,36 +17,74 @@ def test_exe_is_not_supported_document():
     assert is_supported_document_extension("malware.exe") is False
 
 
-@pytest.mark.parametrize("filename", [
-    "report.pdf", "doc.docx", "old.doc",
-    "sheet.xlsx", "legacy.xls",
-    "slides.pptx", "deck.ppt",
-    "macro.docm", "macro.xlsm", "macro.pptm",
-    "photo.png", "photo.jpg", "photo.jpeg", "scan.bmp", "scan.tiff", "scan.tif",
-    "photo.webp", "anim.gif", "iphone.heic",
-    "manual.rtf", "book.epub",
-    "letter.odt", "data.ods", "presentation.odp",
-    "inbox.eml", "outlook.msg",
-    "korean.hwpx", "korean.hwp",
-    "template.dot", "template.dotm",
-    "template.pot", "template.potx",
-    "binary.xlsb", "workspace.xlw",
-    "vector.svg", "signature.p7s",
-])
+@pytest.mark.parametrize(
+    "filename",
+    [
+        "report.pdf",
+        "doc.docx",
+        "old.doc",
+        "sheet.xlsx",
+        "legacy.xls",
+        "slides.pptx",
+        "deck.ppt",
+        "macro.docm",
+        "macro.xlsm",
+        "macro.pptm",
+        "photo.png",
+        "photo.jpg",
+        "photo.jpeg",
+        "scan.bmp",
+        "scan.tiff",
+        "scan.tif",
+        "photo.webp",
+        "anim.gif",
+        "iphone.heic",
+        "manual.rtf",
+        "book.epub",
+        "letter.odt",
+        "data.ods",
+        "presentation.odp",
+        "inbox.eml",
+        "outlook.msg",
+        "korean.hwpx",
+        "korean.hwp",
+        "template.dot",
+        "template.dotm",
+        "template.pot",
+        "template.potx",
+        "binary.xlsb",
+        "workspace.xlw",
+        "vector.svg",
+        "signature.p7s",
+    ],
+)
 def test_document_extensions_are_supported(filename):
     from app.utils.file_extensions import is_supported_document_extension
 
-    assert is_supported_document_extension(filename) is True, f"{filename} should be supported"
+    assert is_supported_document_extension(filename) is True, (
+        f"{filename} should be supported"
+    )
 
 
-@pytest.mark.parametrize("filename", [
-    "malware.exe", "archive.zip", "video.mov", "font.woff2",
-    "model.blend", "random.xyz", "data.parquet", "package.deb",
-])
+@pytest.mark.parametrize(
+    "filename",
+    [
+        "malware.exe",
+        "archive.zip",
+        "video.mov",
+        "font.woff2",
+        "model.blend",
+        "random.xyz",
+        "data.parquet",
+        "package.deb",
+    ],
+)
 def test_non_document_extensions_are_not_supported(filename):
     from app.utils.file_extensions import is_supported_document_extension
 
-    assert is_supported_document_extension(filename) is False, f"{filename} should NOT be supported"
+    assert is_supported_document_extension(filename) is False, (
+        f"{filename} should NOT be supported"
+    )
 
 
 # ---------------------------------------------------------------------------
@@ -67,7 +105,7 @@ def test_union_equals_all_three_sets():
         | LLAMAPARSE_DOCUMENT_EXTENSIONS
         | UNSTRUCTURED_DOCUMENT_EXTENSIONS
     )
-    assert DOCUMENT_EXTENSIONS == expected
+    assert expected == DOCUMENT_EXTENSIONS
 
 
 def test_get_extensions_for_docling():
diff --git a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
index 1522e153f..957ae9dae 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
@@ -3,8 +3,8 @@
 import { useEffect, useState } from "react";
 import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
 import { Label } from "@/components/ui/label";
-import { Switch } from "@/components/ui/switch";
 import { Spinner } from "@/components/ui/spinner";
+import { Switch } from "@/components/ui/switch";
 
 export function DesktopContent() {
 	const [isElectron, setIsElectron] = useState(false);
@@ -66,11 +66,7 @@ export function DesktopContent() {
 								Show suggestions while typing in other applications.
 							</p>
 						</div>
-						<Switch
-							id="autocomplete-toggle"
-							checked={enabled}
-							onCheckedChange={handleToggle}
-						/>
+						<Switch id="autocomplete-toggle" checked={enabled} onCheckedChange={handleToggle} />
 					</div>
 				</CardContent>
 			</Card>
diff --git a/surfsense_web/app/desktop/permissions/page.tsx b/surfsense_web/app/desktop/permissions/page.tsx
index 6c08e35b5..37cfe826f 100644
--- a/surfsense_web/app/desktop/permissions/page.tsx
+++ b/surfsense_web/app/desktop/permissions/page.tsx
@@ -1,7 +1,7 @@
 "use client";
 
-import { useEffect, useState } from "react";
 import { useRouter } from "next/navigation";
+import { useEffect, useState } from "react";
 import { Logo } from "@/components/Logo";
 import { Button } from "@/components/ui/button";
 import { Spinner } from "@/components/ui/spinner";
@@ -17,7 +17,8 @@ const STEPS = [
 	{
 		id: "screen-recording",
 		title: "Screen Recording",
-		description: "Lets SurfSense capture your screen to understand context and provide smart writing suggestions.",
+		description:
+			"Lets SurfSense capture your screen to understand context and provide smart writing suggestions.",
 		action: "requestScreenRecording",
 		field: "screenRecording" as const,
 	},
@@ -79,7 +80,9 @@ export default function DesktopPermissionsPage() {
 
 		poll();
 		interval = setInterval(poll, 2000);
-		return () => { if (interval) clearInterval(interval); };
+		return () => {
+			if (interval) clearInterval(interval);
+		};
 	}, []);
 
 	if (!isElectron) {
@@ -98,7 +101,8 @@ export default function DesktopPermissionsPage() {
 		);
 	}
 
-	const allGranted = permissions.accessibility === "authorized" && permissions.screenRecording === "authorized";
+	const allGranted =
+		permissions.accessibility === "authorized" && permissions.screenRecording === "authorized";
 
 	const handleRequest = async (action: string) => {
 		if (action === "requestScreenRecording") {
@@ -175,7 +179,8 @@ export default function DesktopPermissionsPage() {
 											</p>
 										)}
 										<p className="text-xs text-muted-foreground">
-											If SurfSense doesn&apos;t appear in the list, click <strong>+</strong> and select it from Applications.
+											If SurfSense doesn&apos;t appear in the list, click <strong>+</strong> and
+											select it from Applications.
 										</p>
 									</div>
 								)}
diff --git a/surfsense_web/app/desktop/suggestion/layout.tsx b/surfsense_web/app/desktop/suggestion/layout.tsx
index 36b7e037b..fd8faf099 100644
--- a/surfsense_web/app/desktop/suggestion/layout.tsx
+++ b/surfsense_web/app/desktop/suggestion/layout.tsx
@@ -4,10 +4,6 @@ export const metadata = {
 	title: "SurfSense Suggestion",
 };
 
-export default function SuggestionLayout({
-	children,
-}: {
-	children: React.ReactNode;
-}) {
+export default function SuggestionLayout({ children }: { children: React.ReactNode }) {
 	return <div className="suggestion-body">{children}</div>;
 }
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index 03944867f..6ade64883 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -72,27 +72,23 @@ export default function SuggestionPage() {
 				return;
 			}
 
-			const backendUrl =
-				process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL || "http://localhost:8000";
+			const backendUrl = process.env.NEXT_PUBLIC_FASTAPI_BACKEND_URL || "http://localhost:8000";
 
 			try {
-				const response = await fetch(
-					`${backendUrl}/api/v1/autocomplete/vision/stream`,
-					{
-						method: "POST",
-						headers: {
-							Authorization: `Bearer ${token}`,
-							"Content-Type": "application/json",
-						},
-						body: JSON.stringify({
-							screenshot,
-							search_space_id: parseInt(searchSpaceId, 10),
-							app_name: appName || "",
-							window_title: windowTitle || "",
-						}),
-						signal: controller.signal,
+				const response = await fetch(`${backendUrl}/api/v1/autocomplete/vision/stream`, {
+					method: "POST",
+					headers: {
+						Authorization: `Bearer ${token}`,
+						"Content-Type": "application/json",
 					},
-				);
+					body: JSON.stringify({
+						screenshot,
+						search_space_id: parseInt(searchSpaceId, 10),
+						app_name: appName || "",
+						window_title: windowTitle || "",
+					}),
+					signal: controller.signal,
+				});
 
 				if (!response.ok) {
 					setError(friendlyError(response.status));
@@ -132,9 +128,7 @@ export default function SuggestionPage() {
 								} else if (parsed.type === "error") {
 									setError(friendlyError(parsed.errorText));
 								}
-							} catch {
-								continue;
-							}
+							} catch {}
 						}
 					}
 				}
@@ -145,7 +139,7 @@ export default function SuggestionPage() {
 				setIsLoading(false);
 			}
 		},
-		[],
+		[]
 	);
 
 	useEffect(() => {
@@ -207,10 +201,18 @@ export default function SuggestionPage() {
 		<div className="suggestion-tooltip">
 			<p className="suggestion-text">{suggestion}</p>
 			<div className="suggestion-actions">
-				<button className="suggestion-btn suggestion-btn-accept" onClick={handleAccept}>
+				<button
+					type="button"
+					className="suggestion-btn suggestion-btn-accept"
+					onClick={handleAccept}
+				>
 					Accept
 				</button>
-				<button className="suggestion-btn suggestion-btn-dismiss" onClick={handleDismiss}>
+				<button
+					type="button"
+					className="suggestion-btn suggestion-btn-dismiss"
+					onClick={handleDismiss}
+				>
 					Dismiss
 				</button>
 			</div>
diff --git a/surfsense_web/app/desktop/suggestion/suggestion.css b/surfsense_web/app/desktop/suggestion/suggestion.css
index 62f4d2ea7..ef578059c 100644
--- a/surfsense_web/app/desktop/suggestion/suggestion.css
+++ b/surfsense_web/app/desktop/suggestion/suggestion.css
@@ -1,121 +1,125 @@
 html:has(.suggestion-body),
 body:has(.suggestion-body) {
-  margin: 0 !important;
-  padding: 0 !important;
-  background: transparent !important;
-  overflow: hidden !important;
-  height: auto !important;
-  width: 100% !important;
+	margin: 0 !important;
+	padding: 0 !important;
+	background: transparent !important;
+	overflow: hidden !important;
+	height: auto !important;
+	width: 100% !important;
 }
 
 .suggestion-body {
-  margin: 0;
-  padding: 0;
-  background: transparent;
-  font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
-  -webkit-font-smoothing: antialiased;
-  user-select: none;
-  -webkit-app-region: no-drag;
+	margin: 0;
+	padding: 0;
+	background: transparent;
+	font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
+	-webkit-font-smoothing: antialiased;
+	user-select: none;
+	-webkit-app-region: no-drag;
 }
 
 .suggestion-tooltip {
-  background: #1e1e1e;
-  border: 1px solid #3c3c3c;
-  border-radius: 8px;
-  padding: 8px 12px;
-  margin: 4px;
-  max-width: 400px;
-  box-shadow: 0 4px 16px rgba(0, 0, 0, 0.5);
+	background: #1e1e1e;
+	border: 1px solid #3c3c3c;
+	border-radius: 8px;
+	padding: 8px 12px;
+	margin: 4px;
+	max-width: 400px;
+	box-shadow: 0 4px 16px rgba(0, 0, 0, 0.5);
 }
 
 .suggestion-text {
-  color: #d4d4d4;
-  font-size: 13px;
-  line-height: 1.45;
-  margin: 0 0 6px 0;
-  word-wrap: break-word;
-  white-space: pre-wrap;
+	color: #d4d4d4;
+	font-size: 13px;
+	line-height: 1.45;
+	margin: 0 0 6px 0;
+	word-wrap: break-word;
+	white-space: pre-wrap;
 }
 
 .suggestion-actions {
-  display: flex;
-  justify-content: flex-end;
-  gap: 4px;
-  border-top: 1px solid #2a2a2a;
-  padding-top: 6px;
+	display: flex;
+	justify-content: flex-end;
+	gap: 4px;
+	border-top: 1px solid #2a2a2a;
+	padding-top: 6px;
 }
 
 .suggestion-btn {
-  padding: 2px 8px;
-  border-radius: 3px;
-  border: 1px solid #3c3c3c;
-  font-family: inherit;
-  font-size: 10px;
-  font-weight: 500;
-  cursor: pointer;
-  line-height: 16px;
-  transition: background 0.15s, border-color 0.15s;
+	padding: 2px 8px;
+	border-radius: 3px;
+	border: 1px solid #3c3c3c;
+	font-family: inherit;
+	font-size: 10px;
+	font-weight: 500;
+	cursor: pointer;
+	line-height: 16px;
+	transition:
+		background 0.15s,
+		border-color 0.15s;
 }
 
 .suggestion-btn-accept {
-  background: #2563eb;
-  border-color: #3b82f6;
-  color: #fff;
+	background: #2563eb;
+	border-color: #3b82f6;
+	color: #fff;
 }
 
 .suggestion-btn-accept:hover {
-  background: #1d4ed8;
+	background: #1d4ed8;
 }
 
 .suggestion-btn-dismiss {
-  background: #2a2a2a;
-  color: #999;
+	background: #2a2a2a;
+	color: #999;
 }
 
 .suggestion-btn-dismiss:hover {
-  background: #333;
-  color: #ccc;
+	background: #333;
+	color: #ccc;
 }
 
 .suggestion-error {
-  border-color: #5c2626;
+	border-color: #5c2626;
 }
 
 .suggestion-error-text {
-  color: #f48771;
-  font-size: 12px;
+	color: #f48771;
+	font-size: 12px;
 }
 
 .suggestion-loading {
-  display: flex;
-  gap: 5px;
-  padding: 2px 0;
-  justify-content: center;
+	display: flex;
+	gap: 5px;
+	padding: 2px 0;
+	justify-content: center;
 }
 
 .suggestion-dot {
-  width: 4px;
-  height: 4px;
-  border-radius: 50%;
-  background: #666;
-  animation: suggestion-pulse 1.2s infinite ease-in-out;
+	width: 4px;
+	height: 4px;
+	border-radius: 50%;
+	background: #666;
+	animation: suggestion-pulse 1.2s infinite ease-in-out;
 }
 
 .suggestion-dot:nth-child(2) {
-  animation-delay: 0.15s;
+	animation-delay: 0.15s;
 }
 
 .suggestion-dot:nth-child(3) {
-  animation-delay: 0.3s;
+	animation-delay: 0.3s;
 }
 
 @keyframes suggestion-pulse {
-  0%, 80%, 100% {
-    opacity: 0.3;
-    transform: scale(0.8);
-  }
-  40% {
-    opacity: 1;
-    transform: scale(1.1);
-  }
+	0%,
+	80%,
+	100% {
+		opacity: 0.3;
+		transform: scale(0.8);
+	}
+	40% {
+		opacity: 1;
+		transform: scale(1.1);
+	}
 }
diff --git a/surfsense_web/components/assistant-ui/connector-popup/views/connector-accounts-list-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/views/connector-accounts-list-view.tsx
index 5e2b8452b..b4c049c5c 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/views/connector-accounts-list-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/views/connector-accounts-list-view.tsx
@@ -173,9 +173,7 @@ export const ConnectorAccountsListView: FC<ConnectorAccountsListViewProps> = ({
 								<Plus className="size-3 text-primary" />
 							)}
 						</div>
-						<span className="text-xs sm:text-sm font-medium">
-							{buttonText}
-						</span>
+						<span className="text-xs sm:text-sm font-medium">{buttonText}</span>
 					</button>
 				</div>
 			</div>
diff --git a/surfsense_web/components/assistant-ui/connector-popup/views/youtube-crawler-view.tsx b/surfsense_web/components/assistant-ui/connector-popup/views/youtube-crawler-view.tsx
index c16072bca..8982b16a8 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/views/youtube-crawler-view.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/views/youtube-crawler-view.tsx
@@ -337,9 +337,7 @@ export const YouTubeCrawlerView: FC<YouTubeCrawlerViewProps> = ({ searchSpaceId,
 					disabled={isSubmitting || isFetchingPlaylist || videoTags.length === 0}
 					className="relative text-xs sm:text-sm min-w-[140px] disabled:opacity-50 disabled:cursor-not-allowed disabled:pointer-events-none"
 				>
-					<span className={isSubmitting ? "opacity-0" : ""}>
-						{t("submit")}
-					</span>
+					<span className={isSubmitting ? "opacity-0" : ""}>{t("submit")}</span>
 					{isSubmitting && <Spinner size="sm" className="absolute" />}
 				</Button>
 			</div>
diff --git a/surfsense_web/components/assistant-ui/document-upload-popup.tsx b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
index 7b0409345..0b38979a5 100644
--- a/surfsense_web/components/assistant-ui/document-upload-popup.tsx
+++ b/surfsense_web/components/assistant-ui/document-upload-popup.tsx
@@ -132,9 +132,7 @@ const DocumentUploadPopupContent: FC<{
 				<div className="flex-1 min-h-0 overflow-y-auto overscroll-contain">
 					<div className="sticky top-0 z-20 bg-muted px-4 sm:px-6 pt-6 sm:pt-8 pb-10">
 						<div className="flex items-center gap-2 mb-1 pr-8 sm:pr-0">
-							<h2 className="text-xl sm:text-3xl font-semibold tracking-tight">
-								Upload Documents
-							</h2>
+							<h2 className="text-xl sm:text-3xl font-semibold tracking-tight">Upload Documents</h2>
 						</div>
 						<p className="text-xs sm:text-base text-muted-foreground/80 line-clamp-1">
 							Upload and sync your documents to your search space
diff --git a/surfsense_web/components/assistant-ui/image.tsx b/surfsense_web/components/assistant-ui/image.tsx
index c147eede4..59781abcf 100644
--- a/surfsense_web/components/assistant-ui/image.tsx
+++ b/surfsense_web/components/assistant-ui/image.tsx
@@ -3,10 +3,10 @@
 import type { ImageMessagePartComponent } from "@assistant-ui/react";
 import { cva, type VariantProps } from "class-variance-authority";
 import { ImageIcon, ImageOffIcon } from "lucide-react";
+import NextImage from "next/image";
 import { memo, type PropsWithChildren, useEffect, useRef, useState } from "react";
 import { createPortal } from "react-dom";
 import { cn } from "@/lib/utils";
-import NextImage from 'next/image';
 
 const imageVariants = cva("aui-image-root relative overflow-hidden rounded-lg", {
 	variants: {
@@ -88,23 +88,23 @@ function ImagePreview({
 					<ImageOffIcon className="size-8 text-muted-foreground" />
 				</div>
 			) : isDataOrBlobUrl(src) ? (
-                // biome-ignore lint/performance/noImgElement: data/blob URLs need plain img
-                <img
-                    ref={imgRef}
-                    src={src}
-                    alt={alt}
-                    className={cn("block h-auto w-full object-contain", !loaded && "invisible", className)}
-                    onLoad={(e) => {
-                        if (typeof src === "string") setLoadedSrc(src);
-                        onLoad?.(e);
-                    }}
-                    onError={(e) => {
-                        if (typeof src === "string") setErrorSrc(src);
-                        onError?.(e);
-                    }}
-                    {...props}
-                />
-            ) : (
+				// biome-ignore lint/performance/noImgElement: data/blob URLs need plain img
+				<img
+					ref={imgRef}
+					src={src}
+					alt={alt}
+					className={cn("block h-auto w-full object-contain", !loaded && "invisible", className)}
+					onLoad={(e) => {
+						if (typeof src === "string") setLoadedSrc(src);
+						onLoad?.(e);
+					}}
+					onError={(e) => {
+						if (typeof src === "string") setErrorSrc(src);
+						onError?.(e);
+					}}
+					{...props}
+				/>
+			) : (
 				// biome-ignore lint/performance/noImgElement: intentional for dynamic external URLs
 				// <img
 				// 	ref={imgRef}
@@ -122,22 +122,22 @@ function ImagePreview({
 				// 	{...props}
 				// />
 				<NextImage
-				fill
-				src={src || ""}
-				alt={alt}
-				sizes="(max-width: 768px) 100vw, (max-width: 1200px) 80vw, 60vw"
-				className={cn("block object-contain", !loaded && "invisible", className)}
-				onLoad={() => {
-					if (typeof src === "string") setLoadedSrc(src);
-					onLoad?.();
-				}}
-				onError={() => {
-					if (typeof src === "string") setErrorSrc(src);
-					onError?.();
-				}}
-				unoptimized={false}
-				{...props}
-			/>
+					fill
+					src={src || ""}
+					alt={alt}
+					sizes="(max-width: 768px) 100vw, (max-width: 1200px) 80vw, 60vw"
+					className={cn("block object-contain", !loaded && "invisible", className)}
+					onLoad={() => {
+						if (typeof src === "string") setLoadedSrc(src);
+						onLoad?.();
+					}}
+					onError={() => {
+						if (typeof src === "string") setErrorSrc(src);
+						onError?.();
+					}}
+					unoptimized={false}
+					{...props}
+				/>
 			)}
 		</div>
 	);
@@ -162,8 +162,8 @@ type ImageZoomProps = PropsWithChildren<{
 	alt?: string;
 }>;
 function isDataOrBlobUrl(src: string | undefined): boolean {
-    if (!src || typeof src !== "string") return false;
-    return src.startsWith("data:") || src.startsWith("blob:");
+	if (!src || typeof src !== "string") return false;
+	return src.startsWith("data:") || src.startsWith("blob:");
 }
 function ImageZoom({ src, alt = "Image preview", children }: ImageZoomProps) {
 	const [isMounted, setIsMounted] = useState(false);
@@ -216,38 +216,38 @@ function ImageZoom({ src, alt = "Image preview", children }: ImageZoomProps) {
 					>
 						{/** biome-ignore lint/performance/noImgElement: <explanation> */}
 						{isDataOrBlobUrl(src) ? (
-                            // biome-ignore lint/performance/noImgElement: data/blob URLs need plain img
-                            <img
-                                data-slot="image-zoom-content"
-                                src={src}
-                                alt={alt}
-                                className="aui-image-zoom-content fade-in zoom-in-95 max-h-[90vh] max-w-[90vw] animate-in object-contain duration-200"
-                                onClick={(e) => {
-                                    e.stopPropagation();
-                                    handleClose();
-                                }}
-                                onKeyDown={(e) => {
-                                    if (e.key === "Enter") {
-                                        e.stopPropagation();
-                                        handleClose();
-                                    }
-                                }}
-                            />
-                        ) : (
+							// biome-ignore lint/performance/noImgElement: data/blob URLs need plain img
+							<img
+								data-slot="image-zoom-content"
+								src={src}
+								alt={alt}
+								className="aui-image-zoom-content fade-in zoom-in-95 max-h-[90vh] max-w-[90vw] animate-in object-contain duration-200"
+								onClick={(e) => {
+									e.stopPropagation();
+									handleClose();
+								}}
+								onKeyDown={(e) => {
+									if (e.key === "Enter") {
+										e.stopPropagation();
+										handleClose();
+									}
+								}}
+							/>
+						) : (
 							<NextImage
-                                data-slot="image-zoom-content"
-                                fill
-                                src={src}
-                                alt={alt}
-                                sizes="90vw"
-                                className="aui-image-zoom-content fade-in zoom-in-95 object-contain duration-200"
-                                onClick={(e) => {
-                                    e.stopPropagation();
-                                    handleClose();
-                                }}
-                                unoptimized={false}
-                            />
-                        )}
+								data-slot="image-zoom-content"
+								fill
+								src={src}
+								alt={alt}
+								sizes="90vw"
+								className="aui-image-zoom-content fade-in zoom-in-95 object-contain duration-200"
+								onClick={(e) => {
+									e.stopPropagation();
+									handleClose();
+								}}
+								unoptimized={false}
+							/>
+						)}
 					</button>,
 					document.body
 				)}
diff --git a/surfsense_web/components/assistant-ui/thread-list.tsx b/surfsense_web/components/assistant-ui/thread-list.tsx
index e8b8db6fe..bca36c037 100644
--- a/surfsense_web/components/assistant-ui/thread-list.tsx
+++ b/surfsense_web/components/assistant-ui/thread-list.tsx
@@ -241,9 +241,7 @@ const ThreadListItemComponent = memo(function ThreadListItemComponent({
 			<MessageSquareIcon className="size-4 shrink-0 text-muted-foreground" />
 			<div className="flex-1 min-w-0">
 				<p className="truncate text-sm font-medium">{thread.title || "New Chat"}</p>
-				<p className="truncate text-xs text-muted-foreground">
-					{relativeTime}
-				</p>
+				<p className="truncate text-xs text-muted-foreground">{relativeTime}</p>
 			</div>
 			<DropdownMenu>
 				<DropdownMenuTrigger asChild>
diff --git a/surfsense_web/components/assistant-ui/tool-fallback.tsx b/surfsense_web/components/assistant-ui/tool-fallback.tsx
index 40118d2e4..b658dba6d 100644
--- a/surfsense_web/components/assistant-ui/tool-fallback.tsx
+++ b/surfsense_web/components/assistant-ui/tool-fallback.tsx
@@ -26,7 +26,8 @@ export const ToolFallback: ToolCallMessagePartComponent = ({
 	);
 
 	const serializedResult = useMemo(
-		() => (result !== undefined && typeof result !== "string" ? JSON.stringify(result, null, 2) : null),
+		() =>
+			result !== undefined && typeof result !== "string" ? JSON.stringify(result, null, 2) : null,
 		[result]
 	);
 
diff --git a/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx b/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx
index e14022f5c..1c4383388 100644
--- a/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx
+++ b/surfsense_web/components/chat-comments/comment-composer/comment-composer.tsx
@@ -300,15 +300,15 @@ export function CommentComposer({
 
 			<div className={cn("flex items-center gap-2", !compact && "justify-end")}>
 				{onCancel && (
-				<Button
-					type="button"
-					variant="ghost"
-					size="sm"
-					onClick={onCancel}
-					disabled={isSubmitting}
-				>
-					Cancel
-				</Button>
+					<Button
+						type="button"
+						variant="ghost"
+						size="sm"
+						onClick={onCancel}
+						disabled={isSubmitting}
+					>
+						Cancel
+					</Button>
 				)}
 				<Button
 					type="button"
@@ -317,11 +317,7 @@ export function CommentComposer({
 					disabled={!canSubmit}
 					className={cn(!canSubmit && "opacity-50", compact && "size-8 shrink-0 rounded-full")}
 				>
-					{compact ? (
-						<ArrowUp className="size-4" />
-					) : (
-						submitLabel
-					)}
+					{compact ? <ArrowUp className="size-4" /> : submitLabel}
 				</Button>
 			</div>
 		</div>
diff --git a/surfsense_web/components/documents/DocumentNode.tsx b/surfsense_web/components/documents/DocumentNode.tsx
index fe796b5be..d8e37df1c 100644
--- a/surfsense_web/components/documents/DocumentNode.tsx
+++ b/surfsense_web/components/documents/DocumentNode.tsx
@@ -207,9 +207,15 @@ export const DocumentNode = React.memo(function DocumentNode({
 						);
 					})()}
 
-					<Tooltip delayDuration={600} open={titleTooltipOpen} onOpenChange={handleTitleTooltipOpenChange}>
+					<Tooltip
+						delayDuration={600}
+						open={titleTooltipOpen}
+						onOpenChange={handleTitleTooltipOpenChange}
+					>
 						<TooltipTrigger asChild>
-							<span ref={titleRef} className="flex-1 min-w-0 truncate">{doc.title}</span>
+							<span ref={titleRef} className="flex-1 min-w-0 truncate">
+								{doc.title}
+							</span>
 						</TooltipTrigger>
 						<TooltipContent side="bottom" className="max-w-xs break-words">
 							{doc.title}
@@ -276,10 +282,7 @@ export const DocumentNode = React.memo(function DocumentNode({
 									Versions
 								</DropdownMenuItem>
 							)}
-							<DropdownMenuItem
-								disabled={isProcessing}
-								onClick={() => onDelete(doc)}
-							>
+							<DropdownMenuItem disabled={isProcessing} onClick={() => onDelete(doc)}>
 								<Trash2 className="mr-2 h-4 w-4" />
 								Delete
 							</DropdownMenuItem>
@@ -321,10 +324,7 @@ export const DocumentNode = React.memo(function DocumentNode({
 							Versions
 						</ContextMenuItem>
 					)}
-					<ContextMenuItem
-						disabled={isProcessing}
-						onClick={() => onDelete(doc)}
-					>
+					<ContextMenuItem disabled={isProcessing} onClick={() => onDelete(doc)}>
 						<Trash2 className="mr-2 h-4 w-4" />
 						Delete
 					</ContextMenuItem>
diff --git a/surfsense_web/components/documents/FolderTreeView.tsx b/surfsense_web/components/documents/FolderTreeView.tsx
index 371d00f42..47cd17596 100644
--- a/surfsense_web/components/documents/FolderTreeView.tsx
+++ b/surfsense_web/components/documents/FolderTreeView.tsx
@@ -97,7 +97,10 @@ export function FolderTreeView({
 	const handleCancelRename = useCallback(() => setRenamingFolderId(null), [setRenamingFolderId]);
 
 	const effectiveActiveTypes = useMemo(() => {
-		if (activeTypes.includes("FILE" as DocumentTypeEnum) && !activeTypes.includes("LOCAL_FOLDER_FILE" as DocumentTypeEnum)) {
+		if (
+			activeTypes.includes("FILE" as DocumentTypeEnum) &&
+			!activeTypes.includes("LOCAL_FOLDER_FILE" as DocumentTypeEnum)
+		) {
 			return [...activeTypes, "LOCAL_FOLDER_FILE" as DocumentTypeEnum];
 		}
 		return activeTypes;
@@ -110,7 +113,9 @@ export function FolderTreeView({
 		function check(folderId: number): boolean {
 			if (match[folderId] !== undefined) return match[folderId];
 			const childDocs = (docsByFolder[folderId] ?? []).some(
-				(d) => effectiveActiveTypes.length === 0 || effectiveActiveTypes.includes(d.document_type as DocumentTypeEnum)
+				(d) =>
+					effectiveActiveTypes.length === 0 ||
+					effectiveActiveTypes.includes(d.document_type as DocumentTypeEnum)
 			);
 			if (childDocs) {
 				match[folderId] = true;
@@ -201,7 +206,9 @@ export function FolderTreeView({
 			? childFolders.filter((f) => hasDescendantMatch[f.id])
 			: childFolders;
 		const childDocs = (docsByFolder[key] ?? []).filter(
-			(d) => effectiveActiveTypes.length === 0 || effectiveActiveTypes.includes(d.document_type as DocumentTypeEnum)
+			(d) =>
+				effectiveActiveTypes.length === 0 ||
+				effectiveActiveTypes.includes(d.document_type as DocumentTypeEnum)
 		);
 
 		const nodes: React.ReactNode[] = [];
@@ -223,7 +230,7 @@ export function FolderTreeView({
 					depth={depth}
 					isExpanded={isExpanded}
 					isRenaming={renamingFolderId === f.id}
-				selectionState={folderSelectionStates[f.id] ?? "none"}
+					selectionState={folderSelectionStates[f.id] ?? "none"}
 					processingState={folderProcessingStates[f.id] ?? "idle"}
 					onToggleSelect={onToggleFolderSelect}
 					onToggleExpand={onToggleExpand}
diff --git a/surfsense_web/components/editor/plate-editor.tsx b/surfsense_web/components/editor/plate-editor.tsx
index ed239ffa3..66e9a0e5e 100644
--- a/surfsense_web/components/editor/plate-editor.tsx
+++ b/surfsense_web/components/editor/plate-editor.tsx
@@ -158,17 +158,18 @@ export function PlateEditor({
 	// When not forced read-only, the user can toggle between editing/viewing.
 	const canToggleMode = !readOnly;
 
-	const contextProviderValue = useMemo(()=> ({
-		onSave,
-		hasUnsavedChanges,
-		isSaving,
-		canToggleMode,
-	}), [onSave, hasUnsavedChanges, isSaving, canToggleMode]);
+	const contextProviderValue = useMemo(
+		() => ({
+			onSave,
+			hasUnsavedChanges,
+			isSaving,
+			canToggleMode,
+		}),
+		[onSave, hasUnsavedChanges, isSaving, canToggleMode]
+	);
 
 	return (
-		<EditorSaveContext.Provider
-			value={contextProviderValue}
-		>
+		<EditorSaveContext.Provider value={contextProviderValue}>
 			<Plate
 				editor={editor}
 				// Only pass readOnly as a controlled prop when forced (permanently read-only).
diff --git a/surfsense_web/components/homepage/use-cases-grid.tsx b/surfsense_web/components/homepage/use-cases-grid.tsx
index f9d315b49..7aa272a5c 100644
--- a/surfsense_web/components/homepage/use-cases-grid.tsx
+++ b/surfsense_web/components/homepage/use-cases-grid.tsx
@@ -1,7 +1,7 @@
 "use client";
-import Image from 'next/image';
 
 import { AnimatePresence, motion } from "motion/react";
+import Image from "next/image";
 import { ExpandedGifOverlay, useExpandedGif } from "@/components/ui/expanded-gif-overlay";
 
 const useCases = [
@@ -83,13 +83,13 @@ function UseCaseCard({
 						className="w-full rounded-xl object-cover transition-transform duration-500 group-hover:scale-[1.02]"
 					/>
 					<div className="relative w-full h-48">
-					<Image
-						src={src}
-						alt={title}
-						fill
-						className="rounded-xl object-cover transition-transform duration-500 group-hover:scale-[1.02]"
-						unoptimized={src.endsWith('.gif')}
-					/>
+						<Image
+							src={src}
+							alt={title}
+							fill
+							className="rounded-xl object-cover transition-transform duration-500 group-hover:scale-[1.02]"
+							unoptimized={src.endsWith(".gif")}
+						/>
 					</div>
 				</div>
 				<div className="px-5 py-4">
diff --git a/surfsense_web/components/layout/providers/LayoutDataProvider.tsx b/surfsense_web/components/layout/providers/LayoutDataProvider.tsx
index 74c3c64de..7d4cd9901 100644
--- a/surfsense_web/components/layout/providers/LayoutDataProvider.tsx
+++ b/surfsense_web/components/layout/providers/LayoutDataProvider.tsx
@@ -370,7 +370,8 @@ export function LayoutDataProvider({ searchSpaceId, children }: LayoutDataProvid
 						url: "#announcements",
 						icon: Megaphone,
 						isActive: isAnnouncementsSidebarOpen,
-						badge: announcementUnreadCount > 0 ? formatInboxCount(announcementUnreadCount) : undefined,
+						badge:
+							announcementUnreadCount > 0 ? formatInboxCount(announcementUnreadCount) : undefined,
 					},
 				] as (NavItem | null)[]
 			).filter((item): item is NavItem => item !== null),
diff --git a/surfsense_web/components/layout/ui/sidebar/AllPrivateChatsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/AllPrivateChatsSidebar.tsx
index 0e2163dd4..3459fccf6 100644
--- a/surfsense_web/components/layout/ui/sidebar/AllPrivateChatsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/AllPrivateChatsSidebar.tsx
@@ -376,24 +376,24 @@ export function AllPrivateChatsSidebarContent({
 											<span className="truncate">{thread.title || "New Chat"}</span>
 										</button>
 									) : (
-									<Tooltip delayDuration={600}>
-										<TooltipTrigger asChild>
-											<button
-												type="button"
-												onClick={() => handleThreadClick(thread.id)}
-												disabled={isBusy}
-												className="flex items-center gap-2 flex-1 min-w-0 text-left overflow-hidden"
-											>
-												<span className="truncate">{thread.title || "New Chat"}</span>
-											</button>
-										</TooltipTrigger>
-										<TooltipContent side="bottom" align="start">
-											<p>
-												{t("updated") || "Updated"}:{" "}
-												{format(new Date(thread.updatedAt), "MMM d, yyyy 'at' h:mm a")}
-											</p>
-										</TooltipContent>
-									</Tooltip>
+										<Tooltip delayDuration={600}>
+											<TooltipTrigger asChild>
+												<button
+													type="button"
+													onClick={() => handleThreadClick(thread.id)}
+													disabled={isBusy}
+													className="flex items-center gap-2 flex-1 min-w-0 text-left overflow-hidden"
+												>
+													<span className="truncate">{thread.title || "New Chat"}</span>
+												</button>
+											</TooltipTrigger>
+											<TooltipContent side="bottom" align="start">
+												<p>
+													{t("updated") || "Updated"}:{" "}
+													{format(new Date(thread.updatedAt), "MMM d, yyyy 'at' h:mm a")}
+												</p>
+											</TooltipContent>
+										</Tooltip>
 									)}
 
 									<DropdownMenu
diff --git a/surfsense_web/components/layout/ui/sidebar/AllSharedChatsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/AllSharedChatsSidebar.tsx
index 9cc1da1e4..097d10121 100644
--- a/surfsense_web/components/layout/ui/sidebar/AllSharedChatsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/AllSharedChatsSidebar.tsx
@@ -375,24 +375,24 @@ export function AllSharedChatsSidebarContent({
 											<span className="truncate">{thread.title || "New Chat"}</span>
 										</button>
 									) : (
-									<Tooltip delayDuration={600}>
-										<TooltipTrigger asChild>
-											<button
-												type="button"
-												onClick={() => handleThreadClick(thread.id)}
-												disabled={isBusy}
-												className="flex items-center gap-2 flex-1 min-w-0 text-left overflow-hidden"
-											>
-												<span className="truncate">{thread.title || "New Chat"}</span>
-											</button>
-										</TooltipTrigger>
-										<TooltipContent side="bottom" align="start">
-											<p>
-												{t("updated") || "Updated"}:{" "}
-												{format(new Date(thread.updatedAt), "MMM d, yyyy 'at' h:mm a")}
-											</p>
-										</TooltipContent>
-									</Tooltip>
+										<Tooltip delayDuration={600}>
+											<TooltipTrigger asChild>
+												<button
+													type="button"
+													onClick={() => handleThreadClick(thread.id)}
+													disabled={isBusy}
+													className="flex items-center gap-2 flex-1 min-w-0 text-left overflow-hidden"
+												>
+													<span className="truncate">{thread.title || "New Chat"}</span>
+												</button>
+											</TooltipTrigger>
+											<TooltipContent side="bottom" align="start">
+												<p>
+													{t("updated") || "Updated"}:{" "}
+													{format(new Date(thread.updatedAt), "MMM d, yyyy 'at' h:mm a")}
+												</p>
+											</TooltipContent>
+										</Tooltip>
 									)}
 
 									<DropdownMenu
diff --git a/surfsense_web/components/markdown-viewer.tsx b/surfsense_web/components/markdown-viewer.tsx
index 1c39f03a0..2acf68e94 100644
--- a/surfsense_web/components/markdown-viewer.tsx
+++ b/surfsense_web/components/markdown-viewer.tsx
@@ -2,9 +2,9 @@ import { createCodePlugin } from "@streamdown/code";
 import { createMathPlugin } from "@streamdown/math";
 import { Streamdown, type StreamdownProps } from "streamdown";
 import "katex/dist/katex.min.css";
-import { cn } from "@/lib/utils";
-import Image from 'next/image';
 import { is } from "drizzle-orm";
+import Image from "next/image";
+import { cn } from "@/lib/utils";
 
 const code = createCodePlugin({
 	themes: ["nord", "nord"],
@@ -130,30 +130,31 @@ export function MarkdownViewer({ content, className, maxLength }: MarkdownViewer
 		),
 		hr: ({ ...props }) => <hr className="my-4 border-muted" {...props} />,
 		img: ({ src, alt, width: _w, height: _h, ...props }) => {
-    	const isDataOrUnknownUrl = typeof src === "string" && (src.startsWith("data:") || !src.startsWith("http"));
+			const isDataOrUnknownUrl =
+				typeof src === "string" && (src.startsWith("data:") || !src.startsWith("http"));
 
-    return isDataOrUnknownUrl ? (
-        // eslint-disable-next-line @next/next/no-img-element
-        <img
-            className="max-w-full h-auto my-4 rounded"
-            alt={alt || "markdown image"}
-            src={src}
-            loading="lazy"
-            {...props}
-        />
-    ) : (
-        <Image
-            className="max-w-full h-auto my-4 rounded"
-            alt={alt || "markdown image"}
-            src={typeof src === "string" ? src : ""}
-            width={_w || 800}
-            height={_h || 600}
-            sizes="(max-width: 768px) 100vw, (max-width: 1200px) 75vw, 60vw"
-            unoptimized={isDataOrUnknownUrl}
-            {...props}
-        />
-    );
-},
+			return isDataOrUnknownUrl ? (
+				// eslint-disable-next-line @next/next/no-img-element
+				<img
+					className="max-w-full h-auto my-4 rounded"
+					alt={alt || "markdown image"}
+					src={src}
+					loading="lazy"
+					{...props}
+				/>
+			) : (
+				<Image
+					className="max-w-full h-auto my-4 rounded"
+					alt={alt || "markdown image"}
+					src={typeof src === "string" ? src : ""}
+					width={_w || 800}
+					height={_h || 600}
+					sizes="(max-width: 768px) 100vw, (max-width: 1200px) 75vw, 60vw"
+					unoptimized={isDataOrUnknownUrl}
+					{...props}
+				/>
+			);
+		},
 		table: ({ ...props }) => (
 			<div className="overflow-x-auto my-4 rounded-lg border border-border w-full">
 				<table className="w-full divide-y divide-border" {...props} />
diff --git a/surfsense_web/components/settings/user-settings-dialog.tsx b/surfsense_web/components/settings/user-settings-dialog.tsx
index b74ff973b..0afdfb2b7 100644
--- a/surfsense_web/components/settings/user-settings-dialog.tsx
+++ b/surfsense_web/components/settings/user-settings-dialog.tsx
@@ -5,10 +5,10 @@ import { Globe, KeyRound, Monitor, Receipt, Sparkles, User } from "lucide-react"
 import { useTranslations } from "next-intl";
 import { ApiKeyContent } from "@/app/dashboard/[search_space_id]/user-settings/components/ApiKeyContent";
 import { CommunityPromptsContent } from "@/app/dashboard/[search_space_id]/user-settings/components/CommunityPromptsContent";
+import { DesktopContent } from "@/app/dashboard/[search_space_id]/user-settings/components/DesktopContent";
 import { ProfileContent } from "@/app/dashboard/[search_space_id]/user-settings/components/ProfileContent";
 import { PromptsContent } from "@/app/dashboard/[search_space_id]/user-settings/components/PromptsContent";
 import { PurchaseHistoryContent } from "@/app/dashboard/[search_space_id]/user-settings/components/PurchaseHistoryContent";
-import { DesktopContent } from "@/app/dashboard/[search_space_id]/user-settings/components/DesktopContent";
 import { userSettingsDialogAtom } from "@/atoms/settings/settings-dialog.atoms";
 import { SettingsDialog } from "@/components/settings/settings-dialog";
 
diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index c8ce195aa..36a24e299 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -471,13 +471,13 @@ export function DocumentUploadTab({
 						</button>
 					))
 				) : (
-				<button
-					type="button"
-					className="flex flex-col items-center gap-4 py-12 px-4 cursor-pointer w-full bg-transparent border-none"
-					onClick={() => {
-						if (!isElectron) fileInputRef.current?.click();
-					}}
-				>
+					<button
+						type="button"
+						className="flex flex-col items-center gap-4 py-12 px-4 cursor-pointer w-full bg-transparent border-none"
+						onClick={() => {
+							if (!isElectron) fileInputRef.current?.click();
+						}}
+					>
 						<Upload className="h-10 w-10 text-muted-foreground" />
 						<div className="text-center space-y-1.5">
 							<p className="text-base font-medium">
@@ -485,10 +485,15 @@ export function DocumentUploadTab({
 							</p>
 							<p className="text-sm text-muted-foreground">{t("file_size_limit")}</p>
 						</div>
-					{/* biome-ignore lint/a11y/useSemanticElements: wrapper to stop click propagation to parent button */}
-					<div className="w-full mt-1" onClick={(e) => e.stopPropagation()} onKeyDown={(e) => e.stopPropagation()} role="group">
-						{renderBrowseButton({ fullWidth: true })}
-					</div>
+						{/* biome-ignore lint/a11y/useSemanticElements: wrapper to stop click propagation to parent button */}
+						<div
+							className="w-full mt-1"
+							onClick={(e) => e.stopPropagation()}
+							onKeyDown={(e) => e.stopPropagation()}
+							role="group"
+						>
+							{renderBrowseButton({ fullWidth: true })}
+						</div>
 					</button>
 				)}
 			</div>
@@ -684,17 +689,17 @@ export function DocumentUploadTab({
 						</span>
 					</AccordionTrigger>
 					<AccordionContent className="px-3 pb-3">
-					<div className="flex flex-wrap gap-1.5">
-						{supportedExtensions.map((ext) => (
-							<Badge
-								key={ext}
-								variant="secondary"
-								className="rounded border-0 bg-neutral-200/80 dark:bg-neutral-700/60 text-muted-foreground text-[10px] px-2 py-0.5 font-normal"
-							>
-								{ext}
-							</Badge>
-						))}
-					</div>
+						<div className="flex flex-wrap gap-1.5">
+							{supportedExtensions.map((ext) => (
+								<Badge
+									key={ext}
+									variant="secondary"
+									className="rounded border-0 bg-neutral-200/80 dark:bg-neutral-700/60 text-muted-foreground text-[10px] px-2 py-0.5 font-normal"
+								>
+									{ext}
+								</Badge>
+							))}
+						</div>
 					</AccordionContent>
 				</AccordionItem>
 			</Accordion>
diff --git a/surfsense_web/components/tool-ui/citation/citation-list.tsx b/surfsense_web/components/tool-ui/citation/citation-list.tsx
index 75b02bf3d..bbe869a09 100644
--- a/surfsense_web/components/tool-ui/citation/citation-list.tsx
+++ b/surfsense_web/components/tool-ui/citation/citation-list.tsx
@@ -2,13 +2,12 @@
 
 import type { LucideIcon } from "lucide-react";
 import { Code2, Database, ExternalLink, File, FileText, Globe, Newspaper } from "lucide-react";
+import NextImage from "next/image";
 import * as React from "react";
 import { openSafeNavigationHref, resolveSafeNavigationHref } from "../shared/media";
 import { cn, Popover, PopoverContent, PopoverTrigger } from "./_adapter";
 import { Citation } from "./citation";
 import type { CitationType, CitationVariant, SerializableCitation } from "./schema";
-import NextImage from 'next/image';
-
 
 const TYPE_ICONS: Record<CitationType, LucideIcon> = {
 	webpage: Globe,
@@ -264,9 +263,9 @@ function OverflowItem({ citation, onClick }: OverflowItemProps) {
 					className="size-4.5 rounded-full object-cover"
 					unoptimized={true}
 				/>
-				) : (
+			) : (
 				<TypeIcon className="text-muted-foreground size-3" aria-hidden="true" />
-				)}
+			)}
 			<div className="min-w-0 flex-1">
 				<p className="group-hover:decoration-foreground/30 truncate text-sm font-medium group-hover:underline group-hover:underline-offset-2">
 					{citation.title}
@@ -341,18 +340,18 @@ function StackedCitations({ id, citations, className, onNavigate }: StackedCitat
 										style={{ zIndex: maxIcons - index }}
 									>
 										{citation.favicon ? (
-										<NextImage
-											src={citation.favicon}
-											alt=""
-											aria-hidden="true"
-											width={18}
-											height={18}
-											className="size-4.5 rounded-full object-cover"
-											unoptimized={true}
-										/>
-									) : (
-										<TypeIcon className="text-muted-foreground size-3" aria-hidden="true" />
-									)}	
+											<NextImage
+												src={citation.favicon}
+												alt=""
+												aria-hidden="true"
+												width={18}
+												height={18}
+												className="size-4.5 rounded-full object-cover"
+												unoptimized={true}
+											/>
+										) : (
+											<TypeIcon className="text-muted-foreground size-3" aria-hidden="true" />
+										)}
 									</div>
 								);
 							})}
diff --git a/surfsense_web/components/tool-ui/citation/citation.tsx b/surfsense_web/components/tool-ui/citation/citation.tsx
index fa5d4d165..c60034a0a 100644
--- a/surfsense_web/components/tool-ui/citation/citation.tsx
+++ b/surfsense_web/components/tool-ui/citation/citation.tsx
@@ -2,11 +2,11 @@
 
 import type { LucideIcon } from "lucide-react";
 import { Code2, Database, ExternalLink, File, FileText, Globe, Newspaper } from "lucide-react";
+import NextImage from "next/image";
 import * as React from "react";
 import { openSafeNavigationHref, sanitizeHref } from "../shared/media";
 import { cn, Popover, PopoverContent, PopoverTrigger } from "./_adapter";
 import type { CitationType, CitationVariant, SerializableCitation } from "./schema";
-import NextImage from 'next/image';
 
 const FALLBACK_LOCALE = "en-US";
 
@@ -115,18 +115,18 @@ export function Citation(props: CitationProps) {
 	};
 
 	const iconElement = favicon ? (
-    <NextImage
-        src={favicon}
-        alt=""
-        aria-hidden="true"
-        width={16}
-        height={16}
-        className="bg-muted size-3.5 shrink-0 rounded object-cover"
-        unoptimized={true}
-    />
-) : (
-    <TypeIcon className="size-3.5 shrink-0 opacity-60" aria-hidden="true" />
-);
+		<NextImage
+			src={favicon}
+			alt=""
+			aria-hidden="true"
+			width={16}
+			height={16}
+			className="bg-muted size-3.5 shrink-0 rounded object-cover"
+			unoptimized={true}
+		/>
+	) : (
+		<TypeIcon className="size-3.5 shrink-0 opacity-60" aria-hidden="true" />
+	);
 
 	const { open, handleMouseEnter, handleMouseLeave } = useHoverPopover();
 
diff --git a/surfsense_web/components/ui/animated-tabs.tsx b/surfsense_web/components/ui/animated-tabs.tsx
index 0cd8dd54c..f26e5af8d 100644
--- a/surfsense_web/components/ui/animated-tabs.tsx
+++ b/surfsense_web/components/ui/animated-tabs.tsx
@@ -202,7 +202,10 @@ const Tabs = forwardRef<
 		},
 		[onValueChange, value]
 	);
-	const contextValue = useMemo(() => ({ activeValue, onValueChange: handleValueChange }), [activeValue, handleValueChange]);
+	const contextValue = useMemo(
+		() => ({ activeValue, onValueChange: handleValueChange }),
+		[activeValue, handleValueChange]
+	);
 	return (
 		<TabsContext.Provider value={contextValue}>
 			<div ref={ref} className={cn("tabs-container", className)} {...props}>
diff --git a/surfsense_web/components/ui/toggle-group.tsx b/surfsense_web/components/ui/toggle-group.tsx
index 860fa7a52..44a94234a 100644
--- a/surfsense_web/components/ui/toggle-group.tsx
+++ b/surfsense_web/components/ui/toggle-group.tsx
@@ -3,9 +3,9 @@
 import * as ToggleGroupPrimitive from "@radix-ui/react-toggle-group";
 import type { VariantProps } from "class-variance-authority";
 import * as React from "react";
+import { useMemo } from "react";
 import { toggleVariants } from "@/components/ui/toggle";
 import { cn } from "@/lib/utils";
-import { useMemo } from "react";
 
 const ToggleGroupContext = React.createContext<
 	VariantProps<typeof toggleVariants> & {
@@ -28,8 +28,8 @@ function ToggleGroup({
 	VariantProps<typeof toggleVariants> & {
 		spacing?: number;
 	}) {
-	const contextValue = useMemo(() => ({variant, size, spacing }), [variant, size, spacing]);
-	
+	const contextValue = useMemo(() => ({ variant, size, spacing }), [variant, size, spacing]);
+
 	return (
 		<ToggleGroupPrimitive.Root
 			data-slot="toggle-group"
@@ -43,9 +43,7 @@ function ToggleGroup({
 			)}
 			{...props}
 		>
-			<ToggleGroupContext.Provider value={contextValue}>
-				{children}
-			</ToggleGroupContext.Provider>
+			<ToggleGroupContext.Provider value={contextValue}>{children}</ToggleGroupContext.Provider>
 		</ToggleGroupPrimitive.Root>
 	);
 }
diff --git a/surfsense_web/contexts/LocaleContext.tsx b/surfsense_web/contexts/LocaleContext.tsx
index e67e9c2a5..484721cbc 100644
--- a/surfsense_web/contexts/LocaleContext.tsx
+++ b/surfsense_web/contexts/LocaleContext.tsx
@@ -2,12 +2,12 @@
 
 import type React from "react";
 import { createContext, useCallback, useContext, useEffect, useMemo, useState } from "react";
+import { set } from "zod";
 import enMessages from "../messages/en.json";
 import esMessages from "../messages/es.json";
 import hiMessages from "../messages/hi.json";
 import ptMessages from "../messages/pt.json";
 import zhMessages from "../messages/zh.json";
-import { set } from "zod";
 
 type Locale = "en" | "es" | "pt" | "hi" | "zh";
 
@@ -66,13 +66,12 @@ export function LocaleProvider({ children }: { children: React.ReactNode }) {
 		}
 	}, [locale, mounted]);
 
-	const contextValue = useMemo(() => ({ locale, messages, setLocale }), [locale, messages, setLocale]);
-
-	return (
-		<LocaleContext.Provider value={contextValue}>
-			{children}
-		</LocaleContext.Provider>
+	const contextValue = useMemo(
+		() => ({ locale, messages, setLocale }),
+		[locale, messages, setLocale]
 	);
+
+	return <LocaleContext.Provider value={contextValue}>{children}</LocaleContext.Provider>;
 }
 
 export function useLocaleContext() {
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 6feb75463..a6959c32d 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -50,14 +50,21 @@ interface ElectronAPI {
 	replaceText: (text: string) => Promise<void>;
 	// Permissions
 	getPermissionsStatus: () => Promise<{
-		accessibility: 'authorized' | 'denied' | 'not determined' | 'restricted' | 'limited';
-		screenRecording: 'authorized' | 'denied' | 'not determined' | 'restricted' | 'limited';
+		accessibility: "authorized" | "denied" | "not determined" | "restricted" | "limited";
+		screenRecording: "authorized" | "denied" | "not determined" | "restricted" | "limited";
 	}>;
 	requestAccessibility: () => Promise<void>;
 	requestScreenRecording: () => Promise<void>;
 	restartApp: () => Promise<void>;
 	// Autocomplete
-	onAutocompleteContext: (callback: (data: { screenshot: string; searchSpaceId?: string; appName?: string; windowTitle?: string }) => void) => () => void;
+	onAutocompleteContext: (
+		callback: (data: {
+			screenshot: string;
+			searchSpaceId?: string;
+			appName?: string;
+			windowTitle?: string;
+		}) => void
+	) => () => void;
 	acceptSuggestion: (text: string) => Promise<void>;
 	dismissSuggestion: () => Promise<void>;
 	setAutocompleteEnabled: (enabled: boolean) => Promise<void>;

From 8d810467dd95a2cb7e34fa83324dc07d35801a04 Mon Sep 17 00:00:00 2001
From: Anish Sarkar <104695310+AnishSarkar22@users.noreply.github.com>
Date: Tue, 7 Apr 2026 05:57:13 +0530
Subject: [PATCH 155/202] refactor: add support for XHTML file conversion to
 markdown in document processors

---
 .../app/tasks/document_processors/_direct_converters.py      | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/surfsense_backend/app/tasks/document_processors/_direct_converters.py b/surfsense_backend/app/tasks/document_processors/_direct_converters.py
index b1a69ef4f..bbff4838e 100644
--- a/surfsense_backend/app/tasks/document_processors/_direct_converters.py
+++ b/surfsense_backend/app/tasks/document_processors/_direct_converters.py
@@ -4,8 +4,8 @@ Lossless file-to-markdown converters for text-based formats.
 These converters handle file types that can be faithfully represented as
 markdown without any external ETL/OCR service:
 
-- CSV / TSV  → markdown table  (stdlib ``csv``)
-- HTML / HTM → markdown        (``markdownify``)
+- CSV / TSV          → markdown table  (stdlib ``csv``)
+- HTML / HTM / XHTML → markdown        (``markdownify``)
 """
 
 from __future__ import annotations
@@ -73,6 +73,7 @@ _CONVERTER_MAP: dict[str, Callable[..., str]] = {
     ".tsv": tsv_to_markdown,
     ".html": html_to_markdown,
     ".htm": html_to_markdown,
+    ".xhtml": html_to_markdown,
 }
 
 

From 6ecd75fbbbc834fafce36b0c8ffb367b89d1beea Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Mon, 6 Apr 2026 21:32:49 -0700
Subject: [PATCH 156/202] refactor: simplify HeroSection component and enhance
 UI with new features

- Removed dynamic import of HeroCarousel and replaced it with a static layout.
- Introduced new TAB_ITEMS for showcasing features with descriptions and media.
- Enhanced the layout and styling for better responsiveness and visual appeal.
- Cleaned up unused code and improved overall readability of the component.
---
 .../components/homepage/hero-section.tsx      | 636 +++++++++---------
 1 file changed, 313 insertions(+), 323 deletions(-)

diff --git a/surfsense_web/components/homepage/hero-section.tsx b/surfsense_web/components/homepage/hero-section.tsx
index 299cf1032..1bb28e770 100644
--- a/surfsense_web/components/homepage/hero-section.tsx
+++ b/surfsense_web/components/homepage/hero-section.tsx
@@ -1,39 +1,22 @@
 "use client";
 import { AnimatePresence, motion } from "motion/react";
-import dynamic from "next/dynamic";
+import { Monitor } from "lucide-react";
 import Link from "next/link";
-import type React from "react";
-import { useEffect, useRef, useState } from "react";
+import React, { useCallback, useEffect, useRef, useState, memo } from "react";
 import Balancer from "react-wrap-balancer";
 import { AUTH_TYPE, BACKEND_URL } from "@/lib/env-config";
 import { trackLoginAttempt } from "@/lib/posthog/events";
 import { cn } from "@/lib/utils";
+import {
+	ExpandedMediaOverlay,
+	useExpandedMedia,
+} from "@/components/ui/expanded-gif-overlay";
+import {
+	Tooltip,
+	TooltipContent,
+	TooltipTrigger,
+} from "@/components/ui/tooltip";
 
-const HeroCarousel = dynamic(
-	() => import("@/components/ui/hero-carousel").then((m) => ({ default: m.HeroCarousel })),
-	{
-		ssr: false,
-		loading: () => (
-			<div className="w-full py-4 sm:py-8">
-				<div className="mx-auto w-full max-w-[900px]">
-					<div className="overflow-hidden rounded-2xl border border-neutral-200/60 bg-white shadow-xl sm:rounded-3xl dark:border-neutral-700/60 dark:bg-neutral-900">
-						<div className="flex items-center gap-3 border-b border-neutral-200/60 px-4 py-3 sm:px-6 sm:py-4 dark:border-neutral-700/60">
-							<div className="min-w-0 flex-1">
-								<div className="h-5 w-32 animate-pulse rounded bg-neutral-200 dark:bg-neutral-700" />
-								<div className="mt-2 h-4 w-64 animate-pulse rounded bg-neutral-100 dark:bg-neutral-800" />
-							</div>
-						</div>
-						<div className="bg-neutral-50 p-2 sm:p-3 dark:bg-neutral-950">
-							<div className="aspect-video w-full animate-pulse rounded-lg bg-neutral-100 sm:rounded-xl dark:bg-neutral-800" />
-						</div>
-					</div>
-				</div>
-			</div>
-		),
-	}
-);
-
-// Official Google "G" logo with brand colors
 const GoogleLogo = ({ className }: { className?: string }) => (
 	<svg
 		className={className}
@@ -62,87 +45,102 @@ const GoogleLogo = ({ className }: { className?: string }) => (
 	</svg>
 );
 
-function useIsDesktop(breakpoint = 1024) {
-	const [isDesktop, setIsDesktop] = useState(false);
-	useEffect(() => {
-		const mql = window.matchMedia(`(min-width: ${breakpoint}px)`);
-		setIsDesktop(mql.matches);
-		const handler = (e: MediaQueryListEvent) => setIsDesktop(e.matches);
-		mql.addEventListener("change", handler);
-		return () => mql.removeEventListener("change", handler);
-	}, [breakpoint]);
-	return isDesktop;
-}
+const TAB_ITEMS = [
+	{
+		title: "Connect & Sync",
+		description:
+			"Connect data sources like Notion, Drive and Gmail. Automatically sync to keep them updated.",
+		src: "/homepage/hero_tutorial/ConnectorFlowGif.mp4",
+		featured: true,
+	},
+	{
+		title: "Upload Documents",
+		description: "Upload documents directly, from images to massive PDFs.",
+		src: "/homepage/hero_tutorial/DocUploadGif.mp4",
+		featured: true,
+	},
+	{
+		title: "Search & Citation",
+		description:
+			"Ask questions and get cited responses from your knowledge base.",
+		src: "/homepage/hero_tutorial/BSNCGif.mp4",
+		featured: false,
+	},
+	{
+		title: "Document Q&A",
+		description: "Mention specific documents in chat for targeted answers.",
+		src: "/homepage/hero_tutorial/BQnaGif_compressed.mp4",
+		featured: false,
+	},
+	{
+		title: "Reports",
+		description: "Generate reports from your sources in many formats.",
+		src: "/homepage/hero_tutorial/ReportGenGif_compressed.mp4",
+		featured: false,
+	},
+	{
+		title: "Podcasts",
+		description: "Turn anything into a podcast in under 20 seconds.",
+		src: "/homepage/hero_tutorial/PodcastGenGif.mp4",
+		featured: false,
+	},
+	{
+		title: "Image Generation",
+		description:
+			"Generate high-quality images easily from your conversations.",
+		src: "/homepage/hero_tutorial/ImageGenGif.mp4",
+		featured: false,
+	},
+	{
+		title: "Collaborative Chat",
+		description:
+			"Collaborate on AI-powered conversations in realtime with your team.",
+		src: "/homepage/hero_realtime/RealTimeChatGif.mp4",
+		featured: false,
+	},
+	{
+		title: "Comments",
+		description: "Add comments and tag teammates on any message.",
+		src: "/homepage/hero_realtime/RealTimeCommentsFlow.mp4",
+		featured: false,
+	},
+	{
+		title: "Video Generation",
+		description:
+			"Create short videos with AI-generated visuals and narration from your sources.",
+		src: "/homepage/hero_tutorial/video_gen_surf.mp4",
+		featured: false,
+	},
+] as const;
 
 export function HeroSection() {
-	const containerRef = useRef<HTMLDivElement>(null);
-	const parentRef = useRef<HTMLDivElement>(null);
-	const isDesktop = useIsDesktop();
-
 	return (
-		<div
-			ref={parentRef}
-			className="relative flex min-h-screen flex-col items-center justify-center overflow-hidden px-4 py-24 md:px-8 md:py-48"
-		>
-			<BackgroundGrids />
-			{isDesktop && (
-				<>
-					<CollisionMechanism
-						parentRef={parentRef}
-						beamOptions={{
-							initialX: -400,
-							translateX: 600,
-							duration: 7,
-							repeatDelay: 3,
-						}}
-					/>
-					<CollisionMechanism
-						parentRef={parentRef}
-						beamOptions={{
-							initialX: -200,
-							translateX: 800,
-							duration: 4,
-							repeatDelay: 3,
-						}}
-					/>
-					<CollisionMechanism
-						parentRef={parentRef}
-						beamOptions={{
-							initialX: 200,
-							translateX: 1200,
-							duration: 5,
-							repeatDelay: 3,
-						}}
-					/>
-					<CollisionMechanism
-						parentRef={parentRef}
-						beamOptions={{
-							initialX: 400,
-							translateX: 1400,
-							duration: 6,
-							repeatDelay: 3,
-						}}
-					/>
-				</>
-			)}
+		<div className="mx-auto w-full max-w-7xl min-w-0 pt-36">
+			<div className="mt-4 flex w-full min-w-0 flex-col items-start px-2 md:px-8 xl:px-0">
+				<h1
+					className={cn(
+						"relative mt-4 max-w-7xl text-left text-4xl font-bold tracking-tight text-balance text-neutral-900 sm:text-5xl md:text-6xl xl:text-8xl dark:text-neutral-50",
+					)}
+				>
+					<Balancer>NotebookLM for Teams</Balancer>
+				</h1>
+				<div className="mt-4 flex w-full flex-col items-start justify-between gap-4 md:mt-12 md:flex-row md:items-end md:gap-10">
+					<div>
+						<h2
+							className={cn(
+								"relative mb-8 max-w-2xl text-left text-sm tracking-wide text-neutral-600 antialiased sm:text-base md:text-xl dark:text-neutral-400",
+							)}
+						>
+							An open source, privacy focused alternative to NotebookLM for teams with no data limits.
+						</h2>
 
-			<h2 className="relative z-50 mx-auto mb-4 mt-8 max-w-4xl text-balance text-center text-3xl font-semibold tracking-tight text-gray-700 md:text-7xl dark:text-neutral-300">
-				<div className="relative mx-auto inline-block w-max filter-[drop-shadow(0px_1px_3px_rgba(27,37,80,0.14))]">
-					<div className="text-black [text-shadow:0_0_rgba(0,0,0,0.1)] dark:text-white">
-						<Balancer>NotebookLM for Teams</Balancer>
+						<div className="relative mb-4 flex w-full flex-col justify-center gap-y-2 sm:flex-row sm:justify-start sm:space-y-0 sm:space-x-4">
+							<GetStartedButton />
+						</div>
 					</div>
+					<DownloadApp />
 				</div>
-			</h2>
-			<p className="relative z-50 mx-auto mt-4 max-w-lg px-6 text-center text-sm leading-relaxed text-gray-600 sm:text-base sm:leading-relaxed md:max-w-xl md:text-lg md:leading-relaxed dark:text-gray-200">
-				Connect any LLM to your internal knowledge sources and chat with it in real time alongside
-				your team.
-			</p>
-			<div className="mb-6 mt-6 flex w-full flex-col items-center justify-center gap-4 px-8 sm:flex-row md:mb-10">
-				<GetStartedButton />
-				{/* <ContactSalesButton /> */}
-			</div>
-			<div ref={containerRef} className="relative w-full z-51">
-				<HeroCarousel />
+				<BrowserWindow />
 			</div>
 		</div>
 	);
@@ -158,193 +156,155 @@ function GetStartedButton() {
 
 	if (isGoogleAuth) {
 		return (
-			<motion.button
+			<button
 				type="button"
 				onClick={handleGoogleLogin}
-				whileHover="hover"
-				whileTap={{ scale: 0.98 }}
-				initial="idle"
-				className="group relative z-20 flex h-11 w-full cursor-pointer items-center justify-center gap-3 overflow-hidden rounded-xl bg-white px-6 py-2.5 text-sm font-semibold text-neutral-700 shadow-lg ring-1 ring-neutral-200/50 transition-shadow duration-300 hover:shadow-xl sm:w-56 dark:bg-neutral-900 dark:text-neutral-200 dark:ring-neutral-700/50"
-				variants={{
-					idle: { scale: 1, y: 0 },
-					hover: { scale: 1.02, y: -2 },
-				}}
+				className="flex h-14 w-full cursor-pointer items-center justify-center gap-3 rounded-lg bg-white text-center text-base font-medium text-neutral-700 shadow-sm ring-1 shadow-black/10 ring-black/10 transition duration-150 active:scale-98 hover:bg-neutral-50 sm:w-56 dark:bg-neutral-900 dark:text-neutral-200 dark:ring-neutral-700/50 dark:hover:bg-neutral-800"
 			>
-				{/* Animated gradient background on hover */}
-				<motion.div
-					className="absolute inset-0 bg-linear-to-r from-blue-50 via-green-50 to-yellow-50 dark:from-blue-950/30 dark:via-green-950/30 dark:to-yellow-950/30"
-					variants={{
-						idle: { opacity: 0 },
-						hover: { opacity: 1 },
-					}}
-					transition={{ duration: 0.3 }}
-				/>
-				{/* Google logo with subtle animation */}
-				<motion.div
-					className="relative"
-					variants={{
-						idle: { rotate: 0 },
-						hover: { rotate: [0, -8, 8, 0] },
-					}}
-					transition={{ duration: 0.4, ease: "easeInOut" }}
-				>
-					<GoogleLogo className="h-5 w-5" />
-				</motion.div>
-				<span className="relative">Continue with Google</span>
-			</motion.button>
+				<GoogleLogo className="h-5 w-5" />
+				<span>Continue with Google</span>
+			</button>
 		);
 	}
 
 	return (
-		<motion.div whileHover={{ scale: 1.02, y: -2 }} whileTap={{ scale: 0.98 }}>
-			<Link
-				href="/login"
-				className="group relative z-20 flex h-11 w-full cursor-pointer items-center justify-center gap-2 rounded-xl bg-black px-6 py-2.5 text-sm font-semibold text-white shadow-lg transition-shadow duration-300 hover:shadow-xl sm:w-56 dark:bg-white dark:text-black"
-			>
-				Get Started
-			</Link>
-		</motion.div>
+		<Link
+			href="/login"
+			className="flex h-14 w-full items-center justify-center rounded-lg bg-black text-center text-base font-medium text-white shadow-sm ring-1 shadow-black/10 ring-black/10 transition duration-150 active:scale-98 sm:w-52 dark:bg-white dark:text-black"
+		>
+			Get Started
+		</Link>
 	);
 }
 
-const BackgroundGrids = () => {
-	return (
-		<div className="pointer-events-none absolute inset-0 z-0 grid h-screen w-full -rotate-45 transform select-none grid-cols-2 gap-10 md:grid-cols-4">
-			<div className="relative h-full w-full">
-				<GridLineVertical className="left-0" />
-				<GridLineVertical className="left-auto right-0" />
-			</div>
-			<div className="relative h-full w-full">
-				<GridLineVertical className="left-0" />
-				<GridLineVertical className="left-auto right-0" />
-			</div>
-			<div className="relative h-full w-full bg-linear-to-b from-transparent via-neutral-100 to-transparent dark:via-neutral-800">
-				<GridLineVertical className="left-0" />
-				<GridLineVertical className="left-auto right-0" />
-			</div>
-			<div className="relative h-full w-full">
-				<GridLineVertical className="left-0" />
-				<GridLineVertical className="left-auto right-0" />
-			</div>
-		</div>
-	);
-};
+const BrowserWindow = () => {
+	const [selectedIndex, setSelectedIndex] = useState(0);
+	const selectedItem = TAB_ITEMS[selectedIndex];
+	const intervalRef = useRef<NodeJS.Timeout | null>(null);
+	const { expanded, open, close } = useExpandedMedia();
 
-const CollisionMechanism = ({
-	parentRef,
-	beamOptions = {},
-}: {
-	parentRef: React.RefObject<HTMLDivElement | null>;
-	beamOptions?: {
-		initialX?: number;
-		translateX?: number;
-		initialY?: number;
-		translateY?: number;
-		rotate?: number;
-		className?: string;
-		duration?: number;
-		delay?: number;
-		repeatDelay?: number;
-	};
-}) => {
-	const beamRef = useRef<HTMLDivElement>(null);
-	const [collision, setCollision] = useState<{
-		detected: boolean;
-		coordinates: { x: number; y: number } | null;
-	}>({ detected: false, coordinates: null });
-	const [beamKey, setBeamKey] = useState(0);
-	const [cycleCollisionDetected, setCycleCollisionDetected] = useState(false);
+	const startInterval = useCallback(() => {
+		if (intervalRef.current) {
+			clearInterval(intervalRef.current);
+		}
+		intervalRef.current = setInterval(() => {
+			setSelectedIndex((prev) => (prev + 1) % TAB_ITEMS.length);
+		}, 10000);
+	}, []);
 
 	useEffect(() => {
-		const checkCollision = () => {
-			if (beamRef.current && parentRef.current && !cycleCollisionDetected) {
-				const beamRect = beamRef.current.getBoundingClientRect();
-				const parentRect = parentRef.current.getBoundingClientRect();
-				const rightEdge = parentRect.right;
-
-				if (beamRect.right >= rightEdge - 20) {
-					const relativeX = parentRect.width - 20;
-					const relativeY = beamRect.top - parentRect.top + beamRect.height / 2;
-
-					setCollision({
-						detected: true,
-						coordinates: { x: relativeX, y: relativeY },
-					});
-					setCycleCollisionDetected(true);
-					if (beamRef.current) {
-						beamRef.current.style.opacity = "0";
-					}
-				}
-			}
-		};
-
-		const animationInterval = setInterval(checkCollision, 100);
-
-		return () => clearInterval(animationInterval);
-	}, [cycleCollisionDetected, parentRef]);
-
-	useEffect(() => {
-		if (!collision.detected || !collision.coordinates) return;
-
-		const timer1 = setTimeout(() => {
-			setCollision({ detected: false, coordinates: null });
-			setCycleCollisionDetected(false);
-			if (beamRef.current) {
-				beamRef.current.style.opacity = "1";
-			}
-		}, 2000);
-
-		const timer2 = setTimeout(() => {
-			setBeamKey((prevKey) => prevKey + 1);
-		}, 2000);
-
+		startInterval();
 		return () => {
-			clearTimeout(timer1);
-			clearTimeout(timer2);
+			if (intervalRef.current) {
+				clearInterval(intervalRef.current);
+			}
 		};
-	}, [collision]);
+	}, [startInterval]);
+
+	const handleTabClick = (index: number) => {
+		setSelectedIndex(index);
+		startInterval();
+	};
 
 	return (
 		<>
-			<motion.div
-				key={beamKey}
-				ref={beamRef}
-				animate="animate"
-				initial={{
-					translateY: beamOptions.initialY || "-200px",
-					translateX: beamOptions.initialX || "0px",
-					rotate: beamOptions.rotate || -45,
-				}}
-				variants={{
-					animate: {
-						translateY: beamOptions.translateY || "800px",
-						translateX: beamOptions.translateX || "700px",
-						rotate: beamOptions.rotate || -45,
-					},
-				}}
-				transition={{
-					duration: beamOptions.duration || 8,
-					repeat: Infinity,
-					repeatType: "loop",
-					ease: "linear",
-					delay: beamOptions.delay || 0,
-					repeatDelay: beamOptions.repeatDelay || 0,
-				}}
-				className={cn(
-					"absolute left-96 top-20 m-auto h-14 w-px rounded-full bg-linear-to-t from-orange-500 via-yellow-500 to-transparent will-change-transform",
-					beamOptions.className
-				)}
-			/>
+			<motion.div className="relative my-4 flex w-full flex-col items-start justify-start overflow-hidden rounded-2xl shadow-2xl md:my-12">
+				<div className="flex w-full items-center justify-start overflow-hidden bg-gray-200 py-4 pl-4 dark:bg-neutral-800">
+					<div className="mr-6 flex items-center gap-2">
+						<div className="size-3 rounded-full bg-red-500" />
+						<div className="size-3 rounded-full bg-yellow-500" />
+						<div className="size-3 rounded-full bg-green-500" />
+					</div>
+					<div className="no-visible-scrollbar flex min-w-0 shrink flex-row items-center justify-start gap-2 overflow-x-auto mask-l-from-98% py-0.5 pr-2 pl-2 md:pl-4">
+						{TAB_ITEMS.map((item, index) => (
+							<React.Fragment key={item.title}>
+							<button
+								type="button"
+								onClick={() => handleTabClick(index)}
+								className={cn(
+									"flex shrink-0 items-center gap-1.5 rounded-md px-2 py-1 text-xs transition duration-150 hover:bg-white sm:text-sm dark:hover:bg-neutral-950",
+									selectedIndex === index && !item.featured &&
+										"bg-white shadow ring-1 shadow-black/10 ring-black/10 dark:bg-neutral-900",
+									selectedIndex === index && item.featured &&
+										"bg-amber-50 shadow ring-1 shadow-amber-200/50 ring-amber-400/60 dark:bg-amber-950/40 dark:shadow-amber-900/30 dark:ring-amber-500/50",
+									item.featured && selectedIndex !== index &&
+										"hover:bg-amber-50 dark:hover:bg-amber-950/30",
+								)}
+							>
+									{item.title}
+								{item.featured && (
+									<Tooltip>
+										<TooltipTrigger asChild>
+											<span className="inline-flex shrink-0 items-center justify-center rounded border border-amber-300 bg-amber-100 p-0.5 text-amber-700 dark:border-amber-700 dark:bg-amber-900/50 dark:text-amber-400">
+												<Monitor className="size-3" />
+											</span>
+										</TooltipTrigger>
+										<TooltipContent side="bottom">
+											Desktop app only
+										</TooltipContent>
+									</Tooltip>
+								)}
+							</button>
+								{index !== TAB_ITEMS.length - 1 && (
+									<div className="h-4 w-px shrink-0 rounded-full bg-neutral-300 dark:bg-neutral-700" />
+								)}
+							</React.Fragment>
+						))}
+					</div>
+				</div>
+				<div className="w-full overflow-hidden bg-gray-100/50 px-4 pt-4 perspective-distant dark:bg-neutral-950">
+					<AnimatePresence mode="wait">
+						<motion.div
+							initial={{
+								opacity: 0,
+								scale: 0.99,
+								filter: "blur(10px)",
+							}}
+							animate={{
+								opacity: 1,
+								scale: 1,
+								filter: "blur(0px)",
+							}}
+							exit={{
+								opacity: 0,
+								scale: 0.98,
+								filter: "blur(10px)",
+							}}
+							transition={{
+								duration: 0.3,
+								ease: "easeOut",
+							}}
+							key={selectedItem.title}
+							className="relative overflow-hidden rounded-tl-xl rounded-tr-xl bg-white shadow-sm ring-1 shadow-black/10 ring-black/10 will-change-transform dark:bg-neutral-950"
+						>
+							<div className="flex items-center gap-3 border-b border-neutral-200/60 px-4 py-3 sm:px-6 sm:py-4 dark:border-neutral-700/60">
+								<div className="min-w-0">
+									<h3 className="truncate text-base font-semibold text-neutral-900 sm:text-lg dark:text-white">
+										{selectedItem.title}
+									</h3>
+									<p className="text-sm text-neutral-500 dark:text-neutral-400">
+										{selectedItem.description}
+									</p>
+								</div>
+							</div>
+							{/* biome-ignore lint/a11y/useKeyWithClickEvents: wrapper for video expand */}
+							<div
+								className="cursor-pointer bg-neutral-50 p-2 sm:p-3 dark:bg-neutral-950"
+								onClick={open}
+							>
+								<TabVideo src={selectedItem.src} />
+							</div>
+						</motion.div>
+					</AnimatePresence>
+				</div>
+			</motion.div>
+
 			<AnimatePresence>
-				{collision.detected && collision.coordinates && (
-					<Explosion
-						key={`${collision.coordinates.x}-${collision.coordinates.y}`}
-						className=""
-						style={{
-							left: `${collision.coordinates.x + 20}px`,
-							top: `${collision.coordinates.y}px`,
-							transform: "translate(-50%, -50%)",
-						}}
+				{expanded && (
+					<ExpandedMediaOverlay
+						src={selectedItem.src}
+						alt={selectedItem.title}
+						onClose={close}
 					/>
 				)}
 			</AnimatePresence>
@@ -352,62 +312,92 @@ const CollisionMechanism = ({
 	);
 };
 
-const Explosion = ({ ...props }: React.HTMLProps<HTMLDivElement>) => {
-	const spans = Array.from({ length: 20 }, (_, index) => ({
-		id: index,
-		initialX: 0,
-		initialY: 0,
-		directionX: Math.floor(Math.random() * 80 - 40),
-		directionY: Math.floor(Math.random() * -50 - 10),
-	}));
+const TabVideo = memo(function TabVideo({ src }: { src: string }) {
+	const videoRef = useRef<HTMLVideoElement>(null);
+	const [hasLoaded, setHasLoaded] = useState(false);
+
+	useEffect(() => {
+		setHasLoaded(false);
+		const video = videoRef.current;
+		if (!video) return;
+		video.currentTime = 0;
+		video.play().catch(() => { });
+	}, [src]);
+
+	const handleCanPlay = useCallback(() => {
+		setHasLoaded(true);
+	}, []);
 
 	return (
-		<div {...props} className={cn("absolute z-50 h-2 w-2", props.className)}>
-			<motion.div
-				initial={{ opacity: 0 }}
-				animate={{ opacity: [0, 1, 0] }}
-				exit={{ opacity: 0 }}
-				transition={{ duration: 1, ease: "easeOut" }}
-				className="absolute -inset-x-10 top-0 m-auto h-[4px] w-10 rounded-full bg-linear-to-r from-transparent via-orange-500 to-transparent blur-sm"
-			></motion.div>
-			{spans.map((span) => (
-				<motion.span
-					key={span.id}
-					initial={{ x: span.initialX, y: span.initialY, opacity: 1 }}
-					animate={{ x: span.directionX, y: span.directionY, opacity: 0 }}
-					transition={{ duration: Math.random() * 1.5 + 0.5, ease: "easeOut" }}
-					className="absolute h-1 w-1 rounded-full bg-linear-to-b from-orange-500 to-yellow-500"
-				/>
-			))}
+		<div className="relative">
+			<video
+				ref={videoRef}
+				key={src}
+				src={src}
+				preload="none"
+				loop
+				muted
+				playsInline
+				onCanPlay={handleCanPlay}
+				className="aspect-video w-full rounded-lg sm:rounded-xl"
+			/>
+			{!hasLoaded && (
+				<div className="absolute inset-0 aspect-video w-full animate-pulse rounded-lg bg-neutral-100 sm:rounded-xl dark:bg-neutral-800" />
+			)}
 		</div>
 	);
-};
+});
 
-const GridLineVertical = ({ className, offset }: { className?: string; offset?: string }) => {
+const GITHUB_RELEASES_URL =
+	"https://github.com/MODSetter/SurfSense/releases/latest";
+
+const DownloadApp = memo(function DownloadApp() {
 	return (
-		<div
-			style={
-				{
-					"--background": "#ffffff",
-					"--color": "rgba(0, 0, 0, 0.2)",
-					"--height": "5px",
-					"--width": "1px",
-					"--fade-stop": "90%",
-					"--offset": offset || "150px", //-100px if you want to keep the line inside
-					"--color-dark": "rgba(255, 255, 255, 0.3)",
-					maskComposite: "exclude",
-				} as React.CSSProperties
-			}
-			className={cn(
-				"absolute top-[calc(var(--offset)/2*-1)] h-[calc(100%+var(--offset))] w-(--width)",
-				"bg-[linear-gradient(to_bottom,var(--color),var(--color)_50%,transparent_0,transparent)]",
-				"bg-size-[var(--width)_var(--height)]",
-				"[mask:linear-gradient(to_top,var(--background)_var(--fade-stop),transparent),linear-gradient(to_bottom,var(--background)_var(--fade-stop),transparent),linear-gradient(black,black)]",
-				"mask-exclude",
-				"z-30",
-				"dark:bg-[linear-gradient(to_bottom,var(--color-dark),var(--color-dark)_50%,transparent_0,transparent)]",
-				className
-			)}
-		></div>
+		<div className="flex flex-col items-start justify-start">
+			<p className="mb-4 text-left text-sm text-neutral-500 lg:text-lg dark:text-neutral-400">
+				Download the desktop app
+			</p>
+			<div className="mb-2 flex flex-row flex-wrap items-center gap-3">
+				<a
+					href={GITHUB_RELEASES_URL}
+					target="_blank"
+					rel="noopener noreferrer"
+					className="flex items-center gap-2 rounded-lg border border-neutral-200 bg-white px-4 py-2.5 text-sm font-medium text-neutral-700 shadow-sm transition hover:bg-neutral-50 dark:border-neutral-700 dark:bg-neutral-900 dark:text-neutral-200 dark:hover:bg-neutral-800"
+				>
+					<svg className="size-4" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2" strokeLinecap="round" strokeLinejoin="round">
+						<path d="M12 17V3" />
+						<path d="m6 11 6 6 6-6" />
+						<path d="M19 21H5" />
+					</svg>
+					macOS
+				</a>
+				<a
+					href={GITHUB_RELEASES_URL}
+					target="_blank"
+					rel="noopener noreferrer"
+					className="flex items-center gap-2 rounded-lg border border-neutral-200 bg-white px-4 py-2.5 text-sm font-medium text-neutral-700 shadow-sm transition hover:bg-neutral-50 dark:border-neutral-700 dark:bg-neutral-900 dark:text-neutral-200 dark:hover:bg-neutral-800"
+				>
+					<svg className="size-4" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2" strokeLinecap="round" strokeLinejoin="round">
+						<path d="M12 17V3" />
+						<path d="m6 11 6 6 6-6" />
+						<path d="M19 21H5" />
+					</svg>
+					Windows
+				</a>
+				<a
+					href={GITHUB_RELEASES_URL}
+					target="_blank"
+					rel="noopener noreferrer"
+					className="flex items-center gap-2 rounded-lg border border-neutral-200 bg-white px-4 py-2.5 text-sm font-medium text-neutral-700 shadow-sm transition hover:bg-neutral-50 dark:border-neutral-700 dark:bg-neutral-900 dark:text-neutral-200 dark:hover:bg-neutral-800"
+				>
+					<svg className="size-4" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2" strokeLinecap="round" strokeLinejoin="round">
+						<path d="M12 17V3" />
+						<path d="m6 11 6 6 6-6" />
+						<path d="M19 21H5" />
+					</svg>
+					Linux
+				</a>
+			</div>
+		</div>
 	);
-};
+});

From 323886b48135ec36888862d4183e5da8eb69966f Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Mon, 6 Apr 2026 21:39:14 -0700
Subject: [PATCH 157/202] security : CVE-2026-35030 fix

---
 surfsense_backend/pyproject.toml |   4 +-
 surfsense_backend/uv.lock        | 180 +++++++++++++++----------------
 2 files changed, 92 insertions(+), 92 deletions(-)

diff --git a/surfsense_backend/pyproject.toml b/surfsense_backend/pyproject.toml
index 8e3f48b11..893aa77f9 100644
--- a/surfsense_backend/pyproject.toml
+++ b/surfsense_backend/pyproject.toml
@@ -46,8 +46,6 @@ dependencies = [
     "redis>=5.2.1",
     "firecrawl-py>=4.9.0",
     "boto3>=1.35.0",
-    "litellm>=1.80.10",
-    "langchain-litellm>=0.3.5",
     "fake-useragent>=2.2.0",
     "trafilatura>=2.0.0",
     "fastapi-users[oauth,sqlalchemy]>=15.0.3",
@@ -75,6 +73,8 @@ dependencies = [
     "langchain-community>=0.4.1",
     "deepagents>=0.4.12",
     "stripe>=15.0.0",
+    "litellm>=1.83.0",
+    "langchain-litellm>=0.6.4",
 ]
 
 [dependency-groups]
diff --git a/surfsense_backend/uv.lock b/surfsense_backend/uv.lock
index 8de78705d..c35bbf7d7 100644
--- a/surfsense_backend/uv.lock
+++ b/surfsense_backend/uv.lock
@@ -62,7 +62,7 @@ wheels = [
 
 [[package]]
 name = "aiohttp"
-version = "3.13.3"
+version = "3.13.5"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "aiohappyeyeballs" },
@@ -73,76 +73,76 @@ dependencies = [
     { name = "propcache" },
     { name = "yarl" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/50/42/32cf8e7704ceb4481406eb87161349abb46a57fee3f008ba9cb610968646/aiohttp-3.13.3.tar.gz", hash = "sha256:a949eee43d3782f2daae4f4a2819b2cb9b0c5d3b7f7a927067cc84dafdbb9f88", size = 7844556 }
+sdist = { url = "https://files.pythonhosted.org/packages/77/9a/152096d4808df8e4268befa55fba462f440f14beab85e8ad9bf990516918/aiohttp-3.13.5.tar.gz", hash = "sha256:9d98cc980ecc96be6eb4c1994ce35d28d8b1f5e5208a23b421187d1209dbb7d1", size = 7858271 }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/a0/be/4fc11f202955a69e0db803a12a062b8379c970c7c84f4882b6da17337cc1/aiohttp-3.13.3-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:b903a4dfee7d347e2d87697d0713be59e0b87925be030c9178c5faa58ea58d5c", size = 739732 },
-    { url = "https://files.pythonhosted.org/packages/97/2c/621d5b851f94fa0bb7430d6089b3aa970a9d9b75196bc93bb624b0db237a/aiohttp-3.13.3-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:a45530014d7a1e09f4a55f4f43097ba0fd155089372e105e4bff4ca76cb1b168", size = 494293 },
-    { url = "https://files.pythonhosted.org/packages/5d/43/4be01406b78e1be8320bb8316dc9c42dbab553d281c40364e0f862d5661c/aiohttp-3.13.3-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:27234ef6d85c914f9efeb77ff616dbf4ad2380be0cda40b4db086ffc7ddd1b7d", size = 493533 },
-    { url = "https://files.pythonhosted.org/packages/8d/a8/5a35dc56a06a2c90d4742cbf35294396907027f80eea696637945a106f25/aiohttp-3.13.3-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:d32764c6c9aafb7fb55366a224756387cd50bfa720f32b88e0e6fa45b27dcf29", size = 1737839 },
-    { url = "https://files.pythonhosted.org/packages/bf/62/4b9eeb331da56530bf2e198a297e5303e1c1ebdceeb00fe9b568a65c5a0c/aiohttp-3.13.3-cp312-cp312-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:b1a6102b4d3ebc07dad44fbf07b45bb600300f15b552ddf1851b5390202ea2e3", size = 1703932 },
-    { url = "https://files.pythonhosted.org/packages/7c/f6/af16887b5d419e6a367095994c0b1332d154f647e7dc2bd50e61876e8e3d/aiohttp-3.13.3-cp312-cp312-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:c014c7ea7fb775dd015b2d3137378b7be0249a448a1612268b5a90c2d81de04d", size = 1771906 },
-    { url = "https://files.pythonhosted.org/packages/ce/83/397c634b1bcc24292fa1e0c7822800f9f6569e32934bdeef09dae7992dfb/aiohttp-3.13.3-cp312-cp312-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:2b8d8ddba8f95ba17582226f80e2de99c7a7948e66490ef8d947e272a93e9463", size = 1871020 },
-    { url = "https://files.pythonhosted.org/packages/86/f6/a62cbbf13f0ac80a70f71b1672feba90fdb21fd7abd8dbf25c0105fb6fa3/aiohttp-3.13.3-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:9ae8dd55c8e6c4257eae3a20fd2c8f41edaea5992ed67156642493b8daf3cecc", size = 1755181 },
-    { url = "https://files.pythonhosted.org/packages/0a/87/20a35ad487efdd3fba93d5843efdfaa62d2f1479eaafa7453398a44faf13/aiohttp-3.13.3-cp312-cp312-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:01ad2529d4b5035578f5081606a465f3b814c542882804e2e8cda61adf5c71bf", size = 1561794 },
-    { url = "https://files.pythonhosted.org/packages/de/95/8fd69a66682012f6716e1bc09ef8a1a2a91922c5725cb904689f112309c4/aiohttp-3.13.3-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:bb4f7475e359992b580559e008c598091c45b5088f28614e855e42d39c2f1033", size = 1697900 },
-    { url = "https://files.pythonhosted.org/packages/e5/66/7b94b3b5ba70e955ff597672dad1691333080e37f50280178967aff68657/aiohttp-3.13.3-cp312-cp312-musllinux_1_2_armv7l.whl", hash = "sha256:c19b90316ad3b24c69cd78d5c9b4f3aa4497643685901185b65166293d36a00f", size = 1728239 },
-    { url = "https://files.pythonhosted.org/packages/47/71/6f72f77f9f7d74719692ab65a2a0252584bf8d5f301e2ecb4c0da734530a/aiohttp-3.13.3-cp312-cp312-musllinux_1_2_ppc64le.whl", hash = "sha256:96d604498a7c782cb15a51c406acaea70d8c027ee6b90c569baa6e7b93073679", size = 1740527 },
-    { url = "https://files.pythonhosted.org/packages/fa/b4/75ec16cbbd5c01bdaf4a05b19e103e78d7ce1ef7c80867eb0ace42ff4488/aiohttp-3.13.3-cp312-cp312-musllinux_1_2_riscv64.whl", hash = "sha256:084911a532763e9d3dd95adf78a78f4096cd5f58cdc18e6fdbc1b58417a45423", size = 1554489 },
-    { url = "https://files.pythonhosted.org/packages/52/8f/bc518c0eea29f8406dcf7ed1f96c9b48e3bc3995a96159b3fc11f9e08321/aiohttp-3.13.3-cp312-cp312-musllinux_1_2_s390x.whl", hash = "sha256:7a4a94eb787e606d0a09404b9c38c113d3b099d508021faa615d70a0131907ce", size = 1767852 },
-    { url = "https://files.pythonhosted.org/packages/9d/f2/a07a75173124f31f11ea6f863dc44e6f09afe2bca45dd4e64979490deab1/aiohttp-3.13.3-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:87797e645d9d8e222e04160ee32aa06bc5c163e8499f24db719e7852ec23093a", size = 1722379 },
-    { url = "https://files.pythonhosted.org/packages/3c/4a/1a3fee7c21350cac78e5c5cef711bac1b94feca07399f3d406972e2d8fcd/aiohttp-3.13.3-cp312-cp312-win32.whl", hash = "sha256:b04be762396457bef43f3597c991e192ee7da460a4953d7e647ee4b1c28e7046", size = 428253 },
-    { url = "https://files.pythonhosted.org/packages/d9/b7/76175c7cb4eb73d91ad63c34e29fc4f77c9386bba4a65b53ba8e05ee3c39/aiohttp-3.13.3-cp312-cp312-win_amd64.whl", hash = "sha256:e3531d63d3bdfa7e3ac5e9b27b2dd7ec9df3206a98e0b3445fa906f233264c57", size = 455407 },
-    { url = "https://files.pythonhosted.org/packages/97/8a/12ca489246ca1faaf5432844adbfce7ff2cc4997733e0af120869345643a/aiohttp-3.13.3-cp313-cp313-macosx_10_13_universal2.whl", hash = "sha256:5dff64413671b0d3e7d5918ea490bdccb97a4ad29b3f311ed423200b2203e01c", size = 734190 },
-    { url = "https://files.pythonhosted.org/packages/32/08/de43984c74ed1fca5c014808963cc83cb00d7bb06af228f132d33862ca76/aiohttp-3.13.3-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:87b9aab6d6ed88235aa2970294f496ff1a1f9adcd724d800e9b952395a80ffd9", size = 491783 },
-    { url = "https://files.pythonhosted.org/packages/17/f8/8dd2cf6112a5a76f81f81a5130c57ca829d101ad583ce57f889179accdda/aiohttp-3.13.3-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:425c126c0dc43861e22cb1c14ba4c8e45d09516d0a3ae0a3f7494b79f5f233a3", size = 490704 },
-    { url = "https://files.pythonhosted.org/packages/6d/40/a46b03ca03936f832bc7eaa47cfbb1ad012ba1be4790122ee4f4f8cba074/aiohttp-3.13.3-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:7f9120f7093c2a32d9647abcaf21e6ad275b4fbec5b55969f978b1a97c7c86bf", size = 1720652 },
-    { url = "https://files.pythonhosted.org/packages/f7/7e/917fe18e3607af92657e4285498f500dca797ff8c918bd7d90b05abf6c2a/aiohttp-3.13.3-cp313-cp313-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:697753042d57f4bf7122cab985bf15d0cef23c770864580f5af4f52023a56bd6", size = 1692014 },
-    { url = "https://files.pythonhosted.org/packages/71/b6/cefa4cbc00d315d68973b671cf105b21a609c12b82d52e5d0c9ae61d2a09/aiohttp-3.13.3-cp313-cp313-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:6de499a1a44e7de70735d0b39f67c8f25eb3d91eb3103be99ca0fa882cdd987d", size = 1759777 },
-    { url = "https://files.pythonhosted.org/packages/fb/e3/e06ee07b45e59e6d81498b591fc589629be1553abb2a82ce33efe2a7b068/aiohttp-3.13.3-cp313-cp313-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:37239e9f9a7ea9ac5bf6b92b0260b01f8a22281996da609206a84df860bc1261", size = 1861276 },
-    { url = "https://files.pythonhosted.org/packages/7c/24/75d274228acf35ceeb2850b8ce04de9dd7355ff7a0b49d607ee60c29c518/aiohttp-3.13.3-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:f76c1e3fe7d7c8afad7ed193f89a292e1999608170dcc9751a7462a87dfd5bc0", size = 1743131 },
-    { url = "https://files.pythonhosted.org/packages/04/98/3d21dde21889b17ca2eea54fdcff21b27b93f45b7bb94ca029c31ab59dc3/aiohttp-3.13.3-cp313-cp313-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:fc290605db2a917f6e81b0e1e0796469871f5af381ce15c604a3c5c7e51cb730", size = 1556863 },
-    { url = "https://files.pythonhosted.org/packages/9e/84/da0c3ab1192eaf64782b03971ab4055b475d0db07b17eff925e8c93b3aa5/aiohttp-3.13.3-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:4021b51936308aeea0367b8f006dc999ca02bc118a0cc78c303f50a2ff6afb91", size = 1682793 },
-    { url = "https://files.pythonhosted.org/packages/ff/0f/5802ada182f575afa02cbd0ec5180d7e13a402afb7c2c03a9aa5e5d49060/aiohttp-3.13.3-cp313-cp313-musllinux_1_2_armv7l.whl", hash = "sha256:49a03727c1bba9a97d3e93c9f93ca03a57300f484b6e935463099841261195d3", size = 1716676 },
-    { url = "https://files.pythonhosted.org/packages/3f/8c/714d53bd8b5a4560667f7bbbb06b20c2382f9c7847d198370ec6526af39c/aiohttp-3.13.3-cp313-cp313-musllinux_1_2_ppc64le.whl", hash = "sha256:3d9908a48eb7416dc1f4524e69f1d32e5d90e3981e4e37eb0aa1cd18f9cfa2a4", size = 1733217 },
-    { url = "https://files.pythonhosted.org/packages/7d/79/e2176f46d2e963facea939f5be2d26368ce543622be6f00a12844d3c991f/aiohttp-3.13.3-cp313-cp313-musllinux_1_2_riscv64.whl", hash = "sha256:2712039939ec963c237286113c68dbad80a82a4281543f3abf766d9d73228998", size = 1552303 },
-    { url = "https://files.pythonhosted.org/packages/ab/6a/28ed4dea1759916090587d1fe57087b03e6c784a642b85ef48217b0277ae/aiohttp-3.13.3-cp313-cp313-musllinux_1_2_s390x.whl", hash = "sha256:7bfdc049127717581866fa4708791220970ce291c23e28ccf3922c700740fdc0", size = 1763673 },
-    { url = "https://files.pythonhosted.org/packages/e8/35/4a3daeb8b9fab49240d21c04d50732313295e4bd813a465d840236dd0ce1/aiohttp-3.13.3-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:8057c98e0c8472d8846b9c79f56766bcc57e3e8ac7bfd510482332366c56c591", size = 1721120 },
-    { url = "https://files.pythonhosted.org/packages/bc/9f/d643bb3c5fb99547323e635e251c609fbbc660d983144cfebec529e09264/aiohttp-3.13.3-cp313-cp313-win32.whl", hash = "sha256:1449ceddcdbcf2e0446957863af03ebaaa03f94c090f945411b61269e2cb5daf", size = 427383 },
-    { url = "https://files.pythonhosted.org/packages/4e/f1/ab0395f8a79933577cdd996dd2f9aa6014af9535f65dddcf88204682fe62/aiohttp-3.13.3-cp313-cp313-win_amd64.whl", hash = "sha256:693781c45a4033d31d4187d2436f5ac701e7bbfe5df40d917736108c1cc7436e", size = 453899 },
-    { url = "https://files.pythonhosted.org/packages/99/36/5b6514a9f5d66f4e2597e40dea2e3db271e023eb7a5d22defe96ba560996/aiohttp-3.13.3-cp314-cp314-macosx_10_13_universal2.whl", hash = "sha256:ea37047c6b367fd4bd632bff8077449b8fa034b69e812a18e0132a00fae6e808", size = 737238 },
-    { url = "https://files.pythonhosted.org/packages/f7/49/459327f0d5bcd8c6c9ca69e60fdeebc3622861e696490d8674a6d0cb90a6/aiohttp-3.13.3-cp314-cp314-macosx_10_13_x86_64.whl", hash = "sha256:6fc0e2337d1a4c3e6acafda6a78a39d4c14caea625124817420abceed36e2415", size = 492292 },
-    { url = "https://files.pythonhosted.org/packages/e8/0b/b97660c5fd05d3495b4eb27f2d0ef18dc1dc4eff7511a9bf371397ff0264/aiohttp-3.13.3-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:c685f2d80bb67ca8c3837823ad76196b3694b0159d232206d1e461d3d434666f", size = 493021 },
-    { url = "https://files.pythonhosted.org/packages/54/d4/438efabdf74e30aeceb890c3290bbaa449780583b1270b00661126b8aae4/aiohttp-3.13.3-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:48e377758516d262bde50c2584fc6c578af272559c409eecbdd2bae1601184d6", size = 1717263 },
-    { url = "https://files.pythonhosted.org/packages/71/f2/7bddc7fd612367d1459c5bcf598a9e8f7092d6580d98de0e057eb42697ad/aiohttp-3.13.3-cp314-cp314-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:34749271508078b261c4abb1767d42b8d0c0cc9449c73a4df494777dc55f0687", size = 1669107 },
-    { url = "https://files.pythonhosted.org/packages/00/5a/1aeaecca40e22560f97610a329e0e5efef5e0b5afdf9f857f0d93839ab2e/aiohttp-3.13.3-cp314-cp314-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:82611aeec80eb144416956ec85b6ca45a64d76429c1ed46ae1b5f86c6e0c9a26", size = 1760196 },
-    { url = "https://files.pythonhosted.org/packages/f8/f8/0ff6992bea7bd560fc510ea1c815f87eedd745fe035589c71ce05612a19a/aiohttp-3.13.3-cp314-cp314-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:2fff83cfc93f18f215896e3a190e8e5cb413ce01553901aca925176e7568963a", size = 1843591 },
-    { url = "https://files.pythonhosted.org/packages/e3/d1/e30e537a15f53485b61f5be525f2157da719819e8377298502aebac45536/aiohttp-3.13.3-cp314-cp314-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:bbe7d4cecacb439e2e2a8a1a7b935c25b812af7a5fd26503a66dadf428e79ec1", size = 1720277 },
-    { url = "https://files.pythonhosted.org/packages/84/45/23f4c451d8192f553d38d838831ebbc156907ea6e05557f39563101b7717/aiohttp-3.13.3-cp314-cp314-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:b928f30fe49574253644b1ca44b1b8adbd903aa0da4b9054a6c20fc7f4092a25", size = 1548575 },
-    { url = "https://files.pythonhosted.org/packages/6a/ed/0a42b127a43712eda7807e7892c083eadfaf8429ca8fb619662a530a3aab/aiohttp-3.13.3-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:7b5e8fe4de30df199155baaf64f2fcd604f4c678ed20910db8e2c66dc4b11603", size = 1679455 },
-    { url = "https://files.pythonhosted.org/packages/2e/b5/c05f0c2b4b4fe2c9d55e73b6d3ed4fd6c9dc2684b1d81cbdf77e7fad9adb/aiohttp-3.13.3-cp314-cp314-musllinux_1_2_armv7l.whl", hash = "sha256:8542f41a62bcc58fc7f11cf7c90e0ec324ce44950003feb70640fc2a9092c32a", size = 1687417 },
-    { url = "https://files.pythonhosted.org/packages/c9/6b/915bc5dad66aef602b9e459b5a973529304d4e89ca86999d9d75d80cbd0b/aiohttp-3.13.3-cp314-cp314-musllinux_1_2_ppc64le.whl", hash = "sha256:5e1d8c8b8f1d91cd08d8f4a3c2b067bfca6ec043d3ff36de0f3a715feeedf926", size = 1729968 },
-    { url = "https://files.pythonhosted.org/packages/11/3b/e84581290a9520024a08640b63d07673057aec5ca548177a82026187ba73/aiohttp-3.13.3-cp314-cp314-musllinux_1_2_riscv64.whl", hash = "sha256:90455115e5da1c3c51ab619ac57f877da8fd6d73c05aacd125c5ae9819582aba", size = 1545690 },
-    { url = "https://files.pythonhosted.org/packages/f5/04/0c3655a566c43fd647c81b895dfe361b9f9ad6d58c19309d45cff52d6c3b/aiohttp-3.13.3-cp314-cp314-musllinux_1_2_s390x.whl", hash = "sha256:042e9e0bcb5fba81886c8b4fbb9a09d6b8a00245fd8d88e4d989c1f96c74164c", size = 1746390 },
-    { url = "https://files.pythonhosted.org/packages/1f/53/71165b26978f719c3419381514c9690bd5980e764a09440a10bb816ea4ab/aiohttp-3.13.3-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:2eb752b102b12a76ca02dff751a801f028b4ffbbc478840b473597fc91a9ed43", size = 1702188 },
-    { url = "https://files.pythonhosted.org/packages/29/a7/cbe6c9e8e136314fa1980da388a59d2f35f35395948a08b6747baebb6aa6/aiohttp-3.13.3-cp314-cp314-win32.whl", hash = "sha256:b556c85915d8efaed322bf1bdae9486aa0f3f764195a0fb6ee962e5c71ef5ce1", size = 433126 },
-    { url = "https://files.pythonhosted.org/packages/de/56/982704adea7d3b16614fc5936014e9af85c0e34b58f9046655817f04306e/aiohttp-3.13.3-cp314-cp314-win_amd64.whl", hash = "sha256:9bf9f7a65e7aa20dd764151fb3d616c81088f91f8df39c3893a536e279b4b984", size = 459128 },
-    { url = "https://files.pythonhosted.org/packages/6c/2a/3c79b638a9c3d4658d345339d22070241ea341ed4e07b5ac60fb0f418003/aiohttp-3.13.3-cp314-cp314t-macosx_10_13_universal2.whl", hash = "sha256:05861afbbec40650d8a07ea324367cb93e9e8cc7762e04dd4405df99fa65159c", size = 769512 },
-    { url = "https://files.pythonhosted.org/packages/29/b9/3e5014d46c0ab0db8707e0ac2711ed28c4da0218c358a4e7c17bae0d8722/aiohttp-3.13.3-cp314-cp314t-macosx_10_13_x86_64.whl", hash = "sha256:2fc82186fadc4a8316768d61f3722c230e2c1dcab4200d52d2ebdf2482e47592", size = 506444 },
-    { url = "https://files.pythonhosted.org/packages/90/03/c1d4ef9a054e151cd7839cdc497f2638f00b93cbe8043983986630d7a80c/aiohttp-3.13.3-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:0add0900ff220d1d5c5ebbf99ed88b0c1bbf87aa7e4262300ed1376a6b13414f", size = 510798 },
-    { url = "https://files.pythonhosted.org/packages/ea/76/8c1e5abbfe8e127c893fe7ead569148a4d5a799f7cf958d8c09f3eedf097/aiohttp-3.13.3-cp314-cp314t-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:568f416a4072fbfae453dcf9a99194bbb8bdeab718e08ee13dfa2ba0e4bebf29", size = 1868835 },
-    { url = "https://files.pythonhosted.org/packages/8e/ac/984c5a6f74c363b01ff97adc96a3976d9c98940b8969a1881575b279ac5d/aiohttp-3.13.3-cp314-cp314t-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:add1da70de90a2569c5e15249ff76a631ccacfe198375eead4aadf3b8dc849dc", size = 1720486 },
-    { url = "https://files.pythonhosted.org/packages/b2/9a/b7039c5f099c4eb632138728828b33428585031a1e658d693d41d07d89d1/aiohttp-3.13.3-cp314-cp314t-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:10b47b7ba335d2e9b1239fa571131a87e2d8ec96b333e68b2a305e7a98b0bae2", size = 1847951 },
-    { url = "https://files.pythonhosted.org/packages/3c/02/3bec2b9a1ba3c19ff89a43a19324202b8eb187ca1e928d8bdac9bbdddebd/aiohttp-3.13.3-cp314-cp314t-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:3dd4dce1c718e38081c8f35f323209d4c1df7d4db4bab1b5c88a6b4d12b74587", size = 1941001 },
-    { url = "https://files.pythonhosted.org/packages/37/df/d879401cedeef27ac4717f6426c8c36c3091c6e9f08a9178cc87549c537f/aiohttp-3.13.3-cp314-cp314t-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:34bac00a67a812570d4a460447e1e9e06fae622946955f939051e7cc895cfab8", size = 1797246 },
-    { url = "https://files.pythonhosted.org/packages/8d/15/be122de1f67e6953add23335c8ece6d314ab67c8bebb3f181063010795a7/aiohttp-3.13.3-cp314-cp314t-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:a19884d2ee70b06d9204b2727a7b9f983d0c684c650254679e716b0b77920632", size = 1627131 },
-    { url = "https://files.pythonhosted.org/packages/12/12/70eedcac9134cfa3219ab7af31ea56bc877395b1ac30d65b1bc4b27d0438/aiohttp-3.13.3-cp314-cp314t-musllinux_1_2_aarch64.whl", hash = "sha256:5f8ca7f2bb6ba8348a3614c7918cc4bb73268c5ac2a207576b7afea19d3d9f64", size = 1795196 },
-    { url = "https://files.pythonhosted.org/packages/32/11/b30e1b1cd1f3054af86ebe60df96989c6a414dd87e27ad16950eee420bea/aiohttp-3.13.3-cp314-cp314t-musllinux_1_2_armv7l.whl", hash = "sha256:b0d95340658b9d2f11d9697f59b3814a9d3bb4b7a7c20b131df4bcef464037c0", size = 1782841 },
-    { url = "https://files.pythonhosted.org/packages/88/0d/d98a9367b38912384a17e287850f5695c528cff0f14f791ce8ee2e4f7796/aiohttp-3.13.3-cp314-cp314t-musllinux_1_2_ppc64le.whl", hash = "sha256:a1e53262fd202e4b40b70c3aff944a8155059beedc8a89bba9dc1f9ef06a1b56", size = 1795193 },
-    { url = "https://files.pythonhosted.org/packages/43/a5/a2dfd1f5ff5581632c7f6a30e1744deda03808974f94f6534241ef60c751/aiohttp-3.13.3-cp314-cp314t-musllinux_1_2_riscv64.whl", hash = "sha256:d60ac9663f44168038586cab2157e122e46bdef09e9368b37f2d82d354c23f72", size = 1621979 },
-    { url = "https://files.pythonhosted.org/packages/fa/f0/12973c382ae7c1cccbc4417e129c5bf54c374dfb85af70893646e1f0e749/aiohttp-3.13.3-cp314-cp314t-musllinux_1_2_s390x.whl", hash = "sha256:90751b8eed69435bac9ff4e3d2f6b3af1f57e37ecb0fbeee59c0174c9e2d41df", size = 1822193 },
-    { url = "https://files.pythonhosted.org/packages/3c/5f/24155e30ba7f8c96918af1350eb0663e2430aad9e001c0489d89cd708ab1/aiohttp-3.13.3-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:fc353029f176fd2b3ec6cfc71be166aba1936fe5d73dd1992ce289ca6647a9aa", size = 1769801 },
-    { url = "https://files.pythonhosted.org/packages/eb/f8/7314031ff5c10e6ece114da79b338ec17eeff3a079e53151f7e9f43c4723/aiohttp-3.13.3-cp314-cp314t-win32.whl", hash = "sha256:2e41b18a58da1e474a057b3d35248d8320029f61d70a37629535b16a0c8f3767", size = 466523 },
-    { url = "https://files.pythonhosted.org/packages/b4/63/278a98c715ae467624eafe375542d8ba9b4383a016df8fdefe0ae28382a7/aiohttp-3.13.3-cp314-cp314t-win_amd64.whl", hash = "sha256:44531a36aa2264a1860089ffd4dce7baf875ee5a6079d5fb42e261c704ef7344", size = 499694 },
+    { url = "https://files.pythonhosted.org/packages/be/6f/353954c29e7dcce7cf00280a02c75f30e133c00793c7a2ed3776d7b2f426/aiohttp-3.13.5-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:023ecba036ddd840b0b19bf195bfae970083fd7024ce1ac22e9bba90464620e9", size = 748876 },
+    { url = "https://files.pythonhosted.org/packages/f5/1b/428a7c64687b3b2e9cd293186695affc0e1e54a445d0361743b231f11066/aiohttp-3.13.5-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:15c933ad7920b7d9a20de151efcd05a6e38302cbf0e10c9b2acb9a42210a2416", size = 499557 },
+    { url = "https://files.pythonhosted.org/packages/29/47/7be41556bfbb6917069d6a6634bb7dd5e163ba445b783a90d40f5ac7e3a7/aiohttp-3.13.5-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:ab2899f9fa2f9f741896ebb6fa07c4c883bfa5c7f2ddd8cf2aafa86fa981b2d2", size = 500258 },
+    { url = "https://files.pythonhosted.org/packages/67/84/c9ecc5828cb0b3695856c07c0a6817a99d51e2473400f705275a2b3d9239/aiohttp-3.13.5-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:a60eaa2d440cd4707696b52e40ed3e2b0f73f65be07fd0ef23b6b539c9c0b0b4", size = 1749199 },
+    { url = "https://files.pythonhosted.org/packages/f0/d3/3c6d610e66b495657622edb6ae7c7fd31b2e9086b4ec50b47897ad6042a9/aiohttp-3.13.5-cp312-cp312-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:55b3bdd3292283295774ab585160c4004f4f2f203946997f49aac032c84649e9", size = 1721013 },
+    { url = "https://files.pythonhosted.org/packages/49/a0/24409c12217456df0bae7babe3b014e460b0b38a8e60753d6cb339f6556d/aiohttp-3.13.5-cp312-cp312-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:c2b2355dc094e5f7d45a7bb262fe7207aa0460b37a0d87027dcf21b5d890e7d5", size = 1781501 },
+    { url = "https://files.pythonhosted.org/packages/98/9d/b65ec649adc5bccc008b0957a9a9c691070aeac4e41cea18559fef49958b/aiohttp-3.13.5-cp312-cp312-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:b38765950832f7d728297689ad78f5f2cf79ff82487131c4d26fe6ceecdc5f8e", size = 1878981 },
+    { url = "https://files.pythonhosted.org/packages/57/d8/8d44036d7eb7b6a8ec4c5494ea0c8c8b94fbc0ed3991c1a7adf230df03bf/aiohttp-3.13.5-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:b18f31b80d5a33661e08c89e202edabf1986e9b49c42b4504371daeaa11b47c1", size = 1767934 },
+    { url = "https://files.pythonhosted.org/packages/31/04/d3f8211f273356f158e3464e9e45484d3fb8c4ce5eb2f6fe9405c3273983/aiohttp-3.13.5-cp312-cp312-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:33add2463dde55c4f2d9635c6ab33ce154e5ecf322bd26d09af95c5f81cfa286", size = 1566671 },
+    { url = "https://files.pythonhosted.org/packages/41/db/073e4ebe00b78e2dfcacff734291651729a62953b48933d765dc513bf798/aiohttp-3.13.5-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:327cc432fdf1356fb4fbc6fe833ad4e9f6aacb71a8acaa5f1855e4b25910e4a9", size = 1705219 },
+    { url = "https://files.pythonhosted.org/packages/48/45/7dfba71a2f9fd97b15c95c06819de7eb38113d2cdb6319669195a7d64270/aiohttp-3.13.5-cp312-cp312-musllinux_1_2_armv7l.whl", hash = "sha256:7c35b0bf0b48a70b4cb4fc5d7bed9b932532728e124874355de1a0af8ec4bc88", size = 1743049 },
+    { url = "https://files.pythonhosted.org/packages/18/71/901db0061e0f717d226386a7f471bb59b19566f2cae5f0d93874b017271f/aiohttp-3.13.5-cp312-cp312-musllinux_1_2_ppc64le.whl", hash = "sha256:df23d57718f24badef8656c49743e11a89fd6f5358fa8a7b96e728fda2abf7d3", size = 1749557 },
+    { url = "https://files.pythonhosted.org/packages/08/d5/41eebd16066e59cd43728fe74bce953d7402f2b4ddfdfef2c0e9f17ca274/aiohttp-3.13.5-cp312-cp312-musllinux_1_2_riscv64.whl", hash = "sha256:02e048037a6501a5ec1f6fc9736135aec6eb8a004ce48838cb951c515f32c80b", size = 1558931 },
+    { url = "https://files.pythonhosted.org/packages/30/e6/4a799798bf05740e66c3a1161079bda7a3dd8e22ca392481d7a7f9af82a6/aiohttp-3.13.5-cp312-cp312-musllinux_1_2_s390x.whl", hash = "sha256:31cebae8b26f8a615d2b546fee45d5ffb76852ae6450e2a03f42c9102260d6fe", size = 1774125 },
+    { url = "https://files.pythonhosted.org/packages/84/63/7749337c90f92bc2cb18f9560d67aa6258c7060d1397d21529b8004fcf6f/aiohttp-3.13.5-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:888e78eb5ca55a615d285c3c09a7a91b42e9dd6fc699b166ebd5dee87c9ccf14", size = 1732427 },
+    { url = "https://files.pythonhosted.org/packages/98/de/cf2f44ff98d307e72fb97d5f5bbae3bfcb442f0ea9790c0bf5c5c2331404/aiohttp-3.13.5-cp312-cp312-win32.whl", hash = "sha256:8bd3ec6376e68a41f9f95f5ed170e2fcf22d4eb27a1f8cb361d0508f6e0557f3", size = 433534 },
+    { url = "https://files.pythonhosted.org/packages/aa/ca/eadf6f9c8fa5e31d40993e3db153fb5ed0b11008ad5d9de98a95045bed84/aiohttp-3.13.5-cp312-cp312-win_amd64.whl", hash = "sha256:110e448e02c729bcebb18c60b9214a87ba33bac4a9fa5e9a5f139938b56c6cb1", size = 460446 },
+    { url = "https://files.pythonhosted.org/packages/78/e9/d76bf503005709e390122d34e15256b88f7008e246c4bdbe915cd4f1adce/aiohttp-3.13.5-cp313-cp313-macosx_10_13_universal2.whl", hash = "sha256:a5029cc80718bbd545123cd8fe5d15025eccaaaace5d0eeec6bd556ad6163d61", size = 742930 },
+    { url = "https://files.pythonhosted.org/packages/57/00/4b7b70223deaebd9bb85984d01a764b0d7bd6526fcdc73cca83bcbe7243e/aiohttp-3.13.5-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:4bb6bf5811620003614076bdc807ef3b5e38244f9d25ca5fe888eaccea2a9832", size = 496927 },
+    { url = "https://files.pythonhosted.org/packages/9c/f5/0fb20fb49f8efdcdce6cd8127604ad2c503e754a8f139f5e02b01626523f/aiohttp-3.13.5-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:a84792f8631bf5a94e52d9cc881c0b824ab42717165a5579c760b830d9392ac9", size = 497141 },
+    { url = "https://files.pythonhosted.org/packages/3b/86/b7c870053e36a94e8951b803cb5b909bfbc9b90ca941527f5fcafbf6b0fa/aiohttp-3.13.5-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:57653eac22c6a4c13eb22ecf4d673d64a12f266e72785ab1c8b8e5940d0e8090", size = 1732476 },
+    { url = "https://files.pythonhosted.org/packages/b5/e5/4e161f84f98d80c03a238671b4136e6530453d65262867d989bbe78244d0/aiohttp-3.13.5-cp313-cp313-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:e5e5f7debc7a57af53fdf5c5009f9391d9f4c12867049d509bf7bb164a6e295b", size = 1706507 },
+    { url = "https://files.pythonhosted.org/packages/d4/56/ea11a9f01518bd5a2a2fcee869d248c4b8a0cfa0bb13401574fa31adf4d4/aiohttp-3.13.5-cp313-cp313-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:c719f65bebcdf6716f10e9eff80d27567f7892d8988c06de12bbbd39307c6e3a", size = 1773465 },
+    { url = "https://files.pythonhosted.org/packages/eb/40/333ca27fb74b0383f17c90570c748f7582501507307350a79d9f9f3c6eb1/aiohttp-3.13.5-cp313-cp313-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:d97f93fdae594d886c5a866636397e2bcab146fd7a132fd6bb9ce182224452f8", size = 1873523 },
+    { url = "https://files.pythonhosted.org/packages/f0/d2/e2f77eef1acb7111405433c707dc735e63f67a56e176e72e9e7a2cd3f493/aiohttp-3.13.5-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:3df334e39d4c2f899a914f1dba283c1aadc311790733f705182998c6f7cae665", size = 1754113 },
+    { url = "https://files.pythonhosted.org/packages/fb/56/3f653d7f53c89669301ec9e42c95233e2a0c0a6dd051269e6e678db4fdb0/aiohttp-3.13.5-cp313-cp313-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:fe6970addfea9e5e081401bcbadf865d2b6da045472f58af08427e108d618540", size = 1562351 },
+    { url = "https://files.pythonhosted.org/packages/ec/a6/9b3e91eb8ae791cce4ee736da02211c85c6f835f1bdfac0594a8a3b7018c/aiohttp-3.13.5-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:7becdf835feff2f4f335d7477f121af787e3504b48b449ff737afb35869ba7bb", size = 1693205 },
+    { url = "https://files.pythonhosted.org/packages/98/fc/bfb437a99a2fcebd6b6eaec609571954de2ed424f01c352f4b5504371dd3/aiohttp-3.13.5-cp313-cp313-musllinux_1_2_armv7l.whl", hash = "sha256:676e5651705ad5d8a70aeb8eb6936c436d8ebbd56e63436cb7dd9bb36d2a9a46", size = 1730618 },
+    { url = "https://files.pythonhosted.org/packages/e4/b6/c8534862126191a034f68153194c389addc285a0f1347d85096d349bbc15/aiohttp-3.13.5-cp313-cp313-musllinux_1_2_ppc64le.whl", hash = "sha256:9b16c653d38eb1a611cc898c41e76859ca27f119d25b53c12875fd0474ae31a8", size = 1745185 },
+    { url = "https://files.pythonhosted.org/packages/0b/93/4ca8ee2ef5236e2707e0fd5fecb10ce214aee1ff4ab307af9c558bda3b37/aiohttp-3.13.5-cp313-cp313-musllinux_1_2_riscv64.whl", hash = "sha256:999802d5fa0389f58decd24b537c54aa63c01c3219ce17d1214cbda3c2b22d2d", size = 1557311 },
+    { url = "https://files.pythonhosted.org/packages/57/ae/76177b15f18c5f5d094f19901d284025db28eccc5ae374d1d254181d33f4/aiohttp-3.13.5-cp313-cp313-musllinux_1_2_s390x.whl", hash = "sha256:ec707059ee75732b1ba130ed5f9580fe10ff75180c812bc267ded039db5128c6", size = 1773147 },
+    { url = "https://files.pythonhosted.org/packages/01/a4/62f05a0a98d88af59d93b7fcac564e5f18f513cb7471696ac286db970d6a/aiohttp-3.13.5-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:2d6d44a5b48132053c2f6cd5c8cb14bc67e99a63594e336b0f2af81e94d5530c", size = 1730356 },
+    { url = "https://files.pythonhosted.org/packages/e4/85/fc8601f59dfa8c9523808281f2da571f8b4699685f9809a228adcc90838d/aiohttp-3.13.5-cp313-cp313-win32.whl", hash = "sha256:329f292ed14d38a6c4c435e465f48bebb47479fd676a0411936cc371643225cc", size = 432637 },
+    { url = "https://files.pythonhosted.org/packages/c0/1b/ac685a8882896acf0f6b31d689e3792199cfe7aba37969fa91da63a7fa27/aiohttp-3.13.5-cp313-cp313-win_amd64.whl", hash = "sha256:69f571de7500e0557801c0b51f4780482c0ec5fe2ac851af5a92cfce1af1cb83", size = 458896 },
+    { url = "https://files.pythonhosted.org/packages/5d/ce/46572759afc859e867a5bc8ec3487315869013f59281ce61764f76d879de/aiohttp-3.13.5-cp314-cp314-macosx_10_13_universal2.whl", hash = "sha256:eb4639f32fd4a9904ab8fb45bf3383ba71137f3d9d4ba25b3b3f3109977c5b8c", size = 745721 },
+    { url = "https://files.pythonhosted.org/packages/13/fe/8a2efd7626dbe6049b2ef8ace18ffda8a4dfcbe1bcff3ac30c0c7575c20b/aiohttp-3.13.5-cp314-cp314-macosx_10_13_x86_64.whl", hash = "sha256:7e5dc4311bd5ac493886c63cbf76ab579dbe4641268e7c74e48e774c74b6f2be", size = 497663 },
+    { url = "https://files.pythonhosted.org/packages/9b/91/cc8cc78a111826c54743d88651e1687008133c37e5ee615fee9b57990fac/aiohttp-3.13.5-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:756c3c304d394977519824449600adaf2be0ccee76d206ee339c5e76b70ded25", size = 499094 },
+    { url = "https://files.pythonhosted.org/packages/0a/33/a8362cb15cf16a3af7e86ed11962d5cd7d59b449202dc576cdc731310bde/aiohttp-3.13.5-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:ecc26751323224cf8186efcf7fbcbc30f4e1d8c7970659daf25ad995e4032a56", size = 1726701 },
+    { url = "https://files.pythonhosted.org/packages/45/0c/c091ac5c3a17114bd76cbf85d674650969ddf93387876cf67f754204bd77/aiohttp-3.13.5-cp314-cp314-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:10a75acfcf794edf9d8db50e5a7ec5fc818b2a8d3f591ce93bc7b1210df016d2", size = 1683360 },
+    { url = "https://files.pythonhosted.org/packages/23/73/bcee1c2b79bc275e964d1446c55c54441a461938e70267c86afaae6fba27/aiohttp-3.13.5-cp314-cp314-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:0f7a18f258d124cd678c5fe072fe4432a4d5232b0657fca7c1847f599233c83a", size = 1773023 },
+    { url = "https://files.pythonhosted.org/packages/c7/ef/720e639df03004fee2d869f771799d8c23046dec47d5b81e396c7cda583a/aiohttp-3.13.5-cp314-cp314-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:df6104c009713d3a89621096f3e3e88cc323fd269dbd7c20afe18535094320be", size = 1853795 },
+    { url = "https://files.pythonhosted.org/packages/bd/c9/989f4034fb46841208de7aeeac2c6d8300745ab4f28c42f629ba77c2d916/aiohttp-3.13.5-cp314-cp314-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:241a94f7de7c0c3b616627aaad530fe2cb620084a8b144d3be7b6ecfe95bae3b", size = 1730405 },
+    { url = "https://files.pythonhosted.org/packages/ce/75/ee1fd286ca7dc599d824b5651dad7b3be7ff8d9a7e7b3fe9820d9180f7db/aiohttp-3.13.5-cp314-cp314-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:c974fb66180e58709b6fc402846f13791240d180b74de81d23913abe48e96d94", size = 1558082 },
+    { url = "https://files.pythonhosted.org/packages/c3/20/1e9e6650dfc436340116b7aa89ff8cb2bbdf0abc11dfaceaad8f74273a10/aiohttp-3.13.5-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:6e27ea05d184afac78aabbac667450c75e54e35f62238d44463131bd3f96753d", size = 1692346 },
+    { url = "https://files.pythonhosted.org/packages/d8/40/8ebc6658d48ea630ac7903912fe0dd4e262f0e16825aa4c833c56c9f1f56/aiohttp-3.13.5-cp314-cp314-musllinux_1_2_armv7l.whl", hash = "sha256:a79a6d399cef33a11b6f004c67bb07741d91f2be01b8d712d52c75711b1e07c7", size = 1698891 },
+    { url = "https://files.pythonhosted.org/packages/d8/78/ea0ae5ec8ba7a5c10bdd6e318f1ba5e76fcde17db8275188772afc7917a4/aiohttp-3.13.5-cp314-cp314-musllinux_1_2_ppc64le.whl", hash = "sha256:c632ce9c0b534fbe25b52c974515ed674937c5b99f549a92127c85f771a78772", size = 1742113 },
+    { url = "https://files.pythonhosted.org/packages/8a/66/9d308ed71e3f2491be1acb8769d96c6f0c47d92099f3bc9119cada27b357/aiohttp-3.13.5-cp314-cp314-musllinux_1_2_riscv64.whl", hash = "sha256:fceedde51fbd67ee2bcc8c0b33d0126cc8b51ef3bbde2f86662bd6d5a6f10ec5", size = 1553088 },
+    { url = "https://files.pythonhosted.org/packages/da/a6/6cc25ed8dfc6e00c90f5c6d126a98e2cf28957ad06fa1036bd34b6f24a2c/aiohttp-3.13.5-cp314-cp314-musllinux_1_2_s390x.whl", hash = "sha256:f92995dfec9420bb69ae629abf422e516923ba79ba4403bc750d94fb4a6c68c1", size = 1757976 },
+    { url = "https://files.pythonhosted.org/packages/c1/2b/cce5b0ffe0de99c83e5e36d8f828e4161e415660a9f3e58339d07cce3006/aiohttp-3.13.5-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:20ae0ff08b1f2c8788d6fb85afcb798654ae6ba0b747575f8562de738078457b", size = 1712444 },
+    { url = "https://files.pythonhosted.org/packages/6c/cf/9e1795b4160c58d29421eafd1a69c6ce351e2f7c8d3c6b7e4ca44aea1a5b/aiohttp-3.13.5-cp314-cp314-win32.whl", hash = "sha256:b20df693de16f42b2472a9c485e1c948ee55524786a0a34345511afdd22246f3", size = 438128 },
+    { url = "https://files.pythonhosted.org/packages/22/4d/eaedff67fc805aeba4ba746aec891b4b24cebb1a7d078084b6300f79d063/aiohttp-3.13.5-cp314-cp314-win_amd64.whl", hash = "sha256:f85c6f327bf0b8c29da7d93b1cabb6363fb5e4e160a32fa241ed2dce21b73162", size = 464029 },
+    { url = "https://files.pythonhosted.org/packages/79/11/c27d9332ee20d68dd164dc12a6ecdef2e2e35ecc97ed6cf0d2442844624b/aiohttp-3.13.5-cp314-cp314t-macosx_10_13_universal2.whl", hash = "sha256:1efb06900858bb618ff5cee184ae2de5828896c448403d51fb633f09e109be0a", size = 778758 },
+    { url = "https://files.pythonhosted.org/packages/04/fb/377aead2e0a3ba5f09b7624f702a964bdf4f08b5b6728a9799830c80041e/aiohttp-3.13.5-cp314-cp314t-macosx_10_13_x86_64.whl", hash = "sha256:fee86b7c4bd29bdaf0d53d14739b08a106fdda809ca5fe032a15f52fae5fe254", size = 512883 },
+    { url = "https://files.pythonhosted.org/packages/bb/a6/aa109a33671f7a5d3bd78b46da9d852797c5e665bfda7d6b373f56bff2ec/aiohttp-3.13.5-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:20058e23909b9e65f9da62b396b77dfa95965cbe840f8def6e572538b1d32e36", size = 516668 },
+    { url = "https://files.pythonhosted.org/packages/79/b3/ca078f9f2fa9563c36fb8ef89053ea2bb146d6f792c5104574d49d8acb63/aiohttp-3.13.5-cp314-cp314t-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:8cf20a8d6868cb15a73cab329ffc07291ba8c22b1b88176026106ae39aa6df0f", size = 1883461 },
+    { url = "https://files.pythonhosted.org/packages/b7/e3/a7ad633ca1ca497b852233a3cce6906a56c3225fb6d9217b5e5e60b7419d/aiohttp-3.13.5-cp314-cp314t-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:330f5da04c987f1d5bdb8ae189137c77139f36bd1cb23779ca1a354a4b027800", size = 1747661 },
+    { url = "https://files.pythonhosted.org/packages/33/b9/cd6fe579bed34a906d3d783fe60f2fa297ef55b27bb4538438ee49d4dc41/aiohttp-3.13.5-cp314-cp314t-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:6f1cbf0c7926d315c3c26c2da41fd2b5d2fe01ac0e157b78caefc51a782196cf", size = 1863800 },
+    { url = "https://files.pythonhosted.org/packages/c0/3f/2c1e2f5144cefa889c8afd5cf431994c32f3b29da9961698ff4e3811b79a/aiohttp-3.13.5-cp314-cp314t-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:53fc049ed6390d05423ba33103ded7281fe897cf97878f369a527070bd95795b", size = 1958382 },
+    { url = "https://files.pythonhosted.org/packages/66/1d/f31ec3f1013723b3babe3609e7f119c2c2fb6ef33da90061a705ef3e1bc8/aiohttp-3.13.5-cp314-cp314t-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:898703aa2667e3c5ca4c54ca36cd73f58b7a38ef87a5606414799ebce4d3fd3a", size = 1803724 },
+    { url = "https://files.pythonhosted.org/packages/0e/b4/57712dfc6f1542f067daa81eb61da282fab3e6f1966fca25db06c4fc62d5/aiohttp-3.13.5-cp314-cp314t-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:0494a01ca9584eea1e5fbd6d748e61ecff218c51b576ee1999c23db7066417d8", size = 1640027 },
+    { url = "https://files.pythonhosted.org/packages/25/3c/734c878fb43ec083d8e31bf029daae1beafeae582d1b35da234739e82ee7/aiohttp-3.13.5-cp314-cp314t-musllinux_1_2_aarch64.whl", hash = "sha256:6cf81fe010b8c17b09495cbd15c1d35afbc8fb405c0c9cf4738e5ae3af1d65be", size = 1806644 },
+    { url = "https://files.pythonhosted.org/packages/20/a5/f671e5cbec1c21d044ff3078223f949748f3a7f86b14e34a365d74a5d21f/aiohttp-3.13.5-cp314-cp314t-musllinux_1_2_armv7l.whl", hash = "sha256:c564dd5f09ddc9d8f2c2d0a301cd30a79a2cc1b46dd1a73bef8f0038863d016b", size = 1791630 },
+    { url = "https://files.pythonhosted.org/packages/0b/63/fb8d0ad63a0b8a99be97deac8c04dacf0785721c158bdf23d679a87aa99e/aiohttp-3.13.5-cp314-cp314t-musllinux_1_2_ppc64le.whl", hash = "sha256:2994be9f6e51046c4f864598fd9abeb4fba6e88f0b2152422c9666dcd4aea9c6", size = 1809403 },
+    { url = "https://files.pythonhosted.org/packages/59/0c/bfed7f30662fcf12206481c2aac57dedee43fe1c49275e85b3a1e1742294/aiohttp-3.13.5-cp314-cp314t-musllinux_1_2_riscv64.whl", hash = "sha256:157826e2fa245d2ef46c83ea8a5faf77ca19355d278d425c29fda0beb3318037", size = 1634924 },
+    { url = "https://files.pythonhosted.org/packages/17/d6/fd518d668a09fd5a3319ae5e984d4d80b9a4b3df4e21c52f02251ef5a32e/aiohttp-3.13.5-cp314-cp314t-musllinux_1_2_s390x.whl", hash = "sha256:a8aca50daa9493e9e13c0f566201a9006f080e7c50e5e90d0b06f53146a54500", size = 1836119 },
+    { url = "https://files.pythonhosted.org/packages/78/b7/15fb7a9d52e112a25b621c67b69c167805cb1f2ab8f1708a5c490d1b52fe/aiohttp-3.13.5-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:3b13560160d07e047a93f23aaa30718606493036253d5430887514715b67c9d9", size = 1772072 },
+    { url = "https://files.pythonhosted.org/packages/7e/df/57ba7f0c4a553fc2bd8b6321df236870ec6fd64a2a473a8a13d4f733214e/aiohttp-3.13.5-cp314-cp314t-win32.whl", hash = "sha256:9a0f4474b6ea6818b41f82172d799e4b3d29e22c2c520ce4357856fced9af2f8", size = 471819 },
+    { url = "https://files.pythonhosted.org/packages/62/29/2f8418269e46454a26171bfdd6a055d74febf32234e474930f2f60a17145/aiohttp-3.13.5-cp314-cp314t-win_amd64.whl", hash = "sha256:18a2f6c1182c51baa1d28d68fea51513cb2a76612f038853c0ad3c145423d3d9", size = 505441 },
 ]
 
 [[package]]
@@ -1023,14 +1023,14 @@ wheels = [
 
 [[package]]
 name = "click"
-version = "8.3.1"
+version = "8.1.8"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "colorama", marker = "sys_platform == 'win32'" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/3d/fa/656b739db8587d7b5dfa22e22ed02566950fbfbcdc20311993483657a5c0/click-8.3.1.tar.gz", hash = "sha256:12ff4785d337a1bb490bb7e9c2b1ee5da3112e94a8622f26a6c77f5d2fc6842a", size = 295065 }
+sdist = { url = "https://files.pythonhosted.org/packages/b9/2e/0090cbf739cee7d23781ad4b89a9894a41538e4fcf4c31dcdd705b78eb8b/click-8.1.8.tar.gz", hash = "sha256:ed53c9d8990d83c2a27deae68e4ee337473f6330c040a31d4225c9574d16096a", size = 226593 }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/98/78/01c019cdb5d6498122777c1a43056ebb3ebfeef2076d9d026bfe15583b2b/click-8.3.1-py3-none-any.whl", hash = "sha256:981153a64e25f12d547d3426c367a4857371575ee7ad18df2a6183ab0545b2a6", size = 108274 },
+    { url = "https://files.pythonhosted.org/packages/7e/d4/7ebdbd03970677812aac39c869717059dbb71a4cfc033ca6e5221787892c/click-8.1.8-py3-none-any.whl", hash = "sha256:63c132bbbed01578a06712a2d1f497bb62d9c1c0d329b7903a866228027263b2", size = 98188 },
 ]
 
 [[package]]
@@ -2984,14 +2984,14 @@ wheels = [
 
 [[package]]
 name = "importlib-metadata"
-version = "8.7.1"
+version = "8.5.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "zipp" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/f3/49/3b30cad09e7771a4982d9975a8cbf64f00d4a1ececb53297f1d9a7be1b10/importlib_metadata-8.7.1.tar.gz", hash = "sha256:49fef1ae6440c182052f407c8d34a68f72efc36db9ca90dc0113398f2fdde8bb", size = 57107 }
+sdist = { url = "https://files.pythonhosted.org/packages/cd/12/33e59336dca5be0c398a7482335911a33aa0e20776128f038019f1a95f1b/importlib_metadata-8.5.0.tar.gz", hash = "sha256:71522656f0abace1d072b9e5481a48f07c138e00f079c38c8f883823f9c26bd7", size = 55304 }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/fa/5e/f8e9a1d23b9c20a551a8a02ea3637b4642e22c2626e3a13a9a29cdea99eb/importlib_metadata-8.7.1-py3-none-any.whl", hash = "sha256:5a1f80bf1daa489495071efbb095d75a634cf28a8bc299581244063b53176151", size = 27865 },
+    { url = "https://files.pythonhosted.org/packages/a0/d9/a1e041c5e7caa9a05c925f4bdbdfb7f006d1f74996af53467bc394c97be7/importlib_metadata-8.5.0-py3-none-any.whl", hash = "sha256:45e54197d28b7a7f1559e60b95e7c567032b602131fbd588f1497f47880aa68b", size = 26514 },
 ]
 
 [[package]]
@@ -3222,7 +3222,7 @@ wheels = [
 
 [[package]]
 name = "jsonschema"
-version = "4.26.0"
+version = "4.23.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "attrs" },
@@ -3230,9 +3230,9 @@ dependencies = [
     { name = "referencing" },
     { name = "rpds-py" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/b3/fc/e067678238fa451312d4c62bf6e6cf5ec56375422aee02f9cb5f909b3047/jsonschema-4.26.0.tar.gz", hash = "sha256:0c26707e2efad8aa1bfc5b7ce170f3fccc2e4918ff85989ba9ffa9facb2be326", size = 366583 }
+sdist = { url = "https://files.pythonhosted.org/packages/38/2e/03362ee4034a4c917f697890ccd4aec0800ccf9ded7f511971c75451deec/jsonschema-4.23.0.tar.gz", hash = "sha256:d71497fef26351a33265337fa77ffeb82423f3ea21283cd9467bb03999266bc4", size = 325778 }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/69/90/f63fb5873511e014207a475e2bb4e8b2e570d655b00ac19a9a0ca0a385ee/jsonschema-4.26.0-py3-none-any.whl", hash = "sha256:d489f15263b8d200f8387e64b4c3a75f06629559fb73deb8fdfb525f2dab50ce", size = 90630 },
+    { url = "https://files.pythonhosted.org/packages/69/4a/4f9dbeb84e8850557c02365a0eee0649abe5eb1d84af92a25731c6c0f922/jsonschema-4.23.0-py3-none-any.whl", hash = "sha256:fbadb6f8b144a8f8cf9f0b89ba94501d143e50411a1278633f56a7acf7fd5566", size = 88462 },
 ]
 
 [[package]]
@@ -3533,7 +3533,7 @@ wheels = [
 
 [[package]]
 name = "langchain-litellm"
-version = "0.6.2"
+version = "0.6.4"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "cryptography" },
@@ -3541,9 +3541,9 @@ dependencies = [
     { name = "langchain-core" },
     { name = "litellm" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/ee/6f/ba0490ec0fbc9d97cd9433749455fb4b5fbec3852bcbe113a0278ec1d32d/langchain_litellm-0.6.2.tar.gz", hash = "sha256:93372df7c3f1802358746e2c0a94012d8c27d9f9b57b769b23f6af2264bbaabb", size = 332878 }
+sdist = { url = "https://files.pythonhosted.org/packages/68/37/ccc1f284a42900ca5b267a50da8e50145e9f264b32ee955ce91aa360d188/langchain_litellm-0.6.4.tar.gz", hash = "sha256:663281db392b3de1f07f891d0f80f9d4b26c0f0d2abbf854ef9b186d99c309ee", size = 339457 }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/da/14/ad857a3f56fa4ea0879ac9d6ee5248c883663d0bad94bf8741e1ab6ab200/langchain_litellm-0.6.2-py3-none-any.whl", hash = "sha256:98af79dbcdea4b492e9601351bc5fd15fdd368e021183b8540f0d0b6b6b1589c", size = 24865 },
+    { url = "https://files.pythonhosted.org/packages/43/e8/25c50bbad7a05106c7af65557e165d6cb6159c90854dae61de59debe735d/langchain_litellm-0.6.4-py3-none-any.whl", hash = "sha256:60f4e37be1a47dc88f94fac7085675ef8fa04bba92f48735792d82f492120744", size = 26360 },
 ]
 
 [[package]]
@@ -3709,7 +3709,7 @@ wheels = [
 
 [[package]]
 name = "litellm"
-version = "1.82.6"
+version = "1.83.4"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "aiohttp" },
@@ -3725,9 +3725,9 @@ dependencies = [
     { name = "tiktoken" },
     { name = "tokenizers" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/29/75/1c537aa458426a9127a92bc2273787b2f987f4e5044e21f01f2eed5244fd/litellm-1.82.6.tar.gz", hash = "sha256:2aa1c2da21fe940c33613aa447119674a3ad4d2ad5eb064e4d5ce5ee42420136", size = 17414147 }
+sdist = { url = "https://files.pythonhosted.org/packages/03/c4/30469c06ae7437a4406bc11e3c433cfd380a6771068cca15ea918dcd158f/litellm-1.83.4.tar.gz", hash = "sha256:6458d2030a41229460b321adee00517a91dbd8e63213cc953d355cb41d16f2d4", size = 17733899 }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/02/6c/5327667e6dbe9e98cbfbd4261c8e91386a52e38f41419575854248bbab6a/litellm-1.82.6-py3-none-any.whl", hash = "sha256:164a3ef3e19f309e3cabc199bef3d2045212712fefdfa25fc7f75884a5b5b205", size = 15591595 },
+    { url = "https://files.pythonhosted.org/packages/b8/bd/df19d3f8f6654535ee343a341fd921f81c411abf601a53e3eaef58129b02/litellm-1.83.4-py3-none-any.whl", hash = "sha256:17d7b4d48d47aca988ea4f762ddda5e7bd72cda3270192b22813d0330869d7b4", size = 16015555 },
 ]
 
 [[package]]
@@ -6766,11 +6766,11 @@ wheels = [
 
 [[package]]
 name = "python-dotenv"
-version = "1.2.2"
+version = "1.0.1"
 source = { registry = "https://pypi.org/simple" }
-sdist = { url = "https://files.pythonhosted.org/packages/82/ed/0301aeeac3e5353ef3d94b6ec08bbcabd04a72018415dcb29e588514bba8/python_dotenv-1.2.2.tar.gz", hash = "sha256:2c371a91fbd7ba082c2c1dc1f8bf89ca22564a087c2c287cd9b662adde799cf3", size = 50135 }
+sdist = { url = "https://files.pythonhosted.org/packages/bc/57/e84d88dfe0aec03b7a2d4327012c1627ab5f03652216c63d49846d7a6c58/python-dotenv-1.0.1.tar.gz", hash = "sha256:e324ee90a023d808f1959c46bcbc04446a10ced277783dc6ee09987c37ec10ca", size = 39115 }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/0b/d7/1959b9648791274998a9c3526f6d0ec8fd2233e4d4acce81bbae76b44b2a/python_dotenv-1.2.2-py3-none-any.whl", hash = "sha256:1d8214789a24de455a8b8bd8ae6fe3c6b69a5e3d64aa8a8e5d68e694bbcb285a", size = 22101 },
+    { url = "https://files.pythonhosted.org/packages/6a/3e/b68c118422ec867fa7ab88444e1274aa40681c606d59ac27de5a5588f082/python_dotenv-1.0.1-py3-none-any.whl", hash = "sha256:f7b63ef50f1b690dddf550d03497b66d609393b40b564ed0d674909a68ebf16a", size = 19863 },
 ]
 
 [[package]]
@@ -8049,12 +8049,12 @@ requires-dist = [
     { name = "langchain", specifier = ">=1.2.13" },
     { name = "langchain-community", specifier = ">=0.4.1" },
     { name = "langchain-daytona", specifier = ">=0.0.2" },
-    { name = "langchain-litellm", specifier = ">=0.3.5" },
+    { name = "langchain-litellm", specifier = ">=0.6.4" },
     { name = "langchain-unstructured", specifier = ">=1.0.1" },
     { name = "langgraph", specifier = ">=1.1.3" },
     { name = "langgraph-checkpoint-postgres", specifier = ">=3.0.2" },
     { name = "linkup-sdk", specifier = ">=0.2.4" },
-    { name = "litellm", specifier = ">=1.80.10" },
+    { name = "litellm", specifier = ">=1.83.0" },
     { name = "llama-cloud-services", specifier = ">=0.6.25" },
     { name = "markdown", specifier = ">=3.7" },
     { name = "markdownify", specifier = ">=0.14.1" },

From eb5799336c22e884e7eecde4273b5051d76fa83e Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Mon, 6 Apr 2026 22:15:05 -0700
Subject: [PATCH 158/202] refactor: streamline BrowserWindow component
 functionality

- Removed the interval management for tab selection, simplifying the state handling.
- Updated tab click handler to directly set the selected index without restarting the interval.
- Changed video preload attribute from "none" to "auto" for improved loading performance.
---
 .../components/homepage/hero-section.tsx      | 28 ++-----------------
 1 file changed, 2 insertions(+), 26 deletions(-)

diff --git a/surfsense_web/components/homepage/hero-section.tsx b/surfsense_web/components/homepage/hero-section.tsx
index 1bb28e770..60f293005 100644
--- a/surfsense_web/components/homepage/hero-section.tsx
+++ b/surfsense_web/components/homepage/hero-section.tsx
@@ -180,32 +180,8 @@ function GetStartedButton() {
 const BrowserWindow = () => {
 	const [selectedIndex, setSelectedIndex] = useState(0);
 	const selectedItem = TAB_ITEMS[selectedIndex];
-	const intervalRef = useRef<NodeJS.Timeout | null>(null);
 	const { expanded, open, close } = useExpandedMedia();
 
-	const startInterval = useCallback(() => {
-		if (intervalRef.current) {
-			clearInterval(intervalRef.current);
-		}
-		intervalRef.current = setInterval(() => {
-			setSelectedIndex((prev) => (prev + 1) % TAB_ITEMS.length);
-		}, 10000);
-	}, []);
-
-	useEffect(() => {
-		startInterval();
-		return () => {
-			if (intervalRef.current) {
-				clearInterval(intervalRef.current);
-			}
-		};
-	}, [startInterval]);
-
-	const handleTabClick = (index: number) => {
-		setSelectedIndex(index);
-		startInterval();
-	};
-
 	return (
 		<>
 			<motion.div className="relative my-4 flex w-full flex-col items-start justify-start overflow-hidden rounded-2xl shadow-2xl md:my-12">
@@ -220,7 +196,7 @@ const BrowserWindow = () => {
 							<React.Fragment key={item.title}>
 							<button
 								type="button"
-								onClick={() => handleTabClick(index)}
+								onClick={() => setSelectedIndex(index)}
 								className={cn(
 									"flex shrink-0 items-center gap-1.5 rounded-md px-2 py-1 text-xs transition duration-150 hover:bg-white sm:text-sm dark:hover:bg-neutral-950",
 									selectedIndex === index && !item.featured &&
@@ -334,7 +310,7 @@ const TabVideo = memo(function TabVideo({ src }: { src: string }) {
 				ref={videoRef}
 				key={src}
 				src={src}
-				preload="none"
+				preload="auto"
 				loop
 				muted
 				playsInline

From e920923fa44ecc471d007f6a036671158e3330a3 Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Mon, 6 Apr 2026 23:02:25 -0700
Subject: [PATCH 159/202] feat: implement auth token synchronization between
 Electron and web app

- Added IPC channels for getting and setting auth tokens in Electron.
- Implemented functions to sync tokens from localStorage to Electron and vice versa.
- Updated components to ensure tokens are retrieved from Electron when not available locally.
- Enhanced user authentication flow by integrating token management across windows.
---
 surfsense_desktop/electron-builder.yml        |  2 +-
 surfsense_desktop/src/ipc/channels.ts         |  3 ++
 surfsense_desktop/src/ipc/handlers.ts         | 10 +++++
 surfsense_desktop/src/preload.ts              |  5 +++
 surfsense_web/app/dashboard/layout.tsx        | 23 ++++++-----
 surfsense_web/app/desktop/suggestion/page.tsx |  8 +++-
 surfsense_web/lib/auth-utils.ts               | 40 +++++++++++++++++++
 surfsense_web/types/window.d.ts               |  3 ++
 8 files changed, 82 insertions(+), 12 deletions(-)

diff --git a/surfsense_desktop/electron-builder.yml b/surfsense_desktop/electron-builder.yml
index be5e07c63..4d6f0b283 100644
--- a/surfsense_desktop/electron-builder.yml
+++ b/surfsense_desktop/electron-builder.yml
@@ -58,7 +58,7 @@ win:
   icon: assets/icon.ico
   target:
     - target: nsis
-      arch: [x64, arm64]
+      arch: [x64]
 nsis:
   oneClick: false
   perMachine: false
diff --git a/surfsense_desktop/src/ipc/channels.ts b/surfsense_desktop/src/ipc/channels.ts
index 2a50de75f..d8a30347f 100644
--- a/surfsense_desktop/src/ipc/channels.ts
+++ b/surfsense_desktop/src/ipc/channels.ts
@@ -32,4 +32,7 @@ export const IPC_CHANNELS = {
   FOLDER_SYNC_ACK_EVENTS: 'folder-sync:ack-events',
   BROWSE_FILES: 'browse:files',
   READ_LOCAL_FILES: 'browse:read-local-files',
+  // Auth token sync across windows
+  GET_AUTH_TOKENS: 'auth:get-tokens',
+  SET_AUTH_TOKENS: 'auth:set-tokens',
 } as const;
diff --git a/surfsense_desktop/src/ipc/handlers.ts b/surfsense_desktop/src/ipc/handlers.ts
index de7cdb659..b36dcbdcd 100644
--- a/surfsense_desktop/src/ipc/handlers.ts
+++ b/surfsense_desktop/src/ipc/handlers.ts
@@ -21,6 +21,8 @@ import {
   readLocalFiles,
 } from '../modules/folder-watcher';
 
+let authTokens: { bearer: string; refresh: string } | null = null;
+
 export function registerIpcHandlers(): void {
   ipcMain.on(IPC_CHANNELS.OPEN_EXTERNAL, (_event, url: string) => {
     try {
@@ -89,4 +91,12 @@ export function registerIpcHandlers(): void {
   ipcMain.handle(IPC_CHANNELS.READ_LOCAL_FILES, (_event, paths: string[]) =>
     readLocalFiles(paths)
   );
+
+  ipcMain.handle(IPC_CHANNELS.SET_AUTH_TOKENS, (_event, tokens: { bearer: string; refresh: string }) => {
+    authTokens = tokens;
+  });
+
+  ipcMain.handle(IPC_CHANNELS.GET_AUTH_TOKENS, () => {
+    return authTokens;
+  });
 }
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 6a9190693..2811c3b46 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -68,4 +68,9 @@ contextBridge.exposeInMainWorld('electronAPI', {
   // Browse files via native dialog
   browseFiles: () => ipcRenderer.invoke(IPC_CHANNELS.BROWSE_FILES),
   readLocalFiles: (paths: string[]) => ipcRenderer.invoke(IPC_CHANNELS.READ_LOCAL_FILES, paths),
+
+  // Auth token sync across windows
+  getAuthTokens: () => ipcRenderer.invoke(IPC_CHANNELS.GET_AUTH_TOKENS),
+  setAuthTokens: (bearer: string, refresh: string) =>
+    ipcRenderer.invoke(IPC_CHANNELS.SET_AUTH_TOKENS, { bearer, refresh }),
 });
diff --git a/surfsense_web/app/dashboard/layout.tsx b/surfsense_web/app/dashboard/layout.tsx
index f727a2018..25bea5467 100644
--- a/surfsense_web/app/dashboard/layout.tsx
+++ b/surfsense_web/app/dashboard/layout.tsx
@@ -3,7 +3,7 @@
 import { useEffect, useState } from "react";
 import { USER_QUERY_KEY } from "@/atoms/user/user-query.atoms";
 import { useGlobalLoadingEffect } from "@/hooks/use-global-loading";
-import { getBearerToken, redirectToLogin } from "@/lib/auth-utils";
+import { getBearerToken, ensureTokensFromElectron, redirectToLogin } from "@/lib/auth-utils";
 import { queryClient } from "@/lib/query-client/client";
 
 interface DashboardLayoutProps {
@@ -17,15 +17,20 @@ export default function DashboardLayout({ children }: DashboardLayoutProps) {
 	useGlobalLoadingEffect(isCheckingAuth);
 
 	useEffect(() => {
-		// Check if user is authenticated
-		const token = getBearerToken();
-		if (!token) {
-			// Save current path and redirect to login
-			redirectToLogin();
-			return;
+		async function checkAuth() {
+			let token = getBearerToken();
+			if (!token) {
+				const synced = await ensureTokensFromElectron();
+				if (synced) token = getBearerToken();
+			}
+			if (!token) {
+				redirectToLogin();
+				return;
+			}
+			queryClient.invalidateQueries({ queryKey: [...USER_QUERY_KEY] });
+			setIsCheckingAuth(false);
 		}
-		queryClient.invalidateQueries({ queryKey: [...USER_QUERY_KEY] });
-		setIsCheckingAuth(false);
+		checkAuth();
 	}, []);
 
 	// Return null while loading - the global provider handles the loading UI
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index 03944867f..097047bb1 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { useCallback, useEffect, useRef, useState } from "react";
-import { getBearerToken } from "@/lib/auth-utils";
+import { getBearerToken, ensureTokensFromElectron } from "@/lib/auth-utils";
 
 type SSEEvent =
 	| { type: "text-delta"; id: string; delta: string }
@@ -65,7 +65,11 @@ export default function SuggestionPage() {
 			setSuggestion("");
 			setError(null);
 
-			const token = getBearerToken();
+			let token = getBearerToken();
+			if (!token) {
+				await ensureTokensFromElectron();
+				token = getBearerToken();
+			}
 			if (!token) {
 				setError(friendlyError("not authenticated"));
 				setIsLoading(false);
diff --git a/surfsense_web/lib/auth-utils.ts b/surfsense_web/lib/auth-utils.ts
index c2a0d58a5..f7d1c5b09 100644
--- a/surfsense_web/lib/auth-utils.ts
+++ b/surfsense_web/lib/auth-utils.ts
@@ -87,6 +87,7 @@ export function getBearerToken(): string | null {
 export function setBearerToken(token: string): void {
 	if (typeof window === "undefined") return;
 	localStorage.setItem(BEARER_TOKEN_KEY, token);
+	syncTokensToElectron();
 }
 
 /**
@@ -111,6 +112,7 @@ export function getRefreshToken(): string | null {
 export function setRefreshToken(token: string): void {
 	if (typeof window === "undefined") return;
 	localStorage.setItem(REFRESH_TOKEN_KEY, token);
+	syncTokensToElectron();
 }
 
 /**
@@ -129,6 +131,44 @@ export function clearAllTokens(): void {
 	clearRefreshToken();
 }
 
+/**
+ * Pushes the current localStorage tokens into the Electron main process
+ * so that other BrowserWindows (Quick Ask, Autocomplete) can access them.
+ */
+function syncTokensToElectron(): void {
+	if (typeof window === "undefined" || !window.electronAPI?.setAuthTokens) return;
+	const bearer = localStorage.getItem(BEARER_TOKEN_KEY) || "";
+	const refresh = localStorage.getItem(REFRESH_TOKEN_KEY) || "";
+	if (bearer) {
+		window.electronAPI.setAuthTokens(bearer, refresh);
+	}
+}
+
+/**
+ * Attempts to pull auth tokens from the Electron main process into localStorage.
+ * Useful for popup windows (Quick Ask, Autocomplete) on platforms where
+ * localStorage is not reliably shared across BrowserWindow instances.
+ * Returns true if tokens were found and written to localStorage.
+ */
+export async function ensureTokensFromElectron(): Promise<boolean> {
+	if (typeof window === "undefined" || !window.electronAPI?.getAuthTokens) return false;
+	if (getBearerToken()) return true;
+
+	try {
+		const tokens = await window.electronAPI.getAuthTokens();
+		if (tokens?.bearer) {
+			localStorage.setItem(BEARER_TOKEN_KEY, tokens.bearer);
+			if (tokens.refresh) {
+				localStorage.setItem(REFRESH_TOKEN_KEY, tokens.refresh);
+			}
+			return true;
+		}
+	} catch {
+		// IPC failure — fall through
+	}
+	return false;
+}
+
 /**
  * Logout the current user by revoking the refresh token and clearing localStorage.
  * Returns true if logout was successful (or tokens were cleared), false otherwise.
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 6feb75463..5e45635a2 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -78,6 +78,9 @@ interface ElectronAPI {
 	// Browse files/folders via native dialogs
 	browseFiles: () => Promise<string[] | null>;
 	readLocalFiles: (paths: string[]) => Promise<LocalFileData[]>;
+	// Auth token sync across windows
+	getAuthTokens: () => Promise<{ bearer: string; refresh: string } | null>;
+	setAuthTokens: (bearer: string, refresh: string) => Promise<void>;
 }
 
 declare global {

From 49441233e7815e557730524cc753456fabab852b Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 00:43:40 -0700
Subject: [PATCH 160/202] feat: enhance keyboard shortcut management and
 improve app responsiveness

- Updated the development script to include a build step before launching the app.
- Made Quick Ask and Autocomplete registration asynchronous: each now loads its configured shortcut before registering it, and app startup awaits both.
- Introduced IPC channels (`shortcuts:get`, `shortcuts:set`) for reading and updating keyboard shortcuts, which are stored via `electron-store`; changing a shortcut re-registers the corresponding global shortcut.
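- Added `simulateCopy` to the platform module so Quick Ask can copy the current selection before reading the clipboard, and hid the helper processes' console windows (`windowsHide`, PowerShell `-NoProfile -NonInteractive`).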
- Added a Keyboard Shortcuts card to the desktop settings, built on a new `ShortcutRecorder` component, for viewing, changing, and resetting the Quick Ask and Autocomplete shortcuts.
---
 surfsense_desktop/package.json                |   2 +-
 surfsense_desktop/src/ipc/channels.ts         |   3 +
 surfsense_desktop/src/ipc/handlers.ts         |  12 +
 surfsense_desktop/src/main.ts                 |   4 +-
 .../src/modules/autocomplete/index.ts         |  48 +++-
 surfsense_desktop/src/modules/platform.ts     |  32 ++-
 surfsense_desktop/src/modules/quick-ask.ts    |  88 ++++--
 surfsense_desktop/src/modules/shortcuts.ts    |  42 +++
 surfsense_desktop/src/preload.ts              |   5 +
 .../components/DesktopContent.tsx             |  99 ++++++-
 surfsense_web/app/desktop/login/page.tsx      | 258 ++++++++++++++++++
 .../app/desktop/permissions/page.tsx          |  18 +-
 surfsense_web/app/desktop/suggestion/page.tsx |  24 +-
 surfsense_web/app/layout.tsx                  |  21 +-
 surfsense_web/components/UserDropdown.tsx     |   9 +-
 .../assistant-ui/assistant-message.tsx        |  12 +-
 .../tabs/all-connectors-tab.tsx               |   4 +-
 .../assistant-ui/inline-mention-editor.tsx    |  15 +
 .../components/assistant-ui/thread.tsx        |  24 +-
 .../components/desktop/shortcut-recorder.tsx  | 168 ++++++++++++
 .../layout/providers/LayoutDataProvider.tsx   |   6 +-
 .../layout/ui/sidebar/DocumentsSidebar.tsx    |  39 ++-
 surfsense_web/components/platform-gate.tsx    |  16 ++
 .../settings/user-settings-dialog.tsx         |  58 ++--
 .../components/sources/DocumentUploadTab.tsx  |  28 +-
 surfsense_web/contexts/platform-context.tsx   |  31 +++
 surfsense_web/hooks/use-folder-sync.ts        |  20 +-
 surfsense_web/hooks/use-platform.ts           |  12 +
 surfsense_web/lib/auth-utils.ts               |  13 +-
 surfsense_web/types/window.d.ts               |   3 +
 30 files changed, 923 insertions(+), 191 deletions(-)
 create mode 100644 surfsense_desktop/src/modules/shortcuts.ts
 create mode 100644 surfsense_web/app/desktop/login/page.tsx
 create mode 100644 surfsense_web/components/desktop/shortcut-recorder.tsx
 create mode 100644 surfsense_web/components/platform-gate.tsx
 create mode 100644 surfsense_web/contexts/platform-context.tsx
 create mode 100644 surfsense_web/hooks/use-platform.ts

diff --git a/surfsense_desktop/package.json b/surfsense_desktop/package.json
index 58c053c04..74f6274cb 100644
--- a/surfsense_desktop/package.json
+++ b/surfsense_desktop/package.json
@@ -4,7 +4,7 @@
   "description": "SurfSense Desktop App",
   "main": "dist/main.js",
   "scripts": {
-    "dev": "concurrently -k \"pnpm --dir ../surfsense_web dev\" \"wait-on http://localhost:3000 && electron .\"",
+    "dev": "pnpm build && concurrently -k \"pnpm --dir ../surfsense_web dev\" \"wait-on http://localhost:3000 && electron .\"",
     "build": "node scripts/build-electron.mjs",
     "pack:dir": "pnpm build && electron-builder --dir --config electron-builder.yml",
     "dist": "pnpm build && electron-builder --config electron-builder.yml",
diff --git a/surfsense_desktop/src/ipc/channels.ts b/surfsense_desktop/src/ipc/channels.ts
index d8a30347f..8051703fb 100644
--- a/surfsense_desktop/src/ipc/channels.ts
+++ b/surfsense_desktop/src/ipc/channels.ts
@@ -35,4 +35,7 @@ export const IPC_CHANNELS = {
   // Auth token sync across windows
   GET_AUTH_TOKENS: 'auth:get-tokens',
   SET_AUTH_TOKENS: 'auth:set-tokens',
+  // Keyboard shortcut configuration
+  GET_SHORTCUTS: 'shortcuts:get',
+  SET_SHORTCUTS: 'shortcuts:set',
 } as const;
diff --git a/surfsense_desktop/src/ipc/handlers.ts b/surfsense_desktop/src/ipc/handlers.ts
index b36dcbdcd..7872e7a42 100644
--- a/surfsense_desktop/src/ipc/handlers.ts
+++ b/surfsense_desktop/src/ipc/handlers.ts
@@ -20,6 +20,9 @@ import {
   browseFiles,
   readLocalFiles,
 } from '../modules/folder-watcher';
+import { getShortcuts, setShortcuts, type ShortcutConfig } from '../modules/shortcuts';
+import { reregisterQuickAsk } from '../modules/quick-ask';
+import { reregisterAutocomplete } from '../modules/autocomplete';
 
 let authTokens: { bearer: string; refresh: string } | null = null;
 
@@ -99,4 +102,13 @@ export function registerIpcHandlers(): void {
   ipcMain.handle(IPC_CHANNELS.GET_AUTH_TOKENS, () => {
     return authTokens;
   });
+
+  ipcMain.handle(IPC_CHANNELS.GET_SHORTCUTS, () => getShortcuts());
+
+  ipcMain.handle(IPC_CHANNELS.SET_SHORTCUTS, async (_event, config: Partial<ShortcutConfig>) => {
+    const updated = await setShortcuts(config);
+    if (config.quickAsk) await reregisterQuickAsk();
+    if (config.autocomplete) await reregisterAutocomplete();
+    return updated;
+  });
 }
diff --git a/surfsense_desktop/src/main.ts b/surfsense_desktop/src/main.ts
index 7ef0ad5be..9eae8a4db 100644
--- a/surfsense_desktop/src/main.ts
+++ b/surfsense_desktop/src/main.ts
@@ -29,8 +29,8 @@ app.whenReady().then(async () => {
   }
 
   createMainWindow('/dashboard');
-  registerQuickAsk();
-  registerAutocomplete();
+  await registerQuickAsk();
+  await registerAutocomplete();
   registerFolderWatcher();
   setupAutoUpdater();
 
diff --git a/surfsense_desktop/src/modules/autocomplete/index.ts b/surfsense_desktop/src/modules/autocomplete/index.ts
index 01a4cf913..1b64396b0 100644
--- a/surfsense_desktop/src/modules/autocomplete/index.ts
+++ b/surfsense_desktop/src/modules/autocomplete/index.ts
@@ -5,9 +5,9 @@ import { hasScreenRecordingPermission, requestAccessibility, requestScreenRecord
 import { getMainWindow } from '../window';
 import { captureScreen } from './screenshot';
 import { createSuggestionWindow, destroySuggestion, getSuggestionWindow } from './suggestion-window';
+import { getShortcuts } from '../shortcuts';
 
-const SHORTCUT = 'CommandOrControl+Shift+Space';
-
+let currentShortcut = '';
 let autocompleteEnabled = true;
 let savedClipboard = '';
 let sourceApp = '';
@@ -91,7 +91,12 @@ async function acceptAndInject(text: string): Promise<void> {
   }
 }
 
+let ipcRegistered = false;
+
 function registerIpcHandlers(): void {
+  if (ipcRegistered) return;
+  ipcRegistered = true;
+
   ipcMain.handle(IPC_CHANNELS.ACCEPT_SUGGESTION, async (_event, text: string) => {
     await acceptAndInject(text);
   });
@@ -107,26 +112,39 @@ function registerIpcHandlers(): void {
   ipcMain.handle(IPC_CHANNELS.GET_AUTOCOMPLETE_ENABLED, () => autocompleteEnabled);
 }
 
-export function registerAutocomplete(): void {
-  registerIpcHandlers();
+function autocompleteHandler(): void {
+  const sw = getSuggestionWindow();
+  if (sw && !sw.isDestroyed()) {
+    destroySuggestion();
+    return;
+  }
+  triggerAutocomplete();
+}
 
-  const ok = globalShortcut.register(SHORTCUT, () => {
-    const sw = getSuggestionWindow();
-    if (sw && !sw.isDestroyed()) {
-      destroySuggestion();
-      return;
-    }
-    triggerAutocomplete();
-  });
+async function registerShortcut(): Promise<void> {
+  const shortcuts = await getShortcuts();
+  currentShortcut = shortcuts.autocomplete;
+
+  const ok = globalShortcut.register(currentShortcut, autocompleteHandler);
 
   if (!ok) {
-    console.error(`[autocomplete] Failed to register shortcut ${SHORTCUT}`);
+    console.error(`[autocomplete] Failed to register shortcut ${currentShortcut}`);
   } else {
-    console.log(`[autocomplete] Registered shortcut ${SHORTCUT}`);
+    console.log(`[autocomplete] Registered shortcut ${currentShortcut}`);
   }
 }
 
+export async function registerAutocomplete(): Promise<void> {
+  registerIpcHandlers();
+  await registerShortcut();
+}
+
 export function unregisterAutocomplete(): void {
-  globalShortcut.unregister(SHORTCUT);
+  if (currentShortcut) globalShortcut.unregister(currentShortcut);
   destroySuggestion();
 }
+
+export async function reregisterAutocomplete(): Promise<void> {
+  unregisterAutocomplete();
+  await registerShortcut();
+}
diff --git a/surfsense_desktop/src/modules/platform.ts b/surfsense_desktop/src/modules/platform.ts
index 122e2efed..2b4d1f4a1 100644
--- a/surfsense_desktop/src/modules/platform.ts
+++ b/surfsense_desktop/src/modules/platform.ts
@@ -1,16 +1,20 @@
 import { execSync } from 'child_process';
 import { systemPreferences } from 'electron';
 
+const EXEC_OPTS = { windowsHide: true } as const;
+
 export function getFrontmostApp(): string {
   try {
     if (process.platform === 'darwin') {
       return execSync(
-        'osascript -e \'tell application "System Events" to get name of first application process whose frontmost is true\''
+        'osascript -e \'tell application "System Events" to get name of first application process whose frontmost is true\'',
+        EXEC_OPTS,
       ).toString().trim();
     }
     if (process.platform === 'win32') {
       return execSync(
-        'powershell -command "Add-Type \'using System; using System.Runtime.InteropServices; public class W { [DllImport(\\\"user32.dll\\\")] public static extern IntPtr GetForegroundWindow(); }\'; (Get-Process | Where-Object { $_.MainWindowHandle -eq [W]::GetForegroundWindow() }).ProcessName"'
+        'powershell -NoProfile -NonInteractive -command "Add-Type \'using System; using System.Runtime.InteropServices; public class W { [DllImport(\\\"user32.dll\\\")] public static extern IntPtr GetForegroundWindow(); }\'; (Get-Process | Where-Object { $_.MainWindowHandle -eq [W]::GetForegroundWindow() }).ProcessName"',
+        EXEC_OPTS,
       ).toString().trim();
     }
   } catch {
@@ -21,9 +25,23 @@ export function getFrontmostApp(): string {
 
 export function simulatePaste(): void {
   if (process.platform === 'darwin') {
-    execSync('osascript -e \'tell application "System Events" to keystroke "v" using command down\'');
+    execSync('osascript -e \'tell application "System Events" to keystroke "v" using command down\'', EXEC_OPTS);
   } else if (process.platform === 'win32') {
-    execSync('powershell -command "Add-Type -AssemblyName System.Windows.Forms; [System.Windows.Forms.SendKeys]::SendWait(\'^v\')"');
+    execSync('powershell -NoProfile -NonInteractive -command "Add-Type -AssemblyName System.Windows.Forms; [System.Windows.Forms.SendKeys]::SendWait(\'^v\')"', EXEC_OPTS);
+  }
+}
+
+export function simulateCopy(): boolean {
+  try {
+    if (process.platform === 'darwin') {
+      execSync('osascript -e \'tell application "System Events" to keystroke "c" using command down\'', EXEC_OPTS);
+    } else if (process.platform === 'win32') {
+      execSync('powershell -NoProfile -NonInteractive -command "Add-Type -AssemblyName System.Windows.Forms; [System.Windows.Forms.SendKeys]::SendWait(\'^c\')"', EXEC_OPTS);
+    }
+    return true;
+  } catch (err) {
+    console.error('[simulateCopy] Failed:', err);
+    return false;
   }
 }
 
@@ -36,12 +54,14 @@ export function getWindowTitle(): string {
   try {
     if (process.platform === 'darwin') {
       return execSync(
-        'osascript -e \'tell application "System Events" to get title of front window of first application process whose frontmost is true\''
+        'osascript -e \'tell application "System Events" to get title of front window of first application process whose frontmost is true\'',
+        EXEC_OPTS,
       ).toString().trim();
     }
     if (process.platform === 'win32') {
       return execSync(
-        'powershell -command "(Get-Process | Where-Object { $_.MainWindowHandle -eq (Add-Type -MemberDefinition \'[DllImport(\\\"user32.dll\\\")] public static extern IntPtr GetForegroundWindow();\' -Name W -PassThru)::GetForegroundWindow() }).MainWindowTitle"'
+        'powershell -NoProfile -NonInteractive -command "(Get-Process | Where-Object { $_.MainWindowHandle -eq (Add-Type -MemberDefinition \'[DllImport(\\\"user32.dll\\\")] public static extern IntPtr GetForegroundWindow();\' -Name W -PassThru)::GetForegroundWindow() }).MainWindowTitle"',
+        EXEC_OPTS,
       ).toString().trim();
     }
   } catch {
diff --git a/surfsense_desktop/src/modules/quick-ask.ts b/surfsense_desktop/src/modules/quick-ask.ts
index 52bfc6054..a015bfabf 100644
--- a/surfsense_desktop/src/modules/quick-ask.ts
+++ b/surfsense_desktop/src/modules/quick-ask.ts
@@ -1,10 +1,11 @@
 import { BrowserWindow, clipboard, globalShortcut, ipcMain, screen, shell } from 'electron';
 import path from 'path';
 import { IPC_CHANNELS } from '../ipc/channels';
-import { checkAccessibilityPermission, getFrontmostApp, simulatePaste } from './platform';
+import { checkAccessibilityPermission, getFrontmostApp, simulateCopy, simulatePaste } from './platform';
 import { getServerPort } from './server';
+import { getShortcuts } from './shortcuts';
 
-const SHORTCUT = 'CommandOrControl+Option+S';
+let currentShortcut = '';
 let quickAskWindow: BrowserWindow | null = null;
 let pendingText = '';
 let pendingMode = '';
@@ -77,29 +78,52 @@ function createQuickAskWindow(x: number, y: number): BrowserWindow {
   return quickAskWindow;
 }
 
-export function registerQuickAsk(): void {
-  const ok = globalShortcut.register(SHORTCUT, () => {
-    if (quickAskWindow && !quickAskWindow.isDestroyed()) {
-      destroyQuickAsk();
-      return;
-    }
+function openQuickAsk(text: string): void {
+  pendingText = text;
+  const cursor = screen.getCursorScreenPoint();
+  const pos = clampToScreen(cursor.x, cursor.y, 450, 750);
+  createQuickAskWindow(pos.x, pos.y);
+}
 
-    sourceApp = getFrontmostApp();
-    savedClipboard = clipboard.readText();
+async function quickAskHandler(): Promise<void> {
+  console.log('[quick-ask] Handler triggered');
 
-    const text = savedClipboard.trim();
-    if (!text) return;
-
-    pendingText = text;
-    const cursor = screen.getCursorScreenPoint();
-    const pos = clampToScreen(cursor.x, cursor.y, 450, 750);
-    createQuickAskWindow(pos.x, pos.y);
-  });
-
-  if (!ok) {
-    console.log(`Quick-ask: failed to register ${SHORTCUT}`);
+  if (quickAskWindow && !quickAskWindow.isDestroyed()) {
+    console.log('[quick-ask] Window already open, closing');
+    destroyQuickAsk();
+    return;
   }
 
+  if (!checkAccessibilityPermission()) {
+    console.log('[quick-ask] Accessibility permission denied');
+    return;
+  }
+
+  savedClipboard = clipboard.readText();
+  console.log('[quick-ask] Saved clipboard length:', savedClipboard.length);
+
+  const copyOk = simulateCopy();
+  console.log('[quick-ask] simulateCopy result:', copyOk);
+
+  await new Promise((r) => setTimeout(r, 300));
+
+  const afterCopy = clipboard.readText();
+  const selected = afterCopy.trim();
+  console.log('[quick-ask] Clipboard after copy length:', afterCopy.length, 'changed:', afterCopy !== savedClipboard);
+
+  const text = selected || savedClipboard.trim();
+
+  sourceApp = getFrontmostApp();
+  console.log('[quick-ask] Source app:', sourceApp, '| Opening Quick Ask with', text.length, 'chars', selected ? '(selected)' : text ? '(clipboard fallback)' : '(empty)');
+  openQuickAsk(text);
+}
+
+let ipcRegistered = false;
+
+function registerIpcHandlers(): void {
+  if (ipcRegistered) return;
+  ipcRegistered = true;
+
   ipcMain.handle(IPC_CHANNELS.QUICK_ASK_TEXT, () => {
     const text = pendingText;
     pendingText = '';
@@ -136,6 +160,24 @@ export function registerQuickAsk(): void {
   });
 }
 
-export function unregisterQuickAsk(): void {
-  globalShortcut.unregister(SHORTCUT);
+async function registerShortcut(): Promise<void> {
+  const shortcuts = await getShortcuts();
+  currentShortcut = shortcuts.quickAsk;
+
+  const ok = globalShortcut.register(currentShortcut, () => { quickAskHandler(); });
+  console.log(`[quick-ask] Register ${currentShortcut}: ${ok ? 'OK' : 'FAILED'}`);
+}
+
+export async function registerQuickAsk(): Promise<void> {
+  registerIpcHandlers();
+  await registerShortcut();
+}
+
+export function unregisterQuickAsk(): void {
+  if (currentShortcut) globalShortcut.unregister(currentShortcut);
+}
+
+export async function reregisterQuickAsk(): Promise<void> {
+  unregisterQuickAsk();
+  await registerShortcut();
 }
diff --git a/surfsense_desktop/src/modules/shortcuts.ts b/surfsense_desktop/src/modules/shortcuts.ts
new file mode 100644
index 000000000..8173b96c1
--- /dev/null
+++ b/surfsense_desktop/src/modules/shortcuts.ts
@@ -0,0 +1,42 @@
+export interface ShortcutConfig {
+  quickAsk: string;
+  autocomplete: string;
+}
+
+const DEFAULTS: ShortcutConfig = {
+  quickAsk: 'CommandOrControl+Alt+S',
+  autocomplete: 'CommandOrControl+Shift+Space',
+};
+
+const STORE_KEY = 'shortcuts';
+// eslint-disable-next-line @typescript-eslint/no-explicit-any -- lazily imported ESM module; matches folder-watcher.ts pattern
+let store: any = null;
+
+async function getStore() {
+  if (!store) {
+    const { default: Store } = await import('electron-store');
+    store = new Store({
+      name: 'keyboard-shortcuts',
+      defaults: { [STORE_KEY]: DEFAULTS },
+    });
+  }
+  return store;
+}
+
+export async function getShortcuts(): Promise<ShortcutConfig> {
+  const s = await getStore();
+  const stored = s.get(STORE_KEY) as Partial<ShortcutConfig> | undefined;
+  return { ...DEFAULTS, ...stored };
+}
+
+export async function setShortcuts(config: Partial<ShortcutConfig>): Promise<ShortcutConfig> {
+  const s = await getStore();
+  const current = (s.get(STORE_KEY) as ShortcutConfig) ?? DEFAULTS;
+  const merged = { ...current, ...config };
+  s.set(STORE_KEY, merged);
+  return merged;
+}
+
+export function getDefaults(): ShortcutConfig {
+  return { ...DEFAULTS };
+}
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 2811c3b46..58ddd745e 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -73,4 +73,9 @@ contextBridge.exposeInMainWorld('electronAPI', {
   getAuthTokens: () => ipcRenderer.invoke(IPC_CHANNELS.GET_AUTH_TOKENS),
   setAuthTokens: (bearer: string, refresh: string) =>
     ipcRenderer.invoke(IPC_CHANNELS.SET_AUTH_TOKENS, { bearer, refresh }),
+
+  // Keyboard shortcut configuration
+  getShortcuts: () => ipcRenderer.invoke(IPC_CHANNELS.GET_SHORTCUTS),
+  setShortcuts: (config: Record<string, string>) =>
+    ipcRenderer.invoke(IPC_CHANNELS.SET_SHORTCUTS, config),
 });
diff --git a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
index 1522e153f..f83c3c9d4 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
@@ -1,30 +1,54 @@
 "use client";
 
-import { useEffect, useState } from "react";
+import { Clipboard, Sparkles } from "lucide-react";
+import { useCallback, useEffect, useState } from "react";
+import { toast } from "sonner";
+import {
+	DEFAULT_SHORTCUTS,
+	ShortcutRecorder,
+} from "@/components/desktop/shortcut-recorder";
 import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
 import { Label } from "@/components/ui/label";
 import { Switch } from "@/components/ui/switch";
 import { Spinner } from "@/components/ui/spinner";
+import { useElectronAPI } from "@/hooks/use-platform";
 
 export function DesktopContent() {
-	const [isElectron, setIsElectron] = useState(false);
+	const api = useElectronAPI();
 	const [loading, setLoading] = useState(true);
 	const [enabled, setEnabled] = useState(true);
 
+	const [shortcuts, setShortcuts] = useState(DEFAULT_SHORTCUTS);
+	const [shortcutsLoaded, setShortcutsLoaded] = useState(false);
+
 	useEffect(() => {
-		if (!window.electronAPI) {
+		if (!api) {
 			setLoading(false);
+			setShortcutsLoaded(true);
 			return;
 		}
-		setIsElectron(true);
 
-		window.electronAPI.getAutocompleteEnabled().then((val) => {
-			setEnabled(val);
+		let mounted = true;
+
+		Promise.all([
+			api.getAutocompleteEnabled(),
+			api.getShortcuts?.() ?? Promise.resolve(null),
+		]).then(([autoEnabled, config]) => {
+			if (!mounted) return;
+			setEnabled(autoEnabled);
+			if (config) setShortcuts(config);
 			setLoading(false);
+			setShortcutsLoaded(true);
+		}).catch(() => {
+			if (!mounted) return;
+			setLoading(false);
+			setShortcutsLoaded(true);
 		});
-	}, []);
 
-	if (!isElectron) {
+		return () => { mounted = false; };
+	}, [api]);
+
+	if (!api) {
 		return (
 			<div className="flex flex-col items-center justify-center py-12 text-center">
 				<p className="text-sm text-muted-foreground">
@@ -44,11 +68,68 @@ export function DesktopContent() {
 
 	const handleToggle = async (checked: boolean) => {
 		setEnabled(checked);
-		await window.electronAPI!.setAutocompleteEnabled(checked);
+		await api.setAutocompleteEnabled(checked);
+	};
+
+	const updateShortcut = (key: "quickAsk" | "autocomplete", accelerator: string) => {
+		setShortcuts((prev) => {
+			const updated = { ...prev, [key]: accelerator };
+			api.setShortcuts?.({ [key]: accelerator }).catch(() => {
+				toast.error("Failed to update shortcut");
+			});
+			return updated;
+		});
+		toast.success("Shortcut updated");
+	};
+
+	const resetShortcut = (key: "quickAsk" | "autocomplete") => {
+		updateShortcut(key, DEFAULT_SHORTCUTS[key]);
 	};
 
 	return (
 		<div className="space-y-4 md:space-y-6">
+			{/* Keyboard Shortcuts */}
+			<Card>
+				<CardHeader className="px-3 md:px-6 pt-3 md:pt-6 pb-2 md:pb-3">
+					<CardTitle className="text-base md:text-lg">Keyboard Shortcuts</CardTitle>
+					<CardDescription className="text-xs md:text-sm">
+						Customize the global keyboard shortcuts for desktop features.
+					</CardDescription>
+				</CardHeader>
+				<CardContent className="px-3 md:px-6 pb-3 md:pb-6">
+					{shortcutsLoaded ? (
+						<div className="flex flex-col gap-3">
+							<ShortcutRecorder
+								value={shortcuts.quickAsk}
+								onChange={(accel) => updateShortcut("quickAsk", accel)}
+								onReset={() => resetShortcut("quickAsk")}
+								defaultValue={DEFAULT_SHORTCUTS.quickAsk}
+								label="Quick Ask"
+								description="Copy selected text and ask AI about it"
+								icon={Clipboard}
+							/>
+							<ShortcutRecorder
+								value={shortcuts.autocomplete}
+								onChange={(accel) => updateShortcut("autocomplete", accel)}
+								onReset={() => resetShortcut("autocomplete")}
+								defaultValue={DEFAULT_SHORTCUTS.autocomplete}
+								label="Autocomplete"
+								description="Get AI writing suggestions from a screenshot"
+								icon={Sparkles}
+							/>
+							<p className="text-[11px] text-muted-foreground">
+								Click a shortcut and press a new key combination to change it.
+							</p>
+						</div>
+					) : (
+						<div className="flex justify-center py-4">
+							<Spinner size="sm" />
+						</div>
+					)}
+				</CardContent>
+			</Card>
+
+			{/* Autocomplete Toggle */}
 			<Card>
 				<CardHeader className="px-3 md:px-6 pt-3 md:pt-6 pb-2 md:pb-3">
 					<CardTitle className="text-base md:text-lg">Autocomplete</CardTitle>
diff --git a/surfsense_web/app/desktop/login/page.tsx b/surfsense_web/app/desktop/login/page.tsx
new file mode 100644
index 000000000..529577b59
--- /dev/null
+++ b/surfsense_web/app/desktop/login/page.tsx
@@ -0,0 +1,258 @@
+"use client";
+
+import { IconBrandGoogleFilled } from "@tabler/icons-react";
+import { useAtom } from "jotai";
+import {
+	Eye,
+	EyeOff,
+	Keyboard,
+	Clipboard,
+	Sparkles,
+} from "lucide-react";
+import Image from "next/image";
+import { useRouter } from "next/navigation";
+import { useCallback, useEffect, useState } from "react";
+import { toast } from "sonner";
+import { loginMutationAtom } from "@/atoms/auth/auth-mutation.atoms";
+import {
+	DEFAULT_SHORTCUTS,
+	ShortcutRecorder,
+} from "@/components/desktop/shortcut-recorder";
+import { Button } from "@/components/ui/button";
+import {
+	Card,
+	CardContent,
+	CardDescription,
+	CardHeader,
+	CardTitle,
+} from "@/components/ui/card";
+import { Input } from "@/components/ui/input";
+import { Label } from "@/components/ui/label";
+import { Separator } from "@/components/ui/separator";
+import { Spinner } from "@/components/ui/spinner";
+import { useElectronAPI } from "@/hooks/use-platform";
+import { AUTH_TYPE, BACKEND_URL } from "@/lib/env-config";
+
+const isGoogleAuth = AUTH_TYPE === "GOOGLE"; // picks the Google button over the email/password form
+
+/**
+ * Login screen for the desktop app: shows the global keyboard shortcuts so they can be
+ * rebound, then offers Google sign-in or an email/password form depending on AUTH_TYPE.
+ */
+export default function DesktopLoginPage() {
+	const router = useRouter();
+	const api = useElectronAPI();
+	const [{ mutateAsync: login, isPending: isLoggingIn }] = useAtom(loginMutationAtom);
+
+	const [email, setEmail] = useState("");
+	const [password, setPassword] = useState("");
+	const [showPassword, setShowPassword] = useState(false);
+	const [loginError, setLoginError] = useState<string | null>(null);
+
+	const [shortcuts, setShortcuts] = useState(DEFAULT_SHORTCUTS);
+	const [shortcutsLoaded, setShortcutsLoaded] = useState(false);
+
+	useEffect(() => {
+		if (!api?.getShortcuts) {
+			setShortcutsLoaded(true); // nothing to load, so the defaults are shown
+			return;
+		}
+		api.getShortcuts().then((config) => {
+			if (config) setShortcuts(config);
+			setShortcutsLoaded(true);
+		}).catch(() => setShortcutsLoaded(true));
+	}, [api]);
+
+	const updateShortcut = useCallback(
+		(key: "quickAsk" | "autocomplete", accelerator: string) => {
+			// Keep the updater pure: React may call it twice, so the API call lives outside it.
+			setShortcuts((prev) => ({ ...prev, [key]: accelerator }));
+			// Report success only after the desktop API call has resolved.
+			Promise.resolve(api?.setShortcuts?.({ [key]: accelerator }))
+				.then(() => toast.success("Shortcut updated"))
+				.catch(() => toast.error("Failed to update shortcut"));
+		},
+		[api]
+	);
+
+	const resetShortcut = useCallback(
+		(key: "quickAsk" | "autocomplete") => {
+			updateShortcut(key, DEFAULT_SHORTCUTS[key]);
+		},
+		[updateShortcut]
+	);
+
+	const handleGoogleLogin = () => {
+		window.location.href = `${BACKEND_URL}/auth/google/authorize-redirect`;
+	};
+
+	const handleLocalLogin = async (e: React.FormEvent) => {
+		e.preventDefault();
+		setLoginError(null);
+
+		try {
+			const data = await login({
+				username: email,
+				password,
+				grant_type: "password",
+			});
+
+			if (typeof window !== "undefined") {
+				sessionStorage.setItem("login_success_tracked", "true");
+			}
+
+			setTimeout(() => {
+				// Encode the token so characters such as "+" or "&" survive the query string.
+				router.push(`/auth/callback?token=${encodeURIComponent(data.access_token)}`);
+			}, 300);
+		} catch (err) {
+			if (err instanceof Error) {
+				setLoginError(err.message);
+			} else {
+				setLoginError("Login failed. Please check your credentials.");
+			}
+		}
+	};
+
+	return (
+		<div className="relative flex min-h-screen items-center justify-center bg-background p-4">
+			<div className="pointer-events-none absolute inset-0 overflow-hidden">
+				<div
+					className="absolute -top-1/2 left-1/2 size-[800px] -translate-x-1/2 rounded-full opacity-[0.03]"
+					style={{
+						background: "radial-gradient(circle, hsl(var(--primary)) 0%, transparent 70%)",
+					}}
+				/>
+			</div>
+
+			<Card className="relative w-full max-w-md shadow-lg">
+				<CardHeader className="items-center text-center pb-4">
+					<Image
+						src="/icon-128.svg"
+						className="select-none dark:invert size-14 rounded-md mb-2"
+						alt="SurfSense"
+						width={56}
+						height={56}
+						priority
+					/>
+					<CardTitle className="text-xl">Welcome to SurfSense Desktop App</CardTitle>
+					<CardDescription>Configure your shortcuts, then sign in to get started.</CardDescription>
+				</CardHeader>
+
+				<CardContent className="flex flex-col gap-6">
+					{/* ---- Shortcuts Section (first) ---- */}
+					{shortcutsLoaded ? (
+						<div className="flex flex-col gap-3">
+							<div className="flex items-center gap-1.5 text-xs font-medium text-muted-foreground mb-1">
+								<Keyboard className="size-3" />
+								Keyboard Shortcuts
+							</div>
+							<ShortcutRecorder
+								value={shortcuts.quickAsk}
+								onChange={(accel) => updateShortcut("quickAsk", accel)}
+								onReset={() => resetShortcut("quickAsk")}
+								defaultValue={DEFAULT_SHORTCUTS.quickAsk}
+								label="Quick Ask"
+								description="Copy selected text and ask AI about it"
+								icon={Clipboard}
+							/>
+							<ShortcutRecorder
+								value={shortcuts.autocomplete}
+								onChange={(accel) => updateShortcut("autocomplete", accel)}
+								onReset={() => resetShortcut("autocomplete")}
+								defaultValue={DEFAULT_SHORTCUTS.autocomplete}
+								label="Autocomplete"
+								description="Get AI writing suggestions from a screenshot"
+								icon={Sparkles}
+							/>
+							<p className="text-[11px] text-muted-foreground text-center">
+								Click a shortcut and press a new key combination to change it.
+							</p>
+						</div>
+					) : (
+						<div className="flex justify-center py-4">
+							<Spinner size="sm" />
+						</div>
+					)}
+
+					{/* ---- Divider ---- */}
+					<Separator />
+
+					{/* ---- Auth Section (second) ---- */}
+					{isGoogleAuth ? (
+						<Button
+							variant="outline"
+							className="w-full gap-2 py-5"
+							onClick={handleGoogleLogin}
+						>
+							<IconBrandGoogleFilled className="size-5" />
+							Continue with Google
+						</Button>
+					) : (
+						<form onSubmit={handleLocalLogin} className="flex flex-col gap-4">
+							{loginError && (
+								<div className="rounded-md border border-destructive/20 bg-destructive/10 px-3 py-2 text-sm text-destructive">
+									{loginError}
+								</div>
+							)}
+
+							<div className="flex flex-col gap-2">
+								<Label htmlFor="email">Email</Label>
+								<Input
+									id="email"
+									type="email"
+									placeholder="you@example.com"
+									required
+									value={email}
+									onChange={(e) => setEmail(e.target.value)}
+									disabled={isLoggingIn}
+									autoFocus
+								/>
+							</div>
+
+							<div className="flex flex-col gap-2">
+								<Label htmlFor="password">Password</Label>
+								<div className="relative">
+									<Input
+										id="password"
+										type={showPassword ? "text" : "password"}
+										placeholder="Enter your password"
+										required
+										value={password}
+										onChange={(e) => setPassword(e.target.value)}
+										disabled={isLoggingIn}
+										className="pr-10"
+									/>
+									<button
+										type="button"
+										onClick={() => setShowPassword((v) => !v)}
+										aria-label={showPassword ? "Hide password" : "Show password"}
+										className="absolute inset-y-0 right-0 flex items-center pr-3 text-muted-foreground hover:text-foreground"
+										tabIndex={-1}
+									>
+										{showPassword ? (
+											<EyeOff className="size-4" />
+										) : (
+											<Eye className="size-4" />
+										)}
+									</button>
+								</div>
+							</div>
+
+							<Button type="submit" disabled={isLoggingIn} className="mt-1">
+								{isLoggingIn ? (
+									<>
+										<Spinner size="sm" className="text-primary-foreground" />
+										Signing in...
+									</>
+								) : (
+									"Sign in"
+								)}
+							</Button>
+						</form>
+					)}
+				</CardContent>
+			</Card>
+		</div>
+	);
+}
diff --git a/surfsense_web/app/desktop/permissions/page.tsx b/surfsense_web/app/desktop/permissions/page.tsx
index 6c08e35b5..178b6a533 100644
--- a/surfsense_web/app/desktop/permissions/page.tsx
+++ b/surfsense_web/app/desktop/permissions/page.tsx
@@ -5,6 +5,7 @@ import { useRouter } from "next/navigation";
 import { Logo } from "@/components/Logo";
 import { Button } from "@/components/ui/button";
 import { Spinner } from "@/components/ui/spinner";
+import { useElectronAPI } from "@/hooks/use-platform";
 
 type PermissionStatus = "authorized" | "denied" | "not determined" | "restricted" | "limited";
 
@@ -57,19 +58,18 @@ function StatusBadge({ status }: { status: PermissionStatus }) {
 
 export default function DesktopPermissionsPage() {
 	const router = useRouter();
+	const api = useElectronAPI();
 	const [permissions, setPermissions] = useState<PermissionsStatus | null>(null);
-	const [isElectron, setIsElectron] = useState(false);
 
 	useEffect(() => {
-		if (!window.electronAPI) return;
-		setIsElectron(true);
+		if (!api) return;
 
 		let interval: ReturnType<typeof setInterval> | null = null;
 
 		const isResolved = (s: string) => s === "authorized" || s === "restricted";
 
 		const poll = async () => {
-			const status = await window.electronAPI!.getPermissionsStatus();
+			const status = await api.getPermissionsStatus();
 			setPermissions(status);
 
 			if (isResolved(status.accessibility) && isResolved(status.screenRecording)) {
@@ -80,9 +80,9 @@ export default function DesktopPermissionsPage() {
 		poll();
 		interval = setInterval(poll, 2000);
 		return () => { if (interval) clearInterval(interval); };
-	}, []);
+	}, [api]);
 
-	if (!isElectron) {
+	if (!api) {
 		return (
 			<div className="h-screen flex items-center justify-center bg-background">
 				<p className="text-muted-foreground">This page is only available in the desktop app.</p>
@@ -102,15 +102,15 @@ export default function DesktopPermissionsPage() {
 
 	const handleRequest = async (action: string) => {
 		if (action === "requestScreenRecording") {
-			await window.electronAPI!.requestScreenRecording();
+			await api.requestScreenRecording();
 		} else if (action === "requestAccessibility") {
-			await window.electronAPI!.requestAccessibility();
+			await api.requestAccessibility();
 		}
 	};
 
 	const handleContinue = () => {
 		if (allGranted) {
-			window.electronAPI!.restartApp();
+			api.restartApp();
 		}
 	};
 
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index 097047bb1..fb83e2113 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -1,6 +1,7 @@
 "use client";
 
 import { useCallback, useEffect, useRef, useState } from "react";
+import { useElectronAPI } from "@/hooks/use-platform";
 import { getBearerToken, ensureTokensFromElectron } from "@/lib/auth-utils";
 
 type SSEEvent =
@@ -34,26 +35,27 @@ function friendlyError(raw: string | number): string {
 const AUTO_DISMISS_MS = 3000;
 
 export default function SuggestionPage() {
+	const api = useElectronAPI();
 	const [suggestion, setSuggestion] = useState("");
 	const [isLoading, setIsLoading] = useState(true);
-	const [isDesktop, setIsDesktop] = useState(true);
 	const [error, setError] = useState<string | null>(null);
 	const abortRef = useRef<AbortController | null>(null);
 
+	const isDesktop = !!api?.onAutocompleteContext;
+
 	useEffect(() => {
-		if (!window.electronAPI?.onAutocompleteContext) {
-			setIsDesktop(false);
+		if (!api?.onAutocompleteContext) {
 			setIsLoading(false);
 		}
-	}, []);
+	}, [api]);
 
 	useEffect(() => {
 		if (!error) return;
 		const timer = setTimeout(() => {
-			window.electronAPI?.dismissSuggestion?.();
+			api?.dismissSuggestion?.();
 		}, AUTO_DISMISS_MS);
 		return () => clearTimeout(timer);
-	}, [error]);
+	}, [error, api]);
 
 	const fetchSuggestion = useCallback(
 		async (screenshot: string, searchSpaceId: string, appName?: string, windowTitle?: string) => {
@@ -153,9 +155,9 @@ export default function SuggestionPage() {
 	);
 
 	useEffect(() => {
-		if (!window.electronAPI?.onAutocompleteContext) return;
+		if (!api?.onAutocompleteContext) return;
 
-		const cleanup = window.electronAPI.onAutocompleteContext((data) => {
+		const cleanup = api.onAutocompleteContext((data) => {
 			const searchSpaceId = data.searchSpaceId || "1";
 			if (data.screenshot) {
 				fetchSuggestion(data.screenshot, searchSpaceId, data.appName, data.windowTitle);
@@ -163,7 +165,7 @@ export default function SuggestionPage() {
 		});
 
 		return cleanup;
-	}, [fetchSuggestion]);
+	}, [fetchSuggestion, api]);
 
 	if (!isDesktop) {
 		return (
@@ -197,12 +199,12 @@ export default function SuggestionPage() {
 
 	const handleAccept = () => {
 		if (suggestion) {
-			window.electronAPI?.acceptSuggestion?.(suggestion);
+			api?.acceptSuggestion?.(suggestion);
 		}
 	};
 
 	const handleDismiss = () => {
-		window.electronAPI?.dismissSuggestion?.();
+		api?.dismissSuggestion?.();
 	};
 
 	if (!suggestion) return null;
diff --git a/surfsense_web/app/layout.tsx b/surfsense_web/app/layout.tsx
index 784fd3bcf..8ebb0e848 100644
--- a/surfsense_web/app/layout.tsx
+++ b/surfsense_web/app/layout.tsx
@@ -10,6 +10,7 @@ import { ZeroProvider } from "@/components/providers/ZeroProvider";
 import { ThemeProvider } from "@/components/theme/theme-provider";
 import { Toaster } from "@/components/ui/sonner";
 import { LocaleProvider } from "@/contexts/LocaleContext";
+import { PlatformProvider } from "@/contexts/platform-context";
 import { ReactQueryClientProvider } from "@/lib/query-client/query-client.provider";
 import { cn } from "@/lib/utils";
 
@@ -139,15 +140,17 @@ export default function RootLayout({
 								disableTransitionOnChange
 								defaultTheme="system"
 							>
-								<RootProvider>
-									<ReactQueryClientProvider>
-										<ZeroProvider>
-											<GlobalLoadingProvider>{children}</GlobalLoadingProvider>
-										</ZeroProvider>
-									</ReactQueryClientProvider>
-									<Toaster />
-									<AnnouncementToastProvider />
-								</RootProvider>
+								<PlatformProvider>
+									<RootProvider>
+										<ReactQueryClientProvider>
+											<ZeroProvider>
+												<GlobalLoadingProvider>{children}</GlobalLoadingProvider>
+											</ZeroProvider>
+										</ReactQueryClientProvider>
+										<Toaster />
+										<AnnouncementToastProvider />
+									</RootProvider>
+								</PlatformProvider>
 							</ThemeProvider>
 						</I18nProvider>
 					</LocaleProvider>
diff --git a/surfsense_web/components/UserDropdown.tsx b/surfsense_web/components/UserDropdown.tsx
index 197db6287..19dceb06b 100644
--- a/surfsense_web/components/UserDropdown.tsx
+++ b/surfsense_web/components/UserDropdown.tsx
@@ -15,7 +15,7 @@ import {
 	DropdownMenuTrigger,
 } from "@/components/ui/dropdown-menu";
 import { Spinner } from "@/components/ui/spinner";
-import { logout } from "@/lib/auth-utils";
+import { getLoginPath, logout } from "@/lib/auth-utils";
 import { resetUser, trackLogout } from "@/lib/posthog/events";
 
 export function UserDropdown({
@@ -33,22 +33,19 @@ export function UserDropdown({
 		if (isLoggingOut) return;
 		setIsLoggingOut(true);
 		try {
-			// Track logout event and reset PostHog identity
 			trackLogout();
 			resetUser();
 
-			// Revoke refresh token on server and clear all tokens from localStorage
 			await logout();
 
 			if (typeof window !== "undefined") {
-				window.location.href = "/";
+				window.location.href = getLoginPath();
 			}
 		} catch (error) {
 			console.error("Error during logout:", error);
-			// Even if there's an error, try to clear tokens and redirect
 			await logout();
 			if (typeof window !== "undefined") {
-				window.location.href = "/";
+				window.location.href = getLoginPath();
 			}
 		}
 	};
diff --git a/surfsense_web/components/assistant-ui/assistant-message.tsx b/surfsense_web/components/assistant-ui/assistant-message.tsx
index 0dcaf6350..d0cada0bd 100644
--- a/surfsense_web/components/assistant-ui/assistant-message.tsx
+++ b/surfsense_web/components/assistant-ui/assistant-message.tsx
@@ -87,6 +87,7 @@ import {
 } from "@/components/ui/drawer";
 import { useComments } from "@/hooks/use-comments";
 import { useMediaQuery } from "@/hooks/use-media-query";
+import { useElectronAPI } from "@/hooks/use-platform";
 import { cn } from "@/lib/utils";
 
 // Dynamically import video presentation tool to avoid loading Babel and Remotion in main bundle
@@ -463,16 +464,17 @@ export const AssistantMessage: FC = () => {
 const AssistantActionBar: FC = () => {
 	const isLast = useAuiState((s) => s.message.isLast);
 	const aui = useAui();
+	const api = useElectronAPI();
 	const [quickAskMode, setQuickAskMode] = useState("");
 
 	useEffect(() => {
-		if (!isLast || !window.electronAPI?.getQuickAskMode) return;
-		window.electronAPI.getQuickAskMode().then((mode) => {
+		if (!isLast || !api?.getQuickAskMode) return;
+		api.getQuickAskMode().then((mode) => {
 			if (mode) setQuickAskMode(mode);
 		});
-	}, [isLast]);
+	}, [isLast, api]);
 
-	const isTransform = isLast && !!window.electronAPI?.replaceText && quickAskMode === "transform";
+	const isTransform = isLast && !!api?.replaceText && quickAskMode === "transform";
 
 	return (
 		<ActionBarPrimitive.Root
@@ -508,7 +510,7 @@ const AssistantActionBar: FC = () => {
 					type="button"
 					onClick={() => {
 						const text = aui.message().getCopyText();
-						window.electronAPI?.replaceText(text);
+						api?.replaceText(text);
 					}}
 					className="ml-1 inline-flex items-center gap-1.5 rounded-md bg-primary px-3 py-1.5 text-xs font-medium text-primary-foreground transition-colors hover:bg-primary/90"
 				>
diff --git a/surfsense_web/components/assistant-ui/connector-popup/tabs/all-connectors-tab.tsx b/surfsense_web/components/assistant-ui/connector-popup/tabs/all-connectors-tab.tsx
index 3e8aad620..4a97863fb 100644
--- a/surfsense_web/components/assistant-ui/connector-popup/tabs/all-connectors-tab.tsx
+++ b/surfsense_web/components/assistant-ui/connector-popup/tabs/all-connectors-tab.tsx
@@ -3,6 +3,7 @@
 import type { FC } from "react";
 import { EnumConnectorName } from "@/contracts/enums/connector";
 import type { SearchSourceConnector } from "@/contracts/types/connector.types";
+import { usePlatform } from "@/hooks/use-platform";
 import { isSelfHosted } from "@/lib/env-config";
 import { ConnectorCard } from "../components/connector-card";
 import {
@@ -74,9 +75,8 @@ export const AllConnectorsTab: FC<AllConnectorsTabProps> = ({
 	onManage,
 	onViewAccountsList,
 }) => {
-	// Check if self-hosted mode (for showing self-hosted only connectors)
 	const selfHosted = isSelfHosted();
-	const isDesktop = typeof window !== "undefined" && !!window.electronAPI;
+	const { isDesktop } = usePlatform();
 
 	const matchesSearch = (title: string, description: string) =>
 		title.toLowerCase().includes(searchQuery.toLowerCase()) ||
diff --git a/surfsense_web/components/assistant-ui/inline-mention-editor.tsx b/surfsense_web/components/assistant-ui/inline-mention-editor.tsx
index af7a8397c..2d55f4d20 100644
--- a/surfsense_web/components/assistant-ui/inline-mention-editor.tsx
+++ b/surfsense_web/components/assistant-ui/inline-mention-editor.tsx
@@ -24,6 +24,7 @@ export interface MentionedDocument {
 export interface InlineMentionEditorRef {
 	focus: () => void;
 	clear: () => void;
+	setText: (text: string) => void;
 	getText: () => string;
 	getMentionedDocuments: () => MentionedDocument[];
 	insertDocumentChip: (doc: Pick<Document, "id" | "title" | "document_type">) => void;
@@ -397,6 +398,19 @@ export const InlineMentionEditor = forwardRef<InlineMentionEditorRef, InlineMent
 			}
 		}, []);
 
+		// Overwrites the editor with plain text, syncs the empty flag, notifies onChange, then focuses the end
+		const setText = useCallback(
+			(text: string) => {
+				const editor = editorRef.current;
+				if (!editor) return;
+				editor.innerText = text;
+				setIsEmpty(text.length === 0);
+				onChange?.(text, Array.from(mentionedDocs.values()));
+				focusAtEnd();
+			},
+			[focusAtEnd, onChange, mentionedDocs]
+		);
+
 		const setDocumentChipStatus = useCallback(
 			(
 				docId: number,
@@ -469,6 +483,7 @@ export const InlineMentionEditor = forwardRef<InlineMentionEditorRef, InlineMent
 		useImperativeHandle(ref, () => ({
 			focus: () => editorRef.current?.focus(),
 			clear,
+			setText,
 			getText,
 			getMentionedDocuments,
 			insertDocumentChip,
diff --git a/surfsense_web/components/assistant-ui/thread.tsx b/surfsense_web/components/assistant-ui/thread.tsx
index 597fcce39..7d8765399 100644
--- a/surfsense_web/components/assistant-ui/thread.tsx
+++ b/surfsense_web/components/assistant-ui/thread.tsx
@@ -89,6 +89,7 @@ import type { Document } from "@/contracts/types/document.types";
 import { useBatchCommentsPreload } from "@/hooks/use-comments";
 import { useCommentsSync } from "@/hooks/use-comments-sync";
 import { useMediaQuery } from "@/hooks/use-media-query";
+import { useElectronAPI } from "@/hooks/use-platform";
 import { cn } from "@/lib/utils";
 
 /** Placeholder texts that cycle in new chats when input is empty */
@@ -362,18 +363,19 @@ const Composer: FC = () => {
 		};
 	}, []);
 
+	const electronAPI = useElectronAPI();
 	const [clipboardInitialText, setClipboardInitialText] = useState<string | undefined>();
 	const clipboardLoadedRef = useRef(false);
 	useEffect(() => {
-		if (!window.electronAPI || clipboardLoadedRef.current) return;
+		if (!electronAPI || clipboardLoadedRef.current) return;
 		clipboardLoadedRef.current = true;
-		window.electronAPI.getQuickAskText().then((text) => {
+		electronAPI.getQuickAskText().then((text) => {
 			if (text) {
 				setClipboardInitialText(text);
 				setShowPromptPicker(true);
 			}
 		});
-	}, []);
+	}, [electronAPI]);
 
 	const isThreadEmpty = useAuiState(({ thread }) => thread.isEmpty);
 	const isThreadRunning = useAuiState(({ thread }) => thread.isRunning);
@@ -504,34 +506,28 @@ const Composer: FC = () => {
 				: userText
 					? `${action.prompt}\n\n${userText}`
 					: action.prompt;
+			editorRef.current?.setText(finalPrompt);
 			aui.composer().setText(finalPrompt);
-			aui.composer().send();
-			editorRef.current?.clear();
 			setShowPromptPicker(false);
 			setActionQuery("");
-			setMentionedDocuments([]);
-			setSidebarDocs([]);
 		},
-		[actionQuery, aui, setMentionedDocuments, setSidebarDocs]
+		[actionQuery, aui]
 	);
 
 	const handleQuickAskSelect = useCallback(
 		(action: { name: string; prompt: string; mode: "transform" | "explore" }) => {
 			if (!clipboardInitialText) return;
-			window.electronAPI?.setQuickAskMode(action.mode);
+			electronAPI?.setQuickAskMode(action.mode);
 			const finalPrompt = action.prompt.includes("{selection}")
 				? action.prompt.replace("{selection}", () => clipboardInitialText)
 				: `${action.prompt}\n\n${clipboardInitialText}`;
+			editorRef.current?.setText(finalPrompt);
 			aui.composer().setText(finalPrompt);
-			aui.composer().send();
-			editorRef.current?.clear();
 			setShowPromptPicker(false);
 			setActionQuery("");
 			setClipboardInitialText(undefined);
-			setMentionedDocuments([]);
-			setSidebarDocs([]);
 		},
-		[clipboardInitialText, aui, setMentionedDocuments, setSidebarDocs]
+		[clipboardInitialText, electronAPI, aui]
 	);
 
 	// Keyboard navigation for document/action picker (arrow keys, Enter, Escape)
diff --git a/surfsense_web/components/desktop/shortcut-recorder.tsx b/surfsense_web/components/desktop/shortcut-recorder.tsx
new file mode 100644
index 000000000..0c0012002
--- /dev/null
+++ b/surfsense_web/components/desktop/shortcut-recorder.tsx
@@ -0,0 +1,168 @@
+"use client";
+
+import { RotateCcw } from "lucide-react";
+import { useCallback, useRef, useState } from "react";
+import { Button } from "@/components/ui/button";
+import { cn } from "@/lib/utils";
+
+// ---------------------------------------------------------------------------
+// Accelerator ↔ display helpers
+// ---------------------------------------------------------------------------
+
+/** Converts a keydown event to an Electron accelerator, or null if it is not modifier + key. */
+export function keyEventToAccelerator(e: React.KeyboardEvent): string | null {
+	const { key } = e;
+	// A modifier pressed on its own is not a complete shortcut yet.
+	if (["Control", "Meta", "Alt", "Shift"].includes(key)) return null;
+
+	const modifiers: string[] = [];
+	if (e.ctrlKey || e.metaKey) modifiers.push("CommandOrControl");
+	if (e.altKey) modifiers.push("Alt");
+	if (e.shiftKey) modifiers.push("Shift");
+	if (modifiers.length === 0) return null;
+
+	// Electron names: "+" is the separator so it is spelled "Plus"; arrows drop the "Arrow" prefix.
+	const named = key === " " ? "Space" : key === "+" ? "Plus" : key.replace(/^Arrow(?=\w)/, "");
+	return [...modifiers, named.length === 1 ? named.toUpperCase() : named].join("+");
+}
+
+/** Splits an accelerator such as "CommandOrControl+Alt+S" into the labels rendered as key caps. */
+export function acceleratorToDisplay(accel: string): string[] {
+	if (!accel) return [];
+	const labels: string[] = [];
+	// Every segment is shown verbatim except CommandOrControl, which is always rendered as "Ctrl".
+	for (const token of accel.split("+")) labels.push(token === "CommandOrControl" ? "Ctrl" : token);
+	return labels;
+}
+
+export const DEFAULT_SHORTCUTS = {
+	quickAsk: "CommandOrControl+Alt+S", // default accelerator for the "Quick Ask" shortcut
+	autocomplete: "CommandOrControl+Shift+Space", // default accelerator for the "Autocomplete" shortcut
+};
+
+// ---------------------------------------------------------------------------
+// Kbd pill component
+// ---------------------------------------------------------------------------
+
+/**
+ * Renders a row of key-cap pills, one `<kbd>` element per entry in `keys`.
+ *
+ * @param keys - Labels to show, in order; each label doubles as its React list key.
+ * @param className - Extra classes merged onto the wrapping `<span>`.
+ */
+export function Kbd({ keys, className }: { keys: string[]; className?: string }) {
+	// Labels longer than three characters get wider horizontal padding.
+	const pillClass = (label: string) =>
+		cn(
+			"inline-flex h-7 min-w-7 items-center justify-center rounded-md border bg-muted px-1.5 font-mono text-xs font-medium text-muted-foreground shadow-sm",
+			label.length > 3 && "px-2"
+		);
+
+	// One pill per label, in the order given.
+	const pills = keys.map((label) => (
+		<kbd key={label} className={pillClass(label)}>
+			{label}
+		</kbd>
+	));
+
+	return <span className={cn("inline-flex items-center gap-1", className)}>{pills}</span>;
+}
+
+// ---------------------------------------------------------------------------
+// Shortcut recorder component
+// ---------------------------------------------------------------------------
+
+/**
+ * One settings row for a global shortcut: icon, label and description on the left, and on the
+ * right a button that shows the current accelerator and records a replacement when clicked.
+ *
+ * While recording, every keydown is swallowed: Escape cancels, and the first combination that
+ * `keyEventToAccelerator` accepts is passed to `onChange`. Losing focus also stops recording.
+ * The reset button is rendered only while `value` differs from `defaultValue`.
+ */
+export function ShortcutRecorder({
+	value,
+	onChange,
+	onReset,
+	defaultValue,
+	label,
+	description,
+	icon: Icon,
+}: {
+	value: string;
+	onChange: (accelerator: string) => void;
+	onReset: () => void;
+	defaultValue: string;
+	label: string;
+	description: string;
+	icon: React.ElementType;
+}) {
+	const [recording, setRecording] = useState(false);
+	const triggerRef = useRef<HTMLButtonElement>(null);
+
+	const handleKeyDown = useCallback(
+		(event: React.KeyboardEvent) => {
+			if (!recording) return;
+			event.preventDefault();
+			event.stopPropagation();
+
+			if (event.key !== "Escape") {
+				const captured = keyEventToAccelerator(event);
+				if (!captured) return; // incomplete combination: keep listening
+				onChange(captured);
+			}
+			setRecording(false);
+		},
+		[recording, onChange]
+	);
+
+	const isCustomized = value !== defaultValue;
+	const triggerClass = cn(
+		"flex h-9 items-center gap-1 rounded-md border px-3 text-sm transition-all focus:outline-none",
+		recording
+			? "border-primary bg-primary/5 ring-2 ring-primary/20"
+			: "border-input bg-muted/50 hover:bg-muted"
+	);
+
+	return (
+		<div className="flex items-center justify-between gap-4 rounded-lg border bg-background p-3">
+			<div className="flex items-center gap-3 min-w-0">
+				<div className="flex size-9 shrink-0 items-center justify-center rounded-md bg-primary/10 text-primary">
+					<Icon className="size-4" />
+				</div>
+				<div className="min-w-0">
+					<p className="text-sm font-medium leading-none">{label}</p>
+					<p className="mt-1 text-xs text-muted-foreground truncate">{description}</p>
+				</div>
+			</div>
+
+			<div className="flex items-center gap-2 shrink-0">
+				{isCustomized ? (
+					<Button
+						variant="ghost"
+						size="icon"
+						className="size-7"
+						onClick={onReset}
+						title="Reset to default"
+					>
+						<RotateCcw />
+					</Button>
+				) : null}
+				<button
+					ref={triggerRef}
+					type="button"
+					onClick={() => setRecording(true)}
+					onKeyDown={handleKeyDown}
+					onBlur={() => setRecording(false)}
+					className={triggerClass}
+				>
+					{recording ? (
+						<span className="text-xs text-primary animate-pulse">Press keys...</span>
+					) : (
+						<Kbd keys={acceleratorToDisplay(value)} />
+					)}
+				</button>
+			</div>
+		</div>
+	);
+}
diff --git a/surfsense_web/components/layout/providers/LayoutDataProvider.tsx b/surfsense_web/components/layout/providers/LayoutDataProvider.tsx
index 6138b67fb..380ffa656 100644
--- a/surfsense_web/components/layout/providers/LayoutDataProvider.tsx
+++ b/surfsense_web/components/layout/providers/LayoutDataProvider.tsx
@@ -55,7 +55,7 @@ import { useInbox } from "@/hooks/use-inbox";
 import { useIsMobile } from "@/hooks/use-mobile";
 import { notificationsApiService } from "@/lib/apis/notifications-api.service";
 import { searchSpacesApiService } from "@/lib/apis/search-spaces-api.service";
-import { logout } from "@/lib/auth-utils";
+import { getLoginPath, logout } from "@/lib/auth-utils";
 import { deleteThread, fetchThreads, updateThread } from "@/lib/chat/thread-persistence";
 import { resetUser, trackLogout } from "@/lib/posthog/events";
 import { cacheKeys } from "@/lib/query-client/cache-keys";
@@ -600,12 +600,12 @@ export function LayoutDataProvider({ searchSpaceId, children }: LayoutDataProvid
 			await logout();
 
 			if (typeof window !== "undefined") {
-				router.push("/");
+				router.push(getLoginPath());
 			}
 		} catch (error) {
 			console.error("Error during logout:", error);
 			await logout();
-			router.push("/");
+			router.push(getLoginPath());
 		}
 	}, [router]);
 
diff --git a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
index aa409e179..f19b20971 100644
--- a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
@@ -41,6 +41,7 @@ import { getConnectorIcon } from "@/contracts/enums/connectorIcons";
 import type { DocumentTypeEnum } from "@/contracts/types/document.types";
 import { useDebouncedValue } from "@/hooks/use-debounced-value";
 import { useMediaQuery } from "@/hooks/use-media-query";
+import { useElectronAPI } from "@/hooks/use-platform";
 import { documentsApiService } from "@/lib/apis/documents-api.service";
 import { foldersApiService } from "@/lib/apis/folders-api.service";
 import { authenticatedFetch } from "@/lib/auth-utils";
@@ -84,6 +85,7 @@ export function DocumentsSidebar({
 	const tSidebar = useTranslations("sidebar");
 	const params = useParams();
 	const isMobile = !useMediaQuery("(min-width: 640px)");
+	const electronAPI = useElectronAPI();
 	const searchSpaceId = Number(params.search_space_id);
 	const setConnectorDialogOpen = useSetAtom(connectorDialogOpenAtom);
 	const setRightPanelCollapsed = useSetAtom(rightPanelCollapsedAtom);
@@ -97,11 +99,11 @@ export function DocumentsSidebar({
 	const [watchedFolderIds, setWatchedFolderIds] = useState<Set<number>>(new Set());
 
 	useEffect(() => {
-		const api = typeof window !== "undefined" ? window.electronAPI : null;
-		if (!api?.getWatchedFolders) return;
+		if (!electronAPI?.getWatchedFolders) return;
+		const api = electronAPI;
 
 		async function loadWatchedIds() {
-			const folders = await api!.getWatchedFolders();
+			const folders = await api.getWatchedFolders();
 
 			if (folders.length === 0) {
 				try {
@@ -109,7 +111,7 @@ export function DocumentsSidebar({
 					for (const bf of backendFolders) {
 						const meta = bf.metadata as Record<string, unknown> | null;
 						if (!meta?.watched || !meta.folder_path) continue;
-						await api!.addWatchedFolder({
+						await api.addWatchedFolder({
 							path: meta.folder_path as string,
 							name: bf.name,
 							rootFolderId: bf.id,
@@ -119,7 +121,7 @@ export function DocumentsSidebar({
 							active: true,
 						});
 					}
-					const recovered = await api!.getWatchedFolders();
+					const recovered = await api.getWatchedFolders();
 					const ids = new Set(
 						recovered.filter((f) => f.rootFolderId != null).map((f) => f.rootFolderId as number)
 					);
@@ -137,7 +139,7 @@ export function DocumentsSidebar({
 		}
 
 		loadWatchedIds();
-	}, [searchSpaceId]);
+	}, [searchSpaceId, electronAPI]);
 	const { mutateAsync: deleteDocumentMutation } = useAtomValue(deleteDocumentMutationAtom);
 
 	const [sidebarDocs, setSidebarDocs] = useAtom(sidebarSelectedDocumentsAtom);
@@ -276,10 +278,9 @@ export function DocumentsSidebar({
 
 	const handleRescanFolder = useCallback(
 		async (folder: FolderDisplay) => {
-			const api = window.electronAPI;
-			if (!api) return;
+			if (!electronAPI) return;
 
-			const watchedFolders = await api.getWatchedFolders();
+			const watchedFolders = await electronAPI.getWatchedFolders();
 			const matched = watchedFolders.find((wf) => wf.rootFolderId === folder.id);
 			if (!matched) {
 				toast.error("This folder is not being watched");
@@ -298,28 +299,27 @@ export function DocumentsSidebar({
 				toast.error((err as Error)?.message || "Failed to re-scan folder");
 			}
 		},
-		[searchSpaceId]
+		[searchSpaceId, electronAPI]
 	);
 
 	const handleStopWatching = useCallback(async (folder: FolderDisplay) => {
-		const api = window.electronAPI;
-		if (!api) return;
+		if (!electronAPI) return;
 
-		const watchedFolders = await api.getWatchedFolders();
+		const watchedFolders = await electronAPI.getWatchedFolders();
 		const matched = watchedFolders.find((wf) => wf.rootFolderId === folder.id);
 		if (!matched) {
 			toast.error("This folder is not being watched");
 			return;
 		}
 
-		await api.removeWatchedFolder(matched.path);
+		await electronAPI.removeWatchedFolder(matched.path);
 		try {
 			await foldersApiService.stopWatching(folder.id);
 		} catch (err) {
 			console.error("[DocumentsSidebar] Failed to clear watched metadata:", err);
 		}
 		toast.success(`Stopped watching: ${matched.name}`);
-	}, []);
+	}, [electronAPI]);
 
 	const handleRenameFolder = useCallback(async (folder: FolderDisplay, newName: string) => {
 		try {
@@ -333,12 +333,11 @@ export function DocumentsSidebar({
 	const handleDeleteFolder = useCallback(async (folder: FolderDisplay) => {
 		if (!confirm(`Delete folder "${folder.name}" and all its contents?`)) return;
 		try {
-			const api = window.electronAPI;
-			if (api) {
-				const watchedFolders = await api.getWatchedFolders();
+			if (electronAPI) {
+				const watchedFolders = await electronAPI.getWatchedFolders();
 				const matched = watchedFolders.find((wf) => wf.rootFolderId === folder.id);
 				if (matched) {
-					await api.removeWatchedFolder(matched.path);
+					await electronAPI.removeWatchedFolder(matched.path);
 				}
 			}
 			await foldersApiService.deleteFolder(folder.id);
@@ -346,7 +345,7 @@ export function DocumentsSidebar({
 		} catch (e: unknown) {
 			toast.error((e as Error)?.message || "Failed to delete folder");
 		}
-	}, []);
+	}, [electronAPI]);
 
 	const handleMoveFolder = useCallback(
 		(folder: FolderDisplay) => {
diff --git a/surfsense_web/components/platform-gate.tsx b/surfsense_web/components/platform-gate.tsx
new file mode 100644
index 000000000..6908c6d32
--- /dev/null
+++ b/surfsense_web/components/platform-gate.tsx
@@ -0,0 +1,16 @@
+"use client";
+
+import type { ReactNode } from "react";
+import { usePlatform } from "@/hooks/use-platform";
+
+/** Renders `children` only when `usePlatform()` reports `isDesktop`; otherwise nothing. */
+export function DesktopOnly({ children }: { children: ReactNode }) {
+	const platform = usePlatform();
+	return platform.isDesktop ? <>{children}</> : null;
+}
+
+/** Renders `children` only when `usePlatform()` reports `isWeb`; otherwise nothing. */
+export function WebOnly({ children }: { children: ReactNode }) {
+	const platform = usePlatform();
+	return platform.isWeb ? <>{children}</> : null;
+}
diff --git a/surfsense_web/components/settings/user-settings-dialog.tsx b/surfsense_web/components/settings/user-settings-dialog.tsx
index b74ff973b..919b08174 100644
--- a/surfsense_web/components/settings/user-settings-dialog.tsx
+++ b/surfsense_web/components/settings/user-settings-dialog.tsx
@@ -3,6 +3,7 @@
 import { useAtom } from "jotai";
 import { Globe, KeyRound, Monitor, Receipt, Sparkles, User } from "lucide-react";
 import { useTranslations } from "next-intl";
+import { useMemo } from "react";
 import { ApiKeyContent } from "@/app/dashboard/[search_space_id]/user-settings/components/ApiKeyContent";
 import { CommunityPromptsContent } from "@/app/dashboard/[search_space_id]/user-settings/components/CommunityPromptsContent";
 import { ProfileContent } from "@/app/dashboard/[search_space_id]/user-settings/components/ProfileContent";
@@ -11,37 +12,42 @@ import { PurchaseHistoryContent } from "@/app/dashboard/[search_space_id]/user-s
 import { DesktopContent } from "@/app/dashboard/[search_space_id]/user-settings/components/DesktopContent";
 import { userSettingsDialogAtom } from "@/atoms/settings/settings-dialog.atoms";
 import { SettingsDialog } from "@/components/settings/settings-dialog";
+import { usePlatform } from "@/hooks/use-platform";
 
 export function UserSettingsDialog() {
 	const t = useTranslations("userSettings");
 	const [state, setState] = useAtom(userSettingsDialogAtom);
+	const { isDesktop } = usePlatform();
 
-	const navItems = [
-		{ value: "profile", label: t("profile_nav_label"), icon: <User className="h-4 w-4" /> },
-		{
-			value: "api-key",
-			label: t("api_key_nav_label"),
-			icon: <KeyRound className="h-4 w-4" />,
-		},
-		{
-			value: "prompts",
-			label: "My Prompts",
-			icon: <Sparkles className="h-4 w-4" />,
-		},
-		{
-			value: "community-prompts",
-			label: "Community Prompts",
-			icon: <Globe className="h-4 w-4" />,
-		},
-		{
-			value: "purchases",
-			label: "Purchase History",
-			icon: <Receipt className="h-4 w-4" />,
-		},
-		...(typeof window !== "undefined" && window.electronAPI
-			? [{ value: "desktop", label: "Desktop", icon: <Monitor className="h-4 w-4" /> }]
-			: []),
-	];
+	const navItems = useMemo(
+		() => [
+			{ value: "profile", label: t("profile_nav_label"), icon: <User className="h-4 w-4" /> },
+			{
+				value: "api-key",
+				label: t("api_key_nav_label"),
+				icon: <KeyRound className="h-4 w-4" />,
+			},
+			{
+				value: "prompts",
+				label: "My Prompts",
+				icon: <Sparkles className="h-4 w-4" />,
+			},
+			{
+				value: "community-prompts",
+				label: "Community Prompts",
+				icon: <Globe className="h-4 w-4" />,
+			},
+			{
+				value: "purchases",
+				label: "Purchase History",
+				icon: <Receipt className="h-4 w-4" />,
+			},
+			...(isDesktop
+				? [{ value: "desktop", label: "Desktop", icon: <Monitor className="h-4 w-4" /> }]
+				: []),
+		],
+		[t, isDesktop]
+	);
 
 	return (
 		<SettingsDialog
diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index 6b59f8ef6..cf4019d93 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -26,6 +26,7 @@ import { Progress } from "@/components/ui/progress";
 import { Spinner } from "@/components/ui/spinner";
 import { Switch } from "@/components/ui/switch";
 import { documentsApiService } from "@/lib/apis/documents-api.service";
+import { useElectronAPI } from "@/hooks/use-platform";
 import {
 	trackDocumentUploadFailure,
 	trackDocumentUploadStarted,
@@ -151,10 +152,11 @@ export function DocumentUploadTab({
 		};
 	}, []);
 
+	const electronAPI = useElectronAPI();
 	const [selectedFolder, setSelectedFolder] = useState<SelectedFolder | null>(null);
 	const [watchFolder, setWatchFolder] = useState(true);
 	const [folderSubmitting, setFolderSubmitting] = useState(false);
-	const isElectron = typeof window !== "undefined" && !!window.electronAPI?.browseFiles;
+	const isElectron = !!electronAPI?.browseFiles;
 
 	const acceptedFileTypes = useMemo(() => {
 		const etlService = process.env.NEXT_PUBLIC_ETL_SERVICE;
@@ -216,33 +218,31 @@ export function DocumentUploadTab({
 	}, []);
 
 	const handleBrowseFiles = useCallback(async () => {
-		const api = window.electronAPI;
-		if (!api?.browseFiles) return;
+		if (!electronAPI?.browseFiles) return;
 
-		const paths = await api.browseFiles();
+		const paths = await electronAPI.browseFiles();
 		if (!paths || paths.length === 0) return;
 
 		setSelectedFolder(null);
-		const fileDataList = await api.readLocalFiles(paths);
+		const fileDataList = await electronAPI.readLocalFiles(paths);
 		const newFiles: FileWithId[] = fileDataList.map((fd) => ({
 			id: crypto.randomUUID?.() ?? `file-${Date.now()}-${Math.random().toString(36)}`,
 			file: new File([fd.data], fd.name, { type: fd.mimeType }),
 		}));
 		setFiles((prev) => [...prev, ...newFiles]);
-	}, []);
+	}, [electronAPI]);
 
 	const handleBrowseFolder = useCallback(async () => {
-		const api = window.electronAPI;
-		if (!api?.selectFolder) return;
+		if (!electronAPI?.selectFolder) return;
 
-		const folderPath = await api.selectFolder();
+		const folderPath = await electronAPI.selectFolder();
 		if (!folderPath) return;
 
 		const folderName = folderPath.split("/").pop() || folderPath.split("\\").pop() || folderPath;
 		setFiles([]);
 		setSelectedFolder({ path: folderPath, name: folderName });
 		setWatchFolder(true);
-	}, []);
+	}, [electronAPI]);
 
 	const handleFolderChange = useCallback(
 		(e: ChangeEvent<HTMLInputElement>) => {
@@ -287,9 +287,7 @@ export function DocumentUploadTab({
 	);
 
 	const handleFolderSubmit = useCallback(async () => {
-		if (!selectedFolder) return;
-		const api = window.electronAPI;
-		if (!api) return;
+		if (!selectedFolder || !electronAPI) return;
 
 		setFolderSubmitting(true);
 		try {
@@ -304,7 +302,7 @@ export function DocumentUploadTab({
 			const rootFolderId = (result as { root_folder_id?: number })?.root_folder_id ?? null;
 
 			if (watchFolder) {
-				await api.addWatchedFolder({
+				await electronAPI.addWatchedFolder({
 					path: selectedFolder.path,
 					name: selectedFolder.name,
 					excludePatterns: [
@@ -332,7 +330,7 @@ export function DocumentUploadTab({
 		} finally {
 			setFolderSubmitting(false);
 		}
-	}, [selectedFolder, watchFolder, searchSpaceId, shouldSummarize, onSuccess]);
+	}, [selectedFolder, watchFolder, searchSpaceId, shouldSummarize, onSuccess, electronAPI]);
 
 	const handleUpload = async () => {
 		setUploadProgress(0);
diff --git a/surfsense_web/contexts/platform-context.tsx b/surfsense_web/contexts/platform-context.tsx
new file mode 100644
index 000000000..bb3e3800d
--- /dev/null
+++ b/surfsense_web/contexts/platform-context.tsx
@@ -0,0 +1,31 @@
+"use client";
+
+import { createContext, useEffect, useState, type ReactNode } from "react";
+
+export interface PlatformContextValue {
+	isDesktop: boolean; // set by the provider when `window.electronAPI` is present
+	isWeb: boolean; // set by the provider when `window.electronAPI` is absent
+	electronAPI: ElectronAPI | null; // the `window.electronAPI` object, or null
+}
+
+const SSR_VALUE: PlatformContextValue = {
+	isDesktop: false,
+	isWeb: false, // both flags stay false until PlatformProvider's mount effect runs
+	electronAPI: null,
+};
+
+export const PlatformContext = createContext<PlatformContextValue>(SSR_VALUE);
+
+/** Reads `window.electronAPI` after mount and publishes the result via PlatformContext. */
+export function PlatformProvider({ children }: { children: ReactNode }) {
+	const [platform, setPlatform] = useState<PlatformContextValue>(SSR_VALUE);
+
+	useEffect(() => {
+		// `window` is only read inside this effect; until it runs, SSR_VALUE is served.
+		const electronAPI = window.electronAPI ?? null;
+		const isDesktop = Boolean(electronAPI);
+		setPlatform({ isDesktop, isWeb: !isDesktop, electronAPI });
+	}, []);
+
+	return <PlatformContext.Provider value={platform}>{children}</PlatformContext.Provider>;
+}
diff --git a/surfsense_web/hooks/use-folder-sync.ts b/surfsense_web/hooks/use-folder-sync.ts
index ef3326556..847d0081b 100644
--- a/surfsense_web/hooks/use-folder-sync.ts
+++ b/surfsense_web/hooks/use-folder-sync.ts
@@ -1,6 +1,7 @@
 "use client";
 
 import { useEffect, useRef } from "react";
+import { useElectronAPI } from "@/hooks/use-platform";
 import { documentsApiService } from "@/lib/apis/documents-api.service";
 
 interface FileChangedEvent {
@@ -29,6 +30,7 @@ interface BatchItem {
 }
 
 export function useFolderSync() {
+	const electronAPI = useElectronAPI();
 	const queueRef = useRef<BatchItem[]>([]);
 	const processingRef = useRef(false);
 	const debounceTimers = useRef<Map<string, ReturnType<typeof setTimeout>>>(new Map());
@@ -49,9 +51,8 @@ export function useFolderSync() {
 					target_file_paths: batch.filePaths,
 					root_folder_id: batch.rootFolderId,
 				});
-				const api = typeof window !== "undefined" ? window.electronAPI : null;
-				if (api?.acknowledgeFileEvents && batch.ackIds.length > 0) {
-					await api.acknowledgeFileEvents(batch.ackIds);
+				if (electronAPI?.acknowledgeFileEvents && batch.ackIds.length > 0) {
+					await electronAPI.acknowledgeFileEvents(batch.ackIds);
 				}
 			} catch (err) {
 				console.error("[FolderSync] Failed to trigger batch re-index:", err);
@@ -117,25 +118,22 @@ export function useFolderSync() {
 
 	useEffect(() => {
 		isMountedRef.current = true;
-		const api = typeof window !== "undefined" ? window.electronAPI : null;
-		if (!api?.onFileChanged) {
+		if (!electronAPI?.onFileChanged) {
 			return () => {
 				isMountedRef.current = false;
 			};
 		}
 
-		// Signal to main process that the renderer is ready to receive events
-		api.signalRendererReady?.();
+		electronAPI.signalRendererReady?.();
 
-		// Drain durable outbox first so events survive renderer startup gaps and restarts
-		void api.getPendingFileEvents?.().then((pendingEvents) => {
+		void electronAPI.getPendingFileEvents?.().then((pendingEvents) => {
 			if (!isMountedRef.current || !pendingEvents?.length) return;
 			for (const event of pendingEvents) {
 				enqueueWithDebounce(event);
 			}
 		});
 
-		const cleanup = api.onFileChanged((event: FileChangedEvent) => {
+		const cleanup = electronAPI.onFileChanged((event: FileChangedEvent) => {
 			enqueueWithDebounce(event);
 		});
 
@@ -149,5 +147,5 @@ export function useFolderSync() {
 			pendingByFolder.current.clear();
 			firstEventTime.current.clear();
 		};
-	}, []);
+	}, [electronAPI]);
 }
diff --git a/surfsense_web/hooks/use-platform.ts b/surfsense_web/hooks/use-platform.ts
new file mode 100644
index 000000000..dc1f7e914
--- /dev/null
+++ b/surfsense_web/hooks/use-platform.ts
@@ -0,0 +1,12 @@
+import { useContext } from "react";
+import { PlatformContext, type PlatformContextValue } from "@/contexts/platform-context";
+
+export function usePlatform(): Pick<PlatformContextValue, "isDesktop" | "isWeb"> {
+	const ctx = useContext(PlatformContext); // only the two flags are exposed, not the bridge
+	return { isDesktop: ctx.isDesktop, isWeb: ctx.isWeb };
+}
+
+export function useElectronAPI(): ElectronAPI | null {
+	// Hands back the `electronAPI` field of the current PlatformContext value (may be null).
+	return useContext(PlatformContext).electronAPI;
+}
diff --git a/surfsense_web/lib/auth-utils.ts b/surfsense_web/lib/auth-utils.ts
index f7d1c5b09..d66934c3b 100644
--- a/surfsense_web/lib/auth-utils.ts
+++ b/surfsense_web/lib/auth-utils.ts
@@ -15,6 +15,7 @@ const PUBLIC_ROUTE_PREFIXES = [
 	"/login",
 	"/register",
 	"/auth",
+	"/desktop/login",
 	"/docs",
 	"/public",
 	"/invite",
@@ -34,6 +35,11 @@ export function isPublicRoute(pathname: string): boolean {
 	return PUBLIC_ROUTE_PREFIXES.some((prefix) => pathname.startsWith(prefix));
 }
 
+export function getLoginPath(): string {
+	const inDesktopShell = typeof window !== "undefined" && Boolean(window.electronAPI);
+	return inDesktopShell ? "/desktop/login" : "/login"; // desktop uses its own login route
+}
+
 /**
  * Clears tokens and optionally redirects to login.
  * Call this when a 401 response is received.
@@ -55,7 +61,7 @@ export function handleUnauthorized(): void {
 		if (!excludedPaths.includes(pathname)) {
 			localStorage.setItem(REDIRECT_PATH_KEY, currentPath);
 		}
-		window.location.href = "/login";
+		window.location.href = getLoginPath();
 	}
 }
 
@@ -221,13 +227,12 @@ export function redirectToLogin(): void {
 	const currentPath = window.location.pathname + window.location.search + window.location.hash;
 
 	// Don't save auth-related paths or home page
-	const excludedPaths = ["/auth", "/auth/callback", "/", "/login", "/register"];
+	const excludedPaths = ["/auth", "/auth/callback", "/", "/login", "/register", "/desktop/login"];
 	if (!excludedPaths.includes(window.location.pathname)) {
 		localStorage.setItem(REDIRECT_PATH_KEY, currentPath);
 	}
 
-	// Redirect to login page
-	window.location.href = "/login";
+	window.location.href = getLoginPath();
 }
 
 /**
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 5e45635a2..615b861ea 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -81,6 +81,9 @@ interface ElectronAPI {
 	// Auth token sync across windows
 	getAuthTokens: () => Promise<{ bearer: string; refresh: string } | null>;
 	setAuthTokens: (bearer: string, refresh: string) => Promise<void>;
+	// Keyboard shortcut configuration
+	getShortcuts: () => Promise<{ quickAsk: string; autocomplete: string }>;
+	setShortcuts: (config: Partial<{ quickAsk: string; autocomplete: string }>) => Promise<{ quickAsk: string; autocomplete: string }>;
 }
 
 declare global {

From bb1dcd32b6b89ca8bcfed3c606ff227759614904 Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 02:49:24 -0700
Subject: [PATCH 161/202] feat: enhance vision autocomplete service and UI
 feedback

- Optimized the vision autocomplete service by starting the SSE stream immediately and deriving KB search queries directly from window titles.
- Refactored the service to run KB filesystem pre-computation and agent graph compilation in parallel, improving performance.
- Updated the SuggestionPage component to handle new agent step data, displaying progress indicators for each step.
- Enhanced the CSS for the suggestion tooltip and agent activity indicators, improving the user interface and experience.
---
 .../app/agents/autocomplete/__init__.py       |  11 +
 .../agents/autocomplete/autocomplete_agent.py | 429 ++++++++++++++++++
 .../services/vision_autocomplete_service.py   | 258 ++++-------
 surfsense_web/app/desktop/suggestion/page.tsx |  68 ++-
 .../app/desktop/suggestion/suggestion.css     | 114 ++++-
 .../components/assistant-ui/thread.tsx        |  34 +-
 6 files changed, 686 insertions(+), 228 deletions(-)
 create mode 100644 surfsense_backend/app/agents/autocomplete/__init__.py
 create mode 100644 surfsense_backend/app/agents/autocomplete/autocomplete_agent.py

diff --git a/surfsense_backend/app/agents/autocomplete/__init__.py b/surfsense_backend/app/agents/autocomplete/__init__.py
new file mode 100644
index 000000000..55d7a692d
--- /dev/null
+++ b/surfsense_backend/app/agents/autocomplete/__init__.py
@@ -0,0 +1,11 @@
+"""Agent-based vision autocomplete with scoped filesystem exploration."""
+
+from app.agents.autocomplete.autocomplete_agent import (
+    create_autocomplete_agent,
+    stream_autocomplete_agent,
+)
+
+__all__ = [
+    "create_autocomplete_agent",
+    "stream_autocomplete_agent",
+]
diff --git a/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py b/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
new file mode 100644
index 000000000..928a133cc
--- /dev/null
+++ b/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
@@ -0,0 +1,429 @@
+"""Vision autocomplete agent with scoped filesystem exploration.
+
+Converts the stateless single-shot vision autocomplete into an agent that
+seeds a virtual filesystem from KB search results and lets the vision LLM
+explore documents via ``ls``, ``read_file``, ``glob``, ``grep``, etc.
+before generating the final completion.
+
+Performance: KB search and agent graph compilation run in parallel so
+the only sequential latency is KB-search (or agent compile, whichever is
+slower) + the agent's LLM turns.  There is no separate "query extraction"
+LLM call — the window title is used directly as the KB search query.
+"""
+
+from __future__ import annotations
+
+import asyncio
+import logging
+import uuid
+from typing import Any, AsyncGenerator
+
+from deepagents.graph import BASE_AGENT_PROMPT
+from deepagents.middleware.patch_tool_calls import PatchToolCallsMiddleware
+from langchain.agents import create_agent
+from langchain_anthropic.middleware import AnthropicPromptCachingMiddleware
+from langchain_core.language_models import BaseChatModel
+from langchain_core.messages import AIMessage, ToolMessage
+
+from app.agents.new_chat.middleware.filesystem import SurfSenseFilesystemMiddleware
+from app.agents.new_chat.middleware.knowledge_search import (
+    build_scoped_filesystem,
+    search_knowledge_base,
+)
+from app.services.new_streaming_service import VercelStreamingService
+
+logger = logging.getLogger(__name__)
+
+KB_TOP_K = 10
+
+# ---------------------------------------------------------------------------
+# System prompt
+# ---------------------------------------------------------------------------
+
+AUTOCOMPLETE_SYSTEM_PROMPT = """You are a smart writing assistant that analyzes the user's screen to draft or complete text.
+
+You will receive a screenshot of the user's screen. Your PRIMARY source of truth is the screenshot itself — the visual context determines what to write.
+
+Your job:
+1. Analyze the ENTIRE screenshot to understand what the user is working on (email thread, chat conversation, document, code editor, form, etc.).
+2. Identify the text area where the user will type.
+3. Generate the text the user most likely wants to write based on the visual context.
+
+You also have access to the user's knowledge base documents via filesystem tools. However:
+- ONLY consult the knowledge base if the screenshot clearly involves a topic where your KB documents are DIRECTLY relevant (e.g., the user is writing about a specific project/topic that matches a document title).
+- Do NOT explore documents just because they exist. Most autocomplete requests can be answered purely from the screenshot.
+- If you do read a document, only incorporate information that is 100% relevant to what the user is typing RIGHT NOW. Do not add extra details, background, or tangential information from the KB.
+- Keep your output SHORT — autocomplete should feel like a natural continuation, not an essay.
+
+Key behavior:
+- If the text area is EMPTY, draft a concise response or message based on what you see on screen (e.g., reply to an email, respond to a chat message, continue a document).
+- If the text area already has text, continue it naturally — typically just a sentence or two.
+
+Rules:
+- Output ONLY the text to be inserted. No quotes, no explanations, no meta-commentary.
+- Be CONCISE. Prefer a single paragraph or a few sentences. Autocomplete is a quick assist, not a full draft.
+- Match the tone and formality of the surrounding context.
+- If the screen shows code, write code. If it shows a casual chat, be casual. If it shows a formal email, be formal.
+- Do NOT describe the screenshot or explain your reasoning.
+- Do NOT cite or reference documents explicitly — just let the knowledge inform your writing naturally.
+- If you cannot determine what to write, output nothing.
+
+## Filesystem Tools `ls`, `read_file`, `write_file`, `edit_file`, `glob`, `grep`
+
+All file paths must start with a `/`.
+- ls: list files and directories at a given path.
+- read_file: read a file from the filesystem.
+- write_file: create a temporary file in the session (not persisted).
+- edit_file: edit a file in the session (not persisted for /documents/ files).
+- glob: find files matching a pattern (e.g., "**/*.xml").
+- grep: search for text within files.
+
+## When to Use Filesystem Tools
+
+BEFORE reaching for any tool, ask yourself: "Can I write a good completion purely from the screenshot?" If yes, just write it — do NOT explore the KB.
+
+Only use tools when:
+- The user is clearly writing about a specific topic that likely has detailed information in their KB.
+- You need a specific fact, name, number, or reference that the screenshot doesn't provide.
+
+When you do use tools, be surgical:
+- Check the `ls` output first. If no document title looks relevant, stop — do not read files just to see what's there.
+- If a title looks relevant, read only the `<chunk_index>` (first ~20 lines) and jump to matched chunks. Do not read entire documents.
+- Extract only the specific information you need and move on to generating the completion.
+
+## Reading Documents Efficiently
+
+Documents are formatted as XML. Each document contains:
+- `<document_metadata>` — title, type, URL, etc.
+- `<chunk_index>` — a table of every chunk with its **line range** and a
+  `matched="true"` flag for chunks that matched the search query.
+- `<document_content>` — the actual chunks in original document order.
+
+**Workflow**: read the first ~20 lines to see the `<chunk_index>`, identify
+chunks marked `matched="true"`, then use `read_file(path, offset=<start_line>,
+limit=<lines>)` to jump directly to those sections."""
+
+APP_CONTEXT_BLOCK = """
+
+The user is currently working in "{app_name}" (window: "{window_title}"). Use this to understand the type of application and adapt your tone and format accordingly."""
+
+
+def _build_autocomplete_system_prompt(app_name: str, window_title: str) -> str:
+    """Base prompt, plus the app/window context block when ``app_name`` is set."""
+    # A window title on its own (empty ``app_name``) adds no context block.
+    context = APP_CONTEXT_BLOCK.format(app_name=app_name, window_title=window_title)
+    return AUTOCOMPLETE_SYSTEM_PROMPT + (context if app_name else "")
+
+
+# ---------------------------------------------------------------------------
+# Pre-compute KB filesystem (runs in parallel with agent compilation)
+# ---------------------------------------------------------------------------
+
+
+class _KBResult:
+    """Pre-computed KB state: scoped files plus a synthetic ``ls`` call/result pair."""
+
+    __slots__ = ("files", "ls_ai_msg", "ls_tool_msg")
+
+    def __init__(
+        self,
+        files: dict[str, Any] | None = None,
+        ls_ai_msg: AIMessage | None = None,
+        ls_tool_msg: ToolMessage | None = None,
+    ) -> None:
+        self.files, self.ls_ai_msg, self.ls_tool_msg = files, ls_ai_msg, ls_tool_msg
+
+    @property
+    def has_documents(self) -> bool:
+        """True when ``files`` is truthy, i.e. a non-empty mapping."""
+        return bool(self.files)
+
+
+async def precompute_kb_filesystem(
+    search_space_id: int,
+    query: str,
+    top_k: int = KB_TOP_K,
+) -> _KBResult:
+    """Run the KB search and build the scoped filesystem ahead of the agent.
+
+    Meant to be awaited via ``asyncio.gather`` next to agent graph compilation.
+    Returns an empty ``_KBResult`` for an empty query, no hits, no files, or any
+    ``Exception`` (logged as a warning); otherwise the files plus a synthetic
+    ``ls /documents`` tool call/result listing non-``None`` ``/documents/`` paths.
+    """
+    if not query:
+        return _KBResult()
+
+    try:
+        hits = await search_knowledge_base(
+            query=query,
+            search_space_id=search_space_id,
+            top_k=top_k,
+        )
+        if not hits:
+            return _KBResult()
+
+        scoped_files, _ = await build_scoped_filesystem(
+            documents=hits,
+            search_space_id=search_space_id,
+        )
+        if not scoped_files:
+            return _KBResult()
+
+        listing = [
+            path
+            for path, entry in scoped_files.items()
+            if path.startswith("/documents/") and entry is not None
+        ]
+        call_id = f"auto_ls_{uuid.uuid4().hex[:12]}"
+        ls_call = {"name": "ls", "args": {"path": "/documents"}, "id": call_id}
+        return _KBResult(
+            files=scoped_files,
+            ls_ai_msg=AIMessage(content="", tool_calls=[ls_call]),
+            ls_tool_msg=ToolMessage(
+                content=str(listing) if listing else "No documents found.",
+                tool_call_id=call_id,
+            ),
+        )
+    except Exception:
+        logger.warning("KB pre-computation failed, proceeding without KB", exc_info=True)
+        return _KBResult()
+
+
+# ---------------------------------------------------------------------------
+# Filesystem middleware — no save_document, no persistence
+# ---------------------------------------------------------------------------
+
+
+class AutocompleteFilesystemMiddleware(SurfSenseFilesystemMiddleware):
+    """Filesystem middleware for autocomplete — exploration with no KB persistence.
+
+    Drops the ``save_document`` tool (permanent KB persistence) and builds the
+    base with ``search_space_id=None`` so ``write_file``/``edit_file`` stay ephemeral.
+    """
+
+    def __init__(self) -> None:
+        super().__init__(search_space_id=None, created_by_id=None)
+        self.tools = [tool for tool in self.tools if tool.name != "save_document"]
+
+
+# ---------------------------------------------------------------------------
+# Agent factory
+# ---------------------------------------------------------------------------
+
+
+async def _compile_agent(
+    llm: BaseChatModel,
+    app_name: str,
+    window_title: str,
+) -> Any:
+    """Build the agent graph in a worker thread and set its recursion limit to 200."""
+    autocomplete_prompt = _build_autocomplete_system_prompt(app_name, window_title)
+    full_prompt = autocomplete_prompt + "\n\n" + BASE_AGENT_PROMPT
+
+    # ``tools`` stays empty; the middleware instances are the only extras passed in.
+    compiled = await asyncio.to_thread(
+        create_agent,
+        llm,
+        system_prompt=full_prompt,
+        tools=[],
+        middleware=[
+            AutocompleteFilesystemMiddleware(),
+            PatchToolCallsMiddleware(),
+            AnthropicPromptCachingMiddleware(unsupported_model_behavior="ignore"),
+        ],
+    )
+
+    return compiled.with_config({"recursion_limit": 200})
+
+
+async def create_autocomplete_agent(
+    llm: BaseChatModel,
+    *,
+    search_space_id: int,
+    kb_query: str,
+    app_name: str = "",
+    window_title: str = "",
+) -> tuple[Any, _KBResult]:
+    """Compile the agent while the KB filesystem is pre-computed concurrently.
+
+    Returns ``(agent, kb_result)`` so the caller can inject the pre-computed
+    filesystem into the agent's initial state.
+    """
+    # Create both coroutines first, then await them together.
+    compile_job = _compile_agent(llm, app_name, window_title)
+    kb_job = precompute_kb_filesystem(search_space_id, kb_query)
+    compiled_agent, kb_result = await asyncio.gather(compile_job, kb_job)
+    return compiled_agent, kb_result
+
+
+# ---------------------------------------------------------------------------
+# Streaming helper
+# ---------------------------------------------------------------------------
+
+
+async def stream_autocomplete_agent(
+    agent: Any,
+    input_data: dict[str, Any],
+    streaming_service: VercelStreamingService,
+    *,
+    emit_message_start: bool = True,
+) -> AsyncGenerator[str, None]:
+    """Stream agent events as Vercel SSE, with thinking steps for tool calls.
+
+    When ``emit_message_start`` is False the caller has already sent the
+    ``message_start`` event (e.g. to show preparation steps before the agent
+    runs).
+    """
+    thread_id = uuid.uuid4().hex
+    config = {"configurable": {"thread_id": thread_id}}
+
+    current_text_id: str | None = None
+    active_tool_depth = 0
+    thinking_step_counter = 0
+    tool_step_ids: dict[str, str] = {}
+    step_titles: dict[str, str] = {}
+    completed_step_ids: set[str] = set()
+    last_active_step_id: str | None = None
+
+    def next_thinking_step_id() -> str:
+        nonlocal thinking_step_counter
+        thinking_step_counter += 1
+        return f"autocomplete-step-{thinking_step_counter}"
+
+    def complete_current_step() -> str | None:
+        nonlocal last_active_step_id
+        if last_active_step_id and last_active_step_id not in completed_step_ids:
+            completed_step_ids.add(last_active_step_id)
+            title = step_titles.get(last_active_step_id, "Done")
+            event = streaming_service.format_thinking_step(
+                step_id=last_active_step_id,
+                title=title,
+                status="complete",
+            )
+            last_active_step_id = None
+            return event
+        return None
+
+    if emit_message_start:
+        yield streaming_service.format_message_start()
+
+    # Emit an initial "Generating completion" step so the UI immediately
+    # shows activity once the agent starts its first LLM call.
+    gen_step_id = next_thinking_step_id()
+    last_active_step_id = gen_step_id
+    step_titles[gen_step_id] = "Generating completion"
+    yield streaming_service.format_thinking_step(
+        step_id=gen_step_id,
+        title="Generating completion",
+        status="in_progress",
+    )
+
+    try:
+        async for event in agent.astream_events(input_data, config=config, version="v2"):
+            event_type = event.get("event", "")
+
+            if event_type == "on_chat_model_stream":
+                if active_tool_depth > 0:
+                    continue
+                if "surfsense:internal" in event.get("tags", []):
+                    continue
+                chunk = event.get("data", {}).get("chunk")
+                if chunk and hasattr(chunk, "content"):
+                    content = chunk.content
+                    if content and isinstance(content, str):
+                        if current_text_id is None:
+                            step_event = complete_current_step()
+                            if step_event:
+                                yield step_event
+                            current_text_id = streaming_service.generate_text_id()
+                            yield streaming_service.format_text_start(current_text_id)
+                        yield streaming_service.format_text_delta(current_text_id, content)
+
+            elif event_type == "on_tool_start":
+                active_tool_depth += 1
+                tool_name = event.get("name", "unknown_tool")
+                run_id = event.get("run_id", "")
+                tool_input = event.get("data", {}).get("input", {})
+
+                if current_text_id is not None:
+                    yield streaming_service.format_text_end(current_text_id)
+                    current_text_id = None
+
+                step_event = complete_current_step()
+                if step_event:
+                    yield step_event
+
+                tool_step_id = next_thinking_step_id()
+                tool_step_ids[run_id] = tool_step_id
+                last_active_step_id = tool_step_id
+
+                title, items = _describe_tool_call(tool_name, tool_input)
+                step_titles[tool_step_id] = title
+                yield streaming_service.format_thinking_step(
+                    step_id=tool_step_id,
+                    title=title,
+                    status="in_progress",
+                    items=items,
+                )
+
+            elif event_type == "on_tool_end":
+                active_tool_depth = max(0, active_tool_depth - 1)
+                run_id = event.get("run_id", "")
+                step_id = tool_step_ids.pop(run_id, None)
+                if step_id and step_id not in completed_step_ids:
+                    completed_step_ids.add(step_id)
+                    title = step_titles.get(step_id, "Done")
+                    yield streaming_service.format_thinking_step(
+                        step_id=step_id,
+                        title=title,
+                        status="complete",
+                    )
+                    if last_active_step_id == step_id:
+                        last_active_step_id = None
+
+        if current_text_id is not None:
+            yield streaming_service.format_text_end(current_text_id)
+        step_event = complete_current_step()
+        if step_event:
+            yield step_event
+
+        yield streaming_service.format_finish()
+        yield streaming_service.format_done()
+
+    except Exception as e:
+        logger.error(f"Autocomplete agent streaming error: {e}", exc_info=True)
+        if current_text_id is not None:
+            yield streaming_service.format_text_end(current_text_id)
+        yield streaming_service.format_error("Autocomplete failed. Please try again.")
+        yield streaming_service.format_done()
+
+
+def _describe_tool_call(tool_name: str, tool_input: Any) -> tuple[str, list[str]]:
+    """Return a human-readable (title, items) for a tool call thinking step."""  # unrecognised tool names fall through to the generic "Using <tool_name>" title with no items
+    inp = tool_input if isinstance(tool_input, dict) else {}  # a non-dict input is treated as "no arguments"
+    if tool_name == "ls":
+        path = inp.get("path", "/")  # falls back to "/" when no path argument is present
+        return "Listing files", [path]
+    if tool_name == "read_file":
+        fp = inp.get("file_path", "")
+        display = fp if len(fp) <= 80 else "…" + fp[-77:]  # paths over 80 chars: ellipsis + the last 77 chars, so the tail stays visible
+        return "Reading file", [display]
+    if tool_name == "write_file":
+        fp = inp.get("file_path", "")
+        display = fp if len(fp) <= 80 else "…" + fp[-77:]  # same tail-preserving truncation as read_file
+        return "Writing file", [display]
+    if tool_name == "edit_file":
+        fp = inp.get("file_path", "")
+        display = fp if len(fp) <= 80 else "…" + fp[-77:]  # same tail-preserving truncation as read_file
+        return "Editing file", [display]
+    if tool_name == "glob":
+        pat = inp.get("pattern", "")
+        base = inp.get("path", "/")  # search root falls back to "/"
+        return "Searching files", [f"{pat} in {base}"]
+    if tool_name == "grep":  # pattern is cut to its first 60 chars (ellipsis appended); " in <path>" is added only when a path is given
+        pat = inp.get("pattern", "")
+        path = inp.get("path", "")
+        display_pat = pat[:60] + ("…" if len(pat) > 60 else "")
+        return "Searching content", [f'"{display_pat}"' + (f" in {path}" if path else "")]
+    return f"Using {tool_name}", []
diff --git a/surfsense_backend/app/services/vision_autocomplete_service.py b/surfsense_backend/app/services/vision_autocomplete_service.py
index f24a5c848..7d16c5864 100644
--- a/surfsense_backend/app/services/vision_autocomplete_service.py
+++ b/surfsense_backend/app/services/vision_autocomplete_service.py
@@ -1,139 +1,40 @@
+"""Vision autocomplete service — agent-based with scoped filesystem.
+
+Optimized pipeline:
+1. Start the SSE stream immediately so the UI shows progress.
+2. Derive a KB search query from window_title (no separate LLM call).
+3. Run KB filesystem pre-computation and agent graph compilation in PARALLEL.
+4. Inject pre-computed KB files as initial state and stream the agent.
+"""
+
 import logging
 from typing import AsyncGenerator
 
-from langchain_core.messages import HumanMessage, SystemMessage
+from langchain_core.messages import HumanMessage
 from sqlalchemy.ext.asyncio import AsyncSession
 
-from app.retriever.chunks_hybrid_search import ChucksHybridSearchRetriever
+from app.agents.autocomplete import create_autocomplete_agent, stream_autocomplete_agent
 from app.services.llm_service import get_vision_llm
 from app.services.new_streaming_service import VercelStreamingService
 
 logger = logging.getLogger(__name__)
 
-KB_TOP_K = 5
-KB_MAX_CHARS = 4000
-
-EXTRACT_QUERY_PROMPT = """Look at this screenshot and describe in 1-2 short sentences what the user is working on and what topic they need to write about. Be specific about the subject matter. Output ONLY the description, nothing else."""
-
-EXTRACT_QUERY_PROMPT_WITH_APP = """The user is currently in the application "{app_name}" with the window titled "{window_title}".
-
-Look at this screenshot and describe in 1-2 short sentences what the user is working on and what topic they need to write about. Be specific about the subject matter. Output ONLY the description, nothing else."""
-
-VISION_SYSTEM_PROMPT = """You are a smart writing assistant that analyzes the user's screen to draft or complete text.
-
-You will receive a screenshot of the user's screen. Your job:
-1. Analyze the ENTIRE screenshot to understand what the user is working on (email thread, chat conversation, document, code editor, form, etc.).
-2. Identify the text area where the user will type.
-3. Based on the full visual context, generate the text the user most likely wants to write.
-
-Key behavior:
-- If the text area is EMPTY, draft a full response or message based on what you see on screen (e.g., reply to an email, respond to a chat message, continue a document).
-- If the text area already has text, continue it naturally.
-
-Rules:
-- Output ONLY the text to be inserted. No quotes, no explanations, no meta-commentary.
-- Be concise but complete — a full thought, not a fragment.
-- Match the tone and formality of the surrounding context.
-- If the screen shows code, write code. If it shows a casual chat, be casual. If it shows a formal email, be formal.
-- Do NOT describe the screenshot or explain your reasoning.
-- If you cannot determine what to write, output nothing."""
-
-APP_CONTEXT_BLOCK = """
-
-The user is currently working in "{app_name}" (window: "{window_title}"). Use this to understand the type of application and adapt your tone and format accordingly."""
-
-KB_CONTEXT_BLOCK = """
-
-You also have access to the user's knowledge base documents below. Use them to write more accurate, informed, and contextually relevant text. Do NOT cite or reference the documents explicitly — just let the knowledge inform your writing naturally.
-
-<knowledge_base>
-{kb_context}
-</knowledge_base>"""
+PREP_STEP_ID = "autocomplete-prep"
 
 
-def _build_system_prompt(app_name: str, window_title: str, kb_context: str) -> str:
-    """Assemble the system prompt from optional context blocks."""
-    prompt = VISION_SYSTEM_PROMPT
-    if app_name:
-        prompt += APP_CONTEXT_BLOCK.format(app_name=app_name, window_title=window_title)
-    if kb_context:
-        prompt += KB_CONTEXT_BLOCK.format(kb_context=kb_context)
-    return prompt
+def _derive_kb_query(app_name: str, window_title: str) -> str:
+    parts = [p for p in (window_title, app_name) if p]  # window title first, then app name; falsy (empty) values are dropped
+    return " ".join(parts)  # space-joined query text; "" when both inputs are empty
 
 
 def _is_vision_unsupported_error(e: Exception) -> bool:
-    """Check if an exception indicates the model doesn't support vision/images."""
     msg = str(e).lower()
     return "content must be a string" in msg or "does not support image" in msg
 
 
-async def _extract_query_from_screenshot(
-    llm, screenshot_data_url: str,
-    app_name: str = "", window_title: str = "",
-) -> str | None:
-    """Ask the Vision LLM to describe what the user is working on.
-
-    Raises vision-unsupported errors so the caller can return a
-    friendly message immediately instead of retrying with astream.
-    """
-    if app_name:
-        prompt_text = EXTRACT_QUERY_PROMPT_WITH_APP.format(
-            app_name=app_name, window_title=window_title,
-        )
-    else:
-        prompt_text = EXTRACT_QUERY_PROMPT
-
-    try:
-        response = await llm.ainvoke([
-            HumanMessage(content=[
-                {"type": "text", "text": prompt_text},
-                {"type": "image_url", "image_url": {"url": screenshot_data_url}},
-            ]),
-        ])
-        query = response.content.strip() if hasattr(response, "content") else ""
-        return query if query else None
-    except Exception as e:
-        if _is_vision_unsupported_error(e):
-            raise
-        logger.warning(f"Failed to extract query from screenshot: {e}")
-        return None
-
-
-async def _search_knowledge_base(
-    session: AsyncSession, search_space_id: int, query: str
-) -> str:
-    """Search the KB and return formatted context string."""
-    try:
-        retriever = ChucksHybridSearchRetriever(session)
-        results = await retriever.hybrid_search(
-            query_text=query,
-            top_k=KB_TOP_K,
-            search_space_id=search_space_id,
-        )
-
-        if not results:
-            return ""
-
-        parts: list[str] = []
-        char_count = 0
-        for doc in results:
-            title = doc.get("document", {}).get("title", "Untitled")
-            for chunk in doc.get("chunks", []):
-                content = chunk.get("content", "").strip()
-                if not content:
-                    continue
-                entry = f"[{title}]\n{content}"
-                if char_count + len(entry) > KB_MAX_CHARS:
-                    break
-                parts.append(entry)
-                char_count += len(entry)
-            if char_count >= KB_MAX_CHARS:
-                break
-
-        return "\n\n---\n\n".join(parts)
-    except Exception as e:
-        logger.warning(f"KB search failed, proceeding without context: {e}")
-        return ""
+# ---------------------------------------------------------------------------
+# Main entry point
+# ---------------------------------------------------------------------------
 
 
 async def stream_vision_autocomplete(
@@ -144,13 +45,7 @@ async def stream_vision_autocomplete(
     app_name: str = "",
     window_title: str = "",
 ) -> AsyncGenerator[str, None]:
-    """Analyze a screenshot with the vision LLM and stream a text completion.
-
-    Pipeline:
-    1. Extract a search query from the screenshot (non-streaming)
-    2. Search the knowledge base for relevant context
-    3. Stream the final completion with screenshot + KB + app context
-    """
+    """Analyze a screenshot with a vision-LLM agent and stream a text completion."""
     streaming = VercelStreamingService()
     vision_error_msg = (
         "The selected model does not support vision. "
@@ -164,62 +59,89 @@ async def stream_vision_autocomplete(
         yield streaming.format_done()
         return
 
-    kb_context = ""
+    # Start SSE stream immediately so the UI has something to show
+    yield streaming.format_message_start()
+
+    kb_query = _derive_kb_query(app_name, window_title)
+
+    # Show a preparation step while KB search + agent compile run
+    yield streaming.format_thinking_step(
+        step_id=PREP_STEP_ID,
+        title="Searching knowledge base",
+        status="in_progress",
+        items=[kb_query] if kb_query else [],
+    )
+
     try:
-        query = await _extract_query_from_screenshot(
-            llm, screenshot_data_url, app_name=app_name, window_title=window_title,
+        agent, kb = await create_autocomplete_agent(
+            llm,
+            search_space_id=search_space_id,
+            kb_query=kb_query,
+            app_name=app_name,
+            window_title=window_title,
         )
     except Exception as e:
-        logger.warning(f"Vision autocomplete: selected model does not support vision: {e}")
-        yield streaming.format_message_start()
-        yield streaming.format_error(vision_error_msg)
+        if _is_vision_unsupported_error(e):
+            logger.warning("Vision autocomplete: model does not support vision: %s", e)
+            yield streaming.format_error(vision_error_msg)
+            yield streaming.format_done()
+            return
+        logger.error("Failed to create autocomplete agent: %s", e, exc_info=True)
+        yield streaming.format_error("Autocomplete failed. Please try again.")
         yield streaming.format_done()
         return
 
-    if query:
-        kb_context = await _search_knowledge_base(session, search_space_id, query)
+    has_kb = kb.has_documents
+    doc_count = len(kb.files) if has_kb else 0  # type: ignore[arg-type]
 
-    system_prompt = _build_system_prompt(app_name, window_title, kb_context)
+    yield streaming.format_thinking_step(
+        step_id=PREP_STEP_ID,
+        title="Searching knowledge base",
+        status="complete",
+        items=[f"Found {doc_count} document{'s' if doc_count != 1 else ''}"] if kb_query else ["Skipped"],
+    )
 
-    messages = [
-        SystemMessage(content=system_prompt),
-        HumanMessage(content=[
-            {
-                "type": "text",
-                "text": "Analyze this screenshot. Understand the full context of what the user is working on, then generate the text they most likely want to write in the active text area.",
-            },
-            {
-                "type": "image_url",
-                "image_url": {"url": screenshot_data_url},
-            },
-        ]),
-    ]
+    # Build agent input with pre-computed KB as initial state
+    if has_kb:
+        instruction = (
+            "Analyze this screenshot, then explore the knowledge base documents "
+            "listed above — read the chunk index of any document whose title "
+            "looks relevant and check matched chunks for useful facts. "
+            "Finally, generate a concise autocomplete for the active text area, "
+            "enhanced with any relevant KB information you found."
+        )
+    else:
+        instruction = (
+            "Analyze this screenshot and generate a concise autocomplete "
+            "for the active text area based on what you see."
+        )
 
-    text_started = False
-    text_id = ""
+    user_message = HumanMessage(content=[
+        {"type": "text", "text": instruction},
+        {"type": "image_url", "image_url": {"url": screenshot_data_url}},
+    ])
+
+    input_data: dict = {"messages": [user_message]}
+
+    if has_kb:
+        input_data["files"] = kb.files
+        input_data["messages"] = [kb.ls_ai_msg, kb.ls_tool_msg, user_message]
+        logger.info("Autocomplete: injected %d KB files into agent initial state", doc_count)
+    else:
+        logger.info("Autocomplete: no KB documents found, proceeding with screenshot only")
+
+    # Stream the agent (message_start already sent above)
     try:
-        yield streaming.format_message_start()
-        text_id = streaming.generate_text_id()
-        yield streaming.format_text_start(text_id)
-        text_started = True
-
-        async for chunk in llm.astream(messages):
-            token = chunk.content if hasattr(chunk, "content") else str(chunk)
-            if token:
-                yield streaming.format_text_delta(text_id, token)
-
-        yield streaming.format_text_end(text_id)
-        yield streaming.format_finish()
-        yield streaming.format_done()
-
+        async for sse in stream_autocomplete_agent(
+            agent, input_data, streaming, emit_message_start=False,
+        ):
+            yield sse
     except Exception as e:
-        if text_started:
-            yield streaming.format_text_end(text_id)
-
         if _is_vision_unsupported_error(e):
-            logger.warning(f"Vision autocomplete: selected model does not support vision: {e}")
+            logger.warning("Vision autocomplete: model does not support vision: %s", e)
             yield streaming.format_error(vision_error_msg)
+            yield streaming.format_done()
         else:
-            logger.error(f"Vision autocomplete streaming error: {e}", exc_info=True)
+            logger.error("Vision autocomplete streaming error: %s", e, exc_info=True)
             yield streaming.format_error("Autocomplete failed. Please try again.")
-        yield streaming.format_done()
+            yield streaming.format_done()
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index fb83e2113..42ce025a8 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -10,7 +10,18 @@ type SSEEvent =
 	| { type: "text-end"; id: string }
 	| { type: "start"; messageId: string }
 	| { type: "finish" }
-	| { type: "error"; errorText: string };
+	| { type: "error"; errorText: string }
+	| {
+			type: "data-thinking-step";
+			data: { id: string; title: string; status: string; items: string[] };
+	  };
+
+interface AgentStep {
+	id: string;
+	title: string;
+	status: string;
+	items: string[];
+}
 
 function friendlyError(raw: string | number): string {
 	if (typeof raw === "number") {
@@ -34,11 +45,24 @@ function friendlyError(raw: string | number): string {
 
 const AUTO_DISMISS_MS = 3000;
 
+function StepIcon({ status }: { status: string }) { // Status glyph for one agent step: check mark when complete, spinner otherwise.
+	if (status === "complete") { // only the exact string "complete" selects the check mark
+		return (
+			<svg className="step-icon step-icon-done" viewBox="0 0 16 16" fill="none">
+				<circle cx="8" cy="8" r="7" stroke="#4ade80" strokeWidth="1.5" />
+				<path d="M5 8.5l2 2 4-4.5" stroke="#4ade80" strokeWidth="1.5" strokeLinecap="round" strokeLinejoin="round" />
+			</svg>
+		);
+	}
+	return <span className="step-spinner" />; // every other status value renders the spinner element
+}
+
 export default function SuggestionPage() {
 	const api = useElectronAPI();
 	const [suggestion, setSuggestion] = useState("");
 	const [isLoading, setIsLoading] = useState(true);
 	const [error, setError] = useState<string | null>(null);
+	const [steps, setSteps] = useState<AgentStep[]>([]);
 	const abortRef = useRef<AbortController | null>(null);
 
 	const isDesktop = !!api?.onAutocompleteContext;
@@ -66,6 +90,7 @@ export default function SuggestionPage() {
 			setIsLoading(true);
 			setSuggestion("");
 			setError(null);
+			setSteps([]);
 
 			let token = getBearerToken();
 			if (!token) {
@@ -137,6 +162,17 @@ export default function SuggestionPage() {
 									setSuggestion((prev) => prev + parsed.delta);
 								} else if (parsed.type === "error") {
 									setError(friendlyError(parsed.errorText));
+								} else if (parsed.type === "data-thinking-step") {
+									const { id, title, status, items } = parsed.data;
+									setSteps((prev) => {
+										const existing = prev.findIndex((s) => s.id === id);
+										if (existing >= 0) {
+											const updated = [...prev];
+											updated[existing] = { id, title, status, items };
+											return updated;
+										}
+										return [...prev, { id, title, status, items }];
+									});
 								}
 							} catch {
 								continue;
@@ -185,13 +221,33 @@ export default function SuggestionPage() {
 		);
 	}
 
-	if (isLoading && !suggestion) {
+	const showLoading = isLoading && !suggestion;
+
+	if (showLoading) {
 		return (
 			<div className="suggestion-tooltip">
-				<div className="suggestion-loading">
-					<span className="suggestion-dot" />
-					<span className="suggestion-dot" />
-					<span className="suggestion-dot" />
+				<div className="agent-activity">
+					{steps.length === 0 && (
+						<div className="activity-initial">
+							<span className="step-spinner" />
+							<span className="activity-label">Preparing…</span>
+						</div>
+					)}
+					{steps.length > 0 && (
+						<div className="activity-steps">
+							{steps.map((step) => (
+								<div key={step.id} className="activity-step">
+									<StepIcon status={step.status} />
+									<span className="step-label">
+										{step.title}
+										{step.items.length > 0 && (
+											<span className="step-detail"> · {step.items[0]}</span>
+										)}
+									</span>
+								</div>
+							))}
+						</div>
+					)}
 				</div>
 			</div>
 		);
diff --git a/surfsense_web/app/desktop/suggestion/suggestion.css b/surfsense_web/app/desktop/suggestion/suggestion.css
index 62f4d2ea7..d2213fefd 100644
--- a/surfsense_web/app/desktop/suggestion/suggestion.css
+++ b/surfsense_web/app/desktop/suggestion/suggestion.css
@@ -19,13 +19,21 @@ body:has(.suggestion-body) {
 }
 
 .suggestion-tooltip {
+  box-sizing: border-box;
   background: #1e1e1e;
   border: 1px solid #3c3c3c;
   border-radius: 8px;
   padding: 8px 12px;
   margin: 4px;
   max-width: 400px;
+  /* MAX_HEIGHT in suggestion-window.ts is 400px. Subtract 8px for margin
+     (4px * 2) so the tooltip + margin fits within the Electron window.
+     box-sizing: border-box ensures padding + border are included. */
+  max-height: 392px;
   box-shadow: 0 4px 16px rgba(0, 0, 0, 0.5);
+  display: flex;
+  flex-direction: column;
+  overflow: hidden;
 }
 
 .suggestion-text {
@@ -35,6 +43,26 @@ body:has(.suggestion-body) {
   margin: 0 0 6px 0;
   word-wrap: break-word;
   white-space: pre-wrap;
+  overflow-y: auto;
+  flex: 1 1 auto;
+  min-height: 0;
+}
+
+.suggestion-text::-webkit-scrollbar {
+  width: 5px;
+}
+
+.suggestion-text::-webkit-scrollbar-track {
+  background: transparent;
+}
+
+.suggestion-text::-webkit-scrollbar-thumb {
+  background: #555;
+  border-radius: 3px;
+}
+
+.suggestion-text::-webkit-scrollbar-thumb:hover {
+  background: #777;
 }
 
 .suggestion-actions {
@@ -43,6 +71,7 @@ body:has(.suggestion-body) {
   gap: 4px;
   border-top: 1px solid #2a2a2a;
   padding-top: 6px;
+  flex-shrink: 0;
 }
 
 .suggestion-btn {
@@ -86,36 +115,77 @@ body:has(.suggestion-body) {
   font-size: 12px;
 }
 
-.suggestion-loading {
+/* --- Agent activity indicator --- */
+
+.agent-activity {
   display: flex;
-  gap: 5px;
+  flex-direction: column;
+  gap: 4px;
+  overflow-y: auto;
+  max-height: 340px;
+}
+
+.activity-initial {
+  display: flex;
+  align-items: center;
+  gap: 8px;
   padding: 2px 0;
-  justify-content: center;
 }
 
-.suggestion-dot {
-  width: 4px;
-  height: 4px;
+.activity-label {
+  color: #a1a1aa;
+  font-size: 12px;
+  white-space: nowrap;
+  overflow: hidden;
+  text-overflow: ellipsis;
+}
+
+.activity-steps {
+  display: flex;
+  flex-direction: column;
+  gap: 3px;
+}
+
+.activity-step {
+  display: flex;
+  align-items: center;
+  gap: 6px;
+  min-height: 18px;
+}
+
+.step-label {
+  color: #d4d4d4;
+  font-size: 12px;
+  white-space: nowrap;
+  overflow: hidden;
+  text-overflow: ellipsis;
+}
+
+.step-detail {
+  color: #71717a;
+  font-size: 11px;
+}
+
+/* Spinner (in_progress) */
+.step-spinner {
+  width: 14px;
+  height: 14px;
+  flex-shrink: 0;
+  border: 1.5px solid #3f3f46;
+  border-top-color: #a78bfa;
   border-radius: 50%;
-  background: #666;
-  animation: suggestion-pulse 1.2s infinite ease-in-out;
+  animation: step-spin 0.7s linear infinite;
 }
 
-.suggestion-dot:nth-child(2) {
-  animation-delay: 0.15s;
+/* Checkmark icon (complete) */
+.step-icon {
+  width: 14px;
+  height: 14px;
+  flex-shrink: 0;
 }
 
-.suggestion-dot:nth-child(3) {
-  animation-delay: 0.3s;
-}
-
-@keyframes suggestion-pulse {
-  0%, 80%, 100% {
-    opacity: 0.3;
-    transform: scale(0.8);
-  }
-  40% {
-    opacity: 1;
-    transform: scale(1.1);
+@keyframes step-spin {
+  to {
+    transform: rotate(360deg);
   }
 }
diff --git a/surfsense_web/components/assistant-ui/thread.tsx b/surfsense_web/components/assistant-ui/thread.tsx
index 7d8765399..6c8c619b2 100644
--- a/surfsense_web/components/assistant-ui/thread.tsx
+++ b/surfsense_web/components/assistant-ui/thread.tsx
@@ -92,15 +92,7 @@ import { useMediaQuery } from "@/hooks/use-media-query";
 import { useElectronAPI } from "@/hooks/use-platform";
 import { cn } from "@/lib/utils";
 
-/** Placeholder texts that cycle in new chats when input is empty */
-const CYCLING_PLACEHOLDERS = [
-	"Ask SurfSense anything or @mention docs",
-	"Generate a podcast from my vacation ideas in Notion",
-	"Sum up last week's meeting notes from Drive in a bulleted list",
-	"Give me a brief overview of the most urgent tickets in Jira and Linear",
-	"Briefly, what are today's top ten important emails and calendar events?",
-	"Check if this week's Slack messages reference any GitHub issues",
-];
+const COMPOSER_PLACEHOLDER = "Ask anything · Type / for prompts · Type @ to mention docs";
 
 export const Thread: FC = () => {
 	return <ThreadContent />;
@@ -380,29 +372,7 @@ const Composer: FC = () => {
 	const isThreadEmpty = useAuiState(({ thread }) => thread.isEmpty);
 	const isThreadRunning = useAuiState(({ thread }) => thread.isRunning);
 
-	// Cycling placeholder state - only cycles in new chats
-	const [placeholderIndex, setPlaceholderIndex] = useState(0);
-
-	// Cycle through placeholders every 4 seconds when thread is empty (new chat)
-	useEffect(() => {
-		// Only cycle when thread is empty (new chat)
-		if (!isThreadEmpty) {
-			// Reset to first placeholder when chat becomes active
-			setPlaceholderIndex(0);
-			return;
-		}
-
-		const intervalId = setInterval(() => {
-			setPlaceholderIndex((prev) => (prev + 1) % CYCLING_PLACEHOLDERS.length);
-		}, 6000);
-
-		return () => clearInterval(intervalId);
-	}, [isThreadEmpty]);
-
-	// Compute current placeholder - only cycle in new chats
-	const currentPlaceholder = isThreadEmpty
-		? CYCLING_PLACEHOLDERS[placeholderIndex]
-		: CYCLING_PLACEHOLDERS[0];
+	const currentPlaceholder = COMPOSER_PLACEHOLDER;
 
 	// Live collaboration state
 	const { data: currentUser } = useAtomValue(currentUserAtom);

From 91ea293fa214bd1290f14c0f125a6ca66c4a875a Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 03:10:06 -0700
Subject: [PATCH 162/202] chore: linting

---
 .../agents/autocomplete/autocomplete_agent.py |  27 +++-
 .../services/vision_autocomplete_service.py   |  27 +++-
 .../components/DesktopContent.tsx             |  36 ++---
 surfsense_web/app/dashboard/layout.tsx        |   2 +-
 surfsense_web/app/desktop/login/page.tsx      |  54 ++-----
 .../app/desktop/permissions/page.tsx          |   5 +-
 surfsense_web/app/desktop/suggestion/page.tsx |  17 +-
 .../app/desktop/suggestion/suggestion.css     | 148 +++++++++---------
 .../components/desktop/shortcut-recorder.tsx  |  16 +-
 .../components/homepage/hero-section.tsx      | 139 ++++++++--------
 .../layout/ui/sidebar/DocumentsSidebar.tsx    |  66 ++++----
 .../components/sources/DocumentUploadTab.tsx  |   2 +-
 surfsense_web/contexts/platform-context.tsx   |   6 +-
 surfsense_web/types/window.d.ts               |   4 +-
 14 files changed, 285 insertions(+), 264 deletions(-)

diff --git a/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py b/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
index 928a133cc..c6a071b0f 100644
--- a/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
+++ b/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
@@ -16,7 +16,8 @@ from __future__ import annotations
 import asyncio
 import logging
 import uuid
-from typing import Any, AsyncGenerator
+from collections.abc import AsyncGenerator
+from typing import Any
 
 from deepagents.graph import BASE_AGENT_PROMPT
 from deepagents.middleware.patch_tool_calls import PatchToolCallsMiddleware
@@ -122,6 +123,7 @@ def _build_autocomplete_system_prompt(app_name: str, window_title: str) -> str:
 
 class _KBResult:
     """Container for pre-computed KB filesystem results."""
+
     __slots__ = ("files", "ls_ai_msg", "ls_tool_msg")
 
     def __init__(
@@ -171,13 +173,16 @@ async def precompute_kb_filesystem(
             return _KBResult()
 
         doc_paths = [
-            p for p, v in new_files.items()
+            p
+            for p, v in new_files.items()
             if p.startswith("/documents/") and v is not None
         ]
         tool_call_id = f"auto_ls_{uuid.uuid4().hex[:12]}"
         ai_msg = AIMessage(
             content="",
-            tool_calls=[{"name": "ls", "args": {"path": "/documents"}, "id": tool_call_id}],
+            tool_calls=[
+                {"name": "ls", "args": {"path": "/documents"}, "id": tool_call_id}
+            ],
         )
         tool_msg = ToolMessage(
             content=str(doc_paths) if doc_paths else "No documents found.",
@@ -186,7 +191,9 @@ async def precompute_kb_filesystem(
         return _KBResult(files=new_files, ls_ai_msg=ai_msg, ls_tool_msg=tool_msg)
 
     except Exception:
-        logger.warning("KB pre-computation failed, proceeding without KB", exc_info=True)
+        logger.warning(
+            "KB pre-computation failed, proceeding without KB", exc_info=True
+        )
         return _KBResult()
 
 
@@ -320,7 +327,9 @@ async def stream_autocomplete_agent(
     )
 
     try:
-        async for event in agent.astream_events(input_data, config=config, version="v2"):
+        async for event in agent.astream_events(
+            input_data, config=config, version="v2"
+        ):
             event_type = event.get("event", "")
 
             if event_type == "on_chat_model_stream":
@@ -338,7 +347,9 @@ async def stream_autocomplete_agent(
                                 yield step_event
                             current_text_id = streaming_service.generate_text_id()
                             yield streaming_service.format_text_start(current_text_id)
-                        yield streaming_service.format_text_delta(current_text_id, content)
+                        yield streaming_service.format_text_delta(
+                            current_text_id, content
+                        )
 
             elif event_type == "on_tool_start":
                 active_tool_depth += 1
@@ -425,5 +436,7 @@ def _describe_tool_call(tool_name: str, tool_input: Any) -> tuple[str, list[str]
         pat = inp.get("pattern", "")
         path = inp.get("path", "")
         display_pat = pat[:60] + ("…" if len(pat) > 60 else "")
-        return "Searching content", [f'"{display_pat}"' + (f" in {path}" if path else "")]
+        return "Searching content", [
+            f'"{display_pat}"' + (f" in {path}" if path else "")
+        ]
     return f"Using {tool_name}", []
diff --git a/surfsense_backend/app/services/vision_autocomplete_service.py b/surfsense_backend/app/services/vision_autocomplete_service.py
index 2c2cd65d2..c28962b31 100644
--- a/surfsense_backend/app/services/vision_autocomplete_service.py
+++ b/surfsense_backend/app/services/vision_autocomplete_service.py
@@ -98,7 +98,9 @@ async def stream_vision_autocomplete(
         step_id=PREP_STEP_ID,
         title="Searching knowledge base",
         status="complete",
-        items=[f"Found {doc_count} document{'s' if doc_count != 1 else ''}"] if kb_query else ["Skipped"],
+        items=[f"Found {doc_count} document{'s' if doc_count != 1 else ''}"]
+        if kb_query
+        else ["Skipped"],
     )
 
     # Build agent input with pre-computed KB as initial state
@@ -116,24 +118,33 @@ async def stream_vision_autocomplete(
             "for the active text area based on what you see."
         )
 
-    user_message = HumanMessage(content=[
-        {"type": "text", "text": instruction},
-        {"type": "image_url", "image_url": {"url": screenshot_data_url}},
-    ])
+    user_message = HumanMessage(
+        content=[
+            {"type": "text", "text": instruction},
+            {"type": "image_url", "image_url": {"url": screenshot_data_url}},
+        ]
+    )
 
     input_data: dict = {"messages": [user_message]}
 
     if has_kb:
         input_data["files"] = kb.files
         input_data["messages"] = [kb.ls_ai_msg, kb.ls_tool_msg, user_message]
-        logger.info("Autocomplete: injected %d KB files into agent initial state", doc_count)
+        logger.info(
+            "Autocomplete: injected %d KB files into agent initial state", doc_count
+        )
     else:
-        logger.info("Autocomplete: no KB documents found, proceeding with screenshot only")
+        logger.info(
+            "Autocomplete: no KB documents found, proceeding with screenshot only"
+        )
 
     # Stream the agent (message_start already sent above)
     try:
         async for sse in stream_autocomplete_agent(
-            agent, input_data, streaming, emit_message_start=False,
+            agent,
+            input_data,
+            streaming,
+            emit_message_start=False,
         ):
             yield sse
     except Exception as e:
diff --git a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
index 07b746a19..a2f9da0f8 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
@@ -3,10 +3,7 @@
 import { Clipboard, Sparkles } from "lucide-react";
 import { useCallback, useEffect, useState } from "react";
 import { toast } from "sonner";
-import {
-	DEFAULT_SHORTCUTS,
-	ShortcutRecorder,
-} from "@/components/desktop/shortcut-recorder";
+import { DEFAULT_SHORTCUTS, ShortcutRecorder } from "@/components/desktop/shortcut-recorder";
 import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
 import { Label } from "@/components/ui/label";
 import { Spinner } from "@/components/ui/spinner";
@@ -29,22 +26,23 @@ export function DesktopContent() {
 
 		let mounted = true;
 
-		Promise.all([
-			api.getAutocompleteEnabled(),
-			api.getShortcuts?.() ?? Promise.resolve(null),
-		]).then(([autoEnabled, config]) => {
-			if (!mounted) return;
-			setEnabled(autoEnabled);
-			if (config) setShortcuts(config);
-			setLoading(false);
-			setShortcutsLoaded(true);
-		}).catch(() => {
-			if (!mounted) return;
-			setLoading(false);
-			setShortcutsLoaded(true);
-		});
+		Promise.all([api.getAutocompleteEnabled(), api.getShortcuts?.() ?? Promise.resolve(null)])
+			.then(([autoEnabled, config]) => {
+				if (!mounted) return;
+				setEnabled(autoEnabled);
+				if (config) setShortcuts(config);
+				setLoading(false);
+				setShortcutsLoaded(true);
+			})
+			.catch(() => {
+				if (!mounted) return;
+				setLoading(false);
+				setShortcutsLoaded(true);
+			});
 
-		return () => { mounted = false; };
+		return () => {
+			mounted = false;
+		};
 	}, [api]);
 
 	if (!api) {
diff --git a/surfsense_web/app/dashboard/layout.tsx b/surfsense_web/app/dashboard/layout.tsx
index 25bea5467..1f5481b15 100644
--- a/surfsense_web/app/dashboard/layout.tsx
+++ b/surfsense_web/app/dashboard/layout.tsx
@@ -3,7 +3,7 @@
 import { useEffect, useState } from "react";
 import { USER_QUERY_KEY } from "@/atoms/user/user-query.atoms";
 import { useGlobalLoadingEffect } from "@/hooks/use-global-loading";
-import { getBearerToken, ensureTokensFromElectron, redirectToLogin } from "@/lib/auth-utils";
+import { ensureTokensFromElectron, getBearerToken, redirectToLogin } from "@/lib/auth-utils";
 import { queryClient } from "@/lib/query-client/client";
 
 interface DashboardLayoutProps {
diff --git a/surfsense_web/app/desktop/login/page.tsx b/surfsense_web/app/desktop/login/page.tsx
index 529577b59..c81e284ba 100644
--- a/surfsense_web/app/desktop/login/page.tsx
+++ b/surfsense_web/app/desktop/login/page.tsx
@@ -2,30 +2,15 @@
 
 import { IconBrandGoogleFilled } from "@tabler/icons-react";
 import { useAtom } from "jotai";
-import {
-	Eye,
-	EyeOff,
-	Keyboard,
-	Clipboard,
-	Sparkles,
-} from "lucide-react";
+import { Clipboard, Eye, EyeOff, Keyboard, Sparkles } from "lucide-react";
 import Image from "next/image";
 import { useRouter } from "next/navigation";
 import { useCallback, useEffect, useState } from "react";
 import { toast } from "sonner";
 import { loginMutationAtom } from "@/atoms/auth/auth-mutation.atoms";
-import {
-	DEFAULT_SHORTCUTS,
-	ShortcutRecorder,
-} from "@/components/desktop/shortcut-recorder";
+import { DEFAULT_SHORTCUTS, ShortcutRecorder } from "@/components/desktop/shortcut-recorder";
 import { Button } from "@/components/ui/button";
-import {
-	Card,
-	CardContent,
-	CardDescription,
-	CardHeader,
-	CardTitle,
-} from "@/components/ui/card";
+import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
 import { Input } from "@/components/ui/input";
 import { Label } from "@/components/ui/label";
 import { Separator } from "@/components/ui/separator";
@@ -38,8 +23,7 @@ const isGoogleAuth = AUTH_TYPE === "GOOGLE";
 export default function DesktopLoginPage() {
 	const router = useRouter();
 	const api = useElectronAPI();
-	const [{ mutateAsync: login, isPending: isLoggingIn }] =
-		useAtom(loginMutationAtom);
+	const [{ mutateAsync: login, isPending: isLoggingIn }] = useAtom(loginMutationAtom);
 
 	const [email, setEmail] = useState("");
 	const [password, setPassword] = useState("");
@@ -54,10 +38,13 @@ export default function DesktopLoginPage() {
 			setShortcutsLoaded(true);
 			return;
 		}
-		api.getShortcuts().then((config) => {
-			if (config) setShortcuts(config);
-			setShortcutsLoaded(true);
-		}).catch(() => setShortcutsLoaded(true));
+		api
+			.getShortcuts()
+			.then((config) => {
+				if (config) setShortcuts(config);
+				setShortcutsLoaded(true);
+			})
+			.catch(() => setShortcutsLoaded(true));
 	}, [api]);
 
 	const updateShortcut = useCallback(
@@ -118,8 +105,7 @@ export default function DesktopLoginPage() {
 				<div
 					className="absolute -top-1/2 left-1/2 size-[800px] -translate-x-1/2 rounded-full opacity-[0.03]"
 					style={{
-						background:
-							"radial-gradient(circle, hsl(var(--primary)) 0%, transparent 70%)",
+						background: "radial-gradient(circle, hsl(var(--primary)) 0%, transparent 70%)",
 					}}
 				/>
 			</div>
@@ -135,9 +121,7 @@ export default function DesktopLoginPage() {
 						priority
 					/>
 					<CardTitle className="text-xl">Welcome to SurfSense Desktop App</CardTitle>
-					<CardDescription>
-						Configure your shortcuts, then sign in to get started.
-					</CardDescription>
+					<CardDescription>Configure your shortcuts, then sign in to get started.</CardDescription>
 				</CardHeader>
 
 				<CardContent className="flex flex-col gap-6">
@@ -181,11 +165,7 @@ export default function DesktopLoginPage() {
 
 					{/* ---- Auth Section (second) ---- */}
 					{isGoogleAuth ? (
-						<Button
-							variant="outline"
-							className="w-full gap-2 py-5"
-							onClick={handleGoogleLogin}
-						>
+						<Button variant="outline" className="w-full gap-2 py-5" onClick={handleGoogleLogin}>
 							<IconBrandGoogleFilled className="size-5" />
 							Continue with Google
 						</Button>
@@ -230,11 +210,7 @@ export default function DesktopLoginPage() {
 										className="absolute inset-y-0 right-0 flex items-center pr-3 text-muted-foreground hover:text-foreground"
 										tabIndex={-1}
 									>
-										{showPassword ? (
-											<EyeOff className="size-4" />
-										) : (
-											<Eye className="size-4" />
-										)}
+										{showPassword ? <EyeOff className="size-4" /> : <Eye className="size-4" />}
 									</button>
 								</div>
 							</div>
diff --git a/surfsense_web/app/desktop/permissions/page.tsx b/surfsense_web/app/desktop/permissions/page.tsx
index b636fcd7c..a2fadc8ff 100644
--- a/surfsense_web/app/desktop/permissions/page.tsx
+++ b/surfsense_web/app/desktop/permissions/page.tsx
@@ -80,7 +80,9 @@ export default function DesktopPermissionsPage() {
 
 		poll();
 		interval = setInterval(poll, 2000);
-		return () => { if (interval) clearInterval(interval); };
+		return () => {
+			if (interval) clearInterval(interval);
+		};
 	}, [api]);
 
 	if (!api) {
@@ -204,6 +206,7 @@ export default function DesktopPermissionsPage() {
 								Grant permissions to continue
 							</Button>
 							<button
+								type="button"
 								onClick={handleSkip}
 								className="block mx-auto text-xs text-muted-foreground hover:text-foreground transition-colors"
 							>
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index 587bee9db..8d9095320 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -2,7 +2,7 @@
 
 import { useCallback, useEffect, useRef, useState } from "react";
 import { useElectronAPI } from "@/hooks/use-platform";
-import { getBearerToken, ensureTokensFromElectron } from "@/lib/auth-utils";
+import { ensureTokensFromElectron, getBearerToken } from "@/lib/auth-utils";
 
 type SSEEvent =
 	| { type: "text-delta"; id: string; delta: string }
@@ -48,9 +48,20 @@ const AUTO_DISMISS_MS = 3000;
 function StepIcon({ status }: { status: string }) {
 	if (status === "complete") {
 		return (
-			<svg className="step-icon step-icon-done" viewBox="0 0 16 16" fill="none">
+			<svg
+				className="step-icon step-icon-done"
+				viewBox="0 0 16 16"
+				fill="none"
+				aria-label="Step complete"
+			>
 				<circle cx="8" cy="8" r="7" stroke="#4ade80" strokeWidth="1.5" />
-				<path d="M5 8.5l2 2 4-4.5" stroke="#4ade80" strokeWidth="1.5" strokeLinecap="round" strokeLinejoin="round" />
+				<path
+					d="M5 8.5l2 2 4-4.5"
+					stroke="#4ade80"
+					strokeWidth="1.5"
+					strokeLinecap="round"
+					strokeLinejoin="round"
+				/>
 			</svg>
 		);
 	}
diff --git a/surfsense_web/app/desktop/suggestion/suggestion.css b/surfsense_web/app/desktop/suggestion/suggestion.css
index 57a7fd4f4..2aa614efb 100644
--- a/surfsense_web/app/desktop/suggestion/suggestion.css
+++ b/surfsense_web/app/desktop/suggestion/suggestion.css
@@ -19,59 +19,59 @@ body:has(.suggestion-body) {
 }
 
 .suggestion-tooltip {
-  box-sizing: border-box;
-  background: #1e1e1e;
-  border: 1px solid #3c3c3c;
-  border-radius: 8px;
-  padding: 8px 12px;
-  margin: 4px;
-  max-width: 400px;
-  /* MAX_HEIGHT in suggestion-window.ts is 400px. Subtract 8px for margin
+	box-sizing: border-box;
+	background: #1e1e1e;
+	border: 1px solid #3c3c3c;
+	border-radius: 8px;
+	padding: 8px 12px;
+	margin: 4px;
+	max-width: 400px;
+	/* MAX_HEIGHT in suggestion-window.ts is 400px. Subtract 8px for margin
      (4px * 2) so the tooltip + margin fits within the Electron window.
      box-sizing: border-box ensures padding + border are included. */
-  max-height: 392px;
-  box-shadow: 0 4px 16px rgba(0, 0, 0, 0.5);
-  display: flex;
-  flex-direction: column;
-  overflow: hidden;
+	max-height: 392px;
+	box-shadow: 0 4px 16px rgba(0, 0, 0, 0.5);
+	display: flex;
+	flex-direction: column;
+	overflow: hidden;
 }
 
 .suggestion-text {
-  color: #d4d4d4;
-  font-size: 13px;
-  line-height: 1.45;
-  margin: 0 0 6px 0;
-  word-wrap: break-word;
-  white-space: pre-wrap;
-  overflow-y: auto;
-  flex: 1 1 auto;
-  min-height: 0;
+	color: #d4d4d4;
+	font-size: 13px;
+	line-height: 1.45;
+	margin: 0 0 6px 0;
+	word-wrap: break-word;
+	white-space: pre-wrap;
+	overflow-y: auto;
+	flex: 1 1 auto;
+	min-height: 0;
 }
 
 .suggestion-text::-webkit-scrollbar {
-  width: 5px;
+	width: 5px;
 }
 
 .suggestion-text::-webkit-scrollbar-track {
-  background: transparent;
+	background: transparent;
 }
 
 .suggestion-text::-webkit-scrollbar-thumb {
-  background: #555;
-  border-radius: 3px;
+	background: #555;
+	border-radius: 3px;
 }
 
 .suggestion-text::-webkit-scrollbar-thumb:hover {
-  background: #777;
+	background: #777;
 }
 
 .suggestion-actions {
-  display: flex;
-  justify-content: flex-end;
-  gap: 4px;
-  border-top: 1px solid #2a2a2a;
-  padding-top: 6px;
-  flex-shrink: 0;
+	display: flex;
+	justify-content: flex-end;
+	gap: 4px;
+	border-top: 1px solid #2a2a2a;
+	padding-top: 6px;
+	flex-shrink: 0;
 }
 
 .suggestion-btn {
@@ -120,74 +120,74 @@ body:has(.suggestion-body) {
 /* --- Agent activity indicator --- */
 
 .agent-activity {
-  display: flex;
-  flex-direction: column;
-  gap: 4px;
-  overflow-y: auto;
-  max-height: 340px;
+	display: flex;
+	flex-direction: column;
+	gap: 4px;
+	overflow-y: auto;
+	max-height: 340px;
 }
 
 .activity-initial {
-  display: flex;
-  align-items: center;
-  gap: 8px;
-  padding: 2px 0;
+	display: flex;
+	align-items: center;
+	gap: 8px;
+	padding: 2px 0;
 }
 
 .activity-label {
-  color: #a1a1aa;
-  font-size: 12px;
-  white-space: nowrap;
-  overflow: hidden;
-  text-overflow: ellipsis;
+	color: #a1a1aa;
+	font-size: 12px;
+	white-space: nowrap;
+	overflow: hidden;
+	text-overflow: ellipsis;
 }
 
 .activity-steps {
-  display: flex;
-  flex-direction: column;
-  gap: 3px;
+	display: flex;
+	flex-direction: column;
+	gap: 3px;
 }
 
 .activity-step {
-  display: flex;
-  align-items: center;
-  gap: 6px;
-  min-height: 18px;
+	display: flex;
+	align-items: center;
+	gap: 6px;
+	min-height: 18px;
 }
 
 .step-label {
-  color: #d4d4d4;
-  font-size: 12px;
-  white-space: nowrap;
-  overflow: hidden;
-  text-overflow: ellipsis;
+	color: #d4d4d4;
+	font-size: 12px;
+	white-space: nowrap;
+	overflow: hidden;
+	text-overflow: ellipsis;
 }
 
 .step-detail {
-  color: #71717a;
-  font-size: 11px;
+	color: #71717a;
+	font-size: 11px;
 }
 
 /* Spinner (in_progress) */
 .step-spinner {
-  width: 14px;
-  height: 14px;
-  flex-shrink: 0;
-  border: 1.5px solid #3f3f46;
-  border-top-color: #a78bfa;
-  border-radius: 50%;
-  animation: step-spin 0.7s linear infinite;
+	width: 14px;
+	height: 14px;
+	flex-shrink: 0;
+	border: 1.5px solid #3f3f46;
+	border-top-color: #a78bfa;
+	border-radius: 50%;
+	animation: step-spin 0.7s linear infinite;
 }
 
 /* Checkmark icon (complete) */
 .step-icon {
-  width: 14px;
-  height: 14px;
-  flex-shrink: 0;
+	width: 14px;
+	height: 14px;
+	flex-shrink: 0;
 }
 
 @keyframes step-spin {
-  to {
-    transform: rotate(360deg);
-  }
+	to {
+		transform: rotate(360deg);
+	}
 }
diff --git a/surfsense_web/components/desktop/shortcut-recorder.tsx b/surfsense_web/components/desktop/shortcut-recorder.tsx
index 0c0012002..6d5e93a65 100644
--- a/surfsense_web/components/desktop/shortcut-recorder.tsx
+++ b/surfsense_web/components/desktop/shortcut-recorder.tsx
@@ -44,13 +44,7 @@ export const DEFAULT_SHORTCUTS = {
 // Kbd pill component
 // ---------------------------------------------------------------------------
 
-export function Kbd({
-	keys,
-	className,
-}: {
-	keys: string[];
-	className?: string;
-}) {
+export function Kbd({ keys, className }: { keys: string[]; className?: string }) {
 	return (
 		<span className={cn("inline-flex items-center gap-1", className)}>
 			{keys.map((key) => (
@@ -123,9 +117,7 @@ export function ShortcutRecorder({
 				</div>
 				<div className="min-w-0">
 					<p className="text-sm font-medium leading-none">{label}</p>
-					<p className="mt-1 text-xs text-muted-foreground truncate">
-						{description}
-					</p>
+					<p className="mt-1 text-xs text-muted-foreground truncate">{description}</p>
 				</div>
 			</div>
 
@@ -155,9 +147,7 @@ export function ShortcutRecorder({
 					)}
 				>
 					{recording ? (
-						<span className="text-xs text-primary animate-pulse">
-							Press keys...
-						</span>
+						<span className="text-xs text-primary animate-pulse">Press keys...</span>
 					) : (
 						<Kbd keys={displayKeys} />
 					)}
diff --git a/surfsense_web/components/homepage/hero-section.tsx b/surfsense_web/components/homepage/hero-section.tsx
index 60f293005..c8dde97ee 100644
--- a/surfsense_web/components/homepage/hero-section.tsx
+++ b/surfsense_web/components/homepage/hero-section.tsx
@@ -1,21 +1,14 @@
 "use client";
-import { AnimatePresence, motion } from "motion/react";
 import { Monitor } from "lucide-react";
+import { AnimatePresence, motion } from "motion/react";
 import Link from "next/link";
-import React, { useCallback, useEffect, useRef, useState, memo } from "react";
+import React, { memo, useCallback, useEffect, useRef, useState } from "react";
 import Balancer from "react-wrap-balancer";
+import { ExpandedMediaOverlay, useExpandedMedia } from "@/components/ui/expanded-gif-overlay";
+import { Tooltip, TooltipContent, TooltipTrigger } from "@/components/ui/tooltip";
 import { AUTH_TYPE, BACKEND_URL } from "@/lib/env-config";
 import { trackLoginAttempt } from "@/lib/posthog/events";
 import { cn } from "@/lib/utils";
-import {
-	ExpandedMediaOverlay,
-	useExpandedMedia,
-} from "@/components/ui/expanded-gif-overlay";
-import {
-	Tooltip,
-	TooltipContent,
-	TooltipTrigger,
-} from "@/components/ui/tooltip";
 
 const GoogleLogo = ({ className }: { className?: string }) => (
 	<svg
@@ -61,8 +54,7 @@ const TAB_ITEMS = [
 	},
 	{
 		title: "Search & Citation",
-		description:
-			"Ask questions and get cited responses from your knowledge base.",
+		description: "Ask questions and get cited responses from your knowledge base.",
 		src: "/homepage/hero_tutorial/BSNCGif.mp4",
 		featured: false,
 	},
@@ -86,15 +78,13 @@ const TAB_ITEMS = [
 	},
 	{
 		title: "Image Generation",
-		description:
-			"Generate high-quality images easily from your conversations.",
+		description: "Generate high-quality images easily from your conversations.",
 		src: "/homepage/hero_tutorial/ImageGenGif.mp4",
 		featured: false,
 	},
 	{
 		title: "Collaborative Chat",
-		description:
-			"Collaborate on AI-powered conversations in realtime with your team.",
+		description: "Collaborate on AI-powered conversations in realtime with your team.",
 		src: "/homepage/hero_realtime/RealTimeChatGif.mp4",
 		featured: false,
 	},
@@ -106,8 +96,7 @@ const TAB_ITEMS = [
 	},
 	{
 		title: "Video Generation",
-		description:
-			"Create short videos with AI-generated visuals and narration from your sources.",
+		description: "Create short videos with AI-generated visuals and narration from your sources.",
 		src: "/homepage/hero_tutorial/video_gen_surf.mp4",
 		featured: false,
 	},
@@ -119,7 +108,7 @@ export function HeroSection() {
 			<div className="mt-4 flex w-full min-w-0 flex-col items-start px-2 md:px-8 xl:px-0">
 				<h1
 					className={cn(
-						"relative mt-4 max-w-7xl text-left text-4xl font-bold tracking-tight text-balance text-neutral-900 sm:text-5xl md:text-6xl xl:text-8xl dark:text-neutral-50",
+						"relative mt-4 max-w-7xl text-left text-4xl font-bold tracking-tight text-balance text-neutral-900 sm:text-5xl md:text-6xl xl:text-8xl dark:text-neutral-50"
 					)}
 				>
 					<Balancer>NotebookLM for Teams</Balancer>
@@ -128,10 +117,11 @@ export function HeroSection() {
 					<div>
 						<h2
 							className={cn(
-								"relative mb-8 max-w-2xl text-left text-sm tracking-wide text-neutral-600 antialiased sm:text-base md:text-xl dark:text-neutral-400",
+								"relative mb-8 max-w-2xl text-left text-sm tracking-wide text-neutral-600 antialiased sm:text-base md:text-xl dark:text-neutral-400"
 							)}
 						>
-							An open source, privacy focused alternative to NotebookLM for teams with no data limits.
+							An open source, privacy focused alternative to NotebookLM for teams with no data
+							limits.
 						</h2>
 
 						<div className="relative mb-4 flex w-full flex-col justify-center gap-y-2 sm:flex-row sm:justify-start sm:space-y-0 sm:space-x-4">
@@ -194,33 +184,34 @@ const BrowserWindow = () => {
 					<div className="no-visible-scrollbar flex min-w-0 shrink flex-row items-center justify-start gap-2 overflow-x-auto mask-l-from-98% py-0.5 pr-2 pl-2 md:pl-4">
 						{TAB_ITEMS.map((item, index) => (
 							<React.Fragment key={item.title}>
-							<button
-								type="button"
-								onClick={() => setSelectedIndex(index)}
-								className={cn(
-									"flex shrink-0 items-center gap-1.5 rounded-md px-2 py-1 text-xs transition duration-150 hover:bg-white sm:text-sm dark:hover:bg-neutral-950",
-									selectedIndex === index && !item.featured &&
-										"bg-white shadow ring-1 shadow-black/10 ring-black/10 dark:bg-neutral-900",
-									selectedIndex === index && item.featured &&
-										"bg-amber-50 shadow ring-1 shadow-amber-200/50 ring-amber-400/60 dark:bg-amber-950/40 dark:shadow-amber-900/30 dark:ring-amber-500/50",
-									item.featured && selectedIndex !== index &&
-										"hover:bg-amber-50 dark:hover:bg-amber-950/30",
-								)}
-							>
+								<button
+									type="button"
+									onClick={() => setSelectedIndex(index)}
+									className={cn(
+										"flex shrink-0 items-center gap-1.5 rounded-md px-2 py-1 text-xs transition duration-150 hover:bg-white sm:text-sm dark:hover:bg-neutral-950",
+										selectedIndex === index &&
+											!item.featured &&
+											"bg-white shadow ring-1 shadow-black/10 ring-black/10 dark:bg-neutral-900",
+										selectedIndex === index &&
+											item.featured &&
+											"bg-amber-50 shadow ring-1 shadow-amber-200/50 ring-amber-400/60 dark:bg-amber-950/40 dark:shadow-amber-900/30 dark:ring-amber-500/50",
+										item.featured &&
+											selectedIndex !== index &&
+											"hover:bg-amber-50 dark:hover:bg-amber-950/30"
+									)}
+								>
 									{item.title}
-								{item.featured && (
-									<Tooltip>
-										<TooltipTrigger asChild>
-											<span className="inline-flex shrink-0 items-center justify-center rounded border border-amber-300 bg-amber-100 p-0.5 text-amber-700 dark:border-amber-700 dark:bg-amber-900/50 dark:text-amber-400">
-												<Monitor className="size-3" />
-											</span>
-										</TooltipTrigger>
-										<TooltipContent side="bottom">
-											Desktop app only
-										</TooltipContent>
-									</Tooltip>
-								)}
-							</button>
+									{item.featured && (
+										<Tooltip>
+											<TooltipTrigger asChild>
+												<span className="inline-flex shrink-0 items-center justify-center rounded border border-amber-300 bg-amber-100 p-0.5 text-amber-700 dark:border-amber-700 dark:bg-amber-900/50 dark:text-amber-400">
+													<Monitor className="size-3" />
+												</span>
+											</TooltipTrigger>
+											<TooltipContent side="bottom">Desktop app only</TooltipContent>
+										</Tooltip>
+									)}
+								</button>
 								{index !== TAB_ITEMS.length - 1 && (
 									<div className="h-4 w-px shrink-0 rounded-full bg-neutral-300 dark:bg-neutral-700" />
 								)}
@@ -263,13 +254,13 @@ const BrowserWindow = () => {
 									</p>
 								</div>
 							</div>
-							{/* biome-ignore lint/a11y/useKeyWithClickEvents: wrapper for video expand */}
-							<div
-								className="cursor-pointer bg-neutral-50 p-2 sm:p-3 dark:bg-neutral-950"
+							<button
+								type="button"
+								className="cursor-pointer bg-neutral-50 p-2 sm:p-3 dark:bg-neutral-950 w-full"
 								onClick={open}
 							>
 								<TabVideo src={selectedItem.src} />
-							</div>
+							</button>
 						</motion.div>
 					</AnimatePresence>
 				</div>
@@ -277,11 +268,7 @@ const BrowserWindow = () => {
 
 			<AnimatePresence>
 				{expanded && (
-					<ExpandedMediaOverlay
-						src={selectedItem.src}
-						alt={selectedItem.title}
-						onClose={close}
-					/>
+					<ExpandedMediaOverlay src={selectedItem.src} alt={selectedItem.title} onClose={close} />
 				)}
 			</AnimatePresence>
 		</>
@@ -297,7 +284,7 @@ const TabVideo = memo(function TabVideo({ src }: { src: string }) {
 		const video = videoRef.current;
 		if (!video) return;
 		video.currentTime = 0;
-		video.play().catch(() => { });
+		video.play().catch(() => {});
 	}, [src]);
 
 	const handleCanPlay = useCallback(() => {
@@ -324,8 +311,7 @@ const TabVideo = memo(function TabVideo({ src }: { src: string }) {
 	);
 });
 
-const GITHUB_RELEASES_URL =
-	"https://github.com/MODSetter/SurfSense/releases/latest";
+const GITHUB_RELEASES_URL = "https://github.com/MODSetter/SurfSense/releases/latest";
 
 const DownloadApp = memo(function DownloadApp() {
 	return (
@@ -340,7 +326,16 @@ const DownloadApp = memo(function DownloadApp() {
 					rel="noopener noreferrer"
 					className="flex items-center gap-2 rounded-lg border border-neutral-200 bg-white px-4 py-2.5 text-sm font-medium text-neutral-700 shadow-sm transition hover:bg-neutral-50 dark:border-neutral-700 dark:bg-neutral-900 dark:text-neutral-200 dark:hover:bg-neutral-800"
 				>
-					<svg className="size-4" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2" strokeLinecap="round" strokeLinejoin="round">
+					<svg
+						className="size-4"
+						viewBox="0 0 24 24"
+						fill="none"
+						stroke="currentColor"
+						strokeWidth="2"
+						strokeLinecap="round"
+						strokeLinejoin="round"
+						aria-label="Download for macOS"
+					>
 						<path d="M12 17V3" />
 						<path d="m6 11 6 6 6-6" />
 						<path d="M19 21H5" />
@@ -353,7 +348,16 @@ const DownloadApp = memo(function DownloadApp() {
 					rel="noopener noreferrer"
 					className="flex items-center gap-2 rounded-lg border border-neutral-200 bg-white px-4 py-2.5 text-sm font-medium text-neutral-700 shadow-sm transition hover:bg-neutral-50 dark:border-neutral-700 dark:bg-neutral-900 dark:text-neutral-200 dark:hover:bg-neutral-800"
 				>
-					<svg className="size-4" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2" strokeLinecap="round" strokeLinejoin="round">
+					<svg
+						className="size-4"
+						viewBox="0 0 24 24"
+						fill="none"
+						stroke="currentColor"
+						strokeWidth="2"
+						strokeLinecap="round"
+						strokeLinejoin="round"
+						aria-label="Download for Windows"
+					>
 						<path d="M12 17V3" />
 						<path d="m6 11 6 6 6-6" />
 						<path d="M19 21H5" />
@@ -366,7 +370,16 @@ const DownloadApp = memo(function DownloadApp() {
 					rel="noopener noreferrer"
 					className="flex items-center gap-2 rounded-lg border border-neutral-200 bg-white px-4 py-2.5 text-sm font-medium text-neutral-700 shadow-sm transition hover:bg-neutral-50 dark:border-neutral-700 dark:bg-neutral-900 dark:text-neutral-200 dark:hover:bg-neutral-800"
 				>
-					<svg className="size-4" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="2" strokeLinecap="round" strokeLinejoin="round">
+					<svg
+						className="size-4"
+						viewBox="0 0 24 24"
+						fill="none"
+						stroke="currentColor"
+						strokeWidth="2"
+						strokeLinecap="round"
+						strokeLinejoin="round"
+						aria-label="Download for Linux"
+					>
 						<path d="M12 17V3" />
 						<path d="m6 11 6 6 6-6" />
 						<path d="M19 21H5" />
diff --git a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
index 35489fe32..6de235d17 100644
--- a/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
+++ b/surfsense_web/components/layout/ui/sidebar/DocumentsSidebar.tsx
@@ -302,24 +302,27 @@ export function DocumentsSidebar({
 		[searchSpaceId, electronAPI]
 	);
 
-	const handleStopWatching = useCallback(async (folder: FolderDisplay) => {
-		if (!electronAPI) return;
+	const handleStopWatching = useCallback(
+		async (folder: FolderDisplay) => {
+			if (!electronAPI) return;
 
-		const watchedFolders = await electronAPI.getWatchedFolders();
-		const matched = watchedFolders.find((wf) => wf.rootFolderId === folder.id);
-		if (!matched) {
-			toast.error("This folder is not being watched");
-			return;
-		}
+			const watchedFolders = await electronAPI.getWatchedFolders();
+			const matched = watchedFolders.find((wf) => wf.rootFolderId === folder.id);
+			if (!matched) {
+				toast.error("This folder is not being watched");
+				return;
+			}
 
-		await electronAPI.removeWatchedFolder(matched.path);
-		try {
-			await foldersApiService.stopWatching(folder.id);
-		} catch (err) {
-			console.error("[DocumentsSidebar] Failed to clear watched metadata:", err);
-		}
-		toast.success(`Stopped watching: ${matched.name}`);
-	}, [electronAPI]);
+			await electronAPI.removeWatchedFolder(matched.path);
+			try {
+				await foldersApiService.stopWatching(folder.id);
+			} catch (err) {
+				console.error("[DocumentsSidebar] Failed to clear watched metadata:", err);
+			}
+			toast.success(`Stopped watching: ${matched.name}`);
+		},
+		[electronAPI]
+	);
 
 	const handleRenameFolder = useCallback(async (folder: FolderDisplay, newName: string) => {
 		try {
@@ -330,22 +333,25 @@ export function DocumentsSidebar({
 		}
 	}, []);
 
-	const handleDeleteFolder = useCallback(async (folder: FolderDisplay) => {
-		if (!confirm(`Delete folder "${folder.name}" and all its contents?`)) return;
-		try {
-			if (electronAPI) {
-				const watchedFolders = await electronAPI.getWatchedFolders();
-				const matched = watchedFolders.find((wf) => wf.rootFolderId === folder.id);
-				if (matched) {
-					await electronAPI.removeWatchedFolder(matched.path);
+	const handleDeleteFolder = useCallback(
+		async (folder: FolderDisplay) => {
+			if (!confirm(`Delete folder "${folder.name}" and all its contents?`)) return;
+			try {
+				if (electronAPI) {
+					const watchedFolders = await electronAPI.getWatchedFolders();
+					const matched = watchedFolders.find((wf) => wf.rootFolderId === folder.id);
+					if (matched) {
+						await electronAPI.removeWatchedFolder(matched.path);
+					}
 				}
+				await foldersApiService.deleteFolder(folder.id);
+				toast.success("Folder deleted");
+			} catch (e: unknown) {
+				toast.error((e as Error)?.message || "Failed to delete folder");
 			}
-			await foldersApiService.deleteFolder(folder.id);
-			toast.success("Folder deleted");
-		} catch (e: unknown) {
-			toast.error((e as Error)?.message || "Failed to delete folder");
-		}
-	}, [electronAPI]);
+		},
+		[electronAPI]
+	);
 
 	const handleMoveFolder = useCallback(
 		(folder: FolderDisplay) => {
diff --git a/surfsense_web/components/sources/DocumentUploadTab.tsx b/surfsense_web/components/sources/DocumentUploadTab.tsx
index 28e160261..76af48c45 100644
--- a/surfsense_web/components/sources/DocumentUploadTab.tsx
+++ b/surfsense_web/components/sources/DocumentUploadTab.tsx
@@ -25,8 +25,8 @@ import {
 import { Progress } from "@/components/ui/progress";
 import { Spinner } from "@/components/ui/spinner";
 import { Switch } from "@/components/ui/switch";
-import { documentsApiService } from "@/lib/apis/documents-api.service";
 import { useElectronAPI } from "@/hooks/use-platform";
+import { documentsApiService } from "@/lib/apis/documents-api.service";
 import {
 	trackDocumentUploadFailure,
 	trackDocumentUploadStarted,
diff --git a/surfsense_web/contexts/platform-context.tsx b/surfsense_web/contexts/platform-context.tsx
index bb3e3800d..578901214 100644
--- a/surfsense_web/contexts/platform-context.tsx
+++ b/surfsense_web/contexts/platform-context.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { createContext, useEffect, useState, type ReactNode } from "react";
+import { createContext, type ReactNode, useEffect, useState } from "react";
 
 export interface PlatformContextValue {
 	isDesktop: boolean;
@@ -25,7 +25,5 @@ export function PlatformProvider({ children }: { children: ReactNode }) {
 		setValue({ isDesktop, isWeb: !isDesktop, electronAPI: api });
 	}, []);
 
-	return (
-		<PlatformContext.Provider value={value}>{children}</PlatformContext.Provider>
-	);
+	return <PlatformContext.Provider value={value}>{children}</PlatformContext.Provider>;
 }
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 961ad9066..3f228066a 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -90,7 +90,9 @@ interface ElectronAPI {
 	setAuthTokens: (bearer: string, refresh: string) => Promise<void>;
 	// Keyboard shortcut configuration
 	getShortcuts: () => Promise<{ quickAsk: string; autocomplete: string }>;
-	setShortcuts: (config: Partial<{ quickAsk: string; autocomplete: string }>) => Promise<{ quickAsk: string; autocomplete: string }>;
+	setShortcuts: (
+		config: Partial<{ quickAsk: string; autocomplete: string }>
+	) => Promise<{ quickAsk: string; autocomplete: string }>;
 }
 
 declare global {

From e574b5ec4a5fcc46b4ef6104138fe078ab027b3b Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 03:17:10 -0700
Subject: [PATCH 163/202] refactor: remove prompt picker display on quick ask
 text retrieval

- Eliminated the automatic display of the prompt picker when quick ask text is retrieved from the Electron API, streamlining the user experience.
---
 surfsense_web/components/assistant-ui/thread.tsx | 1 -
 1 file changed, 1 deletion(-)

diff --git a/surfsense_web/components/assistant-ui/thread.tsx b/surfsense_web/components/assistant-ui/thread.tsx
index 6c8c619b2..e0086cd66 100644
--- a/surfsense_web/components/assistant-ui/thread.tsx
+++ b/surfsense_web/components/assistant-ui/thread.tsx
@@ -364,7 +364,6 @@ const Composer: FC = () => {
 		electronAPI.getQuickAskText().then((text) => {
 			if (text) {
 				setClipboardInitialText(text);
-				setShowPromptPicker(true);
 			}
 		});
 	}, [electronAPI]);

From 27e9e8d8736e0b71d4082010f125e4b477e81b1d Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 03:42:46 -0700
Subject: [PATCH 164/202] feat: add general assist feature and enhance shortcut
 management

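- Introduced a new "General Assist" shortcut, allowing users to open SurfSense from anywhere.
- Added a system tray icon with "Open SurfSense" and "Quit" actions; closing the main window now hides it instead of quitting, and the app keeps running in the background after all windows are closed.
- Updated shortcut management to include the new general assist functionality in both the desktop and web applications.
- Enhanced the UI to reflect changes in shortcut labels and descriptions for better clarity ("Quick Ask" is now labeled "Quick Assist" and "Autocomplete" is now labeled "Extreme Assist").
- Improved the Electron API to support the new shortcut configuration.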
---
 surfsense_desktop/electron-builder.yml        |  3 +
 surfsense_desktop/src/ipc/handlers.ts         |  2 +
 surfsense_desktop/src/main.ts                 | 34 ++++++--
 surfsense_desktop/src/modules/quick-ask.ts    |  2 +-
 surfsense_desktop/src/modules/shortcuts.ts    |  2 +
 surfsense_desktop/src/modules/tray.ts         | 77 +++++++++++++++++++
 .../components/DesktopContent.tsx             | 44 +++++++----
 surfsense_web/app/desktop/login/page.tsx      | 21 +++--
 .../components/desktop/shortcut-recorder.tsx  |  1 +
 surfsense_web/types/window.d.ts               |  6 +-
 10 files changed, 159 insertions(+), 33 deletions(-)
 create mode 100644 surfsense_desktop/src/modules/tray.ts

diff --git a/surfsense_desktop/electron-builder.yml b/surfsense_desktop/electron-builder.yml
index 4d6f0b283..2c46c827a 100644
--- a/surfsense_desktop/electron-builder.yml
+++ b/surfsense_desktop/electron-builder.yml
@@ -19,6 +19,9 @@ files:
   - "!scripts"
   - "!release"
 extraResources:
+  - from: assets/
+    to: assets/
+    filter: ["*.ico", "*.png", "*.icns"]
   - from: ../surfsense_web/.next/standalone/surfsense_web/
     to: standalone/
     filter:
diff --git a/surfsense_desktop/src/ipc/handlers.ts b/surfsense_desktop/src/ipc/handlers.ts
index 7872e7a42..a583e5afc 100644
--- a/surfsense_desktop/src/ipc/handlers.ts
+++ b/surfsense_desktop/src/ipc/handlers.ts
@@ -23,6 +23,7 @@ import {
 import { getShortcuts, setShortcuts, type ShortcutConfig } from '../modules/shortcuts';
 import { reregisterQuickAsk } from '../modules/quick-ask';
 import { reregisterAutocomplete } from '../modules/autocomplete';
+import { reregisterGeneralAssist } from '../modules/tray';
 
 let authTokens: { bearer: string; refresh: string } | null = null;
 
@@ -107,6 +108,7 @@ export function registerIpcHandlers(): void {
 
   ipcMain.handle(IPC_CHANNELS.SET_SHORTCUTS, async (_event, config: Partial<ShortcutConfig>) => {
     const updated = await setShortcuts(config);
+    if (config.generalAssist) await reregisterGeneralAssist();
     if (config.quickAsk) await reregisterQuickAsk();
     if (config.autocomplete) await reregisterAutocomplete();
     return updated;
diff --git a/surfsense_desktop/src/main.ts b/surfsense_desktop/src/main.ts
index 9eae8a4db..95b0359c8 100644
--- a/surfsense_desktop/src/main.ts
+++ b/surfsense_desktop/src/main.ts
@@ -1,7 +1,9 @@
 import { app, BrowserWindow } from 'electron';
+
+let isQuitting = false;
 import { registerGlobalErrorHandlers, showErrorDialog } from './modules/errors';
 import { startNextServer } from './modules/server';
-import { createMainWindow } from './modules/window';
+import { createMainWindow, getMainWindow } from './modules/window';
 import { setupDeepLinks, handlePendingDeepLink } from './modules/deep-links';
 import { setupAutoUpdater } from './modules/auto-updater';
 import { setupMenu } from './modules/menu';
@@ -9,6 +11,7 @@ import { registerQuickAsk, unregisterQuickAsk } from './modules/quick-ask';
 import { registerAutocomplete, unregisterAutocomplete } from './modules/autocomplete';
 import { registerFolderWatcher, unregisterFolderWatcher } from './modules/folder-watcher';
 import { registerIpcHandlers } from './ipc/handlers';
+import { createTray, destroyTray } from './modules/tray';
 
 registerGlobalErrorHandlers();
 
@@ -28,7 +31,18 @@ app.whenReady().then(async () => {
     return;
   }
 
-  createMainWindow('/dashboard');
+  await createTray();
+
+  const win = createMainWindow('/dashboard');
+
+  // Minimize to tray instead of closing the app
+  win.on('close', (e) => {
+    if (!isQuitting) {
+      e.preventDefault();
+      win.hide();
+    }
+  });
+
   await registerQuickAsk();
   await registerAutocomplete();
   registerFolderWatcher();
@@ -37,20 +51,28 @@ app.whenReady().then(async () => {
   handlePendingDeepLink();
 
   app.on('activate', () => {
-    if (BrowserWindow.getAllWindows().length === 0) {
+    const mw = getMainWindow();
+    if (!mw || mw.isDestroyed()) {
       createMainWindow('/dashboard');
+    } else {
+      mw.show();
+      mw.focus();
     }
   });
 });
 
+// Keep running in the background — the tray "Quit" calls app.exit()
 app.on('window-all-closed', () => {
-  if (process.platform !== 'darwin') {
-    app.quit();
-  }
+  // Do nothing: the app stays alive in the tray
+});
+
+app.on('before-quit', () => {
+  isQuitting = true;
 });
 
 app.on('will-quit', () => {
   unregisterQuickAsk();
   unregisterAutocomplete();
   unregisterFolderWatcher();
+  destroyTray();
 });
diff --git a/surfsense_desktop/src/modules/quick-ask.ts b/surfsense_desktop/src/modules/quick-ask.ts
index a015bfabf..224444be6 100644
--- a/surfsense_desktop/src/modules/quick-ask.ts
+++ b/surfsense_desktop/src/modules/quick-ask.ts
@@ -114,7 +114,7 @@ async function quickAskHandler(): Promise<void> {
   const text = selected || savedClipboard.trim();
 
   sourceApp = getFrontmostApp();
-  console.log('[quick-ask] Source app:', sourceApp, '| Opening Quick Ask with', text.length, 'chars', selected ? '(selected)' : text ? '(clipboard fallback)' : '(empty)');
+  console.log('[quick-ask] Source app:', sourceApp, '| Opening Quick Assist with', text.length, 'chars', selected ? '(selected)' : text ? '(clipboard fallback)' : '(empty)');
   openQuickAsk(text);
 }
 
diff --git a/surfsense_desktop/src/modules/shortcuts.ts b/surfsense_desktop/src/modules/shortcuts.ts
index 8173b96c1..6948a005e 100644
--- a/surfsense_desktop/src/modules/shortcuts.ts
+++ b/surfsense_desktop/src/modules/shortcuts.ts
@@ -1,9 +1,11 @@
 export interface ShortcutConfig {
+  generalAssist: string;
   quickAsk: string;
   autocomplete: string;
 }
 
 const DEFAULTS: ShortcutConfig = {
+  generalAssist: 'CommandOrControl+Shift+S',
   quickAsk: 'CommandOrControl+Alt+S',
   autocomplete: 'CommandOrControl+Shift+Space',
 };
diff --git a/surfsense_desktop/src/modules/tray.ts b/surfsense_desktop/src/modules/tray.ts
new file mode 100644
index 000000000..1749145a1
--- /dev/null
+++ b/surfsense_desktop/src/modules/tray.ts
@@ -0,0 +1,77 @@
+import { app, globalShortcut, Menu, nativeImage, Tray } from 'electron';
+import path from 'path';
+import { getMainWindow, createMainWindow } from './window';
+import { getShortcuts } from './shortcuts';
+
+let tray: Tray | null = null;
+let currentShortcut: string | null = null;
+
+function getTrayIcon(): nativeImage {
+  const iconName = process.platform === 'win32' ? 'icon.ico' : 'icon.png';
+  const iconPath = app.isPackaged
+    ? path.join(process.resourcesPath, 'assets', iconName)
+    : path.join(__dirname, '..', 'assets', iconName);
+  const img = nativeImage.createFromPath(iconPath);
+  return img.resize({ width: 16, height: 16 });
+}
+
+function showMainWindow(): void {
+  let win = getMainWindow();
+  if (!win || win.isDestroyed()) {
+    win = createMainWindow('/dashboard');
+  } else {
+    win.show();
+    win.focus();
+  }
+}
+
+function registerShortcut(accelerator: string): void {
+  if (currentShortcut) {
+    globalShortcut.unregister(currentShortcut);
+    currentShortcut = null;
+  }
+  if (!accelerator) return;
+  try {
+    const ok = globalShortcut.register(accelerator, showMainWindow);
+    if (ok) {
+      currentShortcut = accelerator;
+    } else {
+      console.warn(`[tray] Failed to register General Assist shortcut: ${accelerator}`);
+    }
+  } catch (err) {
+    console.error(`[tray] Error registering General Assist shortcut:`, err);
+  }
+}
+
+export async function createTray(): Promise<void> {
+  if (tray) return;
+
+  tray = new Tray(getTrayIcon());
+  tray.setToolTip('SurfSense');
+
+  const contextMenu = Menu.buildFromTemplate([
+    { label: 'Open SurfSense', click: showMainWindow },
+    { type: 'separator' },
+    { label: 'Quit', click: () => { app.exit(0); } },
+  ]);
+
+  tray.setContextMenu(contextMenu);
+  tray.on('double-click', showMainWindow);
+
+  const shortcuts = await getShortcuts();
+  registerShortcut(shortcuts.generalAssist);
+}
+
+export async function reregisterGeneralAssist(): Promise<void> {
+  const shortcuts = await getShortcuts();
+  registerShortcut(shortcuts.generalAssist);
+}
+
+export function destroyTray(): void {
+  if (currentShortcut) {
+    globalShortcut.unregister(currentShortcut);
+    currentShortcut = null;
+  }
+  tray?.destroy();
+  tray = null;
+}
diff --git a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
index a2f9da0f8..eaf015740 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
@@ -1,12 +1,13 @@
 "use client";
 
-import { Clipboard, Sparkles } from "lucide-react";
+import { AppWindow, Clipboard, Sparkles } from "lucide-react";
 import { useCallback, useEffect, useState } from "react";
 import { toast } from "sonner";
 import { DEFAULT_SHORTCUTS, ShortcutRecorder } from "@/components/desktop/shortcut-recorder";
 import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
 import { Label } from "@/components/ui/label";
 import { Spinner } from "@/components/ui/spinner";
+import { Switch } from "@/components/ui/switch";
 import { useElectronAPI } from "@/hooks/use-platform";
 
 export function DesktopContent() {
@@ -68,7 +69,7 @@ export function DesktopContent() {
 		await api.setAutocompleteEnabled(checked);
 	};
 
-	const updateShortcut = (key: "quickAsk" | "autocomplete", accelerator: string) => {
+	const updateShortcut = (key: "generalAssist" | "quickAsk" | "autocomplete", accelerator: string) => {
 		setShortcuts((prev) => {
 			const updated = { ...prev, [key]: accelerator };
 			api.setShortcuts?.({ [key]: accelerator }).catch(() => {
@@ -79,7 +80,7 @@ export function DesktopContent() {
 		toast.success("Shortcut updated");
 	};
 
-	const resetShortcut = (key: "quickAsk" | "autocomplete") => {
+	const resetShortcut = (key: "generalAssist" | "quickAsk" | "autocomplete") => {
 		updateShortcut(key, DEFAULT_SHORTCUTS[key]);
 	};
 
@@ -95,23 +96,32 @@ export function DesktopContent() {
 				</CardHeader>
 				<CardContent className="px-3 md:px-6 pb-3 md:pb-6">
 					{shortcutsLoaded ? (
-						<div className="flex flex-col gap-3">
-							<ShortcutRecorder
-								value={shortcuts.quickAsk}
-								onChange={(accel) => updateShortcut("quickAsk", accel)}
-								onReset={() => resetShortcut("quickAsk")}
-								defaultValue={DEFAULT_SHORTCUTS.quickAsk}
-								label="Quick Ask"
+					<div className="flex flex-col gap-3">
+						<ShortcutRecorder
+							value={shortcuts.generalAssist}
+							onChange={(accel) => updateShortcut("generalAssist", accel)}
+							onReset={() => resetShortcut("generalAssist")}
+							defaultValue={DEFAULT_SHORTCUTS.generalAssist}
+							label="General Assist"
+							description="Open SurfSense from anywhere"
+							icon={AppWindow}
+						/>
+						<ShortcutRecorder
+							value={shortcuts.quickAsk}
+							onChange={(accel) => updateShortcut("quickAsk", accel)}
+							onReset={() => resetShortcut("quickAsk")}
+							defaultValue={DEFAULT_SHORTCUTS.quickAsk}
+								label="Quick Assist"
 								description="Copy selected text and ask AI about it"
-								icon={Clipboard}
-							/>
+							icon={Clipboard}
+						/>
 							<ShortcutRecorder
 								value={shortcuts.autocomplete}
 								onChange={(accel) => updateShortcut("autocomplete", accel)}
 								onReset={() => resetShortcut("autocomplete")}
 								defaultValue={DEFAULT_SHORTCUTS.autocomplete}
-								label="Autocomplete"
-								description="Get AI writing suggestions from a screenshot"
+								label="Extreme Assist"
+								description="AI writing powered by your screen and knowledge base"
 								icon={Sparkles}
 							/>
 							<p className="text-[11px] text-muted-foreground">
@@ -126,10 +136,10 @@ export function DesktopContent() {
 				</CardContent>
 			</Card>
 
-			{/* Autocomplete Toggle */}
+			{/* Extreme Assist Toggle */}
 			<Card>
 				<CardHeader className="px-3 md:px-6 pt-3 md:pt-6 pb-2 md:pb-3">
-					<CardTitle className="text-base md:text-lg">Autocomplete</CardTitle>
+					<CardTitle className="text-base md:text-lg">Extreme Assist</CardTitle>
 					<CardDescription className="text-xs md:text-sm">
 						Get inline writing suggestions powered by your knowledge base as you type in any app.
 					</CardDescription>
@@ -138,7 +148,7 @@ export function DesktopContent() {
 					<div className="flex items-center justify-between rounded-lg border p-4">
 						<div className="space-y-0.5">
 							<Label htmlFor="autocomplete-toggle" className="text-sm font-medium cursor-pointer">
-								Enable autocomplete
+								Enable Extreme Assist
 							</Label>
 							<p className="text-xs text-muted-foreground">
 								Show suggestions while typing in other applications.
diff --git a/surfsense_web/app/desktop/login/page.tsx b/surfsense_web/app/desktop/login/page.tsx
index c81e284ba..f442b5d26 100644
--- a/surfsense_web/app/desktop/login/page.tsx
+++ b/surfsense_web/app/desktop/login/page.tsx
@@ -2,7 +2,7 @@
 
 import { IconBrandGoogleFilled } from "@tabler/icons-react";
 import { useAtom } from "jotai";
-import { Clipboard, Eye, EyeOff, Keyboard, Sparkles } from "lucide-react";
+import { AppWindow, Clipboard, Eye, EyeOff, Keyboard, Sparkles } from "lucide-react";
 import Image from "next/image";
 import { useRouter } from "next/navigation";
 import { useCallback, useEffect, useState } from "react";
@@ -48,7 +48,7 @@ export default function DesktopLoginPage() {
 	}, [api]);
 
 	const updateShortcut = useCallback(
-		(key: "quickAsk" | "autocomplete", accelerator: string) => {
+		(key: "generalAssist" | "quickAsk" | "autocomplete", accelerator: string) => {
 			setShortcuts((prev) => {
 				const updated = { ...prev, [key]: accelerator };
 				api?.setShortcuts?.({ [key]: accelerator }).catch(() => {
@@ -62,7 +62,7 @@ export default function DesktopLoginPage() {
 	);
 
 	const resetShortcut = useCallback(
-		(key: "quickAsk" | "autocomplete") => {
+		(key: "generalAssist" | "quickAsk" | "autocomplete") => {
 			updateShortcut(key, DEFAULT_SHORTCUTS[key]);
 		},
 		[updateShortcut]
@@ -132,12 +132,21 @@ export default function DesktopLoginPage() {
 								<Keyboard className="size-3" />
 								Keyboard Shortcuts
 							</div>
+							<ShortcutRecorder
+								value={shortcuts.generalAssist}
+								onChange={(accel) => updateShortcut("generalAssist", accel)}
+								onReset={() => resetShortcut("generalAssist")}
+								defaultValue={DEFAULT_SHORTCUTS.generalAssist}
+								label="General Assist"
+								description="Open SurfSense from anywhere"
+								icon={AppWindow}
+							/>
 							<ShortcutRecorder
 								value={shortcuts.quickAsk}
 								onChange={(accel) => updateShortcut("quickAsk", accel)}
 								onReset={() => resetShortcut("quickAsk")}
 								defaultValue={DEFAULT_SHORTCUTS.quickAsk}
-								label="Quick Ask"
+								label="Quick Assist"
 								description="Copy selected text and ask AI about it"
 								icon={Clipboard}
 							/>
@@ -146,8 +155,8 @@ export default function DesktopLoginPage() {
 								onChange={(accel) => updateShortcut("autocomplete", accel)}
 								onReset={() => resetShortcut("autocomplete")}
 								defaultValue={DEFAULT_SHORTCUTS.autocomplete}
-								label="Autocomplete"
-								description="Get AI writing suggestions from a screenshot"
+								label="Extreme Assist"
+								description="AI writing powered by your screen and knowledge base"
 								icon={Sparkles}
 							/>
 							<p className="text-[11px] text-muted-foreground text-center">
diff --git a/surfsense_web/components/desktop/shortcut-recorder.tsx b/surfsense_web/components/desktop/shortcut-recorder.tsx
index 6d5e93a65..751579e50 100644
--- a/surfsense_web/components/desktop/shortcut-recorder.tsx
+++ b/surfsense_web/components/desktop/shortcut-recorder.tsx
@@ -36,6 +36,7 @@ export function acceleratorToDisplay(accel: string): string[] {
 }
 
 export const DEFAULT_SHORTCUTS = {
+	generalAssist: "CommandOrControl+Shift+S",
 	quickAsk: "CommandOrControl+Alt+S",
 	autocomplete: "CommandOrControl+Shift+Space",
 };
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 3f228066a..25077d1da 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -89,10 +89,10 @@ interface ElectronAPI {
 	getAuthTokens: () => Promise<{ bearer: string; refresh: string } | null>;
 	setAuthTokens: (bearer: string, refresh: string) => Promise<void>;
 	// Keyboard shortcut configuration
-	getShortcuts: () => Promise<{ quickAsk: string; autocomplete: string }>;
+	getShortcuts: () => Promise<{ generalAssist: string; quickAsk: string; autocomplete: string }>;
 	setShortcuts: (
-		config: Partial<{ quickAsk: string; autocomplete: string }>
-	) => Promise<{ quickAsk: string; autocomplete: string }>;
+		config: Partial<{ generalAssist: string; quickAsk: string; autocomplete: string }>
+	) => Promise<{ generalAssist: string; quickAsk: string; autocomplete: string }>;
 }
 
 declare global {

From b74ac8a608fe5b5ad1e0ac0e76fb2d98d71230aa Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 04:22:22 -0700
Subject: [PATCH 165/202] feat: update shortcut icons and descriptions for
 improved clarity

- Replaced icons for "General Assist," "Quick Assist," and "Extreme Assist" shortcuts to better represent their functionalities.
- Updated descriptions for each shortcut to enhance user understanding of their actions.
- Refactored the layout of the shortcut recorder for a more streamlined user experience.
---
 .../components/DesktopContent.tsx             |  30 +-
 surfsense_web/app/desktop/login/page.tsx      | 265 ++++++++++--------
 .../components/desktop/shortcut-recorder.tsx  |  44 +--
 3 files changed, 182 insertions(+), 157 deletions(-)

diff --git a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
index eaf015740..5ecea6708 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { AppWindow, Clipboard, Sparkles } from "lucide-react";
+import { BrainCog, Rocket, Zap } from "lucide-react";
 import { useCallback, useEffect, useState } from "react";
 import { toast } from "sonner";
 import { DEFAULT_SHORTCUTS, ShortcutRecorder } from "@/components/desktop/shortcut-recorder";
@@ -103,27 +103,27 @@ export function DesktopContent() {
 							onReset={() => resetShortcut("generalAssist")}
 							defaultValue={DEFAULT_SHORTCUTS.generalAssist}
 							label="General Assist"
-							description="Open SurfSense from anywhere"
-							icon={AppWindow}
+							description="Launch SurfSense instantly from any application"
+							icon={Rocket}
 						/>
 						<ShortcutRecorder
 							value={shortcuts.quickAsk}
 							onChange={(accel) => updateShortcut("quickAsk", accel)}
 							onReset={() => resetShortcut("quickAsk")}
 							defaultValue={DEFAULT_SHORTCUTS.quickAsk}
-								label="Quick Assist"
-								description="Copy selected text and ask AI about it"
-							icon={Clipboard}
+							label="Quick Assist"
+							description="Select text anywhere, then ask AI to explain, rewrite, or act on it"
+							icon={Zap}
+						/>
+						<ShortcutRecorder
+							value={shortcuts.autocomplete}
+							onChange={(accel) => updateShortcut("autocomplete", accel)}
+							onReset={() => resetShortcut("autocomplete")}
+							defaultValue={DEFAULT_SHORTCUTS.autocomplete}
+							label="Extreme Assist"
+							description="AI drafts text using your screen context and knowledge base"
+							icon={BrainCog}
 						/>
-							<ShortcutRecorder
-								value={shortcuts.autocomplete}
-								onChange={(accel) => updateShortcut("autocomplete", accel)}
-								onReset={() => resetShortcut("autocomplete")}
-								defaultValue={DEFAULT_SHORTCUTS.autocomplete}
-								label="Extreme Assist"
-								description="AI writing powered by your screen and knowledge base"
-								icon={Sparkles}
-							/>
 							<p className="text-[11px] text-muted-foreground">
 								Click a shortcut and press a new key combination to change it.
 							</p>
diff --git a/surfsense_web/app/desktop/login/page.tsx b/surfsense_web/app/desktop/login/page.tsx
index f442b5d26..5d931b5c2 100644
--- a/surfsense_web/app/desktop/login/page.tsx
+++ b/surfsense_web/app/desktop/login/page.tsx
@@ -2,7 +2,7 @@
 
 import { IconBrandGoogleFilled } from "@tabler/icons-react";
 import { useAtom } from "jotai";
-import { AppWindow, Clipboard, Eye, EyeOff, Keyboard, Sparkles } from "lucide-react";
+import { BrainCog, Eye, EyeOff, Rocket, Zap } from "lucide-react";
 import Image from "next/image";
 import { useRouter } from "next/navigation";
 import { useCallback, useEffect, useState } from "react";
@@ -10,7 +10,6 @@ import { toast } from "sonner";
 import { loginMutationAtom } from "@/atoms/auth/auth-mutation.atoms";
 import { DEFAULT_SHORTCUTS, ShortcutRecorder } from "@/components/desktop/shortcut-recorder";
 import { Button } from "@/components/ui/button";
-import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
 import { Input } from "@/components/ui/input";
 import { Label } from "@/components/ui/label";
 import { Separator } from "@/components/ui/separator";
@@ -100,8 +99,9 @@ export default function DesktopLoginPage() {
 	};
 
 	return (
-		<div className="relative flex min-h-screen items-center justify-center bg-background p-4">
-			<div className="pointer-events-none absolute inset-0 overflow-hidden">
+		<div className="relative flex min-h-svh items-center justify-center bg-background p-4 sm:p-6">
+			{/* Subtle radial glow */}
+			<div className="pointer-events-none fixed inset-0 overflow-hidden">
 				<div
 					className="absolute -top-1/2 left-1/2 size-[800px] -translate-x-1/2 rounded-full opacity-[0.03]"
 					style={{
@@ -110,134 +110,157 @@ export default function DesktopLoginPage() {
 				/>
 			</div>
 
-			<Card className="relative w-full max-w-md shadow-lg">
-				<CardHeader className="items-center text-center pb-4">
+			<div className="relative flex w-full max-w-md flex-col overflow-hidden rounded-xl border bg-card shadow-lg">
+				{/* Header */}
+				<div className="flex flex-col items-center px-6 pt-6 pb-2 text-center">
 					<Image
 						src="/icon-128.svg"
-						className="select-none dark:invert size-14 rounded-md mb-2"
+						className="select-none dark:invert size-12 rounded-lg mb-3"
 						alt="SurfSense"
-						width={56}
-						height={56}
+						width={48}
+						height={48}
 						priority
 					/>
-					<CardTitle className="text-xl">Welcome to SurfSense Desktop App</CardTitle>
-					<CardDescription>Configure your shortcuts, then sign in to get started.</CardDescription>
-				</CardHeader>
-
-				<CardContent className="flex flex-col gap-6">
-					{/* ---- Shortcuts Section (first) ---- */}
-					{shortcutsLoaded ? (
-						<div className="flex flex-col gap-3">
-							<div className="flex items-center gap-1.5 text-xs font-medium text-muted-foreground mb-1">
-								<Keyboard className="size-3" />
-								Keyboard Shortcuts
-							</div>
-							<ShortcutRecorder
-								value={shortcuts.generalAssist}
-								onChange={(accel) => updateShortcut("generalAssist", accel)}
-								onReset={() => resetShortcut("generalAssist")}
-								defaultValue={DEFAULT_SHORTCUTS.generalAssist}
-								label="General Assist"
-								description="Open SurfSense from anywhere"
-								icon={AppWindow}
-							/>
-							<ShortcutRecorder
-								value={shortcuts.quickAsk}
-								onChange={(accel) => updateShortcut("quickAsk", accel)}
-								onReset={() => resetShortcut("quickAsk")}
-								defaultValue={DEFAULT_SHORTCUTS.quickAsk}
-								label="Quick Assist"
-								description="Copy selected text and ask AI about it"
-								icon={Clipboard}
-							/>
-							<ShortcutRecorder
-								value={shortcuts.autocomplete}
-								onChange={(accel) => updateShortcut("autocomplete", accel)}
-								onReset={() => resetShortcut("autocomplete")}
-								defaultValue={DEFAULT_SHORTCUTS.autocomplete}
-								label="Extreme Assist"
-								description="AI writing powered by your screen and knowledge base"
-								icon={Sparkles}
-							/>
-							<p className="text-[11px] text-muted-foreground text-center">
-								Click a shortcut and press a new key combination to change it.
-							</p>
-						</div>
-					) : (
-						<div className="flex justify-center py-4">
-							<Spinner size="sm" />
-						</div>
-					)}
-
-					{/* ---- Divider ---- */}
-					<Separator />
-
-					{/* ---- Auth Section (second) ---- */}
-					{isGoogleAuth ? (
-						<Button variant="outline" className="w-full gap-2 py-5" onClick={handleGoogleLogin}>
-							<IconBrandGoogleFilled className="size-5" />
-							Continue with Google
-						</Button>
-					) : (
-						<form onSubmit={handleLocalLogin} className="flex flex-col gap-4">
-							{loginError && (
-								<div className="rounded-md border border-destructive/20 bg-destructive/10 px-3 py-2 text-sm text-destructive">
-									{loginError}
-								</div>
-							)}
+					<h1 className="text-lg font-semibold tracking-tight">
+						Welcome to SurfSense Desktop
+					</h1>
+					<p className="mt-1 text-sm text-muted-foreground">
+						Configure shortcuts, then sign in to get started.
+					</p>
+				</div>
 
+				{/* Scrollable content */}
+				<div className="flex-1 overflow-y-auto px-6 py-4">
+					<div className="flex flex-col gap-5">
+						{/* ---- Shortcuts ---- */}
+						{shortcutsLoaded ? (
 							<div className="flex flex-col gap-2">
-								<Label htmlFor="email">Email</Label>
-								<Input
-									id="email"
-									type="email"
-									placeholder="you@example.com"
-									required
-									value={email}
-									onChange={(e) => setEmail(e.target.value)}
-									disabled={isLoggingIn}
-									autoFocus
-								/>
-							</div>
-
-							<div className="flex flex-col gap-2">
-								<Label htmlFor="password">Password</Label>
-								<div className="relative">
-									<Input
-										id="password"
-										type={showPassword ? "text" : "password"}
-										placeholder="Enter your password"
-										required
-										value={password}
-										onChange={(e) => setPassword(e.target.value)}
-										disabled={isLoggingIn}
-										className="pr-10"
+								<p className="text-xs font-medium uppercase tracking-wider text-muted-foreground">
+									Keyboard Shortcuts
+								</p>
+								<div className="flex flex-col gap-1.5">
+									<ShortcutRecorder
+										value={shortcuts.generalAssist}
+										onChange={(accel) => updateShortcut("generalAssist", accel)}
+										onReset={() => resetShortcut("generalAssist")}
+										defaultValue={DEFAULT_SHORTCUTS.generalAssist}
+										label="General Assist"
+										description="Launch SurfSense instantly from any application"
+										icon={Rocket}
+									/>
+									<ShortcutRecorder
+										value={shortcuts.quickAsk}
+										onChange={(accel) => updateShortcut("quickAsk", accel)}
+										onReset={() => resetShortcut("quickAsk")}
+										defaultValue={DEFAULT_SHORTCUTS.quickAsk}
+										label="Quick Assist"
+										description="Select text anywhere, then ask AI to explain, rewrite, or act on it"
+										icon={Zap}
+									/>
+									<ShortcutRecorder
+										value={shortcuts.autocomplete}
+										onChange={(accel) => updateShortcut("autocomplete", accel)}
+										onReset={() => resetShortcut("autocomplete")}
+										defaultValue={DEFAULT_SHORTCUTS.autocomplete}
+										label="Extreme Assist"
+										description="AI drafts text using your screen context and knowledge base"
+										icon={BrainCog}
 									/>
-									<button
-										type="button"
-										onClick={() => setShowPassword((v) => !v)}
-										className="absolute inset-y-0 right-0 flex items-center pr-3 text-muted-foreground hover:text-foreground"
-										tabIndex={-1}
-									>
-										{showPassword ? <EyeOff className="size-4" /> : <Eye className="size-4" />}
-									</button>
 								</div>
+								<p className="text-[11px] text-muted-foreground text-center mt-1">
+									Click a shortcut and press a new key combination to change it.
+								</p>
 							</div>
+						) : (
+							<div className="flex justify-center py-6">
+								<Spinner size="sm" />
+							</div>
+						)}
 
-							<Button type="submit" disabled={isLoggingIn} className="mt-1">
-								{isLoggingIn ? (
-									<>
-										<Spinner size="sm" className="text-primary-foreground" />
-										Signing in...
-									</>
-								) : (
-									"Sign in"
-								)}
-							</Button>
-						</form>
-					)}
-				</CardContent>
-			</Card>
+						<Separator />
+
+						{/* ---- Auth ---- */}
+						<div className="flex flex-col gap-3">
+							<p className="text-xs font-medium uppercase tracking-wider text-muted-foreground">
+								Sign In
+							</p>
+
+							{isGoogleAuth ? (
+								<Button variant="outline" className="w-full gap-2 h-10" onClick={handleGoogleLogin}>
+									<IconBrandGoogleFilled className="size-4" />
+									Continue with Google
+								</Button>
+							) : (
+								<form onSubmit={handleLocalLogin} className="flex flex-col gap-3">
+									{loginError && (
+										<div className="rounded-md border border-destructive/20 bg-destructive/10 px-3 py-2 text-sm text-destructive">
+											{loginError}
+										</div>
+									)}
+
+									<div className="flex flex-col gap-1.5">
+										<Label htmlFor="email" className="text-xs">
+											Email
+										</Label>
+										<Input
+											id="email"
+											type="email"
+											placeholder="you@example.com"
+											required
+											value={email}
+											onChange={(e) => setEmail(e.target.value)}
+											disabled={isLoggingIn}
+											autoFocus
+											className="h-9"
+										/>
+									</div>
+
+									<div className="flex flex-col gap-1.5">
+										<Label htmlFor="password" className="text-xs">
+											Password
+										</Label>
+										<div className="relative">
+											<Input
+												id="password"
+												type={showPassword ? "text" : "password"}
+												placeholder="Enter your password"
+												required
+												value={password}
+												onChange={(e) => setPassword(e.target.value)}
+												disabled={isLoggingIn}
+												className="h-9 pr-9"
+											/>
+											<button
+												type="button"
+												onClick={() => setShowPassword((v) => !v)}
+												className="absolute inset-y-0 right-0 flex items-center pr-2.5 text-muted-foreground hover:text-foreground"
+												tabIndex={-1}
+											>
+												{showPassword ? (
+													<EyeOff className="size-3.5" />
+												) : (
+													<Eye className="size-3.5" />
+												)}
+											</button>
+										</div>
+									</div>
+
+									<Button type="submit" disabled={isLoggingIn} className="h-9 mt-1">
+										{isLoggingIn ? (
+											<>
+												<Spinner size="sm" className="text-primary-foreground" />
+												Signing in…
+											</>
+										) : (
+											"Sign in"
+										)}
+									</Button>
+								</form>
+							)}
+						</div>
+					</div>
+				</div>
+			</div>
 		</div>
 	);
 }
diff --git a/surfsense_web/components/desktop/shortcut-recorder.tsx b/surfsense_web/components/desktop/shortcut-recorder.tsx
index 751579e50..ec4e5a528 100644
--- a/surfsense_web/components/desktop/shortcut-recorder.tsx
+++ b/surfsense_web/components/desktop/shortcut-recorder.tsx
@@ -6,7 +6,7 @@ import { Button } from "@/components/ui/button";
 import { cn } from "@/lib/utils";
 
 // ---------------------------------------------------------------------------
-// Accelerator ↔ display helpers
+// Accelerator <-> display helpers
 // ---------------------------------------------------------------------------
 
 export function keyEventToAccelerator(e: React.KeyboardEvent): string | null {
@@ -47,13 +47,13 @@ export const DEFAULT_SHORTCUTS = {
 
 export function Kbd({ keys, className }: { keys: string[]; className?: string }) {
 	return (
-		<span className={cn("inline-flex items-center gap-1", className)}>
-			{keys.map((key) => (
+		<span className={cn("inline-flex items-center gap-0.5", className)}>
+			{keys.map((key, i) => (
 				<kbd
-					key={key}
+					key={`${key}-${i}`}
 					className={cn(
-						"inline-flex h-7 min-w-7 items-center justify-center rounded-md border bg-muted px-1.5 font-mono text-xs font-medium text-muted-foreground shadow-sm",
-						key.length > 3 && "px-2"
+						"inline-flex h-6 min-w-6 items-center justify-center rounded border bg-muted px-1 font-mono text-[11px] font-medium text-muted-foreground",
+						key.length > 3 && "px-1.5"
 					)}
 				>
 					{key}
@@ -111,27 +111,29 @@ export function ShortcutRecorder({
 	const isDefault = value === defaultValue;
 
 	return (
-		<div className="flex items-center justify-between gap-4 rounded-lg border bg-background p-3">
-			<div className="flex items-center gap-3 min-w-0">
-				<div className="flex size-9 shrink-0 items-center justify-center rounded-md bg-primary/10 text-primary">
-					<Icon className="size-4" />
-				</div>
-				<div className="min-w-0">
-					<p className="text-sm font-medium leading-none">{label}</p>
-					<p className="mt-1 text-xs text-muted-foreground truncate">{description}</p>
-				</div>
+		<div className="group flex items-center gap-3 rounded-lg border border-border/60 bg-card px-3 py-2.5 transition-colors hover:border-border">
+			{/* Icon */}
+			<div className="flex size-8 shrink-0 items-center justify-center rounded-md bg-primary/10 text-primary">
+				<Icon className="size-4" />
 			</div>
 
-			<div className="flex items-center gap-2 shrink-0">
+			{/* Label + description */}
+			<div className="min-w-0 flex-1">
+				<p className="text-[13px] font-medium leading-none">{label}</p>
+				<p className="mt-1 text-[11px] leading-snug text-muted-foreground">{description}</p>
+			</div>
+
+			{/* Actions */}
+			<div className="flex shrink-0 items-center gap-1">
 				{!isDefault && (
 					<Button
 						variant="ghost"
 						size="icon"
-						className="size-7"
+						className="size-6 opacity-0 group-hover:opacity-100 transition-opacity"
 						onClick={onReset}
 						title="Reset to default"
 					>
-						<RotateCcw />
+						<RotateCcw className="size-3" />
 					</Button>
 				)}
 				<button
@@ -141,14 +143,14 @@ export function ShortcutRecorder({
 					onKeyDown={handleKeyDown}
 					onBlur={() => setRecording(false)}
 					className={cn(
-						"flex h-9 items-center gap-1 rounded-md border px-3 text-sm transition-all focus:outline-none",
+						"flex h-7 items-center gap-0.5 rounded-md border px-2 transition-all focus:outline-none",
 						recording
 							? "border-primary bg-primary/5 ring-2 ring-primary/20"
-							: "border-input bg-muted/50 hover:bg-muted"
+							: "border-input bg-muted/40 hover:bg-muted"
 					)}
 				>
 					{recording ? (
-						<span className="text-xs text-primary animate-pulse">Press keys...</span>
+						<span className="text-[11px] text-primary animate-pulse whitespace-nowrap">Press keys…</span>
 					) : (
 						<Kbd keys={displayKeys} />
 					)}

From 7c6e52a0a50e4ec8fe0a920f4d37e0df2eae539b Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 04:45:48 -0700
Subject: [PATCH 166/202] feat: add active search space management to Electron
 API and UI

- Introduced IPC channels for getting and setting the active search space, enhancing user experience across the application.
- Updated the preload script to expose new API methods for active search space management.
- Modified the main window to sync the active search space from URL navigation, and updated quick ask and autocomplete to read it from the shared store.
- Enhanced the desktop and web applications to allow users to select and manage their default search space seamlessly.
- Implemented automatic synchronization of the active search space during login and navigation events.
---
 surfsense_desktop/src/ipc/channels.ts         |  3 +
 surfsense_desktop/src/ipc/handlers.ts         |  7 ++
 .../src/modules/active-search-space.ts        | 24 ++++++
 .../src/modules/autocomplete/index.ts         | 19 +----
 surfsense_desktop/src/modules/quick-ask.ts    |  9 +-
 surfsense_desktop/src/modules/window.ts       | 11 +++
 surfsense_desktop/src/preload.ts              |  5 ++
 .../[search_space_id]/client-layout.tsx       | 14 ++-
 .../components/DesktopContent.tsx             | 53 +++++++++++-
 surfsense_web/app/desktop/login/page.tsx      | 18 ++++
 surfsense_web/components/TokenHandler.tsx     | 85 ++++++++++---------
 surfsense_web/types/window.d.ts               |  3 +
 12 files changed, 189 insertions(+), 62 deletions(-)
 create mode 100644 surfsense_desktop/src/modules/active-search-space.ts

diff --git a/surfsense_desktop/src/ipc/channels.ts b/surfsense_desktop/src/ipc/channels.ts
index 8051703fb..39e75f046 100644
--- a/surfsense_desktop/src/ipc/channels.ts
+++ b/surfsense_desktop/src/ipc/channels.ts
@@ -38,4 +38,7 @@ export const IPC_CHANNELS = {
   // Keyboard shortcut configuration
   GET_SHORTCUTS: 'shortcuts:get',
   SET_SHORTCUTS: 'shortcuts:set',
+  // Active search space
+  GET_ACTIVE_SEARCH_SPACE: 'search-space:get-active',
+  SET_ACTIVE_SEARCH_SPACE: 'search-space:set-active',
 } as const;
diff --git a/surfsense_desktop/src/ipc/handlers.ts b/surfsense_desktop/src/ipc/handlers.ts
index a583e5afc..200fa75bd 100644
--- a/surfsense_desktop/src/ipc/handlers.ts
+++ b/surfsense_desktop/src/ipc/handlers.ts
@@ -21,6 +21,7 @@ import {
   readLocalFiles,
 } from '../modules/folder-watcher';
 import { getShortcuts, setShortcuts, type ShortcutConfig } from '../modules/shortcuts';
+import { getActiveSearchSpaceId, setActiveSearchSpaceId } from '../modules/active-search-space';
 import { reregisterQuickAsk } from '../modules/quick-ask';
 import { reregisterAutocomplete } from '../modules/autocomplete';
 import { reregisterGeneralAssist } from '../modules/tray';
@@ -106,6 +107,12 @@ export function registerIpcHandlers(): void {
 
   ipcMain.handle(IPC_CHANNELS.GET_SHORTCUTS, () => getShortcuts());
 
+  ipcMain.handle(IPC_CHANNELS.GET_ACTIVE_SEARCH_SPACE, () => getActiveSearchSpaceId());
+
+  ipcMain.handle(IPC_CHANNELS.SET_ACTIVE_SEARCH_SPACE, (_event, id: string) =>
+    setActiveSearchSpaceId(id)
+  );
+
   ipcMain.handle(IPC_CHANNELS.SET_SHORTCUTS, async (_event, config: Partial<ShortcutConfig>) => {
     const updated = await setShortcuts(config);
     if (config.generalAssist) await reregisterGeneralAssist();
diff --git a/surfsense_desktop/src/modules/active-search-space.ts b/surfsense_desktop/src/modules/active-search-space.ts
new file mode 100644
index 000000000..e5f55c8f4
--- /dev/null
+++ b/surfsense_desktop/src/modules/active-search-space.ts
@@ -0,0 +1,24 @@
+const STORE_KEY = 'activeSearchSpaceId';
+// eslint-disable-next-line @typescript-eslint/no-explicit-any
+let store: any = null;
+
+async function getStore() {
+  if (!store) {
+    const { default: Store } = await import('electron-store');
+    store = new Store({
+      name: 'active-search-space',
+      defaults: { [STORE_KEY]: null as string | null },
+    });
+  }
+  return store;
+}
+
+export async function getActiveSearchSpaceId(): Promise<string | null> {
+  const s = await getStore();
+  return (s.get(STORE_KEY) as string | null) ?? null;
+}
+
+export async function setActiveSearchSpaceId(id: string): Promise<void> {
+  const s = await getStore();
+  s.set(STORE_KEY, id);
+}
diff --git a/surfsense_desktop/src/modules/autocomplete/index.ts b/surfsense_desktop/src/modules/autocomplete/index.ts
index 1b64396b0..cb09a42e1 100644
--- a/surfsense_desktop/src/modules/autocomplete/index.ts
+++ b/surfsense_desktop/src/modules/autocomplete/index.ts
@@ -2,16 +2,15 @@ import { clipboard, globalShortcut, ipcMain, screen } from 'electron';
 import { IPC_CHANNELS } from '../../ipc/channels';
 import { getFrontmostApp, getWindowTitle, hasAccessibilityPermission, simulatePaste } from '../platform';
 import { hasScreenRecordingPermission, requestAccessibility, requestScreenRecording } from '../permissions';
-import { getMainWindow } from '../window';
 import { captureScreen } from './screenshot';
 import { createSuggestionWindow, destroySuggestion, getSuggestionWindow } from './suggestion-window';
 import { getShortcuts } from '../shortcuts';
+import { getActiveSearchSpaceId } from '../active-search-space';
 
 let currentShortcut = '';
 let autocompleteEnabled = true;
 let savedClipboard = '';
 let sourceApp = '';
-let lastSearchSpaceId: string | null = null;
 
 function isSurfSenseWindow(): boolean {
   const app = getFrontmostApp();
@@ -37,21 +36,11 @@ async function triggerAutocomplete(): Promise<void> {
     return;
   }
 
-  const mainWin = getMainWindow();
-  if (mainWin && !mainWin.isDestroyed()) {
-    const mainUrl = mainWin.webContents.getURL();
-    const match = mainUrl.match(/\/dashboard\/(\d+)/);
-    if (match) {
-      lastSearchSpaceId = match[1];
-    }
-  }
-
-  if (!lastSearchSpaceId) {
-    console.warn('[autocomplete] No active search space. Open a search space first.');
+  const searchSpaceId = await getActiveSearchSpaceId();
+  if (!searchSpaceId) {
+    console.warn('[autocomplete] No active search space. Select a search space first.');
     return;
   }
-
-  const searchSpaceId = lastSearchSpaceId;
   const cursor = screen.getCursorScreenPoint();
   const win = createSuggestionWindow(cursor.x, cursor.y);
 
diff --git a/surfsense_desktop/src/modules/quick-ask.ts b/surfsense_desktop/src/modules/quick-ask.ts
index 224444be6..d5a2a9c2e 100644
--- a/surfsense_desktop/src/modules/quick-ask.ts
+++ b/surfsense_desktop/src/modules/quick-ask.ts
@@ -4,11 +4,13 @@ import { IPC_CHANNELS } from '../ipc/channels';
 import { checkAccessibilityPermission, getFrontmostApp, simulateCopy, simulatePaste } from './platform';
 import { getServerPort } from './server';
 import { getShortcuts } from './shortcuts';
+import { getActiveSearchSpaceId } from './active-search-space';
 
 let currentShortcut = '';
 let quickAskWindow: BrowserWindow | null = null;
 let pendingText = '';
 let pendingMode = '';
+let pendingSearchSpaceId: string | null = null;
 let sourceApp = '';
 let savedClipboard = '';
 
@@ -53,7 +55,9 @@ function createQuickAskWindow(x: number, y: number): BrowserWindow {
     skipTaskbar: true,
   });
 
-  quickAskWindow.loadURL(`http://localhost:${getServerPort()}/dashboard`);
+  const spaceId = pendingSearchSpaceId;
+  const route = spaceId ? `/dashboard/${spaceId}/new-chat` : '/dashboard';
+  quickAskWindow.loadURL(`http://localhost:${getServerPort()}${route}`);
 
   quickAskWindow.once('ready-to-show', () => {
     quickAskWindow?.show();
@@ -78,8 +82,9 @@ function createQuickAskWindow(x: number, y: number): BrowserWindow {
   return quickAskWindow;
 }
 
-function openQuickAsk(text: string): void {
+async function openQuickAsk(text: string): Promise<void> {
   pendingText = text;
+  pendingSearchSpaceId = await getActiveSearchSpaceId();
   const cursor = screen.getCursorScreenPoint();
   const pos = clampToScreen(cursor.x, cursor.y, 450, 750);
   createQuickAskWindow(pos.x, pos.y);
diff --git a/surfsense_desktop/src/modules/window.ts b/surfsense_desktop/src/modules/window.ts
index 7a77773d8..9cd216501 100644
--- a/surfsense_desktop/src/modules/window.ts
+++ b/surfsense_desktop/src/modules/window.ts
@@ -2,6 +2,7 @@ import { app, BrowserWindow, shell, session } from 'electron';
 import path from 'path';
 import { showErrorDialog } from './errors';
 import { getServerPort } from './server';
+import { setActiveSearchSpaceId } from './active-search-space';
 
 const isDev = !app.isPackaged;
 const HOSTED_FRONTEND_URL = process.env.HOSTED_FRONTEND_URL as string;
@@ -55,6 +56,16 @@ export function createMainWindow(initialPath = '/dashboard'): BrowserWindow {
     showErrorDialog('Page failed to load', new Error(`${errorDescription} (${errorCode})\n${validatedURL}`));
   });
 
+  // Auto-sync active search space from URL navigation
+  const syncSearchSpace = (url: string) => {
+    const match = url.match(/\/dashboard\/(\d+)/);
+    if (match) {
+      setActiveSearchSpaceId(match[1]);
+    }
+  };
+  mainWindow.webContents.on('did-navigate', (_event, url) => syncSearchSpace(url));
+  mainWindow.webContents.on('did-navigate-in-page', (_event, url) => syncSearchSpace(url));
+
   if (isDev) {
     mainWindow.webContents.openDevTools();
   }
diff --git a/surfsense_desktop/src/preload.ts b/surfsense_desktop/src/preload.ts
index 58ddd745e..4d9537c91 100644
--- a/surfsense_desktop/src/preload.ts
+++ b/surfsense_desktop/src/preload.ts
@@ -78,4 +78,9 @@ contextBridge.exposeInMainWorld('electronAPI', {
   getShortcuts: () => ipcRenderer.invoke(IPC_CHANNELS.GET_SHORTCUTS),
   setShortcuts: (config: Record<string, string>) =>
     ipcRenderer.invoke(IPC_CHANNELS.SET_SHORTCUTS, config),
+
+  // Active search space
+  getActiveSearchSpace: () => ipcRenderer.invoke(IPC_CHANNELS.GET_ACTIVE_SEARCH_SPACE),
+  setActiveSearchSpace: (id: string) =>
+    ipcRenderer.invoke(IPC_CHANNELS.SET_ACTIVE_SEARCH_SPACE, id),
 });
diff --git a/surfsense_web/app/dashboard/[search_space_id]/client-layout.tsx b/surfsense_web/app/dashboard/[search_space_id]/client-layout.tsx
index 60b8aef12..16af9ac6b 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/client-layout.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/client-layout.tsx
@@ -19,6 +19,7 @@ import { OnboardingTour } from "@/components/onboarding-tour";
 import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
 import { useFolderSync } from "@/hooks/use-folder-sync";
 import { useGlobalLoadingEffect } from "@/hooks/use-global-loading";
+import { useElectronAPI } from "@/hooks/use-platform";
 
 export function DashboardClientLayout({
 	children,
@@ -139,6 +140,8 @@ export function DashboardClientLayout({
 		refetchPreferences,
 	]);
 
+	const electronAPI = useElectronAPI();
+
 	useEffect(() => {
 		const activeSeacrhSpaceId =
 			typeof search_space_id === "string"
@@ -148,7 +151,16 @@ export function DashboardClientLayout({
 					: "";
 		if (!activeSeacrhSpaceId) return;
 		setActiveSearchSpaceIdState(activeSeacrhSpaceId);
-	}, [search_space_id, setActiveSearchSpaceIdState]);
+
+		// Sync to Electron store if stored value is null (first navigation)
+		if (electronAPI?.setActiveSearchSpace) {
+			electronAPI.getActiveSearchSpace?.().then((stored) => {
+				if (!stored) {
+					electronAPI.setActiveSearchSpace!(activeSeacrhSpaceId);
+				}
+			}).catch(() => {});
+		}
+	}, [search_space_id, setActiveSearchSpaceIdState, electronAPI]);
 
 	// Determine if we should show loading
 	const shouldShowLoading =
diff --git a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
index 5ecea6708..596ed3e8b 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
@@ -1,14 +1,17 @@
 "use client";
 
 import { BrainCog, Rocket, Zap } from "lucide-react";
-import { useCallback, useEffect, useState } from "react";
+import { useEffect, useState } from "react";
 import { toast } from "sonner";
 import { DEFAULT_SHORTCUTS, ShortcutRecorder } from "@/components/desktop/shortcut-recorder";
 import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
 import { Label } from "@/components/ui/label";
+import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue } from "@/components/ui/select";
 import { Spinner } from "@/components/ui/spinner";
 import { Switch } from "@/components/ui/switch";
 import { useElectronAPI } from "@/hooks/use-platform";
+import { searchSpacesApiService } from "@/lib/apis/search-spaces-api.service";
+import type { SearchSpace } from "@/contracts/types/search-space.types";
 
 export function DesktopContent() {
 	const api = useElectronAPI();
@@ -18,6 +21,9 @@ export function DesktopContent() {
 	const [shortcuts, setShortcuts] = useState(DEFAULT_SHORTCUTS);
 	const [shortcutsLoaded, setShortcutsLoaded] = useState(false);
 
+	const [searchSpaces, setSearchSpaces] = useState<SearchSpace[]>([]);
+	const [activeSpaceId, setActiveSpaceId] = useState<string | null>(null);
+
 	useEffect(() => {
 		if (!api) {
 			setLoading(false);
@@ -27,11 +33,18 @@ export function DesktopContent() {
 
 		let mounted = true;
 
-		Promise.all([api.getAutocompleteEnabled(), api.getShortcuts?.() ?? Promise.resolve(null)])
-			.then(([autoEnabled, config]) => {
+		Promise.all([
+			api.getAutocompleteEnabled(),
+			api.getShortcuts?.() ?? Promise.resolve(null),
+			api.getActiveSearchSpace?.() ?? Promise.resolve(null),
+			searchSpacesApiService.getSearchSpaces(),
+		])
+			.then(([autoEnabled, config, spaceId, spaces]) => {
 				if (!mounted) return;
 				setEnabled(autoEnabled);
 				if (config) setShortcuts(config);
+				setActiveSpaceId(spaceId);
+				if (spaces) setSearchSpaces(spaces);
 				setLoading(false);
 				setShortcutsLoaded(true);
 			})
@@ -84,8 +97,42 @@ export function DesktopContent() {
 		updateShortcut(key, DEFAULT_SHORTCUTS[key]);
 	};
 
+	const handleSearchSpaceChange = (value: string) => {
+		setActiveSpaceId(value);
+		api.setActiveSearchSpace?.(value);
+		toast.success("Default search space updated");
+	};
+
 	return (
 		<div className="space-y-4 md:space-y-6">
+			{/* Default Search Space */}
+			<Card>
+				<CardHeader className="px-3 md:px-6 pt-3 md:pt-6 pb-2 md:pb-3">
+					<CardTitle className="text-base md:text-lg">Default Search Space</CardTitle>
+					<CardDescription className="text-xs md:text-sm">
+						Choose which search space General Assist, Quick Assist, and Extreme Assist operate against.
+					</CardDescription>
+				</CardHeader>
+				<CardContent className="px-3 md:px-6 pb-3 md:pb-6">
+					{searchSpaces.length > 0 ? (
+						<Select value={activeSpaceId ?? undefined} onValueChange={handleSearchSpaceChange}>
+							<SelectTrigger className="w-full">
+								<SelectValue placeholder="Select a search space" />
+							</SelectTrigger>
+							<SelectContent>
+								{searchSpaces.map((space) => (
+									<SelectItem key={space.id} value={String(space.id)}>
+										{space.name}
+									</SelectItem>
+								))}
+							</SelectContent>
+						</Select>
+					) : (
+						<p className="text-sm text-muted-foreground">No search spaces found. Create one first.</p>
+					)}
+				</CardContent>
+			</Card>
+
 			{/* Keyboard Shortcuts */}
 			<Card>
 				<CardHeader className="px-3 md:px-6 pt-3 md:pt-6 pb-2 md:pb-3">
diff --git a/surfsense_web/app/desktop/login/page.tsx b/surfsense_web/app/desktop/login/page.tsx
index 5d931b5c2..744680010 100644
--- a/surfsense_web/app/desktop/login/page.tsx
+++ b/surfsense_web/app/desktop/login/page.tsx
@@ -15,6 +15,8 @@ import { Label } from "@/components/ui/label";
 import { Separator } from "@/components/ui/separator";
 import { Spinner } from "@/components/ui/spinner";
 import { useElectronAPI } from "@/hooks/use-platform";
+import { searchSpacesApiService } from "@/lib/apis/search-spaces-api.service";
+import { setBearerToken } from "@/lib/auth-utils";
 import { AUTH_TYPE, BACKEND_URL } from "@/lib/env-config";
 
 const isGoogleAuth = AUTH_TYPE === "GOOGLE";
@@ -71,6 +73,19 @@ export default function DesktopLoginPage() {
 		window.location.href = `${BACKEND_URL}/auth/google/authorize-redirect`;
 	};
 
+	const autoSetSearchSpace = async () => {
+		try {
+			const stored = await api?.getActiveSearchSpace?.();
+			if (stored) return;
+			const spaces = await searchSpacesApiService.getSearchSpaces();
+			if (spaces?.length) {
+				await api?.setActiveSearchSpace?.(String(spaces[0].id));
+			}
+		} catch {
+			// non-critical — dashboard-sync will catch it later
+		}
+	};
+
 	const handleLocalLogin = async (e: React.FormEvent) => {
 		e.preventDefault();
 		setLoginError(null);
@@ -86,6 +101,9 @@ export default function DesktopLoginPage() {
 				sessionStorage.setItem("login_success_tracked", "true");
 			}
 
+			setBearerToken(data.access_token);
+			await autoSetSearchSpace();
+
 			setTimeout(() => {
 				router.push(`/auth/callback?token=${data.access_token}`);
 			}, 300);
diff --git a/surfsense_web/components/TokenHandler.tsx b/surfsense_web/components/TokenHandler.tsx
index 02a7089d9..cd585f0ca 100644
--- a/surfsense_web/components/TokenHandler.tsx
+++ b/surfsense_web/components/TokenHandler.tsx
@@ -3,6 +3,7 @@
 import { useEffect } from "react";
 import { useGlobalLoadingEffect } from "@/hooks/use-global-loading";
 import { getAndClearRedirectPath, setBearerToken, setRefreshToken } from "@/lib/auth-utils";
+import { searchSpacesApiService } from "@/lib/apis/search-spaces-api.service";
 import { trackLoginSuccess } from "@/lib/posthog/events";
 
 interface TokenHandlerProps {
@@ -29,52 +30,54 @@ const TokenHandler = ({
 	useGlobalLoadingEffect(true);
 
 	useEffect(() => {
-		// Only run on client-side
 		if (typeof window === "undefined") return;
 
-		// Read tokens from URL at mount time — no subscription needed.
-		// TokenHandler only runs once after an auth redirect, so a stale read
-		// is impossible and useSearchParams() would add a pointless subscription.
-		// (Vercel Best Practice: rerender-defer-reads 5.2)
-		const params = new URLSearchParams(window.location.search);
-		const token = params.get(tokenParamName);
-		const refreshToken = params.get("refresh_token");
+		const run = async () => {
+			const params = new URLSearchParams(window.location.search);
+			const token = params.get(tokenParamName);
+			const refreshToken = params.get("refresh_token");
 
-		if (token) {
-			try {
-				// Track login success for OAuth flows (e.g., Google)
-				// Local login already tracks success before redirecting here
-				const alreadyTracked = sessionStorage.getItem("login_success_tracked");
-				if (!alreadyTracked) {
-					// This is an OAuth flow (Google login) - track success
-					trackLoginSuccess("google");
+			if (token) {
+				try {
+					const alreadyTracked = sessionStorage.getItem("login_success_tracked");
+					if (!alreadyTracked) {
+						trackLoginSuccess("google");
+					}
+					sessionStorage.removeItem("login_success_tracked");
+
+					localStorage.setItem(storageKey, token);
+					setBearerToken(token);
+
+					if (refreshToken) {
+						setRefreshToken(refreshToken);
+					}
+
+					// Auto-set active search space in desktop if not already set
+					if (window.electronAPI?.getActiveSearchSpace) {
+						try {
+							const stored = await window.electronAPI.getActiveSearchSpace();
+							if (!stored) {
+								const spaces = await searchSpacesApiService.getSearchSpaces();
+								if (spaces?.length) {
+									await window.electronAPI.setActiveSearchSpace?.(String(spaces[0].id));
+								}
+							}
+						} catch {
+							// non-critical
+						}
+					}
+
+					const savedRedirectPath = getAndClearRedirectPath();
+					const finalRedirectPath = savedRedirectPath || redirectPath;
+					window.location.href = finalRedirectPath;
+				} catch (error) {
+					console.error("Error storing token in localStorage:", error);
+					window.location.href = redirectPath;
 				}
-				// Clear the flag for future logins
-				sessionStorage.removeItem("login_success_tracked");
-
-				// Store access token in localStorage using both methods for compatibility
-				localStorage.setItem(storageKey, token);
-				setBearerToken(token);
-
-				// Store refresh token if provided
-				if (refreshToken) {
-					setRefreshToken(refreshToken);
-				}
-
-				// Check if there's a saved redirect path from before the auth flow
-				const savedRedirectPath = getAndClearRedirectPath();
-
-				// Use the saved path if available, otherwise use the default redirectPath
-				const finalRedirectPath = savedRedirectPath || redirectPath;
-
-				// Redirect to the appropriate path
-				window.location.href = finalRedirectPath;
-			} catch (error) {
-				console.error("Error storing token in localStorage:", error);
-				// Even if there's an error, try to redirect to the default path
-				window.location.href = redirectPath;
 			}
-		}
+		};
+
+		run();
 	}, [tokenParamName, storageKey, redirectPath]);
 
 	// Return null - the global provider handles the loading UI
diff --git a/surfsense_web/types/window.d.ts b/surfsense_web/types/window.d.ts
index 25077d1da..eeef51b0b 100644
--- a/surfsense_web/types/window.d.ts
+++ b/surfsense_web/types/window.d.ts
@@ -93,6 +93,9 @@ interface ElectronAPI {
 	setShortcuts: (
 		config: Partial<{ generalAssist: string; quickAsk: string; autocomplete: string }>
 	) => Promise<{ generalAssist: string; quickAsk: string; autocomplete: string }>;
+	// Active search space
+	getActiveSearchSpace: () => Promise<string | null>;
+	setActiveSearchSpace: (id: string) => Promise<void>;
 }
 
 declare global {

From 518cacf56e245463be9ed0f1d96aef8aa8d56a26 Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 05:03:20 -0700
Subject: [PATCH 167/202] refactor: improve AssistantActionBar functionality
 and UI elements

- Removed the quick ask mode state and effect that gated the transform-only paste button, simplifying the component logic.
- Updated tooltip descriptions for action buttons to provide clearer user guidance.
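- Replaced the transform-only "Paste back" text button with a tooltip icon button that is rendered whenever the Electron API exposes `replaceText` and `getQuickAskMode`, improving user interaction with the paste-back functionality.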
---
 .../assistant-ui/assistant-message.tsx        | 28 ++++++-------------
 1 file changed, 9 insertions(+), 19 deletions(-)

diff --git a/surfsense_web/components/assistant-ui/assistant-message.tsx b/surfsense_web/components/assistant-ui/assistant-message.tsx
index d0cada0bd..5567cfca8 100644
--- a/surfsense_web/components/assistant-ui/assistant-message.tsx
+++ b/surfsense_web/components/assistant-ui/assistant-message.tsx
@@ -465,16 +465,8 @@ const AssistantActionBar: FC = () => {
 	const isLast = useAuiState((s) => s.message.isLast);
 	const aui = useAui();
 	const api = useElectronAPI();
-	const [quickAskMode, setQuickAskMode] = useState("");
 
-	useEffect(() => {
-		if (!isLast || !api?.getQuickAskMode) return;
-		api.getQuickAskMode().then((mode) => {
-			if (mode) setQuickAskMode(mode);
-		});
-	}, [isLast, api]);
-
-	const isTransform = isLast && !!api?.replaceText && quickAskMode === "transform";
+	const isQuickAssist = !!api?.replaceText && !!api?.getQuickAskMode;
 
 	return (
 		<ActionBarPrimitive.Root
@@ -484,7 +476,7 @@ const AssistantActionBar: FC = () => {
 			className="aui-assistant-action-bar-root -ml-1 col-start-3 row-start-2 flex gap-1 text-muted-foreground md:data-floating:absolute md:data-floating:rounded-md md:data-floating:p-1 [&>button]:opacity-100 md:[&>button]:opacity-[var(--aui-button-opacity,1)]"
 		>
 			<ActionBarPrimitive.Copy asChild>
-				<TooltipIconButton tooltip="Copy">
+				<TooltipIconButton tooltip="Copy to clipboard">
 					<AuiIf condition={({ message }) => message.isCopied}>
 						<CheckIcon />
 					</AuiIf>
@@ -494,29 +486,27 @@ const AssistantActionBar: FC = () => {
 				</TooltipIconButton>
 			</ActionBarPrimitive.Copy>
 			<ActionBarPrimitive.ExportMarkdown asChild>
-				<TooltipIconButton tooltip="Download">
+				<TooltipIconButton tooltip="Download as Markdown">
 					<DownloadIcon />
 				</TooltipIconButton>
 			</ActionBarPrimitive.ExportMarkdown>
 			{isLast && (
 				<ActionBarPrimitive.Reload asChild>
-					<TooltipIconButton tooltip="Refresh">
+					<TooltipIconButton tooltip="Regenerate response">
 						<RefreshCwIcon />
 					</TooltipIconButton>
 				</ActionBarPrimitive.Reload>
 			)}
-			{isTransform && (
-				<button
-					type="button"
+			{isQuickAssist && (
+				<TooltipIconButton
+					tooltip="Paste back into source app"
 					onClick={() => {
 						const text = aui.message().getCopyText();
 						api?.replaceText(text);
 					}}
-					className="ml-1 inline-flex items-center gap-1.5 rounded-md bg-primary px-3 py-1.5 text-xs font-medium text-primary-foreground transition-colors hover:bg-primary/90"
 				>
-					<ClipboardPaste className="size-3.5" />
-					Paste back
-				</button>
+					<ClipboardPaste />
+				</TooltipIconButton>
 			)}
 		</ActionBarPrimitive.Root>
 	);

From 80f775581bd44dd980c1d75cdbc125dcc7b41f56 Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 05:11:41 -0700
Subject: [PATCH 168/202] feat: implement quick assist mode detection in
 AssistantActionBar

- Added state management for quick assist mode using the Electron API.
- Introduced a useEffect hook to asynchronously check and set the quick assist mode based on the API response, enhancing the component's interactivity.
---
 .../components/assistant-ui/assistant-message.tsx         | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/surfsense_web/components/assistant-ui/assistant-message.tsx b/surfsense_web/components/assistant-ui/assistant-message.tsx
index 5567cfca8..49853b0b5 100644
--- a/surfsense_web/components/assistant-ui/assistant-message.tsx
+++ b/surfsense_web/components/assistant-ui/assistant-message.tsx
@@ -465,8 +465,14 @@ const AssistantActionBar: FC = () => {
 	const isLast = useAuiState((s) => s.message.isLast);
 	const aui = useAui();
 	const api = useElectronAPI();
+	const [isQuickAssist, setIsQuickAssist] = useState(false);
 
-	const isQuickAssist = !!api?.replaceText && !!api?.getQuickAskMode;
+	useEffect(() => {
+		if (!api?.getQuickAskMode) return;
+		api.getQuickAskMode().then((mode) => {
+			if (mode) setIsQuickAssist(true);
+		});
+	}, [api]);
 
 	return (
 		<ActionBarPrimitive.Root

From 55845d68efc32afcf74b26f4133921c00b11bc6e Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 17:38:39 +0200
Subject: [PATCH 169/202] feat: return 3 suggestion options from vision
 autocomplete agent

---
 .../agents/autocomplete/autocomplete_agent.py | 91 ++++++++++++++-----
 1 file changed, 67 insertions(+), 24 deletions(-)

diff --git a/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py b/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
index c6a071b0f..36b5bc086 100644
--- a/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
+++ b/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
@@ -14,7 +14,9 @@ LLM call — the window title is used directly as the KB search query.
 from __future__ import annotations
 
 import asyncio
+import json
 import logging
+import re
 import uuid
 from collections.abc import AsyncGenerator
 from typing import Any
@@ -61,13 +63,21 @@ Key behavior:
 - If the text area already has text, continue it naturally — typically just a sentence or two.
 
 Rules:
-- Output ONLY the text to be inserted. No quotes, no explanations, no meta-commentary.
 - Be CONCISE. Prefer a single paragraph or a few sentences. Autocomplete is a quick assist, not a full draft.
 - Match the tone and formality of the surrounding context.
 - If the screen shows code, write code. If it shows a casual chat, be casual. If it shows a formal email, be formal.
 - Do NOT describe the screenshot or explain your reasoning.
 - Do NOT cite or reference documents explicitly — just let the knowledge inform your writing naturally.
-- If you cannot determine what to write, output nothing.
+- If you cannot determine what to write, output an empty JSON array: []
+
+## Output Format
+
+You MUST provide exactly 3 different suggestion options. Each should be a distinct, plausible completion — vary the tone, detail level, or angle.
+
+Return your suggestions as a JSON array of exactly 3 strings. Output ONLY the JSON array, nothing else — no markdown fences, no explanation, no commentary.
+
+Example format:
+["First suggestion text here.", "Second suggestion — a different take.", "Third option with another approach."]
 
 ## Filesystem Tools `ls`, `read_file`, `write_file`, `edit_file`, `glob`, `grep`
 
@@ -264,6 +274,50 @@ async def create_autocomplete_agent(
     return agent, kb
 
 
+# ---------------------------------------------------------------------------
+# JSON suggestion parsing (robust fallback)
+# ---------------------------------------------------------------------------
+
+
+def _parse_suggestions(raw: str) -> list[str]:
+    """Extract a list of suggestion strings from the agent's output.
+
+    Tries, in order, and returns the first JSON list of strings (blanks dropped):
+      1. Direct ``json.loads``
+      2. Extract content between ```json ... ``` fences
+      3. Take the span from the first ``[`` to the last ``]`` (greedy match)
+    Falls back to the raw text as a single suggestion; empty input gives ``[]``.
+    """
+    text = raw.strip()
+    if not text:
+        return []
+
+    for candidate in _json_candidates(text):
+        try:
+            parsed = json.loads(candidate)
+            if isinstance(parsed, list) and all(isinstance(s, str) for s in parsed):
+                return [s for s in parsed if s.strip()]
+        except (json.JSONDecodeError, ValueError):
+            continue
+
+    return [text]
+
+
+def _json_candidates(text: str) -> list[str]:
+    """Return candidate JSON strings: raw text, fenced content, then bracket span."""
+    candidates = [text]
+
+    fence = re.search(r"```(?:json)?\s*\n?(.*?)```", text, re.DOTALL)
+    if fence:
+        candidates.append(fence.group(1).strip())
+
+    bracket = re.search(r"\[.*]", text, re.DOTALL)
+    if bracket:
+        candidates.append(bracket.group(0))
+
+    return candidates
+
+
 # ---------------------------------------------------------------------------
 # Streaming helper
 # ---------------------------------------------------------------------------
@@ -285,7 +339,7 @@ async def stream_autocomplete_agent(
     thread_id = uuid.uuid4().hex
     config = {"configurable": {"thread_id": thread_id}}
 
-    current_text_id: str | None = None
+    text_buffer: list[str] = []
     active_tool_depth = 0
     thinking_step_counter = 0
     tool_step_ids: dict[str, str] = {}
@@ -315,14 +369,12 @@ async def stream_autocomplete_agent(
     if emit_message_start:
         yield streaming_service.format_message_start()
 
-    # Emit an initial "Generating completion" step so the UI immediately
-    # shows activity once the agent starts its first LLM call.
     gen_step_id = next_thinking_step_id()
     last_active_step_id = gen_step_id
-    step_titles[gen_step_id] = "Generating completion"
+    step_titles[gen_step_id] = "Generating suggestions"
     yield streaming_service.format_thinking_step(
         step_id=gen_step_id,
-        title="Generating completion",
+        title="Generating suggestions",
         status="in_progress",
     )
 
@@ -341,15 +393,7 @@ async def stream_autocomplete_agent(
                 if chunk and hasattr(chunk, "content"):
                     content = chunk.content
                     if content and isinstance(content, str):
-                        if current_text_id is None:
-                            step_event = complete_current_step()
-                            if step_event:
-                                yield step_event
-                            current_text_id = streaming_service.generate_text_id()
-                            yield streaming_service.format_text_start(current_text_id)
-                        yield streaming_service.format_text_delta(
-                            current_text_id, content
-                        )
+                        text_buffer.append(content)
 
             elif event_type == "on_tool_start":
                 active_tool_depth += 1
@@ -357,10 +401,6 @@ async def stream_autocomplete_agent(
                 run_id = event.get("run_id", "")
                 tool_input = event.get("data", {}).get("input", {})
 
-                if current_text_id is not None:
-                    yield streaming_service.format_text_end(current_text_id)
-                    current_text_id = None
-
                 step_event = complete_current_step()
                 if step_event:
                     yield step_event
@@ -393,19 +433,22 @@ async def stream_autocomplete_agent(
                     if last_active_step_id == step_id:
                         last_active_step_id = None
 
-        if current_text_id is not None:
-            yield streaming_service.format_text_end(current_text_id)
         step_event = complete_current_step()
         if step_event:
             yield step_event
 
+        raw_text = "".join(text_buffer)
+        suggestions = _parse_suggestions(raw_text)
+
+        yield streaming_service.format_data(
+            "suggestions", {"options": suggestions}
+        )
+
         yield streaming_service.format_finish()
         yield streaming_service.format_done()
 
     except Exception as e:
         logger.error(f"Autocomplete agent streaming error: {e}", exc_info=True)
-        if current_text_id is not None:
-            yield streaming_service.format_text_end(current_text_id)
         yield streaming_service.format_error("Autocomplete failed. Please try again.")
         yield streaming_service.format_done()
 

From 2602248e7a552a19be0ac4e005f2c8183e18995a Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 17:43:40 +0200
Subject: [PATCH 170/202] feat: handle multi-option suggestions in suggestion
 page UI

---
 surfsense_web/app/desktop/suggestion/page.tsx | 68 ++++++++++++++-----
 1 file changed, 50 insertions(+), 18 deletions(-)

diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index 8d9095320..e98da9a1c 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -14,6 +14,10 @@ type SSEEvent =
 	| {
 			type: "data-thinking-step";
 			data: { id: string; title: string; status: string; items: string[] };
+	  }
+	| {
+			type: "data-suggestions";
+			data: { options: string[] };
 	  };
 
 interface AgentStep {
@@ -70,10 +74,11 @@ function StepIcon({ status }: { status: string }) {
 
 export default function SuggestionPage() {
 	const api = useElectronAPI();
-	const [suggestion, setSuggestion] = useState("");
+	const [options, setOptions] = useState<string[]>([]);
 	const [isLoading, setIsLoading] = useState(true);
 	const [error, setError] = useState<string | null>(null);
 	const [steps, setSteps] = useState<AgentStep[]>([]);
+	const [expandedOption, setExpandedOption] = useState<number | null>(null);
 	const abortRef = useRef<AbortController | null>(null);
 
 	const isDesktop = !!api?.onAutocompleteContext;
@@ -99,9 +104,10 @@ export default function SuggestionPage() {
 			abortRef.current = controller;
 
 			setIsLoading(true);
-			setSuggestion("");
+			setOptions([]);
 			setError(null);
 			setSteps([]);
+			setExpandedOption(null);
 
 			let token = getBearerToken();
 			if (!token) {
@@ -165,8 +171,8 @@ export default function SuggestionPage() {
 
 							try {
 								const parsed: SSEEvent = JSON.parse(data);
-								if (parsed.type === "text-delta") {
-									setSuggestion((prev) => prev + parsed.delta);
+								if (parsed.type === "data-suggestions") {
+									setOptions(parsed.data.options);
 								} else if (parsed.type === "error") {
 									setError(friendlyError(parsed.errorText));
 								} else if (parsed.type === "data-thinking-step") {
@@ -226,7 +232,7 @@ export default function SuggestionPage() {
 		);
 	}
 
-	const showLoading = isLoading && !suggestion;
+	const showLoading = isLoading && options.length === 0;
 
 	if (showLoading) {
 		return (
@@ -258,29 +264,55 @@ export default function SuggestionPage() {
 		);
 	}
 
-	const handleAccept = () => {
-		if (suggestion) {
-			api?.acceptSuggestion?.(suggestion);
-		}
+	const handleSelect = (text: string) => {
+		api?.acceptSuggestion?.(text);
 	};
 
 	const handleDismiss = () => {
 		api?.dismissSuggestion?.();
 	};
 
-	if (!suggestion) return null;
+	const TRUNCATE_LENGTH = 120;
+
+	if (options.length === 0) return null;
 
 	return (
 		<div className="suggestion-tooltip">
-			<p className="suggestion-text">{suggestion}</p>
+			<div className="suggestion-options">
+				{options.map((option, index) => {
+					const isExpanded = expandedOption === index;
+					const needsTruncation = option.length > TRUNCATE_LENGTH;
+					const displayText =
+						needsTruncation && !isExpanded
+							? option.slice(0, TRUNCATE_LENGTH) + "…"
+							: option;
+
+					return (
+						<button
+							key={index}
+							type="button"
+							className="suggestion-option"
+							onClick={() => handleSelect(option)}
+						>
+							<span className="option-number">{index + 1}</span>
+							<span className="option-text">{displayText}</span>
+							{needsTruncation && (
+								<button
+									type="button"
+									className="option-expand"
+									onClick={(e) => {
+										e.stopPropagation();
+										setExpandedOption(isExpanded ? null : index);
+									}}
+								>
+									{isExpanded ? "less" : "more"}
+								</button>
+							)}
+						</button>
+					);
+				})}
+			</div>
 			<div className="suggestion-actions">
-				<button
-					type="button"
-					className="suggestion-btn suggestion-btn-accept"
-					onClick={handleAccept}
-				>
-					Accept
-				</button>
 				<button
 					type="button"
 					className="suggestion-btn suggestion-btn-dismiss"

From e8f82a05909a7d19466c9df036566b0fa9464534 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 17:46:42 +0200
Subject: [PATCH 171/202] feat: add option card styles for multi-suggestion UI

---
 .../app/desktop/suggestion/suggestion.css     | 93 +++++++++++++++++++
 1 file changed, 93 insertions(+)

diff --git a/surfsense_web/app/desktop/suggestion/suggestion.css b/surfsense_web/app/desktop/suggestion/suggestion.css
index 2aa614efb..e0c56857d 100644
--- a/surfsense_web/app/desktop/suggestion/suggestion.css
+++ b/surfsense_web/app/desktop/suggestion/suggestion.css
@@ -191,3 +191,96 @@ body:has(.suggestion-body) {
 		transform: rotate(360deg);
 	}
 }
+
+/* --- Suggestion option cards --- */
+
+.suggestion-options {
+	display: flex;
+	flex-direction: column;
+	gap: 4px;
+	overflow-y: auto;
+	flex: 1 1 auto;
+	min-height: 0;
+	margin-bottom: 6px;
+}
+
+.suggestion-options::-webkit-scrollbar {
+	width: 5px;
+}
+
+.suggestion-options::-webkit-scrollbar-track {
+	background: transparent;
+}
+
+.suggestion-options::-webkit-scrollbar-thumb {
+	background: #555;
+	border-radius: 3px;
+}
+
+.suggestion-option {
+	display: flex;
+	align-items: flex-start;
+	gap: 8px;
+	padding: 6px 8px;
+	border-radius: 5px;
+	border: 1px solid #333;
+	background: #262626;
+	cursor: pointer;
+	text-align: left;
+	font-family: inherit;
+	transition:
+		background 0.15s,
+		border-color 0.15s;
+	width: 100%;
+}
+
+.suggestion-option:hover {
+	background: #2a2d3a;
+	border-color: #3b82f6;
+}
+
+.option-number {
+	flex-shrink: 0;
+	width: 18px;
+	height: 18px;
+	border-radius: 50%;
+	background: #3f3f46;
+	color: #d4d4d4;
+	font-size: 10px;
+	font-weight: 600;
+	display: flex;
+	align-items: center;
+	justify-content: center;
+	margin-top: 1px;
+}
+
+.suggestion-option:hover .option-number {
+	background: #2563eb;
+	color: #fff;
+}
+
+.option-text {
+	color: #d4d4d4;
+	font-size: 12px;
+	line-height: 1.45;
+	word-wrap: break-word;
+	white-space: pre-wrap;
+	flex: 1 1 auto;
+	min-width: 0;
+}
+
+.option-expand {
+	flex-shrink: 0;
+	background: none;
+	border: none;
+	color: #71717a;
+	font-size: 10px;
+	cursor: pointer;
+	padding: 0 2px;
+	font-family: inherit;
+	margin-top: 1px;
+}
+
+.option-expand:hover {
+	color: #a1a1aa;
+}

From 5f354ef6ac7d74f65b08682cf259576c2ba2980a Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 18:06:40 +0200
Subject: [PATCH 172/202] fix: capture agent text from on_chat_model_end for
 non-streaming LLM calls

---
 .../app/agents/autocomplete/autocomplete_agent.py  | 14 ++++++++++++--
 1 file changed, 12 insertions(+), 2 deletions(-)

diff --git a/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py b/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
index 36b5bc086..84f6a064d 100644
--- a/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
+++ b/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
@@ -275,7 +275,7 @@ async def create_autocomplete_agent(
 
 
 # ---------------------------------------------------------------------------
-# JSON suggestion parsing (robust fallback)
+# JSON suggestion parsing (with fallback)
 # ---------------------------------------------------------------------------
 
 
@@ -383,7 +383,6 @@ async def stream_autocomplete_agent(
             input_data, config=config, version="v2"
         ):
             event_type = event.get("event", "")
-
             if event_type == "on_chat_model_stream":
                 if active_tool_depth > 0:
                     continue
@@ -395,6 +394,17 @@ async def stream_autocomplete_agent(
                     if content and isinstance(content, str):
                         text_buffer.append(content)
 
+            elif event_type == "on_chat_model_end":
+                if active_tool_depth > 0:
+                    continue
+                if "surfsense:internal" in event.get("tags", []):
+                    continue
+                output = event.get("data", {}).get("output")
+                if output and hasattr(output, "content"):
+                    content = output.content
+                    if content and isinstance(content, str) and not text_buffer:
+                        text_buffer.append(content)
+
             elif event_type == "on_tool_start":
                 active_tool_depth += 1
                 tool_name = event.get("name", "unknown_tool")

From 60b9f0f21c0fcdc20caa6beee87491840a963627 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 18:12:34 +0200
Subject: [PATCH 173/202] fix: nested button, empty options fallback, skip
 intermediate tool_calls

---
 .../agents/autocomplete/autocomplete_agent.py  |  2 ++
 surfsense_web/app/desktop/suggestion/page.tsx  | 18 ++++++++++++++----
 2 files changed, 16 insertions(+), 4 deletions(-)

diff --git a/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py b/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
index 84f6a064d..77c0af5bb 100644
--- a/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
+++ b/surfsense_backend/app/agents/autocomplete/autocomplete_agent.py
@@ -401,6 +401,8 @@ async def stream_autocomplete_agent(
                     continue
                 output = event.get("data", {}).get("output")
                 if output and hasattr(output, "content"):
+                    if getattr(output, "tool_calls", None):
+                        continue
                     content = output.content
                     if content and isinstance(content, str) and not text_buffer:
                         text_buffer.append(content)
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index e98da9a1c..af1c50be0 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -274,7 +274,13 @@ export default function SuggestionPage() {
 
 	const TRUNCATE_LENGTH = 120;
 
-	if (options.length === 0) return null;
+	if (options.length === 0) {
+		return (
+			<div className="suggestion-tooltip suggestion-error">
+				<span className="suggestion-error-text">No suggestions available.</span>
+			</div>
+		);
+	}
 
 	return (
 		<div className="suggestion-tooltip">
@@ -288,11 +294,15 @@ export default function SuggestionPage() {
 							: option;
 
 					return (
-						<button
+						<div
 							key={index}
-							type="button"
+							role="button"
+							tabIndex={0}
 							className="suggestion-option"
 							onClick={() => handleSelect(option)}
+							onKeyDown={(e) => { // Enter from the nested expand button bubbles here; ignore it
+								if (e.key === "Enter" && e.target === e.currentTarget) handleSelect(option);
+							}}
 						>
 							<span className="option-number">{index + 1}</span>
 							<span className="option-text">{displayText}</span>
@@ -308,7 +318,7 @@ export default function SuggestionPage() {
 									{isExpanded ? "less" : "more"}
 								</button>
 							)}
-						</button>
+						</div>
 					);
 				})}
 			</div>

From 70807cccd1cb55f47ea136c1c5cf8399fd5eec63 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 18:22:16 +0200
Subject: [PATCH 174/202] fix: hide scrollbar during streaming to prevent UI
 flicker

---
 surfsense_web/app/desktop/suggestion/suggestion.css | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/surfsense_web/app/desktop/suggestion/suggestion.css b/surfsense_web/app/desktop/suggestion/suggestion.css
index e0c56857d..f5471cf37 100644
--- a/surfsense_web/app/desktop/suggestion/suggestion.css
+++ b/surfsense_web/app/desktop/suggestion/suggestion.css
@@ -127,6 +127,10 @@ body:has(.suggestion-body) {
 	max-height: 340px;
 }
 
+.agent-activity::-webkit-scrollbar {
+	display: none;
+}
+
 .activity-initial {
 	display: flex;
 	align-items: center;

From 5439b3991b6f61fd547ae8ef1d2020e04f6ec1a3 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 18:25:06 +0200
Subject: [PATCH 175/202] fix: auto-dismiss overlay when no suggestions are
 available

---
 surfsense_web/app/desktop/suggestion/page.tsx | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index af1c50be0..e458f6615 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -97,6 +97,14 @@ export default function SuggestionPage() {
 		return () => clearTimeout(timer);
 	}, [error, api]);
 
+	useEffect(() => {
+		if (isLoading || error || options.length > 0) return;
+		const timer = setTimeout(() => {
+			api?.dismissSuggestion?.();
+		}, AUTO_DISMISS_MS);
+		return () => clearTimeout(timer);
+	}, [isLoading, error, options, api]);
+
 	const fetchSuggestion = useCallback(
 		async (screenshot: string, searchSpaceId: string, appName?: string, windowTitle?: string) => {
 			abortRef.current?.abort();

From 879945eeae05d22845a2dd682a6e3eb1cbeb578d Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 18:49:04 +0200
Subject: [PATCH 176/202] Add VisionProvider enum, VisionLLMConfig table, and
 vision RBAC permissions

---
 surfsense_backend/app/db.py | 77 ++++++++++++++++++++++++++++++++++++-
 1 file changed, 76 insertions(+), 1 deletion(-)

diff --git a/surfsense_backend/app/db.py b/surfsense_backend/app/db.py
index 6e9553307..4689313f7 100644
--- a/surfsense_backend/app/db.py
+++ b/surfsense_backend/app/db.py
@@ -260,6 +260,24 @@ class ImageGenProvider(StrEnum):
     NSCALE = "NSCALE"
 
 
+class VisionProvider(StrEnum):
+    OPENAI = "OPENAI"
+    ANTHROPIC = "ANTHROPIC"
+    GOOGLE = "GOOGLE"
+    AZURE_OPENAI = "AZURE_OPENAI"
+    VERTEX_AI = "VERTEX_AI"
+    BEDROCK = "BEDROCK"
+    XAI = "XAI"
+    OPENROUTER = "OPENROUTER"
+    OLLAMA = "OLLAMA"
+    GROQ = "GROQ"
+    TOGETHER_AI = "TOGETHER_AI"
+    FIREWORKS_AI = "FIREWORKS_AI"
+    DEEPSEEK = "DEEPSEEK"
+    MISTRAL = "MISTRAL"
+    CUSTOM = "CUSTOM"
+
+
 class LogLevel(StrEnum):
     DEBUG = "DEBUG"
     INFO = "INFO"
@@ -377,6 +395,11 @@ class Permission(StrEnum):
     IMAGE_GENERATIONS_READ = "image_generations:read"
     IMAGE_GENERATIONS_DELETE = "image_generations:delete"
 
+    # Vision LLM Configs
+    VISION_CONFIGS_CREATE = "vision_configs:create"
+    VISION_CONFIGS_READ = "vision_configs:read"
+    VISION_CONFIGS_DELETE = "vision_configs:delete"
+
     # Connectors
     CONNECTORS_CREATE = "connectors:create"
     CONNECTORS_READ = "connectors:read"
@@ -445,6 +468,9 @@ DEFAULT_ROLE_PERMISSIONS = {
         # Image Generations (create and read, no delete)
         Permission.IMAGE_GENERATIONS_CREATE.value,
         Permission.IMAGE_GENERATIONS_READ.value,
+        # Vision Configs (create and read, no delete)
+        Permission.VISION_CONFIGS_CREATE.value,
+        Permission.VISION_CONFIGS_READ.value,
         # Connectors (no delete)
         Permission.CONNECTORS_CREATE.value,
         Permission.CONNECTORS_READ.value,
@@ -478,6 +504,8 @@ DEFAULT_ROLE_PERMISSIONS = {
         Permission.VIDEO_PRESENTATIONS_READ.value,
         # Image Generations (read only)
         Permission.IMAGE_GENERATIONS_READ.value,
+        # Vision Configs (read only)
+        Permission.VISION_CONFIGS_READ.value,
         # Connectors (read only)
         Permission.CONNECTORS_READ.value,
         # Logs (read only)
@@ -1263,6 +1291,35 @@ class ImageGenerationConfig(BaseModel, TimestampMixin):
     user = relationship("User", back_populates="image_generation_configs")
 
 
+class VisionLLMConfig(BaseModel, TimestampMixin):
+    __tablename__ = "vision_llm_configs"
+
+    name = Column(String(100), nullable=False, index=True)
+    description = Column(String(500), nullable=True)
+
+    provider = Column(SQLAlchemyEnum(VisionProvider), nullable=False)
+    custom_provider = Column(String(100), nullable=True)
+    model_name = Column(String(100), nullable=False)
+
+    api_key = Column(String, nullable=False)
+    api_base = Column(String(500), nullable=True)
+    api_version = Column(String(50), nullable=True)
+
+    litellm_params = Column(JSON, nullable=True, default={})
+
+    search_space_id = Column(
+        Integer, ForeignKey("searchspaces.id", ondelete="CASCADE"), nullable=False
+    )
+    search_space = relationship(
+        "SearchSpace", back_populates="vision_llm_configs"
+    )
+
+    user_id = Column(
+        UUID(as_uuid=True), ForeignKey("user.id", ondelete="CASCADE"), nullable=False
+    )
+    user = relationship("User", back_populates="vision_llm_configs")
+
+
 class ImageGeneration(BaseModel, TimestampMixin):
     """
     Stores image generation requests and results using litellm.aimage_generation().
@@ -1351,7 +1408,7 @@ class SearchSpace(BaseModel, TimestampMixin):
     image_generation_config_id = Column(
         Integer, nullable=True, default=0
     )  # For image generation, defaults to Auto mode
-    vision_llm_id = Column(
+    vision_llm_config_id = Column(
         Integer, nullable=True, default=0
     )  # For vision/screenshot analysis, defaults to Auto mode
 
@@ -1432,6 +1489,12 @@ class SearchSpace(BaseModel, TimestampMixin):
         order_by="ImageGenerationConfig.id",
         cascade="all, delete-orphan",
     )
+    vision_llm_configs = relationship(
+        "VisionLLMConfig",
+        back_populates="search_space",
+        order_by="VisionLLMConfig.id",
+        cascade="all, delete-orphan",
+    )
 
     # RBAC relationships
     roles = relationship(
@@ -1961,6 +2024,12 @@ if config.AUTH_TYPE == "GOOGLE":
             passive_deletes=True,
         )
 
+        vision_llm_configs = relationship(
+            "VisionLLMConfig",
+            back_populates="user",
+            passive_deletes=True,
+        )
+
         # User memories for personalized AI responses
         memories = relationship(
             "UserMemory",
@@ -2075,6 +2144,12 @@ else:
             passive_deletes=True,
         )
 
+        vision_llm_configs = relationship(
+            "VisionLLMConfig",
+            back_populates="user",
+            passive_deletes=True,
+        )
+
         # User memories for personalized AI responses
         memories = relationship(
             "UserMemory",

From 32a3356f55cc3c9003df88e1d529eca5cf8babbc Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 18:50:51 +0200
Subject: [PATCH 177/202] Add migration 120: vision_llm_configs table and
 column rename

---
 .../120_add_vision_llm_configs_table.py       | 190 ++++++++++++++++++
 1 file changed, 190 insertions(+)
 create mode 100644 surfsense_backend/alembic/versions/120_add_vision_llm_configs_table.py

diff --git a/surfsense_backend/alembic/versions/120_add_vision_llm_configs_table.py b/surfsense_backend/alembic/versions/120_add_vision_llm_configs_table.py
new file mode 100644
index 000000000..c0c915388
--- /dev/null
+++ b/surfsense_backend/alembic/versions/120_add_vision_llm_configs_table.py
@@ -0,0 +1,190 @@
+"""Add vision LLM configs table and rename preference column
+
+Revision ID: 120
+Revises: 119
+
+Changes:
+1. Create visionprovider enum type
+2. Create vision_llm_configs table
+3. Rename vision_llm_id -> vision_llm_config_id on searchspaces
+4. Add vision config permissions to existing system roles
+"""
+
+from __future__ import annotations
+
+from collections.abc import Sequence
+
+import sqlalchemy as sa
+from sqlalchemy.dialects.postgresql import ENUM as PG_ENUM, UUID
+
+from alembic import op
+
+revision: str = "120"
+down_revision: str | None = "119"
+branch_labels: str | Sequence[str] | None = None
+depends_on: str | Sequence[str] | None = None
+
+VISION_PROVIDER_VALUES = (
+    "OPENAI",
+    "ANTHROPIC",
+    "GOOGLE",
+    "AZURE_OPENAI",
+    "VERTEX_AI",
+    "BEDROCK",
+    "XAI",
+    "OPENROUTER",
+    "OLLAMA",
+    "GROQ",
+    "TOGETHER_AI",
+    "FIREWORKS_AI",
+    "DEEPSEEK",
+    "MISTRAL",
+    "CUSTOM",
+)
+
+
+def upgrade() -> None:
+    connection = op.get_bind()
+
+    # 1. Create visionprovider enum
+    connection.execute(
+        sa.text(
+            """
+            DO $$
+            BEGIN
+                IF NOT EXISTS (SELECT 1 FROM pg_type WHERE typname = 'visionprovider') THEN
+                    CREATE TYPE visionprovider AS ENUM (
+                        'OPENAI', 'ANTHROPIC', 'GOOGLE', 'AZURE_OPENAI', 'VERTEX_AI',
+                        'BEDROCK', 'XAI', 'OPENROUTER', 'OLLAMA', 'GROQ',
+                        'TOGETHER_AI', 'FIREWORKS_AI', 'DEEPSEEK', 'MISTRAL', 'CUSTOM'
+                    );
+                END IF;
+            END
+            $$;
+            """
+        )
+    )
+
+    # 2. Create vision_llm_configs table
+    result = connection.execute(
+        sa.text(
+            "SELECT EXISTS (SELECT FROM information_schema.tables WHERE table_name = 'vision_llm_configs')"
+        )
+    )
+    if not result.scalar():
+        op.create_table(
+            "vision_llm_configs",
+            sa.Column("id", sa.Integer(), autoincrement=True, nullable=False),
+            sa.Column("name", sa.String(100), nullable=False),
+            sa.Column("description", sa.String(500), nullable=True),
+            sa.Column(
+                "provider",
+                PG_ENUM(*VISION_PROVIDER_VALUES, name="visionprovider", create_type=False),
+                nullable=False,
+            ),
+            sa.Column("custom_provider", sa.String(100), nullable=True),
+            sa.Column("model_name", sa.String(100), nullable=False),
+            sa.Column("api_key", sa.String(), nullable=False),
+            sa.Column("api_base", sa.String(500), nullable=True),
+            sa.Column("api_version", sa.String(50), nullable=True),
+            sa.Column("litellm_params", sa.JSON(), nullable=True),
+            sa.Column("search_space_id", sa.Integer(), nullable=False),
+            sa.Column("user_id", UUID(as_uuid=True), nullable=False),
+            sa.Column(
+                "created_at",
+                sa.TIMESTAMP(timezone=True),
+                server_default=sa.text("now()"),
+                nullable=False,
+            ),
+            sa.PrimaryKeyConstraint("id"),
+            sa.ForeignKeyConstraint(
+                ["search_space_id"], ["searchspaces.id"], ondelete="CASCADE"
+            ),
+            sa.ForeignKeyConstraint(
+                ["user_id"], ["user.id"], ondelete="CASCADE"
+            ),
+        )
+        op.execute(
+            "CREATE INDEX IF NOT EXISTS ix_vision_llm_configs_name "
+            "ON vision_llm_configs (name)"
+        )
+        op.execute(
+            "CREATE INDEX IF NOT EXISTS ix_vision_llm_configs_search_space_id "
+            "ON vision_llm_configs (search_space_id)"
+        )
+
+    # 3. Rename vision_llm_id -> vision_llm_config_id on searchspaces
+    existing_columns = [
+        col["name"] for col in sa.inspect(connection).get_columns("searchspaces")
+    ]
+    if "vision_llm_id" in existing_columns and "vision_llm_config_id" not in existing_columns:
+        op.alter_column("searchspaces", "vision_llm_id", new_column_name="vision_llm_config_id")
+    elif "vision_llm_config_id" not in existing_columns:
+        op.add_column(
+            "searchspaces",
+            sa.Column("vision_llm_config_id", sa.Integer(), nullable=True, server_default="0"),
+        )
+
+    # 4. Add vision config permissions to existing system roles
+    connection.execute(
+        sa.text(
+            """
+            UPDATE search_space_roles
+            SET permissions = array_cat(
+                permissions,
+                ARRAY['vision_configs:create', 'vision_configs:read']
+            )
+            WHERE is_system_role = true
+              AND name = 'Editor'
+              AND NOT ('vision_configs:create' = ANY(permissions))
+            """
+        )
+    )
+    connection.execute(
+        sa.text(
+            """
+            UPDATE search_space_roles
+            SET permissions = array_cat(
+                permissions,
+                ARRAY['vision_configs:read']
+            )
+            WHERE is_system_role = true
+              AND name = 'Viewer'
+              AND NOT ('vision_configs:read' = ANY(permissions))
+            """
+        )
+    )
+
+
+def downgrade() -> None:
+    connection = op.get_bind()
+
+    # Remove permissions
+    connection.execute(
+        sa.text(
+            """
+            UPDATE search_space_roles
+            SET permissions = array_remove(
+                array_remove(
+                    array_remove(permissions, 'vision_configs:create'),
+                    'vision_configs:read'
+                ),
+                'vision_configs:delete'
+            )
+            WHERE is_system_role = true
+            """
+        )
+    )
+
+    # Rename column back
+    existing_columns = [
+        col["name"] for col in sa.inspect(connection).get_columns("searchspaces")
+    ]
+    if "vision_llm_config_id" in existing_columns:
+        op.alter_column("searchspaces", "vision_llm_config_id", new_column_name="vision_llm_id")
+
+    # Drop table and enum
+    op.execute("DROP INDEX IF EXISTS ix_vision_llm_configs_search_space_id")
+    op.execute("DROP INDEX IF EXISTS ix_vision_llm_configs_name")
+    op.execute("DROP TABLE IF EXISTS vision_llm_configs")
+    op.execute("DROP TYPE IF EXISTS visionprovider")

From ecfcc6101112bcb59d95469785d9acb0b656319a Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 18:52:37 +0200
Subject: [PATCH 178/202] Add VisionLLMConfig Pydantic schemas

---
 surfsense_backend/app/schemas/__init__.py   | 13 ++++
 surfsense_backend/app/schemas/vision_llm.py | 75 +++++++++++++++++++++
 2 files changed, 88 insertions(+)
 create mode 100644 surfsense_backend/app/schemas/vision_llm.py

diff --git a/surfsense_backend/app/schemas/__init__.py b/surfsense_backend/app/schemas/__init__.py
index b94a30c19..fdf34672b 100644
--- a/surfsense_backend/app/schemas/__init__.py
+++ b/surfsense_backend/app/schemas/__init__.py
@@ -125,6 +125,13 @@ from .video_presentations import (
     VideoPresentationRead,
     VideoPresentationUpdate,
 )
+from .vision_llm import (
+    GlobalVisionLLMConfigRead,
+    VisionLLMConfigCreate,
+    VisionLLMConfigPublic,
+    VisionLLMConfigRead,
+    VisionLLMConfigUpdate,
+)
 
 __all__ = [
     # Folder schemas
@@ -163,6 +170,8 @@ __all__ = [
     "FolderUpdate",
     "GlobalImageGenConfigRead",
     "GlobalNewLLMConfigRead",
+    # Vision LLM Config schemas
+    "GlobalVisionLLMConfigRead",
     "GoogleDriveIndexRequest",
     "GoogleDriveIndexingOptions",
     # Base schemas
@@ -264,4 +273,8 @@ __all__ = [
     "VideoPresentationCreate",
     "VideoPresentationRead",
     "VideoPresentationUpdate",
+    "VisionLLMConfigCreate",
+    "VisionLLMConfigPublic",
+    "VisionLLMConfigRead",
+    "VisionLLMConfigUpdate",
 ]
diff --git a/surfsense_backend/app/schemas/vision_llm.py b/surfsense_backend/app/schemas/vision_llm.py
new file mode 100644
index 000000000..ab2e609dc
--- /dev/null
+++ b/surfsense_backend/app/schemas/vision_llm.py
@@ -0,0 +1,75 @@
+import uuid
+from datetime import datetime
+from typing import Any
+
+from pydantic import BaseModel, ConfigDict, Field
+
+from app.db import VisionProvider
+
+
+class VisionLLMConfigBase(BaseModel):  # Fields shared by the create and read schemas
+    name: str = Field(..., max_length=100)
+    description: str | None = Field(None, max_length=500)
+    provider: VisionProvider = Field(...)
+    custom_provider: str | None = Field(None, max_length=100)  # when set, get_vision_llm uses it as the model prefix instead of the provider's
+    model_name: str = Field(..., max_length=100)
+    api_key: str = Field(...)  # required; no length limit is declared here
+    api_base: str | None = Field(None, max_length=500)
+    api_version: str | None = Field(None, max_length=50)
+    litellm_params: dict[str, Any] | None = Field(default=None)  # extra kwargs; get_vision_llm merges them over model/api_key/api_base
+
+
+class VisionLLMConfigCreate(VisionLLMConfigBase):  # Create payload: the base fields plus the owning search space
+    search_space_id: int = Field(...)
+
+
+class VisionLLMConfigUpdate(BaseModel):  # Partial-update payload: every field is optional and defaults to None
+    name: str | None = Field(None, max_length=100)
+    description: str | None = Field(None, max_length=500)
+    provider: VisionProvider | None = None
+    custom_provider: str | None = Field(None, max_length=100)
+    model_name: str | None = Field(None, max_length=100)
+    api_key: str | None = None
+    api_base: str | None = Field(None, max_length=500)
+    api_version: str | None = Field(None, max_length=50)
+    litellm_params: dict[str, Any] | None = None
+
+
+class VisionLLMConfigRead(VisionLLMConfigBase):  # Response schema: base fields (api_key included) plus id/ownership/timestamp
+    id: int
+    created_at: datetime
+    search_space_id: int
+    user_id: uuid.UUID
+    # from_attributes: allow building this schema from attribute access on an object (e.g. an ORM row)
+    model_config = ConfigDict(from_attributes=True)
+
+
+class VisionLLMConfigPublic(BaseModel):  # Same field names as VisionLLMConfigRead except that api_key is absent
+    id: int
+    name: str
+    description: str | None = None
+    provider: VisionProvider
+    custom_provider: str | None = None
+    model_name: str
+    api_base: str | None = None
+    api_version: str | None = None
+    litellm_params: dict[str, Any] | None = None
+    created_at: datetime
+    search_space_id: int
+    user_id: uuid.UUID
+    # from_attributes: allow building this schema from attribute access on an object (e.g. an ORM row)
+    model_config = ConfigDict(from_attributes=True)
+
+
+class GlobalVisionLLMConfigRead(BaseModel):  # Response shape for YAML-defined (global) configs; it has no api_key field
+    id: int = Field(...)
+    name: str
+    description: str | None = None
+    provider: str  # plain string rather than VisionProvider; the synthetic Auto entry uses "AUTO"
+    custom_provider: str | None = None
+    model_name: str
+    api_base: str | None = None
+    api_version: str | None = None
+    litellm_params: dict[str, Any] | None = None
+    is_global: bool = True
+    is_auto_mode: bool = False  # the routes set this to True only on the synthetic Auto entry (id 0)

From 362cd3590c2c68b9bed4a461f00af839e6130c73 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 18:59:33 +0200
Subject: [PATCH 179/202] Add VisionLLMRouterService for Auto mode routing

---
 .../app/services/vision_llm_router_service.py | 193 ++++++++++++++++++
 1 file changed, 193 insertions(+)
 create mode 100644 surfsense_backend/app/services/vision_llm_router_service.py

diff --git a/surfsense_backend/app/services/vision_llm_router_service.py b/surfsense_backend/app/services/vision_llm_router_service.py
new file mode 100644
index 000000000..0d782ab2b
--- /dev/null
+++ b/surfsense_backend/app/services/vision_llm_router_service.py
@@ -0,0 +1,193 @@
+import logging
+from typing import Any
+
+from litellm import Router
+
+logger = logging.getLogger(__name__)
+
+VISION_AUTO_MODE_ID = 0  # config ID that selects Auto mode (compared against in is_vision_auto_mode)
+
+VISION_PROVIDER_MAP = {  # provider name (upper-case) -> prefix used when building "<prefix>/<model_name>" strings
+    "OPENAI": "openai",
+    "ANTHROPIC": "anthropic",
+    "GOOGLE": "gemini",
+    "AZURE_OPENAI": "azure",
+    "VERTEX_AI": "vertex_ai",
+    "BEDROCK": "bedrock",
+    "XAI": "xai",
+    "OPENROUTER": "openrouter",
+    "OLLAMA": "ollama_chat",
+    "GROQ": "groq",
+    "TOGETHER_AI": "together_ai",
+    "FIREWORKS_AI": "fireworks_ai",
+    "DEEPSEEK": "openai",  # NOTE(review): shares the "openai" prefix — presumably relies on an OpenAI-compatible api_base; confirm
+    "MISTRAL": "mistral",
+    "CUSTOM": "custom",
+}
+
+
+class VisionLLMRouterService:  # Singleton that owns the LiteLLM Router built from the global vision configs
+    _instance = None
+    _router: Router | None = None
+    _model_list: list[dict] = []
+    _router_settings: dict = {}
+    _initialized: bool = False
+
+    def __new__(cls):  # every construction returns the same shared instance
+        if cls._instance is None:
+            cls._instance = super().__new__(cls)
+        return cls._instance
+
+    @classmethod
+    def get_instance(cls) -> "VisionLLMRouterService":  # creates the shared instance on first use
+        if cls._instance is None:
+            cls._instance = cls()
+        return cls._instance
+
+    @classmethod
+    def initialize(
+        cls,
+        global_configs: list[dict],
+        router_settings: dict | None = None,
+    ) -> None:
+        """Build the shared Router from the given configs; does nothing once a previous call has succeeded."""
+        instance = cls.get_instance()
+        if instance._initialized:
+            logger.debug("Vision LLM Router already initialized, skipping")
+            return
+
+        model_list = []
+        for config in global_configs:
+            deployment = cls._config_to_deployment(config)
+            if deployment:
+                model_list.append(deployment)
+
+        if not model_list:
+            logger.warning(
+                "No valid vision LLM configs found for router initialization"
+            )
+            return
+
+        instance._model_list = model_list
+        instance._router_settings = router_settings or {}
+        # Defaults; caller-supplied router_settings override them key by key
+        default_settings = {
+            "routing_strategy": "usage-based-routing",
+            "num_retries": 3,
+            "allowed_fails": 3,
+            "cooldown_time": 60,
+            "retry_after": 5,  # NOTE(review): never forwarded to Router(...) below — confirm whether that is intended
+        }
+
+        final_settings = {**default_settings, **instance._router_settings}
+
+        try:
+            instance._router = Router(
+                model_list=model_list,
+                routing_strategy=final_settings.get(
+                    "routing_strategy", "usage-based-routing"
+                ),
+                num_retries=final_settings.get("num_retries", 3),
+                allowed_fails=final_settings.get("allowed_fails", 3),
+                cooldown_time=final_settings.get("cooldown_time", 60),
+                set_verbose=False,
+            )
+            instance._initialized = True
+            logger.info(
+                "Vision LLM Router initialized with %d deployments, strategy: %s",
+                len(model_list),
+                final_settings.get("routing_strategy"),
+            )
+        except Exception as e:
+            logger.error(f"Failed to initialize Vision LLM Router: {e}")
+            instance._router = None  # _initialized stays False, so a later call retries; _model_list keeps its entries
+
+    @classmethod
+    def _config_to_deployment(cls, config: dict) -> dict | None:
+        """Turn one config dict into a Router deployment entry; None if model_name/api_key is missing or conversion fails."""
+        try:
+            if not config.get("model_name") or not config.get("api_key"):
+                return None
+            if config.get("custom_provider"):
+                model_string = f"{config['custom_provider']}/{config['model_name']}"
+            else:
+                provider = config.get("provider", "").upper()
+                provider_prefix = VISION_PROVIDER_MAP.get(provider, provider.lower())
+                model_string = f"{provider_prefix}/{config['model_name']}"
+
+            litellm_params: dict[str, Any] = {
+                "model": model_string,
+                "api_key": config.get("api_key"),
+            }
+
+            if config.get("api_base"):
+                litellm_params["api_base"] = config["api_base"]
+
+            if config.get("api_version"):
+                litellm_params["api_version"] = config["api_version"]
+            # Config-supplied litellm_params are applied last, so they can override the keys set above
+            if config.get("litellm_params"):
+                litellm_params.update(config["litellm_params"])
+
+            deployment: dict[str, Any] = {
+                "model_name": "auto",
+                "litellm_params": litellm_params,
+            }
+            # rpm/tpm are copied only when present and truthy
+            if config.get("rpm"):
+                deployment["rpm"] = config["rpm"]
+            if config.get("tpm"):
+                deployment["tpm"] = config["tpm"]
+
+            return deployment
+
+        except Exception as e:
+            logger.warning(f"Failed to convert vision config to deployment: {e}")
+            return None
+
+    @classmethod
+    def get_router(cls) -> Router | None:  # None until initialize() has built a Router
+        instance = cls.get_instance()
+        return instance._router
+
+    @classmethod
+    def is_initialized(cls) -> bool:  # True only when initialization succeeded and a Router is held
+        instance = cls.get_instance()
+        return instance._initialized and instance._router is not None
+
+    @classmethod
+    def get_model_count(cls) -> int:  # number of deployments stored by initialize()
+        instance = cls.get_instance()
+        return len(instance._model_list)
+
+
+def is_vision_auto_mode(config_id: int | None) -> bool:  # True only for the reserved Auto-mode ID; None yields False
+    return config_id == VISION_AUTO_MODE_ID
+
+
+def build_vision_model_string(
+    provider: str, model_name: str, custom_provider: str | None
+) -> str:
+    if custom_provider:  # an explicit custom provider replaces the mapped prefix entirely
+        return f"{custom_provider}/{model_name}"
+    prefix = VISION_PROVIDER_MAP.get(provider.upper(), provider.lower())  # unmapped providers fall back to their lower-cased name
+    return f"{prefix}/{model_name}"
+
+
+def get_global_vision_llm_config(config_id: int) -> dict | None:
+    """Return the Auto-mode stub for ID 0, the matching YAML config for a negative ID, otherwise None."""
+    from app.config import config  # function-scope import — presumably avoids a circular import with app.config; confirm
+    if config_id == VISION_AUTO_MODE_ID:
+        return {
+            "id": VISION_AUTO_MODE_ID,
+            "name": "Auto (Fastest)",
+            "provider": "AUTO",
+            "model_name": "auto",
+            "is_auto_mode": True,
+        }
+    if config_id > 0:  # positive IDs are never looked up in the global list
+        return None
+    for cfg in config.GLOBAL_VISION_LLM_CONFIGS:
+        if cfg.get("id") == config_id:
+            return cfg  # the stored dict itself is returned (not a copy), whatever keys it holds
+    return None

From 7448f27ee01ce1619ff02f61ab3b12b6f085e60e Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 19:02:18 +0200
Subject: [PATCH 180/202] Add vision LLM config loading and router
 initialization to Config

---
 surfsense_backend/app/config/__init__.py | 67 ++++++++++++++++++++++++
 1 file changed, 67 insertions(+)

diff --git a/surfsense_backend/app/config/__init__.py b/surfsense_backend/app/config/__init__.py
index 7c4baf923..4c49a4f8b 100644
--- a/surfsense_backend/app/config/__init__.py
+++ b/surfsense_backend/app/config/__init__.py
@@ -102,6 +102,44 @@ def load_global_image_gen_configs():
         return []
 
 
+def load_global_vision_llm_configs():
+    """Return the `global_vision_llm_configs` list from global_llm_config.yaml, or [] if it is absent, empty or unreadable."""
+    global_config_file = BASE_DIR / "app" / "config" / "global_llm_config.yaml"
+    if not global_config_file.exists():
+        return []
+    try:
+        with open(global_config_file, encoding="utf-8") as f:
+            # safe_load gives None for an empty file, and a key with no entries loads as None
+            data = yaml.safe_load(f) or {}
+            return data.get("global_vision_llm_configs") or []
+    except Exception as e:
+        print(f"Warning: Failed to load global vision LLM configs: {e}")
+        return []
+
+
+def load_vision_llm_router_settings():
+    """Return the vision router settings: built-in defaults overlaid with `vision_llm_router_settings` from the YAML file."""
+    default_settings = {
+        "routing_strategy": "usage-based-routing",
+        "num_retries": 3,
+        "allowed_fails": 3,
+        "cooldown_time": 60,
+    }
+    global_config_file = BASE_DIR / "app" / "config" / "global_llm_config.yaml"
+
+    if not global_config_file.exists():
+        return default_settings
+    try:
+        with open(global_config_file, encoding="utf-8") as f:
+            # An empty file or an empty settings key loads as None; treat both as "no overrides" without a warning
+            data = yaml.safe_load(f) or {}
+            settings = data.get("vision_llm_router_settings") or {}
+            return {**default_settings, **settings}
+    except Exception as e:
+        print(f"Warning: Failed to load vision LLM router settings: {e}")
+        return default_settings
+
+
 def load_image_gen_router_settings():
     """
     Load router settings for image generation Auto mode from YAML file.
@@ -182,6 +220,29 @@ def initialize_image_gen_router():
         print(f"Warning: Failed to initialize Image Generation Router: {e}")
 
 
+def initialize_vision_llm_router():
+    """Load the global vision configs and router settings, then hand them to VisionLLMRouterService.initialize."""
+    vision_configs = load_global_vision_llm_configs()
+    router_settings = load_vision_llm_router_settings()
+    if not vision_configs:
+        print(
+            "Info: No global vision LLM configs found, "
+            "Vision LLM Auto mode will not be available"
+        )
+        return
+
+    try:
+        from app.services.vision_llm_router_service import VisionLLMRouterService
+        # initialize() returns without raising when no deployment is valid or Router creation fails, so the message below can print without a router
+        VisionLLMRouterService.initialize(vision_configs, router_settings)
+        print(
+            f"Info: Vision LLM Router initialized with {len(vision_configs)} models "
+            f"(strategy: {router_settings.get('routing_strategy', 'usage-based-routing')})"
+        )
+    except Exception as e:
+        print(f"Warning: Failed to initialize Vision LLM Router: {e}")
+
+
 class Config:
     # Check if ffmpeg is installed
     if not is_ffmpeg_installed():
@@ -335,6 +396,12 @@ class Config:
     # Router settings for Image Generation Auto mode
     IMAGE_GEN_ROUTER_SETTINGS = load_image_gen_router_settings()
 
+    # Global Vision LLM Configurations (optional)
+    GLOBAL_VISION_LLM_CONFIGS = load_global_vision_llm_configs()
+
+    # Router settings for Vision LLM Auto mode
+    VISION_LLM_ROUTER_SETTINGS = load_vision_llm_router_settings()
+
     # Chonkie Configuration | Edit this to your needs
     EMBEDDING_MODEL = os.getenv("EMBEDDING_MODEL")
     # Azure OpenAI credentials from environment variables

From bdbc4ce4a1cc4b6d4426e7537a7818ec19a5bfb3 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 19:04:03 +0200
Subject: [PATCH 181/202] Add vision LLM config CRUD and global configs routes

---
 .../app/routes/vision_llm_routes.py           | 267 ++++++++++++++++++
 1 file changed, 267 insertions(+)
 create mode 100644 surfsense_backend/app/routes/vision_llm_routes.py

diff --git a/surfsense_backend/app/routes/vision_llm_routes.py b/surfsense_backend/app/routes/vision_llm_routes.py
new file mode 100644
index 000000000..29d1a2757
--- /dev/null
+++ b/surfsense_backend/app/routes/vision_llm_routes.py
@@ -0,0 +1,267 @@
+import logging
+
+from fastapi import APIRouter, Depends, HTTPException
+from sqlalchemy import select
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from app.config import config
+from app.db import (
+    Permission,
+    User,
+    VisionLLMConfig,
+    get_async_session,
+)
+from app.schemas import (
+    GlobalVisionLLMConfigRead,
+    VisionLLMConfigCreate,
+    VisionLLMConfigRead,
+    VisionLLMConfigUpdate,
+)
+from app.users import current_active_user
+from app.utils.rbac import check_permission
+
+router = APIRouter()
+logger = logging.getLogger(__name__)
+
+
+# =============================================================================
+# Global Vision LLM Configs (from YAML)
+# =============================================================================
+
+
+@router.get(
+    "/global-vision-llm-configs",
+    response_model=list[GlobalVisionLLMConfigRead],
+)
+async def get_global_vision_llm_configs(
+    user: User = Depends(current_active_user),
+):
+    """List the YAML-defined vision LLM configs, preceded by a synthetic "Auto" entry when at least one exists."""
+    try:
+        global_configs = config.GLOBAL_VISION_LLM_CONFIGS
+        safe_configs = []
+        if global_configs and len(global_configs) > 0:
+            safe_configs.append(
+                {
+                    "id": 0,
+                    "name": "Auto (Fastest)",
+                    "description": "Automatically routes across available vision LLM providers.",
+                    "provider": "AUTO",
+                    "custom_provider": None,
+                    "model_name": "auto",
+                    "api_base": None,
+                    "api_version": None,
+                    "litellm_params": {},
+                    "is_global": True,
+                    "is_auto_mode": True,
+                }
+            )
+        # Copy an explicit set of fields from each config; api_key is not among them
+        for cfg in global_configs:
+            safe_configs.append(
+                {
+                    "id": cfg.get("id"),
+                    "name": cfg.get("name"),
+                    "description": cfg.get("description"),
+                    "provider": cfg.get("provider"),
+                    "custom_provider": cfg.get("custom_provider"),
+                    "model_name": cfg.get("model_name"),
+                    "api_base": cfg.get("api_base") or None,
+                    "api_version": cfg.get("api_version") or None,
+                    "litellm_params": cfg.get("litellm_params", {}),
+                    "is_global": True,
+                }
+            )
+
+        return safe_configs
+    except Exception as e:
+        logger.exception("Failed to fetch global vision LLM configs")
+        raise HTTPException(
+            status_code=500, detail=f"Failed to fetch configs: {e!s}"
+        ) from e
+
+
+# =============================================================================
+# VisionLLMConfig CRUD
+# =============================================================================
+
+
+@router.post("/vision-llm-configs", response_model=VisionLLMConfigRead)
+async def create_vision_llm_config(
+    config_data: VisionLLMConfigCreate,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """Create a vision LLM config in the given search space, owned by the calling user."""
+    try:
+        await check_permission(
+            session,
+            user,
+            config_data.search_space_id,
+            Permission.VISION_CONFIGS_CREATE.value,
+            "You don't have permission to create vision LLM configs in this search space",
+        )
+
+        db_config = VisionLLMConfig(**config_data.model_dump(), user_id=user.id)
+        session.add(db_config)
+        await session.commit()
+        await session.refresh(db_config)
+        return db_config
+    except HTTPException:  # re-raised unchanged instead of being wrapped in a 500
+        raise
+    except Exception as e:
+        await session.rollback()
+        logger.exception("Failed to create VisionLLMConfig")
+        raise HTTPException(
+            status_code=500, detail=f"Failed to create config: {e!s}"
+        ) from e
+
+
+@router.get("/vision-llm-configs", response_model=list[VisionLLMConfigRead])
+async def list_vision_llm_configs(
+    search_space_id: int,
+    skip: int = 0,
+    limit: int = 100,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """List a search space's vision LLM configs, newest first, paginated by skip/limit."""
+    try:
+        await check_permission(
+            session,
+            user,
+            search_space_id,
+            Permission.VISION_CONFIGS_READ.value,
+            "You don't have permission to view vision LLM configs in this search space",
+        )
+
+        result = await session.execute(
+            select(VisionLLMConfig)
+            .filter(VisionLLMConfig.search_space_id == search_space_id)
+            .order_by(VisionLLMConfig.created_at.desc())
+            .offset(skip)
+            .limit(limit)
+        )
+        return result.scalars().all()
+    except HTTPException:  # re-raised unchanged instead of being wrapped in a 500
+        raise
+    except Exception as e:
+        logger.exception("Failed to list VisionLLMConfigs")
+        raise HTTPException(
+            status_code=500, detail=f"Failed to fetch configs: {e!s}"
+        ) from e
+
+
+@router.get(
+    "/vision-llm-configs/{config_id}", response_model=VisionLLMConfigRead
+)
+async def get_vision_llm_config(
+    config_id: int,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """Fetch one vision LLM config by ID; responds 404 when no row has that ID."""
+    try:
+        result = await session.execute(
+            select(VisionLLMConfig).filter(VisionLLMConfig.id == config_id)
+        )
+        db_config = result.scalars().first()
+        if not db_config:
+            raise HTTPException(status_code=404, detail="Config not found")
+        # The permission check runs after the lookup, against the search space that owns the row
+        await check_permission(
+            session,
+            user,
+            db_config.search_space_id,
+            Permission.VISION_CONFIGS_READ.value,
+            "You don't have permission to view vision LLM configs in this search space",
+        )
+        return db_config
+    except HTTPException:  # re-raised unchanged instead of being wrapped in a 500
+        raise
+    except Exception as e:
+        logger.exception("Failed to get VisionLLMConfig")
+        raise HTTPException(
+            status_code=500, detail=f"Failed to fetch config: {e!s}"
+        ) from e
+
+
+@router.put(
+    "/vision-llm-configs/{config_id}", response_model=VisionLLMConfigRead
+)
+async def update_vision_llm_config(
+    config_id: int,
+    update_data: VisionLLMConfigUpdate,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """Apply a partial update to one vision LLM config; responds 404 when no row has that ID."""
+    try:
+        result = await session.execute(
+            select(VisionLLMConfig).filter(VisionLLMConfig.id == config_id)
+        )
+        db_config = result.scalars().first()
+        if not db_config:
+            raise HTTPException(status_code=404, detail="Config not found")
+        # NOTE(review): updates are gated by the CREATE permission; no separate update permission is visible here — confirm
+        await check_permission(
+            session,
+            user,
+            db_config.search_space_id,
+            Permission.VISION_CONFIGS_CREATE.value,
+            "You don't have permission to update vision LLM configs in this search space",
+        )
+        # Only fields the client actually sent are written (exclude_unset); an explicit null is written as None
+        for key, value in update_data.model_dump(exclude_unset=True).items():
+            setattr(db_config, key, value)
+
+        await session.commit()
+        await session.refresh(db_config)
+        return db_config
+    except HTTPException:  # re-raised unchanged instead of being wrapped in a 500
+        raise
+    except Exception as e:
+        await session.rollback()
+        logger.exception("Failed to update VisionLLMConfig")
+        raise HTTPException(
+            status_code=500, detail=f"Failed to update config: {e!s}"
+        ) from e
+
+
+@router.delete("/vision-llm-configs/{config_id}", response_model=dict)
+async def delete_vision_llm_config(
+    config_id: int,
+    session: AsyncSession = Depends(get_async_session),
+    user: User = Depends(current_active_user),
+):
+    """Delete one vision LLM config by ID and return a confirmation dict; responds 404 when no row has that ID."""
+    try:
+        result = await session.execute(
+            select(VisionLLMConfig).filter(VisionLLMConfig.id == config_id)
+        )
+        db_config = result.scalars().first()
+        if not db_config:
+            raise HTTPException(status_code=404, detail="Config not found")
+
+        await check_permission(
+            session,
+            user,
+            db_config.search_space_id,
+            Permission.VISION_CONFIGS_DELETE.value,
+            "You don't have permission to delete vision LLM configs in this search space",
+        )
+
+        await session.delete(db_config)
+        await session.commit()
+        return {
+            "message": "Vision LLM config deleted successfully",
+            "id": config_id,
+        }
+    except HTTPException:  # re-raised unchanged instead of being wrapped in a 500
+        raise
+    except Exception as e:
+        await session.rollback()
+        logger.exception("Failed to delete VisionLLMConfig")
+        raise HTTPException(
+            status_code=500, detail=f"Failed to delete config: {e!s}"
+        ) from e

From 43b8862ac77b3351cd068d762563ff985568447e Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 19:16:51 +0200
Subject: [PATCH 182/202] Update get_vision_llm to use dedicated
 VisionLLMConfig system

---
 surfsense_backend/app/services/llm_service.py | 119 +++++++++++++++++-
 1 file changed, 113 insertions(+), 6 deletions(-)

diff --git a/surfsense_backend/app/services/llm_service.py b/surfsense_backend/app/services/llm_service.py
index 7c0f9e7e3..e531aeabb 100644
--- a/surfsense_backend/app/services/llm_service.py
+++ b/surfsense_backend/app/services/llm_service.py
@@ -32,7 +32,6 @@ logger = logging.getLogger(__name__)
 class LLMRole:
     AGENT = "agent"  # For agent/chat operations
     DOCUMENT_SUMMARY = "document_summary"  # For document summarization
-    VISION = "vision"  # For vision/screenshot analysis
 
 
 def get_global_llm_config(llm_config_id: int) -> dict | None:
@@ -188,7 +187,7 @@ async def get_search_space_llm_instance(
     Args:
         session: Database session
         search_space_id: Search Space ID
-        role: LLM role ('agent', 'document_summary', or 'vision')
+        role: LLM role ('agent' or 'document_summary')
 
     Returns:
         ChatLiteLLM or ChatLiteLLMRouter instance, or None if not found
@@ -210,8 +209,6 @@ async def get_search_space_llm_instance(
             llm_config_id = search_space.agent_llm_id
         elif role == LLMRole.DOCUMENT_SUMMARY:
             llm_config_id = search_space.document_summary_llm_id
-        elif role == LLMRole.VISION:
-            llm_config_id = search_space.vision_llm_id
         else:
             logger.error(f"Invalid LLM role: {role}")
             return None
@@ -411,8 +408,118 @@ async def get_document_summary_llm(
 async def get_vision_llm(
     session: AsyncSession, search_space_id: int
 ) -> ChatLiteLLM | ChatLiteLLMRouter | None:
-    """Get the search space's vision LLM instance for screenshot analysis."""
-    return await get_search_space_llm_instance(session, search_space_id, LLMRole.VISION)
+    """Get the search space's vision LLM instance for screenshot analysis.
+
+    Resolves from the dedicated VisionLLMConfig system:
+    - Auto mode (ID 0): VisionLLMRouterService
+    - Global (negative ID): YAML configs
+    - DB (positive ID): VisionLLMConfig table
+    """
+    from app.db import VisionLLMConfig
+    from app.services.vision_llm_router_service import (
+        VISION_PROVIDER_MAP,
+        VisionLLMRouterService,
+        get_global_vision_llm_config,
+        is_vision_auto_mode,
+    )
+
+    try:
+        result = await session.execute(
+            select(SearchSpace).where(SearchSpace.id == search_space_id)
+        )
+        search_space = result.scalars().first()
+        if not search_space:
+            logger.error(f"Search space {search_space_id} not found")
+            return None
+
+        config_id = search_space.vision_llm_config_id
+        if config_id is None:
+            logger.error(
+                f"No vision LLM configured for search space {search_space_id}"
+            )
+            return None
+        # ID 0: Auto mode, served by the shared router (which must already be initialized)
+        if is_vision_auto_mode(config_id):
+            if not VisionLLMRouterService.is_initialized():
+                logger.error(
+                    "Vision Auto mode requested but Vision LLM Router not initialized"
+                )
+                return None
+            try:
+                return ChatLiteLLMRouter(
+                    router=VisionLLMRouterService.get_router(),
+                    streaming=True,
+                )
+            except Exception as e:
+                logger.error(f"Failed to create vision ChatLiteLLMRouter: {e}")
+                return None
+        # Negative IDs: global configs looked up via get_global_vision_llm_config
+        if config_id < 0:
+            global_cfg = get_global_vision_llm_config(config_id)
+            if not global_cfg:
+                logger.error(f"Global vision LLM config {config_id} not found")
+                return None
+
+            if global_cfg.get("custom_provider"):
+                model_string = (
+                    f"{global_cfg['custom_provider']}/{global_cfg['model_name']}"
+                )
+            else:
+                prefix = VISION_PROVIDER_MAP.get(
+                    global_cfg["provider"].upper(),
+                    global_cfg["provider"].lower(),
+                )
+                model_string = f"{prefix}/{global_cfg['model_name']}"
+            # NOTE(review): api_version is not forwarded here, although _config_to_deployment forwards it for the router — confirm
+            litellm_kwargs = {
+                "model": model_string,
+                "api_key": global_cfg["api_key"],
+            }
+            if global_cfg.get("api_base"):
+                litellm_kwargs["api_base"] = global_cfg["api_base"]
+            if global_cfg.get("litellm_params"):
+                litellm_kwargs.update(global_cfg["litellm_params"])
+
+            return ChatLiteLLM(**litellm_kwargs)
+        # Remaining (positive) IDs: DB-backed config, which must belong to this search space
+        result = await session.execute(
+            select(VisionLLMConfig).where(
+                VisionLLMConfig.id == config_id,
+                VisionLLMConfig.search_space_id == search_space_id,
+            )
+        )
+        vision_cfg = result.scalars().first()
+        if not vision_cfg:
+            logger.error(
+                f"Vision LLM config {config_id} not found in search space {search_space_id}"
+            )
+            return None
+
+        if vision_cfg.custom_provider:
+            model_string = f"{vision_cfg.custom_provider}/{vision_cfg.model_name}"
+        else:
+            prefix = VISION_PROVIDER_MAP.get(
+                vision_cfg.provider.value.upper(),
+                vision_cfg.provider.value.lower(),
+            )
+            model_string = f"{prefix}/{vision_cfg.model_name}"
+        # NOTE(review): as in the global branch, vision_cfg.api_version is not forwarded — confirm
+        litellm_kwargs = {
+            "model": model_string,
+            "api_key": vision_cfg.api_key,
+        }
+        if vision_cfg.api_base:
+            litellm_kwargs["api_base"] = vision_cfg.api_base
+        if vision_cfg.litellm_params:
+            litellm_kwargs.update(vision_cfg.litellm_params)
+
+        return ChatLiteLLM(**litellm_kwargs)
+
+    except Exception as e:
+        logger.error(
+            f"Error getting vision LLM for search space {search_space_id}: {e!s}"
+        )
+        return None
 
 
 # Backward-compatible alias (LLM preferences are now per-search-space, not per-user)

From 6d85821ae95836978f63ccf18ddbfd693e2dd956 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 19:20:28 +0200
Subject: [PATCH 183/202] Wire vision_llm_config_id in preferences, register
 vision LLM router

---
 surfsense_backend/app/routes/__init__.py      |  2 +
 .../app/routes/search_spaces_routes.py        | 74 +++++++++++++++++--
 .../app/schemas/new_llm_config.py             | 10 +--
 3 files changed, 75 insertions(+), 11 deletions(-)

diff --git a/surfsense_backend/app/routes/__init__.py b/surfsense_backend/app/routes/__init__.py
index 22631bc1d..02367606b 100644
--- a/surfsense_backend/app/routes/__init__.py
+++ b/surfsense_backend/app/routes/__init__.py
@@ -49,6 +49,7 @@ from .stripe_routes import router as stripe_router
 from .surfsense_docs_routes import router as surfsense_docs_router
 from .teams_add_connector_route import router as teams_add_connector_router
 from .video_presentations_routes import router as video_presentations_router
+from .vision_llm_routes import router as vision_llm_router
 from .youtube_routes import router as youtube_router
 
 router = APIRouter()
@@ -68,6 +69,7 @@ router.include_router(
 )  # Video presentation status and streaming
 router.include_router(reports_router)  # Report CRUD and multi-format export
 router.include_router(image_generation_router)  # Image generation via litellm
+router.include_router(vision_llm_router)  # Vision LLM configs for screenshot analysis
 router.include_router(search_source_connectors_router)
 router.include_router(google_calendar_add_connector_router)
 router.include_router(google_gmail_add_connector_router)
diff --git a/surfsense_backend/app/routes/search_spaces_routes.py b/surfsense_backend/app/routes/search_spaces_routes.py
index c4f1ab035..78be97aa1 100644
--- a/surfsense_backend/app/routes/search_spaces_routes.py
+++ b/surfsense_backend/app/routes/search_spaces_routes.py
@@ -14,6 +14,7 @@ from app.db import (
     SearchSpaceMembership,
     SearchSpaceRole,
     User,
+    VisionLLMConfig,
     get_async_session,
     get_default_roles_config,
 )
@@ -483,6 +484,63 @@ async def _get_image_gen_config_by_id(
     return None
 
 
+async def _get_vision_llm_config_by_id(
+    session: AsyncSession, config_id: int | None
+) -> dict | None:  # Resolve a vision LLM config ID to a plain dict; None when unset or not found.
+    if config_id is None:  # no vision config selected
+        return None
+
+    if config_id == 0:  # ID 0 is answered with a fixed "Auto" placeholder; nothing is looked up
+        return {
+            "id": 0,
+            "name": "Auto (Fastest)",
+            "description": "Automatically routes requests across available vision LLM providers",
+            "provider": "AUTO",
+            "model_name": "auto",
+            "is_global": True,
+            "is_auto_mode": True,
+        }
+
+    if config_id < 0:  # negative IDs are searched in config.GLOBAL_VISION_LLM_CONFIGS
+        for cfg in config.GLOBAL_VISION_LLM_CONFIGS:
+            if cfg.get("id") == config_id:
+                return {
+                    "id": cfg.get("id"),
+                    "name": cfg.get("name"),
+                    "description": cfg.get("description"),
+                    "provider": cfg.get("provider"),
+                    "custom_provider": cfg.get("custom_provider"),
+                    "model_name": cfg.get("model_name"),
+                    "api_base": cfg.get("api_base") or None,  # falsy values (e.g. "") become None
+                    "api_version": cfg.get("api_version") or None,  # same normalization
+                    "litellm_params": cfg.get("litellm_params", {}),
+                    "is_global": True,
+                }
+        return None  # negative ID with no matching global entry
+
+    result = await session.execute(  # positive IDs are rows of the VisionLLMConfig table
+        select(VisionLLMConfig).filter(VisionLLMConfig.id == config_id)
+    )
+    db_config = result.scalars().first()
+    if db_config:
+        return {
+            "id": db_config.id,
+            "name": db_config.name,
+            "description": db_config.description,
+            "provider": db_config.provider.value if db_config.provider else None,
+            "custom_provider": db_config.custom_provider,
+            "model_name": db_config.model_name,
+            "api_base": db_config.api_base,
+            "api_version": db_config.api_version,
+            "litellm_params": db_config.litellm_params or {},
+            "created_at": db_config.created_at.isoformat()
+            if db_config.created_at
+            else None,
+            "search_space_id": db_config.search_space_id,
+        }
+    return None  # no row with this ID
+
+
 @router.get(
     "/search-spaces/{search_space_id}/llm-preferences",
     response_model=LLMPreferencesRead,
@@ -522,17 +580,19 @@ async def get_llm_preferences(
         image_generation_config = await _get_image_gen_config_by_id(
             session, search_space.image_generation_config_id
         )
-        vision_llm = await _get_llm_config_by_id(session, search_space.vision_llm_id)
+        vision_llm_config = await _get_vision_llm_config_by_id(
+            session, search_space.vision_llm_config_id
+        )
 
         return LLMPreferencesRead(
             agent_llm_id=search_space.agent_llm_id,
             document_summary_llm_id=search_space.document_summary_llm_id,
             image_generation_config_id=search_space.image_generation_config_id,
-            vision_llm_id=search_space.vision_llm_id,
+            vision_llm_config_id=search_space.vision_llm_config_id,
             agent_llm=agent_llm,
             document_summary_llm=document_summary_llm,
             image_generation_config=image_generation_config,
-            vision_llm=vision_llm,
+            vision_llm_config=vision_llm_config,
         )
 
     except HTTPException:
@@ -592,17 +652,19 @@ async def update_llm_preferences(
         image_generation_config = await _get_image_gen_config_by_id(
             session, search_space.image_generation_config_id
         )
-        vision_llm = await _get_llm_config_by_id(session, search_space.vision_llm_id)
+        vision_llm_config = await _get_vision_llm_config_by_id(
+            session, search_space.vision_llm_config_id
+        )
 
         return LLMPreferencesRead(
             agent_llm_id=search_space.agent_llm_id,
             document_summary_llm_id=search_space.document_summary_llm_id,
             image_generation_config_id=search_space.image_generation_config_id,
-            vision_llm_id=search_space.vision_llm_id,
+            vision_llm_config_id=search_space.vision_llm_config_id,
             agent_llm=agent_llm,
             document_summary_llm=document_summary_llm,
             image_generation_config=image_generation_config,
-            vision_llm=vision_llm,
+            vision_llm_config=vision_llm_config,
         )
 
     except HTTPException:
diff --git a/surfsense_backend/app/schemas/new_llm_config.py b/surfsense_backend/app/schemas/new_llm_config.py
index 6c76ca512..a466f2c99 100644
--- a/surfsense_backend/app/schemas/new_llm_config.py
+++ b/surfsense_backend/app/schemas/new_llm_config.py
@@ -182,8 +182,8 @@ class LLMPreferencesRead(BaseModel):
     image_generation_config_id: int | None = Field(
         None, description="ID of the image generation config to use"
     )
-    vision_llm_id: int | None = Field(
-        None, description="ID of the LLM config to use for vision/screenshot analysis"
+    vision_llm_config_id: int | None = Field(
+        None, description="ID of the vision LLM config to use for vision/screenshot analysis"
     )
     agent_llm: dict[str, Any] | None = Field(
         None, description="Full config for agent LLM"
@@ -194,7 +194,7 @@ class LLMPreferencesRead(BaseModel):
     image_generation_config: dict[str, Any] | None = Field(
         None, description="Full config for image generation"
     )
-    vision_llm: dict[str, Any] | None = Field(
+    vision_llm_config: dict[str, Any] | None = Field(
         None, description="Full config for vision LLM"
     )
 
@@ -213,6 +213,6 @@ class LLMPreferencesUpdate(BaseModel):
     image_generation_config_id: int | None = Field(
         None, description="ID of the image generation config to use"
     )
-    vision_llm_id: int | None = Field(
-        None, description="ID of the LLM config to use for vision/screenshot analysis"
+    vision_llm_config_id: int | None = Field(
+        None, description="ID of the vision LLM config to use for vision/screenshot analysis"
     )

From 4a675b64f4b066a6148126df0121ccfbdc9dbe0a Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 19:21:10 +0200
Subject: [PATCH 184/202] Initialize vision LLM router at app and celery
 startup

---
 surfsense_backend/app/app.py        | 8 +++++++-
 surfsense_backend/app/celery_app.py | 7 ++++++-
 2 files changed, 13 insertions(+), 2 deletions(-)

diff --git a/surfsense_backend/app/app.py b/surfsense_backend/app/app.py
index bba2f1f3a..7b2b421ac 100644
--- a/surfsense_backend/app/app.py
+++ b/surfsense_backend/app/app.py
@@ -25,7 +25,12 @@ from app.agents.new_chat.checkpointer import (
     close_checkpointer,
     setup_checkpointer_tables,
 )
-from app.config import config, initialize_image_gen_router, initialize_llm_router
+from app.config import (
+    config,
+    initialize_image_gen_router,
+    initialize_llm_router,
+    initialize_vision_llm_router,
+)
 from app.db import User, create_db_and_tables, get_async_session
 from app.routes import router as crud_router
 from app.routes.auth_routes import router as auth_router
@@ -223,6 +228,7 @@ async def lifespan(app: FastAPI):
     await setup_checkpointer_tables()
     initialize_llm_router()
     initialize_image_gen_router()
+    initialize_vision_llm_router()
     try:
         await asyncio.wait_for(seed_surfsense_docs(), timeout=120)
     except TimeoutError:
diff --git a/surfsense_backend/app/celery_app.py b/surfsense_backend/app/celery_app.py
index 684da6a13..bf2fdcb39 100644
--- a/surfsense_backend/app/celery_app.py
+++ b/surfsense_backend/app/celery_app.py
@@ -18,10 +18,15 @@ def init_worker(**kwargs):
     This ensures the Auto mode (LiteLLM Router) is available for background tasks
     like document summarization and image generation.
     """
-    from app.config import initialize_image_gen_router, initialize_llm_router
+    from app.config import (
+        initialize_image_gen_router,
+        initialize_llm_router,
+        initialize_vision_llm_router,
+    )
 
     initialize_llm_router()
     initialize_image_gen_router()
+    initialize_vision_llm_router()
 
 
 # Get Celery configuration from environment

From 3369b8a83210e9afc62f9c0db91d87a13fb0c478 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 19:24:43 +0200
Subject: [PATCH 185/202] Add frontend vision LLM config types, API, atoms, and
 role manager wiring

---
 .../vision-llm-config-mutation.atoms.ts       |  84 +++++++++++++++
 .../vision-llm-config-query.atoms.ts          |  27 +++++
 .../components/settings/llm-role-manager.tsx  |  66 +++++++++---
 .../contracts/enums/vision-providers.ts       | 102 ++++++++++++++++++
 .../contracts/types/new-llm-config.types.ts   |  99 +++++++++++++++--
 .../lib/apis/vision-llm-config-api.service.ts |  58 ++++++++++
 surfsense_web/lib/query-client/cache-keys.ts  |   5 +
 7 files changed, 421 insertions(+), 20 deletions(-)
 create mode 100644 surfsense_web/atoms/vision-llm-config/vision-llm-config-mutation.atoms.ts
 create mode 100644 surfsense_web/atoms/vision-llm-config/vision-llm-config-query.atoms.ts
 create mode 100644 surfsense_web/contracts/enums/vision-providers.ts
 create mode 100644 surfsense_web/lib/apis/vision-llm-config-api.service.ts

diff --git a/surfsense_web/atoms/vision-llm-config/vision-llm-config-mutation.atoms.ts b/surfsense_web/atoms/vision-llm-config/vision-llm-config-mutation.atoms.ts
new file mode 100644
index 000000000..b1aa01c6b
--- /dev/null
+++ b/surfsense_web/atoms/vision-llm-config/vision-llm-config-mutation.atoms.ts
@@ -0,0 +1,84 @@
+import { atomWithMutation } from "jotai-tanstack-query";
+import { toast } from "sonner";
+import type {
+	CreateVisionLLMConfigRequest,
+	CreateVisionLLMConfigResponse,
+	DeleteVisionLLMConfigResponse,
+	GetVisionLLMConfigsResponse,
+	UpdateVisionLLMConfigRequest,
+	UpdateVisionLLMConfigResponse,
+} from "@/contracts/types/new-llm-config.types";
+import { visionLLMConfigApiService } from "@/lib/apis/vision-llm-config-api.service";
+import { cacheKeys } from "@/lib/query-client/cache-keys";
+import { queryClient } from "@/lib/query-client/client";
+import { activeSearchSpaceIdAtom } from "../search-spaces/search-space-query.atoms";
+
+/** Creates a vision LLM config, toasts the outcome, and invalidates the active space's list. */
+export const createVisionLLMConfigMutationAtom = atomWithMutation((get) => {
+	const activeSpaceId = get(activeSearchSpaceIdAtom);
+
+	return {
+		mutationKey: ["vision-llm-configs", "create"],
+		enabled: Boolean(activeSpaceId),
+		mutationFn: async (input: CreateVisionLLMConfigRequest) =>
+			visionLLMConfigApiService.createConfig(input),
+		onSuccess: (_res: CreateVisionLLMConfigResponse, input: CreateVisionLLMConfigRequest) => {
+			const listKey = cacheKeys.visionLLMConfigs.all(Number(activeSpaceId));
+			toast.success(`${input.name} created`);
+			// Mark the cached list stale so the new config shows up.
+			queryClient.invalidateQueries({ queryKey: listKey });
+		},
+		onError: (failure: Error) => {
+			toast.error(failure.message || "Failed to create vision model");
+		},
+	};
+});
+
+/** Updates a vision LLM config, then invalidates both the list and that config's detail entry. */
+export const updateVisionLLMConfigMutationAtom = atomWithMutation((get) => {
+	const activeSpaceId = get(activeSearchSpaceIdAtom);
+	return {
+		mutationKey: ["vision-llm-configs", "update"],
+		enabled: Boolean(activeSpaceId),
+		mutationFn: async (input: UpdateVisionLLMConfigRequest) =>
+			visionLLMConfigApiService.updateConfig(input),
+		onSuccess: (_res: UpdateVisionLLMConfigResponse, input: UpdateVisionLLMConfigRequest) => {
+			const label = input.data.name ?? "Configuration";
+			toast.success(`${label} updated`);
+			// Invalidate the list first, then the per-config detail entry.
+			const staleKeys = [
+				cacheKeys.visionLLMConfigs.all(Number(activeSpaceId)),
+				cacheKeys.visionLLMConfigs.byId(input.id),
+			];
+			for (const queryKey of staleKeys) queryClient.invalidateQueries({ queryKey });
+		},
+		onError: (failure: Error) => {
+			toast.error(failure.message || "Failed to update vision model");
+		},
+	};
+});
+
+/** Deletes a vision LLM config by id and removes it from the cached list for the active space. */
+export const deleteVisionLLMConfigMutationAtom = atomWithMutation((get) => {
+	const activeSpaceId = get(activeSearchSpaceIdAtom);
+
+	return {
+		mutationKey: ["vision-llm-configs", "delete"],
+		enabled: Boolean(activeSpaceId),
+		mutationFn: async (target: { id: number; name: string }) =>
+			visionLLMConfigApiService.deleteConfig(target.id),
+		onSuccess: (_res: DeleteVisionLLMConfigResponse, target: { id: number; name: string }) => {
+			toast.success(`${target.name} deleted`);
+			// Edit the cached list in place rather than invalidating it;
+			// when nothing is cached yet the value is passed through untouched.
+			queryClient.setQueryData(
+				cacheKeys.visionLLMConfigs.all(Number(activeSpaceId)),
+				(cached: GetVisionLLMConfigsResponse | undefined) =>
+					cached ? cached.filter((entry) => entry.id !== target.id) : cached
+			);
+		},
+		onError: (failure: Error) => {
+			toast.error(failure.message || "Failed to delete vision model");
+		},
+	};
+});
diff --git a/surfsense_web/atoms/vision-llm-config/vision-llm-config-query.atoms.ts b/surfsense_web/atoms/vision-llm-config/vision-llm-config-query.atoms.ts
new file mode 100644
index 000000000..53264fb24
--- /dev/null
+++ b/surfsense_web/atoms/vision-llm-config/vision-llm-config-query.atoms.ts
@@ -0,0 +1,27 @@
+import { atomWithQuery } from "jotai-tanstack-query";
+import { visionLLMConfigApiService } from "@/lib/apis/vision-llm-config-api.service";
+import { cacheKeys } from "@/lib/query-client/cache-keys";
+import { activeSearchSpaceIdAtom } from "../search-spaces/search-space-query.atoms";
+
+/** Query atom for the active search space's vision LLM configs; disabled until a space is set. */
+export const visionLLMConfigsAtom = atomWithQuery((get) => {
+	const activeSpaceId = get(activeSearchSpaceIdAtom);
+	const numericSpaceId = Number(activeSpaceId);
+
+	return {
+		queryKey: cacheKeys.visionLLMConfigs.all(numericSpaceId),
+		enabled: Boolean(activeSpaceId),
+		staleTime: 5 * 60 * 1000, // five minutes
+		queryFn: async () => visionLLMConfigApiService.getConfigs(numericSpaceId),
+	};
+});
+
+/**
+ * Query atom for the global vision LLM configs.
+ * Takes no search-space input, so it has no `enabled` gate.
+ */
+export const globalVisionLLMConfigsAtom = atomWithQuery(() => ({
+	queryKey: cacheKeys.visionLLMConfigs.global(),
+	staleTime: 10 * 60 * 1000, // ten minutes
+	queryFn: async () => visionLLMConfigApiService.getGlobalConfigs(),
+}));
diff --git a/surfsense_web/components/settings/llm-role-manager.tsx b/surfsense_web/components/settings/llm-role-manager.tsx
index 386845d7d..995159d58 100644
--- a/surfsense_web/components/settings/llm-role-manager.tsx
+++ b/surfsense_web/components/settings/llm-role-manager.tsx
@@ -24,6 +24,10 @@ import {
 	llmPreferencesAtom,
 	newLLMConfigsAtom,
 } from "@/atoms/new-llm-config/new-llm-config-query.atoms";
+import {
+	globalVisionLLMConfigsAtom,
+	visionLLMConfigsAtom,
+} from "@/atoms/vision-llm-config/vision-llm-config-query.atoms";
 import { Alert, AlertDescription } from "@/components/ui/alert";
 import { Badge } from "@/components/ui/badge";
 import { Button } from "@/components/ui/button";
@@ -77,8 +81,8 @@ const ROLE_DESCRIPTIONS = {
 		description: "Vision-capable model for screenshot analysis and context extraction",
 		color: "text-amber-600 dark:text-amber-400",
 		bgColor: "bg-amber-500/10",
-		prefKey: "vision_llm_id" as const,
-		configType: "llm" as const,
+		prefKey: "vision_llm_config_id" as const,
+		configType: "vision" as const,
 	},
 };
 
@@ -112,6 +116,18 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 		error: globalImageConfigsError,
 	} = useAtomValue(globalImageGenConfigsAtom);
 
+	// Vision LLM configs
+	const {
+		data: userVisionConfigs = [],
+		isFetching: visionConfigsLoading,
+		error: visionConfigsError,
+	} = useAtomValue(visionLLMConfigsAtom);
+	const {
+		data: globalVisionConfigs = [],
+		isFetching: globalVisionConfigsLoading,
+		error: globalVisionConfigsError,
+	} = useAtomValue(globalVisionLLMConfigsAtom);
+
 	// Preferences
 	const {
 		data: preferences = {},
@@ -125,7 +141,7 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 		agent_llm_id: preferences.agent_llm_id ?? "",
 		document_summary_llm_id: preferences.document_summary_llm_id ?? "",
 		image_generation_config_id: preferences.image_generation_config_id ?? "",
-		vision_llm_id: preferences.vision_llm_id ?? "",
+		vision_llm_config_id: preferences.vision_llm_config_id ?? "",
 	}));
 
 	const [savingRole, setSavingRole] = useState<string | null>(null);
@@ -137,14 +153,14 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 				agent_llm_id: preferences.agent_llm_id ?? "",
 				document_summary_llm_id: preferences.document_summary_llm_id ?? "",
 				image_generation_config_id: preferences.image_generation_config_id ?? "",
-				vision_llm_id: preferences.vision_llm_id ?? "",
+				vision_llm_config_id: preferences.vision_llm_config_id ?? "",
 			});
 		}
 	}, [
 		preferences?.agent_llm_id,
 		preferences?.document_summary_llm_id,
 		preferences?.image_generation_config_id,
-		preferences?.vision_llm_id,
+		preferences?.vision_llm_config_id,
 	]);
 
 	const handleRoleAssignment = useCallback(
@@ -181,6 +197,14 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 		...(userImageConfigs ?? []).filter((config) => config.id && config.id.toString().trim() !== ""),
 	];
 
+	// Combine global and custom vision LLM configs
+	const allVisionConfigs = [
+		...globalVisionConfigs.map((config) => ({ ...config, is_global: true })),
+		...(userVisionConfigs ?? []).filter(
+			(config) => config.id && config.id.toString().trim() !== ""
+		),
+	];
+
 	const isAssignmentComplete =
 		allLLMConfigs.some((c) => c.id === assignments.agent_llm_id) &&
 		allLLMConfigs.some((c) => c.id === assignments.document_summary_llm_id) &&
@@ -191,13 +215,17 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 		preferencesLoading ||
 		globalConfigsLoading ||
 		imageConfigsLoading ||
-		globalImageConfigsLoading;
+		globalImageConfigsLoading ||
+		visionConfigsLoading ||
+		globalVisionConfigsLoading;
 	const hasError =
 		configsError ||
 		preferencesError ||
 		globalConfigsError ||
 		imageConfigsError ||
-		globalImageConfigsError;
+		globalImageConfigsError ||
+		visionConfigsError ||
+		globalVisionConfigsError;
 	const hasAnyConfigs = allLLMConfigs.length > 0 || allImageConfigs.length > 0;
 
 	return (
@@ -291,15 +319,27 @@ export function LLMRoleManager({ searchSpaceId }: LLMRoleManagerProps) {
 				<div className="grid gap-4 grid-cols-1 lg:grid-cols-2">
 					{Object.entries(ROLE_DESCRIPTIONS).map(([key, role]) => {
 						const IconComponent = role.icon;
-						const isImageRole = role.configType === "image";
 						const currentAssignment = assignments[role.prefKey as keyof typeof assignments];
 
 						// Pick the right config lists based on role type
-						const roleGlobalConfigs = isImageRole ? globalImageConfigs : globalConfigs;
-						const roleUserConfigs = isImageRole
-							? (userImageConfigs ?? []).filter((c) => c.id && c.id.toString().trim() !== "")
-							: newLLMConfigs.filter((c) => c.id && c.id.toString().trim() !== "");
-						const roleAllConfigs = isImageRole ? allImageConfigs : allLLMConfigs;
+						const roleGlobalConfigs =
+							role.configType === "image"
+								? globalImageConfigs
+								: role.configType === "vision"
+									? globalVisionConfigs
+									: globalConfigs;
+						const roleUserConfigs =
+							role.configType === "image"
+								? (userImageConfigs ?? []).filter((c) => c.id && c.id.toString().trim() !== "")
+								: role.configType === "vision"
+									? (userVisionConfigs ?? []).filter((c) => c.id && c.id.toString().trim() !== "")
+									: newLLMConfigs.filter((c) => c.id && c.id.toString().trim() !== "");
+						const roleAllConfigs =
+							role.configType === "image"
+								? allImageConfigs
+								: role.configType === "vision"
+									? allVisionConfigs
+									: allLLMConfigs;
 
 						const assignedConfig = roleAllConfigs.find((config) => config.id === currentAssignment);
 						const isAssigned = !!assignedConfig;
diff --git a/surfsense_web/contracts/enums/vision-providers.ts b/surfsense_web/contracts/enums/vision-providers.ts
new file mode 100644
index 000000000..260b03585
--- /dev/null
+++ b/surfsense_web/contracts/enums/vision-providers.ts
@@ -0,0 +1,102 @@
+export interface VisionProviderInfo { // Display metadata for one entry of VISION_PROVIDERS.
+	value: string; // provider identifier, e.g. "OPENAI"
+	label: string; // human-readable provider name, e.g. "OpenAI"
+	example: string; // sample model name(s), e.g. "gpt-4o, gpt-4o-mini"
+	description: string; // one-line summary of the provider's vision models
+	apiBase?: string; // base URL; only some entries set it (Ollama, DeepSeek)
+}
+
+export const VISION_PROVIDERS: VisionProviderInfo[] = [
+	{
+		value: "OPENAI",
+		label: "OpenAI",
+		example: "gpt-4o, gpt-4o-mini",
+		description: "GPT-4o vision models",
+	},
+	{
+		value: "ANTHROPIC",
+		label: "Anthropic",
+		example: "claude-sonnet-4-20250514",
+		description: "Claude vision models",
+	},
+	{
+		value: "GOOGLE",
+		label: "Google AI Studio",
+		example: "gemini-2.5-flash, gemini-2.0-flash",
+		description: "Gemini vision models",
+	},
+	{
+		value: "AZURE_OPENAI",
+		label: "Azure OpenAI",
+		example: "azure/gpt-4o",
+		description: "OpenAI vision models on Azure",
+	},
+	{
+		value: "VERTEX_AI",
+		label: "Google Vertex AI",
+		example: "vertex_ai/gemini-2.5-flash",
+		description: "Gemini vision models on Vertex AI",
+	},
+	{
+		value: "BEDROCK",
+		label: "AWS Bedrock",
+		example: "bedrock/anthropic.claude-sonnet-4-20250514-v1:0",
+		description: "Vision models on AWS Bedrock",
+	},
+	{
+		value: "XAI",
+		label: "xAI",
+		example: "grok-2-vision",
+		description: "Grok vision models",
+	},
+	{
+		value: "OPENROUTER",
+		label: "OpenRouter",
+		example: "openrouter/openai/gpt-4o",
+		description: "Vision models via OpenRouter",
+	},
+	{
+		value: "OLLAMA",
+		label: "Ollama",
+		example: "llava, bakllava",
+		description: "Local vision models via Ollama",
+		apiBase: "http://localhost:11434",
+	},
+	{
+		value: "GROQ",
+		label: "Groq",
+		example: "llama-4-scout-17b-16e-instruct",
+		description: "Vision models on Groq",
+	},
+	{
+		value: "TOGETHER_AI",
+		label: "Together AI",
+		example: "meta-llama/Llama-4-Scout-17B-16E-Instruct",
+		description: "Vision models on Together AI",
+	},
+	{
+		value: "FIREWORKS_AI",
+		label: "Fireworks AI",
+		example: "fireworks_ai/phi-3-vision-128k-instruct",
+		description: "Vision models on Fireworks AI",
+	},
+	{
+		value: "DEEPSEEK",
+		label: "DeepSeek",
+		example: "deepseek-chat",
+		description: "DeepSeek vision models",
+		apiBase: "https://api.deepseek.com",
+	},
+	{
+		value: "MISTRAL",
+		label: "Mistral",
+		example: "pixtral-large-latest",
+		description: "Pixtral vision models",
+	},
+	{
+		value: "CUSTOM",
+		label: "Custom Provider",
+		example: "custom/my-vision-model",
+		description: "Custom OpenAI-compatible vision endpoint",
+	},
+];
diff --git a/surfsense_web/contracts/types/new-llm-config.types.ts b/surfsense_web/contracts/types/new-llm-config.types.ts
index 02837cc73..6bef94bac 100644
--- a/surfsense_web/contracts/types/new-llm-config.types.ts
+++ b/surfsense_web/contracts/types/new-llm-config.types.ts
@@ -252,23 +252,99 @@ export const globalImageGenConfig = z.object({
 
 export const getGlobalImageGenConfigsResponse = z.array(globalImageGenConfig);
 
+// =============================================================================
+// Vision LLM Config (separate table for vision-capable models)
+// =============================================================================
+
+export const visionProviderEnum = z.enum([ // same 15 identifiers as the `value` fields in VISION_PROVIDERS
+	"OPENAI",
+	"ANTHROPIC",
+	"GOOGLE",
+	"AZURE_OPENAI",
+	"VERTEX_AI",
+	"BEDROCK",
+	"XAI",
+	"OPENROUTER",
+	"OLLAMA",
+	"GROQ",
+	"TOGETHER_AI",
+	"FIREWORKS_AI",
+	"DEEPSEEK",
+	"MISTRAL",
+	"CUSTOM",
+]);
+
+export type VisionProvider = z.infer<typeof visionProviderEnum>;
+
+export const visionLLMConfig = z.object({ // Vision LLM config record tied to a search space and a user.
+	id: z.number(),
+	name: z.string().max(100),
+	description: z.string().max(500).nullable().optional(),
+	provider: visionProviderEnum, // restricted to the enum values, unlike globalVisionLLMConfig.provider
+	custom_provider: z.string().max(100).nullable().optional(),
+	model_name: z.string().max(100),
+	api_key: z.string(), // required here; absent from globalVisionLLMConfig
+	api_base: z.string().max(500).nullable().optional(),
+	api_version: z.string().max(50).nullable().optional(),
+	litellm_params: z.record(z.string(), z.any()).nullable().optional(),
+	created_at: z.string(),
+	search_space_id: z.number(),
+	user_id: z.string(),
+});
+
+export const createVisionLLMConfigRequest = visionLLMConfig.omit({ // create payload: the full shape minus the fields below
+	id: true,
+	created_at: true,
+	user_id: true,
+}); // search_space_id is kept, so callers must supply it
+
+export const createVisionLLMConfigResponse = visionLLMConfig;
+
+export const getVisionLLMConfigsResponse = z.array(visionLLMConfig);
+
+export const updateVisionLLMConfigRequest = z.object({ // update payload: target id plus a partial patch
+	id: z.number(), // which config to update
+	data: visionLLMConfig
+		.omit({ id: true, created_at: true, search_space_id: true, user_id: true }) // not patchable via `data`
+		.partial(), // every remaining field is optional
+});
+
+export const updateVisionLLMConfigResponse = visionLLMConfig;
+
+export const deleteVisionLLMConfigResponse = z.object({
+	message: z.string(),
+	id: z.number(),
+});
+
+export const globalVisionLLMConfig = z.object({ // Global config shape: no api_key, search_space_id, user_id or created_at.
+	id: z.number(),
+	name: z.string(),
+	description: z.string().nullable().optional(),
+	provider: z.string(), // plain string, not visionProviderEnum
+	custom_provider: z.string().nullable().optional(),
+	model_name: z.string(),
+	api_base: z.string().nullable().optional(),
+	api_version: z.string().nullable().optional(),
+	litellm_params: z.record(z.string(), z.any()).nullable().optional(),
+	is_global: z.literal(true), // must be exactly true
+	is_auto_mode: z.boolean().optional().default(false), // parses to false when omitted
+});
+
+export const getGlobalVisionLLMConfigsResponse = z.array(globalVisionLLMConfig);
+
 // =============================================================================
 // LLM Preferences (Role Assignments)
 // =============================================================================
 
-/**
- * LLM Preferences schemas - for role assignments
- * image_generation uses image_generation_config_id (not llm_id)
- */
 export const llmPreferences = z.object({
 	agent_llm_id: z.union([z.number(), z.null()]).optional(),
 	document_summary_llm_id: z.union([z.number(), z.null()]).optional(),
 	image_generation_config_id: z.union([z.number(), z.null()]).optional(),
-	vision_llm_id: z.union([z.number(), z.null()]).optional(),
+	vision_llm_config_id: z.union([z.number(), z.null()]).optional(),
 	agent_llm: z.union([z.record(z.string(), z.unknown()), z.null()]).optional(),
 	document_summary_llm: z.union([z.record(z.string(), z.unknown()), z.null()]).optional(),
 	image_generation_config: z.union([z.record(z.string(), z.unknown()), z.null()]).optional(),
-	vision_llm: z.union([z.record(z.string(), z.unknown()), z.null()]).optional(),
+	vision_llm_config: z.union([z.record(z.string(), z.unknown()), z.null()]).optional(),
 });
 
 /**
@@ -289,7 +365,7 @@ export const updateLLMPreferencesRequest = z.object({
 		agent_llm_id: true,
 		document_summary_llm_id: true,
 		image_generation_config_id: true,
-		vision_llm_id: true,
+		vision_llm_config_id: true,
 	}),
 });
 
@@ -341,6 +417,15 @@ export type UpdateImageGenConfigResponse = z.infer<typeof updateImageGenConfigRe
 export type DeleteImageGenConfigResponse = z.infer<typeof deleteImageGenConfigResponse>;
 export type GlobalImageGenConfig = z.infer<typeof globalImageGenConfig>;
 export type GetGlobalImageGenConfigsResponse = z.infer<typeof getGlobalImageGenConfigsResponse>;
+export type VisionLLMConfig = z.infer<typeof visionLLMConfig>;
+export type CreateVisionLLMConfigRequest = z.infer<typeof createVisionLLMConfigRequest>;
+export type CreateVisionLLMConfigResponse = z.infer<typeof createVisionLLMConfigResponse>;
+export type GetVisionLLMConfigsResponse = z.infer<typeof getVisionLLMConfigsResponse>;
+export type UpdateVisionLLMConfigRequest = z.infer<typeof updateVisionLLMConfigRequest>;
+export type UpdateVisionLLMConfigResponse = z.infer<typeof updateVisionLLMConfigResponse>;
+export type DeleteVisionLLMConfigResponse = z.infer<typeof deleteVisionLLMConfigResponse>;
+export type GlobalVisionLLMConfig = z.infer<typeof globalVisionLLMConfig>;
+export type GetGlobalVisionLLMConfigsResponse = z.infer<typeof getGlobalVisionLLMConfigsResponse>;
 export type LLMPreferences = z.infer<typeof llmPreferences>;
 export type GetLLMPreferencesRequest = z.infer<typeof getLLMPreferencesRequest>;
 export type GetLLMPreferencesResponse = z.infer<typeof getLLMPreferencesResponse>;
diff --git a/surfsense_web/lib/apis/vision-llm-config-api.service.ts b/surfsense_web/lib/apis/vision-llm-config-api.service.ts
new file mode 100644
index 000000000..4099c6b39
--- /dev/null
+++ b/surfsense_web/lib/apis/vision-llm-config-api.service.ts
@@ -0,0 +1,58 @@
+import {
+	type CreateVisionLLMConfigRequest,
+	createVisionLLMConfigRequest,
+	createVisionLLMConfigResponse,
+	deleteVisionLLMConfigResponse,
+	getGlobalVisionLLMConfigsResponse,
+	getVisionLLMConfigsResponse,
+	type UpdateVisionLLMConfigRequest,
+	updateVisionLLMConfigRequest,
+	updateVisionLLMConfigResponse,
+} from "@/contracts/types/new-llm-config.types";
+import { ValidationError } from "../error";
+import { baseApiService } from "./base-api.service";
+
+/** Client for the vision LLM config endpoints; create/update payloads are schema-checked first. */
+class VisionLLMConfigApiService {
+	// Global configs endpoint; takes no search-space parameter.
+	getGlobalConfigs = async () =>
+		baseApiService.get(`/api/v1/global-vision-llm-configs`, getGlobalVisionLLMConfigsResponse);
+
+	// Rejects with ValidationError before any request is made if the payload fails the schema.
+	createConfig = async (request: CreateVisionLLMConfigRequest) => {
+		const checked = createVisionLLMConfigRequest.safeParse(request);
+		if (!checked.success) {
+			const details = checked.error.issues.map((issue) => issue.message).join(", ");
+			throw new ValidationError(`Invalid request: ${details}`);
+		}
+		const body = checked.data;
+		return baseApiService.post(`/api/v1/vision-llm-configs`, createVisionLLMConfigResponse, { body });
+	};
+
+	// Lists configs for one search space, selected through the search_space_id query parameter.
+	getConfigs = async (searchSpaceId: number) => {
+		const query = new URLSearchParams({ search_space_id: `${searchSpaceId}` });
+		const url = `/api/v1/vision-llm-configs?${query.toString()}`;
+		return baseApiService.get(url, getVisionLLMConfigsResponse);
+	};
+
+	// The id goes into the URL; only the `data` part of the request is sent as the body.
+	updateConfig = async (request: UpdateVisionLLMConfigRequest) => {
+		const checked = updateVisionLLMConfigRequest.safeParse(request);
+		if (!checked.success) {
+			const details = checked.error.issues.map((issue) => issue.message).join(", ");
+			throw new ValidationError(`Invalid request: ${details}`);
+		}
+		const url = `/api/v1/vision-llm-configs/${checked.data.id}`;
+		const body = checked.data.data;
+		return baseApiService.put(url, updateVisionLLMConfigResponse, { body });
+	};
+
+	// Deletes the config with the given id.
+	deleteConfig = async (id: number) => {
+		const url = `/api/v1/vision-llm-configs/${id}`;
+		return baseApiService.delete(url, deleteVisionLLMConfigResponse);
+	};
+}
+
+export const visionLLMConfigApiService = new VisionLLMConfigApiService();
diff --git a/surfsense_web/lib/query-client/cache-keys.ts b/surfsense_web/lib/query-client/cache-keys.ts
index 754886618..04f348ff8 100644
--- a/surfsense_web/lib/query-client/cache-keys.ts
+++ b/surfsense_web/lib/query-client/cache-keys.ts
@@ -39,6 +39,11 @@ export const cacheKeys = {
 		byId: (configId: number) => ["image-gen-configs", "detail", configId] as const,
 		global: () => ["image-gen-configs", "global"] as const,
 	},
+	visionLLMConfigs: {
+		all: (searchSpaceId: number) => ["vision-llm-configs", searchSpaceId] as const,
+		byId: (configId: number) => ["vision-llm-configs", "detail", configId] as const,
+		global: () => ["vision-llm-configs", "global"] as const,
+	},
 	auth: {
 		user: ["auth", "user"] as const,
 	},

From 3bbe6c303737f63b089ddb5501d67f47d65a37b5 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 19:27:24 +0200
Subject: [PATCH 186/202] Add VisionModelManager and VisionConfigDialog
 components

---
 .../settings/vision-model-manager.tsx         | 401 ++++++++++++++++++
 .../shared/vision-config-dialog.tsx           | 381 +++++++++++++++++
 2 files changed, 782 insertions(+)
 create mode 100644 surfsense_web/components/settings/vision-model-manager.tsx
 create mode 100644 surfsense_web/components/shared/vision-config-dialog.tsx

diff --git a/surfsense_web/components/settings/vision-model-manager.tsx b/surfsense_web/components/settings/vision-model-manager.tsx
new file mode 100644
index 000000000..31e6655cb
--- /dev/null
+++ b/surfsense_web/components/settings/vision-model-manager.tsx
@@ -0,0 +1,401 @@
+"use client";
+
+import { useAtomValue } from "jotai";
+import { AlertCircle, Dot, Edit3, Info, RefreshCw, Trash2 } from "lucide-react";
+import { useMemo, useState } from "react";
+import { membersAtom, myAccessAtom } from "@/atoms/members/members-query.atoms";
+import { deleteVisionLLMConfigMutationAtom } from "@/atoms/vision-llm-config/vision-llm-config-mutation.atoms";
+import {
+	globalVisionLLMConfigsAtom,
+	visionLLMConfigsAtom,
+} from "@/atoms/vision-llm-config/vision-llm-config-query.atoms";
+import { VisionConfigDialog } from "@/components/shared/vision-config-dialog";
+import { Alert, AlertDescription } from "@/components/ui/alert";
+import {
+	AlertDialog,
+	AlertDialogAction,
+	AlertDialogCancel,
+	AlertDialogContent,
+	AlertDialogDescription,
+	AlertDialogFooter,
+	AlertDialogHeader,
+	AlertDialogTitle,
+} from "@/components/ui/alert-dialog";
+import { Avatar, AvatarFallback, AvatarImage } from "@/components/ui/avatar";
+import { Button } from "@/components/ui/button";
+import { Card, CardContent } from "@/components/ui/card";
+import { Skeleton } from "@/components/ui/skeleton";
+import { Spinner } from "@/components/ui/spinner";
+import { Tooltip, TooltipContent, TooltipProvider, TooltipTrigger } from "@/components/ui/tooltip";
+import type { VisionLLMConfig } from "@/contracts/types/new-llm-config.types";
+import { useMediaQuery } from "@/hooks/use-media-query";
+import { getProviderIcon } from "@/lib/provider-icons";
+import { cn } from "@/lib/utils";
+
+interface VisionModelManagerProps {
+	searchSpaceId: number; // forwarded unchanged to VisionConfigDialog
+}
+
+/** Up to two uppercase initials for `name`: the first letters of its first two words, else its first two characters. */
+function getInitials(name: string): string {
+	const trimmed = name.trim(); // the fallback slices this, so leading whitespace never becomes an "initial"
+	const [first, second] = trimmed.split(/\s+/);
+	if (first && second) return (first.charAt(0) + second.charAt(0)).toUpperCase();
+	return trimmed.slice(0, 2).toUpperCase();
+}
+/** Settings panel that renders the configs from visionLLMConfigsAtom as cards, with add/edit/delete gated by the caller's access. */
+export function VisionModelManager({ searchSpaceId }: VisionModelManagerProps) {
+	const isDesktop = useMediaQuery("(min-width: 768px)"); // below this width the tooltips are forced closed
+	const {
+		mutateAsync: deleteConfig,
+		isPending: isDeleting,
+		error: deleteError,
+	} = useAtomValue(deleteVisionLLMConfigMutationAtom);
+	// Configs rendered as cards, plus the global configs (only counted here, for the info banner).
+	const {
+		data: userConfigs,
+		isFetching: configsLoading,
+		error: fetchError,
+		refetch: refreshConfigs,
+	} = useAtomValue(visionLLMConfigsAtom);
+	const { data: globalConfigs = [], isFetching: globalLoading } = useAtomValue(
+		globalVisionLLMConfigsAtom
+	);
+	// Index members by user_id so each card can show the member matching config.user_id.
+	const { data: members } = useAtomValue(membersAtom);
+	const memberMap = useMemo(() => {
+		const map = new Map<string, { name: string; email?: string; avatarUrl?: string }>();
+		for (const m of members ?? []) {
+			map.set(m.user_id, {
+				name: m.user_display_name || m.user_email || "Unknown",
+				email: m.user_email || undefined,
+				avatarUrl: m.user_avatar_url || undefined,
+			});
+		}
+		return map;
+	}, [members]);
+	// Owners may do everything; other members need the matching "vision_configs:*" permission.
+	const { data: access } = useAtomValue(myAccessAtom);
+	const canCreate = useMemo(() => {
+		if (!access) return false;
+		if (access.is_owner) return true;
+		return access.permissions?.includes("vision_configs:create") ?? false;
+	}, [access]);
+	const canDelete = useMemo(() => {
+		if (!access) return false;
+		if (access.is_owner) return true;
+		return access.permissions?.includes("vision_configs:delete") ?? false;
+	}, [access]);
+	const canUpdate = canCreate; // editing is gated by the create permission
+	const isReadOnly = !canCreate && !canDelete;
+	// Dialog state: a null editingConfig opens the dialog in create mode; configToDelete drives the confirm dialog.
+	const [isDialogOpen, setIsDialogOpen] = useState(false);
+	const [editingConfig, setEditingConfig] = useState<VisionLLMConfig | null>(null);
+	const [configToDelete, setConfigToDelete] = useState<VisionLLMConfig | null>(null);
+
+	const isLoading = configsLoading || globalLoading;
+	// Tag each error with its source so the alerts get distinct React keys even when both messages are identical.
+	const errors = [
+		{ source: "delete", error: deleteError },
+		{ source: "fetch", error: fetchError },
+	].filter((entry) => Boolean(entry.error)) as { source: string; error: Error }[];
+	// Number of global configs that are not auto-mode entries; computed once for the banner below.
+	const globalModelCount = globalConfigs.filter((g) => !("is_auto_mode" in g && g.is_auto_mode)).length;
+
+	const openEditDialog = (config: VisionLLMConfig) => {
+		setEditingConfig(config);
+		setIsDialogOpen(true);
+	};
+
+	const openNewDialog = () => {
+		setEditingConfig(null);
+		setIsDialogOpen(true);
+	};
+	// Deletes the config picked in the confirm dialog; the dialog is dismissed only when the mutation resolves.
+	const handleDelete = async () => {
+		if (!configToDelete) return;
+		try {
+			await deleteConfig({ id: configToDelete.id, name: configToDelete.name });
+			setConfigToDelete(null);
+		} catch {
+			// Error handled by mutation
+		}
+	};
+
+	return (
+		<div className="space-y-4 md:space-y-6">
+			<div className="flex flex-col space-y-4 sm:flex-row sm:items-center sm:justify-between sm:space-y-0">
+				<Button
+					variant="secondary"
+					size="sm"
+					onClick={() => refreshConfigs()}
+					disabled={isLoading}
+					className="gap-2"
+				>
+					<RefreshCw className={cn("h-3.5 w-3.5", configsLoading && "animate-spin")} />
+					Refresh
+				</Button>
+				{canCreate && (
+					<Button
+						variant="outline"
+						onClick={openNewDialog}
+						className="gap-2 bg-white text-black hover:bg-neutral-100 dark:bg-white dark:text-black dark:hover:bg-neutral-200"
+					>
+						Add Vision Model
+					</Button>
+				)}
+			</div>
+
+			{errors.map(({ source, error }) => (
+				<div key={source}>
+					<Alert variant="destructive" className="py-3">
+						<AlertCircle className="h-3 w-3 md:h-4 md:w-4 shrink-0" />
+						<AlertDescription className="text-xs md:text-sm">{error.message}</AlertDescription>
+					</Alert>
+				</div>
+			))}
+
+			{access && !isLoading && isReadOnly && (
+				<div>
+					<Alert className="bg-muted/50 py-3 md:py-4">
+						<Info className="h-3 w-3 md:h-4 md:w-4 shrink-0" />
+						<AlertDescription className="text-xs md:text-sm">
+							You have <span className="font-medium">read-only</span> access to vision model
+							configurations. Contact a space owner to request additional permissions.
+						</AlertDescription>
+					</Alert>
+				</div>
+			)}
+			{access && !isLoading && !isReadOnly && (!canCreate || !canDelete) && (
+				<div>
+					<Alert className="bg-muted/50 py-3 md:py-4">
+						<Info className="h-3 w-3 md:h-4 md:w-4 shrink-0" />
+						<AlertDescription className="text-xs md:text-sm">
+							You can{" "}
+							{[canCreate && "create and edit", canDelete && "delete"]
+								.filter(Boolean)
+								.join(" and ")}{" "}
+							vision model configurations
+							{!canDelete && ", but cannot delete them"}.
+						</AlertDescription>
+					</Alert>
+				</div>
+			)}
+
+			{globalModelCount > 0 && (
+				<Alert className="bg-muted/50 py-3">
+					<Info className="h-3 w-3 md:h-4 md:w-4 shrink-0" />
+					<AlertDescription className="text-xs md:text-sm">
+						<p>
+							<span className="font-medium">
+								{globalModelCount} global vision{" "}
+								{globalModelCount === 1 ? "model" : "models"}
+							</span>{" "}
+							available from your administrator. Use the model selector to view and select them.
+						</p>
+					</AlertDescription>
+				</Alert>
+			)}
+
+			{isLoading && (
+				<div className="space-y-4 md:space-y-6">
+					<div className="space-y-4">
+						<div className="flex items-center justify-between">
+							<Skeleton className="h-6 md:h-7 w-40 md:w-48" />
+							<Skeleton className="h-8 md:h-9 w-32 md:w-36 rounded-md" />
+						</div>
+						<div className="grid gap-3 grid-cols-1 sm:grid-cols-2 xl:grid-cols-3">
+							{["skeleton-a", "skeleton-b", "skeleton-c"].map((key) => (
+								<Card key={key} className="border-border/60">
+									<CardContent className="p-4 flex flex-col gap-3">
+										<div className="flex items-start justify-between gap-2">
+											<div className="space-y-1.5 flex-1 min-w-0">
+												<Skeleton className="h-4 w-28 md:w-32" />
+												<Skeleton className="h-3 w-40 md:w-48" />
+											</div>
+										</div>
+										<div className="flex items-center gap-2">
+											<Skeleton className="h-5 w-16 rounded-full" />
+											<Skeleton className="h-5 w-24 rounded-md" />
+										</div>
+										<div className="flex items-center gap-2 pt-2 border-t border-border/40">
+											<Skeleton className="h-3 w-20" />
+											<Skeleton className="h-4 w-4 rounded-full" />
+											<Skeleton className="h-3 w-16" />
+										</div>
+									</CardContent>
+								</Card>
+							))}
+						</div>
+					</div>
+				</div>
+			)}
+
+			{!isLoading && (
+				<div className="space-y-4 md:space-y-6">
+					{(userConfigs?.length ?? 0) === 0 ? (
+						<Card className="border-0 bg-transparent shadow-none">
+							<CardContent className="flex flex-col items-center justify-center py-10 md:py-16 text-center">
+								<h3 className="text-sm md:text-base font-semibold mb-2">No Vision Models Yet</h3>
+								<p className="text-[11px] md:text-xs text-muted-foreground max-w-sm mb-4">
+									{canCreate
+										? "Add your own vision-capable model (GPT-4o, Claude, Gemini, etc.)"
+										: "No vision models have been added to this space yet. Contact a space owner to add one."}
+								</p>
+							</CardContent>
+						</Card>
+					) : (
+						<div className="grid gap-3 grid-cols-1 sm:grid-cols-2 xl:grid-cols-3">
+							{userConfigs?.map((config) => {
+								const member = config.user_id ? memberMap.get(config.user_id) : null;
+
+								return (
+									<div key={config.id}>
+										<Card className="group relative overflow-hidden transition-all duration-200 border-border/60 hover:shadow-md h-full">
+											<CardContent className="p-4 flex flex-col gap-3 h-full">
+												<div className="flex items-start justify-between gap-2">
+													<div className="min-w-0 flex-1">
+														<h4 className="text-sm font-semibold tracking-tight truncate">
+															{config.name}
+														</h4>
+														{config.description && (
+															<p className="text-[11px] text-muted-foreground/70 truncate mt-0.5">
+																{config.description}
+															</p>
+														)}
+													</div>
+													{(canUpdate || canDelete) && (
+														<div className="flex items-center gap-0.5 shrink-0 sm:opacity-0 sm:group-hover:opacity-100 transition-opacity duration-150">
+															{canUpdate && (
+																<TooltipProvider>
+																	<Tooltip open={isDesktop ? undefined : false}>
+																		<TooltipTrigger asChild>
+																			<Button
+																				variant="ghost"
+																				size="icon"
+																				onClick={() => openEditDialog(config)}
+																				className="h-7 w-7 text-muted-foreground hover:text-foreground"
+																			>
+																				<Edit3 className="h-3 w-3" />
+																			</Button>
+																		</TooltipTrigger>
+																		<TooltipContent>Edit</TooltipContent>
+																	</Tooltip>
+																</TooltipProvider>
+															)}
+															{canDelete && (
+																<TooltipProvider>
+																	<Tooltip open={isDesktop ? undefined : false}>
+																		<TooltipTrigger asChild>
+																			<Button
+																				variant="ghost"
+																				size="icon"
+																				onClick={() => setConfigToDelete(config)}
+																				className="h-7 w-7 text-muted-foreground hover:text-destructive"
+																			>
+																				<Trash2 className="h-3 w-3" />
+																			</Button>
+																		</TooltipTrigger>
+																		<TooltipContent>Delete</TooltipContent>
+																	</Tooltip>
+																</TooltipProvider>
+															)}
+														</div>
+													)}
+												</div>
+
+												<div className="flex items-center gap-2 flex-wrap">
+													{getProviderIcon(config.provider, {
+														className: "size-3.5 shrink-0",
+													})}
+													<code className="text-[11px] font-mono text-muted-foreground bg-muted/60 px-2 py-0.5 rounded-md truncate max-w-[160px]">
+														{config.model_name}
+													</code>
+												</div>
+
+												<div className="flex items-center gap-2 pt-2 border-t border-border/40 mt-auto">
+													<span className="text-[11px] text-muted-foreground/60">
+														{new Date(config.created_at).toLocaleDateString(undefined, {
+															year: "numeric",
+															month: "short",
+															day: "numeric",
+														})}
+													</span>
+													{member && (
+														<>
+															<Dot className="h-4 w-4 text-muted-foreground/30" />
+															<TooltipProvider>
+																<Tooltip open={isDesktop ? undefined : false}>
+																	<TooltipTrigger asChild>
+																		<div className="flex items-center gap-1.5 cursor-default">
+																			<Avatar className="size-4.5 shrink-0">
+																				{member.avatarUrl && (
+																					<AvatarImage src={member.avatarUrl} alt={member.name} />
+																				)}
+																				<AvatarFallback className="text-[9px]">
+																					{getInitials(member.name)}
+																				</AvatarFallback>
+																			</Avatar>
+																			<span className="text-[11px] text-muted-foreground/60 truncate max-w-[120px]">
+																				{member.name}
+																			</span>
+																		</div>
+																	</TooltipTrigger>
+																	<TooltipContent side="bottom">
+																		{member.email || member.name}
+																	</TooltipContent>
+																</Tooltip>
+															</TooltipProvider>
+														</>
+													)}
+												</div>
+											</CardContent>
+										</Card>
+									</div>
+								);
+							})}
+						</div>
+					)}
+				</div>
+			)}
+
+			<VisionConfigDialog
+				open={isDialogOpen}
+				onOpenChange={(open) => {
+					setIsDialogOpen(open);
+					if (!open) setEditingConfig(null);
+				}}
+				config={editingConfig}
+				isGlobal={false}
+				searchSpaceId={searchSpaceId}
+				mode={editingConfig ? "edit" : "create"}
+			/>
+
+			<AlertDialog
+				open={!!configToDelete}
+				onOpenChange={(open) => !open && setConfigToDelete(null)}
+			>
+				<AlertDialogContent className="select-none">
+					<AlertDialogHeader>
+						<AlertDialogTitle>Delete Vision Model</AlertDialogTitle>
+						<AlertDialogDescription>
+							Are you sure you want to delete{" "}
+							<span className="font-semibold text-foreground">{configToDelete?.name}</span>?
+						</AlertDialogDescription>
+					</AlertDialogHeader>
+					<AlertDialogFooter>
+						<AlertDialogCancel disabled={isDeleting}>Cancel</AlertDialogCancel>
+						<AlertDialogAction
+							onClick={handleDelete}
+							disabled={isDeleting}
+							className="relative bg-destructive text-destructive-foreground hover:bg-destructive/90"
+						>
+							<span className={isDeleting ? "opacity-0" : ""}>Delete</span>
+							{isDeleting && <Spinner size="sm" className="absolute" />}
+						</AlertDialogAction>
+					</AlertDialogFooter>
+				</AlertDialogContent>
+			</AlertDialog>
+		</div>
+	);
+}
diff --git a/surfsense_web/components/shared/vision-config-dialog.tsx b/surfsense_web/components/shared/vision-config-dialog.tsx
new file mode 100644
index 000000000..d69750316
--- /dev/null
+++ b/surfsense_web/components/shared/vision-config-dialog.tsx
@@ -0,0 +1,381 @@
+"use client";
+
+import { useAtomValue } from "jotai";
+import { AlertCircle } from "lucide-react";
+import { useCallback, useEffect, useRef, useState } from "react";
+import { toast } from "sonner";
+import { updateLLMPreferencesMutationAtom } from "@/atoms/new-llm-config/new-llm-config-mutation.atoms";
+import {
+	createVisionLLMConfigMutationAtom,
+	updateVisionLLMConfigMutationAtom,
+} from "@/atoms/vision-llm-config/vision-llm-config-mutation.atoms";
+import { Alert, AlertDescription } from "@/components/ui/alert";
+import { Badge } from "@/components/ui/badge";
+import { Button } from "@/components/ui/button";
+import { Dialog, DialogContent, DialogTitle } from "@/components/ui/dialog";
+import { Input } from "@/components/ui/input";
+import { Label } from "@/components/ui/label";
+import {
+	Select,
+	SelectContent,
+	SelectItem,
+	SelectTrigger,
+	SelectValue,
+} from "@/components/ui/select";
+import { Separator } from "@/components/ui/separator";
+import { Spinner } from "@/components/ui/spinner";
+import { VISION_PROVIDERS } from "@/contracts/enums/vision-providers";
+import type {
+	GlobalVisionLLMConfig,
+	VisionLLMConfig,
+	VisionProvider,
+} from "@/contracts/types/new-llm-config.types";
+
+interface VisionConfigDialogProps {
+	open: boolean;
+	onOpenChange: (open: boolean) => void; // called with false by Cancel and after a successful save or selection
+	config: VisionLLMConfig | GlobalVisionLLMConfig | null;
+	isGlobal: boolean; // true → read-only presentation of `config`; a global config is never sent to updateConfig
+	searchSpaceId: number;
+	mode: "create" | "edit" | "view"; // the form is rendered for "create", and for "edit" when isGlobal is false
+}
+// Blank form values: the initial form state, and what the form is reset to when the dialog opens in create mode.
+const INITIAL_FORM = {
+	name: "",
+	description: "",
+	provider: "",
+	model_name: "",
+	api_key: "",
+	api_base: "",
+	api_version: "",
+};
+/** Dialog for adding or editing a vision model config, or previewing a global (read-only) one and selecting it. */
+export function VisionConfigDialog({
+	open,
+	onOpenChange,
+	config,
+	isGlobal,
+	searchSpaceId,
+	mode,
+}: VisionConfigDialogProps) {
+	const [isSubmitting, setIsSubmitting] = useState(false);
+	const [formData, setFormData] = useState(INITIAL_FORM);
+	const [scrollPos, setScrollPos] = useState<"top" | "middle" | "bottom">("top");
+	const scrollRef = useRef<HTMLDivElement>(null);
+	// Re-sync the form whenever the dialog opens: existing values for a non-global edit, a blank form for create.
+	useEffect(() => {
+		if (open) {
+			if (mode === "edit" && config && !isGlobal) {
+				setFormData({
+					name: config.name || "",
+					description: config.description || "",
+					provider: config.provider || "",
+					model_name: config.model_name || "",
+					api_key: (config as VisionLLMConfig).api_key || "",
+					api_base: config.api_base || "",
+					api_version: (config as VisionLLMConfig).api_version || "",
+				});
+			} else if (mode === "create") {
+				setFormData(INITIAL_FORM);
+			}
+			setScrollPos("top");
+		}
+	}, [open, mode, config, isGlobal]);
+
+	const { mutateAsync: createConfig } = useAtomValue(createVisionLLMConfigMutationAtom);
+	const { mutateAsync: updateConfig } = useAtomValue(updateVisionLLMConfigMutationAtom);
+	const { mutateAsync: updatePreferences } = useAtomValue(updateLLMPreferencesMutationAtom);
+	// Classifies the scroll area as top / middle / bottom (2px tolerance); this decides which mask edges fade.
+	const handleScroll = useCallback((e: React.UIEvent<HTMLDivElement>) => {
+		const el = e.currentTarget;
+		const atTop = el.scrollTop <= 2;
+		const atBottom = el.scrollHeight - el.scrollTop - el.clientHeight <= 2;
+		setScrollPos(atTop ? "top" : atBottom ? "bottom" : "middle");
+	}, []);
+
+	const getTitle = () => {
+		if (mode === "create") return "Add Vision Model";
+		if (isGlobal) return "View Global Vision Model";
+		return "Edit Vision Model";
+	};
+
+	const getSubtitle = () => {
+		if (mode === "create") return "Set up a new vision-capable LLM provider";
+		if (isGlobal) return "Read-only global configuration";
+		return "Update your vision model settings";
+	};
+	// Saves the form: creates a config (then selects it in the LLM preferences) or updates the existing one.
+	const handleSubmit = useCallback(async () => {
+		setIsSubmitting(true);
+		try {
+			// Create and update send the same fields; optional ones are sent as undefined when left blank.
+			const payload = {
+				name: formData.name,
+				description: formData.description || undefined,
+				provider: formData.provider as VisionProvider,
+				model_name: formData.model_name,
+				api_key: formData.api_key,
+				api_base: formData.api_base || undefined,
+				api_version: formData.api_version || undefined,
+			};
+			if (mode === "create") {
+				const result = await createConfig({ ...payload, search_space_id: searchSpaceId });
+				if (result?.id) {
+					try {
+						await updatePreferences({
+							search_space_id: searchSpaceId,
+							data: { vision_llm_config_id: result.id },
+						});
+					} catch (selectError) {
+						// The model itself was saved, so report only the selection failure and still close below:
+						// keeping the form open here would invite a retry that creates a duplicate model.
+						console.error("Failed to select the new vision model:", selectError);
+						toast.error("Vision model added, but it could not be set as the active model");
+					}
+				}
+				onOpenChange(false);
+			} else if (!isGlobal && config) {
+				await updateConfig({ id: config.id, data: payload });
+				onOpenChange(false);
+			}
+		} catch (error) {
+			console.error("Failed to save vision config:", error);
+			toast.error("Failed to save vision model");
+		} finally {
+			setIsSubmitting(false);
+		}
+	}, [
+		mode,
+		isGlobal,
+		config,
+		formData,
+		searchSpaceId,
+		createConfig,
+		updateConfig,
+		updatePreferences,
+		onOpenChange,
+	]);
+	// Stores the displayed global config's id as vision_llm_config_id in the preferences, then closes the dialog.
+	const handleUseGlobalConfig = useCallback(async () => {
+		if (!config || !isGlobal) return;
+		setIsSubmitting(true);
+		try {
+			await updatePreferences({
+				search_space_id: searchSpaceId,
+				data: { vision_llm_config_id: config.id },
+			});
+			toast.success(`Now using ${config.name}`);
+			onOpenChange(false);
+		} catch (error) {
+			console.error("Failed to set vision model:", error);
+			toast.error("Failed to set vision model");
+		} finally {
+			setIsSubmitting(false);
+		}
+	}, [config, isGlobal, searchSpaceId, updatePreferences, onOpenChange]);
+
+	// Every starred field must be non-empty before the submit button is enabled.
+	const isFormValid = formData.name && formData.provider && formData.model_name && formData.api_key;
+	const selectedProvider = VISION_PROVIDERS.find((p) => p.value === formData.provider);
+	// Shared by maskImage and WebkitMaskImage: an edge fades to transparent unless the scroll area rests on it.
+	const fadeMask = `linear-gradient(to bottom, ${scrollPos === "top" ? "black" : "transparent"}, black 16px, black calc(100% - 16px), ${scrollPos === "bottom" ? "black" : "transparent"})`;
+
+	return (
+		<Dialog open={open} onOpenChange={onOpenChange}>
+			<DialogContent
+				className="max-w-lg h-[85vh] flex flex-col p-0 gap-0 overflow-hidden"
+				onOpenAutoFocus={(e) => e.preventDefault()}
+			>
+				<DialogTitle className="sr-only">{getTitle()}</DialogTitle>
+
+				<div className="flex items-start justify-between px-6 pt-6 pb-4 pr-14">
+					<div className="space-y-1">
+						<div className="flex items-center gap-2">
+							<h2 className="text-lg font-semibold tracking-tight">{getTitle()}</h2>
+							{isGlobal && mode !== "create" && (
+								<Badge variant="secondary" className="text-[10px]">
+									Global
+								</Badge>
+							)}
+						</div>
+						<p className="text-sm text-muted-foreground">{getSubtitle()}</p>
+						{config && mode !== "create" && (
+							<p className="text-xs font-mono text-muted-foreground/70">{config.model_name}</p>
+						)}
+					</div>
+				</div>
+
+				<div
+					ref={scrollRef}
+					onScroll={handleScroll}
+					className="flex-1 overflow-y-auto px-6 py-5"
+					style={{
+						maskImage: fadeMask,
+						WebkitMaskImage: fadeMask,
+					}}
+				>
+					{isGlobal && config && (
+						<>
+							<Alert className="mb-5 border-amber-500/30 bg-amber-500/5">
+								<AlertCircle className="size-4 text-amber-500" />
+								<AlertDescription className="text-sm text-amber-700 dark:text-amber-400">
+									Global configurations are read-only. To customize, create a new model.
+								</AlertDescription>
+							</Alert>
+							<div className="space-y-4">
+								<div className="grid gap-4 sm:grid-cols-2">
+									<div className="space-y-1.5">
+										<div className="text-xs font-medium text-muted-foreground uppercase tracking-wider">
+											Name
+										</div>
+										<p className="text-sm font-medium">{config.name}</p>
+									</div>
+									{config.description && (
+										<div className="space-y-1.5">
+											<div className="text-xs font-medium text-muted-foreground uppercase tracking-wider">
+												Description
+											</div>
+											<p className="text-sm text-muted-foreground">{config.description}</p>
+										</div>
+									)}
+								</div>
+								<Separator />
+								<div className="grid gap-4 sm:grid-cols-2">
+									<div className="space-y-1.5">
+										<div className="text-xs font-medium text-muted-foreground uppercase tracking-wider">
+											Provider
+										</div>
+										<p className="text-sm font-medium">{config.provider}</p>
+									</div>
+									<div className="space-y-1.5">
+										<div className="text-xs font-medium text-muted-foreground uppercase tracking-wider">
+											Model
+										</div>
+										<p className="text-sm font-medium font-mono">{config.model_name}</p>
+									</div>
+								</div>
+							</div>
+						</>
+					)}
+
+					{(mode === "create" || (mode === "edit" && !isGlobal)) && (
+						<div className="space-y-4">
+							<div className="space-y-2">
+								<Label className="text-sm font-medium">Name *</Label>
+								<Input
+									placeholder="e.g., My GPT-4o Vision"
+									value={formData.name}
+									onChange={(e) => setFormData((p) => ({ ...p, name: e.target.value }))}
+								/>
+							</div>
+
+							<div className="space-y-2">
+								<Label className="text-sm font-medium">Description</Label>
+								<Input
+									placeholder="Optional description"
+									value={formData.description}
+									onChange={(e) => setFormData((p) => ({ ...p, description: e.target.value }))}
+								/>
+							</div>
+
+							<Separator />
+
+							<div className="space-y-2">
+								<Label className="text-sm font-medium">Provider *</Label>
+								<Select
+									value={formData.provider}
+									onValueChange={(val) =>
+										setFormData((p) => ({ ...p, provider: val, model_name: "" }))
+									}
+								>
+									<SelectTrigger>
+										<SelectValue placeholder="Select a provider" />
+									</SelectTrigger>
+									<SelectContent>
+										{VISION_PROVIDERS.map((p) => (
+											<SelectItem key={p.value} value={p.value} description={p.example}>
+												{p.label}
+											</SelectItem>
+										))}
+									</SelectContent>
+								</Select>
+							</div>
+
+							<div className="space-y-2">
+								<Label className="text-sm font-medium">Model Name *</Label>
+								<Input
+									placeholder={selectedProvider?.example?.split(",")[0]?.trim() || "e.g., gpt-4o"}
+									value={formData.model_name}
+									onChange={(e) => setFormData((p) => ({ ...p, model_name: e.target.value }))}
+								/>
+							</div>
+
+							<div className="space-y-2">
+								<Label className="text-sm font-medium">API Key *</Label>
+								<Input
+									type="password"
+									placeholder="sk-..."
+									value={formData.api_key}
+									onChange={(e) => setFormData((p) => ({ ...p, api_key: e.target.value }))}
+								/>
+							</div>
+
+							<div className="space-y-2">
+								<Label className="text-sm font-medium">API Base URL</Label>
+								<Input
+									placeholder={selectedProvider?.apiBase || "Optional"}
+									value={formData.api_base}
+									onChange={(e) => setFormData((p) => ({ ...p, api_base: e.target.value }))}
+								/>
+							</div>
+
+							{formData.provider === "AZURE_OPENAI" && (
+								<div className="space-y-2">
+									<Label className="text-sm font-medium">API Version (Azure)</Label>
+									<Input
+										placeholder="2024-02-15-preview"
+										value={formData.api_version}
+										onChange={(e) => setFormData((p) => ({ ...p, api_version: e.target.value }))}
+									/>
+								</div>
+							)}
+						</div>
+					)}
+				</div>
+
+				<div className="shrink-0 px-6 py-4 flex items-center justify-end gap-3">
+					<Button
+						type="button"
+						variant="secondary"
+						onClick={() => onOpenChange(false)}
+						disabled={isSubmitting}
+						className="text-sm h-9"
+					>
+						Cancel
+					</Button>
+					{mode === "create" || (mode === "edit" && !isGlobal) ? (
+						<Button
+							onClick={handleSubmit}
+							disabled={isSubmitting || !isFormValid}
+							className="relative text-sm h-9 min-w-[120px]"
+						>
+							<span className={isSubmitting ? "opacity-0" : ""}>
+								{mode === "edit" ? "Save Changes" : "Add Model"}
+							</span>
+							{isSubmitting && <Spinner size="sm" className="absolute" />}
+						</Button>
+					) : isGlobal && config ? (
+						<Button
+							className="relative text-sm h-9"
+							onClick={handleUseGlobalConfig}
+							disabled={isSubmitting}
+						>
+							<span className={isSubmitting ? "opacity-0" : ""}>Use This Model</span>
+							{isSubmitting && <Spinner size="sm" className="absolute" />}
+						</Button>
+					) : null}
+				</div>
+			</DialogContent>
+		</Dialog>
+	);
+}

From 035a4862f9c78fa75c3e209534e0b553148f12a5 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 19:29:24 +0200
Subject: [PATCH 187/202] Add Vision Models tab to settings dialog with i18n

---
 .../components/settings/search-space-settings-dialog.tsx | 9 ++++++++-
 surfsense_web/messages/en.json                           | 2 ++
 surfsense_web/messages/es.json                           | 2 ++
 surfsense_web/messages/hi.json                           | 2 ++
 surfsense_web/messages/pt.json                           | 2 ++
 surfsense_web/messages/zh.json                           | 2 ++
 6 files changed, 18 insertions(+), 1 deletion(-)

diff --git a/surfsense_web/components/settings/search-space-settings-dialog.tsx b/surfsense_web/components/settings/search-space-settings-dialog.tsx
index 47094d0c9..6573bc271 100644
--- a/surfsense_web/components/settings/search-space-settings-dialog.tsx
+++ b/surfsense_web/components/settings/search-space-settings-dialog.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { useAtom } from "jotai";
-import { Bot, Brain, FileText, Globe, ImageIcon, MessageSquare, Shield } from "lucide-react";
+import { Bot, Brain, Eye, FileText, Globe, ImageIcon, MessageSquare, Shield } from "lucide-react";
 import { useTranslations } from "next-intl";
 import type React from "react";
 import { searchSpaceSettingsDialogAtom } from "@/atoms/settings/settings-dialog.atoms";
@@ -13,6 +13,7 @@ import { ModelConfigManager } from "@/components/settings/model-config-manager";
 import { PromptConfigManager } from "@/components/settings/prompt-config-manager";
 import { RolesManager } from "@/components/settings/roles-manager";
 import { SettingsDialog } from "@/components/settings/settings-dialog";
+import { VisionModelManager } from "@/components/settings/vision-model-manager";
 
 interface SearchSpaceSettingsDialogProps {
 	searchSpaceId: number;
@@ -31,6 +32,11 @@ export function SearchSpaceSettingsDialog({ searchSpaceId }: SearchSpaceSettings
 			label: t("nav_image_models"),
 			icon: <ImageIcon className="h-4 w-4" />,
 		},
+		{
+			value: "vision-models",
+			label: t("nav_vision_models"),
+			icon: <Eye className="h-4 w-4" />,
+		},
 		{ value: "team-roles", label: t("nav_team_roles"), icon: <Shield className="h-4 w-4" /> },
 		{
 			value: "prompts",
@@ -45,6 +51,7 @@ export function SearchSpaceSettingsDialog({ searchSpaceId }: SearchSpaceSettings
 		models: <ModelConfigManager searchSpaceId={searchSpaceId} />,
 		roles: <LLMRoleManager searchSpaceId={searchSpaceId} />,
 		"image-models": <ImageModelManager searchSpaceId={searchSpaceId} />,
+		"vision-models": <VisionModelManager searchSpaceId={searchSpaceId} />,
 		"team-roles": <RolesManager searchSpaceId={searchSpaceId} />,
 		prompts: <PromptConfigManager searchSpaceId={searchSpaceId} />,
 		"public-links": <PublicChatSnapshotsManager searchSpaceId={searchSpaceId} />,
diff --git a/surfsense_web/messages/en.json b/surfsense_web/messages/en.json
index b67f9db22..a3a4e8853 100644
--- a/surfsense_web/messages/en.json
+++ b/surfsense_web/messages/en.json
@@ -738,6 +738,8 @@
 		"nav_role_assignments_desc": "Assign configs to agent roles",
 		"nav_image_models": "Image Models",
 		"nav_image_models_desc": "Configure image generation models",
+		"nav_vision_models": "Vision Models",
+		"nav_vision_models_desc": "Configure vision-capable LLM models",
 		"nav_system_instructions": "System Instructions",
 		"nav_system_instructions_desc": "SearchSpace-wide AI instructions",
 		"nav_public_links": "Public Chat Links",
diff --git a/surfsense_web/messages/es.json b/surfsense_web/messages/es.json
index 5cf248a3a..fa620e271 100644
--- a/surfsense_web/messages/es.json
+++ b/surfsense_web/messages/es.json
@@ -738,6 +738,8 @@
 		"nav_role_assignments_desc": "Asignar configuraciones a roles de agente",
 		"nav_image_models": "Modelos de imagen",
 		"nav_image_models_desc": "Configurar modelos de generación de imágenes",
+		"nav_vision_models": "Modelos de visión",
+		"nav_vision_models_desc": "Configurar modelos LLM con capacidad de visión",
 		"nav_system_instructions": "Instrucciones del sistema",
 		"nav_system_instructions_desc": "Instrucciones de IA a nivel del espacio de búsqueda",
 		"nav_public_links": "Enlaces de chat públicos",
diff --git a/surfsense_web/messages/hi.json b/surfsense_web/messages/hi.json
index 0e7194832..faeb4cb94 100644
--- a/surfsense_web/messages/hi.json
+++ b/surfsense_web/messages/hi.json
@@ -738,6 +738,8 @@
 		"nav_role_assignments_desc": "एजेंट भूमिकाओं को कॉन्फ़िगरेशन असाइन करें",
 		"nav_image_models": "इमेज मॉडल",
 		"nav_image_models_desc": "इमेज जनरेशन मॉडल कॉन्फ़िगर करें",
+		"nav_vision_models": "विज़न मॉडल",
+		"nav_vision_models_desc": "विज़न-सक्षम LLM मॉडल कॉन्फ़िगर करें",
 		"nav_system_instructions": "सिस्टम निर्देश",
 		"nav_system_instructions_desc": "सर्च स्पेस-व्यापी AI निर्देश",
 		"nav_public_links": "सार्वजनिक चैट लिंक",
diff --git a/surfsense_web/messages/pt.json b/surfsense_web/messages/pt.json
index 00ae18eae..0bed7c6cc 100644
--- a/surfsense_web/messages/pt.json
+++ b/surfsense_web/messages/pt.json
@@ -738,6 +738,8 @@
 		"nav_role_assignments_desc": "Atribuir configurações a funções do agente",
 		"nav_image_models": "Modelos de imagem",
 		"nav_image_models_desc": "Configurar modelos de geração de imagens",
+		"nav_vision_models": "Modelos de visão",
+		"nav_vision_models_desc": "Configurar modelos LLM com capacidade de visão",
 		"nav_system_instructions": "Instruções do sistema",
 		"nav_system_instructions_desc": "Instruções de IA em nível do espaço de pesquisa",
 		"nav_public_links": "Links de chat públicos",
diff --git a/surfsense_web/messages/zh.json b/surfsense_web/messages/zh.json
index a6f3b5b84..0d4f7e1c9 100644
--- a/surfsense_web/messages/zh.json
+++ b/surfsense_web/messages/zh.json
@@ -722,6 +722,8 @@
 		"nav_role_assignments_desc": "为代理角色分配配置",
 		"nav_image_models": "图像模型",
 		"nav_image_models_desc": "配置图像生成模型",
+		"nav_vision_models": "视觉模型",
+		"nav_vision_models_desc": "配置具有视觉能力的LLM模型",
 		"nav_system_instructions": "系统指令",
 		"nav_system_instructions_desc": "搜索空间级别的 AI 指令",
 		"nav_public_links": "公开聊天链接",

From e85c355592676d19bd47820981bf62c6ad8bdc1b Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 19:45:30 +0200
Subject: [PATCH 188/202] Add NEXT_PUBLIC_POSTHOG_KEY to desktop release CI and
 .env.example

---
 .github/workflows/desktop-release.yml | 1 +
 surfsense_web/.env.example            | 5 ++++-
 2 files changed, 5 insertions(+), 1 deletion(-)

diff --git a/.github/workflows/desktop-release.yml b/.github/workflows/desktop-release.yml
index 491df0992..4d217562a 100644
--- a/.github/workflows/desktop-release.yml
+++ b/.github/workflows/desktop-release.yml
@@ -60,6 +60,7 @@ jobs:
           NEXT_PUBLIC_ZERO_CACHE_URL: ${{ vars.NEXT_PUBLIC_ZERO_CACHE_URL }}
           NEXT_PUBLIC_DEPLOYMENT_MODE: ${{ vars.NEXT_PUBLIC_DEPLOYMENT_MODE }}
           NEXT_PUBLIC_FASTAPI_BACKEND_AUTH_TYPE: ${{ vars.NEXT_PUBLIC_FASTAPI_BACKEND_AUTH_TYPE }}
+          NEXT_PUBLIC_POSTHOG_KEY: ${{ secrets.NEXT_PUBLIC_POSTHOG_KEY }}
 
       - name: Install desktop dependencies
         run: pnpm install
diff --git a/surfsense_web/.env.example b/surfsense_web/.env.example
index b674d8e9b..b448c1f71 100644
--- a/surfsense_web/.env.example
+++ b/surfsense_web/.env.example
@@ -7,4 +7,7 @@ NEXT_PUBLIC_ZERO_CACHE_URL=http://localhost:4848
 DATABASE_URL=postgresql://postgres:[YOUR-PASSWORD]@db.sdsf.supabase.co:5432/postgres
 
 # Deployment mode (optional)
-NEXT_PUBLIC_DEPLOYMENT_MODE="self-hosted" or "cloud"
\ No newline at end of file
+NEXT_PUBLIC_DEPLOYMENT_MODE="self-hosted" or "cloud"
+
+# PostHog analytics (optional, leave empty to disable)
+NEXT_PUBLIC_POSTHOG_KEY=
\ No newline at end of file

From 8566b03c91b5a69efd8359c52889b6bb0118a657 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 20:18:42 +0200
Subject: [PATCH 189/202] Add PostHog analytics to desktop main process

---
 .github/workflows/desktop-release.yml         |  2 +
 surfsense_desktop/.env                        |  4 ++
 surfsense_desktop/scripts/build-electron.mjs  |  6 +++
 surfsense_desktop/src/main.ts                 | 11 ++++-
 surfsense_desktop/src/modules/analytics.ts    | 46 +++++++++++++++++++
 .../src/modules/autocomplete/index.ts         |  4 ++
 surfsense_desktop/src/modules/quick-ask.ts    |  3 ++
 7 files changed, 75 insertions(+), 1 deletion(-)
 create mode 100644 surfsense_desktop/src/modules/analytics.ts

diff --git a/.github/workflows/desktop-release.yml b/.github/workflows/desktop-release.yml
index 4d217562a..62ba5d445 100644
--- a/.github/workflows/desktop-release.yml
+++ b/.github/workflows/desktop-release.yml
@@ -71,6 +71,8 @@ jobs:
         working-directory: surfsense_desktop
         env:
           HOSTED_FRONTEND_URL: ${{ vars.HOSTED_FRONTEND_URL }}
+          POSTHOG_KEY: ${{ secrets.POSTHOG_KEY }}
+          POSTHOG_HOST: ${{ vars.POSTHOG_HOST }}
 
       - name: Package & Publish
         run: pnpm exec electron-builder ${{ matrix.platform }} --config electron-builder.yml --publish always -c.extraMetadata.version=${{ steps.version.outputs.VERSION }}
diff --git a/surfsense_desktop/.env b/surfsense_desktop/.env
index d053aac97..a0463a39d 100644
--- a/surfsense_desktop/.env
+++ b/surfsense_desktop/.env
@@ -4,3 +4,7 @@
 # The hosted web frontend URL. Used to intercept OAuth redirects and keep them
 # inside the desktop app. Set to your production frontend domain.
 HOSTED_FRONTEND_URL=https://surfsense.net
+
+# PostHog analytics (leave empty to disable)
+POSTHOG_KEY=
+POSTHOG_HOST=https://us.i.posthog.com
diff --git a/surfsense_desktop/scripts/build-electron.mjs b/surfsense_desktop/scripts/build-electron.mjs
index 9f507ea37..bfce6a9ad 100644
--- a/surfsense_desktop/scripts/build-electron.mjs
+++ b/surfsense_desktop/scripts/build-electron.mjs
@@ -111,6 +111,12 @@ async function buildElectron() {
       'process.env.HOSTED_FRONTEND_URL': JSON.stringify(
         process.env.HOSTED_FRONTEND_URL || desktopEnv.HOSTED_FRONTEND_URL || 'https://surfsense.net'
       ),
+      'process.env.POSTHOG_KEY': JSON.stringify(
+        process.env.POSTHOG_KEY || desktopEnv.POSTHOG_KEY || ''
+      ),
+      'process.env.POSTHOG_HOST': JSON.stringify(
+        process.env.POSTHOG_HOST || desktopEnv.POSTHOG_HOST || 'https://us.i.posthog.com'
+      ),
     },
   };
 
diff --git a/surfsense_desktop/src/main.ts b/surfsense_desktop/src/main.ts
index 95b0359c8..231553f9a 100644
--- a/surfsense_desktop/src/main.ts
+++ b/surfsense_desktop/src/main.ts
@@ -12,6 +12,7 @@ import { registerAutocomplete, unregisterAutocomplete } from './modules/autocomp
 import { registerFolderWatcher, unregisterFolderWatcher } from './modules/folder-watcher';
 import { registerIpcHandlers } from './ipc/handlers';
 import { createTray, destroyTray } from './modules/tray';
+import { initAnalytics, shutdownAnalytics, trackEvent } from './modules/analytics';
 
 registerGlobalErrorHandlers();
 
@@ -22,6 +23,8 @@ if (!setupDeepLinks()) {
 registerIpcHandlers();
 
 app.whenReady().then(async () => {
+  initAnalytics();
+  trackEvent('desktop_app_launched');
   setupMenu();
   try {
     await startNextServer();
@@ -70,9 +73,15 @@ app.on('before-quit', () => {
   isQuitting = true;
 });
 
-app.on('will-quit', () => {
+let didCleanup = false;
+app.on('will-quit', async (e) => {
+  if (didCleanup) return;
+  didCleanup = true;
+  e.preventDefault();
   unregisterQuickAsk();
   unregisterAutocomplete();
   unregisterFolderWatcher();
   destroyTray();
+  await shutdownAnalytics();
+  app.exit();
 });
diff --git a/surfsense_desktop/src/modules/analytics.ts b/surfsense_desktop/src/modules/analytics.ts
new file mode 100644
index 000000000..8f64c1bd8
--- /dev/null
+++ b/surfsense_desktop/src/modules/analytics.ts
@@ -0,0 +1,46 @@
+import { PostHog } from 'posthog-node';
+import { machineIdSync } from 'node-machine-id';
+import { app } from 'electron';
+
+let client: PostHog | null = null;
+let distinctId = '';
+
+export function initAnalytics(): void {
+  const key = process.env.POSTHOG_KEY;
+  if (!key) return;
+
+  try {
+    distinctId = machineIdSync(true);
+  } catch {
+    return;
+  }
+
+  client = new PostHog(key, {
+    host: process.env.POSTHOG_HOST || 'https://us.i.posthog.com',
+    flushAt: 20,
+    flushInterval: 10000,
+  });
+}
+
+export function trackEvent(event: string, properties?: Record<string, unknown>): void {
+  if (!client) return;
+
+  client.capture({
+    distinctId,
+    event,
+    properties: {
+      platform: 'desktop',
+      app_version: app.getVersion(),
+      os: process.platform,
+      ...properties,
+    },
+  });
+}
+
+export async function shutdownAnalytics(): Promise<void> {
+  if (!client) return;
+
+  const timeout = new Promise<void>((resolve) => setTimeout(resolve, 3000));
+  await Promise.race([client.shutdown(), timeout]);
+  client = null;
+}
diff --git a/surfsense_desktop/src/modules/autocomplete/index.ts b/surfsense_desktop/src/modules/autocomplete/index.ts
index cb09a42e1..d4eb727fd 100644
--- a/surfsense_desktop/src/modules/autocomplete/index.ts
+++ b/surfsense_desktop/src/modules/autocomplete/index.ts
@@ -6,6 +6,7 @@ import { captureScreen } from './screenshot';
 import { createSuggestionWindow, destroySuggestion, getSuggestionWindow } from './suggestion-window';
 import { getShortcuts } from '../shortcuts';
 import { getActiveSearchSpaceId } from '../active-search-space';
+import { trackEvent } from '../analytics';
 
 let currentShortcut = '';
 let autocompleteEnabled = true;
@@ -41,6 +42,7 @@ async function triggerAutocomplete(): Promise<void> {
     console.warn('[autocomplete] No active search space. Select a search space first.');
     return;
   }
+  trackEvent('desktop_autocomplete_triggered', { search_space_id: searchSpaceId });
   const cursor = screen.getCursorScreenPoint();
   const win = createSuggestionWindow(cursor.x, cursor.y);
 
@@ -87,9 +89,11 @@ function registerIpcHandlers(): void {
   ipcRegistered = true;
 
   ipcMain.handle(IPC_CHANNELS.ACCEPT_SUGGESTION, async (_event, text: string) => {
+    trackEvent('desktop_autocomplete_accepted');
     await acceptAndInject(text);
   });
   ipcMain.handle(IPC_CHANNELS.DISMISS_SUGGESTION, () => {
+    trackEvent('desktop_autocomplete_dismissed');
     destroySuggestion();
   });
   ipcMain.handle(IPC_CHANNELS.SET_AUTOCOMPLETE_ENABLED, (_event, enabled: boolean) => {
diff --git a/surfsense_desktop/src/modules/quick-ask.ts b/surfsense_desktop/src/modules/quick-ask.ts
index d5a2a9c2e..d700b421a 100644
--- a/surfsense_desktop/src/modules/quick-ask.ts
+++ b/surfsense_desktop/src/modules/quick-ask.ts
@@ -5,6 +5,7 @@ import { checkAccessibilityPermission, getFrontmostApp, simulateCopy, simulatePa
 import { getServerPort } from './server';
 import { getShortcuts } from './shortcuts';
 import { getActiveSearchSpaceId } from './active-search-space';
+import { trackEvent } from './analytics';
 
 let currentShortcut = '';
 let quickAskWindow: BrowserWindow | null = null;
@@ -120,6 +121,7 @@ async function quickAskHandler(): Promise<void> {
 
   sourceApp = getFrontmostApp();
   console.log('[quick-ask] Source app:', sourceApp, '| Opening Quick Assist with', text.length, 'chars', selected ? '(selected)' : text ? '(clipboard fallback)' : '(empty)');
+  trackEvent('desktop_quick_ask_opened', { has_selected_text: !!selected });
   openQuickAsk(text);
 }
 
@@ -151,6 +153,7 @@ function registerIpcHandlers(): void {
 
     if (!checkAccessibilityPermission()) return;
 
+    trackEvent('desktop_quick_ask_replaced');
     clipboard.writeText(text);
     destroyQuickAsk();
 

From 556646fe9740c3e8f05aae9722f51b44dc5d55f0 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 20:20:56 +0200
Subject: [PATCH 190/202] Use assets.surfsense.com as PostHog host

---
 surfsense_desktop/.env                       | 2 +-
 surfsense_desktop/scripts/build-electron.mjs | 2 +-
 surfsense_desktop/src/modules/analytics.ts   | 2 +-
 3 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/surfsense_desktop/.env b/surfsense_desktop/.env
index a0463a39d..e127b99e0 100644
--- a/surfsense_desktop/.env
+++ b/surfsense_desktop/.env
@@ -7,4 +7,4 @@ HOSTED_FRONTEND_URL=https://surfsense.net
 
 # PostHog analytics (leave empty to disable)
 POSTHOG_KEY=
-POSTHOG_HOST=https://us.i.posthog.com
+POSTHOG_HOST=https://assets.surfsense.com
diff --git a/surfsense_desktop/scripts/build-electron.mjs b/surfsense_desktop/scripts/build-electron.mjs
index bfce6a9ad..90d76ef7a 100644
--- a/surfsense_desktop/scripts/build-electron.mjs
+++ b/surfsense_desktop/scripts/build-electron.mjs
@@ -115,7 +115,7 @@ async function buildElectron() {
         process.env.POSTHOG_KEY || desktopEnv.POSTHOG_KEY || ''
       ),
       'process.env.POSTHOG_HOST': JSON.stringify(
-        process.env.POSTHOG_HOST || desktopEnv.POSTHOG_HOST || 'https://us.i.posthog.com'
+        process.env.POSTHOG_HOST || desktopEnv.POSTHOG_HOST || 'https://assets.surfsense.com'
       ),
     },
   };
diff --git a/surfsense_desktop/src/modules/analytics.ts b/surfsense_desktop/src/modules/analytics.ts
index 8f64c1bd8..ee6ae8722 100644
--- a/surfsense_desktop/src/modules/analytics.ts
+++ b/surfsense_desktop/src/modules/analytics.ts
@@ -16,7 +16,7 @@ export function initAnalytics(): void {
   }
 
   client = new PostHog(key, {
-    host: process.env.POSTHOG_HOST || 'https://us.i.posthog.com',
+    host: process.env.POSTHOG_HOST || 'https://assets.surfsense.com',
     flushAt: 20,
     flushInterval: 10000,
   });

From 0be3c796354347e8a1e570233a7f560cbd22181c Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 20:22:00 +0200
Subject: [PATCH 191/202] Guard trackEvent with try-catch

---
 surfsense_desktop/src/modules/analytics.ts | 24 +++++++++++++---------
 1 file changed, 14 insertions(+), 10 deletions(-)

diff --git a/surfsense_desktop/src/modules/analytics.ts b/surfsense_desktop/src/modules/analytics.ts
index ee6ae8722..0bbcb3026 100644
--- a/surfsense_desktop/src/modules/analytics.ts
+++ b/surfsense_desktop/src/modules/analytics.ts
@@ -25,16 +25,20 @@ export function initAnalytics(): void {
 export function trackEvent(event: string, properties?: Record<string, unknown>): void {
   if (!client) return;
 
-  client.capture({
-    distinctId,
-    event,
-    properties: {
-      platform: 'desktop',
-      app_version: app.getVersion(),
-      os: process.platform,
-      ...properties,
-    },
-  });
+  try {
+    client.capture({
+      distinctId,
+      event,
+      properties: {
+        platform: 'desktop',
+        app_version: app.getVersion(),
+        os: process.platform,
+        ...properties,
+      },
+    });
+  } catch {
+    // Analytics should never break the app
+  }
 }
 
 export async function shutdownAnalytics(): Promise<void> {

From c5646eef6620ef673b8dc7bf136068112a619b03 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 20:28:07 +0200
Subject: [PATCH 192/202] Formatting

---
 .../[search_space_id]/client-layout.tsx       | 13 ++--
 .../components/DesktopContent.tsx             | 78 +++++++++++--------
 surfsense_web/app/desktop/login/page.tsx      |  4 +-
 surfsense_web/app/desktop/suggestion/page.tsx |  4 +-
 surfsense_web/components/TokenHandler.tsx     |  2 +-
 .../components/desktop/shortcut-recorder.tsx  |  4 +-
 6 files changed, 59 insertions(+), 46 deletions(-)

diff --git a/surfsense_web/app/dashboard/[search_space_id]/client-layout.tsx b/surfsense_web/app/dashboard/[search_space_id]/client-layout.tsx
index 16af9ac6b..eceb46231 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/client-layout.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/client-layout.tsx
@@ -154,11 +154,14 @@ export function DashboardClientLayout({
 
 		// Sync to Electron store if stored value is null (first navigation)
 		if (electronAPI?.setActiveSearchSpace) {
-			electronAPI.getActiveSearchSpace?.().then((stored) => {
-				if (!stored) {
-					electronAPI.setActiveSearchSpace!(activeSeacrhSpaceId);
-				}
-			}).catch(() => {});
+			electronAPI
+				.getActiveSearchSpace?.()
+				.then((stored) => {
+					if (!stored) {
+						electronAPI.setActiveSearchSpace!(activeSeacrhSpaceId);
+					}
+				})
+				.catch(() => {});
 		}
 	}, [search_space_id, setActiveSearchSpaceIdState, electronAPI]);
 
diff --git a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
index 596ed3e8b..c3f457f96 100644
--- a/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
+++ b/surfsense_web/app/dashboard/[search_space_id]/user-settings/components/DesktopContent.tsx
@@ -6,12 +6,18 @@ import { toast } from "sonner";
 import { DEFAULT_SHORTCUTS, ShortcutRecorder } from "@/components/desktop/shortcut-recorder";
 import { Card, CardContent, CardDescription, CardHeader, CardTitle } from "@/components/ui/card";
 import { Label } from "@/components/ui/label";
-import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue } from "@/components/ui/select";
+import {
+	Select,
+	SelectContent,
+	SelectItem,
+	SelectTrigger,
+	SelectValue,
+} from "@/components/ui/select";
 import { Spinner } from "@/components/ui/spinner";
 import { Switch } from "@/components/ui/switch";
+import type { SearchSpace } from "@/contracts/types/search-space.types";
 import { useElectronAPI } from "@/hooks/use-platform";
 import { searchSpacesApiService } from "@/lib/apis/search-spaces-api.service";
-import type { SearchSpace } from "@/contracts/types/search-space.types";
 
 export function DesktopContent() {
 	const api = useElectronAPI();
@@ -82,7 +88,10 @@ export function DesktopContent() {
 		await api.setAutocompleteEnabled(checked);
 	};
 
-	const updateShortcut = (key: "generalAssist" | "quickAsk" | "autocomplete", accelerator: string) => {
+	const updateShortcut = (
+		key: "generalAssist" | "quickAsk" | "autocomplete",
+		accelerator: string
+	) => {
 		setShortcuts((prev) => {
 			const updated = { ...prev, [key]: accelerator };
 			api.setShortcuts?.({ [key]: accelerator }).catch(() => {
@@ -110,7 +119,8 @@ export function DesktopContent() {
 				<CardHeader className="px-3 md:px-6 pt-3 md:pt-6 pb-2 md:pb-3">
 					<CardTitle className="text-base md:text-lg">Default Search Space</CardTitle>
 					<CardDescription className="text-xs md:text-sm">
-						Choose which search space General Assist, Quick Assist, and Extreme Assist operate against.
+						Choose which search space General Assist, Quick Assist, and Extreme Assist operate
+						against.
 					</CardDescription>
 				</CardHeader>
 				<CardContent className="px-3 md:px-6 pb-3 md:pb-6">
@@ -128,7 +138,9 @@ export function DesktopContent() {
 							</SelectContent>
 						</Select>
 					) : (
-						<p className="text-sm text-muted-foreground">No search spaces found. Create one first.</p>
+						<p className="text-sm text-muted-foreground">
+							No search spaces found. Create one first.
+						</p>
 					)}
 				</CardContent>
 			</Card>
@@ -143,34 +155,34 @@ export function DesktopContent() {
 				</CardHeader>
 				<CardContent className="px-3 md:px-6 pb-3 md:pb-6">
 					{shortcutsLoaded ? (
-					<div className="flex flex-col gap-3">
-						<ShortcutRecorder
-							value={shortcuts.generalAssist}
-							onChange={(accel) => updateShortcut("generalAssist", accel)}
-							onReset={() => resetShortcut("generalAssist")}
-							defaultValue={DEFAULT_SHORTCUTS.generalAssist}
-							label="General Assist"
-							description="Launch SurfSense instantly from any application"
-							icon={Rocket}
-						/>
-						<ShortcutRecorder
-							value={shortcuts.quickAsk}
-							onChange={(accel) => updateShortcut("quickAsk", accel)}
-							onReset={() => resetShortcut("quickAsk")}
-							defaultValue={DEFAULT_SHORTCUTS.quickAsk}
-							label="Quick Assist"
-							description="Select text anywhere, then ask AI to explain, rewrite, or act on it"
-							icon={Zap}
-						/>
-						<ShortcutRecorder
-							value={shortcuts.autocomplete}
-							onChange={(accel) => updateShortcut("autocomplete", accel)}
-							onReset={() => resetShortcut("autocomplete")}
-							defaultValue={DEFAULT_SHORTCUTS.autocomplete}
-							label="Extreme Assist"
-							description="AI drafts text using your screen context and knowledge base"
-							icon={BrainCog}
-						/>
+						<div className="flex flex-col gap-3">
+							<ShortcutRecorder
+								value={shortcuts.generalAssist}
+								onChange={(accel) => updateShortcut("generalAssist", accel)}
+								onReset={() => resetShortcut("generalAssist")}
+								defaultValue={DEFAULT_SHORTCUTS.generalAssist}
+								label="General Assist"
+								description="Launch SurfSense instantly from any application"
+								icon={Rocket}
+							/>
+							<ShortcutRecorder
+								value={shortcuts.quickAsk}
+								onChange={(accel) => updateShortcut("quickAsk", accel)}
+								onReset={() => resetShortcut("quickAsk")}
+								defaultValue={DEFAULT_SHORTCUTS.quickAsk}
+								label="Quick Assist"
+								description="Select text anywhere, then ask AI to explain, rewrite, or act on it"
+								icon={Zap}
+							/>
+							<ShortcutRecorder
+								value={shortcuts.autocomplete}
+								onChange={(accel) => updateShortcut("autocomplete", accel)}
+								onReset={() => resetShortcut("autocomplete")}
+								defaultValue={DEFAULT_SHORTCUTS.autocomplete}
+								label="Extreme Assist"
+								description="AI drafts text using your screen context and knowledge base"
+								icon={BrainCog}
+							/>
 							<p className="text-[11px] text-muted-foreground">
 								Click a shortcut and press a new key combination to change it.
 							</p>
diff --git a/surfsense_web/app/desktop/login/page.tsx b/surfsense_web/app/desktop/login/page.tsx
index 744680010..8f68d20c1 100644
--- a/surfsense_web/app/desktop/login/page.tsx
+++ b/surfsense_web/app/desktop/login/page.tsx
@@ -139,9 +139,7 @@ export default function DesktopLoginPage() {
 						height={48}
 						priority
 					/>
-					<h1 className="text-lg font-semibold tracking-tight">
-						Welcome to SurfSense Desktop
-					</h1>
+					<h1 className="text-lg font-semibold tracking-tight">Welcome to SurfSense Desktop</h1>
 					<p className="mt-1 text-sm text-muted-foreground">
 						Configure shortcuts, then sign in to get started.
 					</p>
diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index e458f6615..0815ba622 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -297,9 +297,7 @@ export default function SuggestionPage() {
 					const isExpanded = expandedOption === index;
 					const needsTruncation = option.length > TRUNCATE_LENGTH;
 					const displayText =
-						needsTruncation && !isExpanded
-							? option.slice(0, TRUNCATE_LENGTH) + "…"
-							: option;
+						needsTruncation && !isExpanded ? option.slice(0, TRUNCATE_LENGTH) + "…" : option;
 
 					return (
 						<div
diff --git a/surfsense_web/components/TokenHandler.tsx b/surfsense_web/components/TokenHandler.tsx
index cd585f0ca..e81a1bf2b 100644
--- a/surfsense_web/components/TokenHandler.tsx
+++ b/surfsense_web/components/TokenHandler.tsx
@@ -2,8 +2,8 @@
 
 import { useEffect } from "react";
 import { useGlobalLoadingEffect } from "@/hooks/use-global-loading";
-import { getAndClearRedirectPath, setBearerToken, setRefreshToken } from "@/lib/auth-utils";
 import { searchSpacesApiService } from "@/lib/apis/search-spaces-api.service";
+import { getAndClearRedirectPath, setBearerToken, setRefreshToken } from "@/lib/auth-utils";
 import { trackLoginSuccess } from "@/lib/posthog/events";
 
 interface TokenHandlerProps {
diff --git a/surfsense_web/components/desktop/shortcut-recorder.tsx b/surfsense_web/components/desktop/shortcut-recorder.tsx
index ec4e5a528..c872afaf1 100644
--- a/surfsense_web/components/desktop/shortcut-recorder.tsx
+++ b/surfsense_web/components/desktop/shortcut-recorder.tsx
@@ -150,7 +150,9 @@ export function ShortcutRecorder({
 					)}
 				>
 					{recording ? (
-						<span className="text-[11px] text-primary animate-pulse whitespace-nowrap">Press keys…</span>
+						<span className="text-[11px] text-primary animate-pulse whitespace-nowrap">
+							Press keys…
+						</span>
 					) : (
 						<Kbd keys={displayKeys} />
 					)}

From 13625acdd5ceddeb66a03d7aaeaf1cc9e1dc16b1 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 20:47:17 +0200
Subject: [PATCH 193/202] Add vision model tab to chat page model selector

---
 .../components/new-chat/chat-header.tsx       |  44 +++
 .../components/new-chat/model-selector.tsx    | 304 +++++++++++++++++-
 2 files changed, 339 insertions(+), 9 deletions(-)

diff --git a/surfsense_web/components/new-chat/chat-header.tsx b/surfsense_web/components/new-chat/chat-header.tsx
index 3263a2b07..0c5253c6c 100644
--- a/surfsense_web/components/new-chat/chat-header.tsx
+++ b/surfsense_web/components/new-chat/chat-header.tsx
@@ -3,11 +3,14 @@
 import { useCallback, useState } from "react";
 import { ImageConfigDialog } from "@/components/shared/image-config-dialog";
 import { ModelConfigDialog } from "@/components/shared/model-config-dialog";
+import { VisionConfigDialog } from "@/components/shared/vision-config-dialog";
 import type {
 	GlobalImageGenConfig,
 	GlobalNewLLMConfig,
+	GlobalVisionLLMConfig,
 	ImageGenerationConfig,
 	NewLLMConfigPublic,
+	VisionLLMConfig,
 } from "@/contracts/types/new-llm-config.types";
 import { ModelSelector } from "./model-selector";
 
@@ -33,6 +36,14 @@ export function ChatHeader({ searchSpaceId, className }: ChatHeaderProps) {
 	const [isImageGlobal, setIsImageGlobal] = useState(false);
 	const [imageDialogMode, setImageDialogMode] = useState<"create" | "edit" | "view">("view");
 
+	// Vision config dialog state
+	const [visionDialogOpen, setVisionDialogOpen] = useState(false);
+	const [selectedVisionConfig, setSelectedVisionConfig] = useState<
+		VisionLLMConfig | GlobalVisionLLMConfig | null
+	>(null);
+	const [isVisionGlobal, setIsVisionGlobal] = useState(false);
+	const [visionDialogMode, setVisionDialogMode] = useState<"create" | "edit" | "view">("view");
+
 	// LLM handlers
 	const handleEditLLMConfig = useCallback(
 		(config: NewLLMConfigPublic | GlobalNewLLMConfig, global: boolean) => {
@@ -79,6 +90,29 @@ export function ChatHeader({ searchSpaceId, className }: ChatHeaderProps) {
 		if (!open) setSelectedImageConfig(null);
 	}, []);
 
+	// Vision model handlers
+	const handleAddVisionModel = useCallback(() => {
+		setSelectedVisionConfig(null);
+		setIsVisionGlobal(false);
+		setVisionDialogMode("create");
+		setVisionDialogOpen(true);
+	}, []);
+
+	const handleEditVisionConfig = useCallback(
+		(config: VisionLLMConfig | GlobalVisionLLMConfig, global: boolean) => {
+			setSelectedVisionConfig(config);
+			setIsVisionGlobal(global);
+			setVisionDialogMode(global ? "view" : "edit");
+			setVisionDialogOpen(true);
+		},
+		[]
+	);
+
+	const handleVisionDialogClose = useCallback((open: boolean) => {
+		setVisionDialogOpen(open);
+		if (!open) setSelectedVisionConfig(null);
+	}, []);
+
 	return (
 		<div className="flex items-center gap-2">
 			<ModelSelector
@@ -86,6 +120,8 @@ export function ChatHeader({ searchSpaceId, className }: ChatHeaderProps) {
 				onAddNewLLM={handleAddNewLLM}
 				onEditImage={handleEditImageConfig}
 				onAddNewImage={handleAddImageModel}
+				onEditVision={handleEditVisionConfig}
+				onAddNewVision={handleAddVisionModel}
 				className={className}
 			/>
 			<ModelConfigDialog
@@ -104,6 +140,14 @@ export function ChatHeader({ searchSpaceId, className }: ChatHeaderProps) {
 				searchSpaceId={searchSpaceId}
 				mode={imageDialogMode}
 			/>
+			<VisionConfigDialog
+				open={visionDialogOpen}
+				onOpenChange={handleVisionDialogClose}
+				config={selectedVisionConfig}
+				isGlobal={isVisionGlobal}
+				searchSpaceId={searchSpaceId}
+				mode={visionDialogMode}
+			/>
 		</div>
 	);
 }
diff --git a/surfsense_web/components/new-chat/model-selector.tsx b/surfsense_web/components/new-chat/model-selector.tsx
index 39f88f794..46b4a2c3a 100644
--- a/surfsense_web/components/new-chat/model-selector.tsx
+++ b/surfsense_web/components/new-chat/model-selector.tsx
@@ -1,7 +1,7 @@
 "use client";
 
 import { useAtomValue } from "jotai";
-import { Bot, Check, ChevronDown, Edit3, ImageIcon, Plus, Search, Zap } from "lucide-react";
+import { Bot, Check, ChevronDown, Edit3, Eye, ImageIcon, Plus, Search, Zap } from "lucide-react";
 import { type UIEvent, useCallback, useMemo, useState } from "react";
 import { toast } from "sonner";
 import {
@@ -15,6 +15,10 @@ import {
 	newLLMConfigsAtom,
 } from "@/atoms/new-llm-config/new-llm-config-query.atoms";
 import { activeSearchSpaceIdAtom } from "@/atoms/search-spaces/search-space-query.atoms";
+import {
+	globalVisionLLMConfigsAtom,
+	visionLLMConfigsAtom,
+} from "@/atoms/vision-llm-config/vision-llm-config-query.atoms";
 import { Badge } from "@/components/ui/badge";
 import { Button } from "@/components/ui/button";
 import {
@@ -32,8 +36,10 @@ import { Tabs, TabsContent, TabsList, TabsTrigger } from "@/components/ui/tabs";
 import type {
 	GlobalImageGenConfig,
 	GlobalNewLLMConfig,
+	GlobalVisionLLMConfig,
 	ImageGenerationConfig,
 	NewLLMConfigPublic,
+	VisionLLMConfig,
 } from "@/contracts/types/new-llm-config.types";
 import { getProviderIcon } from "@/lib/provider-icons";
 import { cn } from "@/lib/utils";
@@ -43,6 +49,8 @@ interface ModelSelectorProps {
 	onAddNewLLM: () => void;
 	onEditImage?: (config: ImageGenerationConfig | GlobalImageGenConfig, isGlobal: boolean) => void;
 	onAddNewImage?: () => void;
+	onEditVision?: (config: VisionLLMConfig | GlobalVisionLLMConfig, isGlobal: boolean) => void;
+	onAddNewVision?: () => void;
 	className?: string;
 }
 
@@ -51,14 +59,18 @@ export function ModelSelector({
 	onAddNewLLM,
 	onEditImage,
 	onAddNewImage,
+	onEditVision,
+	onAddNewVision,
 	className,
 }: ModelSelectorProps) {
 	const [open, setOpen] = useState(false);
-	const [activeTab, setActiveTab] = useState<"llm" | "image">("llm");
+	const [activeTab, setActiveTab] = useState<"llm" | "image" | "vision">("llm");
 	const [llmSearchQuery, setLlmSearchQuery] = useState("");
 	const [imageSearchQuery, setImageSearchQuery] = useState("");
+	const [visionSearchQuery, setVisionSearchQuery] = useState("");
 	const [llmScrollPos, setLlmScrollPos] = useState<"top" | "middle" | "bottom">("top");
 	const [imageScrollPos, setImageScrollPos] = useState<"top" | "middle" | "bottom">("top");
+	const [visionScrollPos, setVisionScrollPos] = useState<"top" | "middle" | "bottom">("top");
 	const handleListScroll = useCallback(
 		(setter: typeof setLlmScrollPos) => (e: UIEvent<HTMLDivElement>) => {
 			const el = e.currentTarget;
@@ -82,8 +94,21 @@ export function ModelSelector({
 		useAtomValue(globalImageGenConfigsAtom);
 	const { data: imageUserConfigs, isLoading: imageUserLoading } = useAtomValue(imageGenConfigsAtom);
 
+	// Vision data
+	const { data: visionGlobalConfigs, isLoading: visionGlobalLoading } = useAtomValue(
+		globalVisionLLMConfigsAtom
+	);
+	const { data: visionUserConfigs, isLoading: visionUserLoading } =
+		useAtomValue(visionLLMConfigsAtom);
+
 	const isLoading =
-		llmUserLoading || llmGlobalLoading || prefsLoading || imageGlobalLoading || imageUserLoading;
+		llmUserLoading ||
+		llmGlobalLoading ||
+		prefsLoading ||
+		imageGlobalLoading ||
+		imageUserLoading ||
+		visionGlobalLoading ||
+		visionUserLoading;
 
 	// ─── LLM current config ───
 	const currentLLMConfig = useMemo(() => {
@@ -116,6 +141,24 @@ export function ModelSelector({
 		);
 	}, [currentImageConfig]);
 
+	// ─── Vision current config ───
+	const currentVisionConfig = useMemo(() => {
+		if (!preferences) return null;
+		const id = preferences.vision_llm_config_id;
+		if (id === null || id === undefined) return null;
+		const globalMatch = visionGlobalConfigs?.find((c) => c.id === id);
+		if (globalMatch) return globalMatch;
+		return visionUserConfigs?.find((c) => c.id === id) ?? null;
+	}, [preferences, visionGlobalConfigs, visionUserConfigs]);
+
+	const isVisionAutoMode = useMemo(() => {
+		return (
+			currentVisionConfig &&
+			"is_auto_mode" in currentVisionConfig &&
+			currentVisionConfig.is_auto_mode
+		);
+	}, [currentVisionConfig]);
+
 	// ─── LLM filtering ───
 	const filteredLLMGlobal = useMemo(() => {
 		if (!llmGlobalConfigs) return [];
@@ -170,6 +213,33 @@ export function ModelSelector({
 
 	const totalImageModels = (imageGlobalConfigs?.length ?? 0) + (imageUserConfigs?.length ?? 0);
 
+	// ─── Vision filtering ───
+	const filteredVisionGlobal = useMemo(() => {
+		if (!visionGlobalConfigs) return [];
+		if (!visionSearchQuery) return visionGlobalConfigs;
+		const q = visionSearchQuery.toLowerCase();
+		return visionGlobalConfigs.filter(
+			(c) =>
+				c.name.toLowerCase().includes(q) ||
+				c.model_name.toLowerCase().includes(q) ||
+				c.provider.toLowerCase().includes(q)
+		);
+	}, [visionGlobalConfigs, visionSearchQuery]);
+
+	const filteredVisionUser = useMemo(() => {
+		if (!visionUserConfigs) return [];
+		if (!visionSearchQuery) return visionUserConfigs;
+		const q = visionSearchQuery.toLowerCase();
+		return visionUserConfigs.filter(
+			(c) =>
+				c.name.toLowerCase().includes(q) ||
+				c.model_name.toLowerCase().includes(q) ||
+				c.provider.toLowerCase().includes(q)
+		);
+	}, [visionUserConfigs, visionSearchQuery]);
+
+	const totalVisionModels = (visionGlobalConfigs?.length ?? 0) + (visionUserConfigs?.length ?? 0);
+
 	// ─── Handlers ───
 	const handleSelectLLM = useCallback(
 		async (config: NewLLMConfigPublic | GlobalNewLLMConfig) => {
@@ -229,6 +299,30 @@ export function ModelSelector({
 		[currentImageConfig, searchSpaceId, updatePreferences]
 	);
 
+	const handleSelectVision = useCallback(
+		async (configId: number) => {
+			if (currentVisionConfig?.id === configId) {
+				setOpen(false);
+				return;
+			}
+			if (!searchSpaceId) {
+				toast.error("No search space selected");
+				return;
+			}
+			try {
+				await updatePreferences({
+					search_space_id: Number(searchSpaceId),
+					data: { vision_llm_config_id: configId },
+				});
+				toast.success("Vision model updated");
+				setOpen(false);
+			} catch {
+				toast.error("Failed to switch vision model");
+			}
+		},
+		[currentVisionConfig, searchSpaceId, updatePreferences]
+	);
+
 	return (
 		<Popover open={open} onOpenChange={setOpen}>
 			<PopoverTrigger asChild>
@@ -282,6 +376,23 @@ export function ModelSelector({
 							) : (
 								<ImageIcon className="size-4 text-muted-foreground" />
 							)}
+
+							{/* Divider */}
+							<div className="h-4 w-px bg-border/60 dark:bg-white/10 mx-0.5" />
+
+							{/* Vision section */}
+							{currentVisionConfig ? (
+								<>
+									{getProviderIcon(currentVisionConfig.provider, {
+										isAutoMode: isVisionAutoMode ?? false,
+									})}
+									<span className="max-w-[80px] md:max-w-[100px] truncate hidden md:inline">
+										{currentVisionConfig.name}
+									</span>
+								</>
+							) : (
+								<Eye className="size-4 text-muted-foreground" />
+							)}
 						</>
 					)}
 					<ChevronDown className="h-3.5 w-3.5 text-muted-foreground ml-1 shrink-0" />
@@ -295,25 +406,32 @@ export function ModelSelector({
 			>
 				<Tabs
 					value={activeTab}
-					onValueChange={(v) => setActiveTab(v as "llm" | "image")}
+					onValueChange={(v) => setActiveTab(v as "llm" | "image" | "vision")}
 					className="w-full"
 				>
 					<div className="border-b border-border/80 dark:border-neutral-800">
-						<TabsList className="w-full grid grid-cols-2 rounded-none rounded-t-lg bg-transparent h-11 p-0 gap-0">
+						<TabsList className="w-full grid grid-cols-3 rounded-none rounded-t-lg bg-transparent h-11 p-0 gap-0">
 							<TabsTrigger
 								value="llm"
-								className="gap-2 text-sm font-medium rounded-none text-muted-foreground transition-all duration-200 h-full bg-transparent data-[state=active]:bg-transparent shadow-none data-[state=active]:shadow-none border-b-[1.5px] border-transparent data-[state=active]:border-foreground dark:data-[state=active]:border-white data-[state=active]:text-foreground"
+								className="gap-1.5 text-sm font-medium rounded-none text-muted-foreground transition-all duration-200 h-full bg-transparent data-[state=active]:bg-transparent shadow-none data-[state=active]:shadow-none border-b-[1.5px] border-transparent data-[state=active]:border-foreground dark:data-[state=active]:border-white data-[state=active]:text-foreground"
 							>
-								<Zap className="size-4" />
+								<Zap className="size-3.5" />
 								LLM
 							</TabsTrigger>
 							<TabsTrigger
 								value="image"
-								className="gap-2 text-sm font-medium rounded-none text-muted-foreground transition-all duration-200 h-full bg-transparent data-[state=active]:bg-transparent shadow-none data-[state=active]:shadow-none border-b-[1.5px] border-transparent data-[state=active]:border-foreground dark:data-[state=active]:border-white data-[state=active]:text-foreground"
+								className="gap-1.5 text-sm font-medium rounded-none text-muted-foreground transition-all duration-200 h-full bg-transparent data-[state=active]:bg-transparent shadow-none data-[state=active]:shadow-none border-b-[1.5px] border-transparent data-[state=active]:border-foreground dark:data-[state=active]:border-white data-[state=active]:text-foreground"
 							>
-								<ImageIcon className="size-4" />
+								<ImageIcon className="size-3.5" />
 								Image
 							</TabsTrigger>
+							<TabsTrigger
+								value="vision"
+								className="gap-1.5 text-sm font-medium rounded-none text-muted-foreground transition-all duration-200 h-full bg-transparent data-[state=active]:bg-transparent shadow-none data-[state=active]:shadow-none border-b-[1.5px] border-transparent data-[state=active]:border-foreground dark:data-[state=active]:border-white data-[state=active]:text-foreground"
+							>
+								<Eye className="size-3.5" />
+								Vision
+							</TabsTrigger>
 						</TabsList>
 					</div>
 
@@ -676,6 +794,174 @@ export function ModelSelector({
 							</CommandList>
 						</Command>
 					</TabsContent>
+
+					{/* ─── Vision Tab ─── */}
+					<TabsContent value="vision" className="mt-0">
+						<Command
+							shouldFilter={false}
+							className="rounded-none rounded-b-lg dark:bg-neutral-900 [&_[data-slot=command-input-wrapper]]:border-0 [&_[data-slot=command-input-wrapper]]:px-0 [&_[data-slot=command-input-wrapper]]:gap-2"
+						>
+							{totalVisionModels > 3 && (
+								<div className="px-2 md:px-3 py-1.5 md:py-2">
+									<CommandInput
+										placeholder="Search vision models"
+										value={visionSearchQuery}
+										onValueChange={setVisionSearchQuery}
+										className="h-7 md:h-8 w-full text-xs md:text-sm border-0 bg-transparent focus:ring-0 placeholder:text-muted-foreground/60"
+									/>
+								</div>
+							)}
+							<CommandList
+								className="max-h-[300px] md:max-h-[400px] overflow-y-auto"
+								onScroll={handleListScroll(setVisionScrollPos)}
+								style={{
+									maskImage: `linear-gradient(to bottom, ${visionScrollPos === "top" ? "black" : "transparent"}, black 16px, black calc(100% - 16px), ${visionScrollPos === "bottom" ? "black" : "transparent"})`,
+									WebkitMaskImage: `linear-gradient(to bottom, ${visionScrollPos === "top" ? "black" : "transparent"}, black 16px, black calc(100% - 16px), ${visionScrollPos === "bottom" ? "black" : "transparent"})`,
+								}}
+							>
+								<CommandEmpty className="py-8 text-center">
+									<div className="flex flex-col items-center gap-2">
+										<Search className="size-8 text-muted-foreground" />
+										<p className="text-sm text-muted-foreground">No vision models found</p>
+										<p className="text-xs text-muted-foreground/60">Try a different search term</p>
+									</div>
+								</CommandEmpty>
+
+								{filteredVisionGlobal.length > 0 && (
+									<CommandGroup>
+										<div className="flex items-center gap-2 px-3 py-2 text-xs font-semibold text-muted-foreground tracking-wider">
+											Global Vision Models
+										</div>
+										{filteredVisionGlobal.map((config) => {
+											const isSelected = currentVisionConfig?.id === config.id;
+											const isAuto = "is_auto_mode" in config && config.is_auto_mode;
+											return (
+												<CommandItem
+													key={`vis-g-${config.id}`}
+													value={`vis-g-${config.id}`}
+													onSelect={() => handleSelectVision(config.id)}
+													className={cn(
+														"mx-2 rounded-lg mb-1 cursor-pointer group transition-all hover:bg-accent/50 dark:hover:bg-white/[0.06]",
+														isSelected && "bg-accent/80 dark:bg-white/[0.06]"
+													)}
+												>
+													<div className="flex items-center gap-3 min-w-0 flex-1">
+														<div className="shrink-0">
+															{getProviderIcon(config.provider, { isAutoMode: isAuto })}
+														</div>
+														<div className="min-w-0 flex-1">
+															<div className="flex items-center gap-2">
+																<span className="font-medium truncate">{config.name}</span>
+																{isAuto && (
+																	<Badge
+																		variant="secondary"
+																		className="text-[9px] px-1 py-0 h-3.5 bg-violet-800 text-white dark:bg-violet-800 dark:text-white border-0"
+																	>
+																		Recommended
+																	</Badge>
+																)}
+																{isSelected && <Check className="size-3.5 text-primary shrink-0" />}
+															</div>
+															<span className="text-xs text-muted-foreground truncate block">
+																{isAuto ? "Auto Mode" : config.model_name}
+															</span>
+														</div>
+														{onEditVision && !isAuto && (
+															<Button
+																variant="ghost"
+																size="icon"
+																className="size-7 shrink-0 rounded-md hover:bg-muted opacity-0 group-hover:opacity-100 transition-opacity"
+																onClick={(e) => {
+																	e.stopPropagation();
+																	setOpen(false);
+																	onEditVision(config, true);
+																}}
+															>
+																<Edit3 className="size-3.5 text-muted-foreground" />
+															</Button>
+														)}
+													</div>
+												</CommandItem>
+											);
+										})}
+									</CommandGroup>
+								)}
+
+								{filteredVisionUser.length > 0 && (
+									<>
+										{filteredVisionGlobal.length > 0 && (
+											<CommandSeparator className="my-1 mx-4 bg-border/60" />
+										)}
+										<CommandGroup>
+											<div className="flex items-center gap-2 px-3 py-2 text-xs font-semibold text-muted-foreground tracking-wider">
+												Your Vision Models
+											</div>
+											{filteredVisionUser.map((config) => {
+												const isSelected = currentVisionConfig?.id === config.id;
+												return (
+													<CommandItem
+														key={`vis-u-${config.id}`}
+														value={`vis-u-${config.id}`}
+														onSelect={() => handleSelectVision(config.id)}
+														className={cn(
+															"mx-2 rounded-lg mb-1 cursor-pointer group transition-all hover:bg-accent/50 dark:hover:bg-white/[0.06]",
+															isSelected && "bg-accent/80 dark:bg-white/[0.06]"
+														)}
+													>
+														<div className="flex items-center gap-3 min-w-0 flex-1">
+															<div className="shrink-0">{getProviderIcon(config.provider)}</div>
+															<div className="min-w-0 flex-1">
+																<div className="flex items-center gap-2">
+																	<span className="font-medium truncate">{config.name}</span>
+																	{isSelected && (
+																		<Check className="size-3.5 text-primary shrink-0" />
+																	)}
+																</div>
+																<span className="text-xs text-muted-foreground truncate block">
+																	{config.model_name}
+																</span>
+															</div>
+															{onEditVision && (
+																<Button
+																	variant="ghost"
+																	size="icon"
+																	className="h-7 w-7 shrink-0 opacity-0 group-hover:opacity-100 transition-opacity"
+																	onClick={(e) => {
+																		e.stopPropagation();
+																		setOpen(false);
+																		onEditVision(config, false);
+																	}}
+																>
+																	<Edit3 className="size-3.5 text-muted-foreground" />
+																</Button>
+															)}
+														</div>
+													</CommandItem>
+												);
+											})}
+										</CommandGroup>
+									</>
+								)}
+
+								{onAddNewVision && (
+									<div className="p-2 bg-muted/20 dark:bg-neutral-900">
+										<Button
+											variant="ghost"
+											size="sm"
+											className="w-full justify-start gap-2 h-9 rounded-lg hover:bg-accent/50 dark:hover:bg-white/[0.06]"
+											onClick={() => {
+												setOpen(false);
+												onAddNewVision();
+											}}
+										>
+											<Plus className="size-4 text-primary" />
+											<span className="text-sm font-medium">Add Vision Model</span>
+										</Button>
+									</div>
+								)}
+							</CommandList>
+						</Command>
+					</TabsContent>
 				</Tabs>
 			</PopoverContent>
 		</Popover>

From 087b1498431ec60943a7d680af1f198876dc019b Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 21:06:11 +0200
Subject: [PATCH 194/202] Add setup prompt in overlay when vision model not
 configured

---
 surfsense_web/app/desktop/suggestion/page.tsx | 74 +++++++++++++++----
 .../app/desktop/suggestion/suggestion.css     | 60 +++++++++++++++
 2 files changed, 120 insertions(+), 14 deletions(-)

diff --git a/surfsense_web/app/desktop/suggestion/page.tsx b/surfsense_web/app/desktop/suggestion/page.tsx
index 0815ba622..46e388568 100644
--- a/surfsense_web/app/desktop/suggestion/page.tsx
+++ b/surfsense_web/app/desktop/suggestion/page.tsx
@@ -27,24 +27,32 @@ interface AgentStep {
 	items: string[];
 }
 
-function friendlyError(raw: string | number): string {
+type FriendlyError = { message: string; isSetup?: boolean };
+
+function friendlyError(raw: string | number): FriendlyError {
 	if (typeof raw === "number") {
-		if (raw === 401) return "Please sign in to use suggestions.";
-		if (raw === 403) return "You don\u2019t have permission for this.";
-		if (raw === 404) return "Suggestion service not found. Is the backend running?";
-		if (raw >= 500) return "Something went wrong on the server. Try again.";
-		return "Something went wrong. Try again.";
+		if (raw === 401) return { message: "Please sign in to use suggestions." };
+		if (raw === 403) return { message: "You don\u2019t have permission for this." };
+		if (raw === 404) return { message: "Suggestion service not found. Is the backend running?" };
+		if (raw >= 500) return { message: "Something went wrong on the server. Try again." };
+		return { message: "Something went wrong. Try again." };
 	}
 	const lower = raw.toLowerCase();
 	if (lower.includes("not authenticated") || lower.includes("unauthorized"))
-		return "Please sign in to use suggestions.";
+		return { message: "Please sign in to use suggestions." };
 	if (lower.includes("no vision llm configured") || lower.includes("no llm configured"))
-		return "No Vision LLM configured. Set one in search space settings.";
+		return {
+			message: "Configure a vision-capable model (e.g. GPT-4o, Gemini) to enable autocomplete.",
+			isSetup: true,
+		};
 	if (lower.includes("does not support vision"))
-		return "Selected model doesn\u2019t support vision. Set a vision-capable model in settings.";
+		return {
+			message: "The selected model doesn\u2019t support vision. Choose a vision-capable model.",
+			isSetup: true,
+		};
 	if (lower.includes("fetch") || lower.includes("network") || lower.includes("econnrefused"))
-		return "Can\u2019t reach the server. Check your connection.";
-	return "Something went wrong. Try again.";
+		return { message: "Can\u2019t reach the server. Check your connection." };
+	return { message: "Something went wrong. Try again." };
 }
 
 const AUTO_DISMISS_MS = 3000;
@@ -76,7 +84,7 @@ export default function SuggestionPage() {
 	const api = useElectronAPI();
 	const [options, setOptions] = useState<string[]>([]);
 	const [isLoading, setIsLoading] = useState(true);
-	const [error, setError] = useState<string | null>(null);
+	const [error, setError] = useState<FriendlyError | null>(null);
 	const [steps, setSteps] = useState<AgentStep[]>([]);
 	const [expandedOption, setExpandedOption] = useState<number | null>(null);
 	const abortRef = useRef<AbortController | null>(null);
@@ -90,7 +98,7 @@ export default function SuggestionPage() {
 	}, [api]);
 
 	useEffect(() => {
-		if (!error) return;
+		if (!error || error.isSetup) return;
 		const timer = setTimeout(() => {
 			api?.dismissSuggestion?.();
 		}, AUTO_DISMISS_MS);
@@ -233,9 +241,47 @@ export default function SuggestionPage() {
 	}
 
 	if (error) {
+		if (error.isSetup) {
+			return (
+				<div className="suggestion-tooltip suggestion-setup">
+					<div className="setup-icon">
+						<svg viewBox="0 0 24 24" fill="none" width="28" height="28" aria-hidden="true">
+							<path
+								d="M1 12C1 12 5 4 12 4C19 4 23 12 23 12C23 12 19 20 12 20C5 20 1 12 1 12Z"
+								stroke="#a78bfa"
+								strokeWidth="1.5"
+								strokeLinecap="round"
+								strokeLinejoin="round"
+							/>
+							<circle
+								cx="12"
+								cy="12"
+								r="3"
+								stroke="#a78bfa"
+								strokeWidth="1.5"
+								strokeLinecap="round"
+								strokeLinejoin="round"
+							/>
+						</svg>
+					</div>
+					<div className="setup-content">
+						<span className="setup-title">Vision Model Required</span>
+						<span className="setup-message">{error.message}</span>
+						<span className="setup-hint">Settings → Vision Models</span>
+					</div>
+					<button
+						type="button"
+						className="setup-dismiss"
+						onClick={() => api?.dismissSuggestion?.()}
+					>
+						✕
+					</button>
+				</div>
+			);
+		}
 		return (
 			<div className="suggestion-tooltip suggestion-error">
-				<span className="suggestion-error-text">{error}</span>
+				<span className="suggestion-error-text">{error.message}</span>
 			</div>
 		);
 	}
diff --git a/surfsense_web/app/desktop/suggestion/suggestion.css b/surfsense_web/app/desktop/suggestion/suggestion.css
index f5471cf37..fd5ec5d3b 100644
--- a/surfsense_web/app/desktop/suggestion/suggestion.css
+++ b/surfsense_web/app/desktop/suggestion/suggestion.css
@@ -117,6 +117,66 @@ body:has(.suggestion-body) {
 	font-size: 12px;
 }
 
+/* --- Setup prompt (vision model not configured) --- */
+
+.suggestion-setup {
+	display: flex;
+	flex-direction: row;
+	align-items: flex-start;
+	gap: 10px;
+	border-color: #3b2d6b;
+	padding: 10px 14px;
+}
+
+.setup-icon {
+	flex-shrink: 0;
+	margin-top: 1px;
+}
+
+.setup-content {
+	display: flex;
+	flex-direction: column;
+	gap: 3px;
+	min-width: 0;
+}
+
+.setup-title {
+	font-size: 13px;
+	font-weight: 600;
+	color: #c4b5fd;
+}
+
+.setup-message {
+	font-size: 11.5px;
+	color: #a1a1aa;
+	line-height: 1.4;
+}
+
+.setup-hint {
+	font-size: 10.5px;
+	color: #7c6dac;
+	margin-top: 2px;
+}
+
+.setup-dismiss {
+	flex-shrink: 0;
+	align-self: flex-start;
+	background: none;
+	border: none;
+	color: #6b6b7b;
+	font-size: 14px;
+	cursor: pointer;
+	padding: 2px 4px;
+	line-height: 1;
+	border-radius: 4px;
+	transition: color 0.15s, background 0.15s;
+}
+
+.setup-dismiss:hover {
+	color: #c4b5fd;
+	background: rgba(124, 109, 172, 0.15);
+}
+
 /* --- Agent activity indicator --- */
 
 .agent-activity {

From 36b8a84b0b6353e4bf608bd19fde2ff729faca2f Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 21:55:58 +0200
Subject: [PATCH 195/202] Add vision LLM config examples to
 global_llm_config.example.yaml

---
 .../app/config/global_llm_config.example.yaml | 82 +++++++++++++++++++
 1 file changed, 82 insertions(+)

diff --git a/surfsense_backend/app/config/global_llm_config.example.yaml b/surfsense_backend/app/config/global_llm_config.example.yaml
index 49a8d0295..e382fdc74 100644
--- a/surfsense_backend/app/config/global_llm_config.example.yaml
+++ b/surfsense_backend/app/config/global_llm_config.example.yaml
@@ -263,6 +263,82 @@ global_image_generation_configs:
   #   rpm: 30
   #   litellm_params: {}
 
+# =============================================================================
+# Vision LLM Configuration
+# =============================================================================
+# These configurations power the vision autocomplete feature (screenshot analysis).
+# Only vision-capable models should be used here (e.g. GPT-4o, Gemini Pro, Claude 3).
+# Supported providers: OpenAI, Anthropic, Google, Azure OpenAI, Vertex AI, Bedrock,
+# xAI, OpenRouter, Ollama, Groq, Together AI, Fireworks AI, DeepSeek, Mistral, Custom
+#
+# Auto mode (ID 0) uses LiteLLM Router for load balancing across all vision configs.
+
+# Router Settings for Vision LLM Auto Mode
+vision_llm_router_settings:
+  routing_strategy: "usage-based-routing"
+  num_retries: 3
+  allowed_fails: 3
+  cooldown_time: 60
+
+global_vision_llm_configs:
+  # Example: OpenAI GPT-4o (recommended for vision)
+  - id: -1
+    name: "Global GPT-4o Vision"
+    description: "OpenAI's GPT-4o with strong vision capabilities"
+    provider: "OPENAI"
+    model_name: "gpt-4o"
+    api_key: "sk-your-openai-api-key-here"
+    api_base: ""
+    rpm: 500
+    tpm: 100000
+    litellm_params:
+      temperature: 0.3
+      max_tokens: 1000
+
+  # Example: Google Gemini 2.0 Flash
+  - id: -2
+    name: "Global Gemini 2.0 Flash"
+    description: "Google's fast vision model with large context"
+    provider: "GOOGLE"
+    model_name: "gemini-2.0-flash"
+    api_key: "your-google-ai-api-key-here"
+    api_base: ""
+    rpm: 1000
+    tpm: 200000
+    litellm_params:
+      temperature: 0.3
+      max_tokens: 1000
+
+  # Example: Anthropic Claude 3.5 Sonnet
+  - id: -3
+    name: "Global Claude 3.5 Sonnet Vision"
+    description: "Anthropic's Claude 3.5 Sonnet with vision support"
+    provider: "ANTHROPIC"
+    model_name: "claude-3-5-sonnet-20241022"
+    api_key: "sk-ant-your-anthropic-api-key-here"
+    api_base: ""
+    rpm: 1000
+    tpm: 100000
+    litellm_params:
+      temperature: 0.3
+      max_tokens: 1000
+
+  # Example: Azure OpenAI GPT-4o
+  # - id: -4
+  #   name: "Global Azure GPT-4o Vision"
+  #   description: "Azure-hosted GPT-4o for vision analysis"
+  #   provider: "AZURE_OPENAI"
+  #   model_name: "azure/gpt-4o-deployment"
+  #   api_key: "your-azure-api-key-here"
+  #   api_base: "https://your-resource.openai.azure.com"
+  #   api_version: "2024-02-15-preview"
+  #   rpm: 500
+  #   tpm: 100000
+  #   litellm_params:
+  #     temperature: 0.3
+  #     max_tokens: 1000
+  #     base_model: "gpt-4o"
+
 # Notes:
 # - ID 0 is reserved for "Auto" mode - uses LiteLLM Router for load balancing
 # - Use negative IDs to distinguish global configs from user configs (NewLLMConfig in DB)
@@ -283,3 +359,9 @@ global_image_generation_configs:
 # - The router uses litellm.aimage_generation() for async image generation
 # - Only RPM (requests per minute) is relevant for image generation rate limiting.
 #   TPM (tokens per minute) does not apply since image APIs are billed/rate-limited per request, not per token.
+#
+# VISION LLM NOTES:
+# - Vision configs use the same ID scheme (negative for global, positive for user DB)
+# - Only use vision-capable models (GPT-4o, Gemini, Claude 3, etc.)
+# - Lower temperature (0.3) is recommended for accurate screenshot analysis
+# - Lower max_tokens (1000) is sufficient since autocomplete produces short suggestions

From 00ee7974f6b4624050ca0065f303d1cca2d4da57 Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 13:13:16 -0700
Subject: [PATCH 196/202] fix(desktop): pasteback issues in quick ask

- Updated the quick ask window URL to include a query parameter for quick assist mode.
- Introduced a constant to detect quick assist mode based on the URL parameter in the assistant message component.
- Simplified state management for quick assist detection, improving component performance and clarity.
---
 surfsense_desktop/src/modules/quick-ask.ts          |  3 ++-
 .../components/assistant-ui/assistant-message.tsx   | 13 ++++++-------
 2 files changed, 8 insertions(+), 8 deletions(-)

diff --git a/surfsense_desktop/src/modules/quick-ask.ts b/surfsense_desktop/src/modules/quick-ask.ts
index d5a2a9c2e..b738a864d 100644
--- a/surfsense_desktop/src/modules/quick-ask.ts
+++ b/surfsense_desktop/src/modules/quick-ask.ts
@@ -57,7 +57,7 @@ function createQuickAskWindow(x: number, y: number): BrowserWindow {
 
   const spaceId = pendingSearchSpaceId;
   const route = spaceId ? `/dashboard/${spaceId}/new-chat` : '/dashboard';
-  quickAskWindow.loadURL(`http://localhost:${getServerPort()}${route}`);
+  quickAskWindow.loadURL(`http://localhost:${getServerPort()}${route}?quickAssist=true`);
 
   quickAskWindow.once('ready-to-show', () => {
     quickAskWindow?.show();
@@ -84,6 +84,7 @@ function createQuickAskWindow(x: number, y: number): BrowserWindow {
 
 async function openQuickAsk(text: string): Promise<void> {
   pendingText = text;
+  pendingMode = 'quick-assist';
   pendingSearchSpaceId = await getActiveSearchSpaceId();
   const cursor = screen.getCursorScreenPoint();
   const pos = clampToScreen(cursor.x, cursor.y, 450, 750);
diff --git a/surfsense_web/components/assistant-ui/assistant-message.tsx b/surfsense_web/components/assistant-ui/assistant-message.tsx
index 49853b0b5..605d9d518 100644
--- a/surfsense_web/components/assistant-ui/assistant-message.tsx
+++ b/surfsense_web/components/assistant-ui/assistant-message.tsx
@@ -90,6 +90,11 @@ import { useMediaQuery } from "@/hooks/use-media-query";
 import { useElectronAPI } from "@/hooks/use-platform";
 import { cn } from "@/lib/utils";
 
+// Captured once at module load (false wherever `window` is undefined) so the flag survives client-side navigations that strip the query param.
+const IS_QUICK_ASSIST_WINDOW =
+	typeof window !== "undefined" &&
+	new URLSearchParams(window.location.search).get("quickAssist") === "true";
+
 // Dynamically import video presentation tool to avoid loading Babel and Remotion in main bundle
 const GenerateVideoPresentationToolUI = dynamic(
 	() =>
@@ -465,14 +470,8 @@ const AssistantActionBar: FC = () => {
 	const isLast = useAuiState((s) => s.message.isLast);
 	const aui = useAui();
 	const api = useElectronAPI();
-	const [isQuickAssist, setIsQuickAssist] = useState(false);
 
-	useEffect(() => {
-		if (!api?.getQuickAskMode) return;
-		api.getQuickAskMode().then((mode) => {
-			if (mode) setIsQuickAssist(true);
-		});
-	}, [api]);
+	const isQuickAssist = !!api?.replaceText && IS_QUICK_ASSIST_WINDOW;
 
 	return (
 		<ActionBarPrimitive.Root

From 4dd1b6c64f19bd840925f1d252450a944cb10d58 Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 22:15:35 +0200
Subject: [PATCH 197/202] Add posthog-node and node-machine-id dependencies for
 desktop analytics

---
 surfsense_desktop/package.json   |  4 +++-
 surfsense_desktop/pnpm-lock.yaml | 31 +++++++++++++++++++++++++++++++
 2 files changed, 34 insertions(+), 1 deletion(-)

diff --git a/surfsense_desktop/package.json b/surfsense_desktop/package.json
index 74f6274cb..7b91d70c9 100644
--- a/surfsense_desktop/package.json
+++ b/surfsense_desktop/package.json
@@ -34,6 +34,8 @@
     "electron-store": "^11.0.2",
     "electron-updater": "^6.8.3",
     "get-port-please": "^3.2.0",
-    "node-mac-permissions": "^2.5.0"
+    "node-mac-permissions": "^2.5.0",
+    "node-machine-id": "^1.1.12",
+    "posthog-node": "^5.29.0"
   }
 }
diff --git a/surfsense_desktop/pnpm-lock.yaml b/surfsense_desktop/pnpm-lock.yaml
index e1df34fb2..e7b84cc01 100644
--- a/surfsense_desktop/pnpm-lock.yaml
+++ b/surfsense_desktop/pnpm-lock.yaml
@@ -26,6 +26,12 @@ importers:
       node-mac-permissions:
         specifier: ^2.5.0
         version: 2.5.0
+      node-machine-id:
+        specifier: ^1.1.12
+        version: 1.1.12
+      posthog-node:
+        specifier: ^5.29.0
+        version: 5.29.0(rxjs@7.8.2)
     devDependencies:
       '@electron/rebuild':
         specifier: ^4.0.3
@@ -308,6 +314,9 @@ packages:
     resolution: {integrity: sha512-+1VkjdD0QBLPodGrJUeqarH8VAIvQODIbwh9XpP5Syisf7YoQgsJKPNFoqqLQlu+VQ/tVSshMR6loPMn8U+dPg==}
     engines: {node: '>=14'}
 
+  '@posthog/core@1.25.0':
+    resolution: {integrity: sha512-XKaHvRFIIN7Dw84r1eKimV1rl9DS+9XMCPPZ7P3+l8fE+rDsmumebiTFsY+q40bVXflcGW9wB+57LH0lvcGmhw==}
+
   '@sindresorhus/is@4.6.0':
     resolution: {integrity: sha512-t09vSN3MdfsyCHoFcTRCH/iUtG7OJ0CsjzB8cjAmKc/va/kIgeDI/TxsigdncE/4be734m0cvIYwNaV4i2XqAw==}
     engines: {node: '>=10'}
@@ -1194,6 +1203,9 @@ packages:
     resolution: {integrity: sha512-zR8SVCaN3WqV1xwWd04XVAdzm3UTdjbxciLrZtB0Cc7F2Kd34AJfhPD4hm1HU0YH3oGUZO4X9OBLY5ijSTHsGw==}
     os: [darwin]
 
+  node-machine-id@1.1.12:
+    resolution: {integrity: sha512-QNABxbrPa3qEIfrE6GOJ7BYIuignnJw7iQ2YPbc3Nla1HzRJjXzZOiikfF8m7eAMfichLt3M4VgLOetqgDmgGQ==}
+
   nopt@8.1.0:
     resolution: {integrity: sha512-ieGu42u/Qsa4TFktmaKEwM6MQH0pOWnaB3htzh0JRtx84+Mebc0cbZYN5bC+6WTZ4+77xrL9Pn5m7CV6VIkV7A==}
     engines: {node: ^18.17.0 || >=20.5.0}
@@ -1263,6 +1275,15 @@ packages:
     resolution: {integrity: sha512-uysumyrvkUX0rX/dEVqt8gC3sTBzd4zoWfLeS29nb53imdaXVvLINYXTI2GNqzaMuvacNx4uJQ8+b3zXR0pkgQ==}
     engines: {node: '>=10.4.0'}
 
+  posthog-node@5.29.0:
+    resolution: {integrity: sha512-po7N55haSKxV8VOulkBZJja938yILShl6+fFjoUV3iQgOBCg4Muu615/xRg8mpNiz+UASvL0EEiGvIxdhXfj6Q==}
+    engines: {node: ^20.20.0 || >=22.22.0}
+    peerDependencies:
+      rxjs: ^7.0.0
+    peerDependenciesMeta:
+      rxjs:
+        optional: true
+
   postject@1.0.0-alpha.6:
     resolution: {integrity: sha512-b9Eb8h2eVqNE8edvKdwqkrY6O7kAwmI8kcnBv1NScolYJbo59XUF0noFq+lxbC1yN20bmC0WBEbDC5H/7ASb0A==}
     engines: {node: '>=14.0.0'}
@@ -1876,6 +1897,8 @@ snapshots:
   '@pkgjs/parseargs@0.11.0':
     optional: true
 
+  '@posthog/core@1.25.0': {}
+
   '@sindresorhus/is@4.6.0': {}
 
   '@standard-schema/spec@1.1.0': {}
@@ -2940,6 +2963,8 @@ snapshots:
       bindings: 1.5.0
       node-addon-api: 7.1.1
 
+  node-machine-id@1.1.12: {}
+
   nopt@8.1.0:
     dependencies:
       abbrev: 3.0.1
@@ -3002,6 +3027,12 @@ snapshots:
       base64-js: 1.5.1
       xmlbuilder: 15.1.1
 
+  posthog-node@5.29.0(rxjs@7.8.2):
+    dependencies:
+      '@posthog/core': 1.25.0
+    optionalDependencies:
+      rxjs: 7.8.2
+
   postject@1.0.0-alpha.6:
     dependencies:
       commander: 9.5.0

From 26bffbcc47d0d19148963815c83eefb7cf6cfeae Mon Sep 17 00:00:00 2001
From: CREDO23 <thierrybakera12@gmail.com>
Date: Tue, 7 Apr 2026 23:39:52 +0200
Subject: [PATCH 198/202] Add dynamic vision model list from OpenRouter with
 combobox selector

---
 .../config/vision_model_list_fallback.json    |  23 +++
 .../app/routes/vision_llm_routes.py           |  28 ++++
 .../app/services/vision_model_list_service.py | 132 ++++++++++++++++++
 .../vision-llm-config-query.atoms.ts          |  24 ++++
 .../shared/vision-config-dialog.tsx           | 114 ++++++++++++++-
 .../contracts/enums/vision-providers.ts       |  26 ++++
 .../lib/apis/vision-llm-config-api.service.ts |   5 +
 surfsense_web/lib/query-client/cache-keys.ts  |   1 +
 8 files changed, 346 insertions(+), 7 deletions(-)
 create mode 100644 surfsense_backend/app/config/vision_model_list_fallback.json
 create mode 100644 surfsense_backend/app/services/vision_model_list_service.py

diff --git a/surfsense_backend/app/config/vision_model_list_fallback.json b/surfsense_backend/app/config/vision_model_list_fallback.json
new file mode 100644
index 000000000..830eb6517
--- /dev/null
+++ b/surfsense_backend/app/config/vision_model_list_fallback.json
@@ -0,0 +1,23 @@
+[
+  {"value": "gpt-4o", "label": "GPT-4o", "provider": "OPENAI", "context_window": "128K"},
+  {"value": "gpt-4o-mini", "label": "GPT-4o Mini", "provider": "OPENAI", "context_window": "128K"},
+  {"value": "gpt-4-turbo", "label": "GPT-4 Turbo", "provider": "OPENAI", "context_window": "128K"},
+  {"value": "claude-sonnet-4-20250514", "label": "Claude Sonnet 4", "provider": "ANTHROPIC", "context_window": "200K"},
+  {"value": "claude-3-7-sonnet-20250219", "label": "Claude 3.7 Sonnet", "provider": "ANTHROPIC", "context_window": "200K"},
+  {"value": "claude-3-5-sonnet-20241022", "label": "Claude 3.5 Sonnet", "provider": "ANTHROPIC", "context_window": "200K"},
+  {"value": "claude-3-opus-20240229", "label": "Claude 3 Opus", "provider": "ANTHROPIC", "context_window": "200K"},
+  {"value": "claude-3-haiku-20240307", "label": "Claude 3 Haiku", "provider": "ANTHROPIC", "context_window": "200K"},
+  {"value": "gemini-2.5-flash", "label": "Gemini 2.5 Flash", "provider": "GOOGLE", "context_window": "1M"},
+  {"value": "gemini-2.5-pro", "label": "Gemini 2.5 Pro", "provider": "GOOGLE", "context_window": "1M"},
+  {"value": "gemini-2.0-flash", "label": "Gemini 2.0 Flash", "provider": "GOOGLE", "context_window": "1M"},
+  {"value": "gemini-1.5-pro", "label": "Gemini 1.5 Pro", "provider": "GOOGLE", "context_window": "1M"},
+  {"value": "gemini-1.5-flash", "label": "Gemini 1.5 Flash", "provider": "GOOGLE", "context_window": "1M"},
+  {"value": "pixtral-large-latest", "label": "Pixtral Large", "provider": "MISTRAL", "context_window": "128K"},
+  {"value": "pixtral-12b-2409", "label": "Pixtral 12B", "provider": "MISTRAL", "context_window": "128K"},
+  {"value": "grok-2-vision-1212", "label": "Grok 2 Vision", "provider": "XAI", "context_window": "32K"},
+  {"value": "llava", "label": "LLaVA", "provider": "OLLAMA"},
+  {"value": "bakllava", "label": "BakLLaVA", "provider": "OLLAMA"},
+  {"value": "llava-llama3", "label": "LLaVA Llama 3", "provider": "OLLAMA"},
+  {"value": "llama-4-scout-17b-16e-instruct", "label": "Llama 4 Scout 17B", "provider": "GROQ", "context_window": "128K"},
+  {"value": "meta-llama/Llama-4-Scout-17B-16E-Instruct", "label": "Llama 4 Scout 17B", "provider": "TOGETHER_AI", "context_window": "128K"}
+]
diff --git a/surfsense_backend/app/routes/vision_llm_routes.py b/surfsense_backend/app/routes/vision_llm_routes.py
index 29d1a2757..eddd5e367 100644
--- a/surfsense_backend/app/routes/vision_llm_routes.py
+++ b/surfsense_backend/app/routes/vision_llm_routes.py
@@ -1,6 +1,7 @@
 import logging
 
 from fastapi import APIRouter, Depends, HTTPException
+from pydantic import BaseModel
 from sqlalchemy import select
 from sqlalchemy.ext.asyncio import AsyncSession
 
@@ -17,6 +18,7 @@ from app.schemas import (
     VisionLLMConfigRead,
     VisionLLMConfigUpdate,
 )
+from app.services.vision_model_list_service import get_vision_model_list
 from app.users import current_active_user
 from app.utils.rbac import check_permission
 
@@ -24,6 +26,32 @@ router = APIRouter()
 logger = logging.getLogger(__name__)
 
 
+# =============================================================================
+# Vision Model Catalogue (from OpenRouter, filtered for image-input models)
+# =============================================================================
+
+
+class VisionModelListItem(BaseModel):
+    value: str  # model id the client submits as the config's model name
+    label: str  # display name shown in the selector
+    provider: str  # "OPENROUTER" or a native provider code such as "OPENAI"
+    context_window: str | None = None  # compact size such as "128K"; None when unknown
+
+
+@router.get("/vision-models", response_model=list[VisionModelListItem])
+async def list_vision_models(
+    user: User = Depends(current_active_user),  # unused in the body; presumably enforces auth
+):
+    """Return vision-capable models sourced from OpenRouter (filtered by image input)."""
+    try:
+        return await get_vision_model_list()
+    except Exception as e:  # fetch failures fall back inside the service; this guards the rest
+        logger.exception("Failed to fetch vision model list")
+        raise HTTPException(
+            status_code=500, detail=f"Failed to fetch vision model list: {e!s}"
+        ) from e
+
+
 # =============================================================================
 # Global Vision LLM Configs (from YAML)
 # =============================================================================
diff --git a/surfsense_backend/app/services/vision_model_list_service.py b/surfsense_backend/app/services/vision_model_list_service.py
new file mode 100644
index 000000000..09893dd06
--- /dev/null
+++ b/surfsense_backend/app/services/vision_model_list_service.py
@@ -0,0 +1,132 @@
+"""
+Service for fetching and caching the vision-capable model list.
+
+Queries the same OpenRouter public API as the LLM model list service, keeping
+only models that accept image input; a bundled JSON list is the local fallback.
+"""
+
+import json
+import logging
+import time
+from pathlib import Path
+
+import httpx
+
+logger = logging.getLogger(__name__)
+
+OPENROUTER_API_URL = "https://openrouter.ai/api/v1/models"
+FALLBACK_FILE = Path(__file__).parent.parent / "config" / "vision_model_list_fallback.json"
+CACHE_TTL_SECONDS = 86400  # 24 hours
+
+_cache: list[dict] | None = None
+_cache_timestamp: float = 0
+
+OPENROUTER_SLUG_TO_VISION_PROVIDER: dict[str, str] = {
+    "openai": "OPENAI",
+    "anthropic": "ANTHROPIC",
+    "google": "GOOGLE",
+    "mistralai": "MISTRAL",
+    "x-ai": "XAI",
+}
+
+
+def _format_context_length(length: int | None) -> str | None:
+    """Render a token count compactly, e.g. 128000 -> "128K"; falsy input -> None."""
+    if not length:
+        return None
+    for threshold, suffix in ((1_000_000, "M"), (1_000, "K")):
+        if length >= threshold:
+            return f"{length / threshold:g}{suffix}"
+    return str(length)
+
+
+async def _fetch_from_openrouter() -> list[dict] | None:
+    """Fetch OpenRouter's raw model list; log a warning and return None on any failure."""
+    try:
+        async with httpx.AsyncClient(timeout=15) as http:
+            resp = await http.get(OPENROUTER_API_URL)
+            resp.raise_for_status()
+            return resp.json().get("data", [])
+    except Exception as exc:
+        logger.warning("Failed to fetch from OpenRouter API for vision models: %s", exc)
+        return None
+
+
+def _load_fallback() -> list[dict]:
+    """Read the bundled fallback JSON list; log an error and return [] if unreadable."""
+    try:
+        return json.loads(FALLBACK_FILE.read_text(encoding="utf-8"))
+    except Exception as exc:
+        logger.error("Failed to load vision model fallback list: %s", exc)
+        return []
+
+
+def _is_vision_model(model: dict) -> bool:
+    """Return True if the model accepts image input and outputs text (null-safe)."""
+    arch = model.get("architecture") or {}  # ``or`` also covers an explicit JSON null
+    input_mods = arch.get("input_modalities") or []
+    output_mods = arch.get("output_modalities") or []
+    return "image" in input_mods and "text" in output_mods
+
+
+def _process_vision_models(raw_models: list[dict]) -> list[dict]:
+    """Convert raw OpenRouter entries into selector options.
+
+    Each vision model yields an OPENROUTER option (full id) and, for mapped
+    vendors, a native-provider option (bare model name; GOOGLE: gemini-* only).
+    """
+    processed: list[dict] = []
+
+    for model in raw_models:
+        # ``or`` also covers explicit JSON nulls, which ``.get(key, default)`` lets through.
+        model_id: str = model.get("id") or ""
+        if "/" not in model_id or not _is_vision_model(model):
+            continue
+        provider_slug, model_name = model_id.split("/", 1)
+        # Fall back to the id so the label is never empty or null.
+        name: str = model.get("name") or model_id
+        context_window = _format_context_length(model.get("context_length"))
+        processed.append(
+            {
+                "value": model_id,
+                "label": name,
+                "provider": "OPENROUTER",
+                "context_window": context_window,
+            }
+        )
+
+        native_provider = OPENROUTER_SLUG_TO_VISION_PROVIDER.get(provider_slug)
+        if not native_provider:
+            continue
+        if native_provider == "GOOGLE" and not model_name.startswith("gemini-"):
+            continue
+        processed.append(
+            {
+                "value": model_name,
+                "label": name,
+                "provider": native_provider,
+                "context_window": context_window,
+            }
+        )
+
+    return processed
+
+
+async def get_vision_model_list() -> list[dict]:
+    """Return the vision model list, refreshed from OpenRouter once the cache expires."""
+    global _cache, _cache_timestamp
+    if _cache is not None and (time.time() - _cache_timestamp) < CACHE_TTL_SECONDS:
+        return _cache
+
+    raw_models = await _fetch_from_openrouter()
+    if raw_models is None:
+        if _cache is not None:
+            # Refresh failed: an expired live list still beats the static fallback.
+            logger.info("Using stale cached vision model list")
+            return _cache
+        logger.info("Using fallback vision model list")
+        return _load_fallback()
+
+    _cache = _process_vision_models(raw_models)
+    _cache_timestamp = time.time()
+    return _cache
diff --git a/surfsense_web/atoms/vision-llm-config/vision-llm-config-query.atoms.ts b/surfsense_web/atoms/vision-llm-config/vision-llm-config-query.atoms.ts
index 53264fb24..906ce638f 100644
--- a/surfsense_web/atoms/vision-llm-config/vision-llm-config-query.atoms.ts
+++ b/surfsense_web/atoms/vision-llm-config/vision-llm-config-query.atoms.ts
@@ -1,4 +1,6 @@
 import { atomWithQuery } from "jotai-tanstack-query";
+import type { LLMModel } from "@/contracts/enums/llm-models";
+import { VISION_MODELS } from "@/contracts/enums/vision-providers";
 import { visionLLMConfigApiService } from "@/lib/apis/vision-llm-config-api.service";
 import { cacheKeys } from "@/lib/query-client/cache-keys";
 import { activeSearchSpaceIdAtom } from "../search-spaces/search-space-query.atoms";
@@ -25,3 +27,25 @@ export const globalVisionLLMConfigsAtom = atomWithQuery(() => {
 		},
 	};
 });
+
+/** Vision model catalogue: live backend list first, then static entries for providers it lacks. */
+export const visionModelListAtom = atomWithQuery(() => ({
+	queryKey: cacheKeys.visionLLMConfigs.modelList(),
+	staleTime: 60 * 60 * 1000,
+	placeholderData: VISION_MODELS,
+	queryFn: async (): Promise<LLMModel[]> => {
+		const remote = await visionLLMConfigApiService.getModels();
+		const liveModels = remote.map(({ value, label, provider, context_window }) => ({
+			value,
+			label,
+			provider,
+			contextWindow: context_window ?? undefined,
+		}));
+
+		// Providers absent from the live list keep their hard-coded suggestions.
+		const liveProviders = new Set(liveModels.map(({ provider }) => provider));
+		const staticOnly = VISION_MODELS.filter(({ provider }) => !liveProviders.has(provider));
+
+		return [...liveModels, ...staticOnly];
+	},
+}));
diff --git a/surfsense_web/components/shared/vision-config-dialog.tsx b/surfsense_web/components/shared/vision-config-dialog.tsx
index d69750316..6a494e0a6 100644
--- a/surfsense_web/components/shared/vision-config-dialog.tsx
+++ b/surfsense_web/components/shared/vision-config-dialog.tsx
@@ -1,20 +1,30 @@
 "use client";
 
 import { useAtomValue } from "jotai";
-import { AlertCircle } from "lucide-react";
-import { useCallback, useEffect, useRef, useState } from "react";
+import { AlertCircle, Check, ChevronsUpDown } from "lucide-react";
+import { useCallback, useEffect, useMemo, useRef, useState } from "react";
 import { toast } from "sonner";
 import { updateLLMPreferencesMutationAtom } from "@/atoms/new-llm-config/new-llm-config-mutation.atoms";
 import {
 	createVisionLLMConfigMutationAtom,
 	updateVisionLLMConfigMutationAtom,
 } from "@/atoms/vision-llm-config/vision-llm-config-mutation.atoms";
+import { visionModelListAtom } from "@/atoms/vision-llm-config/vision-llm-config-query.atoms";
 import { Alert, AlertDescription } from "@/components/ui/alert";
 import { Badge } from "@/components/ui/badge";
 import { Button } from "@/components/ui/button";
+import {
+	Command,
+	CommandEmpty,
+	CommandGroup,
+	CommandInput,
+	CommandItem,
+	CommandList,
+} from "@/components/ui/command";
 import { Dialog, DialogContent, DialogTitle } from "@/components/ui/dialog";
 import { Input } from "@/components/ui/input";
 import { Label } from "@/components/ui/label";
+import { Popover, PopoverContent, PopoverTrigger } from "@/components/ui/popover";
 import {
 	Select,
 	SelectContent,
@@ -30,6 +40,7 @@ import type {
 	VisionLLMConfig,
 	VisionProvider,
 } from "@/contracts/types/new-llm-config.types";
+import { cn } from "@/lib/utils";
 
 interface VisionConfigDialogProps {
 	open: boolean;
@@ -177,6 +188,14 @@ export function VisionConfigDialog({
 		}
 	}, [config, isGlobal, searchSpaceId, updatePreferences, onOpenChange]);
 
+	const { data: dynamicModels } = useAtomValue(visionModelListAtom);
+	const [modelComboboxOpen, setModelComboboxOpen] = useState(false);
+
+	const availableModels = useMemo(
+		() => (dynamicModels ?? []).filter((m) => m.provider === formData.provider),
+		[dynamicModels, formData.provider]
+	);
+
 	const isFormValid = formData.name && formData.provider && formData.model_name && formData.api_key;
 	const selectedProvider = VISION_PROVIDERS.find((p) => p.value === formData.provider);
 
@@ -303,11 +322,92 @@ export function VisionConfigDialog({
 
 							<div className="space-y-2">
 								<Label className="text-sm font-medium">Model Name *</Label>
-								<Input
-									placeholder={selectedProvider?.example?.split(",")[0]?.trim() || "e.g., gpt-4o"}
-									value={formData.model_name}
-									onChange={(e) => setFormData((p) => ({ ...p, model_name: e.target.value }))}
-								/>
+								<Popover open={modelComboboxOpen} onOpenChange={setModelComboboxOpen}>
+									<PopoverTrigger asChild>
+										<Button
+											variant="outline"
+											role="combobox"
+											aria-expanded={modelComboboxOpen}
+											className={cn(
+												"w-full justify-between font-normal bg-transparent",
+												!formData.model_name && "text-muted-foreground"
+											)}
+										>
+											{formData.model_name || "Select a model"}
+											<ChevronsUpDown className="ml-2 h-4 w-4 shrink-0 opacity-50" />
+										</Button>
+									</PopoverTrigger>
+									<PopoverContent
+										className="w-full p-0 bg-muted dark:border-neutral-700"
+										align="start"
+									>
+										<Command shouldFilter={false} className="bg-transparent">
+											<CommandInput
+												placeholder={selectedProvider?.example || "Search model name"}
+												value={formData.model_name}
+												onValueChange={(val) =>
+													setFormData((p) => ({ ...p, model_name: val }))
+												}
+											/>
+											<CommandList className="max-h-[300px]">
+												<CommandEmpty>
+													<div className="py-3 text-center text-sm text-muted-foreground">
+														{formData.model_name
+															? `Using: "${formData.model_name}"`
+															: "Type your model name"}
+													</div>
+												</CommandEmpty>
+												{availableModels.length > 0 && (
+													<CommandGroup heading="Suggested Models">
+														{availableModels
+															.filter(
+																(model) =>
+																	!formData.model_name ||
+																	model.value
+																		.toLowerCase()
+																		.includes(formData.model_name.toLowerCase()) ||
+																	model.label
+																		.toLowerCase()
+																		.includes(formData.model_name.toLowerCase())
+															)
+															.slice(0, 50)
+															.map((model) => (
+																<CommandItem
+																	key={model.value}
+																	value={model.value}
+																	onSelect={() => {
+																		// Take the id from the closure rather than the callback argument:
+																		// cmdk hands back a normalized copy of `value` (trimmed, and
+																		// lowercased in releases before 1.0), which can corrupt model ids.
+																		setFormData((p) => ({ ...p, model_name: model.value }));
+																		setModelComboboxOpen(false);
+																	}}
+																	className="py-2"
+																>
+																	<Check
+																		className={cn(
+																			"mr-2 h-4 w-4",
+																			formData.model_name === model.value
+																				? "opacity-100"
+																				: "opacity-0"
+																		)}
+																	/>
+																	<div>
+																		<div className="font-medium">{model.label}</div>
+																		{model.contextWindow && (
+																			<div className="text-xs text-muted-foreground">
+																				Context: {model.contextWindow}
+																			</div>
+																		)}
+																	</div>
+																</CommandItem>
+															))}
+													</CommandGroup>
+												)}
+											</CommandList>
+										</Command>
+									</PopoverContent>
+								</Popover>
 							</div>
 
 							<div className="space-y-2">
diff --git a/surfsense_web/contracts/enums/vision-providers.ts b/surfsense_web/contracts/enums/vision-providers.ts
index 260b03585..08be93b74 100644
--- a/surfsense_web/contracts/enums/vision-providers.ts
+++ b/surfsense_web/contracts/enums/vision-providers.ts
@@ -1,3 +1,5 @@
+import type { LLMModel } from "./llm-models";
+
 export interface VisionProviderInfo {
 	value: string;
 	label: string;
@@ -100,3 +102,27 @@ export const VISION_PROVIDERS: VisionProviderInfo[] = [
 		description: "Custom OpenAI-compatible vision endpoint",
 	},
 ];
+
+export const VISION_MODELS: LLMModel[] = [
+	{ value: "gpt-4o", label: "GPT-4o", provider: "OPENAI", contextWindow: "128K" },
+	{ value: "gpt-4o-mini", label: "GPT-4o Mini", provider: "OPENAI", contextWindow: "128K" },
+	{ value: "gpt-4-turbo", label: "GPT-4 Turbo", provider: "OPENAI", contextWindow: "128K" },
+	{ value: "claude-sonnet-4-20250514", label: "Claude Sonnet 4", provider: "ANTHROPIC", contextWindow: "200K" },
+	{ value: "claude-3-7-sonnet-20250219", label: "Claude 3.7 Sonnet", provider: "ANTHROPIC", contextWindow: "200K" },
+	{ value: "claude-3-5-sonnet-20241022", label: "Claude 3.5 Sonnet", provider: "ANTHROPIC", contextWindow: "200K" },
+	{ value: "claude-3-opus-20240229", label: "Claude 3 Opus", provider: "ANTHROPIC", contextWindow: "200K" },
+	{ value: "claude-3-haiku-20240307", label: "Claude 3 Haiku", provider: "ANTHROPIC", contextWindow: "200K" },
+	{ value: "gemini-2.5-flash", label: "Gemini 2.5 Flash", provider: "GOOGLE", contextWindow: "1M" },
+	{ value: "gemini-2.5-pro", label: "Gemini 2.5 Pro", provider: "GOOGLE", contextWindow: "1M" },
+	{ value: "gemini-2.0-flash", label: "Gemini 2.0 Flash", provider: "GOOGLE", contextWindow: "1M" },
+	{ value: "gemini-1.5-pro", label: "Gemini 1.5 Pro", provider: "GOOGLE", contextWindow: "1M" },
+	{ value: "gemini-1.5-flash", label: "Gemini 1.5 Flash", provider: "GOOGLE", contextWindow: "1M" },
+	{ value: "pixtral-large-latest", label: "Pixtral Large", provider: "MISTRAL", contextWindow: "128K" },
+	{ value: "pixtral-12b-2409", label: "Pixtral 12B", provider: "MISTRAL", contextWindow: "128K" },
+	{ value: "grok-2-vision-1212", label: "Grok 2 Vision", provider: "XAI", contextWindow: "32K" },
+	{ value: "llava", label: "LLaVA", provider: "OLLAMA" },
+	{ value: "bakllava", label: "BakLLaVA", provider: "OLLAMA" },
+	{ value: "llava-llama3", label: "LLaVA Llama 3", provider: "OLLAMA" },
+	{ value: "llama-4-scout-17b-16e-instruct", label: "Llama 4 Scout 17B", provider: "GROQ", contextWindow: "128K" },
+	{ value: "meta-llama/Llama-4-Scout-17B-16E-Instruct", label: "Llama 4 Scout 17B", provider: "TOGETHER_AI", contextWindow: "128K" },
+];
diff --git a/surfsense_web/lib/apis/vision-llm-config-api.service.ts b/surfsense_web/lib/apis/vision-llm-config-api.service.ts
index 4099c6b39..537cecbd1 100644
--- a/surfsense_web/lib/apis/vision-llm-config-api.service.ts
+++ b/surfsense_web/lib/apis/vision-llm-config-api.service.ts
@@ -4,6 +4,7 @@ import {
 	createVisionLLMConfigResponse,
 	deleteVisionLLMConfigResponse,
 	getGlobalVisionLLMConfigsResponse,
+	getModelListResponse,
 	getVisionLLMConfigsResponse,
 	type UpdateVisionLLMConfigRequest,
 	updateVisionLLMConfigRequest,
@@ -13,6 +14,10 @@ import { ValidationError } from "../error";
 import { baseApiService } from "./base-api.service";
 
 class VisionLLMConfigApiService {
+	getModels = async () => {
+		return baseApiService.get(`/api/v1/vision-models`, getModelListResponse);
+	};
+
 	getGlobalConfigs = async () => {
 		return baseApiService.get(
 			`/api/v1/global-vision-llm-configs`,
diff --git a/surfsense_web/lib/query-client/cache-keys.ts b/surfsense_web/lib/query-client/cache-keys.ts
index 04f348ff8..10aba7ef4 100644
--- a/surfsense_web/lib/query-client/cache-keys.ts
+++ b/surfsense_web/lib/query-client/cache-keys.ts
@@ -43,6 +43,7 @@ export const cacheKeys = {
 		all: (searchSpaceId: number) => ["vision-llm-configs", searchSpaceId] as const,
 		byId: (configId: number) => ["vision-llm-configs", "detail", configId] as const,
 		global: () => ["vision-llm-configs", "global"] as const,
+		modelList: () => ["vision-models", "catalogue"] as const,
 	},
 	auth: {
 		user: ["auth", "user"] as const,

From a38ec3f5dc3ef20354a1acc4f4b4eb3e64c207d4 Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 14:59:40 -0700
Subject: [PATCH 199/202] fix: desktop release

TODO: Move to monorepo here
---
 package.json | 5 +++++
 1 file changed, 5 insertions(+)
 create mode 100644 package.json

diff --git a/package.json b/package.json
new file mode 100644
index 000000000..8a1a6add8
--- /dev/null
+++ b/package.json
@@ -0,0 +1,5 @@
+{
+  "name": "surfsense",
+  "private": true,
+  "packageManager": "pnpm@10.24.0"
+}

From 9ac062ad7e18c524979c33cd3b2583905d825d5d Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 15:03:33 -0700
Subject: [PATCH 200/202] ci: add workflow_dispatch to desktop release for
 manual testing

---
 .github/workflows/desktop-release.yml | 28 ++++++++++++++++++++++-----
 1 file changed, 23 insertions(+), 5 deletions(-)

diff --git a/.github/workflows/desktop-release.yml b/.github/workflows/desktop-release.yml
index 62ba5d445..1f7e06a0c 100644
--- a/.github/workflows/desktop-release.yml
+++ b/.github/workflows/desktop-release.yml
@@ -5,6 +5,20 @@ on:
     tags:
       - 'v*'
       - 'beta-v*'
+  workflow_dispatch:
+    inputs:
+      version:
+        description: 'Version number (e.g. 0.0.15) — used for dry-run testing without a tag'
+        required: true
+        default: '0.0.0-test'
+      publish:
+        description: 'Publish to GitHub Releases'
+        required: true
+        type: choice
+        options:
+          - never
+          - always
+        default: 'never'
 
 permissions:
   contents: write
@@ -27,13 +41,17 @@ jobs:
       - name: Checkout
         uses: actions/checkout@v4
 
-      - name: Extract version from tag
+      - name: Extract version
         id: version
         shell: bash
+        env:
+          # Passed through env so the raw input is never spliced into the script text.
+          INPUT_VERSION: ${{ inputs.version }}
         run: |
           TAG=${GITHUB_REF#refs/tags/}
           VERSION=${TAG#beta-}
-          VERSION=${VERSION#v}
+          # workflow_dispatch supplies the version; tag pushes derive it from the ref.
+          VERSION=${INPUT_VERSION:-${VERSION#v}}
           echo "VERSION=$VERSION" >> "$GITHUB_OUTPUT"
 
       - name: Setup pnpm
@@ -75,7 +93,7 @@ jobs:
           POSTHOG_HOST: ${{ vars.POSTHOG_HOST }}
 
       - name: Package & Publish
-        run: pnpm exec electron-builder ${{ matrix.platform }} --config electron-builder.yml --publish always -c.extraMetadata.version=${{ steps.version.outputs.VERSION }}
+        run: pnpm exec electron-builder ${{ matrix.platform }} --config electron-builder.yml --publish ${{ inputs.publish || 'always' }} -c.extraMetadata.version=${{ steps.version.outputs.VERSION }}
         working-directory: surfsense_desktop
         env:
           GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}

From b9b567fe303b933e4688306a1c2b860fc392902e Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 15:13:26 -0700
Subject: [PATCH 201/202] chore: update desktop release workflow and
 configuration

- Changed shell to bash in the desktop release workflow for consistency.
- Updated the hosted frontend URL in the .env file to point to the new domain.
- Enhanced package.json with homepage and author details for better project metadata.
---
 .github/workflows/desktop-release.yml | 1 +
 surfsense_desktop/.env                | 2 +-
 surfsense_desktop/package.json        | 6 +++++-
 3 files changed, 7 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/desktop-release.yml b/.github/workflows/desktop-release.yml
index 1f7e06a0c..f0fdee17d 100644
--- a/.github/workflows/desktop-release.yml
+++ b/.github/workflows/desktop-release.yml
@@ -93,6 +93,7 @@ jobs:
           POSTHOG_HOST: ${{ vars.POSTHOG_HOST }}
 
       - name: Package & Publish
+        shell: bash
         run: pnpm exec electron-builder ${{ matrix.platform }} --config electron-builder.yml --publish ${{ inputs.publish || 'always' }} -c.extraMetadata.version=${{ steps.version.outputs.VERSION }}
         working-directory: surfsense_desktop
         env:
diff --git a/surfsense_desktop/.env b/surfsense_desktop/.env
index e127b99e0..40e151c10 100644
--- a/surfsense_desktop/.env
+++ b/surfsense_desktop/.env
@@ -3,7 +3,7 @@
 
 # The hosted web frontend URL. Used to intercept OAuth redirects and keep them
 # inside the desktop app. Set to your production frontend domain.
-HOSTED_FRONTEND_URL=https://surfsense.net
+HOSTED_FRONTEND_URL=https://surfsense.com
 
 # PostHog analytics (leave empty to disable)
 POSTHOG_KEY=
diff --git a/surfsense_desktop/package.json b/surfsense_desktop/package.json
index 7b91d70c9..634783e47 100644
--- a/surfsense_desktop/package.json
+++ b/surfsense_desktop/package.json
@@ -14,7 +14,11 @@
     "typecheck": "tsc --noEmit",
     "postinstall": "electron-rebuild"
   },
-  "author": "MODSetter",
+  "homepage": "https://github.com/MODSetter/SurfSense",
+  "author": {
+    "name": "MODSetter",
+    "email": "rohan@surfsense.com"
+  },
   "license": "MIT",
   "packageManager": "pnpm@10.24.0",
   "devDependencies": {

From 526057022d422908b3d7d6329c95f4488046c420 Mon Sep 17 00:00:00 2001
From: "DESKTOP-RTLN3BA\\$punk" <vermarohanfinal@gmail.com>
Date: Tue, 7 Apr 2026 15:25:48 -0700
Subject: [PATCH 202/202] chore: update dependencies in desktop release
 workflow

- Upgraded actions/checkout from v4 to v5.
- Upgraded pnpm/action-setup from v4 to v5.
- Upgraded actions/setup-node from v4 to v5 and changed node version from 20 to 22.
---
 .github/workflows/desktop-release.yml | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/.github/workflows/desktop-release.yml b/.github/workflows/desktop-release.yml
index f0fdee17d..784dffb32 100644
--- a/.github/workflows/desktop-release.yml
+++ b/.github/workflows/desktop-release.yml
@@ -39,7 +39,7 @@ jobs:
 
     steps:
       - name: Checkout
-        uses: actions/checkout@v4
+        uses: actions/checkout@v5
 
       - name: Extract version
         id: version
@@ -55,12 +55,12 @@ jobs:
           echo "VERSION=$VERSION" >> "$GITHUB_OUTPUT"
 
       - name: Setup pnpm
-        uses: pnpm/action-setup@v4
+        uses: pnpm/action-setup@v5
 
       - name: Setup Node.js
-        uses: actions/setup-node@v4
+        uses: actions/setup-node@v5
         with:
-          node-version: 20
+          node-version: 22
           cache: 'pnpm'
           cache-dependency-path: |
             surfsense_web/pnpm-lock.yaml