SurfSense/surfsense_web/components/markdown-viewer.tsx

222 lines
6.8 KiB
TypeScript
Raw Normal View History

import { createCodePlugin } from "@streamdown/code";
import { createMathPlugin } from "@streamdown/math";
import { Streamdown, type StreamdownProps } from "streamdown";
import "katex/dist/katex.min.css";
2026-04-07 05:55:39 +05:30
import Image from "next/image";
import { useMemo } from "react";
import { processChildrenWithCitations } from "@/components/citations/citation-renderer";
2026-04-30 18:42:38 -07:00
import { type CitationUrlMap, preprocessCitationMarkdown } from "@/lib/citations/citation-parser";
2026-04-07 05:55:39 +05:30
import { cn } from "@/lib/utils";
2025-04-07 23:47:06 -07:00
const code = createCodePlugin({
2026-02-13 02:43:26 +05:30
themes: ["nord", "nord"],
});
const math = createMathPlugin({
// Keep currency from being parsed as math; real math is normalized below.
2026-04-28 09:22:19 -07:00
singleDollarTextMath: false,
});
2025-04-07 23:47:06 -07:00
interface MarkdownViewerProps {
content: string;
className?: string;
maxLength?: number;
/** Render citation tokens as interactive badges. */
enableCitations?: boolean;
2025-04-07 23:47:06 -07:00
}
const EMPTY_URL_MAP: CitationUrlMap = new Map();
/** Strip a single outer markdown fence when the whole payload is fenced. */
function stripOuterMarkdownFence(content: string): string {
const trimmed = content.trim();
const match = trimmed.match(/^(`{3,})(?:markdown|md)?\s*\n([\s\S]+?)\n\1\s*$/);
return match ? match[2] : content;
}
/** Normalize common LaTeX delimiters to Streamdown's double-dollar syntax. */
function convertLatexDelimiters(content: string): string {
2026-02-14 19:09:45 +05:30
content = content.replace(/\\\[([\s\S]*?)\\\]/g, (_, inner) => `\n$$\n${inner.trim()}\n$$\n`);
content = content.replace(/\\\(([\s\S]*?)\\\)/g, (_, inner) => `$$${inner.trim()}$$`);
content = content.replace(
/\\begin\{equation\}([\s\S]*?)\\end\{equation\}/g,
2026-02-14 19:09:45 +05:30
(_, inner) => `\n$$\n${inner.trim()}\n$$\n`
);
content = content.replace(
/\\begin\{displaymath\}([\s\S]*?)\\end\{displaymath\}/g,
2026-02-14 19:09:45 +05:30
(_, inner) => `\n$$\n${inner.trim()}\n$$\n`
);
content = content.replace(
/\\begin\{math\}([\s\S]*?)\\end\{math\}/g,
2026-02-14 19:09:45 +05:30
(_, inner) => `$$${inner.trim()}$$`
);
content = content.replace(/`(\${1,2})((?:(?!\1).)+)\1`/g, "$1$2$1");
// Only convert command-style single-dollar math, leaving currency alone.
content = content.replace(
/(?<!\$)\$(?!\$)(\\[a-zA-Z][\s\S]*?)(?<!\$)\$(?!\$)/g,
2026-02-14 19:09:45 +05:30
(_, inner) => `$$${inner.trim()}$$`
);
return content;
}
export function MarkdownViewer({
content,
className,
maxLength,
enableCitations = false,
}: MarkdownViewerProps) {
const isTruncated = maxLength != null && content.length > maxLength;
const displayContent = isTruncated ? content.slice(0, maxLength) : content;
// Rewrite citation URLs before markdown autolinking can split them.
const { processedContent, urlMap } = useMemo(() => {
const stripped = stripOuterMarkdownFence(displayContent);
if (!enableCitations) {
return {
processedContent: convertLatexDelimiters(stripped),
urlMap: EMPTY_URL_MAP,
};
}
const { content: rewritten, urlMap: map } = preprocessCitationMarkdown(stripped);
return {
processedContent: convertLatexDelimiters(rewritten),
urlMap: map,
};
}, [displayContent, enableCitations]);
// Do not wrap anchors or code; citation buttons inside them would be invalid.
const wrap = (children: React.ReactNode): React.ReactNode =>
enableCitations ? processChildrenWithCitations(children, urlMap) : children;
const components: StreamdownProps["components"] = {
p: ({ children, ...props }) => (
<p className="my-2" {...props}>
{wrap(children)}
</p>
),
a: ({ children, ...props }) => (
<a
className="text-primary hover:underline"
target="_blank"
rel="noopener noreferrer"
{...props}
>
{children}
</a>
),
li: ({ children, ...props }) => <li {...props}>{wrap(children)}</li>,
ul: ({ ...props }) => <ul className="list-disc pl-5 my-2" {...props} />,
ol: ({ ...props }) => <ol className="list-decimal pl-5 my-2" {...props} />,
h1: ({ children, ...props }) => (
<h1 className="text-2xl font-bold mt-6 mb-2" {...props}>
{wrap(children)}
</h1>
),
h2: ({ children, ...props }) => (
<h2 className="text-xl font-bold mt-5 mb-2" {...props}>
{wrap(children)}
</h2>
),
h3: ({ children, ...props }) => (
<h3 className="text-lg font-bold mt-4 mb-2" {...props}>
{wrap(children)}
</h3>
),
h4: ({ children, ...props }) => (
<h4 className="text-base font-bold mt-3 mb-1" {...props}>
{wrap(children)}
</h4>
),
h5: ({ children, ...props }) => (
<h5 className="text-sm font-bold mt-3 mb-1" {...props}>
{wrap(children)}
</h5>
),
h6: ({ children, ...props }) => (
<h6 className="text-xs font-bold mt-3 mb-1" {...props}>
{wrap(children)}
</h6>
),
strong: ({ children, ...props }) => (
<strong className="font-semibold" {...props}>
{wrap(children)}
</strong>
),
em: ({ children, ...props }) => <em {...props}>{wrap(children)}</em>,
blockquote: ({ children, ...props }) => (
<blockquote className="border-l-4 border-muted pl-4 italic my-2" {...props}>
{wrap(children)}
</blockquote>
),
hr: ({ ...props }) => <hr className="my-4 border-muted" {...props} />,
img: ({ src, alt, width: _w, height: _h, ...props }) => {
if (typeof src !== "string") return null;
const width = typeof _w === "number" ? _w : Number(_w) || 800;
const height = typeof _h === "number" ? _h : Number(_h) || 600;
const shouldSkipOptimization = src.startsWith("data:");
return (
2026-04-07 05:55:39 +05:30
<Image
className="max-w-full h-auto my-4 rounded"
alt={alt || "markdown image"}
src={src}
width={width}
height={height}
2026-04-07 05:55:39 +05:30
sizes="(max-width: 768px) 100vw, (max-width: 1200px) 75vw, 60vw"
unoptimized={shouldSkipOptimization}
2026-04-07 05:55:39 +05:30
{...props}
/>
);
},
table: ({ ...props }) => (
<div className="overflow-x-auto my-4 rounded-lg border border-border w-full">
<table className="w-full divide-y divide-border" {...props} />
</div>
),
th: ({ children, ...props }) => (
2026-02-13 02:43:26 +05:30
<th
className="px-4 py-2.5 text-left text-sm font-semibold text-muted-foreground/80 bg-muted/30 border-r border-border/40 last:border-r-0"
{...props}
>
{wrap(children)}
</th>
2026-02-13 02:43:26 +05:30
),
td: ({ children, ...props }) => (
2026-02-13 02:43:26 +05:30
<td
className="px-4 py-2.5 text-sm border-t border-r border-border/40 last:border-r-0"
{...props}
>
{wrap(children)}
</td>
2026-02-13 02:43:26 +05:30
),
};
return (
<div
className={cn(
"max-w-none overflow-hidden",
"[&_[data-streamdown=code-block-header]]:!bg-transparent",
"[&_[data-streamdown=code-block]>*]:!border-none [&_[data-streamdown=code-block]>*]:![box-shadow:none]",
"[&_[data-streamdown=code-block-download-button]]:!hidden",
className
)}
>
<Streamdown
components={components}
plugins={{ code, math }}
controls={{ code: true }}
mode="static"
>
{processedContent}
</Streamdown>
{isTruncated && (
<p className="mt-4 text-sm text-muted-foreground italic">
2026-04-02 19:45:28 -07:00
Content truncated ({Math.round(content.length / 1024)}KB total). Showing first{" "}
{Math.round(maxLength / 1024)}KB.
</p>
)}
</div>
);
2025-04-07 23:47:06 -07:00
}