chat: fix mixed-decision HITL crash and fold resumed assistant messages into the interrupted bubble.

This commit is contained in:
CREDO23 2026-05-09 22:54:07 +02:00
parent 2e132513be
commit 932bf22a34
6 changed files with 208 additions and 40 deletions

View file

@ -1,7 +1,7 @@
import type { ThreadMessageLike } from "@assistant-ui/react";
import type { MessageRecord } from "./thread-persistence";
/** Minimal shape used by ``filterSupersededAbortedMessages``. */
/** Minimal shape used by the interrupt/resume reconciler. */
interface AbortableMessage {
id: number;
role: string;
@ -9,14 +9,28 @@ interface AbortableMessage {
turn_id?: string | null;
}
function isAssistant(msg: AbortableMessage): boolean {
return msg.role.toLowerCase() === "assistant";
}
/** True when the row carries at least one tool-call with ``state: "aborted"``. */
function hasAbortedToolCall(msg: AbortableMessage): boolean {
if (!isAssistant(msg) || !Array.isArray(msg.content)) return false;
for (const part of msg.content) {
if (typeof part !== "object" || part === null) continue;
if ((part as { type?: string }).type !== "tool-call") continue;
if ((part as { state?: unknown }).state === "aborted") return true;
}
return false;
}
/**
* True when the row is a frozen interrupt frame: an assistant message
* whose tool-calls all carry ``state: "aborted"``. A single non-aborted
* tool-call disqualifies (defensive against future mixed states).
* True when EVERY tool-call on the row is aborted. The row is then a
* frozen interrupt frame with no salvageable activity safe to drop
* outright.
*/
function isAbortedAssistantMessage(msg: AbortableMessage): boolean {
if (msg.role.toLowerCase() !== "assistant") return false;
if (!Array.isArray(msg.content)) return false;
function isFullyAbortedAssistantMessage(msg: AbortableMessage): boolean {
if (!isAssistant(msg) || !Array.isArray(msg.content)) return false;
let hasToolCalls = false;
for (const part of msg.content) {
if (typeof part !== "object" || part === null) continue;
@ -28,42 +42,140 @@ function isAbortedAssistantMessage(msg: AbortableMessage): boolean {
}
/**
* Positional supersede check: an aborted assistant row is superseded
* iff another assistant row appears later before any user row.
*
* NOT turn-id-based: ``stream_resume_chat`` allocates a fresh
* ``turn_id`` for the resumed row, so interrupt+resume rows never
* share a turn_id. Conversational adjacency is the reliable signal
* an assistantassistant pair without a user row between them is the
* unique signature of an interrupt+resume cycle.
* Locate the resume row that supersedes ``messages[idx]``. The
* ``stream_resume_chat`` flow allocates a fresh ``turn_id`` so we
* can't pair on it; conversational adjacency (assistant assistant
* with no user row between) is the unique signature. Skips already-
* dropped indices so chained interrupt-resumes still pair cleanly.
*/
function isSupersededByLaterAssistant<T extends AbortableMessage>(
function findResumeSuccessorIdx<T extends AbortableMessage>(
messages: readonly T[],
idx: number
): boolean {
idx: number,
dropped: ReadonlySet<number>
): number | null {
for (let i = idx + 1; i < messages.length; i++) {
if (dropped.has(i)) continue;
const role = messages[i].role.toLowerCase();
if (role === "user") return false;
if (role === "assistant") return true;
if (role === "user") return null;
if (role === "assistant") return i;
}
return false;
return null;
}
/** Read ``data.steps`` from either ``data-thinking-steps`` (modern) or ``thinking-steps`` (legacy). */
function extractStepsFromPart(part: unknown): unknown[] | null {
if (typeof part !== "object" || part === null) return null;
const p = part as { type?: unknown; data?: unknown; steps?: unknown };
if (p.type === "data-thinking-steps") {
const data = p.data as { steps?: unknown } | undefined;
return Array.isArray(data?.steps) ? data.steps : [];
}
if (p.type === "thinking-steps") {
return Array.isArray(p.steps) ? (p.steps as unknown[]) : [];
}
return null;
}
/** Split a content array into (combined steps, all other parts in order). */
function partitionContent(content: unknown): { steps: unknown[]; others: unknown[] } {
if (!Array.isArray(content)) return { steps: [], others: [] };
const steps: unknown[] = [];
const others: unknown[] = [];
for (const part of content) {
const partSteps = extractStepsFromPart(part);
if (partSteps !== null) {
steps.push(...partSteps);
continue;
}
others.push(part);
}
return { steps, others };
}
/**
* Drop frozen interrupt-frame rows once they have a resumed
* continuation. Pure (returns a new array). Caller passes messages in
* chronological order.
* Fold an interrupt-frame row's content into its resume successor so
* the user sees one assistant turn instead of two stacked bubbles.
* Successor's metadata wins (id, created_at, turn_id, token_usage,
* author) that's the row the per-turn revert button keys to.
*
* Never-resumed aborts are preserved (user navigated away mid-decision)
* so the user still sees what happened.
* Order: combined ``data-thinking-steps`` (older steps then newer) at
* index 0, followed by older's other parts in order, then newer's. The
* older row's aborted ``task`` wrapper is preserved so the rejected
* attempt remains visible alongside the successful retry; both spans
* survive and ``groupItems`` renders them as sibling task branches in
* one timeline.
*/
export function filterSupersededAbortedMessages<T extends AbortableMessage>(
function mergeInterruptedIntoResume<T extends AbortableMessage>(older: T, newer: T): T {
const olderParts = partitionContent(older.content);
const newerParts = partitionContent(newer.content);
const mergedSteps = [...olderParts.steps, ...newerParts.steps];
const mergedContent: unknown[] = [];
if (mergedSteps.length > 0) {
mergedContent.push({ type: "data-thinking-steps", data: { steps: mergedSteps } });
}
mergedContent.push(...olderParts.others, ...newerParts.others);
return { ...newer, content: mergedContent };
}
/**
* Reconcile interrupt-frame and resume rows so the UI shows one
* assistant turn per user turn even when the backend persists them as
* separate ``new_chat_messages`` rows.
*
* Two cases, both keyed on conversational adjacency (assistant
* assistant with no user row between):
*
* - **Fully aborted older row** (every tool-call ``state: "aborted"``,
* no salvageable activity) drop the older row.
* - **Partially aborted older row** (mixed completed + aborted, e.g.
* inner subagent tools ran before the interrupt) fold its content
* into the successor. Successor metadata wins.
*
* Never-resumed aborts (user navigated away mid-decision) survive so
* the user still sees what happened.
*
* Pure: returns a new array with new merged objects when needed.
* Caller passes messages in chronological order.
*/
export function reconcileInterruptedAssistantMessages<T extends AbortableMessage>(
messages: readonly T[]
): T[] {
return messages.filter((msg, idx) => {
if (!isAbortedAssistantMessage(msg)) return true;
return !isSupersededByLaterAssistant(messages, idx);
});
const dropped = new Set<number>();
const mergeInto = new Map<number, number[]>();
for (let i = 0; i < messages.length; i++) {
if (dropped.has(i)) continue;
const msg = messages[i];
if (!hasAbortedToolCall(msg)) continue;
const successorIdx = findResumeSuccessorIdx(messages, i, dropped);
if (successorIdx === null) continue;
dropped.add(i);
if (!isFullyAbortedAssistantMessage(msg)) {
const list = mergeInto.get(successorIdx) ?? [];
list.push(i);
mergeInto.set(successorIdx, list);
}
}
const result: T[] = [];
for (let i = 0; i < messages.length; i++) {
if (dropped.has(i)) continue;
const olderIdxs = mergeInto.get(i);
if (olderIdxs && olderIdxs.length > 0) {
let merged = messages[i];
for (const olderIdx of olderIdxs) {
merged = mergeInterruptedIntoResume(messages[olderIdx], merged);
}
result.push(merged);
continue;
}
result.push(messages[i]);
}
return result;
}
/**