Enhance Rowboat Copilot functionality:

- Expanded the system prompt to support a wider range of actions, including general chat and agent management. - Implemented conversational memory, allowing the assistant to maintain context and respond in natural language. - Updated the interpret function to accept conversation history, improving command parsing. - Enhanced the rendering of assistant responses to include command outcomes and maintain conversational flow. - Updated documentation to reflect new features, including conversational context and debug mode for inspecting raw commands.
2026-04-26 00:46:23 +02:00 · 2025-11-04 16:39:23 +05:30 · 2025-11-04 16:39:23 +05:30 · 0eda81b33c
commit 0eda81b33c
parent 4310b1d45d
4 changed files with 661 additions and 64 deletions
--- a/apps/cli/src/application/assistant/chat.ts
+++ b/apps/cli/src/application/assistant/chat.ts
@ -1,80 +1,149 @@
 import readline from "readline";
-import { z } from "zod";
 import { openai } from "@ai-sdk/openai";
-import { generateObject } from "ai";
-import { Workflow } from "../../application/entities/workflow.js";
-import { listWorkflows, getWorkflow, upsertWorkflow, deleteWorkflow } from "./workflows/service.js";
+import { generateObject, streamText } from "ai";
+import type { CoreMessage } from "ai";
+import {
+  ChatCommand,
+  ChatCommandT,
+  CommandOutcome,
+  executeCommand,
+} from "./commands.js";

-const ChatCommand = z.object({
-  action: z.enum([
-    "help",
-    "list_workflows",
-    "get_workflow",
-    "create_workflow",
-    "update_workflow",
-    "delete_workflow",
-    "unknown",
-  ]),
-  id: z.string().optional(),
-  updates: Workflow.partial().optional(),
-});
-
-type ChatCommandT = z.infer<typeof ChatCommand>;
+type ConversationMessage = {
+  role: "user" | "assistant";
+  content: string;
+};

 const systemPrompt = `
-You are a CLI assistant that converts the user's natural language into a JSON command for managing workflows.
+You are a general-purpose CLI copilot that converts the user's natural language into structured commands the Rowboat assistant runtime can execute, and you can also hold a regular conversation when no command fits.

 Rules:
 - Only output JSON matching the provided schema. No extra commentary.
- Choose the most appropriate action from: help, list_workflows, get_workflow, create_workflow, update_workflow, delete_workflow, unknown.
- For actions that need an id (get/update/delete/create), set "id" to the workflow identifier (e.g. "example_workflow").
- For create/update, include only provided fields in "updates". If not provided, omit.
+- Select the most appropriate action from: help, general_chat, list_workflows, get_workflow, describe_workflows, create_workflow, update_workflow, delete_workflow, list_agents, get_agent, create_agent, update_agent, delete_agent, list_mcp_servers, add_mcp_server, remove_mcp_server, run_workflow, unknown.
+- Use describe_workflows with { scope: "all" } to show every workflow, or provide specific ids when the user names particular workflows (including pronouns like "them" or "those" referring to previously listed workflows).
+- For actions that need an id (workflow/agent), set "id" to the identifier (e.g. "example_workflow").
+- For create/update actions, only include provided fields in "updates".
 - Workflow shape reminder: { name: string, description: string, steps: Step[] } where Step is either { type: "function", id: string } or { type: "agent", id: string }.
+- Agent shape reminder: { name: string, model: string, description: string, instructions: string }.
+- MCP server shape reminder: { name: string, url: string }.
 - If the request is ambiguous, set action to "unknown".
+- If the user is just chatting or asking for general help or explanations, use action "general_chat" with their full prompt in "query".
 `;

-async function interpret(input: string): Promise<ChatCommandT> {
-  const { object } = await generateObject({
-    model: openai("gpt-4.1"),
-    system: systemPrompt,
-    prompt: input,
-    schema: ChatCommand,
-  });
-  return object;
+const responseSystemPrompt = `
+You are Skipper, the Rowboat CLI copilot. You maintain an ongoing conversation, remember prior questions, run commands when requested, and give helpful free-form answers when a general reply is appropriate.
+
+Guidelines:
+- Respond in natural language with short, helpful paragraphs or bullet lists when useful.
+- Summarise command results plainly (lists, confirmations, errors) and mention next steps when appropriate.
+- If a command could not be inferred (action "unknown"), clarify what additional detail is needed or answer the query directly using the conversation history when possible.
+- Use the conversation history to answer memory questions (for example "what was the first question I asked?").
+- Avoid repeating the raw JSON command or result unless explicitly asked; focus on what the outcome means.
+- Deliver everything requested in one response. Do not say you'll follow up later—include all available details right away.
+- For general_chat actions, respond directly to the user's query with the best answer you can provide.
+`;
+
+function buildMessageHistory(history: ConversationMessage[]): CoreMessage[] {
+  return history.map((message) => ({
+    role: message.role,
+    content: message.content,
+  }));
 }

-async function execute(cmd: ChatCommandT): Promise<unknown> {
-  switch (cmd.action) {
-    case "help":
-      return {
-        usage: [
-          "Examples:",
-          "- list workflows",
-          "- show workflow example_workflow",
-          "- create workflow demo with one step calling function get_date",
-          "- update workflow demo: add agent step default_assistant",
-          "- delete workflow demo",
-        ],
-      };
-    case "list_workflows":
-      return { items: listWorkflows() };
-    case "get_workflow":
-      if (!cmd.id) return { error: "id required" };
-      return getWorkflow(cmd.id) ?? null;
-    case "create_workflow":
-      if (!cmd.id) return { error: "id required" };
-      return upsertWorkflow(cmd.id, { ...(cmd.updates ?? {}) });
-    case "update_workflow":
-      if (!cmd.id) return { error: "id required" };
-      return upsertWorkflow(cmd.id, { ...(cmd.updates ?? {}) });
-    case "delete_workflow":
-      if (!cmd.id) return { error: "id required" };
-      return { deleted: deleteWorkflow(cmd.id) };
-    case "unknown":
-      return { error: "Could not determine intent. Try again or ask for help." };
+async function interpret(input: string, history: ConversationMessage[]): Promise<ChatCommandT> {
+  const stopSpinner = startSpinner("Analyzing…", { persist: false });
+  const conversation: CoreMessage[] = [
+    { role: "system", content: systemPrompt },
+    ...buildMessageHistory(history),
+    { role: "user", content: input },
+  ];
+
+  try {
+    const { object } = await generateObject({
+      model: openai("gpt-4.1"),
+      messages: conversation,
+      schema: ChatCommand,
+    });
+    return object;
+  } finally {
+    stopSpinner();
  }
 }

+function startSpinner(
+  label: string,
+  options: { persist?: boolean } = {}
+): (finalMessage?: string) => void {
+  const { persist = true } = options;
+  const frames = ["⠋", "⠙", "⠹", "⠸", "⠼", "⠴"];
+  let index = 0;
+  const render = () => {
+    const frame = frames[index];
+    index = (index + 1) % frames.length;
+    process.stdout.write(`\r${frame} ${label}`);
+  };
+  render();
+  const timer = setInterval(render, 80);
+  return (finalMessage?: string) => {
+    clearInterval(timer);
+    const doneFrame = frames[(index + frames.length - 1) % frames.length];
+    const message = finalMessage ?? "done";
+    const clearWidth = doneFrame.length + label.length + (persist ? message.length + 3 : 2);
+    const clear = " ".repeat(clearWidth);
+    process.stdout.write(`\r${clear}`);
+    if (persist) {
+      process.stdout.write(`\r${doneFrame} ${label} ${message}\n`);
+    } else {
+      process.stdout.write("\r");
+    }
+  };
+}
+
+async function renderAssistantResponse(
+  input: string,
+  cmd: ChatCommandT,
+  outcome: CommandOutcome,
+  history: ConversationMessage[]
+): Promise<string> {
+  const condensedCommand = JSON.stringify(cmd, null, 2);
+  const condensedResult = JSON.stringify(outcome, null, 2);
+
+  const { textStream } = await streamText({
+    model: openai("gpt-4.1"),
+    messages: [
+      { role: "system", content: responseSystemPrompt },
+      ...buildMessageHistory(history),
+      {
+        role: "user",
+        content: [
+          `Most recent request: ${input}`,
+          `Interpreter output:\n${condensedCommand}`,
+          `Command result:\n${condensedResult}`,
+        ].join("\n\n"),
+      },
+    ],
+  });
+
+  let final = "";
+  for await (const textChunk of textStream as AsyncIterable<unknown>) {
+    const chunk =
+      typeof textChunk === "string"
+        ? textChunk
+        : typeof (textChunk as { value?: string }).value === "string"
+          ? (textChunk as { value?: string }).value ?? ""
+          : "";
+    if (!chunk) continue;
+    process.stdout.write(chunk);
+    final += chunk;
+  }
+
+  if (!final.endsWith("\n")) {
+    process.stdout.write("\n");
+  }
+
+  return final.trim();
+}
+
 export async function startCopilot(): Promise<void> {
  if (!process.env.OPENAI_API_KEY) {
    console.error("OPENAI_API_KEY is not set. Please export it to use chat.");
@ -85,16 +154,38 @@ export async function startCopilot(): Promise<void> {
  const rl = readline.createInterface({ input: process.stdin, output: process.stdout });
  console.log("Rowboat Copilot (type 'exit' to quit)");

+  const debugMode = process.argv.includes("--debug") || process.env.COPILOT_DEBUG === "1";
+  const conversationHistory: ConversationMessage[] = [];
+
  const ask = () => rl.question("> ", async (line) => {
    if (!line || line.trim().toLowerCase() === "exit") {
      rl.close();
      return;
    }
    try {
-      const cmd = await interpret(line);
-      console.log("\n=== Parsed Command ===\n" + JSON.stringify(cmd, null, 2));
-      const result = await execute(cmd);
-      console.log("\n=== Result ===\n" + JSON.stringify(result, null, 2) + "\n");
+      const trimmed = line.trim();
+      const cmd = await interpret(trimmed, conversationHistory);
+      let outcome: CommandOutcome;
+      try {
+        outcome = await executeCommand(cmd);
+      } finally {
+        // no-op
+      }
+
+      const historyWithLatestUser: ConversationMessage[] = [
+        ...conversationHistory,
+        { role: "user", content: trimmed },
+      ];
+      const assistantReply = await renderAssistantResponse(trimmed, cmd, outcome, historyWithLatestUser);
+      console.log("");
+
+      if (debugMode) {
+        console.log("=== Parsed Command ===\n" + JSON.stringify(cmd, null, 2));
+        console.log("\n=== Outcome ===\n" + JSON.stringify(outcome, null, 2) + "\n");
+      }
+
+      conversationHistory.push({ role: "user", content: trimmed });
+      conversationHistory.push({ role: "assistant", content: assistantReply });
    } catch (err) {
      console.error("Error:", (err as Error).message);
    }