Enhance Rowboat Copilot functionality:

- Expanded the system prompt to support a wider range of actions, including general chat and agent management.
- Implemented conversational memory, allowing the assistant to maintain context and respond in natural language.
- Updated the interpret function to accept conversation history, improving command parsing.
- Enhanced the rendering of assistant responses to include command outcomes and maintain conversational flow.
- Updated documentation to reflect new features, including conversational context and debug mode for inspecting raw commands.
This commit is contained in:
tusharmagar 2025-11-04 16:39:23 +05:30 committed by Ramnique Singh
parent 4310b1d45d
commit 0eda81b33c
4 changed files with 661 additions and 64 deletions

View file

@ -1,80 +1,149 @@
import readline from "readline";
import { z } from "zod";
import { openai } from "@ai-sdk/openai";
import { generateObject } from "ai";
import { Workflow } from "../../application/entities/workflow.js";
import { listWorkflows, getWorkflow, upsertWorkflow, deleteWorkflow } from "./workflows/service.js";
import { generateObject, streamText } from "ai";
import type { CoreMessage } from "ai";
import {
ChatCommand,
ChatCommandT,
CommandOutcome,
executeCommand,
} from "./commands.js";
const ChatCommand = z.object({
action: z.enum([
"help",
"list_workflows",
"get_workflow",
"create_workflow",
"update_workflow",
"delete_workflow",
"unknown",
]),
id: z.string().optional(),
updates: Workflow.partial().optional(),
});
type ChatCommandT = z.infer<typeof ChatCommand>;
type ConversationMessage = {
role: "user" | "assistant";
content: string;
};
const systemPrompt = `
You are a CLI assistant that converts the user's natural language into a JSON command for managing workflows.
You are a general-purpose CLI copilot that converts the user's natural language into structured commands the Rowboat assistant runtime can execute, and you can also hold a regular conversation when no command fits.
Rules:
- Only output JSON matching the provided schema. No extra commentary.
- Choose the most appropriate action from: help, list_workflows, get_workflow, create_workflow, update_workflow, delete_workflow, unknown.
- For actions that need an id (get/update/delete/create), set "id" to the workflow identifier (e.g. "example_workflow").
- For create/update, include only provided fields in "updates". If not provided, omit.
- Select the most appropriate action from: help, general_chat, list_workflows, get_workflow, describe_workflows, create_workflow, update_workflow, delete_workflow, list_agents, get_agent, create_agent, update_agent, delete_agent, list_mcp_servers, add_mcp_server, remove_mcp_server, run_workflow, unknown.
- Use describe_workflows with { scope: "all" } to show every workflow, or provide specific ids when the user names particular workflows (including pronouns like "them" or "those" referring to previously listed workflows).
- For actions that need an id (workflow/agent), set "id" to the identifier (e.g. "example_workflow").
- For create/update actions, only include provided fields in "updates".
- Workflow shape reminder: { name: string, description: string, steps: Step[] } where Step is either { type: "function", id: string } or { type: "agent", id: string }.
- Agent shape reminder: { name: string, model: string, description: string, instructions: string }.
- MCP server shape reminder: { name: string, url: string }.
- If the request is ambiguous, set action to "unknown".
- If the user is just chatting or asking for general help or explanations, use action "general_chat" with their full prompt in "query".
`;
async function interpret(input: string): Promise<ChatCommandT> {
const { object } = await generateObject({
model: openai("gpt-4.1"),
system: systemPrompt,
prompt: input,
schema: ChatCommand,
});
return object;
const responseSystemPrompt = `
You are Skipper, the Rowboat CLI copilot. You maintain an ongoing conversation, remember prior questions, run commands when requested, and give helpful free-form answers when a general reply is appropriate.
Guidelines:
- Respond in natural language with short, helpful paragraphs or bullet lists when useful.
- Summarise command results plainly (lists, confirmations, errors) and mention next steps when appropriate.
- If a command could not be inferred (action "unknown"), clarify what additional detail is needed or answer the query directly using the conversation history when possible.
- Use the conversation history to answer memory questions (for example "what was the first question I asked?").
- Avoid repeating the raw JSON command or result unless explicitly asked; focus on what the outcome means.
- Deliver everything requested in one response. Do not say you'll follow up laterinclude all available details right away.
- For general_chat actions, respond directly to the user's query with the best answer you can provide.
`;
function buildMessageHistory(history: ConversationMessage[]): CoreMessage[] {
return history.map((message) => ({
role: message.role,
content: message.content,
}));
}
async function execute(cmd: ChatCommandT): Promise<unknown> {
switch (cmd.action) {
case "help":
return {
usage: [
"Examples:",
"- list workflows",
"- show workflow example_workflow",
"- create workflow demo with one step calling function get_date",
"- update workflow demo: add agent step default_assistant",
"- delete workflow demo",
],
};
case "list_workflows":
return { items: listWorkflows() };
case "get_workflow":
if (!cmd.id) return { error: "id required" };
return getWorkflow(cmd.id) ?? null;
case "create_workflow":
if (!cmd.id) return { error: "id required" };
return upsertWorkflow(cmd.id, { ...(cmd.updates ?? {}) });
case "update_workflow":
if (!cmd.id) return { error: "id required" };
return upsertWorkflow(cmd.id, { ...(cmd.updates ?? {}) });
case "delete_workflow":
if (!cmd.id) return { error: "id required" };
return { deleted: deleteWorkflow(cmd.id) };
case "unknown":
return { error: "Could not determine intent. Try again or ask for help." };
async function interpret(input: string, history: ConversationMessage[]): Promise<ChatCommandT> {
const stopSpinner = startSpinner("Analyzing…", { persist: false });
const conversation: CoreMessage[] = [
{ role: "system", content: systemPrompt },
...buildMessageHistory(history),
{ role: "user", content: input },
];
try {
const { object } = await generateObject({
model: openai("gpt-4.1"),
messages: conversation,
schema: ChatCommand,
});
return object;
} finally {
stopSpinner();
}
}
function startSpinner(
label: string,
options: { persist?: boolean } = {}
): (finalMessage?: string) => void {
const { persist = true } = options;
const frames = ["⠋", "⠙", "⠹", "⠸", "⠼", "⠴"];
let index = 0;
const render = () => {
const frame = frames[index];
index = (index + 1) % frames.length;
process.stdout.write(`\r${frame} ${label}`);
};
render();
const timer = setInterval(render, 80);
return (finalMessage?: string) => {
clearInterval(timer);
const doneFrame = frames[(index + frames.length - 1) % frames.length];
const message = finalMessage ?? "done";
const clearWidth = doneFrame.length + label.length + (persist ? message.length + 3 : 2);
const clear = " ".repeat(clearWidth);
process.stdout.write(`\r${clear}`);
if (persist) {
process.stdout.write(`\r${doneFrame} ${label} ${message}\n`);
} else {
process.stdout.write("\r");
}
};
}
async function renderAssistantResponse(
input: string,
cmd: ChatCommandT,
outcome: CommandOutcome,
history: ConversationMessage[]
): Promise<string> {
const condensedCommand = JSON.stringify(cmd, null, 2);
const condensedResult = JSON.stringify(outcome, null, 2);
const { textStream } = await streamText({
model: openai("gpt-4.1"),
messages: [
{ role: "system", content: responseSystemPrompt },
...buildMessageHistory(history),
{
role: "user",
content: [
`Most recent request: ${input}`,
`Interpreter output:\n${condensedCommand}`,
`Command result:\n${condensedResult}`,
].join("\n\n"),
},
],
});
let final = "";
for await (const textChunk of textStream as AsyncIterable<unknown>) {
const chunk =
typeof textChunk === "string"
? textChunk
: typeof (textChunk as { value?: string }).value === "string"
? (textChunk as { value?: string }).value ?? ""
: "";
if (!chunk) continue;
process.stdout.write(chunk);
final += chunk;
}
if (!final.endsWith("\n")) {
process.stdout.write("\n");
}
return final.trim();
}
export async function startCopilot(): Promise<void> {
if (!process.env.OPENAI_API_KEY) {
console.error("OPENAI_API_KEY is not set. Please export it to use chat.");
@ -85,16 +154,38 @@ export async function startCopilot(): Promise<void> {
const rl = readline.createInterface({ input: process.stdin, output: process.stdout });
console.log("Rowboat Copilot (type 'exit' to quit)");
const debugMode = process.argv.includes("--debug") || process.env.COPILOT_DEBUG === "1";
const conversationHistory: ConversationMessage[] = [];
const ask = () => rl.question("> ", async (line) => {
if (!line || line.trim().toLowerCase() === "exit") {
rl.close();
return;
}
try {
const cmd = await interpret(line);
console.log("\n=== Parsed Command ===\n" + JSON.stringify(cmd, null, 2));
const result = await execute(cmd);
console.log("\n=== Result ===\n" + JSON.stringify(result, null, 2) + "\n");
const trimmed = line.trim();
const cmd = await interpret(trimmed, conversationHistory);
let outcome: CommandOutcome;
try {
outcome = await executeCommand(cmd);
} finally {
// no-op
}
const historyWithLatestUser: ConversationMessage[] = [
...conversationHistory,
{ role: "user", content: trimmed },
];
const assistantReply = await renderAssistantResponse(trimmed, cmd, outcome, historyWithLatestUser);
console.log("");
if (debugMode) {
console.log("=== Parsed Command ===\n" + JSON.stringify(cmd, null, 2));
console.log("\n=== Outcome ===\n" + JSON.stringify(outcome, null, 2) + "\n");
}
conversationHistory.push({ role: "user", content: trimmed });
conversationHistory.push({ role: "assistant", content: assistantReply });
} catch (err) {
console.error("Error:", (err as Error).message);
}