feat: add claude-code llm backend with runtime port (#115)

* docs: revise claude-code ingest backend spec * docs: keep claude-code spec focused on ingest * docs: expand claude-code spec to full llm parity * Refine claude-code backend spec after adversarial review iteration 1 * Refine claude-code backend spec after adversarial review iteration 2 * Refine claude-code backend spec after adversarial review iteration 3 * feat: recognize claude-code llm backend * feat: add ktx llm runtime port * feat: add claude-code llm runtime * feat: route non-agent llm calls through runtime * feat: run ingest agents through llm runtime * feat: support claude-code setup and status * test: verify claude-code backend runtime * docs: add claude-code backend v1 runtime plan * fix: close claude-code runtime isolation checks * fix: warn on claude-code prompt caching during setup * chore: verify claude-code v1 closure * docs: add claude-code backend v1 isolation closure plan * fix: update claude-code ingest setup guidance * docs: add claude-code backend v1 ingest guidance closure plan * docs: align claude-code isolation spec with sdk metadata * test: cover claude-code host discovery metadata * fix: tolerate claude-code host discovery metadata * docs: clarify claude-code host discovery metadata * docs: add claude-code auth-probe isolation fix plan * chore: prepare kaelio ktx rc1 release * chore: add semantic release workflow * fix: unblock ci checks * chore(release): 0.1.0-rc.1 * feat: add Claude Code model selection to setup * fix: keep git maintenance attached in local repos
2026-06-28 08:49:38 +02:00 · 2026-05-16 12:06:34 +02:00 · 2026-05-16 12:06:34 +02:00 · b565e44a22
commit b565e44a22
parent e6d578c03f
109 changed files with 10218 additions and 1093 deletions
--- a/packages/context/src/llm/claude-code-runtime.ts
+++ b/packages/context/src/llm/claude-code-runtime.ts
@ -0,0 +1,327 @@
+import {
+  createSdkMcpServer,
+  query as defaultQuery,
+  type Options,
+  type SDKMessage,
+  type SDKResultMessage,
+} from '@anthropic-ai/claude-agent-sdk';
+import { z } from 'zod';
+import { noopLogger, type KtxLogger } from '../core/index.js';
+import { createKtxClaudeCodeEnv } from './claude-code-env.js';
+import { resolveClaudeCodeModel } from './claude-code-models.js';
+import { createClaudeSdkTools, mcpToolIds } from './runtime-tools.js';
+import type {
+  KtxGenerateObjectInput,
+  KtxGenerateTextInput,
+  KtxLlmRuntimePort,
+  KtxRuntimeToolSet,
+  RunLoopParams,
+  RunLoopResult,
+  RunLoopStopReason,
+} from './runtime-port.js';
+
+/**
+ * Shape of the query function this module drives: it accepts the same first
+ * argument as the SDK `query` export and yields `SDKMessage` values
+ * asynchronously. Declared as its own type so a substitute can be supplied in
+ * place of the SDK implementation.
+ */
+type QueryFn = (params: Parameters<typeof defaultQuery>[0]) => AsyncIterable<SDKMessage>;
+
+/** Construction-time dependencies of `ClaudeCodeKtxLlmRuntime`. */
+export interface ClaudeCodeKtxLlmRuntimeDeps {
+  /** Directory handed to Claude Code as the query working directory (`cwd`). */
+  projectDir: string;
+  /**
+   * Model identifier per role. A role without its own entry falls back to
+   * `default`; the chosen value is passed through `resolveClaudeCodeModel`.
+   */
+  modelSlots: { default: string } & Partial<Record<string, string>>;
+  /** Replacement for the SDK `query` function; the SDK export is used when omitted. */
+  query?: QueryFn;
+  /** Environment passed to `createKtxClaudeCodeEnv` to build the query environment. */
+  env?: NodeJS.ProcessEnv;
+  /** Logger for runtime warnings; `noopLogger` is used when omitted. */
+  logger?: KtxLogger;
+}
+
+/**
+ * Tool names sent as `disallowedTools` on every query built by `baseOptions`.
+ * NOTE(review): presumably the full set of Claude Code built-in tools — confirm
+ * against the SDK version in use when upgrading.
+ */
+const BUILTIN_TOOLS = [
+  'Agent',
+  'Task',
+  'AskUserQuestion',
+  'Bash',
+  'Read',
+  'Edit',
+  'Write',
+  'Glob',
+  'Grep',
+  'WebFetch',
+  'WebSearch',
+  'TodoWrite',
+];
+
+/** Type guard that recognises the `result` message of a query stream. */
+function isResult(message: SDKMessage): message is SDKResultMessage {
+  const { type } = message;
+  return type === 'result';
+}
+
+/**
+ * Converts a non-success result message into an `Error`.
+ *
+ * @param result - Result message of a finished query.
+ * @returns `undefined` for a `success` result; otherwise an `Error` naming the
+ *   result subtype followed by the reported errors joined with `; `.
+ */
+function resultError(result: SDKResultMessage): Error | undefined {
+  if (result.subtype !== 'success') {
+    const suffix = result.errors.length === 0 ? '' : `: ${result.errors.join('; ')}`;
+    return new Error(`Claude Code query failed (${result.subtype})${suffix}`);
+  }
+  return undefined;
+}
+
+/**
+ * Maps a Claude Code result message onto a run-loop stop reason.
+ *
+ * @param result - Result message of a finished query.
+ * @returns `'budget'` when the subtype, `terminal_reason` or `stop_reason`
+ *   reports the turn limit; `'natural'` for a success whose `terminal_reason`
+ *   is absent or `'completed'`; `'error'` in every other case.
+ */
+export function mapClaudeCodeStopReason(result: SDKResultMessage): RunLoopStopReason {
+  const hitTurnLimit =
+    result.subtype === 'error_max_turns' ||
+    result.terminal_reason === 'max_turns' ||
+    result.stop_reason === 'max_turns';
+  if (hitTurnLimit) {
+    return 'budget';
+  }
+  if (result.subtype !== 'success') {
+    return 'error';
+  }
+  // A success that still carries a terminal reason other than "completed" is reported as an error.
+  const endedAbnormally = !!result.terminal_reason && result.terminal_reason !== 'completed';
+  return endedAbnormally ? 'error' : 'natural';
+}
+
+/** Renders a Zod schema as a draft-7 JSON Schema object. */
+function jsonSchema(schema: z.ZodType): Record<string, unknown> {
+  const draft7 = z.toJSONSchema(schema, { target: 'draft-7' });
+  return draft7 as Record<string, unknown>;
+}
+
+/**
+ * Picks the model configured for `role`, falling back to the `default` slot,
+ * and passes it through `resolveClaudeCodeModel`.
+ */
+function modelForRole(modelSlots: ClaudeCodeKtxLlmRuntimeDeps['modelSlots'], role: string): string {
+  const configured = modelSlots[role] ?? modelSlots.default;
+  return resolveClaudeCodeModel(configured);
+}
+
+/**
+ * Verifies that a `system`/`init` message reports exactly the expected tools
+ * and MCP servers and no plugins. Messages of any other kind are ignored.
+ *
+ * @param message - Message taken from the query stream.
+ * @param allowedToolIds - Tool ids that must be the complete reported tool set.
+ * @param expectedMcpServerNames - MCP server names that must be the complete reported server set.
+ * @throws Error listing the unexpected and missing entries; the message also
+ *   reports slash-command and skill counts and the agent names from the init message.
+ */
+function assertInitIsolation(
+  message: SDKMessage,
+  allowedToolIds: Set<string>,
+  expectedMcpServerNames: Set<string>,
+): void {
+  if (!(message.type === 'system' && message.subtype === 'init')) {
+    return;
+  }
+  const reportedTools = new Set(message.tools);
+  const unexpectedTools = message.tools.filter((id) => !allowedToolIds.has(id));
+  const missingTools = [...allowedToolIds].filter((id) => !reportedTools.has(id));
+  const reportedServers = message.mcp_servers.map(({ name }) => name);
+  const unexpectedMcpServers = reportedServers.filter((name) => !expectedMcpServerNames.has(name));
+  const missingMcpServers = [...expectedMcpServerNames].filter((name) => !reportedServers.includes(name));
+  // Every reported plugin counts as a violation.
+  const unexpectedPlugins = message.plugins.map(({ name }) => name);
+  const violations = [unexpectedTools, missingTools, unexpectedMcpServers, missingMcpServers, unexpectedPlugins];
+  if (violations.every((entries) => entries.length === 0)) {
+    return;
+  }
+  // Comma-joined list, or "(none)" when the list is absent or joins to an empty string.
+  const show = (entries: readonly unknown[] | undefined): string => entries?.join(',') || '(none)';
+  throw new Error(
+    `Claude Code runtime isolation failed: tools=${show(unexpectedTools)} missing_tools=${show(missingTools)} mcp_servers=${show(unexpectedMcpServers)} missing_mcp_servers=${show(missingMcpServers)} plugins=${show(unexpectedPlugins)} host_slash_commands=${message.slash_commands.length} host_skills=${message.skills.length} host_agents=${show(message.agents)}`,
+  );
+}
+
+/**
+ * Names of the MCP servers a query should report: `ktx` when at least one
+ * runtime tool is supplied, otherwise none.
+ */
+function expectedMcpServerNames(tools: KtxRuntimeToolSet | undefined): Set<string> {
+  const names = new Set<string>();
+  if (tools && Object.keys(tools).length > 0) {
+    names.add('ktx');
+  }
+  return names;
+}
+
+/**
+ * Builds the SDK options shared by every query in this module.
+ *
+ * Setting sources, skills, plugins and tools are all set to empty lists, the
+ * names in `BUILTIN_TOOLS` are disallowed, and only the MCP tool ids derived
+ * from `input.tools` are allowed. Sessions are not persisted.
+ *
+ * @param input - Working directory, resolved model, source environment, turn
+ *   limit and optional runtime tool set.
+ * @returns Options that include an SDK MCP server named `ktx` only when at
+ *   least one runtime tool is supplied.
+ */
+function baseOptions(input: {
+  projectDir: string;
+  model: string;
+  env: NodeJS.ProcessEnv | undefined;
+  maxTurns: number;
+  tools?: KtxRuntimeToolSet;
+}): Options {
+  const toolIds = mcpToolIds(input.tools ?? {});
+  const permitted = new Set(toolIds);
+  const queryOptions: Options = {
+    cwd: input.projectDir,
+    model: input.model,
+    maxTurns: input.maxTurns,
+    settingSources: [],
+    skills: [],
+    plugins: [],
+    tools: [],
+    allowedTools: toolIds,
+    disallowedTools: BUILTIN_TOOLS,
+    // Permission callback: allow only the tool ids computed above, deny everything else.
+    canUseTool: async (toolName, _toolInput, options) => {
+      if (permitted.has(toolName)) {
+        return { behavior: 'allow', toolUseID: options.toolUseID };
+      }
+      return {
+        behavior: 'deny',
+        message: `KTX claude-code runtime only permits current KTX MCP tools; denied ${toolName}.`,
+        toolUseID: options.toolUseID,
+      };
+    },
+    permissionMode: 'dontAsk',
+    persistSession: false,
+    env: createKtxClaudeCodeEnv(input.env),
+  };
+  // The `mcpServers` key is left off entirely when there are no runtime tools.
+  if (input.tools && Object.keys(input.tools).length > 0) {
+    queryOptions.mcpServers = {
+      ktx: createSdkMcpServer({ name: 'ktx', tools: createClaudeSdkTools(input.tools) }),
+    };
+  }
+  return queryOptions;
+}
+
+/**
+ * Runs one query to completion and returns its result message.
+ *
+ * Every streamed message goes through `assertInitIsolation`. The optional
+ * `onAssistantTurn` callback is awaited for each assistant message whose
+ * `parent_tool_use_id` is `null`. When several result messages arrive, the
+ * last one is returned.
+ *
+ * @throws Error when the stream ends without a result message, or when the
+ *   isolation check fails.
+ */
+async function collectResult(params: {
+  query: QueryFn;
+  prompt: string;
+  options: Options;
+  allowedToolIds: Set<string>;
+  expectedMcpServerNames: Set<string>;
+  onAssistantTurn?: () => Promise<void>;
+}): Promise<SDKResultMessage> {
+  const { prompt, options, allowedToolIds, expectedMcpServerNames: serverNames } = params;
+  let finalResult: SDKResultMessage | undefined;
+  for await (const message of params.query({ prompt, options })) {
+    assertInitIsolation(message, allowedToolIds, serverNames);
+    const isTopLevelAssistant = message.type === 'assistant' && message.parent_tool_use_id === null;
+    if (isTopLevelAssistant) {
+      await params.onAssistantTurn?.();
+    }
+    if (isResult(message)) {
+      finalResult = message;
+    }
+  }
+  if (finalResult) {
+    return finalResult;
+  }
+  throw new Error('Claude Code query returned no result message');
+}
+
+/**
+ * `KtxLlmRuntimePort` implementation that serves text generation, structured
+ * generation and agent loops through Claude Code queries configured by
+ * `baseOptions`.
+ */
+export class ClaudeCodeKtxLlmRuntime implements KtxLlmRuntimePort {
+  private readonly runQuery: QueryFn;
+  private readonly logger: KtxLogger;
+
+  /**
+   * Stores the dependencies, defaulting the query function to the SDK export
+   * and the logger to `noopLogger`.
+   */
+  constructor(private readonly deps: ClaudeCodeKtxLlmRuntimeDeps) {
+    this.logger = deps.logger ?? noopLogger;
+    this.runQuery = deps.query ?? defaultQuery;
+  }
+
+  /**
+   * Runs a single-turn query and returns the text of its successful result.
+   * The system text and the prompt are joined with a blank line into one
+   * prompt; empty parts are dropped.
+   *
+   * @throws Error when the query ends with a non-success result, fails the
+   *   isolation check, or yields no result message.
+   */
+  async generateText(input: KtxGenerateTextInput): Promise<string> {
+    const model = modelForRole(this.deps.modelSlots, input.role);
+    const options = baseOptions({
+      projectDir: this.deps.projectDir,
+      model,
+      env: this.deps.env,
+      maxTurns: 1,
+      tools: input.tools,
+    });
+    const prompt = [input.system, input.prompt].filter(Boolean).join('\n\n');
+    const outcome = await collectResult({
+      query: this.runQuery,
+      prompt,
+      options,
+      allowedToolIds: new Set(mcpToolIds(input.tools ?? {})),
+      expectedMcpServerNames: expectedMcpServerNames(input.tools),
+    });
+    if (outcome.subtype === 'success') {
+      return outcome.result;
+    }
+    // resultError yields an Error for every non-success result; the fallback only satisfies the type checker.
+    throw resultError(outcome) ?? new Error(`Claude Code query failed (${outcome.subtype})`);
+  }
+
+  /**
+   * Runs a single-turn query that requests JSON-schema output derived from
+   * `input.schema`, then parses the structured output with that same schema.
+   *
+   * @throws Error when the query ends with a non-success result, fails the
+   *   isolation check, or yields no result message; schema parsing may also throw.
+   */
+  async generateObject<TOutput, TSchema extends z.ZodType<TOutput>>(
+    input: KtxGenerateObjectInput<TOutput, TSchema>,
+  ): Promise<TOutput> {
+    const model = modelForRole(this.deps.modelSlots, input.role);
+    const shared = baseOptions({
+      projectDir: this.deps.projectDir,
+      model,
+      env: this.deps.env,
+      maxTurns: 1,
+      tools: input.tools,
+    });
+    const options = {
+      ...shared,
+      outputFormat: { type: 'json_schema' as const, schema: jsonSchema(input.schema as z.ZodType) },
+    };
+    const prompt = [input.system, input.prompt].filter(Boolean).join('\n\n');
+    const outcome = await collectResult({
+      query: this.runQuery,
+      prompt,
+      options,
+      allowedToolIds: new Set(mcpToolIds(input.tools ?? {})),
+      expectedMcpServerNames: expectedMcpServerNames(input.tools),
+    });
+    if (outcome.subtype === 'success') {
+      return (input.schema as z.ZodType<TOutput>).parse(outcome.structured_output);
+    }
+    // resultError yields an Error for every non-success result; the fallback only satisfies the type checker.
+    throw resultError(outcome) ?? new Error(`Claude Code query failed (${outcome.subtype})`);
+  }
+
+  /**
+   * Runs a multi-turn agent query limited to `params.stepBudget` turns.
+   *
+   * `params.onStepFinish` is invoked once per top-level assistant message with
+   * a 1-based step index; an exception from it is logged as a warning and
+   * otherwise ignored. This method does not reject: any failure is returned as
+   * `{ stopReason: 'error', error }`.
+   */
+  async runAgentLoop(params: RunLoopParams): Promise<RunLoopResult> {
+    let completedSteps = 0;
+    const reportStep = async (): Promise<void> => {
+      completedSteps += 1;
+      if (!params.onStepFinish) {
+        return;
+      }
+      try {
+        await params.onStepFinish({ stepIndex: completedSteps, stepBudget: params.stepBudget });
+      } catch (error) {
+        const reason = error instanceof Error ? error.message : String(error);
+        this.logger.warn(`[claude-code-runner] onStepFinish callback threw; ignoring: ${reason}`);
+      }
+    };
+    try {
+      const model = modelForRole(this.deps.modelSlots, params.modelRole);
+      const options = baseOptions({
+        projectDir: this.deps.projectDir,
+        model,
+        env: this.deps.env,
+        maxTurns: params.stepBudget,
+        tools: params.toolSet,
+      });
+      const outcome = await collectResult({
+        query: this.runQuery,
+        prompt: params.userPrompt,
+        options: { ...options, systemPrompt: params.systemPrompt },
+        allowedToolIds: new Set(mcpToolIds(params.toolSet)),
+        expectedMcpServerNames: expectedMcpServerNames(params.toolSet),
+        onAssistantTurn: reportStep,
+      });
+      const stopReason = mapClaudeCodeStopReason(outcome);
+      const failure = resultError(outcome);
+      // The error is attached only when the mapped stop reason is "error" and the result carries one.
+      if (stopReason === 'error' && failure) {
+        return { stopReason, error: failure };
+      }
+      return { stopReason };
+    } catch (error) {
+      return { stopReason: 'error', error: error instanceof Error ? error : new Error(String(error)) };
+    }
+  }
+}
+
+/**
+ * Checks whether Claude Code can be used by running a one-turn, tool-less
+ * query with the given model.
+ *
+ * @param input - Project directory, model name, and optional query function
+ *   and environment overrides.
+ * @returns `{ ok: true }` when the query ends in a success result. When the
+ *   model name cannot be resolved, `{ ok: false }` with the resolver's message.
+ *   For any other failure, `{ ok: false }` with authentication guidance
+ *   followed by the underlying error text.
+ */
+export async function runClaudeCodeAuthProbe(input: {
+  projectDir: string;
+  model: string;
+  query?: QueryFn;
+  env?: NodeJS.ProcessEnv;
+}): Promise<{ ok: true } | { ok: false; message: string }> {
+  const describe = (error: unknown): string => (error instanceof Error ? error.message : String(error));
+
+  let model: string;
+  try {
+    model = resolveClaudeCodeModel(input.model);
+  } catch (error) {
+    return { ok: false, message: describe(error) };
+  }
+
+  try {
+    const options = baseOptions({
+      projectDir: input.projectDir,
+      model,
+      env: input.env,
+      maxTurns: 1,
+    });
+    const outcome = await collectResult({
+      query: input.query ?? defaultQuery,
+      prompt: 'Reply with exactly: ok',
+      options,
+      allowedToolIds: new Set(),
+      expectedMcpServerNames: new Set(),
+    });
+    const failure = resultError(outcome);
+    if (failure) {
+      throw failure;
+    }
+    return { ok: true };
+  } catch (error) {
+    // Every failure in this block is reported with the authentication guidance, including isolation failures.
+    const detail = describe(error);
+    return {
+      ok: false,
+      message: `Claude Code authentication is not usable. Authenticate Claude Code locally with the Claude Code CLI, then rerun setup or the command. ${detail}`,
+    };
+  }
+}